diff --git "a/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" "b/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" --- "a/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" +++ "b/wandb/run-20220228_122826-3vepvy3m/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.0199, "train/learning_rate": 7.653061224489796e-08, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7825, "_timestamp": 1646059131, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 101.0, 880.0, 34.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.887240409851074, -9.418985366821289, -2.9507312774658203, 3.517523765563965, 9.985777854919434, 16.45403289794922, 22.922286987304688, 29.390541076660156, 35.858795166015625, 42.327049255371094, 48.79530334472656, 55.26355743408203, 61.7318115234375, 68.2000732421875, 74.66831970214844, 81.13658142089844, 87.6048355102539, 94.07308959960938, 100.54134368896484, 107.00959777832031, 113.47785186767578, 119.94610595703125, 126.41436767578125, 132.8826141357422, 139.3508758544922, 145.8191375732422, 152.28738403320312, 158.75564575195312, 165.22389221191406, 171.69215393066406, 178.160400390625, 184.628662109375, 191.09690856933594, 197.56517028808594, 204.03341674804688, 210.50167846679688, 216.9699249267578, 223.4381866455078, 229.90643310546875, 236.37469482421875, 242.8429412841797, 249.3112030029297, 255.77944946289062, 262.2477111816406, 268.7159729003906, 275.1842041015625, 281.6524658203125, 288.1207275390625, 294.5889892578125, 301.0572509765625, 307.5255126953125, 313.9937438964844, 320.4620056152344, 326.9302673339844, 333.3985290527344, 339.86676025390625, 346.33502197265625, 352.80328369140625, 359.27154541015625, 365.7397766113281, 372.2080383300781, 378.6763000488281, 385.1445617675781, 391.61279296875, 398.0810546875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 11.0, 5.0, 13.0, 5.0, 16.0, 23.0, 19.0, 22.0, 31.0, 42.0, 36.0, 35.0, 42.0, 39.0, 52.0, 63.0, 66.0, 56.0, 65.0, 65.0, 46.0, 40.0, 50.0, 26.0, 31.0, 19.0, 19.0, 17.0, 7.0, 11.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.502586364746094, -29.423606872558594, -28.344627380371094, -27.265649795532227, -26.186670303344727, -25.107690811157227, -24.02871322631836, -22.94973373413086, -21.87075424194336, -20.79177474975586, -19.71279525756836, -18.633817672729492, -17.554838180541992, -16.475858688354492, -15.396880149841309, -14.317901611328125, -13.238922119140625, -12.159942626953125, -11.080964088439941, -10.001985549926758, -8.923006057739258, -7.844027042388916, -6.765048027038574, -5.686069011688232, -4.607089996337891, -3.528110980987549, -2.449131965637207, -1.3701529502868652, -0.29117393493652344, 0.7878050804138184, 1.8667840957641602, 2.945763111114502, 4.024742126464844, 5.1037211418151855, 6.182700157165527, 7.261679172515869, 8.340658187866211, 9.419637680053711, 10.498616218566895, 11.577594757080078, 12.656574249267578, 13.735553741455078, 14.814532279968262, 15.893510818481445, 16.972490310668945, 18.051469802856445, 19.130447387695312, 20.209426879882812, 21.288406372070312, 22.367385864257812, 23.446365356445312, 24.52534294128418, 25.60432243347168, 26.68330192565918, 27.762279510498047, 28.841259002685547, 29.920238494873047, 30.999217987060547, 32.07819747924805, 33.15717697143555, 34.23615264892578, 35.31513214111328, 36.39411163330078, 37.47309112548828, 38.55207061767578]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 9.0, 10.0, 6.0, 13.0, 9.0, 17.0, 21.0, 26.0, 21.0, 20.0, 26.0, 45.0, 50.0, 43.0, 57.0, 31.0, 41.0, 60.0, 58.0, 55.0, 58.0, 46.0, 44.0, 38.0, 31.0, 27.0, 20.0, 15.0, 15.0, 20.0, 16.0, 11.0, 12.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9337921142578125, -1.877349853515625, -1.8209075927734375, -1.76446533203125, -1.7080230712890625, -1.651580810546875, -1.5951385498046875, -1.5386962890625, -1.4822540283203125, -1.425811767578125, -1.3693695068359375, -1.31292724609375, -1.2564849853515625, -1.200042724609375, -1.1436004638671875, -1.087158203125, -1.0307159423828125, -0.974273681640625, -0.9178314208984375, -0.86138916015625, -0.8049468994140625, -0.748504638671875, -0.6920623779296875, -0.6356201171875, -0.5791778564453125, -0.522735595703125, -0.4662933349609375, -0.40985107421875, -0.3534088134765625, -0.296966552734375, -0.2405242919921875, -0.18408203125, -0.1276397705078125, -0.071197509765625, -0.0147552490234375, 0.04168701171875, 0.0981292724609375, 0.154571533203125, 0.2110137939453125, 0.2674560546875, 0.3238983154296875, 0.380340576171875, 0.4367828369140625, 0.49322509765625, 0.5496673583984375, 0.606109619140625, 0.6625518798828125, 0.718994140625, 0.7754364013671875, 0.831878662109375, 0.8883209228515625, 0.94476318359375, 1.0012054443359375, 1.057647705078125, 1.1140899658203125, 1.1705322265625, 1.2269744873046875, 1.283416748046875, 1.3398590087890625, 1.39630126953125, 1.4527435302734375, 1.509185791015625, 1.5656280517578125, 1.6220703125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 8.0, 8.0, 7.0, 17.0, 19.0, 31.0, 43.0, 46.0, 63.0, 102.0, 147.0, 232.0, 318.0, 463.0, 754.0, 1153.0, 2061.0, 3794.0, 8242.0, 23126.0, 90145.0, 629874.0, 2531855.0, 752435.0, 105746.0, 25547.0, 8820.0, 3836.0, 2137.0, 1182.0, 658.0, 450.0, 303.0, 210.0, 143.0, 120.0, 60.0, 32.0, 27.0, 32.0, 14.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.125, -3.98046875, -3.8359375, -3.69140625, -3.546875, -3.40234375, -3.2578125, -3.11328125, -2.96875, -2.82421875, -2.6796875, -2.53515625, -2.390625, -2.24609375, -2.1015625, -1.95703125, -1.8125, -1.66796875, -1.5234375, -1.37890625, -1.234375, -1.08984375, -0.9453125, -0.80078125, -0.65625, -0.51171875, -0.3671875, -0.22265625, -0.078125, 0.06640625, 0.2109375, 0.35546875, 0.5, 0.64453125, 0.7890625, 0.93359375, 1.078125, 1.22265625, 1.3671875, 1.51171875, 1.65625, 1.80078125, 1.9453125, 2.08984375, 2.234375, 2.37890625, 2.5234375, 2.66796875, 2.8125, 2.95703125, 3.1015625, 3.24609375, 3.390625, 3.53515625, 3.6796875, 3.82421875, 3.96875, 4.11328125, 4.2578125, 4.40234375, 4.546875, 4.69140625, 4.8359375, 4.98046875, 5.125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 5.0, 19.0, 22.0, 41.0, 79.0, 139.0, 250.0, 500.0, 880.0, 859.0, 529.0, 309.0, 172.0, 104.0, 67.0, 34.0, 24.0, 10.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.1148681640625, -8.776611328125, -8.4383544921875, -8.10009765625, -7.7618408203125, -7.423583984375, -7.0853271484375, -6.7470703125, -6.4088134765625, -6.070556640625, -5.7322998046875, -5.39404296875, -5.0557861328125, -4.717529296875, -4.3792724609375, -4.041015625, -3.7027587890625, -3.364501953125, -3.0262451171875, -2.68798828125, -2.3497314453125, -2.011474609375, -1.6732177734375, -1.3349609375, -0.9967041015625, -0.658447265625, -0.3201904296875, 0.01806640625, 0.3563232421875, 0.694580078125, 1.0328369140625, 1.37109375, 1.7093505859375, 2.047607421875, 2.3858642578125, 2.72412109375, 3.0623779296875, 3.400634765625, 3.7388916015625, 4.0771484375, 4.4154052734375, 4.753662109375, 5.0919189453125, 5.43017578125, 5.7684326171875, 6.106689453125, 6.4449462890625, 6.783203125, 7.1214599609375, 7.459716796875, 7.7979736328125, 8.13623046875, 8.4744873046875, 8.812744140625, 9.1510009765625, 9.4892578125, 9.8275146484375, 10.165771484375, 10.5040283203125, 10.84228515625, 11.1805419921875, 11.518798828125, 11.8570556640625, 12.1953125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 16.0, 16.0, 20.0, 50.0, 76.0, 159.0, 269.0, 602.0, 1602.0, 8923.0, 3179612.0, 993909.0, 6244.0, 1496.0, 606.0, 279.0, 160.0, 84.0, 52.0, 28.0, 20.0, 14.0, 9.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.96875, -27.93115234375, -26.8935546875, -25.85595703125, -24.818359375, -23.78076171875, -22.7431640625, -21.70556640625, -20.66796875, -19.63037109375, -18.5927734375, -17.55517578125, -16.517578125, -15.47998046875, -14.4423828125, -13.40478515625, -12.3671875, -11.32958984375, -10.2919921875, -9.25439453125, -8.216796875, -7.17919921875, -6.1416015625, -5.10400390625, -4.06640625, -3.02880859375, -1.9912109375, -0.95361328125, 0.083984375, 1.12158203125, 2.1591796875, 3.19677734375, 4.234375, 5.27197265625, 6.3095703125, 7.34716796875, 8.384765625, 9.42236328125, 10.4599609375, 11.49755859375, 12.53515625, 13.57275390625, 14.6103515625, 15.64794921875, 16.685546875, 17.72314453125, 18.7607421875, 19.79833984375, 20.8359375, 21.87353515625, 22.9111328125, 23.94873046875, 24.986328125, 26.02392578125, 27.0615234375, 28.09912109375, 29.13671875, 30.17431640625, 31.2119140625, 32.24951171875, 33.287109375, 34.32470703125, 35.3623046875, 36.39990234375, 37.4375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 599.0, 389.0, 14.0, 1.0, 1.0, 0.0, 1.0], "bins": [-297.2367858886719, -292.0941467285156, -286.9515075683594, -281.8088684082031, -276.6662292480469, -271.5235900878906, -266.3809509277344, -261.2383117675781, -256.0956726074219, -250.95303344726562, -245.81039428710938, -240.66775512695312, -235.52511596679688, -230.38247680664062, -225.23983764648438, -220.09718322753906, -214.95452880859375, -209.8118896484375, -204.66925048828125, -199.526611328125, -194.38397216796875, -189.2413330078125, -184.09869384765625, -178.95603942871094, -173.81341552734375, -168.6707763671875, -163.52813720703125, -158.385498046875, -153.24285888671875, -148.1002197265625, -142.95758056640625, -137.81492614746094, -132.67227172851562, -127.52963256835938, -122.38699340820312, -117.24435424804688, -112.1017074584961, -106.95906829833984, -101.8164291381836, -96.67378234863281, -91.5311508178711, -86.38851165771484, -81.2458724975586, -76.10322570800781, -70.96058654785156, -65.81794738769531, -60.67530822753906, -55.53266525268555, -50.39002227783203, -45.24738311767578, -40.104740142822266, -34.962100982666016, -29.819459915161133, -24.67681884765625, -19.5341796875, -14.391536712646484, -9.248899459838867, -4.106258869171143, 1.036381721496582, 6.179021835327148, 11.321662902832031, 16.464303970336914, 21.606943130493164, 26.74958610534668, 31.89222526550293]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 9.0, 9.0, 5.0, 3.0, 6.0, 13.0, 10.0, 13.0, 13.0, 22.0, 18.0, 24.0, 26.0, 26.0, 35.0, 33.0, 24.0, 38.0, 37.0, 43.0, 42.0, 56.0, 36.0, 44.0, 43.0, 49.0, 34.0, 33.0, 37.0, 33.0, 38.0, 26.0, 24.0, 22.0, 16.0, 10.0, 13.0, 9.0, 13.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-30.77267074584961, -29.925748825073242, -29.078826904296875, -28.23190689086914, -27.384984970092773, -26.538063049316406, -25.691143035888672, -24.844221115112305, -23.997299194335938, -23.15037727355957, -22.303455352783203, -21.45653533935547, -20.6096134185791, -19.762691497802734, -18.915771484375, -18.068849563598633, -17.221927642822266, -16.3750057220459, -15.528084754943848, -14.681163787841797, -13.83424186706543, -12.987319946289062, -12.140398979187012, -11.293478012084961, -10.446556091308594, -9.599634170532227, -8.752713203430176, -7.905791759490967, -7.058870315551758, -6.211948871612549, -5.36502742767334, -4.518105983734131, -3.671182632446289, -2.82426118850708, -1.977339744567871, -1.130418300628662, -0.2834968566894531, 0.5634245872497559, 1.4103460311889648, 2.257267475128174, 3.104188919067383, 3.951110363006592, 4.798031806945801, 5.64495325088501, 6.491874694824219, 7.338796138763428, 8.185717582702637, 9.032638549804688, 9.879560470581055, 10.726482391357422, 11.573403358459473, 12.420324325561523, 13.26724624633789, 14.114168167114258, 14.961089134216309, 15.80801010131836, 16.654932022094727, 17.501853942871094, 18.348773956298828, 19.195695877075195, 20.042617797851562, 20.88953971862793, 21.736461639404297, 22.58338165283203, 23.4303035736084]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 1.0, 5.0, 6.0, 10.0, 12.0, 11.0, 15.0, 21.0, 19.0, 23.0, 24.0, 20.0, 34.0, 44.0, 35.0, 41.0, 42.0, 37.0, 47.0, 54.0, 51.0, 45.0, 46.0, 49.0, 37.0, 43.0, 34.0, 22.0, 31.0, 25.0, 18.0, 29.0, 10.0, 11.0, 8.0, 13.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.499847412109375, -1.44500732421875, -1.390167236328125, -1.3353271484375, -1.280487060546875, -1.22564697265625, -1.170806884765625, -1.115966796875, -1.061126708984375, -1.00628662109375, -0.951446533203125, -0.8966064453125, -0.841766357421875, -0.78692626953125, -0.732086181640625, -0.67724609375, -0.622406005859375, -0.56756591796875, -0.512725830078125, -0.4578857421875, -0.403045654296875, -0.34820556640625, -0.293365478515625, -0.238525390625, -0.183685302734375, -0.12884521484375, -0.074005126953125, -0.0191650390625, 0.035675048828125, 0.09051513671875, 0.145355224609375, 0.2001953125, 0.255035400390625, 0.30987548828125, 0.364715576171875, 0.4195556640625, 0.474395751953125, 0.52923583984375, 0.584075927734375, 0.638916015625, 0.693756103515625, 0.74859619140625, 0.803436279296875, 0.8582763671875, 0.913116455078125, 0.96795654296875, 1.022796630859375, 1.07763671875, 1.132476806640625, 1.18731689453125, 1.242156982421875, 1.2969970703125, 1.351837158203125, 1.40667724609375, 1.461517333984375, 1.516357421875, 1.571197509765625, 1.62603759765625, 1.680877685546875, 1.7357177734375, 1.790557861328125, 1.84539794921875, 1.900238037109375, 1.955078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 14.0, 15.0, 17.0, 22.0, 40.0, 54.0, 88.0, 110.0, 148.0, 280.0, 350.0, 479.0, 804.0, 1204.0, 1724.0, 2618.0, 4032.0, 5900.0, 9354.0, 14738.0, 23585.0, 39743.0, 70557.0, 137214.0, 308373.0, 198468.0, 94899.0, 51644.0, 30078.0, 18486.0, 11625.0, 7476.0, 4740.0, 3281.0, 2010.0, 1463.0, 950.0, 596.0, 452.0, 325.0, 193.0, 119.0, 112.0, 67.0, 42.0, 30.0, 14.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.29345703125, -0.284210205078125, -0.27496337890625, -0.265716552734375, -0.2564697265625, -0.247222900390625, -0.23797607421875, -0.228729248046875, -0.219482421875, -0.210235595703125, -0.20098876953125, -0.191741943359375, -0.1824951171875, -0.173248291015625, -0.16400146484375, -0.154754638671875, -0.1455078125, -0.136260986328125, -0.12701416015625, -0.117767333984375, -0.1085205078125, -0.099273681640625, -0.09002685546875, -0.080780029296875, -0.071533203125, -0.062286376953125, -0.05303955078125, -0.043792724609375, -0.0345458984375, -0.025299072265625, -0.01605224609375, -0.006805419921875, 0.00244140625, 0.011688232421875, 0.02093505859375, 0.030181884765625, 0.0394287109375, 0.048675537109375, 0.05792236328125, 0.067169189453125, 0.076416015625, 0.085662841796875, 0.09490966796875, 0.104156494140625, 0.1134033203125, 0.122650146484375, 0.13189697265625, 0.141143798828125, 0.150390625, 0.159637451171875, 0.16888427734375, 0.178131103515625, 0.1873779296875, 0.196624755859375, 0.20587158203125, 0.215118408203125, 0.224365234375, 0.233612060546875, 0.24285888671875, 0.252105712890625, 0.2613525390625, 0.270599365234375, 0.27984619140625, 0.289093017578125, 0.29833984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 8.0, 4.0, 14.0, 12.0, 11.0, 21.0, 13.0, 12.0, 25.0, 24.0, 33.0, 31.0, 23.0, 32.0, 45.0, 43.0, 40.0, 40.0, 44.0, 1081.0, 27.0, 39.0, 37.0, 32.0, 34.0, 36.0, 26.0, 27.0, 24.0, 25.0, 22.0, 32.0, 20.0, 20.0, 15.0, 15.0, 3.0, 7.0, 6.0, 7.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0634765625, -1.03118896484375, -0.9989013671875, -0.96661376953125, -0.934326171875, -0.90203857421875, -0.8697509765625, -0.83746337890625, -0.80517578125, -0.77288818359375, -0.7406005859375, -0.70831298828125, -0.676025390625, -0.64373779296875, -0.6114501953125, -0.57916259765625, -0.546875, -0.51458740234375, -0.4822998046875, -0.45001220703125, -0.417724609375, -0.38543701171875, -0.3531494140625, -0.32086181640625, -0.28857421875, -0.25628662109375, -0.2239990234375, -0.19171142578125, -0.159423828125, -0.12713623046875, -0.0948486328125, -0.06256103515625, -0.0302734375, 0.00201416015625, 0.0343017578125, 0.06658935546875, 0.098876953125, 0.13116455078125, 0.1634521484375, 0.19573974609375, 0.22802734375, 0.26031494140625, 0.2926025390625, 0.32489013671875, 0.357177734375, 0.38946533203125, 0.4217529296875, 0.45404052734375, 0.486328125, 0.51861572265625, 0.5509033203125, 0.58319091796875, 0.615478515625, 0.64776611328125, 0.6800537109375, 0.71234130859375, 0.74462890625, 0.77691650390625, 0.8092041015625, 0.84149169921875, 0.873779296875, 0.90606689453125, 0.9383544921875, 0.97064208984375, 1.0029296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 16.0, 14.0, 23.0, 41.0, 55.0, 63.0, 108.0, 153.0, 223.0, 340.0, 488.0, 654.0, 957.0, 1436.0, 1972.0, 2964.0, 4471.0, 6159.0, 8963.0, 12893.0, 18837.0, 27545.0, 41787.0, 66383.0, 116669.0, 1289573.0, 209407.0, 103500.0, 60285.0, 38497.0, 25841.0, 17584.0, 11864.0, 8388.0, 5704.0, 3864.0, 2744.0, 1912.0, 1381.0, 964.0, 705.0, 447.0, 370.0, 242.0, 189.0, 142.0, 94.0, 77.0, 43.0, 34.0, 29.0, 10.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0], "bins": [-0.2288818359375, -0.22170639038085938, -0.21453094482421875, -0.20735549926757812, -0.2001800537109375, -0.19300460815429688, -0.18582916259765625, -0.17865371704101562, -0.171478271484375, -0.16430282592773438, -0.15712738037109375, -0.14995193481445312, -0.1427764892578125, -0.13560104370117188, -0.12842559814453125, -0.12125015258789062, -0.11407470703125, -0.10689926147460938, -0.09972381591796875, -0.09254837036132812, -0.0853729248046875, -0.07819747924804688, -0.07102203369140625, -0.06384658813476562, -0.056671142578125, -0.049495697021484375, -0.04232025146484375, -0.035144805908203125, -0.0279693603515625, -0.020793914794921875, -0.01361846923828125, -0.006443023681640625, 0.000732421875, 0.007907867431640625, 0.01508331298828125, 0.022258758544921875, 0.0294342041015625, 0.036609649658203125, 0.04378509521484375, 0.050960540771484375, 0.058135986328125, 0.06531143188476562, 0.07248687744140625, 0.07966232299804688, 0.0868377685546875, 0.09401321411132812, 0.10118865966796875, 0.10836410522460938, 0.11553955078125, 0.12271499633789062, 0.12989044189453125, 0.13706588745117188, 0.1442413330078125, 0.15141677856445312, 0.15859222412109375, 0.16576766967773438, 0.172943115234375, 0.18011856079101562, 0.18729400634765625, 0.19446945190429688, 0.2016448974609375, 0.20882034301757812, 0.21599578857421875, 0.22317123413085938, 0.2303466796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 4.0, 9.0, 9.0, 12.0, 14.0, 14.0, 12.0, 20.0, 26.0, 32.0, 39.0, 48.0, 50.0, 55.0, 53.0, 68.0, 71.0, 65.0, 54.0, 48.0, 52.0, 29.0, 41.0, 27.0, 33.0, 26.0, 10.0, 12.0, 10.0, 10.0, 3.0, 8.0, 9.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.937980651855469e-05, -6.724148988723755e-05, -6.510317325592041e-05, -6.296485662460327e-05, -6.082653999328613e-05, -5.8688223361968994e-05, -5.6549906730651855e-05, -5.441159009933472e-05, -5.227327346801758e-05, -5.013495683670044e-05, -4.79966402053833e-05, -4.585832357406616e-05, -4.3720006942749023e-05, -4.1581690311431885e-05, -3.9443373680114746e-05, -3.730505704879761e-05, -3.516674041748047e-05, -3.302842378616333e-05, -3.089010715484619e-05, -2.8751790523529053e-05, -2.6613473892211914e-05, -2.4475157260894775e-05, -2.2336840629577637e-05, -2.0198523998260498e-05, -1.806020736694336e-05, -1.592189073562622e-05, -1.3783574104309082e-05, -1.1645257472991943e-05, -9.506940841674805e-06, -7.368624210357666e-06, -5.230307579040527e-06, -3.0919909477233887e-06, -9.5367431640625e-07, 1.1846423149108887e-06, 3.3229589462280273e-06, 5.461275577545166e-06, 7.599592208862305e-06, 9.737908840179443e-06, 1.1876225471496582e-05, 1.401454210281372e-05, 1.615285873413086e-05, 1.8291175365447998e-05, 2.0429491996765137e-05, 2.2567808628082275e-05, 2.4706125259399414e-05, 2.6844441890716553e-05, 2.898275852203369e-05, 3.112107515335083e-05, 3.325939178466797e-05, 3.539770841598511e-05, 3.7536025047302246e-05, 3.9674341678619385e-05, 4.1812658309936523e-05, 4.395097494125366e-05, 4.60892915725708e-05, 4.822760820388794e-05, 5.036592483520508e-05, 5.250424146652222e-05, 5.4642558097839355e-05, 5.6780874729156494e-05, 5.891919136047363e-05, 6.105750799179077e-05, 6.319582462310791e-05, 6.533414125442505e-05, 6.747245788574219e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 7.0, 5.0, 11.0, 23.0, 16.0, 21.0, 22.0, 46.0, 32.0, 40.0, 47.0, 59.0, 98.0, 128.0, 149.0, 241.0, 317.0, 469.0, 865.0, 13397.0, 1028482.0, 1825.0, 682.0, 413.0, 285.0, 170.0, 147.0, 146.0, 88.0, 73.0, 44.0, 35.0, 24.0, 23.0, 21.0, 35.0, 9.0, 11.0, 10.0, 5.0, 6.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010995864868164062, -0.001063317060470581, -0.0010270476341247559, -0.0009907782077789307, -0.0009545087814331055, -0.0009182393550872803, -0.0008819699287414551, -0.0008457005023956299, -0.0008094310760498047, -0.0007731616497039795, -0.0007368922233581543, -0.0007006227970123291, -0.0006643533706665039, -0.0006280839443206787, -0.0005918145179748535, -0.0005555450916290283, -0.0005192756652832031, -0.00048300623893737793, -0.00044673681259155273, -0.00041046738624572754, -0.00037419795989990234, -0.00033792853355407715, -0.00030165910720825195, -0.00026538968086242676, -0.00022912025451660156, -0.00019285082817077637, -0.00015658140182495117, -0.00012031197547912598, -8.404254913330078e-05, -4.7773122787475586e-05, -1.150369644165039e-05, 2.4765729904174805e-05, 6.103515625e-05, 9.73045825958252e-05, 0.0001335740089416504, 0.00016984343528747559, 0.00020611286163330078, 0.00024238228797912598, 0.00027865171432495117, 0.00031492114067077637, 0.00035119056701660156, 0.00038745999336242676, 0.00042372941970825195, 0.00045999884605407715, 0.0004962682723999023, 0.0005325376987457275, 0.0005688071250915527, 0.0006050765514373779, 0.0006413459777832031, 0.0006776154041290283, 0.0007138848304748535, 0.0007501542568206787, 0.0007864236831665039, 0.0008226931095123291, 0.0008589625358581543, 0.0008952319622039795, 0.0009315013885498047, 0.0009677708148956299, 0.001004040241241455, 0.0010403096675872803, 0.0010765790939331055, 0.0011128485202789307, 0.0011491179466247559, 0.001185387372970581, 0.0012216567993164062]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 35.0, 888.0, 93.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001707318442640826, -0.00016243892605416477, -0.00015414600784424692, -0.00014585308963432908, -0.000137560156872496, -0.00012926723866257817, -0.00012097432045266032, -0.00011268140224274248, -0.00010438847675686702, -9.609555854694918e-05, -8.780263306107372e-05, -7.950971485115588e-05, -7.121679664123803e-05, -6.292387115536258e-05, -5.463095294544473e-05, -4.633803109754808e-05, -3.804510924965143e-05, -2.975218740175478e-05, -2.1459267372847535e-05, -1.3166347343940288e-05, -4.873425496043637e-06, 3.419496351853013e-06, 1.1712414561770856e-05, 2.0005336409667507e-05, 2.8298258257564157e-05, 3.659118010546081e-05, 4.488410195335746e-05, 5.31770201632753e-05, 6.146993837319314e-05, 6.97628638590686e-05, 7.805578206898645e-05, 8.63487075548619e-05, 9.464164031669497e-05, 0.00010293455852661282, 0.00011122748401248828, 0.00011952040222240612, 0.00012781332770828158, 0.00013610624591819942, 0.00014439916412811726, 0.0001526920823380351, 0.00016098501509986818, 0.00016927793330978602, 0.00017757085151970387, 0.00018586378428153694, 0.00019415670249145478, 0.00020244962070137262, 0.00021074253891129047, 0.0002190354571212083, 0.00022732837533112615, 0.000235621293541044, 0.00024391421175096184, 0.0002522071299608797, 0.00026050006272271276, 0.00026879296638071537, 0.00027708589914254844, 0.0002853788319043815, 0.00029367173556238413, 0.0003019646683242172, 0.0003102575719822198, 0.0003185505047440529, 0.0003268434084020555, 0.0003351363411638886, 0.00034342927392572165, 0.00035172217758372426, 0.00036001511034555733]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 4.0, 7.0, 10.0, 15.0, 13.0, 15.0, 11.0, 13.0, 19.0, 27.0, 22.0, 32.0, 38.0, 26.0, 32.0, 28.0, 41.0, 27.0, 37.0, 38.0, 46.0, 49.0, 46.0, 37.0, 39.0, 33.0, 21.0, 31.0, 25.0, 15.0, 27.0, 17.0, 40.0, 22.0, 21.0, 14.0, 12.0, 6.0, 9.0, 7.0, 4.0, 5.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.635883331298828e-05, -3.5315752029418945e-05, -3.427267074584961e-05, -3.3229589462280273e-05, -3.218650817871094e-05, -3.11434268951416e-05, -3.0100345611572266e-05, -2.905726432800293e-05, -2.8014183044433594e-05, -2.6971101760864258e-05, -2.5928020477294922e-05, -2.4884939193725586e-05, -2.384185791015625e-05, -2.2798776626586914e-05, -2.1755695343017578e-05, -2.0712614059448242e-05, -1.9669532775878906e-05, -1.862645149230957e-05, -1.7583370208740234e-05, -1.65402889251709e-05, -1.5497207641601562e-05, -1.4454126358032227e-05, -1.341104507446289e-05, -1.2367963790893555e-05, -1.1324882507324219e-05, -1.0281801223754883e-05, -9.238719940185547e-06, -8.195638656616211e-06, -7.152557373046875e-06, -6.109476089477539e-06, -5.066394805908203e-06, -4.023313522338867e-06, -2.9802322387695312e-06, -1.9371509552001953e-06, -8.940696716308594e-07, 1.4901161193847656e-07, 1.1920928955078125e-06, 2.2351741790771484e-06, 3.2782554626464844e-06, 4.32133674621582e-06, 5.364418029785156e-06, 6.407499313354492e-06, 7.450580596923828e-06, 8.493661880493164e-06, 9.5367431640625e-06, 1.0579824447631836e-05, 1.1622905731201172e-05, 1.2665987014770508e-05, 1.3709068298339844e-05, 1.475214958190918e-05, 1.5795230865478516e-05, 1.683831214904785e-05, 1.7881393432617188e-05, 1.8924474716186523e-05, 1.996755599975586e-05, 2.1010637283325195e-05, 2.205371856689453e-05, 2.3096799850463867e-05, 2.4139881134033203e-05, 2.518296241760254e-05, 2.6226043701171875e-05, 2.726912498474121e-05, 2.8312206268310547e-05, 2.9355287551879883e-05, 3.039836883544922e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 1.0, 5.0, 6.0, 10.0, 12.0, 11.0, 15.0, 21.0, 19.0, 23.0, 24.0, 20.0, 34.0, 44.0, 35.0, 41.0, 42.0, 37.0, 47.0, 54.0, 51.0, 45.0, 46.0, 49.0, 37.0, 43.0, 34.0, 22.0, 31.0, 25.0, 18.0, 29.0, 10.0, 11.0, 8.0, 13.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.499847412109375, -1.44500732421875, -1.390167236328125, -1.3353271484375, -1.280487060546875, -1.22564697265625, -1.170806884765625, -1.115966796875, -1.061126708984375, -1.00628662109375, -0.951446533203125, -0.8966064453125, -0.841766357421875, -0.78692626953125, -0.732086181640625, -0.67724609375, -0.622406005859375, -0.56756591796875, -0.512725830078125, -0.4578857421875, -0.403045654296875, -0.34820556640625, -0.293365478515625, -0.238525390625, -0.183685302734375, -0.12884521484375, -0.074005126953125, -0.0191650390625, 0.035675048828125, 0.09051513671875, 0.145355224609375, 0.2001953125, 0.255035400390625, 0.30987548828125, 0.364715576171875, 0.4195556640625, 0.474395751953125, 0.52923583984375, 0.584075927734375, 0.638916015625, 0.693756103515625, 0.74859619140625, 0.803436279296875, 0.8582763671875, 0.913116455078125, 0.96795654296875, 1.022796630859375, 1.07763671875, 1.132476806640625, 1.18731689453125, 1.242156982421875, 1.2969970703125, 1.351837158203125, 1.40667724609375, 1.461517333984375, 1.516357421875, 1.571197509765625, 1.62603759765625, 1.680877685546875, 1.7357177734375, 1.790557861328125, 1.84539794921875, 1.900238037109375, 1.955078125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 5.0, 5.0, 13.0, 17.0, 24.0, 24.0, 36.0, 54.0, 65.0, 93.0, 108.0, 167.0, 204.0, 284.0, 385.0, 512.0, 709.0, 1041.0, 1343.0, 1881.0, 2874.0, 4679.0, 8767.0, 20892.0, 101709.0, 672134.0, 176356.0, 27795.0, 10147.0, 5401.0, 3226.0, 2145.0, 1514.0, 1046.0, 707.0, 560.0, 471.0, 280.0, 213.0, 179.0, 129.0, 92.0, 70.0, 59.0, 44.0, 22.0, 19.0, 17.0, 15.0, 9.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.63909912109375, -6.4071044921875, -6.17510986328125, -5.943115234375, -5.71112060546875, -5.4791259765625, -5.24713134765625, -5.01513671875, -4.78314208984375, -4.5511474609375, -4.31915283203125, -4.087158203125, -3.85516357421875, -3.6231689453125, -3.39117431640625, -3.1591796875, -2.92718505859375, -2.6951904296875, -2.46319580078125, -2.231201171875, -1.99920654296875, -1.7672119140625, -1.53521728515625, -1.30322265625, -1.07122802734375, -0.8392333984375, -0.60723876953125, -0.375244140625, -0.14324951171875, 0.0887451171875, 0.32073974609375, 0.552734375, 0.78472900390625, 1.0167236328125, 1.24871826171875, 1.480712890625, 1.71270751953125, 1.9447021484375, 2.17669677734375, 2.40869140625, 2.64068603515625, 2.8726806640625, 3.10467529296875, 3.336669921875, 3.56866455078125, 3.8006591796875, 4.03265380859375, 4.2646484375, 4.49664306640625, 4.7286376953125, 4.96063232421875, 5.192626953125, 5.42462158203125, 5.6566162109375, 5.88861083984375, 6.12060546875, 6.35260009765625, 6.5845947265625, 6.81658935546875, 7.048583984375, 7.28057861328125, 7.5125732421875, 7.74456787109375, 7.9765625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 15.0, 14.0, 17.0, 11.0, 15.0, 21.0, 25.0, 22.0, 30.0, 28.0, 40.0, 37.0, 41.0, 65.0, 113.0, 190.0, 276.0, 1370.0, 167.0, 92.0, 65.0, 62.0, 34.0, 34.0, 28.0, 26.0, 36.0, 17.0, 21.0, 20.0, 18.0, 10.0, 10.0, 10.0, 6.0, 9.0, 9.0, 3.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0], "bins": [-5.6953125, -5.5328369140625, -5.370361328125, -5.2078857421875, -5.04541015625, -4.8829345703125, -4.720458984375, -4.5579833984375, -4.3955078125, -4.2330322265625, -4.070556640625, -3.9080810546875, -3.74560546875, -3.5831298828125, -3.420654296875, -3.2581787109375, -3.095703125, -2.9332275390625, -2.770751953125, -2.6082763671875, -2.44580078125, -2.2833251953125, -2.120849609375, -1.9583740234375, -1.7958984375, -1.6334228515625, -1.470947265625, -1.3084716796875, -1.14599609375, -0.9835205078125, -0.821044921875, -0.6585693359375, -0.49609375, -0.3336181640625, -0.171142578125, -0.0086669921875, 0.15380859375, 0.3162841796875, 0.478759765625, 0.6412353515625, 0.8037109375, 0.9661865234375, 1.128662109375, 1.2911376953125, 1.45361328125, 1.6160888671875, 1.778564453125, 1.9410400390625, 2.103515625, 2.2659912109375, 2.428466796875, 2.5909423828125, 2.75341796875, 2.9158935546875, 3.078369140625, 3.2408447265625, 3.4033203125, 3.5657958984375, 3.728271484375, 3.8907470703125, 4.05322265625, 4.2156982421875, 4.378173828125, 4.5406494140625, 4.703125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 10.0, 4.0, 6.0, 9.0, 8.0, 11.0, 9.0, 13.0, 16.0, 12.0, 25.0, 14.0, 27.0, 35.0, 35.0, 73.0, 102.0, 154.0, 274.0, 631.0, 2175.0, 68979.0, 3052408.0, 18001.0, 1447.0, 482.0, 242.0, 125.0, 69.0, 54.0, 35.0, 27.0, 39.0, 29.0, 21.0, 11.0, 14.0, 19.0, 11.0, 11.0, 9.0, 6.0, 4.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.640625, -17.0400390625, -16.439453125, -15.8388671875, -15.23828125, -14.6376953125, -14.037109375, -13.4365234375, -12.8359375, -12.2353515625, -11.634765625, -11.0341796875, -10.43359375, -9.8330078125, -9.232421875, -8.6318359375, -8.03125, -7.4306640625, -6.830078125, -6.2294921875, -5.62890625, -5.0283203125, -4.427734375, -3.8271484375, -3.2265625, -2.6259765625, -2.025390625, -1.4248046875, -0.82421875, -0.2236328125, 0.376953125, 0.9775390625, 1.578125, 2.1787109375, 2.779296875, 3.3798828125, 3.98046875, 4.5810546875, 5.181640625, 5.7822265625, 6.3828125, 6.9833984375, 7.583984375, 8.1845703125, 8.78515625, 9.3857421875, 9.986328125, 10.5869140625, 11.1875, 11.7880859375, 12.388671875, 12.9892578125, 13.58984375, 14.1904296875, 14.791015625, 15.3916015625, 15.9921875, 16.5927734375, 17.193359375, 17.7939453125, 18.39453125, 18.9951171875, 19.595703125, 20.1962890625, 20.796875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 169.0, 657.0, 167.0, 10.0, 0.0, 1.0], "bins": [-82.16666412353516, -80.78565216064453, -79.4046401977539, -78.02362823486328, -76.64261627197266, -75.26160430908203, -73.8805923461914, -72.49958038330078, -71.11856842041016, -69.73755645751953, -68.3565444946289, -66.97553253173828, -65.59452056884766, -64.21350860595703, -62.832496643066406, -61.45148468017578, -60.070472717285156, -58.68946075439453, -57.308448791503906, -55.92743682861328, -54.546424865722656, -53.16541290283203, -51.784400939941406, -50.40338897705078, -49.02237319946289, -47.641361236572266, -46.26034927368164, -44.879337310791016, -43.49832534790039, -42.117313385009766, -40.73630142211914, -39.355289459228516, -37.97427749633789, -36.593265533447266, -35.21225357055664, -33.831241607666016, -32.45022964477539, -31.069217681884766, -29.68820571899414, -28.307193756103516, -26.92618179321289, -25.545169830322266, -24.16415786743164, -22.783145904541016, -21.40213394165039, -20.021121978759766, -18.64011001586914, -17.259098052978516, -15.878084182739258, -14.497072219848633, -13.116060256958008, -11.735048294067383, -10.354036331176758, -8.973024368286133, -7.592011451721191, -6.210999488830566, -4.829987525939941, -3.4489755630493164, -2.0679633617401123, -0.6869511604309082, 0.6940608024597168, 2.075072765350342, 3.456085205078125, 4.83709716796875, 6.218109130859375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 6.0, 6.0, 16.0, 17.0, 16.0, 19.0, 15.0, 27.0, 13.0, 28.0, 30.0, 31.0, 27.0, 36.0, 43.0, 42.0, 28.0, 49.0, 37.0, 41.0, 37.0, 34.0, 43.0, 29.0, 33.0, 37.0, 25.0, 17.0, 39.0, 14.0, 22.0, 25.0, 12.0, 9.0, 16.0, 12.0, 7.0, 6.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.75569725036621, -16.251174926757812, -15.746650695800781, -15.242127418518066, -14.737604141235352, -14.233081817626953, -13.728558540344238, -13.224035263061523, -12.719511985778809, -12.214988708496094, -11.710465431213379, -11.205942153930664, -10.701419830322266, -10.196895599365234, -9.692373275756836, -9.187849998474121, -8.683326721191406, -8.178803443908691, -7.674280166625977, -7.16975736618042, -6.665234088897705, -6.16071081161499, -5.656188011169434, -5.151664733886719, -4.647141456604004, -4.142618179321289, -3.6380951404571533, -3.1335721015930176, -2.6290488243103027, -2.124525547027588, -1.6200025081634521, -1.1154794692993164, -0.6109542846679688, -0.10643112659454346, 0.39809203147888184, 0.9026151895523071, 1.4071383476257324, 1.9116616249084473, 2.416184663772583, 2.9207077026367188, 3.4252309799194336, 3.9297542572021484, 4.434277534484863, 4.93880033493042, 5.443323612213135, 5.94784688949585, 6.452369689941406, 6.956892967224121, 7.461416244506836, 7.965939521789551, 8.470462799072266, 8.97498607635498, 9.479509353637695, 9.984031677246094, 10.488554954528809, 10.993078231811523, 11.497601509094238, 12.002124786376953, 12.506648063659668, 13.011171340942383, 13.515693664550781, 14.020217895507812, 14.524740219116211, 15.029263496398926, 15.53378677368164]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 10.0, 7.0, 5.0, 11.0, 10.0, 13.0, 19.0, 15.0, 20.0, 27.0, 26.0, 27.0, 31.0, 43.0, 43.0, 26.0, 47.0, 43.0, 47.0, 55.0, 53.0, 44.0, 42.0, 42.0, 45.0, 35.0, 33.0, 28.0, 30.0, 23.0, 17.0, 20.0, 12.0, 18.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.685760498046875, -1.62542724609375, -1.565093994140625, -1.5047607421875, -1.444427490234375, -1.38409423828125, -1.323760986328125, -1.263427734375, -1.203094482421875, -1.14276123046875, -1.082427978515625, -1.0220947265625, -0.961761474609375, -0.90142822265625, -0.841094970703125, -0.78076171875, -0.720428466796875, -0.66009521484375, -0.599761962890625, -0.5394287109375, -0.479095458984375, -0.41876220703125, -0.358428955078125, -0.298095703125, -0.237762451171875, -0.17742919921875, -0.117095947265625, -0.0567626953125, 0.003570556640625, 0.06390380859375, 0.124237060546875, 0.1845703125, 0.244903564453125, 0.30523681640625, 0.365570068359375, 0.4259033203125, 0.486236572265625, 0.54656982421875, 0.606903076171875, 0.667236328125, 0.727569580078125, 0.78790283203125, 0.848236083984375, 0.9085693359375, 0.968902587890625, 1.02923583984375, 1.089569091796875, 1.14990234375, 1.210235595703125, 1.27056884765625, 1.330902099609375, 1.3912353515625, 1.451568603515625, 1.51190185546875, 1.572235107421875, 1.632568359375, 1.692901611328125, 1.75323486328125, 1.813568115234375, 1.8739013671875, 1.934234619140625, 1.99456787109375, 2.054901123046875, 2.115234375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 11.0, 6.0, 7.0, 15.0, 17.0, 22.0, 29.0, 47.0, 58.0, 89.0, 111.0, 138.0, 217.0, 327.0, 539.0, 925.0, 1530.0, 2854.0, 5924.0, 13750.0, 42170.0, 237811.0, 2545061.0, 1187643.0, 109444.0, 26385.0, 9608.0, 4283.0, 2172.0, 1148.0, 651.0, 391.0, 261.0, 177.0, 108.0, 92.0, 71.0, 41.0, 37.0, 29.0, 15.0, 13.0, 14.0, 6.0, 6.0, 3.0, 6.0, 1.0, 8.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.64453125, -7.41839599609375, -7.1922607421875, -6.96612548828125, -6.739990234375, -6.51385498046875, -6.2877197265625, -6.06158447265625, -5.83544921875, -5.60931396484375, -5.3831787109375, -5.15704345703125, -4.930908203125, -4.70477294921875, -4.4786376953125, -4.25250244140625, -4.0263671875, -3.80023193359375, -3.5740966796875, -3.34796142578125, -3.121826171875, -2.89569091796875, -2.6695556640625, -2.44342041015625, -2.21728515625, -1.99114990234375, -1.7650146484375, -1.53887939453125, -1.312744140625, -1.08660888671875, -0.8604736328125, -0.63433837890625, -0.408203125, -0.18206787109375, 0.0440673828125, 0.27020263671875, 0.496337890625, 0.72247314453125, 0.9486083984375, 1.17474365234375, 1.40087890625, 1.62701416015625, 1.8531494140625, 2.07928466796875, 2.305419921875, 2.53155517578125, 2.7576904296875, 2.98382568359375, 3.2099609375, 3.43609619140625, 3.6622314453125, 3.88836669921875, 4.114501953125, 4.34063720703125, 4.5667724609375, 4.79290771484375, 5.01904296875, 5.24517822265625, 5.4713134765625, 5.69744873046875, 5.923583984375, 6.14971923828125, 6.3758544921875, 6.60198974609375, 6.828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 12.0, 11.0, 19.0, 43.0, 66.0, 92.0, 180.0, 266.0, 498.0, 779.0, 794.0, 508.0, 348.0, 197.0, 102.0, 69.0, 43.0, 18.0, 15.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.5302734375, -6.169921875, -5.8095703125, -5.44921875, -5.0888671875, -4.728515625, -4.3681640625, -4.0078125, -3.6474609375, -3.287109375, -2.9267578125, -2.56640625, -2.2060546875, -1.845703125, -1.4853515625, -1.125, -0.7646484375, -0.404296875, -0.0439453125, 0.31640625, 0.6767578125, 1.037109375, 1.3974609375, 1.7578125, 2.1181640625, 2.478515625, 2.8388671875, 3.19921875, 3.5595703125, 3.919921875, 4.2802734375, 4.640625, 5.0009765625, 5.361328125, 5.7216796875, 6.08203125, 6.4423828125, 6.802734375, 7.1630859375, 7.5234375, 7.8837890625, 8.244140625, 8.6044921875, 8.96484375, 9.3251953125, 9.685546875, 10.0458984375, 10.40625, 10.7666015625, 11.126953125, 11.4873046875, 11.84765625, 12.2080078125, 12.568359375, 12.9287109375, 13.2890625, 13.6494140625, 14.009765625, 14.3701171875, 14.73046875, 15.0908203125, 15.451171875, 15.8115234375, 16.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 15.0, 28.0, 41.0, 72.0, 140.0, 280.0, 878.0, 13716.0, 4160214.0, 17197.0, 1008.0, 329.0, 131.0, 75.0, 54.0, 36.0, 13.0, 17.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0], "bins": [-70.9375, -69.475341796875, -68.01318359375, -66.551025390625, -65.0888671875, -63.626708984375, -62.16455078125, -60.702392578125, -59.240234375, -57.778076171875, -56.31591796875, -54.853759765625, -53.3916015625, -51.929443359375, -50.46728515625, -49.005126953125, -47.54296875, -46.080810546875, -44.61865234375, -43.156494140625, -41.6943359375, -40.232177734375, -38.77001953125, -37.307861328125, -35.845703125, -34.383544921875, -32.92138671875, -31.459228515625, -29.9970703125, -28.534912109375, -27.07275390625, -25.610595703125, -24.1484375, -22.686279296875, -21.22412109375, -19.761962890625, -18.2998046875, -16.837646484375, -15.37548828125, -13.913330078125, -12.451171875, -10.989013671875, -9.52685546875, -8.064697265625, -6.6025390625, -5.140380859375, -3.67822265625, -2.216064453125, -0.75390625, 0.708251953125, 2.17041015625, 3.632568359375, 5.0947265625, 6.556884765625, 8.01904296875, 9.481201171875, 10.943359375, 12.405517578125, 13.86767578125, 15.329833984375, 16.7919921875, 18.254150390625, 19.71630859375, 21.178466796875, 22.640625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 31.0, 631.0, 349.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.17491149902344, -168.1968994140625, -163.2188720703125, -158.24085998535156, -153.26283264160156, -148.28482055664062, -143.30679321289062, -138.3287811279297, -133.35076904296875, -128.3727569580078, -123.39472961425781, -118.41670989990234, -113.43869018554688, -108.46067810058594, -103.48265838623047, -98.504638671875, -93.526611328125, -88.54859161376953, -83.57057189941406, -78.5925521850586, -73.61453247070312, -68.63652038574219, -63.65850067138672, -58.68048095703125, -53.70246124267578, -48.72444152832031, -43.746421813964844, -38.76840591430664, -33.79038619995117, -28.812366485595703, -23.834348678588867, -18.85633087158203, -13.878326416015625, -8.900307655334473, -3.9222888946533203, 1.055729866027832, 6.033748626708984, 11.011768341064453, 15.989786148071289, 20.967803955078125, 25.945823669433594, 30.923843383789062, 35.90186309814453, 40.879878997802734, 45.8578987121582, 50.83591842651367, 55.813934326171875, 60.791954040527344, 65.76997375488281, 70.74799346923828, 75.72601318359375, 80.70403289794922, 85.68205261230469, 90.66006469726562, 95.6380844116211, 100.61610412597656, 105.59412384033203, 110.5721435546875, 115.55016326904297, 120.52818298339844, 125.50619506835938, 130.48422241210938, 135.4622344970703, 140.44024658203125, 145.41827392578125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 18.0, 6.0, 15.0, 17.0, 21.0, 25.0, 26.0, 25.0, 29.0, 31.0, 34.0, 49.0, 41.0, 52.0, 48.0, 38.0, 49.0, 35.0, 62.0, 38.0, 27.0, 33.0, 36.0, 33.0, 33.0, 26.0, 22.0, 18.0, 15.0, 11.0, 10.0, 9.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.26920509338379, -28.47728157043457, -27.68535804748535, -26.893434524536133, -26.101511001586914, -25.309587478637695, -24.517663955688477, -23.725740432739258, -22.93381690979004, -22.14189338684082, -21.3499698638916, -20.558046340942383, -19.766122817993164, -18.974199295043945, -18.182275772094727, -17.390352249145508, -16.59842872619629, -15.80650520324707, -15.014581680297852, -14.222658157348633, -13.430734634399414, -12.638811111450195, -11.846887588500977, -11.054964065551758, -10.263040542602539, -9.47111701965332, -8.679193496704102, -7.887269973754883, -7.095346450805664, -6.303422927856445, -5.511499404907227, -4.719575881958008, -3.927654266357422, -3.135730743408203, -2.3438072204589844, -1.5518836975097656, -0.7599601745605469, 0.031963348388671875, 0.8238868713378906, 1.6158103942871094, 2.407733917236328, 3.199657440185547, 3.9915809631347656, 4.783504486083984, 5.575428009033203, 6.367351531982422, 7.159275054931641, 7.951198577880859, 8.743122100830078, 9.535045623779297, 10.326969146728516, 11.118892669677734, 11.910816192626953, 12.702739715576172, 13.49466323852539, 14.28658676147461, 15.078510284423828, 15.870433807373047, 16.662357330322266, 17.454280853271484, 18.246204376220703, 19.038127899169922, 19.83005142211914, 20.62197494506836, 21.413898468017578]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 10.0, 11.0, 6.0, 7.0, 12.0, 12.0, 18.0, 21.0, 14.0, 22.0, 30.0, 26.0, 29.0, 29.0, 33.0, 28.0, 35.0, 37.0, 43.0, 40.0, 61.0, 50.0, 41.0, 46.0, 40.0, 44.0, 38.0, 29.0, 33.0, 25.0, 20.0, 21.0, 11.0, 20.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9409942626953125, -1.881988525390625, -1.8229827880859375, -1.76397705078125, -1.7049713134765625, -1.645965576171875, -1.5869598388671875, -1.5279541015625, -1.4689483642578125, -1.409942626953125, -1.3509368896484375, -1.29193115234375, -1.2329254150390625, -1.173919677734375, -1.1149139404296875, -1.055908203125, -0.9969024658203125, -0.937896728515625, -0.8788909912109375, -0.81988525390625, -0.7608795166015625, -0.701873779296875, -0.6428680419921875, -0.5838623046875, -0.5248565673828125, -0.465850830078125, -0.4068450927734375, -0.34783935546875, -0.2888336181640625, -0.229827880859375, -0.1708221435546875, -0.11181640625, -0.0528106689453125, 0.006195068359375, 0.0652008056640625, 0.12420654296875, 0.1832122802734375, 0.242218017578125, 0.3012237548828125, 0.3602294921875, 0.4192352294921875, 0.478240966796875, 0.5372467041015625, 0.59625244140625, 0.6552581787109375, 0.714263916015625, 0.7732696533203125, 0.832275390625, 0.8912811279296875, 0.950286865234375, 1.0092926025390625, 1.06829833984375, 1.1273040771484375, 1.186309814453125, 1.2453155517578125, 1.3043212890625, 1.3633270263671875, 1.422332763671875, 1.4813385009765625, 1.54034423828125, 1.5993499755859375, 1.658355712890625, 1.7173614501953125, 1.7763671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 31.0, 28.0, 43.0, 74.0, 102.0, 127.0, 212.0, 341.0, 445.0, 710.0, 988.0, 1548.0, 2371.0, 3366.0, 5271.0, 8430.0, 13109.0, 21275.0, 35288.0, 59312.0, 105862.0, 240259.0, 273999.0, 113601.0, 62751.0, 37111.0, 22422.0, 13931.0, 8684.0, 5610.0, 3744.0, 2474.0, 1596.0, 1085.0, 741.0, 505.0, 351.0, 235.0, 169.0, 103.0, 75.0, 50.0, 41.0, 27.0, 13.0, 9.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.329833984375, -0.3192138671875, -0.30859375, -0.2979736328125, -0.287353515625, -0.2767333984375, -0.26611328125, -0.2554931640625, -0.244873046875, -0.2342529296875, -0.2236328125, -0.2130126953125, -0.202392578125, -0.1917724609375, -0.18115234375, -0.1705322265625, -0.159912109375, -0.1492919921875, -0.138671875, -0.1280517578125, -0.117431640625, -0.1068115234375, -0.09619140625, -0.0855712890625, -0.074951171875, -0.0643310546875, -0.0537109375, -0.0430908203125, -0.032470703125, -0.0218505859375, -0.01123046875, -0.0006103515625, 0.010009765625, 0.0206298828125, 0.03125, 0.0418701171875, 0.052490234375, 0.0631103515625, 0.07373046875, 0.0843505859375, 0.094970703125, 0.1055908203125, 0.1162109375, 0.1268310546875, 0.137451171875, 0.1480712890625, 0.15869140625, 0.1693115234375, 0.179931640625, 0.1905517578125, 0.201171875, 0.2117919921875, 0.222412109375, 0.2330322265625, 0.24365234375, 0.2542724609375, 0.264892578125, 0.2755126953125, 0.2861328125, 0.2967529296875, 0.307373046875, 0.3179931640625, 0.32861328125, 0.3392333984375, 0.349853515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 10.0, 9.0, 16.0, 19.0, 20.0, 22.0, 12.0, 14.0, 16.0, 25.0, 29.0, 25.0, 31.0, 30.0, 32.0, 24.0, 40.0, 38.0, 34.0, 1064.0, 31.0, 37.0, 37.0, 46.0, 37.0, 29.0, 34.0, 24.0, 25.0, 28.0, 22.0, 22.0, 18.0, 21.0, 10.0, 16.0, 9.0, 8.0, 8.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0498046875, -1.0162506103515625, -0.982696533203125, -0.9491424560546875, -0.91558837890625, -0.8820343017578125, -0.848480224609375, -0.8149261474609375, -0.7813720703125, -0.7478179931640625, -0.714263916015625, -0.6807098388671875, -0.64715576171875, -0.6136016845703125, -0.580047607421875, -0.5464935302734375, -0.512939453125, -0.4793853759765625, -0.445831298828125, -0.4122772216796875, -0.37872314453125, -0.3451690673828125, -0.311614990234375, -0.2780609130859375, -0.2445068359375, -0.2109527587890625, -0.177398681640625, -0.1438446044921875, -0.11029052734375, -0.0767364501953125, -0.043182373046875, -0.0096282958984375, 0.02392578125, 0.0574798583984375, 0.091033935546875, 0.1245880126953125, 0.15814208984375, 0.1916961669921875, 0.225250244140625, 0.2588043212890625, 0.2923583984375, 0.3259124755859375, 0.359466552734375, 0.3930206298828125, 0.42657470703125, 0.4601287841796875, 0.493682861328125, 0.5272369384765625, 0.560791015625, 0.5943450927734375, 0.627899169921875, 0.6614532470703125, 0.69500732421875, 0.7285614013671875, 0.762115478515625, 0.7956695556640625, 0.8292236328125, 0.8627777099609375, 0.896331787109375, 0.9298858642578125, 0.96343994140625, 0.9969940185546875, 1.030548095703125, 1.0641021728515625, 1.09765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 8.0, 12.0, 21.0, 39.0, 57.0, 64.0, 90.0, 132.0, 174.0, 280.0, 414.0, 514.0, 696.0, 1026.0, 1412.0, 1910.0, 2671.0, 3779.0, 5171.0, 7078.0, 9874.0, 13753.0, 19038.0, 26981.0, 39583.0, 60424.0, 98990.0, 186081.0, 1275836.0, 119936.0, 69929.0, 45029.0, 30523.0, 21165.0, 15086.0, 10726.0, 7912.0, 5685.0, 4233.0, 3059.0, 2216.0, 1686.0, 1137.0, 793.0, 578.0, 401.0, 275.0, 209.0, 136.0, 111.0, 72.0, 56.0, 25.0, 25.0, 11.0, 7.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.2374267578125, -0.23004531860351562, -0.22266387939453125, -0.21528244018554688, -0.2079010009765625, -0.20051956176757812, -0.19313812255859375, -0.18575668334960938, -0.178375244140625, -0.17099380493164062, -0.16361236572265625, -0.15623092651367188, -0.1488494873046875, -0.14146804809570312, -0.13408660888671875, -0.12670516967773438, -0.11932373046875, -0.11194229125976562, -0.10456085205078125, -0.09717941284179688, -0.0897979736328125, -0.08241653442382812, -0.07503509521484375, -0.06765365600585938, -0.060272216796875, -0.052890777587890625, -0.04550933837890625, -0.038127899169921875, -0.0307464599609375, -0.023365020751953125, -0.01598358154296875, -0.008602142333984375, -0.001220703125, 0.006160736083984375, 0.01354217529296875, 0.020923614501953125, 0.0283050537109375, 0.035686492919921875, 0.04306793212890625, 0.050449371337890625, 0.057830810546875, 0.06521224975585938, 0.07259368896484375, 0.07997512817382812, 0.0873565673828125, 0.09473800659179688, 0.10211944580078125, 0.10950088500976562, 0.11688232421875, 0.12426376342773438, 0.13164520263671875, 0.13902664184570312, 0.1464080810546875, 0.15378952026367188, 0.16117095947265625, 0.16855239868164062, 0.175933837890625, 0.18331527709960938, 0.19069671630859375, 0.19807815551757812, 0.2054595947265625, 0.21284103393554688, 0.22022247314453125, 0.22760391235351562, 0.2349853515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 8.0, 9.0, 10.0, 12.0, 20.0, 21.0, 29.0, 40.0, 47.0, 52.0, 59.0, 66.0, 65.0, 81.0, 82.0, 66.0, 49.0, 49.0, 51.0, 39.0, 33.0, 24.0, 18.0, 14.0, 9.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.578466415405273e-05, -9.315088391304016e-05, -9.051710367202759e-05, -8.788332343101501e-05, -8.524954319000244e-05, -8.261576294898987e-05, -7.99819827079773e-05, -7.734820246696472e-05, -7.471442222595215e-05, -7.208064198493958e-05, -6.9446861743927e-05, -6.681308150291443e-05, -6.417930126190186e-05, -6.154552102088928e-05, -5.891174077987671e-05, -5.6277960538864136e-05, -5.364418029785156e-05, -5.101040005683899e-05, -4.8376619815826416e-05, -4.574283957481384e-05, -4.310905933380127e-05, -4.0475279092788696e-05, -3.784149885177612e-05, -3.520771861076355e-05, -3.2573938369750977e-05, -2.9940158128738403e-05, -2.730637788772583e-05, -2.4672597646713257e-05, -2.2038817405700684e-05, -1.940503716468811e-05, -1.6771256923675537e-05, -1.4137476682662964e-05, -1.150369644165039e-05, -8.869916200637817e-06, -6.236135959625244e-06, -3.602355718612671e-06, -9.685754776000977e-07, 1.6652047634124756e-06, 4.298985004425049e-06, 6.932765245437622e-06, 9.566545486450195e-06, 1.2200325727462769e-05, 1.4834105968475342e-05, 1.7467886209487915e-05, 2.0101666450500488e-05, 2.273544669151306e-05, 2.5369226932525635e-05, 2.8003007173538208e-05, 3.063678741455078e-05, 3.3270567655563354e-05, 3.590434789657593e-05, 3.85381281375885e-05, 4.1171908378601074e-05, 4.380568861961365e-05, 4.643946886062622e-05, 4.9073249101638794e-05, 5.170702934265137e-05, 5.434080958366394e-05, 5.6974589824676514e-05, 5.960837006568909e-05, 6.224215030670166e-05, 6.487593054771423e-05, 6.75097107887268e-05, 7.014349102973938e-05, 7.277727127075195e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 7.0, 7.0, 16.0, 15.0, 23.0, 29.0, 45.0, 60.0, 72.0, 123.0, 158.0, 264.0, 505.0, 1214.0, 978979.0, 64951.0, 910.0, 400.0, 219.0, 147.0, 98.0, 105.0, 57.0, 45.0, 23.0, 19.0, 11.0, 12.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015001296997070312, -0.0014442652463912964, -0.0013884007930755615, -0.0013325363397598267, -0.0012766718864440918, -0.001220807433128357, -0.001164942979812622, -0.0011090785264968872, -0.0010532140731811523, -0.0009973496198654175, -0.0009414851665496826, -0.0008856207132339478, -0.0008297562599182129, -0.000773891806602478, -0.0007180273532867432, -0.0006621628999710083, -0.0006062984466552734, -0.0005504339933395386, -0.0004945695400238037, -0.00043870508670806885, -0.000382840633392334, -0.0003269761800765991, -0.00027111172676086426, -0.0002152472734451294, -0.00015938282012939453, -0.00010351836681365967, -4.7653913497924805e-05, 8.210539817810059e-06, 6.407499313354492e-05, 0.00011993944644927979, 0.00017580389976501465, 0.0002316683530807495, 0.0002875328063964844, 0.00034339725971221924, 0.0003992617130279541, 0.00045512616634368896, 0.0005109906196594238, 0.0005668550729751587, 0.0006227195262908936, 0.0006785839796066284, 0.0007344484329223633, 0.0007903128862380981, 0.000846177339553833, 0.0009020417928695679, 0.0009579062461853027, 0.0010137706995010376, 0.0010696351528167725, 0.0011254996061325073, 0.0011813640594482422, 0.001237228512763977, 0.001293092966079712, 0.0013489574193954468, 0.0014048218727111816, 0.0014606863260269165, 0.0015165507793426514, 0.0015724152326583862, 0.001628279685974121, 0.001684144139289856, 0.0017400085926055908, 0.0017958730459213257, 0.0018517374992370605, 0.0019076019525527954, 0.0019634664058685303, 0.002019330859184265, 0.0020751953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 81.0, 663.0, 255.0, 11.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003224206157028675, -0.0003155171580146998, -0.0003086137003265321, -0.00030171024263836443, -0.00029480678495019674, -0.00028790332726202905, -0.00028099986957386136, -0.00027409641188569367, -0.000267192954197526, -0.0002602894965093583, -0.0002533860388211906, -0.0002464825811330229, -0.0002395791234448552, -0.00023267566575668752, -0.00022577220806851983, -0.00021886876493226737, -0.0002119653217960149, -0.00020506186410784721, -0.00019815840641967952, -0.00019125494873151183, -0.00018435149104334414, -0.00017744803335517645, -0.00017054457566700876, -0.0001636411325307563, -0.00015673766029067338, -0.00014983420260250568, -0.000142930744914338, -0.0001360272872261703, -0.0001291238295380026, -0.00012222037184983492, -0.00011531692143762484, -0.00010841347102541476, -0.00010151002061320469, -9.4606562925037e-05, -8.77031052368693e-05, -8.079965482465923e-05, -7.389619713649154e-05, -6.699273944832385e-05, -6.0089281760156155e-05, -5.318582770996727e-05, -4.628237002179958e-05, -3.937891233363189e-05, -3.2475458283443004e-05, -2.5572000595275313e-05, -1.8668544726097025e-05, -1.1765088856918737e-05, -4.861631168751046e-06, 2.041822881437838e-06, 8.94528056960553e-06, 1.5848736438783817e-05, 2.2752192307962105e-05, 2.9655649996129796e-05, 3.655910404631868e-05, 4.346256173448637e-05, 5.036601942265406e-05, 5.726947347284295e-05, 6.417292752303183e-05, 7.107638521119952e-05, 7.797984289936721e-05, 8.48833005875349e-05, 9.178675099974498e-05, 9.869020868791267e-05, 0.00010559366637608036, 0.00011249711678829044, 0.00011940058175241575]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 8.0, 2.0, 7.0, 9.0, 16.0, 10.0, 15.0, 16.0, 11.0, 14.0, 19.0, 29.0, 34.0, 32.0, 24.0, 38.0, 35.0, 39.0, 51.0, 50.0, 46.0, 49.0, 35.0, 37.0, 32.0, 35.0, 31.0, 43.0, 30.0, 37.0, 27.0, 11.0, 28.0, 22.0, 20.0, 11.0, 8.0, 7.0, 12.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.496836870908737e-05, -3.3697113394737244e-05, -3.2425858080387115e-05, -3.115460276603699e-05, -2.988334745168686e-05, -2.861209213733673e-05, -2.7340836822986603e-05, -2.6069581508636475e-05, -2.4798326194286346e-05, -2.3527070879936218e-05, -2.225581556558609e-05, -2.0984560251235962e-05, -1.9713304936885834e-05, -1.8442049622535706e-05, -1.7170794308185577e-05, -1.589953899383545e-05, -1.4628283679485321e-05, -1.3357028365135193e-05, -1.2085773050785065e-05, -1.0814517736434937e-05, -9.543262422084808e-06, -8.27200710773468e-06, -7.000751793384552e-06, -5.729496479034424e-06, -4.458241164684296e-06, -3.1869858503341675e-06, -1.9157305359840393e-06, -6.444752216339111e-07, 6.26780092716217e-07, 1.8980354070663452e-06, 3.1692907214164734e-06, 4.4405460357666016e-06, 5.71180135011673e-06, 6.983056664466858e-06, 8.254311978816986e-06, 9.525567293167114e-06, 1.0796822607517242e-05, 1.206807792186737e-05, 1.3339333236217499e-05, 1.4610588550567627e-05, 1.5881843864917755e-05, 1.7153099179267883e-05, 1.842435449361801e-05, 1.969560980796814e-05, 2.0966865122318268e-05, 2.2238120436668396e-05, 2.3509375751018524e-05, 2.4780631065368652e-05, 2.605188637971878e-05, 2.732314169406891e-05, 2.8594397008419037e-05, 2.9865652322769165e-05, 3.113690763711929e-05, 3.240816295146942e-05, 3.367941826581955e-05, 3.495067358016968e-05, 3.6221928894519806e-05, 3.7493184208869934e-05, 3.876443952322006e-05, 4.003569483757019e-05, 4.130695015192032e-05, 4.257820546627045e-05, 4.3849460780620575e-05, 4.51207160949707e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 10.0, 11.0, 6.0, 7.0, 12.0, 12.0, 18.0, 21.0, 14.0, 22.0, 30.0, 26.0, 29.0, 29.0, 33.0, 28.0, 35.0, 37.0, 43.0, 40.0, 61.0, 50.0, 41.0, 46.0, 40.0, 44.0, 38.0, 29.0, 33.0, 25.0, 20.0, 21.0, 11.0, 20.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9409942626953125, -1.881988525390625, -1.8229827880859375, -1.76397705078125, -1.7049713134765625, -1.645965576171875, -1.5869598388671875, -1.5279541015625, -1.4689483642578125, -1.409942626953125, -1.3509368896484375, -1.29193115234375, -1.2329254150390625, -1.173919677734375, -1.1149139404296875, -1.055908203125, -0.9969024658203125, -0.937896728515625, -0.8788909912109375, -0.81988525390625, -0.7608795166015625, -0.701873779296875, -0.6428680419921875, -0.5838623046875, -0.5248565673828125, -0.465850830078125, -0.4068450927734375, -0.34783935546875, -0.2888336181640625, -0.229827880859375, -0.1708221435546875, -0.11181640625, -0.0528106689453125, 0.006195068359375, 0.0652008056640625, 0.12420654296875, 0.1832122802734375, 0.242218017578125, 0.3012237548828125, 0.3602294921875, 0.4192352294921875, 0.478240966796875, 0.5372467041015625, 0.59625244140625, 0.6552581787109375, 0.714263916015625, 0.7732696533203125, 0.832275390625, 0.8912811279296875, 0.950286865234375, 1.0092926025390625, 1.06829833984375, 1.1273040771484375, 1.186309814453125, 1.2453155517578125, 1.3043212890625, 1.3633270263671875, 1.422332763671875, 1.4813385009765625, 1.54034423828125, 1.5993499755859375, 1.658355712890625, 1.7173614501953125, 1.7763671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 10.0, 8.0, 23.0, 24.0, 22.0, 36.0, 58.0, 81.0, 97.0, 151.0, 199.0, 298.0, 420.0, 718.0, 1287.0, 2288.0, 4678.0, 9991.0, 23459.0, 62141.0, 169298.0, 344182.0, 259544.0, 102242.0, 37395.0, 15451.0, 6761.0, 3280.0, 1712.0, 945.0, 562.0, 366.0, 226.0, 156.0, 124.0, 91.0, 62.0, 54.0, 28.0, 29.0, 13.0, 18.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.37109375, -2.3028564453125, -2.234619140625, -2.1663818359375, -2.09814453125, -2.0299072265625, -1.961669921875, -1.8934326171875, -1.8251953125, -1.7569580078125, -1.688720703125, -1.6204833984375, -1.55224609375, -1.4840087890625, -1.415771484375, -1.3475341796875, -1.279296875, -1.2110595703125, -1.142822265625, -1.0745849609375, -1.00634765625, -0.9381103515625, -0.869873046875, -0.8016357421875, -0.7333984375, -0.6651611328125, -0.596923828125, -0.5286865234375, -0.46044921875, -0.3922119140625, -0.323974609375, -0.2557373046875, -0.1875, -0.1192626953125, -0.051025390625, 0.0172119140625, 0.08544921875, 0.1536865234375, 0.221923828125, 0.2901611328125, 0.3583984375, 0.4266357421875, 0.494873046875, 0.5631103515625, 0.63134765625, 0.6995849609375, 0.767822265625, 0.8360595703125, 0.904296875, 0.9725341796875, 1.040771484375, 1.1090087890625, 1.17724609375, 1.2454833984375, 1.313720703125, 1.3819580078125, 1.4501953125, 1.5184326171875, 1.586669921875, 1.6549072265625, 1.72314453125, 1.7913818359375, 1.859619140625, 1.9278564453125, 1.99609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 11.0, 5.0, 12.0, 12.0, 14.0, 15.0, 17.0, 21.0, 31.0, 44.0, 43.0, 36.0, 53.0, 64.0, 91.0, 164.0, 1512.0, 318.0, 136.0, 81.0, 49.0, 44.0, 34.0, 36.0, 36.0, 30.0, 26.0, 26.0, 18.0, 16.0, 6.0, 12.0, 9.0, 2.0, 1.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.390625, -7.1583251953125, -6.926025390625, -6.6937255859375, -6.46142578125, -6.2291259765625, -5.996826171875, -5.7645263671875, -5.5322265625, -5.2999267578125, -5.067626953125, -4.8353271484375, -4.60302734375, -4.3707275390625, -4.138427734375, -3.9061279296875, -3.673828125, -3.4415283203125, -3.209228515625, -2.9769287109375, -2.74462890625, -2.5123291015625, -2.280029296875, -2.0477294921875, -1.8154296875, -1.5831298828125, -1.350830078125, -1.1185302734375, -0.88623046875, -0.6539306640625, -0.421630859375, -0.1893310546875, 0.04296875, 0.2752685546875, 0.507568359375, 0.7398681640625, 0.97216796875, 1.2044677734375, 1.436767578125, 1.6690673828125, 1.9013671875, 2.1336669921875, 2.365966796875, 2.5982666015625, 2.83056640625, 3.0628662109375, 3.295166015625, 3.5274658203125, 3.759765625, 3.9920654296875, 4.224365234375, 4.4566650390625, 4.68896484375, 4.9212646484375, 5.153564453125, 5.3858642578125, 5.6181640625, 5.8504638671875, 6.082763671875, 6.3150634765625, 6.54736328125, 6.7796630859375, 7.011962890625, 7.2442626953125, 7.4765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 11.0, 11.0, 24.0, 18.0, 28.0, 39.0, 47.0, 59.0, 66.0, 119.0, 197.0, 369.0, 1019.0, 5349.0, 451560.0, 2672278.0, 11843.0, 1452.0, 450.0, 239.0, 121.0, 89.0, 68.0, 43.0, 47.0, 25.0, 17.0, 18.0, 18.0, 10.0, 8.0, 10.0, 14.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-14.46875, -14.004150390625, -13.53955078125, -13.074951171875, -12.6103515625, -12.145751953125, -11.68115234375, -11.216552734375, -10.751953125, -10.287353515625, -9.82275390625, -9.358154296875, -8.8935546875, -8.428955078125, -7.96435546875, -7.499755859375, -7.03515625, -6.570556640625, -6.10595703125, -5.641357421875, -5.1767578125, -4.712158203125, -4.24755859375, -3.782958984375, -3.318359375, -2.853759765625, -2.38916015625, -1.924560546875, -1.4599609375, -0.995361328125, -0.53076171875, -0.066162109375, 0.3984375, 0.863037109375, 1.32763671875, 1.792236328125, 2.2568359375, 2.721435546875, 3.18603515625, 3.650634765625, 4.115234375, 4.579833984375, 5.04443359375, 5.509033203125, 5.9736328125, 6.438232421875, 6.90283203125, 7.367431640625, 7.83203125, 8.296630859375, 8.76123046875, 9.225830078125, 9.6904296875, 10.155029296875, 10.61962890625, 11.084228515625, 11.548828125, 12.013427734375, 12.47802734375, 12.942626953125, 13.4072265625, 13.871826171875, 14.33642578125, 14.801025390625, 15.265625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 31.0, 299.0, 569.0, 97.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-73.2428207397461, -71.9386215209961, -70.63442993164062, -69.33023071289062, -68.02603149414062, -66.72183227539062, -65.41764068603516, -64.11344146728516, -62.80924606323242, -61.50505065917969, -60.20085144042969, -58.89665603637695, -57.59245681762695, -56.28826141357422, -54.98406219482422, -53.679866790771484, -52.37567138671875, -51.071475982666016, -49.767276763916016, -48.46308135986328, -47.15888214111328, -45.85468673706055, -44.55049133300781, -43.24629211425781, -41.94209289550781, -40.63789749145508, -39.33369827270508, -38.029502868652344, -36.725303649902344, -35.42110824584961, -34.116912841796875, -32.812713623046875, -31.508520126342773, -30.204322814941406, -28.90012550354004, -27.595928192138672, -26.291732788085938, -24.98753547668457, -23.683338165283203, -22.37914276123047, -21.07494354248047, -19.7707462310791, -18.466548919677734, -17.162353515625, -15.858156204223633, -14.553958892822266, -13.249761581420898, -11.945565223693848, -10.641368865966797, -9.33717155456543, -8.032975196838379, -6.728777885437012, -5.424581050872803, -4.120384216308594, -2.8161869049072266, -1.5119905471801758, -0.2077932357788086, 1.09640371799469, 2.4006006717681885, 3.7047977447509766, 5.0089945793151855, 6.3131914138793945, 7.617388725280762, 8.921585083007812, 10.22578239440918]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 5.0, 12.0, 8.0, 7.0, 12.0, 11.0, 12.0, 24.0, 21.0, 28.0, 23.0, 25.0, 30.0, 37.0, 43.0, 45.0, 51.0, 58.0, 47.0, 40.0, 45.0, 37.0, 44.0, 32.0, 38.0, 36.0, 28.0, 32.0, 27.0, 21.0, 25.0, 13.0, 22.0, 13.0, 7.0, 7.0, 6.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.31951141357422, -22.629880905151367, -21.940250396728516, -21.250619888305664, -20.560989379882812, -19.871360778808594, -19.18172836303711, -18.49209976196289, -17.80246925354004, -17.112838745117188, -16.423208236694336, -15.733577728271484, -15.04394817352295, -14.354317665100098, -13.664687156677246, -12.975057601928711, -12.285426139831543, -11.595795631408691, -10.90616512298584, -10.216535568237305, -9.526905059814453, -8.837274551391602, -8.14764404296875, -7.458014011383057, -6.768383502960205, -6.0787529945373535, -5.38912296295166, -4.699492454528809, -4.009861946105957, -3.3202319145202637, -2.630601406097412, -1.9409713745117188, -1.2513408660888672, -0.56171053647995, 0.12791979312896729, 0.8175501823425293, 1.5071804523468018, 2.196810722351074, 2.886441230773926, 3.576071262359619, 4.265701770782471, 4.955332279205322, 5.644962310791016, 6.334592819213867, 7.024223327636719, 7.713853359222412, 8.403484344482422, 9.093113899230957, 9.782744407653809, 10.47237491607666, 11.162005424499512, 11.851634979248047, 12.541265487670898, 13.23089599609375, 13.920526504516602, 14.610157012939453, 15.299787521362305, 15.989418029785156, 16.679048538208008, 17.36867904663086, 18.05830955505371, 18.747940063476562, 19.43756866455078, 20.127199172973633, 20.816829681396484]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 8.0, 9.0, 7.0, 12.0, 16.0, 14.0, 26.0, 23.0, 28.0, 23.0, 30.0, 30.0, 34.0, 31.0, 34.0, 42.0, 42.0, 49.0, 56.0, 55.0, 45.0, 66.0, 35.0, 29.0, 42.0, 39.0, 35.0, 24.0, 18.0, 18.0, 15.0, 9.0, 7.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.2423858642578125, -2.176177978515625, -2.1099700927734375, -2.04376220703125, -1.9775543212890625, -1.911346435546875, -1.8451385498046875, -1.7789306640625, -1.7127227783203125, -1.646514892578125, -1.5803070068359375, -1.51409912109375, -1.4478912353515625, -1.381683349609375, -1.3154754638671875, -1.249267578125, -1.1830596923828125, -1.116851806640625, -1.0506439208984375, -0.98443603515625, -0.9182281494140625, -0.852020263671875, -0.7858123779296875, -0.7196044921875, -0.6533966064453125, -0.587188720703125, -0.5209808349609375, -0.45477294921875, -0.3885650634765625, -0.322357177734375, -0.2561492919921875, -0.18994140625, -0.1237335205078125, -0.057525634765625, 0.0086822509765625, 0.07489013671875, 0.1410980224609375, 0.207305908203125, 0.2735137939453125, 0.3397216796875, 0.4059295654296875, 0.472137451171875, 0.5383453369140625, 0.60455322265625, 0.6707611083984375, 0.736968994140625, 0.8031768798828125, 0.869384765625, 0.9355926513671875, 1.001800537109375, 1.0680084228515625, 1.13421630859375, 1.2004241943359375, 1.266632080078125, 1.3328399658203125, 1.3990478515625, 1.4652557373046875, 1.531463623046875, 1.5976715087890625, 1.66387939453125, 1.7300872802734375, 1.796295166015625, 1.8625030517578125, 1.9287109375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 12.0, 16.0, 19.0, 24.0, 18.0, 20.0, 38.0, 60.0, 86.0, 107.0, 178.0, 270.0, 542.0, 1348.0, 4361.0, 21695.0, 170462.0, 1976015.0, 1832545.0, 159411.0, 20266.0, 4177.0, 1245.0, 549.0, 256.0, 157.0, 106.0, 69.0, 44.0, 33.0, 27.0, 30.0, 21.0, 15.0, 7.0, 9.0, 8.0, 5.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.62109375, -6.43182373046875, -6.2425537109375, -6.05328369140625, -5.864013671875, -5.67474365234375, -5.4854736328125, -5.29620361328125, -5.10693359375, -4.91766357421875, -4.7283935546875, -4.53912353515625, -4.349853515625, -4.16058349609375, -3.9713134765625, -3.78204345703125, -3.5927734375, -3.40350341796875, -3.2142333984375, -3.02496337890625, -2.835693359375, -2.64642333984375, -2.4571533203125, -2.26788330078125, -2.07861328125, -1.88934326171875, -1.7000732421875, -1.51080322265625, -1.321533203125, -1.13226318359375, -0.9429931640625, -0.75372314453125, -0.564453125, -0.37518310546875, -0.1859130859375, 0.00335693359375, 0.192626953125, 0.38189697265625, 0.5711669921875, 0.76043701171875, 0.94970703125, 1.13897705078125, 1.3282470703125, 1.51751708984375, 1.706787109375, 1.89605712890625, 2.0853271484375, 2.27459716796875, 2.4638671875, 2.65313720703125, 2.8424072265625, 3.03167724609375, 3.220947265625, 3.41021728515625, 3.5994873046875, 3.78875732421875, 3.97802734375, 4.16729736328125, 4.3565673828125, 4.54583740234375, 4.735107421875, 4.92437744140625, 5.1136474609375, 5.30291748046875, 5.4921875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 14.0, 6.0, 14.0, 15.0, 22.0, 41.0, 48.0, 53.0, 80.0, 92.0, 138.0, 184.0, 221.0, 318.0, 404.0, 398.0, 419.0, 337.0, 286.0, 227.0, 174.0, 137.0, 118.0, 76.0, 69.0, 42.0, 35.0, 25.0, 19.0, 18.0, 5.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.33984375, -6.1593017578125, -5.978759765625, -5.7982177734375, -5.61767578125, -5.4371337890625, -5.256591796875, -5.0760498046875, -4.8955078125, -4.7149658203125, -4.534423828125, -4.3538818359375, -4.17333984375, -3.9927978515625, -3.812255859375, -3.6317138671875, -3.451171875, -3.2706298828125, -3.090087890625, -2.9095458984375, -2.72900390625, -2.5484619140625, -2.367919921875, -2.1873779296875, -2.0068359375, -1.8262939453125, -1.645751953125, -1.4652099609375, -1.28466796875, -1.1041259765625, -0.923583984375, -0.7430419921875, -0.5625, -0.3819580078125, -0.201416015625, -0.0208740234375, 0.15966796875, 0.3402099609375, 0.520751953125, 0.7012939453125, 0.8818359375, 1.0623779296875, 1.242919921875, 1.4234619140625, 1.60400390625, 1.7845458984375, 1.965087890625, 2.1456298828125, 2.326171875, 2.5067138671875, 2.687255859375, 2.8677978515625, 3.04833984375, 3.2288818359375, 3.409423828125, 3.5899658203125, 3.7705078125, 3.9510498046875, 4.131591796875, 4.3121337890625, 4.49267578125, 4.6732177734375, 4.853759765625, 5.0343017578125, 5.21484375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 15.0, 18.0, 34.0, 44.0, 87.0, 143.0, 261.0, 557.0, 2170.0, 62725.0, 3959119.0, 164549.0, 3235.0, 659.0, 286.0, 133.0, 91.0, 52.0, 35.0, 21.0, 14.0, 10.0, 8.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -29.192138671875, -28.41552734375, -27.638916015625, -26.8623046875, -26.085693359375, -25.30908203125, -24.532470703125, -23.755859375, -22.979248046875, -22.20263671875, -21.426025390625, -20.6494140625, -19.872802734375, -19.09619140625, -18.319580078125, -17.54296875, -16.766357421875, -15.98974609375, -15.213134765625, -14.4365234375, -13.659912109375, -12.88330078125, -12.106689453125, -11.330078125, -10.553466796875, -9.77685546875, -9.000244140625, -8.2236328125, -7.447021484375, -6.67041015625, -5.893798828125, -5.1171875, -4.340576171875, -3.56396484375, -2.787353515625, -2.0107421875, -1.234130859375, -0.45751953125, 0.319091796875, 1.095703125, 1.872314453125, 2.64892578125, 3.425537109375, 4.2021484375, 4.978759765625, 5.75537109375, 6.531982421875, 7.30859375, 8.085205078125, 8.86181640625, 9.638427734375, 10.4150390625, 11.191650390625, 11.96826171875, 12.744873046875, 13.521484375, 14.298095703125, 15.07470703125, 15.851318359375, 16.6279296875, 17.404541015625, 18.18115234375, 18.957763671875, 19.734375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 90.0, 256.0, 334.0, 239.0, 68.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.97063446044922, -34.863502502441406, -32.756370544433594, -30.64923858642578, -28.54210662841797, -26.434974670410156, -24.327842712402344, -22.22071075439453, -20.11357879638672, -18.006446838378906, -15.899314880371094, -13.792182922363281, -11.685050964355469, -9.577919006347656, -7.470787048339844, -5.363655090332031, -3.2565231323242188, -1.1493911743164062, 0.9577407836914062, 3.0648727416992188, 5.172004699707031, 7.279136657714844, 9.386268615722656, 11.493400573730469, 13.600532531738281, 15.707664489746094, 17.814796447753906, 19.92192840576172, 22.02906036376953, 24.136192321777344, 26.243324279785156, 28.35045623779297, 30.45758056640625, 32.56471252441406, 34.671844482421875, 36.77897644042969, 38.8861083984375, 40.99324035644531, 43.100372314453125, 45.20750427246094, 47.31463623046875, 49.42176818847656, 51.528900146484375, 53.63603210449219, 55.7431640625, 57.85029602050781, 59.957427978515625, 62.06455993652344, 64.17169189453125, 66.27882385253906, 68.38595581054688, 70.49308776855469, 72.6002197265625, 74.70735168457031, 76.81448364257812, 78.92161560058594, 81.02874755859375, 83.13587951660156, 85.24301147460938, 87.35014343261719, 89.457275390625, 91.56440734863281, 93.67153930664062, 95.77867126464844, 97.88580322265625]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 7.0, 11.0, 19.0, 19.0, 25.0, 16.0, 22.0, 25.0, 37.0, 30.0, 48.0, 46.0, 39.0, 52.0, 45.0, 34.0, 49.0, 44.0, 41.0, 40.0, 44.0, 40.0, 29.0, 30.0, 23.0, 21.0, 13.0, 21.0, 14.0, 16.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.987842559814453, -19.301700592041016, -18.61556053161621, -17.929418563842773, -17.243276596069336, -16.5571346282959, -15.870994567871094, -15.184852600097656, -14.498710632324219, -13.812569618225098, -13.12642765045166, -12.440286636352539, -11.754144668579102, -11.06800365447998, -10.38186264038086, -9.695720672607422, -9.0095796585083, -8.32343864440918, -7.637296676635742, -6.951155662536621, -6.265013694763184, -5.5788726806640625, -4.892731189727783, -4.206589698791504, -3.5204482078552246, -2.8343067169189453, -2.148165225982666, -1.4620239734649658, -0.7758824825286865, -0.08974099159240723, 0.596400260925293, 1.2825417518615723, 1.9686832427978516, 2.654824733734131, 3.34096622467041, 4.027107238769531, 4.713249206542969, 5.39939022064209, 6.085531711578369, 6.771673202514648, 7.457814693450928, 8.143956184387207, 8.830097198486328, 9.516239166259766, 10.202380180358887, 10.888522148132324, 11.574663162231445, 12.260805130004883, 12.946946144104004, 13.633087158203125, 14.319229125976562, 15.005370140075684, 15.691512107849121, 16.377653121948242, 17.06379508972168, 17.749935150146484, 18.436077117919922, 19.12221908569336, 19.808359146118164, 20.4945011138916, 21.18064308166504, 21.866785049438477, 22.55292510986328, 23.23906707763672, 23.925209045410156]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 9.0, 13.0, 7.0, 20.0, 17.0, 7.0, 14.0, 16.0, 15.0, 25.0, 23.0, 33.0, 23.0, 30.0, 30.0, 35.0, 36.0, 50.0, 45.0, 47.0, 53.0, 53.0, 40.0, 43.0, 28.0, 39.0, 37.0, 33.0, 29.0, 31.0, 26.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.123687744140625, -2.06182861328125, -1.999969482421875, -1.9381103515625, -1.876251220703125, -1.81439208984375, -1.752532958984375, -1.690673828125, -1.628814697265625, -1.56695556640625, -1.505096435546875, -1.4432373046875, -1.381378173828125, -1.31951904296875, -1.257659912109375, -1.19580078125, -1.133941650390625, -1.07208251953125, -1.010223388671875, -0.9483642578125, -0.886505126953125, -0.82464599609375, -0.762786865234375, -0.700927734375, -0.639068603515625, -0.57720947265625, -0.515350341796875, -0.4534912109375, -0.391632080078125, -0.32977294921875, -0.267913818359375, -0.2060546875, -0.144195556640625, -0.08233642578125, -0.020477294921875, 0.0413818359375, 0.103240966796875, 0.16510009765625, 0.226959228515625, 0.288818359375, 0.350677490234375, 0.41253662109375, 0.474395751953125, 0.5362548828125, 0.598114013671875, 0.65997314453125, 0.721832275390625, 0.78369140625, 0.845550537109375, 0.90740966796875, 0.969268798828125, 1.0311279296875, 1.092987060546875, 1.15484619140625, 1.216705322265625, 1.278564453125, 1.340423583984375, 1.40228271484375, 1.464141845703125, 1.5260009765625, 1.587860107421875, 1.64971923828125, 1.711578369140625, 1.7734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 8.0, 4.0, 5.0, 13.0, 16.0, 20.0, 25.0, 57.0, 76.0, 104.0, 197.0, 303.0, 494.0, 809.0, 1291.0, 2260.0, 3831.0, 6446.0, 11170.0, 19550.0, 35809.0, 68235.0, 146490.0, 357552.0, 205752.0, 86932.0, 44285.0, 23964.0, 13536.0, 7808.0, 4631.0, 2632.0, 1650.0, 982.0, 592.0, 352.0, 238.0, 135.0, 95.0, 74.0, 47.0, 29.0, 25.0, 14.0, 9.0, 2.0, 7.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3659210205078125, -0.352203369140625, -0.3384857177734375, -0.32476806640625, -0.3110504150390625, -0.297332763671875, -0.2836151123046875, -0.2698974609375, -0.2561798095703125, -0.242462158203125, -0.2287445068359375, -0.21502685546875, -0.2013092041015625, -0.187591552734375, -0.1738739013671875, -0.16015625, -0.1464385986328125, -0.132720947265625, -0.1190032958984375, -0.10528564453125, -0.0915679931640625, -0.077850341796875, -0.0641326904296875, -0.0504150390625, -0.0366973876953125, -0.022979736328125, -0.0092620849609375, 0.00445556640625, 0.0181732177734375, 0.031890869140625, 0.0456085205078125, 0.059326171875, 0.0730438232421875, 0.086761474609375, 0.1004791259765625, 0.11419677734375, 0.1279144287109375, 0.141632080078125, 0.1553497314453125, 0.1690673828125, 0.1827850341796875, 0.196502685546875, 0.2102203369140625, 0.22393798828125, 0.2376556396484375, 0.251373291015625, 0.2650909423828125, 0.27880859375, 0.2925262451171875, 0.306243896484375, 0.3199615478515625, 0.33367919921875, 0.3473968505859375, 0.361114501953125, 0.3748321533203125, 0.3885498046875, 0.4022674560546875, 0.415985107421875, 0.4297027587890625, 0.44342041015625, 0.4571380615234375, 0.470855712890625, 0.4845733642578125, 0.498291015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 11.0, 14.0, 8.0, 13.0, 21.0, 17.0, 22.0, 27.0, 27.0, 32.0, 19.0, 43.0, 43.0, 41.0, 27.0, 38.0, 40.0, 1065.0, 46.0, 40.0, 45.0, 46.0, 23.0, 48.0, 42.0, 32.0, 30.0, 28.0, 29.0, 18.0, 15.0, 13.0, 6.0, 11.0, 6.0, 8.0, 6.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.37890625, -1.3394775390625, -1.300048828125, -1.2606201171875, -1.22119140625, -1.1817626953125, -1.142333984375, -1.1029052734375, -1.0634765625, -1.0240478515625, -0.984619140625, -0.9451904296875, -0.90576171875, -0.8663330078125, -0.826904296875, -0.7874755859375, -0.748046875, -0.7086181640625, -0.669189453125, -0.6297607421875, -0.59033203125, -0.5509033203125, -0.511474609375, -0.4720458984375, -0.4326171875, -0.3931884765625, -0.353759765625, -0.3143310546875, -0.27490234375, -0.2354736328125, -0.196044921875, -0.1566162109375, -0.1171875, -0.0777587890625, -0.038330078125, 0.0010986328125, 0.04052734375, 0.0799560546875, 0.119384765625, 0.1588134765625, 0.1982421875, 0.2376708984375, 0.277099609375, 0.3165283203125, 0.35595703125, 0.3953857421875, 0.434814453125, 0.4742431640625, 0.513671875, 0.5531005859375, 0.592529296875, 0.6319580078125, 0.67138671875, 0.7108154296875, 0.750244140625, 0.7896728515625, 0.8291015625, 0.8685302734375, 0.907958984375, 0.9473876953125, 0.98681640625, 1.0262451171875, 1.065673828125, 1.1051025390625, 1.14453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 11.0, 11.0, 22.0, 37.0, 47.0, 47.0, 92.0, 141.0, 178.0, 276.0, 424.0, 608.0, 858.0, 1186.0, 1766.0, 2576.0, 3894.0, 5707.0, 8644.0, 13402.0, 20189.0, 31498.0, 49860.0, 83676.0, 158735.0, 1333063.0, 156420.0, 82359.0, 50357.0, 31328.0, 19893.0, 12890.0, 8660.0, 5788.0, 3969.0, 2713.0, 1864.0, 1203.0, 892.0, 557.0, 389.0, 281.0, 201.0, 119.0, 100.0, 72.0, 31.0, 33.0, 18.0, 18.0, 16.0, 7.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.278228759765625, -0.26910400390625, -0.259979248046875, -0.2508544921875, -0.241729736328125, -0.23260498046875, -0.223480224609375, -0.21435546875, -0.205230712890625, -0.19610595703125, -0.186981201171875, -0.1778564453125, -0.168731689453125, -0.15960693359375, -0.150482177734375, -0.141357421875, -0.132232666015625, -0.12310791015625, -0.113983154296875, -0.1048583984375, -0.095733642578125, -0.08660888671875, -0.077484130859375, -0.068359375, -0.059234619140625, -0.05010986328125, -0.040985107421875, -0.0318603515625, -0.022735595703125, -0.01361083984375, -0.004486083984375, 0.004638671875, 0.013763427734375, 0.02288818359375, 0.032012939453125, 0.0411376953125, 0.050262451171875, 0.05938720703125, 0.068511962890625, 0.07763671875, 0.086761474609375, 0.09588623046875, 0.105010986328125, 0.1141357421875, 0.123260498046875, 0.13238525390625, 0.141510009765625, 0.150634765625, 0.159759521484375, 0.16888427734375, 0.178009033203125, 0.1871337890625, 0.196258544921875, 0.20538330078125, 0.214508056640625, 0.2236328125, 0.232757568359375, 0.24188232421875, 0.251007080078125, 0.2601318359375, 0.269256591796875, 0.27838134765625, 0.287506103515625, 0.296630859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 3.0, 8.0, 8.0, 6.0, 8.0, 15.0, 22.0, 23.0, 27.0, 42.0, 37.0, 39.0, 43.0, 77.0, 70.0, 69.0, 62.0, 61.0, 59.0, 56.0, 47.0, 36.0, 34.0, 32.0, 24.0, 19.0, 16.0, 9.0, 7.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.128715515136719e-05, -6.90976157784462e-05, -6.690807640552521e-05, -6.471853703260422e-05, -6.252899765968323e-05, -6.033945828676224e-05, -5.814991891384125e-05, -5.596037954092026e-05, -5.377084016799927e-05, -5.158130079507828e-05, -4.939176142215729e-05, -4.72022220492363e-05, -4.501268267631531e-05, -4.282314330339432e-05, -4.063360393047333e-05, -3.844406455755234e-05, -3.625452518463135e-05, -3.406498581171036e-05, -3.187544643878937e-05, -2.9685907065868378e-05, -2.7496367692947388e-05, -2.5306828320026398e-05, -2.3117288947105408e-05, -2.0927749574184418e-05, -1.8738210201263428e-05, -1.6548670828342438e-05, -1.4359131455421448e-05, -1.2169592082500458e-05, -9.980052709579468e-06, -7.790513336658478e-06, -5.600973963737488e-06, -3.411434590816498e-06, -1.2218952178955078e-06, 9.676441550254822e-07, 3.157183527946472e-06, 5.346722900867462e-06, 7.536262273788452e-06, 9.725801646709442e-06, 1.1915341019630432e-05, 1.4104880392551422e-05, 1.6294419765472412e-05, 1.8483959138393402e-05, 2.0673498511314392e-05, 2.2863037884235382e-05, 2.5052577257156372e-05, 2.7242116630077362e-05, 2.9431656002998352e-05, 3.162119537591934e-05, 3.381073474884033e-05, 3.600027412176132e-05, 3.818981349468231e-05, 4.03793528676033e-05, 4.256889224052429e-05, 4.475843161344528e-05, 4.694797098636627e-05, 4.913751035928726e-05, 5.132704973220825e-05, 5.351658910512924e-05, 5.570612847805023e-05, 5.789566785097122e-05, 6.008520722389221e-05, 6.22747465968132e-05, 6.446428596973419e-05, 6.665382534265518e-05, 6.884336471557617e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 13.0, 23.0, 30.0, 32.0, 36.0, 59.0, 66.0, 100.0, 149.0, 168.0, 299.0, 497.0, 1532.0, 669083.0, 373763.0, 1201.0, 456.0, 248.0, 194.0, 156.0, 104.0, 83.0, 63.0, 44.0, 26.0, 18.0, 18.0, 12.0, 14.0, 6.0, 6.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0014019012451171875, -0.0013606101274490356, -0.0013193190097808838, -0.001278027892112732, -0.00123673677444458, -0.0011954456567764282, -0.0011541545391082764, -0.0011128634214401245, -0.0010715723037719727, -0.0010302811861038208, -0.000988990068435669, -0.0009476989507675171, -0.0009064078330993652, -0.0008651167154312134, -0.0008238255977630615, -0.0007825344800949097, -0.0007412433624267578, -0.000699952244758606, -0.0006586611270904541, -0.0006173700094223022, -0.0005760788917541504, -0.0005347877740859985, -0.0004934966564178467, -0.0004522055387496948, -0.00041091442108154297, -0.0003696233034133911, -0.00032833218574523926, -0.0002870410680770874, -0.00024574995040893555, -0.0002044588327407837, -0.00016316771507263184, -0.00012187659740447998, -8.058547973632812e-05, -3.929436206817627e-05, 1.996755599975586e-06, 4.328787326812744e-05, 8.45789909362793e-05, 0.00012587010860443115, 0.000167161226272583, 0.00020845234394073486, 0.0002497434616088867, 0.0002910345792770386, 0.00033232569694519043, 0.0003736168146133423, 0.00041490793228149414, 0.000456199049949646, 0.0004974901676177979, 0.0005387812852859497, 0.0005800724029541016, 0.0006213635206222534, 0.0006626546382904053, 0.0007039457559585571, 0.000745236873626709, 0.0007865279912948608, 0.0008278191089630127, 0.0008691102266311646, 0.0009104013442993164, 0.0009516924619674683, 0.0009929835796356201, 0.001034274697303772, 0.0010755658149719238, 0.0011168569326400757, 0.0011581480503082275, 0.0011994391679763794, 0.0012407302856445312]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 33.0, 100.0, 184.0, 265.0, 209.0, 117.0, 56.0, 13.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44899157830514e-05, -5.185039117350243e-05, -4.921086292597465e-05, -4.657133831642568e-05, -4.39318100688979e-05, -4.129228545934893e-05, -3.865276084979996e-05, -3.601323260227218e-05, -3.337370799272321e-05, -3.073418338317424e-05, -2.8094655135646462e-05, -2.545513052609749e-05, -2.2815604097559117e-05, -2.0176077669020742e-05, -1.753655305947177e-05, -1.4897026630933397e-05, -1.2257500202395022e-05, -9.617973773856647e-06, -6.9784482548129745e-06, -4.338922735769302e-06, -1.699396307230927e-06, 9.401301213074476e-07, 3.5796547308564186e-06, 6.219181159394793e-06, 8.858707587933168e-06, 1.1498234016471542e-05, 1.4137759535515215e-05, 1.6777285054558888e-05, 1.9416811483097263e-05, 2.2056337911635637e-05, 2.469586252118461e-05, 2.7335388949722983e-05, 2.9974922654218972e-05, 3.261444726376794e-05, 3.525397551129572e-05, 3.789350012084469e-05, 4.053302836837247e-05, 4.317255297792144e-05, 4.581207758747041e-05, 4.845160583499819e-05, 5.109113044454716e-05, 5.373065505409613e-05, 5.637018330162391e-05, 5.900970791117288e-05, 6.164923252072185e-05, 6.428876076824963e-05, 6.692828901577741e-05, 6.956780998734757e-05, 7.220733823487535e-05, 7.484686648240313e-05, 7.74863874539733e-05, 8.012591570150107e-05, 8.276544394902885e-05, 8.540497219655663e-05, 8.804449316812679e-05, 9.068402141565457e-05, 9.332354238722473e-05, 9.596307063475251e-05, 9.860259160632268e-05, 0.00010124211985385045, 0.00010388164810137823, 0.0001065211690729484, 0.00010916069732047617, 0.00011180022556800395, 0.00011443975381553173]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 4.0, 11.0, 9.0, 9.0, 23.0, 17.0, 22.0, 21.0, 31.0, 30.0, 44.0, 36.0, 34.0, 48.0, 60.0, 43.0, 49.0, 54.0, 36.0, 52.0, 41.0, 35.0, 41.0, 29.0, 29.0, 28.0, 27.0, 22.0, 19.0, 22.0, 18.0, 15.0, 10.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.13060188293457e-05, -4.010181874036789e-05, -3.8897618651390076e-05, -3.769341856241226e-05, -3.648921847343445e-05, -3.5285018384456635e-05, -3.408081829547882e-05, -3.287661820650101e-05, -3.167241811752319e-05, -3.046821802854538e-05, -2.9264017939567566e-05, -2.8059817850589752e-05, -2.685561776161194e-05, -2.5651417672634125e-05, -2.444721758365631e-05, -2.3243017494678497e-05, -2.2038817405700684e-05, -2.083461731672287e-05, -1.9630417227745056e-05, -1.8426217138767242e-05, -1.722201704978943e-05, -1.6017816960811615e-05, -1.4813616871833801e-05, -1.3609416782855988e-05, -1.2405216693878174e-05, -1.120101660490036e-05, -9.996816515922546e-06, -8.792616426944733e-06, -7.588416337966919e-06, -6.384216248989105e-06, -5.1800161600112915e-06, -3.975816071033478e-06, -2.771615982055664e-06, -1.5674158930778503e-06, -3.632158041000366e-07, 8.409842848777771e-07, 2.045184373855591e-06, 3.2493844628334045e-06, 4.453584551811218e-06, 5.657784640789032e-06, 6.861984729766846e-06, 8.06618481874466e-06, 9.270384907722473e-06, 1.0474584996700287e-05, 1.16787850856781e-05, 1.2882985174655914e-05, 1.4087185263633728e-05, 1.5291385352611542e-05, 1.6495585441589355e-05, 1.769978553056717e-05, 1.8903985619544983e-05, 2.0108185708522797e-05, 2.131238579750061e-05, 2.2516585886478424e-05, 2.3720785975456238e-05, 2.492498606443405e-05, 2.6129186153411865e-05, 2.733338624238968e-05, 2.8537586331367493e-05, 2.9741786420345306e-05, 3.094598650932312e-05, 3.2150186598300934e-05, 3.335438668727875e-05, 3.455858677625656e-05, 3.5762786865234375e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 9.0, 13.0, 7.0, 20.0, 17.0, 7.0, 14.0, 15.0, 16.0, 25.0, 23.0, 33.0, 23.0, 30.0, 30.0, 35.0, 36.0, 50.0, 45.0, 47.0, 53.0, 53.0, 40.0, 43.0, 28.0, 39.0, 37.0, 33.0, 29.0, 31.0, 26.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.123687744140625, -2.06182861328125, -1.999969482421875, -1.9381103515625, -1.876251220703125, -1.81439208984375, -1.752532958984375, -1.690673828125, -1.628814697265625, -1.56695556640625, -1.505096435546875, -1.4432373046875, -1.381378173828125, -1.31951904296875, -1.257659912109375, -1.19580078125, -1.133941650390625, -1.07208251953125, -1.010223388671875, -0.9483642578125, -0.886505126953125, -0.82464599609375, -0.762786865234375, -0.700927734375, -0.639068603515625, -0.57720947265625, -0.515350341796875, -0.4534912109375, -0.391632080078125, -0.32977294921875, -0.267913818359375, -0.2060546875, -0.144195556640625, -0.08233642578125, -0.020477294921875, 0.0413818359375, 0.103240966796875, 0.16510009765625, 0.226959228515625, 0.288818359375, 0.350677490234375, 0.41253662109375, 0.474395751953125, 0.5362548828125, 0.598114013671875, 0.65997314453125, 0.721832275390625, 0.78369140625, 0.845550537109375, 0.90740966796875, 0.969268798828125, 1.0311279296875, 1.092987060546875, 1.15484619140625, 1.216705322265625, 1.278564453125, 1.340423583984375, 1.40228271484375, 1.464141845703125, 1.5260009765625, 1.587860107421875, 1.64971923828125, 1.711578369140625, 1.7734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 12.0, 10.0, 14.0, 18.0, 41.0, 54.0, 56.0, 96.0, 136.0, 196.0, 274.0, 474.0, 716.0, 1276.0, 2094.0, 3836.0, 7437.0, 15460.0, 34927.0, 98178.0, 328634.0, 368591.0, 112101.0, 39093.0, 16698.0, 8121.0, 4238.0, 2287.0, 1267.0, 817.0, 446.0, 304.0, 196.0, 138.0, 102.0, 73.0, 58.0, 32.0, 17.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9072265625, -1.8392486572265625, -1.771270751953125, -1.7032928466796875, -1.63531494140625, -1.5673370361328125, -1.499359130859375, -1.4313812255859375, -1.3634033203125, -1.2954254150390625, -1.227447509765625, -1.1594696044921875, -1.09149169921875, -1.0235137939453125, -0.955535888671875, -0.8875579833984375, -0.819580078125, -0.7516021728515625, -0.683624267578125, -0.6156463623046875, -0.54766845703125, -0.4796905517578125, -0.411712646484375, -0.3437347412109375, -0.2757568359375, -0.2077789306640625, -0.139801025390625, -0.0718231201171875, -0.00384521484375, 0.0641326904296875, 0.132110595703125, 0.2000885009765625, 0.26806640625, 0.3360443115234375, 0.404022216796875, 0.4720001220703125, 0.53997802734375, 0.6079559326171875, 0.675933837890625, 0.7439117431640625, 0.8118896484375, 0.8798675537109375, 0.947845458984375, 1.0158233642578125, 1.08380126953125, 1.1517791748046875, 1.219757080078125, 1.2877349853515625, 1.355712890625, 1.4236907958984375, 1.491668701171875, 1.5596466064453125, 1.62762451171875, 1.6956024169921875, 1.763580322265625, 1.8315582275390625, 1.8995361328125, 1.9675140380859375, 2.035491943359375, 2.1034698486328125, 2.17144775390625, 2.2394256591796875, 2.307403564453125, 2.3753814697265625, 2.443359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 7.0, 14.0, 13.0, 13.0, 14.0, 16.0, 21.0, 25.0, 26.0, 32.0, 34.0, 40.0, 53.0, 51.0, 48.0, 76.0, 129.0, 1543.0, 382.0, 99.0, 63.0, 44.0, 36.0, 37.0, 33.0, 34.0, 22.0, 25.0, 18.0, 18.0, 18.0, 19.0, 11.0, 4.0, 10.0, 2.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.515625, -7.27984619140625, -7.0440673828125, -6.80828857421875, -6.572509765625, -6.33673095703125, -6.1009521484375, -5.86517333984375, -5.62939453125, -5.39361572265625, -5.1578369140625, -4.92205810546875, -4.686279296875, -4.45050048828125, -4.2147216796875, -3.97894287109375, -3.7431640625, -3.50738525390625, -3.2716064453125, -3.03582763671875, -2.800048828125, -2.56427001953125, -2.3284912109375, -2.09271240234375, -1.85693359375, -1.62115478515625, -1.3853759765625, -1.14959716796875, -0.913818359375, -0.67803955078125, -0.4422607421875, -0.20648193359375, 0.029296875, 0.26507568359375, 0.5008544921875, 0.73663330078125, 0.972412109375, 1.20819091796875, 1.4439697265625, 1.67974853515625, 1.91552734375, 2.15130615234375, 2.3870849609375, 2.62286376953125, 2.858642578125, 3.09442138671875, 3.3302001953125, 3.56597900390625, 3.8017578125, 4.03753662109375, 4.2733154296875, 4.50909423828125, 4.744873046875, 4.98065185546875, 5.2164306640625, 5.45220947265625, 5.68798828125, 5.92376708984375, 6.1595458984375, 6.39532470703125, 6.631103515625, 6.86688232421875, 7.1026611328125, 7.33843994140625, 7.57421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 12.0, 17.0, 21.0, 24.0, 22.0, 39.0, 43.0, 48.0, 66.0, 116.0, 181.0, 342.0, 843.0, 5185.0, 157199.0, 2945351.0, 32345.0, 2371.0, 563.0, 283.0, 147.0, 120.0, 62.0, 53.0, 35.0, 34.0, 37.0, 29.0, 20.0, 11.0, 17.0, 12.0, 2.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4609375, -12.06298828125, -11.6650390625, -11.26708984375, -10.869140625, -10.47119140625, -10.0732421875, -9.67529296875, -9.27734375, -8.87939453125, -8.4814453125, -8.08349609375, -7.685546875, -7.28759765625, -6.8896484375, -6.49169921875, -6.09375, -5.69580078125, -5.2978515625, -4.89990234375, -4.501953125, -4.10400390625, -3.7060546875, -3.30810546875, -2.91015625, -2.51220703125, -2.1142578125, -1.71630859375, -1.318359375, -0.92041015625, -0.5224609375, -0.12451171875, 0.2734375, 0.67138671875, 1.0693359375, 1.46728515625, 1.865234375, 2.26318359375, 2.6611328125, 3.05908203125, 3.45703125, 3.85498046875, 4.2529296875, 4.65087890625, 5.048828125, 5.44677734375, 5.8447265625, 6.24267578125, 6.640625, 7.03857421875, 7.4365234375, 7.83447265625, 8.232421875, 8.63037109375, 9.0283203125, 9.42626953125, 9.82421875, 10.22216796875, 10.6201171875, 11.01806640625, 11.416015625, 11.81396484375, 12.2119140625, 12.60986328125, 13.0078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 9.0, 19.0, 62.0, 130.0, 184.0, 228.0, 187.0, 93.0, 62.0, 19.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.176681518554688, -19.700082778930664, -19.22348403930664, -18.746885299682617, -18.270286560058594, -17.793685913085938, -17.317087173461914, -16.84048843383789, -16.363889694213867, -15.887290954589844, -15.41069221496582, -14.93409252166748, -14.457493782043457, -13.980895042419434, -13.504295349121094, -13.02769660949707, -12.551097869873047, -12.074499130249023, -11.597900390625, -11.12130069732666, -10.644701957702637, -10.168103218078613, -9.691503524780273, -9.21490478515625, -8.738306045532227, -8.261707305908203, -7.7851080894470215, -7.30850887298584, -6.831910133361816, -6.355311393737793, -5.878712177276611, -5.40211296081543, -4.925515174865723, -4.448916435241699, -3.9723172187805176, -3.495718240737915, -3.0191192626953125, -2.54252028465271, -2.0659213066101074, -1.5893223285675049, -1.1127233505249023, -0.6361243724822998, -0.15952539443969727, 0.3170735836029053, 0.7936725616455078, 1.2702715396881104, 1.746870517730713, 2.2234694957733154, 2.700068473815918, 3.1766674518585205, 3.653266429901123, 4.129865646362305, 4.606464385986328, 5.083063125610352, 5.559662342071533, 6.036261558532715, 6.512860298156738, 6.989459037780762, 7.466058254241943, 7.942657470703125, 8.419256210327148, 8.895854949951172, 9.372453689575195, 9.849053382873535, 10.325652122497559]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 8.0, 14.0, 15.0, 15.0, 22.0, 17.0, 33.0, 31.0, 20.0, 26.0, 33.0, 36.0, 39.0, 40.0, 34.0, 44.0, 43.0, 46.0, 53.0, 51.0, 42.0, 46.0, 32.0, 29.0, 27.0, 24.0, 32.0, 29.0, 14.0, 20.0, 10.0, 12.0, 7.0, 8.0, 3.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.622669219970703, -21.874195098876953, -21.125720977783203, -20.377248764038086, -19.628774642944336, -18.880300521850586, -18.13182830810547, -17.38335418701172, -16.63488006591797, -15.886405944824219, -15.137932777404785, -14.389459609985352, -13.640985488891602, -12.892511367797852, -12.144038200378418, -11.395565032958984, -10.647090911865234, -9.898616790771484, -9.15014362335205, -8.401670455932617, -7.653196334838867, -6.904722690582275, -6.156249046325684, -5.407775402069092, -4.6593017578125, -3.910828113555908, -3.1623544692993164, -2.4138808250427246, -1.6654071807861328, -0.916933536529541, -0.16845989227294922, 0.5800137519836426, 1.3284893035888672, 2.076962947845459, 2.825436592102051, 3.5739102363586426, 4.322383880615234, 5.070857524871826, 5.819331169128418, 6.56780481338501, 7.316278457641602, 8.064752578735352, 8.813225746154785, 9.561698913574219, 10.310173034667969, 11.058647155761719, 11.807120323181152, 12.555593490600586, 13.304067611694336, 14.052541732788086, 14.80101490020752, 15.549488067626953, 16.297962188720703, 17.046436309814453, 17.794910430908203, 18.54338264465332, 19.29185676574707, 20.04033088684082, 20.788803100585938, 21.537277221679688, 22.285751342773438, 23.034225463867188, 23.782699584960938, 24.531171798706055, 25.279645919799805]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 12.0, 11.0, 9.0, 13.0, 17.0, 12.0, 14.0, 15.0, 13.0, 29.0, 24.0, 35.0, 33.0, 27.0, 40.0, 39.0, 37.0, 53.0, 39.0, 49.0, 36.0, 49.0, 45.0, 40.0, 51.0, 43.0, 27.0, 32.0, 32.0, 26.0, 18.0, 15.0, 9.0, 11.0, 5.0, 5.0, 9.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.3675994873046875, -2.299652099609375, -2.2317047119140625, -2.16375732421875, -2.0958099365234375, -2.027862548828125, -1.9599151611328125, -1.8919677734375, -1.8240203857421875, -1.756072998046875, -1.6881256103515625, -1.62017822265625, -1.5522308349609375, -1.484283447265625, -1.4163360595703125, -1.348388671875, -1.2804412841796875, -1.212493896484375, -1.1445465087890625, -1.07659912109375, -1.0086517333984375, -0.940704345703125, -0.8727569580078125, -0.8048095703125, -0.7368621826171875, -0.668914794921875, -0.6009674072265625, -0.53302001953125, -0.4650726318359375, -0.397125244140625, -0.3291778564453125, -0.26123046875, -0.1932830810546875, -0.125335693359375, -0.0573883056640625, 0.01055908203125, 0.0785064697265625, 0.146453857421875, 0.2144012451171875, 0.2823486328125, 0.3502960205078125, 0.418243408203125, 0.4861907958984375, 0.55413818359375, 0.6220855712890625, 0.690032958984375, 0.7579803466796875, 0.825927734375, 0.8938751220703125, 0.961822509765625, 1.0297698974609375, 1.09771728515625, 1.1656646728515625, 1.233612060546875, 1.3015594482421875, 1.3695068359375, 1.4374542236328125, 1.505401611328125, 1.5733489990234375, 1.64129638671875, 1.7092437744140625, 1.777191162109375, 1.8451385498046875, 1.9130859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 2.0, 11.0, 7.0, 5.0, 10.0, 10.0, 10.0, 20.0, 14.0, 19.0, 25.0, 21.0, 26.0, 33.0, 50.0, 65.0, 104.0, 330.0, 1407.0, 11399.0, 273402.0, 3590325.0, 302869.0, 11961.0, 1402.0, 272.0, 125.0, 68.0, 48.0, 26.0, 29.0, 29.0, 23.0, 24.0, 20.0, 12.0, 18.0, 10.0, 4.0, 11.0, 5.0, 4.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5859375, -10.27001953125, -9.9541015625, -9.63818359375, -9.322265625, -9.00634765625, -8.6904296875, -8.37451171875, -8.05859375, -7.74267578125, -7.4267578125, -7.11083984375, -6.794921875, -6.47900390625, -6.1630859375, -5.84716796875, -5.53125, -5.21533203125, -4.8994140625, -4.58349609375, -4.267578125, -3.95166015625, -3.6357421875, -3.31982421875, -3.00390625, -2.68798828125, -2.3720703125, -2.05615234375, -1.740234375, -1.42431640625, -1.1083984375, -0.79248046875, -0.4765625, -0.16064453125, 0.1552734375, 0.47119140625, 0.787109375, 1.10302734375, 1.4189453125, 1.73486328125, 2.05078125, 2.36669921875, 2.6826171875, 2.99853515625, 3.314453125, 3.63037109375, 3.9462890625, 4.26220703125, 4.578125, 4.89404296875, 5.2099609375, 5.52587890625, 5.841796875, 6.15771484375, 6.4736328125, 6.78955078125, 7.10546875, 7.42138671875, 7.7373046875, 8.05322265625, 8.369140625, 8.68505859375, 9.0009765625, 9.31689453125, 9.6328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 11.0, 20.0, 43.0, 59.0, 100.0, 185.0, 286.0, 506.0, 699.0, 767.0, 560.0, 353.0, 184.0, 137.0, 67.0, 48.0, 19.0, 17.0, 8.0, 6.0, 4.0], "bins": [-16.46875, -16.152923583984375, -15.83709716796875, -15.521270751953125, -15.2054443359375, -14.889617919921875, -14.57379150390625, -14.257965087890625, -13.942138671875, -13.626312255859375, -13.31048583984375, -12.994659423828125, -12.6788330078125, -12.363006591796875, -12.04718017578125, -11.731353759765625, -11.41552734375, -11.099700927734375, -10.78387451171875, -10.468048095703125, -10.1522216796875, -9.836395263671875, -9.52056884765625, -9.204742431640625, -8.888916015625, -8.573089599609375, -8.25726318359375, -7.941436767578125, -7.6256103515625, -7.309783935546875, -6.99395751953125, -6.678131103515625, -6.3623046875, -6.046478271484375, -5.73065185546875, -5.414825439453125, -5.0989990234375, -4.783172607421875, -4.46734619140625, -4.151519775390625, -3.835693359375, -3.519866943359375, -3.20404052734375, -2.888214111328125, -2.5723876953125, -2.256561279296875, -1.94073486328125, -1.624908447265625, -1.30908203125, -0.993255615234375, -0.67742919921875, -0.361602783203125, -0.0457763671875, 0.270050048828125, 0.58587646484375, 0.901702880859375, 1.217529296875, 1.533355712890625, 1.84918212890625, 2.165008544921875, 2.4808349609375, 2.796661376953125, 3.11248779296875, 3.428314208984375, 3.744140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 18.0, 31.0, 46.0, 96.0, 148.0, 220.0, 400.0, 984.0, 10297.0, 2416651.0, 1755167.0, 8335.0, 930.0, 382.0, 227.0, 135.0, 86.0, 36.0, 34.0, 13.0, 15.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -13.8038330078125, -12.990478515625, -12.1771240234375, -11.36376953125, -10.5504150390625, -9.737060546875, -8.9237060546875, -8.1103515625, -7.2969970703125, -6.483642578125, -5.6702880859375, -4.85693359375, -4.0435791015625, -3.230224609375, -2.4168701171875, -1.603515625, -0.7901611328125, 0.023193359375, 0.8365478515625, 1.64990234375, 2.4632568359375, 3.276611328125, 4.0899658203125, 4.9033203125, 5.7166748046875, 6.530029296875, 7.3433837890625, 8.15673828125, 8.9700927734375, 9.783447265625, 10.5968017578125, 11.41015625, 12.2235107421875, 13.036865234375, 13.8502197265625, 14.66357421875, 15.4769287109375, 16.290283203125, 17.1036376953125, 17.9169921875, 18.7303466796875, 19.543701171875, 20.3570556640625, 21.17041015625, 21.9837646484375, 22.797119140625, 23.6104736328125, 24.423828125, 25.2371826171875, 26.050537109375, 26.8638916015625, 27.67724609375, 28.4906005859375, 29.303955078125, 30.1173095703125, 30.9306640625, 31.7440185546875, 32.557373046875, 33.3707275390625, 34.18408203125, 34.9974365234375, 35.810791015625, 36.6241455078125, 37.4375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 44.0, 100.0, 231.0, 245.0, 220.0, 109.0, 38.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.50689697265625, -67.70074462890625, -65.89459228515625, -64.08843994140625, -62.28228759765625, -60.47613525390625, -58.66998291015625, -56.863834381103516, -55.057682037353516, -53.251529693603516, -51.445377349853516, -49.639225006103516, -47.833072662353516, -46.02692413330078, -44.22077178955078, -42.41461944580078, -40.60846710205078, -38.80231475830078, -36.99616241455078, -35.19001007080078, -33.38385772705078, -31.577707290649414, -29.771554946899414, -27.965404510498047, -26.15924835205078, -24.35309600830078, -22.54694366455078, -20.74079132080078, -18.934640884399414, -17.128488540649414, -15.322336196899414, -13.51618480682373, -11.710033416748047, -9.903881072998047, -8.097729682922363, -6.291577339172363, -4.4854254722595215, -2.6792736053466797, -0.8731212615966797, 0.9330301284790039, 2.739182472229004, 4.545334339141846, 6.3514862060546875, 8.157638549804688, 9.963790893554688, 11.769942283630371, 13.576094627380371, 15.382246017456055, 17.188398361206055, 18.994550704956055, 20.800703048706055, 22.606853485107422, 24.413005828857422, 26.219158172607422, 28.025310516357422, 29.831462860107422, 31.637615203857422, 33.44376754760742, 35.24991989135742, 37.05607223510742, 38.86222457885742, 40.668373107910156, 42.474525451660156, 44.280677795410156, 46.086830139160156]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 6.0, 8.0, 9.0, 14.0, 11.0, 11.0, 18.0, 21.0, 23.0, 31.0, 21.0, 31.0, 26.0, 27.0, 36.0, 34.0, 30.0, 43.0, 44.0, 37.0, 38.0, 52.0, 35.0, 28.0, 22.0, 30.0, 29.0, 38.0, 28.0, 26.0, 18.0, 27.0, 16.0, 17.0, 13.0, 12.0, 12.0, 10.0, 7.0, 4.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.114425659179688, -16.55829620361328, -16.002166748046875, -15.446037292480469, -14.889907836914062, -14.333778381347656, -13.77764892578125, -13.221519470214844, -12.665390014648438, -12.109260559082031, -11.553131103515625, -10.997001647949219, -10.440872192382812, -9.884742736816406, -9.32861328125, -8.772483825683594, -8.216355323791504, -7.660225868225098, -7.104096412658691, -6.547966957092285, -5.991837501525879, -5.435708045959473, -4.879579067230225, -4.323449611663818, -3.767320156097412, -3.211190700531006, -2.6550612449645996, -2.0989320278167725, -1.5428025722503662, -0.98667311668396, -0.4305438995361328, 0.12558555603027344, 0.6817150115966797, 1.237844467163086, 1.7939738035202026, 2.3501031398773193, 2.9062325954437256, 3.462362051010132, 4.018491268157959, 4.574620723724365, 5.1307501792907715, 5.686879634857178, 6.243009090423584, 6.799138069152832, 7.355267524719238, 7.9113969802856445, 8.46752643585205, 9.023655891418457, 9.579785346984863, 10.13591480255127, 10.692044258117676, 11.248173713684082, 11.804303169250488, 12.360432624816895, 12.916561126708984, 13.47269058227539, 14.028820037841797, 14.584949493408203, 15.14107894897461, 15.697208404541016, 16.253337860107422, 16.809467315673828, 17.365596771240234, 17.92172622680664, 18.477855682373047]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 10.0, 16.0, 14.0, 18.0, 19.0, 17.0, 29.0, 23.0, 38.0, 50.0, 39.0, 50.0, 43.0, 44.0, 49.0, 35.0, 41.0, 55.0, 39.0, 36.0, 33.0, 46.0, 38.0, 27.0, 29.0, 18.0, 21.0, 7.0, 14.0, 10.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.662109375, -2.590667724609375, -2.51922607421875, -2.447784423828125, -2.3763427734375, -2.304901123046875, -2.23345947265625, -2.162017822265625, -2.090576171875, -2.019134521484375, -1.94769287109375, -1.876251220703125, -1.8048095703125, -1.733367919921875, -1.66192626953125, -1.590484619140625, -1.51904296875, -1.447601318359375, -1.37615966796875, -1.304718017578125, -1.2332763671875, -1.161834716796875, -1.09039306640625, -1.018951416015625, -0.947509765625, -0.876068115234375, -0.80462646484375, -0.733184814453125, -0.6617431640625, -0.590301513671875, -0.51885986328125, -0.447418212890625, -0.3759765625, -0.304534912109375, -0.23309326171875, -0.161651611328125, -0.0902099609375, -0.018768310546875, 0.05267333984375, 0.124114990234375, 0.195556640625, 0.266998291015625, 0.33843994140625, 0.409881591796875, 0.4813232421875, 0.552764892578125, 0.62420654296875, 0.695648193359375, 0.76708984375, 0.838531494140625, 0.90997314453125, 0.981414794921875, 1.0528564453125, 1.124298095703125, 1.19573974609375, 1.267181396484375, 1.338623046875, 1.410064697265625, 1.48150634765625, 1.552947998046875, 1.6243896484375, 1.695831298828125, 1.76727294921875, 1.838714599609375, 1.91015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 12.0, 20.0, 33.0, 41.0, 56.0, 114.0, 171.0, 288.0, 485.0, 770.0, 1301.0, 2218.0, 3646.0, 6347.0, 10521.0, 17924.0, 31885.0, 60797.0, 127073.0, 320745.0, 245575.0, 102906.0, 50152.0, 27372.0, 15777.0, 9015.0, 5336.0, 3225.0, 1850.0, 1138.0, 693.0, 437.0, 244.0, 139.0, 88.0, 43.0, 46.0, 21.0, 16.0, 10.0, 11.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.4909400939941406, -0.47553253173828125, -0.4601249694824219, -0.4447174072265625, -0.4293098449707031, -0.41390228271484375, -0.3984947204589844, -0.383087158203125, -0.3676795959472656, -0.35227203369140625, -0.3368644714355469, -0.3214569091796875, -0.3060493469238281, -0.29064178466796875, -0.2752342224121094, -0.25982666015625, -0.24441909790039062, -0.22901153564453125, -0.21360397338867188, -0.1981964111328125, -0.18278884887695312, -0.16738128662109375, -0.15197372436523438, -0.136566162109375, -0.12115859985351562, -0.10575103759765625, -0.09034347534179688, -0.0749359130859375, -0.059528350830078125, -0.04412078857421875, -0.028713226318359375, -0.0133056640625, 0.002101898193359375, 0.01750946044921875, 0.032917022705078125, 0.0483245849609375, 0.06373214721679688, 0.07913970947265625, 0.09454727172851562, 0.109954833984375, 0.12536239624023438, 0.14076995849609375, 0.15617752075195312, 0.1715850830078125, 0.18699264526367188, 0.20240020751953125, 0.21780776977539062, 0.23321533203125, 0.24862289428710938, 0.26403045654296875, 0.2794380187988281, 0.2948455810546875, 0.3102531433105469, 0.32566070556640625, 0.3410682678222656, 0.356475830078125, 0.3718833923339844, 0.38729095458984375, 0.4026985168457031, 0.4181060791015625, 0.4335136413574219, 0.44892120361328125, 0.4643287658691406, 0.479736328125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 10.0, 7.0, 10.0, 13.0, 22.0, 12.0, 14.0, 23.0, 25.0, 26.0, 30.0, 35.0, 37.0, 37.0, 31.0, 43.0, 35.0, 32.0, 37.0, 1064.0, 27.0, 32.0, 44.0, 37.0, 33.0, 29.0, 36.0, 24.0, 28.0, 25.0, 25.0, 23.0, 17.0, 16.0, 16.0, 6.0, 6.0, 9.0, 11.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3583984375, -1.3172760009765625, -1.276153564453125, -1.2350311279296875, -1.19390869140625, -1.1527862548828125, -1.111663818359375, -1.0705413818359375, -1.0294189453125, -0.9882965087890625, -0.947174072265625, -0.9060516357421875, -0.86492919921875, -0.8238067626953125, -0.782684326171875, -0.7415618896484375, -0.700439453125, -0.6593170166015625, -0.618194580078125, -0.5770721435546875, -0.53594970703125, -0.4948272705078125, -0.453704833984375, -0.4125823974609375, -0.3714599609375, -0.3303375244140625, -0.289215087890625, -0.2480926513671875, -0.20697021484375, -0.1658477783203125, -0.124725341796875, -0.0836029052734375, -0.04248046875, -0.0013580322265625, 0.039764404296875, 0.0808868408203125, 0.12200927734375, 0.1631317138671875, 0.204254150390625, 0.2453765869140625, 0.2864990234375, 0.3276214599609375, 0.368743896484375, 0.4098663330078125, 0.45098876953125, 0.4921112060546875, 0.533233642578125, 0.5743560791015625, 0.615478515625, 0.6566009521484375, 0.697723388671875, 0.7388458251953125, 0.77996826171875, 0.8210906982421875, 0.862213134765625, 0.9033355712890625, 0.9444580078125, 0.9855804443359375, 1.026702880859375, 1.0678253173828125, 1.10894775390625, 1.1500701904296875, 1.191192626953125, 1.2323150634765625, 1.2734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 5.0, 9.0, 15.0, 22.0, 35.0, 40.0, 63.0, 110.0, 152.0, 190.0, 331.0, 440.0, 642.0, 885.0, 1219.0, 1738.0, 2416.0, 3516.0, 4800.0, 6669.0, 9396.0, 13324.0, 18943.0, 27182.0, 40491.0, 61636.0, 100250.0, 189570.0, 1277059.0, 118268.0, 69913.0, 45503.0, 30412.0, 20984.0, 14722.0, 10340.0, 7371.0, 5184.0, 3813.0, 2759.0, 1913.0, 1351.0, 1088.0, 655.0, 506.0, 395.0, 252.0, 173.0, 116.0, 83.0, 57.0, 39.0, 30.0, 22.0, 14.0, 9.0, 13.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.2744140625, -0.26560211181640625, -0.2567901611328125, -0.24797821044921875, -0.239166259765625, -0.23035430908203125, -0.2215423583984375, -0.21273040771484375, -0.20391845703125, -0.19510650634765625, -0.1862945556640625, -0.17748260498046875, -0.168670654296875, -0.15985870361328125, -0.1510467529296875, -0.14223480224609375, -0.1334228515625, -0.12461090087890625, -0.1157989501953125, -0.10698699951171875, -0.098175048828125, -0.08936309814453125, -0.0805511474609375, -0.07173919677734375, -0.06292724609375, -0.05411529541015625, -0.0453033447265625, -0.03649139404296875, -0.027679443359375, -0.01886749267578125, -0.0100555419921875, -0.00124359130859375, 0.007568359375, 0.01638031005859375, 0.0251922607421875, 0.03400421142578125, 0.042816162109375, 0.05162811279296875, 0.0604400634765625, 0.06925201416015625, 0.07806396484375, 0.08687591552734375, 0.0956878662109375, 0.10449981689453125, 0.113311767578125, 0.12212371826171875, 0.1309356689453125, 0.13974761962890625, 0.1485595703125, 0.15737152099609375, 0.1661834716796875, 0.17499542236328125, 0.183807373046875, 0.19261932373046875, 0.2014312744140625, 0.21024322509765625, 0.21905517578125, 0.22786712646484375, 0.2366790771484375, 0.24549102783203125, 0.254302978515625, 0.26311492919921875, 0.2719268798828125, 0.28073883056640625, 0.28955078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 10.0, 10.0, 8.0, 16.0, 18.0, 21.0, 39.0, 27.0, 33.0, 42.0, 68.0, 55.0, 53.0, 64.0, 69.0, 54.0, 63.0, 48.0, 50.0, 37.0, 27.0, 43.0, 19.0, 21.0, 16.0, 14.0, 16.0, 12.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.920099258422852e-05, -6.668083369731903e-05, -6.416067481040955e-05, -6.164051592350006e-05, -5.9120357036590576e-05, -5.660019814968109e-05, -5.4080039262771606e-05, -5.155988037586212e-05, -4.903972148895264e-05, -4.651956260204315e-05, -4.399940371513367e-05, -4.147924482822418e-05, -3.89590859413147e-05, -3.643892705440521e-05, -3.391876816749573e-05, -3.139860928058624e-05, -2.8878450393676758e-05, -2.6358291506767273e-05, -2.3838132619857788e-05, -2.1317973732948303e-05, -1.879781484603882e-05, -1.6277655959129333e-05, -1.3757497072219849e-05, -1.1237338185310364e-05, -8.717179298400879e-06, -6.197020411491394e-06, -3.676861524581909e-06, -1.1567026376724243e-06, 1.3634562492370605e-06, 3.883615136146545e-06, 6.40377402305603e-06, 8.923932909965515e-06, 1.1444091796875e-05, 1.3964250683784485e-05, 1.648440957069397e-05, 1.9004568457603455e-05, 2.152472734451294e-05, 2.4044886231422424e-05, 2.656504511833191e-05, 2.9085204005241394e-05, 3.160536289215088e-05, 3.4125521779060364e-05, 3.664568066596985e-05, 3.9165839552879333e-05, 4.168599843978882e-05, 4.42061573266983e-05, 4.672631621360779e-05, 4.924647510051727e-05, 5.176663398742676e-05, 5.428679287433624e-05, 5.680695176124573e-05, 5.932711064815521e-05, 6.18472695350647e-05, 6.436742842197418e-05, 6.688758730888367e-05, 6.940774619579315e-05, 7.192790508270264e-05, 7.444806396961212e-05, 7.69682228565216e-05, 7.948838174343109e-05, 8.200854063034058e-05, 8.452869951725006e-05, 8.704885840415955e-05, 8.956901729106903e-05, 9.208917617797852e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 8.0, 9.0, 8.0, 10.0, 20.0, 33.0, 35.0, 57.0, 65.0, 75.0, 111.0, 171.0, 286.0, 469.0, 899.0, 135450.0, 907729.0, 1677.0, 511.0, 252.0, 213.0, 92.0, 111.0, 64.0, 47.0, 42.0, 22.0, 17.0, 12.0, 16.0, 11.0, 8.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0017881393432617188, -0.001735791563987732, -0.0016834437847137451, -0.0016310960054397583, -0.0015787482261657715, -0.0015264004468917847, -0.0014740526676177979, -0.001421704888343811, -0.0013693571090698242, -0.0013170093297958374, -0.0012646615505218506, -0.0012123137712478638, -0.001159965991973877, -0.0011076182126998901, -0.0010552704334259033, -0.0010029226541519165, -0.0009505748748779297, -0.0008982270956039429, -0.0008458793163299561, -0.0007935315370559692, -0.0007411837577819824, -0.0006888359785079956, -0.0006364881992340088, -0.000584140419960022, -0.0005317926406860352, -0.00047944486141204834, -0.0004270970821380615, -0.0003747493028640747, -0.0003224015235900879, -0.0002700537443161011, -0.00021770596504211426, -0.00016535818576812744, -0.00011301040649414062, -6.066262722015381e-05, -8.314847946166992e-06, 4.4032931327819824e-05, 9.638071060180664e-05, 0.00014872848987579346, 0.00020107626914978027, 0.0002534240484237671, 0.0003057718276977539, 0.0003581196069717407, 0.00041046738624572754, 0.00046281516551971436, 0.0005151629447937012, 0.000567510724067688, 0.0006198585033416748, 0.0006722062826156616, 0.0007245540618896484, 0.0007769018411636353, 0.0008292496204376221, 0.0008815973997116089, 0.0009339451789855957, 0.0009862929582595825, 0.0010386407375335693, 0.0010909885168075562, 0.001143336296081543, 0.0011956840753555298, 0.0012480318546295166, 0.0013003796339035034, 0.0013527274131774902, 0.001405075192451477, 0.0014574229717254639, 0.0015097707509994507, 0.0015621185302734375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 18.0, 74.0, 200.0, 315.0, 251.0, 106.0, 32.0, 9.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014139461563900113, -0.00013720209244638681, -0.0001330095692537725, -0.00012881704606115818, -0.00012462452286854386, -0.00012043199967592955, -0.00011623947648331523, -0.00011204695329070091, -0.0001078544300980866, -0.00010366190690547228, -9.946938371285796e-05, -9.527686052024364e-05, -9.108433732762933e-05, -8.689181413501501e-05, -8.26992909424007e-05, -7.850676774978638e-05, -7.431424455717206e-05, -7.012172136455774e-05, -6.592919817194343e-05, -6.173667497932911e-05, -5.754415178671479e-05, -5.3351628594100475e-05, -4.915910540148616e-05, -4.496658220887184e-05, -4.0774059016257524e-05, -3.658153582364321e-05, -3.238901263102889e-05, -2.8196489438414574e-05, -2.4003966245800257e-05, -1.981144305318594e-05, -1.5618919860571623e-05, -1.1426396667957306e-05, -7.233888027258217e-06, -3.0413648346439004e-06, 1.1511583579704165e-06, 5.3436815505847335e-06, 9.53620474319905e-06, 1.3728727935813367e-05, 1.7921251128427684e-05, 2.2113774321042e-05, 2.6306297513656318e-05, 3.0498820706270635e-05, 3.469134389888495e-05, 3.888386709149927e-05, 4.3076390284113586e-05, 4.72689134767279e-05, 5.146143666934222e-05, 5.565395986195654e-05, 5.9846483054570854e-05, 6.403900624718517e-05, 6.823152943979949e-05, 7.24240526324138e-05, 7.661657582502812e-05, 8.080909901764244e-05, 8.500162221025676e-05, 8.919414540287107e-05, 9.338666859548539e-05, 9.75791917880997e-05, 0.00010177171498071402, 0.00010596423817332834, 0.00011015676136594266, 0.00011434928455855697, 0.00011854180775117129, 0.0001227343309437856, 0.00012692685413639992]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 7.0, 11.0, 12.0, 15.0, 12.0, 16.0, 13.0, 24.0, 24.0, 40.0, 29.0, 30.0, 36.0, 43.0, 35.0, 39.0, 40.0, 44.0, 20.0, 42.0, 46.0, 39.0, 36.0, 38.0, 39.0, 37.0, 27.0, 33.0, 29.0, 19.0, 19.0, 16.0, 14.0, 14.0, 8.0, 8.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.993511199951172e-05, -3.862474113702774e-05, -3.731437027454376e-05, -3.6003999412059784e-05, -3.4693628549575806e-05, -3.338325768709183e-05, -3.207288682460785e-05, -3.076251596212387e-05, -2.9452145099639893e-05, -2.8141774237155914e-05, -2.6831403374671936e-05, -2.5521032512187958e-05, -2.421066164970398e-05, -2.290029078722e-05, -2.1589919924736023e-05, -2.0279549062252045e-05, -1.8969178199768066e-05, -1.7658807337284088e-05, -1.634843647480011e-05, -1.5038065612316132e-05, -1.3727694749832153e-05, -1.2417323887348175e-05, -1.1106953024864197e-05, -9.796582162380219e-06, -8.48621129989624e-06, -7.175840437412262e-06, -5.865469574928284e-06, -4.555098712444305e-06, -3.244727849960327e-06, -1.934356987476349e-06, -6.239861249923706e-07, 6.863847374916077e-07, 1.996755599975586e-06, 3.307126462459564e-06, 4.6174973249435425e-06, 5.927868187427521e-06, 7.238239049911499e-06, 8.548609912395477e-06, 9.858980774879456e-06, 1.1169351637363434e-05, 1.2479722499847412e-05, 1.379009336233139e-05, 1.5100464224815369e-05, 1.6410835087299347e-05, 1.7721205949783325e-05, 1.9031576812267303e-05, 2.0341947674751282e-05, 2.165231853723526e-05, 2.2962689399719238e-05, 2.4273060262203217e-05, 2.5583431124687195e-05, 2.6893801987171173e-05, 2.820417284965515e-05, 2.951454371213913e-05, 3.082491457462311e-05, 3.2135285437107086e-05, 3.3445656299591064e-05, 3.475602716207504e-05, 3.606639802455902e-05, 3.7376768887043e-05, 3.868713974952698e-05, 3.9997510612010956e-05, 4.1307881474494934e-05, 4.261825233697891e-05, 4.392862319946289e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 10.0, 16.0, 14.0, 18.0, 19.0, 17.0, 29.0, 23.0, 38.0, 50.0, 39.0, 50.0, 43.0, 44.0, 49.0, 35.0, 41.0, 55.0, 39.0, 36.0, 33.0, 46.0, 38.0, 27.0, 29.0, 18.0, 21.0, 7.0, 14.0, 10.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.662109375, -2.590667724609375, -2.51922607421875, -2.447784423828125, -2.3763427734375, -2.304901123046875, -2.23345947265625, -2.162017822265625, -2.090576171875, -2.019134521484375, -1.94769287109375, -1.876251220703125, -1.8048095703125, -1.733367919921875, -1.66192626953125, -1.590484619140625, -1.51904296875, -1.447601318359375, -1.37615966796875, -1.304718017578125, -1.2332763671875, -1.161834716796875, -1.09039306640625, -1.018951416015625, -0.947509765625, -0.876068115234375, -0.80462646484375, -0.733184814453125, -0.6617431640625, -0.590301513671875, -0.51885986328125, -0.447418212890625, -0.3759765625, -0.304534912109375, -0.23309326171875, -0.161651611328125, -0.0902099609375, -0.018768310546875, 0.05267333984375, 0.124114990234375, 0.195556640625, 0.266998291015625, 0.33843994140625, 0.409881591796875, 0.4813232421875, 0.552764892578125, 0.62420654296875, 0.695648193359375, 0.76708984375, 0.838531494140625, 0.90997314453125, 0.981414794921875, 1.0528564453125, 1.124298095703125, 1.19573974609375, 1.267181396484375, 1.338623046875, 1.410064697265625, 1.48150634765625, 1.552947998046875, 1.6243896484375, 1.695831298828125, 1.76727294921875, 1.838714599609375, 1.91015625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 7.0, 20.0, 24.0, 28.0, 44.0, 46.0, 83.0, 89.0, 124.0, 160.0, 265.0, 432.0, 600.0, 1161.0, 2082.0, 4168.0, 9598.0, 27434.0, 103100.0, 415593.0, 357992.0, 84778.0, 23181.0, 8720.0, 3802.0, 1931.0, 1132.0, 624.0, 429.0, 267.0, 180.0, 126.0, 94.0, 60.0, 42.0, 32.0, 20.0, 17.0, 17.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.6883544921875, -2.609130859375, -2.5299072265625, -2.45068359375, -2.3714599609375, -2.292236328125, -2.2130126953125, -2.1337890625, -2.0545654296875, -1.975341796875, -1.8961181640625, -1.81689453125, -1.7376708984375, -1.658447265625, -1.5792236328125, -1.5, -1.4207763671875, -1.341552734375, -1.2623291015625, -1.18310546875, -1.1038818359375, -1.024658203125, -0.9454345703125, -0.8662109375, -0.7869873046875, -0.707763671875, -0.6285400390625, -0.54931640625, -0.4700927734375, -0.390869140625, -0.3116455078125, -0.232421875, -0.1531982421875, -0.073974609375, 0.0052490234375, 0.08447265625, 0.1636962890625, 0.242919921875, 0.3221435546875, 0.4013671875, 0.4805908203125, 0.559814453125, 0.6390380859375, 0.71826171875, 0.7974853515625, 0.876708984375, 0.9559326171875, 1.03515625, 1.1143798828125, 1.193603515625, 1.2728271484375, 1.35205078125, 1.4312744140625, 1.510498046875, 1.5897216796875, 1.6689453125, 1.7481689453125, 1.827392578125, 1.9066162109375, 1.98583984375, 2.0650634765625, 2.144287109375, 2.2235107421875, 2.302734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 3.0, 9.0, 10.0, 11.0, 7.0, 9.0, 16.0, 17.0, 18.0, 29.0, 26.0, 37.0, 26.0, 32.0, 37.0, 47.0, 54.0, 54.0, 197.0, 1701.0, 210.0, 70.0, 46.0, 58.0, 37.0, 47.0, 38.0, 31.0, 22.0, 26.0, 27.0, 19.0, 12.0, 16.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.376708984375, -6.13623046875, -5.895751953125, -5.6552734375, -5.414794921875, -5.17431640625, -4.933837890625, -4.693359375, -4.452880859375, -4.21240234375, -3.971923828125, -3.7314453125, -3.490966796875, -3.25048828125, -3.010009765625, -2.76953125, -2.529052734375, -2.28857421875, -2.048095703125, -1.8076171875, -1.567138671875, -1.32666015625, -1.086181640625, -0.845703125, -0.605224609375, -0.36474609375, -0.124267578125, 0.1162109375, 0.356689453125, 0.59716796875, 0.837646484375, 1.078125, 1.318603515625, 1.55908203125, 1.799560546875, 2.0400390625, 2.280517578125, 2.52099609375, 2.761474609375, 3.001953125, 3.242431640625, 3.48291015625, 3.723388671875, 3.9638671875, 4.204345703125, 4.44482421875, 4.685302734375, 4.92578125, 5.166259765625, 5.40673828125, 5.647216796875, 5.8876953125, 6.128173828125, 6.36865234375, 6.609130859375, 6.849609375, 7.090087890625, 7.33056640625, 7.571044921875, 7.8115234375, 8.052001953125, 8.29248046875, 8.532958984375, 8.7734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 11.0, 24.0, 24.0, 31.0, 36.0, 61.0, 71.0, 105.0, 182.0, 345.0, 934.0, 4902.0, 431975.0, 2695044.0, 9714.0, 1206.0, 398.0, 220.0, 111.0, 77.0, 40.0, 38.0, 30.0, 23.0, 15.0, 16.0, 14.0, 11.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0703125, -14.60107421875, -14.1318359375, -13.66259765625, -13.193359375, -12.72412109375, -12.2548828125, -11.78564453125, -11.31640625, -10.84716796875, -10.3779296875, -9.90869140625, -9.439453125, -8.97021484375, -8.5009765625, -8.03173828125, -7.5625, -7.09326171875, -6.6240234375, -6.15478515625, -5.685546875, -5.21630859375, -4.7470703125, -4.27783203125, -3.80859375, -3.33935546875, -2.8701171875, -2.40087890625, -1.931640625, -1.46240234375, -0.9931640625, -0.52392578125, -0.0546875, 0.41455078125, 0.8837890625, 1.35302734375, 1.822265625, 2.29150390625, 2.7607421875, 3.22998046875, 3.69921875, 4.16845703125, 4.6376953125, 5.10693359375, 5.576171875, 6.04541015625, 6.5146484375, 6.98388671875, 7.453125, 7.92236328125, 8.3916015625, 8.86083984375, 9.330078125, 9.79931640625, 10.2685546875, 10.73779296875, 11.20703125, 11.67626953125, 12.1455078125, 12.61474609375, 13.083984375, 13.55322265625, 14.0224609375, 14.49169921875, 14.9609375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 61.0, 830.0, 123.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6708807945251465, -4.1117095947265625, -1.5525383949279785, 1.0066328048706055, 3.5658040046691895, 6.124975681304932, 8.684146881103516, 11.243316650390625, 13.802488327026367, 16.36166000366211, 18.92082977294922, 21.48000144958496, 24.039173126220703, 26.598344802856445, 29.157516479492188, 31.716686248779297, 34.27585983276367, 36.83502960205078, 39.394203186035156, 41.953372955322266, 44.512542724609375, 47.07171630859375, 49.63088607788086, 52.19005584716797, 54.749229431152344, 57.30839920043945, 59.86757278442383, 62.42674255371094, 64.98591613769531, 67.54508972167969, 70.10425567626953, 72.6634292602539, 75.22259521484375, 77.78176879882812, 80.34093475341797, 82.90010833740234, 85.45928192138672, 88.01844787597656, 90.57762145996094, 93.13679504394531, 95.69596862792969, 98.25514221191406, 100.8143081665039, 103.37348175048828, 105.93265533447266, 108.4918212890625, 111.05099487304688, 113.61016845703125, 116.1693344116211, 118.72850799560547, 121.28767395019531, 123.84684753417969, 126.40602111816406, 128.96519470214844, 131.5243682861328, 134.08352661132812, 136.6427001953125, 139.20187377929688, 141.76104736328125, 144.32022094726562, 146.87937927246094, 149.4385528564453, 151.9977264404297, 154.55690002441406, 157.11607360839844]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 11.0, 12.0, 10.0, 19.0, 15.0, 28.0, 33.0, 26.0, 35.0, 39.0, 43.0, 42.0, 41.0, 40.0, 41.0, 50.0, 38.0, 44.0, 41.0, 39.0, 46.0, 32.0, 37.0, 45.0, 37.0, 22.0, 20.0, 16.0, 19.0, 12.0, 6.0, 10.0, 4.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.410625457763672, -24.621408462524414, -23.832191467285156, -23.0429744720459, -22.25375747680664, -21.464542388916016, -20.675325393676758, -19.8861083984375, -19.096891403198242, -18.307674407958984, -17.518457412719727, -16.72924041748047, -15.940024375915527, -15.15080738067627, -14.361591339111328, -13.57237434387207, -12.783157348632812, -11.993940353393555, -11.204723358154297, -10.415507316589355, -9.626290321350098, -8.83707332611084, -8.047857284545898, -7.258640289306641, -6.469423294067383, -5.680206298828125, -4.890989780426025, -4.101773262023926, -3.312556266784668, -2.5233395099639893, -1.7341227531433105, -0.9449062347412109, -0.15568923950195312, 0.6335275173187256, 1.4227442741394043, 2.211961030960083, 3.0011777877807617, 3.7903945446014404, 4.579611301422119, 5.368827819824219, 6.158044815063477, 6.947261810302734, 7.736478328704834, 8.525694847106934, 9.314911842346191, 10.10412883758545, 10.89334487915039, 11.682561874389648, 12.471778869628906, 13.260995864868164, 14.050212860107422, 14.839428901672363, 15.628645896911621, 16.417861938476562, 17.20707893371582, 17.996295928955078, 18.785512924194336, 19.574729919433594, 20.36394691467285, 21.15316390991211, 21.942378997802734, 22.731595993041992, 23.52081298828125, 24.310029983520508, 25.099246978759766]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 4.0, 6.0, 10.0, 12.0, 14.0, 19.0, 20.0, 12.0, 14.0, 18.0, 23.0, 26.0, 27.0, 34.0, 33.0, 53.0, 34.0, 52.0, 47.0, 45.0, 43.0, 44.0, 47.0, 45.0, 35.0, 34.0, 56.0, 32.0, 24.0, 26.0, 17.0, 25.0, 13.0, 10.0, 5.0, 7.0, 7.0, 6.0, 11.0, 1.0, 0.0, 4.0, 2.0, 3.0], "bins": [-2.92578125, -2.8514556884765625, -2.777130126953125, -2.7028045654296875, -2.62847900390625, -2.5541534423828125, -2.479827880859375, -2.4055023193359375, -2.3311767578125, -2.2568511962890625, -2.182525634765625, -2.1082000732421875, -2.03387451171875, -1.9595489501953125, -1.885223388671875, -1.8108978271484375, -1.736572265625, -1.6622467041015625, -1.587921142578125, -1.5135955810546875, -1.43927001953125, -1.3649444580078125, -1.290618896484375, -1.2162933349609375, -1.1419677734375, -1.0676422119140625, -0.993316650390625, -0.9189910888671875, -0.84466552734375, -0.7703399658203125, -0.696014404296875, -0.6216888427734375, -0.54736328125, -0.4730377197265625, -0.398712158203125, -0.3243865966796875, -0.25006103515625, -0.1757354736328125, -0.101409912109375, -0.0270843505859375, 0.0472412109375, 0.1215667724609375, 0.195892333984375, 0.2702178955078125, 0.34454345703125, 0.4188690185546875, 0.493194580078125, 0.5675201416015625, 0.641845703125, 0.7161712646484375, 0.790496826171875, 0.8648223876953125, 0.93914794921875, 1.0134735107421875, 1.087799072265625, 1.1621246337890625, 1.2364501953125, 1.3107757568359375, 1.385101318359375, 1.4594268798828125, 1.53375244140625, 1.6080780029296875, 1.682403564453125, 1.7567291259765625, 1.8310546875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 14.0, 21.0, 17.0, 36.0, 34.0, 33.0, 54.0, 83.0, 115.0, 227.0, 441.0, 951.0, 2538.0, 8113.0, 30121.0, 147084.0, 992768.0, 2233312.0, 645707.0, 100963.0, 21946.0, 6151.0, 1940.0, 753.0, 305.0, 142.0, 116.0, 74.0, 48.0, 37.0, 23.0, 20.0, 20.0, 13.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-5.25390625, -5.1094970703125, -4.965087890625, -4.8206787109375, -4.67626953125, -4.5318603515625, -4.387451171875, -4.2430419921875, -4.0986328125, -3.9542236328125, -3.809814453125, -3.6654052734375, -3.52099609375, -3.3765869140625, -3.232177734375, -3.0877685546875, -2.943359375, -2.7989501953125, -2.654541015625, -2.5101318359375, -2.36572265625, -2.2213134765625, -2.076904296875, -1.9324951171875, -1.7880859375, -1.6436767578125, -1.499267578125, -1.3548583984375, -1.21044921875, -1.0660400390625, -0.921630859375, -0.7772216796875, -0.6328125, -0.4884033203125, -0.343994140625, -0.1995849609375, -0.05517578125, 0.0892333984375, 0.233642578125, 0.3780517578125, 0.5224609375, 0.6668701171875, 0.811279296875, 0.9556884765625, 1.10009765625, 1.2445068359375, 1.388916015625, 1.5333251953125, 1.677734375, 1.8221435546875, 1.966552734375, 2.1109619140625, 2.25537109375, 2.3997802734375, 2.544189453125, 2.6885986328125, 2.8330078125, 2.9774169921875, 3.121826171875, 3.2662353515625, 3.41064453125, 3.5550537109375, 3.699462890625, 3.8438720703125, 3.98828125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 31.0, 39.0, 94.0, 181.0, 323.0, 627.0, 974.0, 806.0, 464.0, 273.0, 117.0, 58.0, 32.0, 17.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -16.04931640625, -15.6455078125, -15.24169921875, -14.837890625, -14.43408203125, -14.0302734375, -13.62646484375, -13.22265625, -12.81884765625, -12.4150390625, -12.01123046875, -11.607421875, -11.20361328125, -10.7998046875, -10.39599609375, -9.9921875, -9.58837890625, -9.1845703125, -8.78076171875, -8.376953125, -7.97314453125, -7.5693359375, -7.16552734375, -6.76171875, -6.35791015625, -5.9541015625, -5.55029296875, -5.146484375, -4.74267578125, -4.3388671875, -3.93505859375, -3.53125, -3.12744140625, -2.7236328125, -2.31982421875, -1.916015625, -1.51220703125, -1.1083984375, -0.70458984375, -0.30078125, 0.10302734375, 0.5068359375, 0.91064453125, 1.314453125, 1.71826171875, 2.1220703125, 2.52587890625, 2.9296875, 3.33349609375, 3.7373046875, 4.14111328125, 4.544921875, 4.94873046875, 5.3525390625, 5.75634765625, 6.16015625, 6.56396484375, 6.9677734375, 7.37158203125, 7.775390625, 8.17919921875, 8.5830078125, 8.98681640625, 9.390625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 10.0, 11.0, 26.0, 30.0, 70.0, 155.0, 293.0, 947.0, 24119.0, 4097448.0, 69170.0, 1297.0, 334.0, 154.0, 88.0, 57.0, 19.0, 19.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.50048828125, -21.4072265625, -20.31396484375, -19.220703125, -18.12744140625, -17.0341796875, -15.94091796875, -14.84765625, -13.75439453125, -12.6611328125, -11.56787109375, -10.474609375, -9.38134765625, -8.2880859375, -7.19482421875, -6.1015625, -5.00830078125, -3.9150390625, -2.82177734375, -1.728515625, -0.63525390625, 0.4580078125, 1.55126953125, 2.64453125, 3.73779296875, 4.8310546875, 5.92431640625, 7.017578125, 8.11083984375, 9.2041015625, 10.29736328125, 11.390625, 12.48388671875, 13.5771484375, 14.67041015625, 15.763671875, 16.85693359375, 17.9501953125, 19.04345703125, 20.13671875, 21.22998046875, 22.3232421875, 23.41650390625, 24.509765625, 25.60302734375, 26.6962890625, 27.78955078125, 28.8828125, 29.97607421875, 31.0693359375, 32.16259765625, 33.255859375, 34.34912109375, 35.4423828125, 36.53564453125, 37.62890625, 38.72216796875, 39.8154296875, 40.90869140625, 42.001953125, 43.09521484375, 44.1884765625, 45.28173828125, 46.375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 22.0, 62.0, 128.0, 199.0, 208.0, 201.0, 108.0, 46.0, 23.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.61354446411133, -51.95621871948242, -50.29888916015625, -48.641563415527344, -46.98423767089844, -45.326908111572266, -43.66958236694336, -42.01225280761719, -40.35492706298828, -38.697601318359375, -37.0402717590332, -35.3829460144043, -33.725616455078125, -32.06829071044922, -30.410964965820312, -28.753637313842773, -27.096309661865234, -25.438982009887695, -23.781654357910156, -22.12432861328125, -20.46700096130371, -18.809673309326172, -17.152347564697266, -15.495019912719727, -13.837692260742188, -12.180364608764648, -10.523037910461426, -8.865711212158203, -7.208383560180664, -5.551055908203125, -3.8937292098999023, -2.2364025115966797, -0.5790748596191406, 1.0782523155212402, 2.735579490661621, 4.392906665802002, 6.050233840942383, 7.707561492919922, 9.364888191223145, 11.022214889526367, 12.679542541503906, 14.336870193481445, 15.994196891784668, 17.65152359008789, 19.30885124206543, 20.96617889404297, 22.623504638671875, 24.280832290649414, 25.938159942626953, 27.595487594604492, 29.25281524658203, 30.910140991210938, 32.567466735839844, 34.224796295166016, 35.88212203979492, 37.539451599121094, 39.19677734375, 40.854103088378906, 42.51143264770508, 44.168758392333984, 45.826087951660156, 47.48341369628906, 49.14073944091797, 50.798065185546875, 52.45539474487305]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 11.0, 7.0, 10.0, 12.0, 13.0, 15.0, 15.0, 17.0, 25.0, 38.0, 34.0, 29.0, 40.0, 35.0, 45.0, 46.0, 35.0, 41.0, 39.0, 38.0, 46.0, 43.0, 39.0, 45.0, 30.0, 25.0, 29.0, 29.0, 41.0, 17.0, 21.0, 23.0, 13.0, 12.0, 14.0, 4.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.47956657409668, -21.828731536865234, -21.177898406982422, -20.527063369750977, -19.87622833251953, -19.22539520263672, -18.574560165405273, -17.923725128173828, -17.272891998291016, -16.62205696105957, -15.971222877502441, -15.320388793945312, -14.669554710388184, -14.018720626831055, -13.36788558959961, -12.71705150604248, -12.066216468811035, -11.415382385253906, -10.764547348022461, -10.113713264465332, -9.462879180908203, -8.812044143676758, -8.161210060119629, -7.5103759765625, -6.859541416168213, -6.208706855773926, -5.557872772216797, -4.90703821182251, -4.256203651428223, -3.6053695678710938, -2.9545350074768066, -2.3037009239196777, -1.6528663635253906, -1.0020320415496826, -0.35119760036468506, 0.2996368408203125, 0.9504711627960205, 1.6013054847717285, 2.2521400451660156, 2.9029741287231445, 3.5538086891174316, 4.204643249511719, 4.855477333068848, 5.506311893463135, 6.157146453857422, 6.807980537414551, 7.458815097808838, 8.109649658203125, 8.760483741760254, 9.411317825317383, 10.062152862548828, 10.712986946105957, 11.363821029663086, 12.014656066894531, 12.66549015045166, 13.316324234008789, 13.967159271240234, 14.617993354797363, 15.268828392028809, 15.919662475585938, 16.570497512817383, 17.221330642700195, 17.87216567993164, 18.522998809814453, 19.1738338470459]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 16.0, 14.0, 12.0, 21.0, 16.0, 25.0, 30.0, 37.0, 36.0, 42.0, 54.0, 44.0, 45.0, 50.0, 50.0, 52.0, 43.0, 41.0, 47.0, 42.0, 42.0, 39.0, 23.0, 29.0, 24.0, 10.0, 18.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.232421875, -3.1514434814453125, -3.070465087890625, -2.9894866943359375, -2.90850830078125, -2.8275299072265625, -2.746551513671875, -2.6655731201171875, -2.5845947265625, -2.5036163330078125, -2.422637939453125, -2.3416595458984375, -2.26068115234375, -2.1797027587890625, -2.098724365234375, -2.0177459716796875, -1.936767578125, -1.8557891845703125, -1.774810791015625, -1.6938323974609375, -1.61285400390625, -1.5318756103515625, -1.450897216796875, -1.3699188232421875, -1.2889404296875, -1.2079620361328125, -1.126983642578125, -1.0460052490234375, -0.96502685546875, -0.8840484619140625, -0.803070068359375, -0.7220916748046875, -0.64111328125, -0.5601348876953125, -0.479156494140625, -0.3981781005859375, -0.31719970703125, -0.2362213134765625, -0.155242919921875, -0.0742645263671875, 0.0067138671875, 0.0876922607421875, 0.168670654296875, 0.2496490478515625, 0.33062744140625, 0.4116058349609375, 0.492584228515625, 0.5735626220703125, 0.654541015625, 0.7355194091796875, 0.816497802734375, 0.8974761962890625, 0.97845458984375, 1.0594329833984375, 1.140411376953125, 1.2213897705078125, 1.3023681640625, 1.3833465576171875, 1.464324951171875, 1.5453033447265625, 1.62628173828125, 1.7072601318359375, 1.788238525390625, 1.8692169189453125, 1.9501953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 10.0, 12.0, 14.0, 37.0, 56.0, 84.0, 147.0, 250.0, 483.0, 805.0, 1347.0, 2331.0, 3829.0, 6424.0, 10481.0, 17596.0, 30680.0, 56806.0, 118067.0, 316779.0, 261425.0, 102532.0, 49978.0, 27564.0, 16236.0, 9706.0, 5966.0, 3579.0, 2140.0, 1318.0, 761.0, 426.0, 265.0, 151.0, 85.0, 62.0, 30.0, 18.0, 22.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.43085479736328125, -0.4154205322265625, -0.39998626708984375, -0.384552001953125, -0.36911773681640625, -0.3536834716796875, -0.33824920654296875, -0.32281494140625, -0.30738067626953125, -0.2919464111328125, -0.27651214599609375, -0.261077880859375, -0.24564361572265625, -0.2302093505859375, -0.21477508544921875, -0.1993408203125, -0.18390655517578125, -0.1684722900390625, -0.15303802490234375, -0.137603759765625, -0.12216949462890625, -0.1067352294921875, -0.09130096435546875, -0.07586669921875, -0.06043243408203125, -0.0449981689453125, -0.02956390380859375, -0.014129638671875, 0.00130462646484375, 0.0167388916015625, 0.03217315673828125, 0.047607421875, 0.06304168701171875, 0.0784759521484375, 0.09391021728515625, 0.109344482421875, 0.12477874755859375, 0.1402130126953125, 0.15564727783203125, 0.17108154296875, 0.18651580810546875, 0.2019500732421875, 0.21738433837890625, 0.232818603515625, 0.24825286865234375, 0.2636871337890625, 0.27912139892578125, 0.2945556640625, 0.30998992919921875, 0.3254241943359375, 0.34085845947265625, 0.356292724609375, 0.37172698974609375, 0.3871612548828125, 0.40259552001953125, 0.41802978515625, 0.43346405029296875, 0.4488983154296875, 0.46433258056640625, 0.479766845703125, 0.49520111083984375, 0.5106353759765625, 0.5260696411132812, 0.54150390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 4.0, 14.0, 17.0, 15.0, 12.0, 10.0, 17.0, 17.0, 18.0, 18.0, 29.0, 25.0, 26.0, 34.0, 37.0, 35.0, 35.0, 38.0, 47.0, 1067.0, 38.0, 46.0, 37.0, 43.0, 33.0, 43.0, 33.0, 37.0, 26.0, 29.0, 16.0, 24.0, 16.0, 14.0, 10.0, 10.0, 12.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.4453125, -1.4029998779296875, -1.360687255859375, -1.3183746337890625, -1.27606201171875, -1.2337493896484375, -1.191436767578125, -1.1491241455078125, -1.1068115234375, -1.0644989013671875, -1.022186279296875, -0.9798736572265625, -0.93756103515625, -0.8952484130859375, -0.852935791015625, -0.8106231689453125, -0.768310546875, -0.7259979248046875, -0.683685302734375, -0.6413726806640625, -0.59906005859375, -0.5567474365234375, -0.514434814453125, -0.4721221923828125, -0.4298095703125, -0.3874969482421875, -0.345184326171875, -0.3028717041015625, -0.26055908203125, -0.2182464599609375, -0.175933837890625, -0.1336212158203125, -0.09130859375, -0.0489959716796875, -0.006683349609375, 0.0356292724609375, 0.07794189453125, 0.1202545166015625, 0.162567138671875, 0.2048797607421875, 0.2471923828125, 0.2895050048828125, 0.331817626953125, 0.3741302490234375, 0.41644287109375, 0.4587554931640625, 0.501068115234375, 0.5433807373046875, 0.585693359375, 0.6280059814453125, 0.670318603515625, 0.7126312255859375, 0.75494384765625, 0.7972564697265625, 0.839569091796875, 0.8818817138671875, 0.9241943359375, 0.9665069580078125, 1.008819580078125, 1.0511322021484375, 1.09344482421875, 1.1357574462890625, 1.178070068359375, 1.2203826904296875, 1.2626953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 20.0, 23.0, 35.0, 60.0, 70.0, 105.0, 140.0, 213.0, 272.0, 441.0, 660.0, 862.0, 1267.0, 1818.0, 2627.0, 3591.0, 5277.0, 7562.0, 10803.0, 15374.0, 22404.0, 34066.0, 53037.0, 87605.0, 167943.0, 1317842.0, 141310.0, 76666.0, 47566.0, 30733.0, 20426.0, 13736.0, 9531.0, 6697.0, 4802.0, 3395.0, 2456.0, 1754.0, 1214.0, 898.0, 591.0, 397.0, 284.0, 185.0, 123.0, 94.0, 44.0, 36.0, 24.0, 19.0, 7.0, 14.0, 7.0, 9.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2978515625, -0.288360595703125, -0.27886962890625, -0.269378662109375, -0.2598876953125, -0.250396728515625, -0.24090576171875, -0.231414794921875, -0.221923828125, -0.212432861328125, -0.20294189453125, -0.193450927734375, -0.1839599609375, -0.174468994140625, -0.16497802734375, -0.155487060546875, -0.14599609375, -0.136505126953125, -0.12701416015625, -0.117523193359375, -0.1080322265625, -0.098541259765625, -0.08905029296875, -0.079559326171875, -0.070068359375, -0.060577392578125, -0.05108642578125, -0.041595458984375, -0.0321044921875, -0.022613525390625, -0.01312255859375, -0.003631591796875, 0.005859375, 0.015350341796875, 0.02484130859375, 0.034332275390625, 0.0438232421875, 0.053314208984375, 0.06280517578125, 0.072296142578125, 0.081787109375, 0.091278076171875, 0.10076904296875, 0.110260009765625, 0.1197509765625, 0.129241943359375, 0.13873291015625, 0.148223876953125, 0.15771484375, 0.167205810546875, 0.17669677734375, 0.186187744140625, 0.1956787109375, 0.205169677734375, 0.21466064453125, 0.224151611328125, 0.233642578125, 0.243133544921875, 0.25262451171875, 0.262115478515625, 0.2716064453125, 0.281097412109375, 0.29058837890625, 0.300079345703125, 0.3095703125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 12.0, 9.0, 14.0, 15.0, 24.0, 23.0, 29.0, 27.0, 40.0, 47.0, 60.0, 71.0, 85.0, 72.0, 69.0, 66.0, 65.0, 44.0, 41.0, 34.0, 33.0, 24.0, 16.0, 15.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.855892181396484e-05, -7.606390863656998e-05, -7.356889545917511e-05, -7.107388228178024e-05, -6.857886910438538e-05, -6.608385592699051e-05, -6.358884274959564e-05, -6.109382957220078e-05, -5.859881639480591e-05, -5.610380321741104e-05, -5.3608790040016174e-05, -5.111377686262131e-05, -4.861876368522644e-05, -4.6123750507831573e-05, -4.3628737330436707e-05, -4.113372415304184e-05, -3.863871097564697e-05, -3.6143697798252106e-05, -3.364868462085724e-05, -3.115367144346237e-05, -2.8658658266067505e-05, -2.6163645088672638e-05, -2.366863191127777e-05, -2.1173618733882904e-05, -1.8678605556488037e-05, -1.618359237909317e-05, -1.3688579201698303e-05, -1.1193566024303436e-05, -8.69855284690857e-06, -6.203539669513702e-06, -3.7085264921188354e-06, -1.2135133147239685e-06, 1.2814998626708984e-06, 3.7765130400657654e-06, 6.271526217460632e-06, 8.7665393948555e-06, 1.1261552572250366e-05, 1.3756565749645233e-05, 1.62515789270401e-05, 1.8746592104434967e-05, 2.1241605281829834e-05, 2.37366184592247e-05, 2.6231631636619568e-05, 2.8726644814014435e-05, 3.12216579914093e-05, 3.371667116880417e-05, 3.6211684346199036e-05, 3.87066975235939e-05, 4.120171070098877e-05, 4.3696723878383636e-05, 4.6191737055778503e-05, 4.868675023317337e-05, 5.118176341056824e-05, 5.3676776587963104e-05, 5.617178976535797e-05, 5.866680294275284e-05, 6.11618161201477e-05, 6.365682929754257e-05, 6.615184247493744e-05, 6.86468556523323e-05, 7.114186882972717e-05, 7.363688200712204e-05, 7.61318951845169e-05, 7.862690836191177e-05, 8.112192153930664e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 13.0, 13.0, 24.0, 25.0, 54.0, 64.0, 89.0, 119.0, 194.0, 315.0, 491.0, 1439.0, 476897.0, 565577.0, 1664.0, 505.0, 316.0, 218.0, 138.0, 93.0, 63.0, 40.0, 32.0, 23.0, 26.0, 21.0, 15.0, 15.0, 15.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00157928466796875, -0.001531451940536499, -0.001483619213104248, -0.001435786485671997, -0.001387953758239746, -0.0013401210308074951, -0.0012922883033752441, -0.0012444555759429932, -0.0011966228485107422, -0.0011487901210784912, -0.0011009573936462402, -0.0010531246662139893, -0.0010052919387817383, -0.0009574592113494873, -0.0009096264839172363, -0.0008617937564849854, -0.0008139610290527344, -0.0007661283016204834, -0.0007182955741882324, -0.0006704628467559814, -0.0006226301193237305, -0.0005747973918914795, -0.0005269646644592285, -0.00047913193702697754, -0.00043129920959472656, -0.0003834664821624756, -0.0003356337547302246, -0.00028780102729797363, -0.00023996829986572266, -0.00019213557243347168, -0.0001443028450012207, -9.647011756896973e-05, -4.863739013671875e-05, -8.046627044677734e-07, 4.70280647277832e-05, 9.486079216003418e-05, 0.00014269351959228516, 0.00019052624702453613, 0.0002383589744567871, 0.0002861917018890381, 0.00033402442932128906, 0.00038185715675354004, 0.000429689884185791, 0.000477522611618042, 0.000525355339050293, 0.0005731880664825439, 0.0006210207939147949, 0.0006688535213470459, 0.0007166862487792969, 0.0007645189762115479, 0.0008123517036437988, 0.0008601844310760498, 0.0009080171585083008, 0.0009558498859405518, 0.0010036826133728027, 0.0010515153408050537, 0.0010993480682373047, 0.0011471807956695557, 0.0011950135231018066, 0.0012428462505340576, 0.0012906789779663086, 0.0013385117053985596, 0.0013863444328308105, 0.0014341771602630615, 0.0014820098876953125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 35.0, 89.0, 200.0, 292.0, 227.0, 113.0, 41.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019078976765740663, -0.00018678136984817684, -0.00018277298659086227, -0.00017876458878163248, -0.0001747561909724027, -0.0001707477931631729, -0.0001667393953539431, -0.00016273101209662855, -0.00015872261428739876, -0.00015471421647816896, -0.0001507058332208544, -0.0001466974354116246, -0.00014268903760239482, -0.00013868063979316503, -0.00013467224198393524, -0.00013066385872662067, -0.00012665546091739088, -0.0001226470631081611, -0.00011863867257488891, -0.00011463028204161674, -0.00011062188423238695, -0.00010661348642315716, -0.00010260509588988498, -9.85967053566128e-05, -9.458830754738301e-05, -9.057990973815322e-05, -8.657151920488104e-05, -8.256312867160887e-05, -7.855473086237907e-05, -7.454633305314928e-05, -7.05379425198771e-05, -6.652955198660493e-05, -6.252114690141752e-05, -5.851275273016654e-05, -5.4504358558915555e-05, -5.049596438766457e-05, -4.648757021641359e-05, -4.24791760451626e-05, -3.847078187391162e-05, -3.4462387702660635e-05, -3.045399353140965e-05, -2.6445599360158667e-05, -2.2437205188907683e-05, -1.84288110176567e-05, -1.4420416846405715e-05, -1.041202267515473e-05, -6.403628503903747e-06, -2.3952343326527625e-06, 1.6131598385982215e-06, 5.621554009849206e-06, 9.62994818110019e-06, 1.3638342352351174e-05, 1.7646736523602158e-05, 2.1655130694853142e-05, 2.5663524866104126e-05, 2.967191903735511e-05, 3.3680313208606094e-05, 3.768870737985708e-05, 4.169710155110806e-05, 4.5705495722359046e-05, 4.971388989361003e-05, 5.3722284064861014e-05, 5.7730678236112e-05, 6.173907604534179e-05, 6.574746657861397e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 5.0, 8.0, 6.0, 7.0, 3.0, 23.0, 14.0, 19.0, 17.0, 21.0, 27.0, 42.0, 37.0, 32.0, 46.0, 41.0, 51.0, 52.0, 43.0, 42.0, 58.0, 47.0, 42.0, 50.0, 42.0, 39.0, 29.0, 31.0, 24.0, 13.0, 11.0, 14.0, 14.0, 11.0, 8.0, 6.0, 3.0, 6.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.8691796362400055e-05, -3.7388876080513e-05, -3.6085955798625946e-05, -3.478303551673889e-05, -3.348011523485184e-05, -3.217719495296478e-05, -3.087427467107773e-05, -2.9571354389190674e-05, -2.826843410730362e-05, -2.6965513825416565e-05, -2.566259354352951e-05, -2.4359673261642456e-05, -2.30567529797554e-05, -2.1753832697868347e-05, -2.0450912415981293e-05, -1.9147992134094238e-05, -1.7845071852207184e-05, -1.654215157032013e-05, -1.5239231288433075e-05, -1.393631100654602e-05, -1.2633390724658966e-05, -1.1330470442771912e-05, -1.0027550160884857e-05, -8.724629878997803e-06, -7.421709597110748e-06, -6.118789315223694e-06, -4.815869033336639e-06, -3.512948751449585e-06, -2.2100284695625305e-06, -9.071081876754761e-07, 3.9581209421157837e-07, 1.6987323760986328e-06, 3.0016526579856873e-06, 4.304572939872742e-06, 5.607493221759796e-06, 6.910413503646851e-06, 8.213333785533905e-06, 9.51625406742096e-06, 1.0819174349308014e-05, 1.2122094631195068e-05, 1.3425014913082123e-05, 1.4727935194969177e-05, 1.603085547685623e-05, 1.7333775758743286e-05, 1.863669604063034e-05, 1.9939616322517395e-05, 2.124253660440445e-05, 2.2545456886291504e-05, 2.384837716817856e-05, 2.5151297450065613e-05, 2.6454217731952667e-05, 2.775713801383972e-05, 2.9060058295726776e-05, 3.036297857761383e-05, 3.1665898859500885e-05, 3.296881914138794e-05, 3.4271739423274994e-05, 3.557465970516205e-05, 3.68775799870491e-05, 3.818050026893616e-05, 3.948342055082321e-05, 4.0786340832710266e-05, 4.208926111459732e-05, 4.3392181396484375e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 16.0, 14.0, 12.0, 21.0, 16.0, 25.0, 30.0, 37.0, 36.0, 42.0, 54.0, 44.0, 45.0, 50.0, 50.0, 52.0, 43.0, 41.0, 47.0, 42.0, 42.0, 39.0, 23.0, 29.0, 24.0, 10.0, 18.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.232421875, -3.1514434814453125, -3.070465087890625, -2.9894866943359375, -2.90850830078125, -2.8275299072265625, -2.746551513671875, -2.6655731201171875, -2.5845947265625, -2.5036163330078125, -2.422637939453125, -2.3416595458984375, -2.26068115234375, -2.1797027587890625, -2.098724365234375, -2.0177459716796875, -1.936767578125, -1.8557891845703125, -1.774810791015625, -1.6938323974609375, -1.61285400390625, -1.5318756103515625, -1.450897216796875, -1.3699188232421875, -1.2889404296875, -1.2079620361328125, -1.126983642578125, -1.0460052490234375, -0.96502685546875, -0.8840484619140625, -0.803070068359375, -0.7220916748046875, -0.64111328125, -0.5601348876953125, -0.479156494140625, -0.3981781005859375, -0.31719970703125, -0.2362213134765625, -0.155242919921875, -0.0742645263671875, 0.0067138671875, 0.0876922607421875, 0.168670654296875, 0.2496490478515625, 0.33062744140625, 0.4116058349609375, 0.492584228515625, 0.5735626220703125, 0.654541015625, 0.7355194091796875, 0.816497802734375, 0.8974761962890625, 0.97845458984375, 1.0594329833984375, 1.140411376953125, 1.2213897705078125, 1.3023681640625, 1.3833465576171875, 1.464324951171875, 1.5453033447265625, 1.62628173828125, 1.7072601318359375, 1.788238525390625, 1.8692169189453125, 1.9501953125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 14.0, 30.0, 33.0, 48.0, 80.0, 112.0, 169.0, 323.0, 552.0, 1048.0, 1983.0, 3668.0, 7344.0, 15553.0, 37299.0, 94567.0, 231560.0, 338505.0, 186482.0, 73900.0, 29711.0, 12659.0, 6001.0, 3053.0, 1611.0, 915.0, 484.0, 320.0, 187.0, 128.0, 70.0, 55.0, 34.0, 17.0, 15.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.1859893798828125, -2.125885009765625, -2.0657806396484375, -2.00567626953125, -1.9455718994140625, -1.885467529296875, -1.8253631591796875, -1.7652587890625, -1.7051544189453125, -1.645050048828125, -1.5849456787109375, -1.52484130859375, -1.4647369384765625, -1.404632568359375, -1.3445281982421875, -1.284423828125, -1.2243194580078125, -1.164215087890625, -1.1041107177734375, -1.04400634765625, -0.9839019775390625, -0.923797607421875, -0.8636932373046875, -0.8035888671875, -0.7434844970703125, -0.683380126953125, -0.6232757568359375, -0.56317138671875, -0.5030670166015625, -0.442962646484375, -0.3828582763671875, -0.32275390625, -0.2626495361328125, -0.202545166015625, -0.1424407958984375, -0.08233642578125, -0.0222320556640625, 0.037872314453125, 0.0979766845703125, 0.1580810546875, 0.2181854248046875, 0.278289794921875, 0.3383941650390625, 0.39849853515625, 0.4586029052734375, 0.518707275390625, 0.5788116455078125, 0.638916015625, 0.6990203857421875, 0.759124755859375, 0.8192291259765625, 0.87933349609375, 0.9394378662109375, 0.999542236328125, 1.0596466064453125, 1.1197509765625, 1.1798553466796875, 1.239959716796875, 1.3000640869140625, 1.36016845703125, 1.4202728271484375, 1.480377197265625, 1.5404815673828125, 1.6005859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 9.0, 13.0, 14.0, 12.0, 16.0, 20.0, 22.0, 37.0, 38.0, 50.0, 60.0, 48.0, 76.0, 154.0, 439.0, 1467.0, 126.0, 84.0, 74.0, 49.0, 33.0, 33.0, 30.0, 23.0, 26.0, 22.0, 17.0, 13.0, 13.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.07373046875, -9.7490234375, -9.42431640625, -9.099609375, -8.77490234375, -8.4501953125, -8.12548828125, -7.80078125, -7.47607421875, -7.1513671875, -6.82666015625, -6.501953125, -6.17724609375, -5.8525390625, -5.52783203125, -5.203125, -4.87841796875, -4.5537109375, -4.22900390625, -3.904296875, -3.57958984375, -3.2548828125, -2.93017578125, -2.60546875, -2.28076171875, -1.9560546875, -1.63134765625, -1.306640625, -0.98193359375, -0.6572265625, -0.33251953125, -0.0078125, 0.31689453125, 0.6416015625, 0.96630859375, 1.291015625, 1.61572265625, 1.9404296875, 2.26513671875, 2.58984375, 2.91455078125, 3.2392578125, 3.56396484375, 3.888671875, 4.21337890625, 4.5380859375, 4.86279296875, 5.1875, 5.51220703125, 5.8369140625, 6.16162109375, 6.486328125, 6.81103515625, 7.1357421875, 7.46044921875, 7.78515625, 8.10986328125, 8.4345703125, 8.75927734375, 9.083984375, 9.40869140625, 9.7333984375, 10.05810546875, 10.3828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 14.0, 13.0, 20.0, 21.0, 21.0, 44.0, 45.0, 41.0, 73.0, 104.0, 187.0, 314.0, 759.0, 3352.0, 96768.0, 2997886.0, 42071.0, 2407.0, 666.0, 277.0, 195.0, 103.0, 68.0, 61.0, 33.0, 30.0, 26.0, 20.0, 13.0, 14.0, 14.0, 9.0, 6.0, 5.0, 6.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4296875, -13.9552001953125, -13.480712890625, -13.0062255859375, -12.53173828125, -12.0572509765625, -11.582763671875, -11.1082763671875, -10.6337890625, -10.1593017578125, -9.684814453125, -9.2103271484375, -8.73583984375, -8.2613525390625, -7.786865234375, -7.3123779296875, -6.837890625, -6.3634033203125, -5.888916015625, -5.4144287109375, -4.93994140625, -4.4654541015625, -3.990966796875, -3.5164794921875, -3.0419921875, -2.5675048828125, -2.093017578125, -1.6185302734375, -1.14404296875, -0.6695556640625, -0.195068359375, 0.2794189453125, 0.75390625, 1.2283935546875, 1.702880859375, 2.1773681640625, 2.65185546875, 3.1263427734375, 3.600830078125, 4.0753173828125, 4.5498046875, 5.0242919921875, 5.498779296875, 5.9732666015625, 6.44775390625, 6.9222412109375, 7.396728515625, 7.8712158203125, 8.345703125, 8.8201904296875, 9.294677734375, 9.7691650390625, 10.24365234375, 10.7181396484375, 11.192626953125, 11.6671142578125, 12.1416015625, 12.6160888671875, 13.090576171875, 13.5650634765625, 14.03955078125, 14.5140380859375, 14.988525390625, 15.4630126953125, 15.9375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 15.0, 40.0, 71.0, 137.0, 185.0, 200.0, 168.0, 109.0, 51.0, 19.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6231865882873535, -5.011821269989014, -4.400455474853516, -3.789090156555176, -3.177724599838257, -2.566359043121338, -1.954993724822998, -1.3436279296875, -0.7322626113891602, -0.12089711427688599, 0.4904683828353882, 1.1018338203430176, 1.7131993770599365, 2.3245649337768555, 2.9359302520751953, 3.5472960472106934, 4.158661365509033, 4.770026683807373, 5.381392478942871, 5.992757797241211, 6.604123115539551, 7.215488910675049, 7.826854228973389, 8.438220024108887, 9.049585342407227, 9.660950660705566, 10.272315979003906, 10.883682250976562, 11.495047569274902, 12.106412887573242, 12.717778205871582, 13.329143524169922, 13.940507888793945, 14.551873207092285, 15.163238525390625, 15.774604797363281, 16.385969161987305, 16.99733543395996, 17.608699798583984, 18.22006607055664, 18.831432342529297, 19.442798614501953, 20.054162979125977, 20.665529251098633, 21.276893615722656, 21.888259887695312, 22.49962615966797, 23.110990524291992, 23.722354888916016, 24.333721160888672, 24.945085525512695, 25.55645179748535, 26.167816162109375, 26.77918243408203, 27.390548706054688, 28.00191307067871, 28.613279342651367, 29.224645614624023, 29.836009979248047, 30.447376251220703, 31.058740615844727, 31.670106887817383, 32.281471252441406, 32.89283752441406, 33.50420379638672]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 9.0, 7.0, 4.0, 4.0, 8.0, 12.0, 8.0, 14.0, 18.0, 31.0, 25.0, 21.0, 34.0, 25.0, 26.0, 30.0, 58.0, 47.0, 41.0, 38.0, 44.0, 49.0, 38.0, 37.0, 43.0, 49.0, 35.0, 33.0, 28.0, 24.0, 31.0, 14.0, 11.0, 18.0, 10.0, 16.0, 19.0, 10.0, 10.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.636640548706055, -28.737361907958984, -27.838083267211914, -26.938804626464844, -26.039527893066406, -25.140247344970703, -24.240970611572266, -23.341691970825195, -22.442413330078125, -21.543134689331055, -20.643856048583984, -19.744577407836914, -18.845298767089844, -17.946022033691406, -17.046743392944336, -16.147464752197266, -15.248186111450195, -14.348907470703125, -13.449628829956055, -12.5503511428833, -11.65107250213623, -10.75179386138916, -9.852516174316406, -8.953237533569336, -8.053958892822266, -7.154680252075195, -6.255402088165283, -5.356123924255371, -4.456845283508301, -3.5575666427612305, -2.6582884788513184, -1.7590103149414062, -0.8597335815429688, 0.03954482078552246, 0.9388232231140137, 1.8381016254425049, 2.737380027770996, 3.6366586685180664, 4.5359368324279785, 5.435214996337891, 6.334493637084961, 7.233772277832031, 8.133050918579102, 9.032328605651855, 9.931607246398926, 10.830885887145996, 11.73016357421875, 12.62944221496582, 13.52872085571289, 14.427999496459961, 15.327278137207031, 16.2265567779541, 17.125835418701172, 18.02511215209961, 18.92439079284668, 19.82366943359375, 20.72294807434082, 21.62222671508789, 22.52150535583496, 23.42078399658203, 24.32006072998047, 25.219341278076172, 26.11861801147461, 27.01789665222168, 27.91717529296875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 10.0, 10.0, 16.0, 9.0, 20.0, 15.0, 12.0, 20.0, 20.0, 23.0, 32.0, 33.0, 43.0, 35.0, 56.0, 47.0, 51.0, 50.0, 44.0, 58.0, 45.0, 44.0, 45.0, 42.0, 39.0, 35.0, 30.0, 20.0, 25.0, 16.0, 9.0, 9.0, 10.0, 12.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.52734375, -3.440399169921875, -3.35345458984375, -3.266510009765625, -3.1795654296875, -3.092620849609375, -3.00567626953125, -2.918731689453125, -2.831787109375, -2.744842529296875, -2.65789794921875, -2.570953369140625, -2.4840087890625, -2.397064208984375, -2.31011962890625, -2.223175048828125, -2.13623046875, -2.049285888671875, -1.96234130859375, -1.875396728515625, -1.7884521484375, -1.701507568359375, -1.61456298828125, -1.527618408203125, -1.440673828125, -1.353729248046875, -1.26678466796875, -1.179840087890625, -1.0928955078125, -1.005950927734375, -0.91900634765625, -0.832061767578125, -0.7451171875, -0.658172607421875, -0.57122802734375, -0.484283447265625, -0.3973388671875, -0.310394287109375, -0.22344970703125, -0.136505126953125, -0.049560546875, 0.037384033203125, 0.12432861328125, 0.211273193359375, 0.2982177734375, 0.385162353515625, 0.47210693359375, 0.559051513671875, 0.64599609375, 0.732940673828125, 0.81988525390625, 0.906829833984375, 0.9937744140625, 1.080718994140625, 1.16766357421875, 1.254608154296875, 1.341552734375, 1.428497314453125, 1.51544189453125, 1.602386474609375, 1.6893310546875, 1.776275634765625, 1.86322021484375, 1.950164794921875, 2.037109375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 8.0, 9.0, 10.0, 14.0, 10.0, 10.0, 21.0, 12.0, 27.0, 36.0, 56.0, 86.0, 115.0, 314.0, 794.0, 3004.0, 18718.0, 189584.0, 2281401.0, 1569903.0, 114078.0, 12595.0, 2273.0, 566.0, 239.0, 121.0, 73.0, 50.0, 39.0, 32.0, 13.0, 15.0, 10.0, 12.0, 8.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.1387939453125, -7.918212890625, -7.6976318359375, -7.47705078125, -7.2564697265625, -7.035888671875, -6.8153076171875, -6.5947265625, -6.3741455078125, -6.153564453125, -5.9329833984375, -5.71240234375, -5.4918212890625, -5.271240234375, -5.0506591796875, -4.830078125, -4.6094970703125, -4.388916015625, -4.1683349609375, -3.94775390625, -3.7271728515625, -3.506591796875, -3.2860107421875, -3.0654296875, -2.8448486328125, -2.624267578125, -2.4036865234375, -2.18310546875, -1.9625244140625, -1.741943359375, -1.5213623046875, -1.30078125, -1.0802001953125, -0.859619140625, -0.6390380859375, -0.41845703125, -0.1978759765625, 0.022705078125, 0.2432861328125, 0.4638671875, 0.6844482421875, 0.905029296875, 1.1256103515625, 1.34619140625, 1.5667724609375, 1.787353515625, 2.0079345703125, 2.228515625, 2.4490966796875, 2.669677734375, 2.8902587890625, 3.11083984375, 3.3314208984375, 3.552001953125, 3.7725830078125, 3.9931640625, 4.2137451171875, 4.434326171875, 4.6549072265625, 4.87548828125, 5.0960693359375, 5.316650390625, 5.5372314453125, 5.7578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 4.0, 13.0, 25.0, 28.0, 45.0, 81.0, 134.0, 216.0, 317.0, 462.0, 636.0, 633.0, 502.0, 347.0, 237.0, 149.0, 87.0, 60.0, 41.0, 17.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.6044921875, -6.318359375, -6.0322265625, -5.74609375, -5.4599609375, -5.173828125, -4.8876953125, -4.6015625, -4.3154296875, -4.029296875, -3.7431640625, -3.45703125, -3.1708984375, -2.884765625, -2.5986328125, -2.3125, -2.0263671875, -1.740234375, -1.4541015625, -1.16796875, -0.8818359375, -0.595703125, -0.3095703125, -0.0234375, 0.2626953125, 0.548828125, 0.8349609375, 1.12109375, 1.4072265625, 1.693359375, 1.9794921875, 2.265625, 2.5517578125, 2.837890625, 3.1240234375, 3.41015625, 3.6962890625, 3.982421875, 4.2685546875, 4.5546875, 4.8408203125, 5.126953125, 5.4130859375, 5.69921875, 5.9853515625, 6.271484375, 6.5576171875, 6.84375, 7.1298828125, 7.416015625, 7.7021484375, 7.98828125, 8.2744140625, 8.560546875, 8.8466796875, 9.1328125, 9.4189453125, 9.705078125, 9.9912109375, 10.27734375, 10.5634765625, 10.849609375, 11.1357421875, 11.421875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 9.0, 19.0, 21.0, 28.0, 53.0, 71.0, 131.0, 205.0, 349.0, 800.0, 3643.0, 119067.0, 3885003.0, 178717.0, 4426.0, 821.0, 371.0, 178.0, 121.0, 72.0, 51.0, 43.0, 26.0, 17.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.23583984375, -23.5341796875, -22.83251953125, -22.130859375, -21.42919921875, -20.7275390625, -20.02587890625, -19.32421875, -18.62255859375, -17.9208984375, -17.21923828125, -16.517578125, -15.81591796875, -15.1142578125, -14.41259765625, -13.7109375, -13.00927734375, -12.3076171875, -11.60595703125, -10.904296875, -10.20263671875, -9.5009765625, -8.79931640625, -8.09765625, -7.39599609375, -6.6943359375, -5.99267578125, -5.291015625, -4.58935546875, -3.8876953125, -3.18603515625, -2.484375, -1.78271484375, -1.0810546875, -0.37939453125, 0.322265625, 1.02392578125, 1.7255859375, 2.42724609375, 3.12890625, 3.83056640625, 4.5322265625, 5.23388671875, 5.935546875, 6.63720703125, 7.3388671875, 8.04052734375, 8.7421875, 9.44384765625, 10.1455078125, 10.84716796875, 11.548828125, 12.25048828125, 12.9521484375, 13.65380859375, 14.35546875, 15.05712890625, 15.7587890625, 16.46044921875, 17.162109375, 17.86376953125, 18.5654296875, 19.26708984375, 19.96875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 50.0, 143.0, 312.0, 282.0, 162.0, 44.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.97673034667969, -57.36958312988281, -54.76243591308594, -52.15528869628906, -49.54814529418945, -46.94099807739258, -44.3338508605957, -41.726707458496094, -39.11956024169922, -36.512413024902344, -33.90526580810547, -31.298120498657227, -28.690975189208984, -26.08382797241211, -23.476680755615234, -20.869535446166992, -18.262386322021484, -15.655240058898926, -13.048093795776367, -10.440946578979492, -7.833800315856934, -5.226654052734375, -2.6195068359375, -0.012361526489257812, 2.594785690307617, 5.201931953430176, 7.809078693389893, 10.41622543334961, 13.023371696472168, 15.630517959594727, 18.2376651763916, 20.844810485839844, 23.45195770263672, 26.059104919433594, 28.666250228881836, 31.27339744567871, 33.88054275512695, 36.48768997192383, 39.0948371887207, 41.70198059082031, 44.30912780761719, 46.91627502441406, 49.52342224121094, 52.13056945800781, 54.73771286010742, 57.3448600769043, 59.95200729370117, 62.55915069580078, 65.16630554199219, 67.77345275878906, 70.38059997558594, 72.98774719238281, 75.59489440917969, 78.20204162597656, 80.80918884277344, 83.41632843017578, 86.02347564697266, 88.63062286376953, 91.2377700805664, 93.84491729736328, 96.45206451416016, 99.0592041015625, 101.66635131835938, 104.27349853515625, 106.88064575195312]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 0.0, 4.0, 10.0, 11.0, 12.0, 19.0, 16.0, 11.0, 22.0, 17.0, 21.0, 19.0, 20.0, 39.0, 41.0, 43.0, 36.0, 36.0, 31.0, 39.0, 42.0, 36.0, 29.0, 33.0, 41.0, 30.0, 47.0, 34.0, 29.0, 23.0, 28.0, 29.0, 26.0, 21.0, 16.0, 15.0, 13.0, 10.0, 4.0, 10.0, 12.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.96520233154297, -20.3347225189209, -19.704240798950195, -19.073760986328125, -18.443281173706055, -17.812801361083984, -17.18231964111328, -16.55183982849121, -15.921359062194824, -15.290878295898438, -14.660398483276367, -14.02991771697998, -13.399436950683594, -12.768957138061523, -12.138476371765137, -11.50799560546875, -10.87751579284668, -10.247035026550293, -9.616555213928223, -8.986074447631836, -8.355594635009766, -7.725113868713379, -7.094633102416992, -6.464152812957764, -5.833672523498535, -5.203192234039307, -4.572711944580078, -3.9422311782836914, -3.311750888824463, -2.6812705993652344, -2.0507900714874268, -1.4203095436096191, -0.7898292541503906, -0.15934884548187256, 0.4711315631866455, 1.1016119718551636, 1.7320923805236816, 2.36257266998291, 2.9930531978607178, 3.6235337257385254, 4.254014015197754, 4.884494304656982, 5.514974594116211, 6.145455360412598, 6.775935649871826, 7.406415939331055, 8.036896705627441, 8.667377471923828, 9.297857284545898, 9.928338050842285, 10.558817863464355, 11.189298629760742, 11.819778442382812, 12.4502592086792, 13.080739974975586, 13.711219787597656, 14.341700553894043, 14.97218132019043, 15.6026611328125, 16.23314094543457, 16.863622665405273, 17.494102478027344, 18.124582290649414, 18.755064010620117, 19.385543823242188]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 13.0, 20.0, 26.0, 24.0, 32.0, 37.0, 37.0, 33.0, 53.0, 50.0, 55.0, 55.0, 51.0, 45.0, 55.0, 55.0, 41.0, 36.0, 33.0, 36.0, 18.0, 29.0, 24.0, 14.0, 15.0, 11.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.4552001953125, -3.363525390625, -3.2718505859375, -3.18017578125, -3.0885009765625, -2.996826171875, -2.9051513671875, -2.8134765625, -2.7218017578125, -2.630126953125, -2.5384521484375, -2.44677734375, -2.3551025390625, -2.263427734375, -2.1717529296875, -2.080078125, -1.9884033203125, -1.896728515625, -1.8050537109375, -1.71337890625, -1.6217041015625, -1.530029296875, -1.4383544921875, -1.3466796875, -1.2550048828125, -1.163330078125, -1.0716552734375, -0.97998046875, -0.8883056640625, -0.796630859375, -0.7049560546875, -0.61328125, -0.5216064453125, -0.429931640625, -0.3382568359375, -0.24658203125, -0.1549072265625, -0.063232421875, 0.0284423828125, 0.1201171875, 0.2117919921875, 0.303466796875, 0.3951416015625, 0.48681640625, 0.5784912109375, 0.670166015625, 0.7618408203125, 0.853515625, 0.9451904296875, 1.036865234375, 1.1285400390625, 1.22021484375, 1.3118896484375, 1.403564453125, 1.4952392578125, 1.5869140625, 1.6785888671875, 1.770263671875, 1.8619384765625, 1.95361328125, 2.0452880859375, 2.136962890625, 2.2286376953125, 2.3203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 14.0, 17.0, 26.0, 41.0, 74.0, 101.0, 165.0, 290.0, 421.0, 763.0, 1257.0, 2105.0, 3448.0, 5817.0, 9934.0, 16766.0, 29955.0, 56664.0, 117734.0, 313142.0, 265863.0, 106161.0, 51585.0, 27820.0, 15837.0, 8979.0, 5376.0, 3265.0, 2004.0, 1127.0, 707.0, 436.0, 238.0, 148.0, 88.0, 58.0, 36.0, 24.0, 17.0, 14.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5673828125, -0.5496139526367188, -0.5318450927734375, -0.5140762329101562, -0.496307373046875, -0.47853851318359375, -0.4607696533203125, -0.44300079345703125, -0.42523193359375, -0.40746307373046875, -0.3896942138671875, -0.37192535400390625, -0.354156494140625, -0.33638763427734375, -0.3186187744140625, -0.30084991455078125, -0.2830810546875, -0.26531219482421875, -0.2475433349609375, -0.22977447509765625, -0.212005615234375, -0.19423675537109375, -0.1764678955078125, -0.15869903564453125, -0.14093017578125, -0.12316131591796875, -0.1053924560546875, -0.08762359619140625, -0.069854736328125, -0.05208587646484375, -0.0343170166015625, -0.01654815673828125, 0.001220703125, 0.01898956298828125, 0.0367584228515625, 0.05452728271484375, 0.072296142578125, 0.09006500244140625, 0.1078338623046875, 0.12560272216796875, 0.14337158203125, 0.16114044189453125, 0.1789093017578125, 0.19667816162109375, 0.214447021484375, 0.23221588134765625, 0.2499847412109375, 0.26775360107421875, 0.2855224609375, 0.30329132080078125, 0.3210601806640625, 0.33882904052734375, 0.356597900390625, 0.37436676025390625, 0.3921356201171875, 0.40990447998046875, 0.42767333984375, 0.44544219970703125, 0.4632110595703125, 0.48097991943359375, 0.498748779296875, 0.5165176391601562, 0.5342864990234375, 0.5520553588867188, 0.56982421875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 8.0, 2.0, 2.0, 3.0, 10.0, 15.0, 9.0, 9.0, 15.0, 14.0, 24.0, 23.0, 26.0, 28.0, 19.0, 26.0, 31.0, 47.0, 37.0, 48.0, 43.0, 43.0, 1055.0, 44.0, 37.0, 32.0, 35.0, 43.0, 29.0, 38.0, 29.0, 30.0, 31.0, 20.0, 19.0, 18.0, 26.0, 15.0, 5.0, 9.0, 4.0, 6.0, 2.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4229278564453125, -1.375152587890625, -1.3273773193359375, -1.27960205078125, -1.2318267822265625, -1.184051513671875, -1.1362762451171875, -1.0885009765625, -1.0407257080078125, -0.992950439453125, -0.9451751708984375, -0.89739990234375, -0.8496246337890625, -0.801849365234375, -0.7540740966796875, -0.706298828125, -0.6585235595703125, -0.610748291015625, -0.5629730224609375, -0.51519775390625, -0.4674224853515625, -0.419647216796875, -0.3718719482421875, -0.3240966796875, -0.2763214111328125, -0.228546142578125, -0.1807708740234375, -0.13299560546875, -0.0852203369140625, -0.037445068359375, 0.0103302001953125, 0.05810546875, 0.1058807373046875, 0.153656005859375, 0.2014312744140625, 0.24920654296875, 0.2969818115234375, 0.344757080078125, 0.3925323486328125, 0.4403076171875, 0.4880828857421875, 0.535858154296875, 0.5836334228515625, 0.63140869140625, 0.6791839599609375, 0.726959228515625, 0.7747344970703125, 0.822509765625, 0.8702850341796875, 0.918060302734375, 0.9658355712890625, 1.01361083984375, 1.0613861083984375, 1.109161376953125, 1.1569366455078125, 1.2047119140625, 1.2524871826171875, 1.300262451171875, 1.3480377197265625, 1.39581298828125, 1.4435882568359375, 1.491363525390625, 1.5391387939453125, 1.5869140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 19.0, 16.0, 20.0, 42.0, 61.0, 98.0, 119.0, 168.0, 271.0, 347.0, 498.0, 667.0, 980.0, 1314.0, 1971.0, 2782.0, 3946.0, 5708.0, 8182.0, 12009.0, 17587.0, 25895.0, 39375.0, 62290.0, 107691.0, 217972.0, 1280980.0, 114065.0, 65832.0, 41027.0, 26663.0, 17942.0, 12212.0, 8565.0, 5910.0, 4172.0, 2856.0, 2048.0, 1398.0, 1055.0, 743.0, 488.0, 331.0, 236.0, 192.0, 113.0, 90.0, 70.0, 40.0, 34.0, 18.0, 15.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.34423828125, -0.33349609375, -0.32275390625, -0.31201171875, -0.30126953125, -0.29052734375, -0.27978515625, -0.26904296875, -0.25830078125, -0.24755859375, -0.23681640625, -0.22607421875, -0.21533203125, -0.20458984375, -0.19384765625, -0.18310546875, -0.17236328125, -0.16162109375, -0.15087890625, -0.14013671875, -0.12939453125, -0.11865234375, -0.10791015625, -0.09716796875, -0.08642578125, -0.07568359375, -0.06494140625, -0.05419921875, -0.04345703125, -0.03271484375, -0.02197265625, -0.01123046875, -0.00048828125, 0.01025390625, 0.02099609375, 0.03173828125, 0.04248046875, 0.05322265625, 0.06396484375, 0.07470703125, 0.08544921875, 0.09619140625, 0.10693359375, 0.11767578125, 0.12841796875, 0.13916015625, 0.14990234375, 0.16064453125, 0.17138671875, 0.18212890625, 0.19287109375, 0.20361328125, 0.21435546875, 0.22509765625, 0.23583984375, 0.24658203125, 0.25732421875, 0.26806640625, 0.27880859375, 0.28955078125, 0.30029296875, 0.31103515625, 0.32177734375, 0.33251953125, 0.34326171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 7.0, 5.0, 7.0, 4.0, 17.0, 14.0, 35.0, 37.0, 44.0, 53.0, 40.0, 56.0, 86.0, 93.0, 82.0, 69.0, 59.0, 58.0, 55.0, 32.0, 28.0, 23.0, 20.0, 10.0, 12.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.0001193443313241005, -0.00011566467583179474, -0.00011198502033948898, -0.00010830536484718323, -0.00010462570935487747, -0.00010094605386257172, -9.726639837026596e-05, -9.35867428779602e-05, -8.990708738565445e-05, -8.62274318933487e-05, -8.254777640104294e-05, -7.886812090873718e-05, -7.518846541643143e-05, -7.150880992412567e-05, -6.782915443181992e-05, -6.414949893951416e-05, -6.0469843447208405e-05, -5.679018795490265e-05, -5.311053246259689e-05, -4.943087697029114e-05, -4.575122147798538e-05, -4.2071565985679626e-05, -3.839191049337387e-05, -3.4712255001068115e-05, -3.103259950876236e-05, -2.7352944016456604e-05, -2.367328852415085e-05, -1.9993633031845093e-05, -1.6313977539539337e-05, -1.2634322047233582e-05, -8.954666554927826e-06, -5.27501106262207e-06, -1.5953555703163147e-06, 2.084299921989441e-06, 5.7639554142951965e-06, 9.443610906600952e-06, 1.3123266398906708e-05, 1.6802921891212463e-05, 2.048257738351822e-05, 2.4162232875823975e-05, 2.784188836812973e-05, 3.1521543860435486e-05, 3.520119935274124e-05, 3.8880854845047e-05, 4.256051033735275e-05, 4.624016582965851e-05, 4.9919821321964264e-05, 5.359947681427002e-05, 5.7279132306575775e-05, 6.095878779888153e-05, 6.463844329118729e-05, 6.831809878349304e-05, 7.19977542757988e-05, 7.567740976810455e-05, 7.935706526041031e-05, 8.303672075271606e-05, 8.671637624502182e-05, 9.039603173732758e-05, 9.407568722963333e-05, 9.775534272193909e-05, 0.00010143499821424484, 0.0001051146537065506, 0.00010879430919885635, 0.00011247396469116211]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 8.0, 16.0, 14.0, 25.0, 34.0, 51.0, 77.0, 98.0, 170.0, 268.0, 490.0, 1442.0, 883484.0, 160292.0, 955.0, 426.0, 237.0, 151.0, 112.0, 54.0, 35.0, 32.0, 20.0, 13.0, 9.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0021686553955078125, -0.0020935535430908203, -0.002018451690673828, -0.001943349838256836, -0.0018682479858398438, -0.0017931461334228516, -0.0017180442810058594, -0.0016429424285888672, -0.001567840576171875, -0.0014927387237548828, -0.0014176368713378906, -0.0013425350189208984, -0.0012674331665039062, -0.001192331314086914, -0.0011172294616699219, -0.0010421276092529297, -0.0009670257568359375, -0.0008919239044189453, -0.0008168220520019531, -0.0007417201995849609, -0.0006666183471679688, -0.0005915164947509766, -0.0005164146423339844, -0.0004413127899169922, -0.0003662109375, -0.0002911090850830078, -0.00021600723266601562, -0.00014090538024902344, -6.580352783203125e-05, 9.298324584960938e-06, 8.440017700195312e-05, 0.0001595020294189453, 0.0002346038818359375, 0.0003097057342529297, 0.0003848075866699219, 0.00045990943908691406, 0.0005350112915039062, 0.0006101131439208984, 0.0006852149963378906, 0.0007603168487548828, 0.000835418701171875, 0.0009105205535888672, 0.0009856224060058594, 0.0010607242584228516, 0.0011358261108398438, 0.001210927963256836, 0.0012860298156738281, 0.0013611316680908203, 0.0014362335205078125, 0.0015113353729248047, 0.0015864372253417969, 0.001661539077758789, 0.0017366409301757812, 0.0018117427825927734, 0.0018868446350097656, 0.001961946487426758, 0.00203704833984375, 0.002112150192260742, 0.0021872520446777344, 0.0022623538970947266, 0.0023374557495117188, 0.002412557601928711, 0.002487659454345703, 0.0025627613067626953, 0.0026378631591796875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 10.0, 74.0, 178.0, 319.0, 252.0, 126.0, 42.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002227829972980544, -0.00021745401318185031, -0.00021212502906564623, -0.00020679604494944215, -0.00020146706083323807, -0.00019613807671703398, -0.00019080910715274513, -0.00018548010848462582, -0.00018015113892033696, -0.00017482215480413288, -0.0001694931706879288, -0.0001641641865717247, -0.00015883520245552063, -0.00015350621833931655, -0.00014817723422311246, -0.0001428482646588236, -0.0001375192659907043, -0.00013219028187450022, -0.00012686129775829613, -0.00012153231364209205, -0.00011620332952588797, -0.00011087434540968388, -0.00010554536856943741, -0.00010021638445323333, -9.488740033702925e-05, -8.955841622082517e-05, -8.422943210462108e-05, -7.890045526437461e-05, -7.357147114817053e-05, -6.824248703196645e-05, -6.291350291576236e-05, -5.758451879955828e-05, -5.22555346833542e-05, -4.6926550567150116e-05, -4.159756645094603e-05, -3.626858597272076e-05, -3.0939601856516674e-05, -2.561061774031259e-05, -2.0281637262087315e-05, -1.4952653145883232e-05, -9.62366902967915e-06, -4.294685822969768e-06, 1.034297383739613e-06, 6.363279680954292e-06, 1.1692263797158375e-05, 1.702124791336246e-05, 2.2350228391587734e-05, 2.7679212507791817e-05, 3.30081966239959e-05, 3.833718074019998e-05, 4.3666164856404066e-05, 4.899514533462934e-05, 5.4324129450833425e-05, 5.965311356703751e-05, 6.498209404526278e-05, 7.031107816146687e-05, 7.564006227767095e-05, 8.096904639387503e-05, 8.629803051007912e-05, 9.162700735032558e-05, 9.695599146652967e-05, 0.00010228497558273375, 0.00010761395969893783, 0.00011294294381514192, 0.000118271927931346]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 8.0, 13.0, 9.0, 11.0, 13.0, 25.0, 17.0, 17.0, 24.0, 22.0, 30.0, 31.0, 42.0, 39.0, 50.0, 33.0, 39.0, 55.0, 39.0, 44.0, 49.0, 37.0, 29.0, 38.0, 34.0, 32.0, 26.0, 38.0, 31.0, 19.0, 11.0, 19.0, 15.0, 10.0, 12.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.710124969482422e-05, -5.5429525673389435e-05, -5.375780165195465e-05, -5.208607763051987e-05, -5.041435360908508e-05, -4.87426295876503e-05, -4.7070905566215515e-05, -4.539918154478073e-05, -4.372745752334595e-05, -4.205573350191116e-05, -4.038400948047638e-05, -3.8712285459041595e-05, -3.704056143760681e-05, -3.536883741617203e-05, -3.3697113394737244e-05, -3.202538937330246e-05, -3.0353665351867676e-05, -2.8681941330432892e-05, -2.7010217308998108e-05, -2.5338493287563324e-05, -2.366676926612854e-05, -2.1995045244693756e-05, -2.0323321223258972e-05, -1.8651597201824188e-05, -1.6979873180389404e-05, -1.530814915895462e-05, -1.3636425137519836e-05, -1.1964701116085052e-05, -1.0292977094650269e-05, -8.621253073215485e-06, -6.949529051780701e-06, -5.277805030345917e-06, -3.606081008911133e-06, -1.934356987476349e-06, -2.6263296604156494e-07, 1.409091055393219e-06, 3.080815076828003e-06, 4.752539098262787e-06, 6.424263119697571e-06, 8.095987141132355e-06, 9.767711162567139e-06, 1.1439435184001923e-05, 1.3111159205436707e-05, 1.478288322687149e-05, 1.6454607248306274e-05, 1.812633126974106e-05, 1.9798055291175842e-05, 2.1469779312610626e-05, 2.314150333404541e-05, 2.4813227355480194e-05, 2.6484951376914978e-05, 2.8156675398349762e-05, 2.9828399419784546e-05, 3.150012344121933e-05, 3.3171847462654114e-05, 3.48435714840889e-05, 3.651529550552368e-05, 3.8187019526958466e-05, 3.985874354839325e-05, 4.1530467569828033e-05, 4.320219159126282e-05, 4.48739156126976e-05, 4.6545639634132385e-05, 4.821736365556717e-05, 4.988908767700195e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 13.0, 20.0, 26.0, 24.0, 32.0, 37.0, 37.0, 33.0, 53.0, 50.0, 55.0, 55.0, 51.0, 45.0, 55.0, 55.0, 41.0, 36.0, 33.0, 36.0, 18.0, 29.0, 24.0, 14.0, 15.0, 11.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.4552001953125, -3.363525390625, -3.2718505859375, -3.18017578125, -3.0885009765625, -2.996826171875, -2.9051513671875, -2.8134765625, -2.7218017578125, -2.630126953125, -2.5384521484375, -2.44677734375, -2.3551025390625, -2.263427734375, -2.1717529296875, -2.080078125, -1.9884033203125, -1.896728515625, -1.8050537109375, -1.71337890625, -1.6217041015625, -1.530029296875, -1.4383544921875, -1.3466796875, -1.2550048828125, -1.163330078125, -1.0716552734375, -0.97998046875, -0.8883056640625, -0.796630859375, -0.7049560546875, -0.61328125, -0.5216064453125, -0.429931640625, -0.3382568359375, -0.24658203125, -0.1549072265625, -0.063232421875, 0.0284423828125, 0.1201171875, 0.2117919921875, 0.303466796875, 0.3951416015625, 0.48681640625, 0.5784912109375, 0.670166015625, 0.7618408203125, 0.853515625, 0.9451904296875, 1.036865234375, 1.1285400390625, 1.22021484375, 1.3118896484375, 1.403564453125, 1.4952392578125, 1.5869140625, 1.6785888671875, 1.770263671875, 1.8619384765625, 1.95361328125, 2.0452880859375, 2.136962890625, 2.2286376953125, 2.3203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 14.0, 14.0, 16.0, 23.0, 26.0, 50.0, 64.0, 71.0, 168.0, 256.0, 415.0, 793.0, 1380.0, 2698.0, 5352.0, 11418.0, 29065.0, 97757.0, 481515.0, 308960.0, 68181.0, 21553.0, 9296.0, 4360.0, 2244.0, 1162.0, 629.0, 383.0, 210.0, 162.0, 99.0, 67.0, 44.0, 29.0, 32.0, 14.0, 9.0, 8.0, 6.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.13653564453125, -3.0152587890625, -2.89398193359375, -2.772705078125, -2.65142822265625, -2.5301513671875, -2.40887451171875, -2.28759765625, -2.16632080078125, -2.0450439453125, -1.92376708984375, -1.802490234375, -1.68121337890625, -1.5599365234375, -1.43865966796875, -1.3173828125, -1.19610595703125, -1.0748291015625, -0.95355224609375, -0.832275390625, -0.71099853515625, -0.5897216796875, -0.46844482421875, -0.34716796875, -0.22589111328125, -0.1046142578125, 0.01666259765625, 0.137939453125, 0.25921630859375, 0.3804931640625, 0.50177001953125, 0.623046875, 0.74432373046875, 0.8656005859375, 0.98687744140625, 1.108154296875, 1.22943115234375, 1.3507080078125, 1.47198486328125, 1.59326171875, 1.71453857421875, 1.8358154296875, 1.95709228515625, 2.078369140625, 2.19964599609375, 2.3209228515625, 2.44219970703125, 2.5634765625, 2.68475341796875, 2.8060302734375, 2.92730712890625, 3.048583984375, 3.16986083984375, 3.2911376953125, 3.41241455078125, 3.53369140625, 3.65496826171875, 3.7762451171875, 3.89752197265625, 4.018798828125, 4.14007568359375, 4.2613525390625, 4.38262939453125, 4.50390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 1.0, 5.0, 8.0, 10.0, 7.0, 11.0, 15.0, 24.0, 18.0, 35.0, 28.0, 38.0, 44.0, 47.0, 61.0, 63.0, 94.0, 201.0, 1590.0, 201.0, 91.0, 64.0, 64.0, 47.0, 50.0, 38.0, 35.0, 25.0, 20.0, 27.0, 13.0, 21.0, 7.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.9923095703125, -8.687744140625, -8.3831787109375, -8.07861328125, -7.7740478515625, -7.469482421875, -7.1649169921875, -6.8603515625, -6.5557861328125, -6.251220703125, -5.9466552734375, -5.64208984375, -5.3375244140625, -5.032958984375, -4.7283935546875, -4.423828125, -4.1192626953125, -3.814697265625, -3.5101318359375, -3.20556640625, -2.9010009765625, -2.596435546875, -2.2918701171875, -1.9873046875, -1.6827392578125, -1.378173828125, -1.0736083984375, -0.76904296875, -0.4644775390625, -0.159912109375, 0.1446533203125, 0.44921875, 0.7537841796875, 1.058349609375, 1.3629150390625, 1.66748046875, 1.9720458984375, 2.276611328125, 2.5811767578125, 2.8857421875, 3.1903076171875, 3.494873046875, 3.7994384765625, 4.10400390625, 4.4085693359375, 4.713134765625, 5.0177001953125, 5.322265625, 5.6268310546875, 5.931396484375, 6.2359619140625, 6.54052734375, 6.8450927734375, 7.149658203125, 7.4542236328125, 7.7587890625, 8.0633544921875, 8.367919921875, 8.6724853515625, 8.97705078125, 9.2816162109375, 9.586181640625, 9.8907470703125, 10.1953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 13.0, 9.0, 6.0, 12.0, 27.0, 33.0, 41.0, 66.0, 90.0, 146.0, 268.0, 537.0, 2887.0, 386636.0, 2748022.0, 5382.0, 697.0, 288.0, 188.0, 111.0, 59.0, 46.0, 42.0, 17.0, 19.0, 12.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.890625, -29.01416015625, -28.1376953125, -27.26123046875, -26.384765625, -25.50830078125, -24.6318359375, -23.75537109375, -22.87890625, -22.00244140625, -21.1259765625, -20.24951171875, -19.373046875, -18.49658203125, -17.6201171875, -16.74365234375, -15.8671875, -14.99072265625, -14.1142578125, -13.23779296875, -12.361328125, -11.48486328125, -10.6083984375, -9.73193359375, -8.85546875, -7.97900390625, -7.1025390625, -6.22607421875, -5.349609375, -4.47314453125, -3.5966796875, -2.72021484375, -1.84375, -0.96728515625, -0.0908203125, 0.78564453125, 1.662109375, 2.53857421875, 3.4150390625, 4.29150390625, 5.16796875, 6.04443359375, 6.9208984375, 7.79736328125, 8.673828125, 9.55029296875, 10.4267578125, 11.30322265625, 12.1796875, 13.05615234375, 13.9326171875, 14.80908203125, 15.685546875, 16.56201171875, 17.4384765625, 18.31494140625, 19.19140625, 20.06787109375, 20.9443359375, 21.82080078125, 22.697265625, 23.57373046875, 24.4501953125, 25.32666015625, 26.203125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 15.0, 23.0, 33.0, 50.0, 79.0, 98.0, 114.0, 141.0, 112.0, 92.0, 91.0, 53.0, 43.0, 25.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.73713207244873, -9.322479248046875, -8.907827377319336, -8.49317455291748, -8.078522682189941, -7.663869857788086, -7.249217510223389, -6.834565162658691, -6.419912815093994, -6.005260467529297, -5.5906081199646, -5.175955772399902, -4.761302947998047, -4.346651077270508, -3.9319982528686523, -3.517345905303955, -3.102693557739258, -2.6880412101745605, -2.2733888626098633, -1.858736276626587, -1.4440839290618896, -1.0294315814971924, -0.614778995513916, -0.20012664794921875, 0.21452569961547852, 0.6291781067848206, 1.0438305139541626, 1.4584829807281494, 1.8731353282928467, 2.287787675857544, 2.7024402618408203, 3.1170926094055176, 3.5317459106445312, 3.9463982582092285, 4.361050605773926, 4.775703430175781, 5.19035530090332, 5.605008125305176, 6.019660472869873, 6.43431282043457, 6.848965167999268, 7.263617515563965, 7.678269863128662, 8.09292221069336, 8.507575035095215, 8.922226905822754, 9.33687973022461, 9.751531600952148, 10.166184425354004, 10.58083724975586, 10.995489120483398, 11.410141944885254, 11.824793815612793, 12.239446640014648, 12.654098510742188, 13.068751335144043, 13.483404159545898, 13.898056983947754, 14.312708854675293, 14.727361679077148, 15.142013549804688, 15.556666374206543, 15.971319198608398, 16.385971069335938, 16.800622940063477]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 0.0, 3.0, 5.0, 3.0, 3.0, 9.0, 13.0, 10.0, 9.0, 16.0, 20.0, 16.0, 18.0, 25.0, 41.0, 31.0, 23.0, 27.0, 46.0, 34.0, 45.0, 56.0, 49.0, 42.0, 46.0, 42.0, 47.0, 36.0, 34.0, 36.0, 28.0, 28.0, 20.0, 23.0, 15.0, 20.0, 15.0, 14.0, 13.0, 11.0, 11.0, 8.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.16049575805664, -27.354175567626953, -26.5478572845459, -25.74153709411621, -24.935216903686523, -24.12889862060547, -23.32257843017578, -22.516258239746094, -21.709938049316406, -20.90361785888672, -20.097299575805664, -19.290979385375977, -18.48465919494629, -17.678340911865234, -16.872020721435547, -16.06570053100586, -15.259382247924805, -14.453063011169434, -13.646742820739746, -12.840423583984375, -12.034103393554688, -11.227784156799316, -10.421464920043945, -9.615144729614258, -8.808825492858887, -8.002506256103516, -7.196186065673828, -6.389866828918457, -5.583547115325928, -4.777227401733398, -3.9709081649780273, -3.164588451385498, -2.358266830444336, -1.5519472360610962, -0.7456276416778564, 0.06069183349609375, 0.867011547088623, 1.6733312606811523, 2.4796504974365234, 3.2859702110290527, 4.092289924621582, 4.898609638214111, 5.704929351806641, 6.511248588562012, 7.317568302154541, 8.12388801574707, 8.930207252502441, 9.736526489257812, 10.5428466796875, 11.349165916442871, 12.155486106872559, 12.96180534362793, 13.768125534057617, 14.574444770812988, 15.38076400756836, 16.187084197998047, 16.993404388427734, 17.799724578857422, 18.606042861938477, 19.412363052368164, 20.21868324279785, 21.025001525878906, 21.831321716308594, 22.63764190673828, 23.443960189819336]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 8.0, 14.0, 14.0, 17.0, 19.0, 19.0, 19.0, 32.0, 28.0, 24.0, 37.0, 52.0, 44.0, 47.0, 49.0, 53.0, 42.0, 51.0, 40.0, 52.0, 47.0, 41.0, 34.0, 24.0, 35.0, 29.0, 18.0, 19.0, 18.0, 15.0, 9.0, 11.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.52734375, -3.4345703125, -3.341796875, -3.2490234375, -3.15625, -3.0634765625, -2.970703125, -2.8779296875, -2.78515625, -2.6923828125, -2.599609375, -2.5068359375, -2.4140625, -2.3212890625, -2.228515625, -2.1357421875, -2.04296875, -1.9501953125, -1.857421875, -1.7646484375, -1.671875, -1.5791015625, -1.486328125, -1.3935546875, -1.30078125, -1.2080078125, -1.115234375, -1.0224609375, -0.9296875, -0.8369140625, -0.744140625, -0.6513671875, -0.55859375, -0.4658203125, -0.373046875, -0.2802734375, -0.1875, -0.0947265625, -0.001953125, 0.0908203125, 0.18359375, 0.2763671875, 0.369140625, 0.4619140625, 0.5546875, 0.6474609375, 0.740234375, 0.8330078125, 0.92578125, 1.0185546875, 1.111328125, 1.2041015625, 1.296875, 1.3896484375, 1.482421875, 1.5751953125, 1.66796875, 1.7607421875, 1.853515625, 1.9462890625, 2.0390625, 2.1318359375, 2.224609375, 2.3173828125, 2.41015625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 4.0, 10.0, 13.0, 15.0, 22.0, 36.0, 39.0, 49.0, 75.0, 105.0, 138.0, 245.0, 378.0, 608.0, 1175.0, 2280.0, 5060.0, 11889.0, 31186.0, 91513.0, 300274.0, 880384.0, 1434242.0, 934082.0, 337108.0, 104542.0, 34983.0, 13094.0, 5404.0, 2450.0, 1202.0, 596.0, 332.0, 211.0, 143.0, 97.0, 89.0, 58.0, 43.0, 26.0, 16.0, 18.0, 10.0, 9.0, 10.0, 2.0, 6.0, 5.0, 1.0, 2.0], "bins": [-3.470703125, -3.375732421875, -3.28076171875, -3.185791015625, -3.0908203125, -2.995849609375, -2.90087890625, -2.805908203125, -2.7109375, -2.615966796875, -2.52099609375, -2.426025390625, -2.3310546875, -2.236083984375, -2.14111328125, -2.046142578125, -1.951171875, -1.856201171875, -1.76123046875, -1.666259765625, -1.5712890625, -1.476318359375, -1.38134765625, -1.286376953125, -1.19140625, -1.096435546875, -1.00146484375, -0.906494140625, -0.8115234375, -0.716552734375, -0.62158203125, -0.526611328125, -0.431640625, -0.336669921875, -0.24169921875, -0.146728515625, -0.0517578125, 0.043212890625, 0.13818359375, 0.233154296875, 0.328125, 0.423095703125, 0.51806640625, 0.613037109375, 0.7080078125, 0.802978515625, 0.89794921875, 0.992919921875, 1.087890625, 1.182861328125, 1.27783203125, 1.372802734375, 1.4677734375, 1.562744140625, 1.65771484375, 1.752685546875, 1.84765625, 1.942626953125, 2.03759765625, 2.132568359375, 2.2275390625, 2.322509765625, 2.41748046875, 2.512451171875, 2.607421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 23.0, 32.0, 57.0, 72.0, 115.0, 186.0, 282.0, 388.0, 511.0, 633.0, 591.0, 381.0, 259.0, 179.0, 139.0, 81.0, 43.0, 33.0, 25.0, 8.0, 10.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.53961181640625, -10.2589111328125, -9.97821044921875, -9.697509765625, -9.41680908203125, -9.1361083984375, -8.85540771484375, -8.57470703125, -8.29400634765625, -8.0133056640625, -7.73260498046875, -7.451904296875, -7.17120361328125, -6.8905029296875, -6.60980224609375, -6.3291015625, -6.04840087890625, -5.7677001953125, -5.48699951171875, -5.206298828125, -4.92559814453125, -4.6448974609375, -4.36419677734375, -4.08349609375, -3.80279541015625, -3.5220947265625, -3.24139404296875, -2.960693359375, -2.67999267578125, -2.3992919921875, -2.11859130859375, -1.837890625, -1.55718994140625, -1.2764892578125, -0.99578857421875, -0.715087890625, -0.43438720703125, -0.1536865234375, 0.12701416015625, 0.40771484375, 0.68841552734375, 0.9691162109375, 1.24981689453125, 1.530517578125, 1.81121826171875, 2.0919189453125, 2.37261962890625, 2.6533203125, 2.93402099609375, 3.2147216796875, 3.49542236328125, 3.776123046875, 4.05682373046875, 4.3375244140625, 4.61822509765625, 4.89892578125, 5.17962646484375, 5.4603271484375, 5.74102783203125, 6.021728515625, 6.30242919921875, 6.5831298828125, 6.86383056640625, 7.14453125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 21.0, 16.0, 15.0, 36.0, 58.0, 86.0, 114.0, 191.0, 372.0, 827.0, 4837.0, 196554.0, 3784228.0, 200357.0, 4862.0, 803.0, 324.0, 187.0, 105.0, 79.0, 56.0, 40.0, 24.0, 20.0, 16.0, 16.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-22.015625, -21.3955078125, -20.775390625, -20.1552734375, -19.53515625, -18.9150390625, -18.294921875, -17.6748046875, -17.0546875, -16.4345703125, -15.814453125, -15.1943359375, -14.57421875, -13.9541015625, -13.333984375, -12.7138671875, -12.09375, -11.4736328125, -10.853515625, -10.2333984375, -9.61328125, -8.9931640625, -8.373046875, -7.7529296875, -7.1328125, -6.5126953125, -5.892578125, -5.2724609375, -4.65234375, -4.0322265625, -3.412109375, -2.7919921875, -2.171875, -1.5517578125, -0.931640625, -0.3115234375, 0.30859375, 0.9287109375, 1.548828125, 2.1689453125, 2.7890625, 3.4091796875, 4.029296875, 4.6494140625, 5.26953125, 5.8896484375, 6.509765625, 7.1298828125, 7.75, 8.3701171875, 8.990234375, 9.6103515625, 10.23046875, 10.8505859375, 11.470703125, 12.0908203125, 12.7109375, 13.3310546875, 13.951171875, 14.5712890625, 15.19140625, 15.8115234375, 16.431640625, 17.0517578125, 17.671875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 18.0, 39.0, 90.0, 189.0, 238.0, 209.0, 130.0, 61.0, 22.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.017578125, -71.08941650390625, -69.16124725341797, -67.23308563232422, -65.30491638183594, -63.37675476074219, -61.44858932495117, -59.520423889160156, -57.59225845336914, -55.664093017578125, -53.73592758178711, -51.807762145996094, -49.879600524902344, -47.95143127441406, -46.02326965332031, -44.0951042175293, -42.16693878173828, -40.238773345947266, -38.31060791015625, -36.382442474365234, -34.45427703857422, -32.52611541748047, -30.597949981689453, -28.669784545898438, -26.741619110107422, -24.813453674316406, -22.88528823852539, -20.957124710083008, -19.028959274291992, -17.100793838500977, -15.172629356384277, -13.244464874267578, -11.316303253173828, -9.388137817382812, -7.459973335266113, -5.531808376312256, -3.6036434173583984, -1.6754779815673828, 0.2526865005493164, 2.1808509826660156, 4.109016418457031, 6.037181377410889, 7.965346336364746, 9.893510818481445, 11.821676254272461, 13.749841690063477, 15.678006172180176, 17.606170654296875, 19.53433609008789, 21.462501525878906, 23.390666961669922, 25.318830490112305, 27.24699592590332, 29.175161361694336, 31.10332489013672, 33.031490325927734, 34.95965576171875, 36.887821197509766, 38.81598663330078, 40.7441520690918, 42.67231750488281, 44.60047912597656, 46.52864456176758, 48.456809997558594, 50.38497543334961]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 11.0, 9.0, 14.0, 16.0, 21.0, 20.0, 18.0, 30.0, 26.0, 34.0, 40.0, 42.0, 51.0, 47.0, 38.0, 47.0, 47.0, 48.0, 61.0, 47.0, 25.0, 41.0, 35.0, 31.0, 27.0, 22.0, 21.0, 14.0, 17.0, 22.0, 12.0, 12.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.206607818603516, -25.440139770507812, -24.67367172241211, -23.907203674316406, -23.140737533569336, -22.374269485473633, -21.60780143737793, -20.841333389282227, -20.074867248535156, -19.308399200439453, -18.54193115234375, -17.775463104248047, -17.008996963500977, -16.242528915405273, -15.47606086730957, -14.709592819213867, -13.943124771118164, -13.176656723022461, -12.410189628601074, -11.643721580505371, -10.877254486083984, -10.110786437988281, -9.344318389892578, -8.577850341796875, -7.811383247375488, -7.044915676116943, -6.278448104858398, -5.511980056762695, -4.74551248550415, -3.9790449142456055, -3.2125768661499023, -2.4461092948913574, -1.6796398162841797, -0.9131721258163452, -0.14670443534851074, 0.6197633743286133, 1.3862309455871582, 2.152698516845703, 2.9191665649414062, 3.685634136199951, 4.452101707458496, 5.218569278717041, 5.985036849975586, 6.751504898071289, 7.517972469329834, 8.284440040588379, 9.050908088684082, 9.817375183105469, 10.583843231201172, 11.350311279296875, 12.116778373718262, 12.883246421813965, 13.649713516235352, 14.416181564331055, 15.182649612426758, 15.949117660522461, 16.71558380126953, 17.482051849365234, 18.248519897460938, 19.01498794555664, 19.78145408630371, 20.547922134399414, 21.314390182495117, 22.08085823059082, 22.847326278686523]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 10.0, 13.0, 11.0, 23.0, 24.0, 24.0, 22.0, 28.0, 29.0, 33.0, 32.0, 41.0, 41.0, 49.0, 52.0, 51.0, 46.0, 47.0, 38.0, 47.0, 47.0, 36.0, 28.0, 27.0, 32.0, 20.0, 23.0, 18.0, 23.0, 15.0, 8.0, 7.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.48828125, -3.39752197265625, -3.3067626953125, -3.21600341796875, -3.125244140625, -3.03448486328125, -2.9437255859375, -2.85296630859375, -2.76220703125, -2.67144775390625, -2.5806884765625, -2.48992919921875, -2.399169921875, -2.30841064453125, -2.2176513671875, -2.12689208984375, -2.0361328125, -1.94537353515625, -1.8546142578125, -1.76385498046875, -1.673095703125, -1.58233642578125, -1.4915771484375, -1.40081787109375, -1.31005859375, -1.21929931640625, -1.1285400390625, -1.03778076171875, -0.947021484375, -0.85626220703125, -0.7655029296875, -0.67474365234375, -0.583984375, -0.49322509765625, -0.4024658203125, -0.31170654296875, -0.220947265625, -0.13018798828125, -0.0394287109375, 0.05133056640625, 0.14208984375, 0.23284912109375, 0.3236083984375, 0.41436767578125, 0.505126953125, 0.59588623046875, 0.6866455078125, 0.77740478515625, 0.8681640625, 0.95892333984375, 1.0496826171875, 1.14044189453125, 1.231201171875, 1.32196044921875, 1.4127197265625, 1.50347900390625, 1.59423828125, 1.68499755859375, 1.7757568359375, 1.86651611328125, 1.957275390625, 2.04803466796875, 2.1387939453125, 2.22955322265625, 2.3203125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 16.0, 35.0, 48.0, 85.0, 143.0, 185.0, 298.0, 511.0, 780.0, 1269.0, 2028.0, 3165.0, 5121.0, 8338.0, 13489.0, 22218.0, 37510.0, 67126.0, 134326.0, 323971.0, 209656.0, 93429.0, 50254.0, 29272.0, 17349.0, 10639.0, 6545.0, 4044.0, 2484.0, 1471.0, 984.0, 608.0, 420.0, 234.0, 171.0, 99.0, 63.0, 45.0, 34.0, 23.0, 14.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.464111328125, -0.4479713439941406, -0.43183135986328125, -0.4156913757324219, -0.3995513916015625, -0.3834114074707031, -0.36727142333984375, -0.3511314392089844, -0.334991455078125, -0.3188514709472656, -0.30271148681640625, -0.2865715026855469, -0.2704315185546875, -0.2542915344238281, -0.23815155029296875, -0.22201156616210938, -0.20587158203125, -0.18973159790039062, -0.17359161376953125, -0.15745162963867188, -0.1413116455078125, -0.12517166137695312, -0.10903167724609375, -0.09289169311523438, -0.076751708984375, -0.060611724853515625, -0.04447174072265625, -0.028331756591796875, -0.0121917724609375, 0.003948211669921875, 0.02008819580078125, 0.036228179931640625, 0.0523681640625, 0.06850814819335938, 0.08464813232421875, 0.10078811645507812, 0.1169281005859375, 0.13306808471679688, 0.14920806884765625, 0.16534805297851562, 0.181488037109375, 0.19762802124023438, 0.21376800537109375, 0.22990798950195312, 0.2460479736328125, 0.2621879577636719, 0.27832794189453125, 0.2944679260253906, 0.31060791015625, 0.3267478942871094, 0.34288787841796875, 0.3590278625488281, 0.3751678466796875, 0.3913078308105469, 0.40744781494140625, 0.4235877990722656, 0.439727783203125, 0.4558677673339844, 0.47200775146484375, 0.4881477355957031, 0.5042877197265625, 0.5204277038574219, 0.5365676879882812, 0.5527076721191406, 0.56884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 7.0, 6.0, 7.0, 8.0, 11.0, 9.0, 14.0, 15.0, 25.0, 18.0, 26.0, 21.0, 26.0, 24.0, 33.0, 39.0, 40.0, 48.0, 30.0, 49.0, 1073.0, 40.0, 30.0, 58.0, 41.0, 33.0, 38.0, 33.0, 34.0, 30.0, 29.0, 20.0, 15.0, 20.0, 12.0, 13.0, 11.0, 5.0, 11.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7458953857421875, -1.691986083984375, -1.6380767822265625, -1.58416748046875, -1.5302581787109375, -1.476348876953125, -1.4224395751953125, -1.3685302734375, -1.3146209716796875, -1.260711669921875, -1.2068023681640625, -1.15289306640625, -1.0989837646484375, -1.045074462890625, -0.9911651611328125, -0.937255859375, -0.8833465576171875, -0.829437255859375, -0.7755279541015625, -0.72161865234375, -0.6677093505859375, -0.613800048828125, -0.5598907470703125, -0.5059814453125, -0.4520721435546875, -0.398162841796875, -0.3442535400390625, -0.29034423828125, -0.2364349365234375, -0.182525634765625, -0.1286163330078125, -0.07470703125, -0.0207977294921875, 0.033111572265625, 0.0870208740234375, 0.14093017578125, 0.1948394775390625, 0.248748779296875, 0.3026580810546875, 0.3565673828125, 0.4104766845703125, 0.464385986328125, 0.5182952880859375, 0.57220458984375, 0.6261138916015625, 0.680023193359375, 0.7339324951171875, 0.787841796875, 0.8417510986328125, 0.895660400390625, 0.9495697021484375, 1.00347900390625, 1.0573883056640625, 1.111297607421875, 1.1652069091796875, 1.2191162109375, 1.2730255126953125, 1.326934814453125, 1.3808441162109375, 1.43475341796875, 1.4886627197265625, 1.542572021484375, 1.5964813232421875, 1.650390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 13.0, 10.0, 18.0, 31.0, 44.0, 70.0, 92.0, 160.0, 214.0, 348.0, 488.0, 672.0, 1003.0, 1431.0, 1984.0, 2911.0, 4098.0, 5830.0, 8440.0, 12601.0, 18339.0, 27434.0, 42086.0, 69565.0, 128134.0, 1307992.0, 200803.0, 97701.0, 56548.0, 35408.0, 22665.0, 15471.0, 10498.0, 7310.0, 5170.0, 3462.0, 2530.0, 1663.0, 1157.0, 816.0, 571.0, 402.0, 282.0, 217.0, 128.0, 99.0, 69.0, 45.0, 37.0, 24.0, 21.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.385009765625, -0.37290191650390625, -0.3607940673828125, -0.34868621826171875, -0.336578369140625, -0.32447052001953125, -0.3123626708984375, -0.30025482177734375, -0.28814697265625, -0.27603912353515625, -0.2639312744140625, -0.25182342529296875, -0.239715576171875, -0.22760772705078125, -0.2154998779296875, -0.20339202880859375, -0.1912841796875, -0.17917633056640625, -0.1670684814453125, -0.15496063232421875, -0.142852783203125, -0.13074493408203125, -0.1186370849609375, -0.10652923583984375, -0.09442138671875, -0.08231353759765625, -0.0702056884765625, -0.05809783935546875, -0.045989990234375, -0.03388214111328125, -0.0217742919921875, -0.00966644287109375, 0.00244140625, 0.01454925537109375, 0.0266571044921875, 0.03876495361328125, 0.050872802734375, 0.06298065185546875, 0.0750885009765625, 0.08719635009765625, 0.09930419921875, 0.11141204833984375, 0.1235198974609375, 0.13562774658203125, 0.147735595703125, 0.15984344482421875, 0.1719512939453125, 0.18405914306640625, 0.1961669921875, 0.20827484130859375, 0.2203826904296875, 0.23249053955078125, 0.244598388671875, 0.25670623779296875, 0.2688140869140625, 0.28092193603515625, 0.29302978515625, 0.30513763427734375, 0.3172454833984375, 0.32935333251953125, 0.341461181640625, 0.35356903076171875, 0.3656768798828125, 0.37778472900390625, 0.389892578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 9.0, 9.0, 18.0, 13.0, 20.0, 13.0, 26.0, 24.0, 43.0, 35.0, 47.0, 52.0, 61.0, 65.0, 62.0, 67.0, 59.0, 51.0, 50.0, 45.0, 35.0, 24.0, 36.0, 21.0, 13.0, 18.0, 22.0, 9.0, 5.0, 7.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.00011789798736572266, -0.00011467467993497849, -0.00011145137250423431, -0.00010822806507349014, -0.00010500475764274597, -0.0001017814502120018, -9.855814278125763e-05, -9.533483535051346e-05, -9.211152791976929e-05, -8.888822048902512e-05, -8.566491305828094e-05, -8.244160562753677e-05, -7.92182981967926e-05, -7.599499076604843e-05, -7.277168333530426e-05, -6.954837590456009e-05, -6.632506847381592e-05, -6.310176104307175e-05, -5.9878453612327576e-05, -5.6655146181583405e-05, -5.3431838750839233e-05, -5.020853132009506e-05, -4.698522388935089e-05, -4.376191645860672e-05, -4.053860902786255e-05, -3.731530159711838e-05, -3.4091994166374207e-05, -3.0868686735630035e-05, -2.7645379304885864e-05, -2.4422071874141693e-05, -2.1198764443397522e-05, -1.797545701265335e-05, -1.475214958190918e-05, -1.1528842151165009e-05, -8.305534720420837e-06, -5.082227289676666e-06, -1.8589198589324951e-06, 1.364387571811676e-06, 4.587695002555847e-06, 7.811002433300018e-06, 1.103430986404419e-05, 1.425761729478836e-05, 1.7480924725532532e-05, 2.0704232156276703e-05, 2.3927539587020874e-05, 2.7150847017765045e-05, 3.0374154448509216e-05, 3.359746187925339e-05, 3.682076930999756e-05, 4.004407674074173e-05, 4.32673841714859e-05, 4.649069160223007e-05, 4.971399903297424e-05, 5.2937306463718414e-05, 5.6160613894462585e-05, 5.9383921325206757e-05, 6.260722875595093e-05, 6.58305361866951e-05, 6.905384361743927e-05, 7.227715104818344e-05, 7.550045847892761e-05, 7.872376590967178e-05, 8.194707334041595e-05, 8.517038077116013e-05, 8.83936882019043e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 20.0, 37.0, 34.0, 60.0, 105.0, 113.0, 189.0, 292.0, 561.0, 1497.0, 598272.0, 444482.0, 1393.0, 553.0, 304.0, 168.0, 129.0, 82.0, 55.0, 38.0, 25.0, 25.0, 12.0, 16.0, 5.0, 8.0, 4.0, 2.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019092559814453125, -0.0018410086631774902, -0.001772761344909668, -0.0017045140266418457, -0.0016362667083740234, -0.0015680193901062012, -0.001499772071838379, -0.0014315247535705566, -0.0013632774353027344, -0.0012950301170349121, -0.0012267827987670898, -0.0011585354804992676, -0.0010902881622314453, -0.001022040843963623, -0.0009537935256958008, -0.0008855462074279785, -0.0008172988891601562, -0.000749051570892334, -0.0006808042526245117, -0.0006125569343566895, -0.0005443096160888672, -0.0004760622978210449, -0.00040781497955322266, -0.0003395676612854004, -0.0002713203430175781, -0.00020307302474975586, -0.0001348257064819336, -6.657838821411133e-05, 1.6689300537109375e-06, 6.99162483215332e-05, 0.00013816356658935547, 0.00020641088485717773, 0.000274658203125, 0.00034290552139282227, 0.00041115283966064453, 0.0004794001579284668, 0.0005476474761962891, 0.0006158947944641113, 0.0006841421127319336, 0.0007523894309997559, 0.0008206367492675781, 0.0008888840675354004, 0.0009571313858032227, 0.001025378704071045, 0.0010936260223388672, 0.0011618733406066895, 0.0012301206588745117, 0.001298367977142334, 0.0013666152954101562, 0.0014348626136779785, 0.0015031099319458008, 0.001571357250213623, 0.0016396045684814453, 0.0017078518867492676, 0.0017760992050170898, 0.0018443465232849121, 0.0019125938415527344, 0.0019808411598205566, 0.002049088478088379, 0.002117335796356201, 0.0021855831146240234, 0.0022538304328918457, 0.002322077751159668, 0.0023903250694274902, 0.0024585723876953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 57.0, 291.0, 433.0, 206.0, 21.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021717695926781744, -0.00020923932606820017, -0.0002013016928685829, -0.00019336407422088087, -0.0001854264410212636, -0.00017748880782164633, -0.00016955117462202907, -0.0001616135414224118, -0.00015367590822279453, -0.00014573827502317727, -0.00013780064182356, -0.00012986300862394273, -0.0001219253899762407, -0.00011398775677662343, -0.00010605012357700616, -9.81124903773889e-05, -9.017487172968686e-05, -8.223723853006959e-05, -7.429961260640994e-05, -6.636197940679267e-05, -5.842434984515421e-05, -5.048672028351575e-05, -4.2549087083898485e-05, -3.4611457522260025e-05, -2.6673827960621566e-05, -1.8736198398983106e-05, -1.0798567018355243e-05, -2.86093563772738e-06, 5.07669392391108e-06, 1.301432348554954e-05, 2.0951956685166806e-05, 2.8889586246805266e-05, 3.6827230360358953e-05, 4.476485992199741e-05, 5.270248948363587e-05, 6.064012268325314e-05, 6.857774860691279e-05, 7.651538180653006e-05, 8.445301500614733e-05, 9.239064820576459e-05, 0.00010032827412942424, 0.00010826590732904151, 0.00011620353325270116, 0.00012414116645231843, 0.0001320787996519357, 0.00014001643285155296, 0.00014795406605117023, 0.00015589168469887227, 0.00016382931789848953, 0.0001717669510981068, 0.00017970458429772407, 0.0001876422029454261, 0.00019557983614504337, 0.00020351746934466064, 0.0002114551025442779, 0.00021939273574389517, 0.00022733036894351244, 0.0002352680021431297, 0.00024320563534274697, 0.00025114326854236424, 0.0002590809017419815, 0.0002670185058377683, 0.00027495616814121604, 0.00028289377223700285, 0.0002908314054366201]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 5.0, 10.0, 11.0, 9.0, 14.0, 14.0, 16.0, 16.0, 27.0, 29.0, 24.0, 40.0, 33.0, 39.0, 43.0, 40.0, 40.0, 36.0, 28.0, 41.0, 40.0, 38.0, 34.0, 39.0, 37.0, 36.0, 43.0, 22.0, 21.0, 22.0, 18.0, 20.0, 17.0, 14.0, 18.0, 10.0, 9.0, 8.0, 4.0, 11.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.881620407104492e-05, -4.726182669401169e-05, -4.5707449316978455e-05, -4.415307193994522e-05, -4.259869456291199e-05, -4.1044317185878754e-05, -3.948993980884552e-05, -3.7935562431812286e-05, -3.638118505477905e-05, -3.482680767774582e-05, -3.3272430300712585e-05, -3.171805292367935e-05, -3.0163675546646118e-05, -2.8609298169612885e-05, -2.705492079257965e-05, -2.5500543415546417e-05, -2.3946166038513184e-05, -2.239178866147995e-05, -2.0837411284446716e-05, -1.9283033907413483e-05, -1.772865653038025e-05, -1.6174279153347015e-05, -1.4619901776313782e-05, -1.3065524399280548e-05, -1.1511147022247314e-05, -9.95676964521408e-06, -8.402392268180847e-06, -6.8480148911476135e-06, -5.29363751411438e-06, -3.7392601370811462e-06, -2.1848827600479126e-06, -6.30505383014679e-07, 9.238719940185547e-07, 2.4782493710517883e-06, 4.032626748085022e-06, 5.587004125118256e-06, 7.141381502151489e-06, 8.695758879184723e-06, 1.0250136256217957e-05, 1.180451363325119e-05, 1.3358891010284424e-05, 1.4913268387317657e-05, 1.646764576435089e-05, 1.8022023141384125e-05, 1.957640051841736e-05, 2.1130777895450592e-05, 2.2685155272483826e-05, 2.423953264951706e-05, 2.5793910026550293e-05, 2.7348287403583527e-05, 2.890266478061676e-05, 3.0457042157649994e-05, 3.201141953468323e-05, 3.356579691171646e-05, 3.5120174288749695e-05, 3.667455166578293e-05, 3.822892904281616e-05, 3.9783306419849396e-05, 4.133768379688263e-05, 4.289206117391586e-05, 4.44464385509491e-05, 4.600081592798233e-05, 4.7555193305015564e-05, 4.91095706820488e-05, 5.066394805908203e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 10.0, 13.0, 11.0, 23.0, 24.0, 24.0, 22.0, 28.0, 29.0, 33.0, 32.0, 41.0, 41.0, 49.0, 52.0, 51.0, 46.0, 47.0, 38.0, 47.0, 47.0, 36.0, 28.0, 27.0, 32.0, 20.0, 23.0, 18.0, 23.0, 15.0, 8.0, 7.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.48828125, -3.39752197265625, -3.3067626953125, -3.21600341796875, -3.125244140625, -3.03448486328125, -2.9437255859375, -2.85296630859375, -2.76220703125, -2.67144775390625, -2.5806884765625, -2.48992919921875, -2.399169921875, -2.30841064453125, -2.2176513671875, -2.12689208984375, -2.0361328125, -1.94537353515625, -1.8546142578125, -1.76385498046875, -1.673095703125, -1.58233642578125, -1.4915771484375, -1.40081787109375, -1.31005859375, -1.21929931640625, -1.1285400390625, -1.03778076171875, -0.947021484375, -0.85626220703125, -0.7655029296875, -0.67474365234375, -0.583984375, -0.49322509765625, -0.4024658203125, -0.31170654296875, -0.220947265625, -0.13018798828125, -0.0394287109375, 0.05133056640625, 0.14208984375, 0.23284912109375, 0.3236083984375, 0.41436767578125, 0.505126953125, 0.59588623046875, 0.6866455078125, 0.77740478515625, 0.8681640625, 0.95892333984375, 1.0496826171875, 1.14044189453125, 1.231201171875, 1.32196044921875, 1.4127197265625, 1.50347900390625, 1.59423828125, 1.68499755859375, 1.7757568359375, 1.86651611328125, 1.957275390625, 2.04803466796875, 2.1387939453125, 2.22955322265625, 2.3203125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 5.0, 2.0, 7.0, 9.0, 17.0, 16.0, 32.0, 44.0, 78.0, 118.0, 175.0, 283.0, 464.0, 795.0, 1479.0, 2761.0, 5428.0, 11499.0, 26069.0, 68385.0, 210360.0, 418787.0, 192132.0, 62959.0, 24601.0, 10866.0, 5210.0, 2657.0, 1359.0, 772.0, 486.0, 234.0, 154.0, 99.0, 76.0, 46.0, 25.0, 18.0, 9.0, 11.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.697265625, -3.60113525390625, -3.5050048828125, -3.40887451171875, -3.312744140625, -3.21661376953125, -3.1204833984375, -3.02435302734375, -2.92822265625, -2.83209228515625, -2.7359619140625, -2.63983154296875, -2.543701171875, -2.44757080078125, -2.3514404296875, -2.25531005859375, -2.1591796875, -2.06304931640625, -1.9669189453125, -1.87078857421875, -1.774658203125, -1.67852783203125, -1.5823974609375, -1.48626708984375, -1.39013671875, -1.29400634765625, -1.1978759765625, -1.10174560546875, -1.005615234375, -0.90948486328125, -0.8133544921875, -0.71722412109375, -0.62109375, -0.52496337890625, -0.4288330078125, -0.33270263671875, -0.236572265625, -0.14044189453125, -0.0443115234375, 0.05181884765625, 0.14794921875, 0.24407958984375, 0.3402099609375, 0.43634033203125, 0.532470703125, 0.62860107421875, 0.7247314453125, 0.82086181640625, 0.9169921875, 1.01312255859375, 1.1092529296875, 1.20538330078125, 1.301513671875, 1.39764404296875, 1.4937744140625, 1.58990478515625, 1.68603515625, 1.78216552734375, 1.8782958984375, 1.97442626953125, 2.070556640625, 2.16668701171875, 2.2628173828125, 2.35894775390625, 2.455078125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 5.0, 3.0, 8.0, 6.0, 7.0, 7.0, 16.0, 17.0, 8.0, 23.0, 23.0, 20.0, 25.0, 37.0, 41.0, 43.0, 43.0, 53.0, 96.0, 205.0, 1506.0, 291.0, 115.0, 70.0, 50.0, 47.0, 45.0, 26.0, 31.0, 28.0, 23.0, 17.0, 23.0, 22.0, 19.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-12.53125, -12.198974609375, -11.86669921875, -11.534423828125, -11.2021484375, -10.869873046875, -10.53759765625, -10.205322265625, -9.873046875, -9.540771484375, -9.20849609375, -8.876220703125, -8.5439453125, -8.211669921875, -7.87939453125, -7.547119140625, -7.21484375, -6.882568359375, -6.55029296875, -6.218017578125, -5.8857421875, -5.553466796875, -5.22119140625, -4.888916015625, -4.556640625, -4.224365234375, -3.89208984375, -3.559814453125, -3.2275390625, -2.895263671875, -2.56298828125, -2.230712890625, -1.8984375, -1.566162109375, -1.23388671875, -0.901611328125, -0.5693359375, -0.237060546875, 0.09521484375, 0.427490234375, 0.759765625, 1.092041015625, 1.42431640625, 1.756591796875, 2.0888671875, 2.421142578125, 2.75341796875, 3.085693359375, 3.41796875, 3.750244140625, 4.08251953125, 4.414794921875, 4.7470703125, 5.079345703125, 5.41162109375, 5.743896484375, 6.076171875, 6.408447265625, 6.74072265625, 7.072998046875, 7.4052734375, 7.737548828125, 8.06982421875, 8.402099609375, 8.734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 4.0, 9.0, 6.0, 28.0, 20.0, 41.0, 40.0, 59.0, 85.0, 104.0, 173.0, 301.0, 630.0, 3625.0, 2420970.0, 715503.0, 2713.0, 543.0, 281.0, 184.0, 97.0, 67.0, 48.0, 42.0, 36.0, 26.0, 11.0, 8.0, 11.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -32.0859375, -31.140625, -30.1953125, -29.25, -28.3046875, -27.359375, -26.4140625, -25.46875, -24.5234375, -23.578125, -22.6328125, -21.6875, -20.7421875, -19.796875, -18.8515625, -17.90625, -16.9609375, -16.015625, -15.0703125, -14.125, -13.1796875, -12.234375, -11.2890625, -10.34375, -9.3984375, -8.453125, -7.5078125, -6.5625, -5.6171875, -4.671875, -3.7265625, -2.78125, -1.8359375, -0.890625, 0.0546875, 1.0, 1.9453125, 2.890625, 3.8359375, 4.78125, 5.7265625, 6.671875, 7.6171875, 8.5625, 9.5078125, 10.453125, 11.3984375, 12.34375, 13.2890625, 14.234375, 15.1796875, 16.125, 17.0703125, 18.015625, 18.9609375, 19.90625, 20.8515625, 21.796875, 22.7421875, 23.6875, 24.6328125, 25.578125, 26.5234375, 27.46875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 178.0, 732.0, 100.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.644240379333496, -12.759722709655762, -9.875204086303711, -6.990686416625977, -4.106168746948242, -1.2216510772705078, 1.662867546081543, 4.547385215759277, 7.431902885437012, 10.316420555114746, 13.200939178466797, 16.08545684814453, 18.969974517822266, 21.8544921875, 24.739009857177734, 27.62352752685547, 30.508045196533203, 33.39256286621094, 36.27708053588867, 39.161598205566406, 42.04611587524414, 44.930633544921875, 47.815155029296875, 50.699668884277344, 53.584190368652344, 56.46870803833008, 59.35322570800781, 62.23774337768555, 65.12226104736328, 68.00678253173828, 70.89129638671875, 73.77581787109375, 76.66033172607422, 79.54485321044922, 82.42936706542969, 85.31388854980469, 88.19840240478516, 91.08292388916016, 93.96743774414062, 96.85195922851562, 99.7364730834961, 102.6209945678711, 105.50550842285156, 108.39002990722656, 111.27454376220703, 114.15906524658203, 117.0435791015625, 119.9281005859375, 122.8126220703125, 125.6971435546875, 128.5816650390625, 131.46617126464844, 134.35069274902344, 137.23521423339844, 140.11973571777344, 143.00424194335938, 145.88876342773438, 148.77328491210938, 151.65780639648438, 154.5423126220703, 157.4268341064453, 160.3113555908203, 163.1958770751953, 166.08038330078125, 168.96490478515625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 9.0, 10.0, 6.0, 9.0, 13.0, 10.0, 24.0, 24.0, 27.0, 22.0, 36.0, 29.0, 34.0, 38.0, 40.0, 37.0, 38.0, 39.0, 41.0, 44.0, 42.0, 50.0, 38.0, 45.0, 37.0, 27.0, 32.0, 34.0, 19.0, 14.0, 26.0, 25.0, 15.0, 12.0, 16.0, 9.0, 7.0, 4.0, 4.0, 6.0, 5.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.087427139282227, -26.29973602294922, -25.51204490661621, -24.724353790283203, -23.936662673950195, -23.148971557617188, -22.36128044128418, -21.573589324951172, -20.785898208618164, -19.998207092285156, -19.21051597595215, -18.42282485961914, -17.635133743286133, -16.847442626953125, -16.059751510620117, -15.27206039428711, -14.484368324279785, -13.696677207946777, -12.90898609161377, -12.121294975280762, -11.333603858947754, -10.545912742614746, -9.758220672607422, -8.970529556274414, -8.182838439941406, -7.395147323608398, -6.607456207275391, -5.819765090942383, -5.032073974609375, -4.244382858276367, -3.456691265106201, -2.6690001487731934, -1.8813095092773438, -1.093618392944336, -0.3059271574020386, 0.4817640781402588, 1.2694551944732666, 2.0571463108062744, 2.8448376655578613, 3.632528781890869, 4.420219898223877, 5.207911014556885, 5.995602130889893, 6.783293724060059, 7.570984840393066, 8.358675956726074, 9.146367073059082, 9.93405818939209, 10.721749305725098, 11.509440422058105, 12.297131538391113, 13.084822654724121, 13.872513771057129, 14.660204887390137, 15.447896957397461, 16.23558807373047, 17.023279190063477, 17.810970306396484, 18.598661422729492, 19.3863525390625, 20.174043655395508, 20.961734771728516, 21.749425888061523, 22.53711700439453, 23.32480812072754]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 2.0, 9.0, 9.0, 13.0, 10.0, 18.0, 18.0, 20.0, 26.0, 29.0, 32.0, 37.0, 33.0, 38.0, 37.0, 52.0, 49.0, 39.0, 50.0, 48.0, 49.0, 43.0, 47.0, 30.0, 36.0, 28.0, 31.0, 22.0, 26.0, 22.0, 20.0, 14.0, 14.0, 11.0, 8.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.72265625, -3.62689208984375, -3.5311279296875, -3.43536376953125, -3.339599609375, -3.24383544921875, -3.1480712890625, -3.05230712890625, -2.95654296875, -2.86077880859375, -2.7650146484375, -2.66925048828125, -2.573486328125, -2.47772216796875, -2.3819580078125, -2.28619384765625, -2.1904296875, -2.09466552734375, -1.9989013671875, -1.90313720703125, -1.807373046875, -1.71160888671875, -1.6158447265625, -1.52008056640625, -1.42431640625, -1.32855224609375, -1.2327880859375, -1.13702392578125, -1.041259765625, -0.94549560546875, -0.8497314453125, -0.75396728515625, -0.658203125, -0.56243896484375, -0.4666748046875, -0.37091064453125, -0.275146484375, -0.17938232421875, -0.0836181640625, 0.01214599609375, 0.10791015625, 0.20367431640625, 0.2994384765625, 0.39520263671875, 0.490966796875, 0.58673095703125, 0.6824951171875, 0.77825927734375, 0.8740234375, 0.96978759765625, 1.0655517578125, 1.16131591796875, 1.257080078125, 1.35284423828125, 1.4486083984375, 1.54437255859375, 1.64013671875, 1.73590087890625, 1.8316650390625, 1.92742919921875, 2.023193359375, 2.11895751953125, 2.2147216796875, 2.31048583984375, 2.40625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 4.0, 7.0, 11.0, 10.0, 10.0, 24.0, 19.0, 21.0, 34.0, 43.0, 49.0, 48.0, 65.0, 78.0, 132.0, 214.0, 558.0, 3366.0, 114100.0, 3649984.0, 417365.0, 6543.0, 741.0, 221.0, 151.0, 85.0, 71.0, 60.0, 41.0, 42.0, 25.0, 32.0, 28.0, 28.0, 12.0, 17.0, 4.0, 11.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-16.578125, -16.14892578125, -15.7197265625, -15.29052734375, -14.861328125, -14.43212890625, -14.0029296875, -13.57373046875, -13.14453125, -12.71533203125, -12.2861328125, -11.85693359375, -11.427734375, -10.99853515625, -10.5693359375, -10.14013671875, -9.7109375, -9.28173828125, -8.8525390625, -8.42333984375, -7.994140625, -7.56494140625, -7.1357421875, -6.70654296875, -6.27734375, -5.84814453125, -5.4189453125, -4.98974609375, -4.560546875, -4.13134765625, -3.7021484375, -3.27294921875, -2.84375, -2.41455078125, -1.9853515625, -1.55615234375, -1.126953125, -0.69775390625, -0.2685546875, 0.16064453125, 0.58984375, 1.01904296875, 1.4482421875, 1.87744140625, 2.306640625, 2.73583984375, 3.1650390625, 3.59423828125, 4.0234375, 4.45263671875, 4.8818359375, 5.31103515625, 5.740234375, 6.16943359375, 6.5986328125, 7.02783203125, 7.45703125, 7.88623046875, 8.3154296875, 8.74462890625, 9.173828125, 9.60302734375, 10.0322265625, 10.46142578125, 10.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 21.0, 23.0, 50.0, 84.0, 111.0, 198.0, 324.0, 463.0, 681.0, 668.0, 518.0, 347.0, 208.0, 134.0, 90.0, 63.0, 22.0, 30.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.3507080078125, -10.037353515625, -9.7239990234375, -9.41064453125, -9.0972900390625, -8.783935546875, -8.4705810546875, -8.1572265625, -7.8438720703125, -7.530517578125, -7.2171630859375, -6.90380859375, -6.5904541015625, -6.277099609375, -5.9637451171875, -5.650390625, -5.3370361328125, -5.023681640625, -4.7103271484375, -4.39697265625, -4.0836181640625, -3.770263671875, -3.4569091796875, -3.1435546875, -2.8302001953125, -2.516845703125, -2.2034912109375, -1.89013671875, -1.5767822265625, -1.263427734375, -0.9500732421875, -0.63671875, -0.3233642578125, -0.010009765625, 0.3033447265625, 0.61669921875, 0.9300537109375, 1.243408203125, 1.5567626953125, 1.8701171875, 2.1834716796875, 2.496826171875, 2.8101806640625, 3.12353515625, 3.4368896484375, 3.750244140625, 4.0635986328125, 4.376953125, 4.6903076171875, 5.003662109375, 5.3170166015625, 5.63037109375, 5.9437255859375, 6.257080078125, 6.5704345703125, 6.8837890625, 7.1971435546875, 7.510498046875, 7.8238525390625, 8.13720703125, 8.4505615234375, 8.763916015625, 9.0772705078125, 9.390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 15.0, 14.0, 33.0, 54.0, 83.0, 149.0, 210.0, 329.0, 901.0, 6439.0, 2433339.0, 1746017.0, 4995.0, 822.0, 324.0, 222.0, 131.0, 75.0, 42.0, 36.0, 15.0, 12.0, 8.0, 4.0, 1.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.28369140625, -23.3486328125, -22.41357421875, -21.478515625, -20.54345703125, -19.6083984375, -18.67333984375, -17.73828125, -16.80322265625, -15.8681640625, -14.93310546875, -13.998046875, -13.06298828125, -12.1279296875, -11.19287109375, -10.2578125, -9.32275390625, -8.3876953125, -7.45263671875, -6.517578125, -5.58251953125, -4.6474609375, -3.71240234375, -2.77734375, -1.84228515625, -0.9072265625, 0.02783203125, 0.962890625, 1.89794921875, 2.8330078125, 3.76806640625, 4.703125, 5.63818359375, 6.5732421875, 7.50830078125, 8.443359375, 9.37841796875, 10.3134765625, 11.24853515625, 12.18359375, 13.11865234375, 14.0537109375, 14.98876953125, 15.923828125, 16.85888671875, 17.7939453125, 18.72900390625, 19.6640625, 20.59912109375, 21.5341796875, 22.46923828125, 23.404296875, 24.33935546875, 25.2744140625, 26.20947265625, 27.14453125, 28.07958984375, 29.0146484375, 29.94970703125, 30.884765625, 31.81982421875, 32.7548828125, 33.68994140625, 34.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 19.0, 81.0, 217.0, 317.0, 255.0, 92.0, 25.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.065269470214844, -15.283468246459961, -12.501667976379395, -9.719867706298828, -6.938066482543945, -4.1562652587890625, -1.3744659423828125, 1.4073352813720703, 4.189136505126953, 6.970937252044678, 9.752737998962402, 12.534538269042969, 15.316339492797852, 18.098140716552734, 20.879940032958984, 23.661741256713867, 26.44354248046875, 29.225343704223633, 32.007144927978516, 34.788944244384766, 37.57074737548828, 40.35254669189453, 43.13434600830078, 45.91614532470703, 48.69794845581055, 51.4797477722168, 54.26155090332031, 57.04335021972656, 59.82514953613281, 62.60695266723633, 65.38874816894531, 68.1705551147461, 70.95234680175781, 73.73414611816406, 76.51594543457031, 79.29774475097656, 82.07955169677734, 84.8613510131836, 87.64315032958984, 90.4249496459961, 93.20675659179688, 95.98855590820312, 98.77035522460938, 101.55215454101562, 104.3339614868164, 107.11576080322266, 109.8975601196289, 112.67935943603516, 115.4611587524414, 118.24295806884766, 121.0247573852539, 123.80656433105469, 126.58836364746094, 129.3701629638672, 132.15196228027344, 134.9337615966797, 137.71556091308594, 140.4973602294922, 143.27915954589844, 146.0609588623047, 148.84275817871094, 151.62457275390625, 154.4063720703125, 157.18817138671875, 159.969970703125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 2.0, 7.0, 10.0, 10.0, 7.0, 12.0, 20.0, 16.0, 15.0, 18.0, 18.0, 15.0, 27.0, 25.0, 37.0, 22.0, 31.0, 38.0, 30.0, 36.0, 40.0, 26.0, 43.0, 50.0, 47.0, 31.0, 43.0, 33.0, 33.0, 29.0, 21.0, 34.0, 18.0, 19.0, 16.0, 16.0, 19.0, 11.0, 12.0, 8.0, 8.0, 10.0, 10.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.316221237182617, -17.724740982055664, -17.13326072692871, -16.541780471801758, -15.950300216674805, -15.358819961547852, -14.767340660095215, -14.175860404968262, -13.584380149841309, -12.992899894714355, -12.401419639587402, -11.80993938446045, -11.218460083007812, -10.62697982788086, -10.035499572753906, -9.444019317626953, -8.8525390625, -8.261058807373047, -7.669578552246094, -7.078098773956299, -6.486618518829346, -5.895138263702393, -5.303658485412598, -4.7121782302856445, -4.120697975158691, -3.5292177200317383, -2.9377377033233643, -2.3462576866149902, -1.754777431488037, -1.163297176361084, -0.57181715965271, 0.019662857055664062, 0.61114501953125, 1.2026251554489136, 1.7941052913665771, 2.385585308074951, 2.9770655632019043, 3.5685458183288574, 4.160025596618652, 4.7515058517456055, 5.342986106872559, 5.934466361999512, 6.525946617126465, 7.11742639541626, 7.708906650543213, 8.300386428833008, 8.891866683959961, 9.483346939086914, 10.074827194213867, 10.66630744934082, 11.257787704467773, 11.849267959594727, 12.44074821472168, 13.032228469848633, 13.62370777130127, 14.215188026428223, 14.806668281555176, 15.398148536682129, 15.989628791809082, 16.58110809326172, 17.172588348388672, 17.764068603515625, 18.355548858642578, 18.94702911376953, 19.538509368896484]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 5.0, 15.0, 10.0, 14.0, 10.0, 14.0, 19.0, 22.0, 22.0, 28.0, 33.0, 48.0, 43.0, 47.0, 46.0, 34.0, 47.0, 47.0, 50.0, 45.0, 53.0, 45.0, 33.0, 31.0, 26.0, 30.0, 25.0, 34.0, 18.0, 17.0, 22.0, 21.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.9296875, -3.831787109375, -3.73388671875, -3.635986328125, -3.5380859375, -3.440185546875, -3.34228515625, -3.244384765625, -3.146484375, -3.048583984375, -2.95068359375, -2.852783203125, -2.7548828125, -2.656982421875, -2.55908203125, -2.461181640625, -2.36328125, -2.265380859375, -2.16748046875, -2.069580078125, -1.9716796875, -1.873779296875, -1.77587890625, -1.677978515625, -1.580078125, -1.482177734375, -1.38427734375, -1.286376953125, -1.1884765625, -1.090576171875, -0.99267578125, -0.894775390625, -0.796875, -0.698974609375, -0.60107421875, -0.503173828125, -0.4052734375, -0.307373046875, -0.20947265625, -0.111572265625, -0.013671875, 0.084228515625, 0.18212890625, 0.280029296875, 0.3779296875, 0.475830078125, 0.57373046875, 0.671630859375, 0.76953125, 0.867431640625, 0.96533203125, 1.063232421875, 1.1611328125, 1.259033203125, 1.35693359375, 1.454833984375, 1.552734375, 1.650634765625, 1.74853515625, 1.846435546875, 1.9443359375, 2.042236328125, 2.14013671875, 2.238037109375, 2.3359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 17.0, 22.0, 33.0, 40.0, 66.0, 113.0, 196.0, 349.0, 598.0, 1173.0, 2159.0, 3912.0, 7220.0, 13312.0, 25795.0, 52789.0, 120005.0, 330069.0, 286200.0, 106489.0, 47495.0, 23536.0, 12517.0, 6712.0, 3496.0, 1859.0, 1000.0, 587.0, 316.0, 184.0, 114.0, 61.0, 36.0, 30.0, 10.0, 14.0, 11.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75927734375, -0.7369003295898438, -0.7145233154296875, -0.6921463012695312, -0.669769287109375, -0.6473922729492188, -0.6250152587890625, -0.6026382446289062, -0.58026123046875, -0.5578842163085938, -0.5355072021484375, -0.5131301879882812, -0.490753173828125, -0.46837615966796875, -0.4459991455078125, -0.42362213134765625, -0.4012451171875, -0.37886810302734375, -0.3564910888671875, -0.33411407470703125, -0.311737060546875, -0.28936004638671875, -0.2669830322265625, -0.24460601806640625, -0.22222900390625, -0.19985198974609375, -0.1774749755859375, -0.15509796142578125, -0.132720947265625, -0.11034393310546875, -0.0879669189453125, -0.06558990478515625, -0.043212890625, -0.02083587646484375, 0.0015411376953125, 0.02391815185546875, 0.046295166015625, 0.06867218017578125, 0.0910491943359375, 0.11342620849609375, 0.13580322265625, 0.15818023681640625, 0.1805572509765625, 0.20293426513671875, 0.225311279296875, 0.24768829345703125, 0.2700653076171875, 0.29244232177734375, 0.3148193359375, 0.33719635009765625, 0.3595733642578125, 0.38195037841796875, 0.404327392578125, 0.42670440673828125, 0.4490814208984375, 0.47145843505859375, 0.49383544921875, 0.5162124633789062, 0.5385894775390625, 0.5609664916992188, 0.583343505859375, 0.6057205200195312, 0.6280975341796875, 0.6504745483398438, 0.6728515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 6.0, 10.0, 14.0, 11.0, 12.0, 14.0, 15.0, 30.0, 30.0, 27.0, 31.0, 34.0, 31.0, 40.0, 35.0, 31.0, 40.0, 41.0, 44.0, 1060.0, 38.0, 34.0, 29.0, 45.0, 49.0, 34.0, 13.0, 31.0, 22.0, 16.0, 29.0, 17.0, 23.0, 14.0, 10.0, 9.0, 7.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8388671875, -1.7852935791015625, -1.731719970703125, -1.6781463623046875, -1.62457275390625, -1.5709991455078125, -1.517425537109375, -1.4638519287109375, -1.4102783203125, -1.3567047119140625, -1.303131103515625, -1.2495574951171875, -1.19598388671875, -1.1424102783203125, -1.088836669921875, -1.0352630615234375, -0.981689453125, -0.9281158447265625, -0.874542236328125, -0.8209686279296875, -0.76739501953125, -0.7138214111328125, -0.660247802734375, -0.6066741943359375, -0.5531005859375, -0.4995269775390625, -0.445953369140625, -0.3923797607421875, -0.33880615234375, -0.2852325439453125, -0.231658935546875, -0.1780853271484375, -0.12451171875, -0.0709381103515625, -0.017364501953125, 0.0362091064453125, 0.08978271484375, 0.1433563232421875, 0.196929931640625, 0.2505035400390625, 0.3040771484375, 0.3576507568359375, 0.411224365234375, 0.4647979736328125, 0.51837158203125, 0.5719451904296875, 0.625518798828125, 0.6790924072265625, 0.732666015625, 0.7862396240234375, 0.839813232421875, 0.8933868408203125, 0.94696044921875, 1.0005340576171875, 1.054107666015625, 1.1076812744140625, 1.1612548828125, 1.2148284912109375, 1.268402099609375, 1.3219757080078125, 1.37554931640625, 1.4291229248046875, 1.482696533203125, 1.5362701416015625, 1.58984375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 8.0, 13.0, 21.0, 27.0, 51.0, 87.0, 126.0, 160.0, 243.0, 343.0, 512.0, 741.0, 1018.0, 1533.0, 2162.0, 3028.0, 4493.0, 6457.0, 9237.0, 13545.0, 19938.0, 29827.0, 46058.0, 73770.0, 132589.0, 1305608.0, 181939.0, 94788.0, 56250.0, 35796.0, 24133.0, 16305.0, 11381.0, 7612.0, 5325.0, 3647.0, 2476.0, 1807.0, 1238.0, 819.0, 614.0, 415.0, 308.0, 195.0, 141.0, 100.0, 67.0, 55.0, 43.0, 37.0, 18.0, 12.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3773651123046875, -0.365081787109375, -0.3527984619140625, -0.34051513671875, -0.3282318115234375, -0.315948486328125, -0.3036651611328125, -0.2913818359375, -0.2790985107421875, -0.266815185546875, -0.2545318603515625, -0.24224853515625, -0.2299652099609375, -0.217681884765625, -0.2053985595703125, -0.193115234375, -0.1808319091796875, -0.168548583984375, -0.1562652587890625, -0.14398193359375, -0.1316986083984375, -0.119415283203125, -0.1071319580078125, -0.0948486328125, -0.0825653076171875, -0.070281982421875, -0.0579986572265625, -0.04571533203125, -0.0334320068359375, -0.021148681640625, -0.0088653564453125, 0.00341796875, 0.0157012939453125, 0.027984619140625, 0.0402679443359375, 0.05255126953125, 0.0648345947265625, 0.077117919921875, 0.0894012451171875, 0.1016845703125, 0.1139678955078125, 0.126251220703125, 0.1385345458984375, 0.15081787109375, 0.1631011962890625, 0.175384521484375, 0.1876678466796875, 0.199951171875, 0.2122344970703125, 0.224517822265625, 0.2368011474609375, 0.24908447265625, 0.2613677978515625, 0.273651123046875, 0.2859344482421875, 0.2982177734375, 0.3105010986328125, 0.322784423828125, 0.3350677490234375, 0.34735107421875, 0.3596343994140625, 0.371917724609375, 0.3842010498046875, 0.396484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 11.0, 7.0, 12.0, 9.0, 13.0, 7.0, 24.0, 36.0, 41.0, 53.0, 77.0, 66.0, 84.0, 96.0, 79.0, 73.0, 71.0, 49.0, 44.0, 36.0, 23.0, 14.0, 13.0, 11.0, 8.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010526180267333984, -0.00010079145431518555, -9.632110595703125e-05, -9.185075759887695e-05, -8.738040924072266e-05, -8.291006088256836e-05, -7.843971252441406e-05, -7.396936416625977e-05, -6.949901580810547e-05, -6.502866744995117e-05, -6.0558319091796875e-05, -5.608797073364258e-05, -5.161762237548828e-05, -4.7147274017333984e-05, -4.267692565917969e-05, -3.820657730102539e-05, -3.3736228942871094e-05, -2.9265880584716797e-05, -2.47955322265625e-05, -2.0325183868408203e-05, -1.5854835510253906e-05, -1.138448715209961e-05, -6.9141387939453125e-06, -2.4437904357910156e-06, 2.0265579223632812e-06, 6.496906280517578e-06, 1.0967254638671875e-05, 1.5437602996826172e-05, 1.990795135498047e-05, 2.4378299713134766e-05, 2.8848648071289062e-05, 3.331899642944336e-05, 3.7789344787597656e-05, 4.225969314575195e-05, 4.673004150390625e-05, 5.120038986206055e-05, 5.5670738220214844e-05, 6.014108657836914e-05, 6.461143493652344e-05, 6.908178329467773e-05, 7.355213165283203e-05, 7.802248001098633e-05, 8.249282836914062e-05, 8.696317672729492e-05, 9.143352508544922e-05, 9.590387344360352e-05, 0.00010037422180175781, 0.00010484457015991211, 0.0001093149185180664, 0.0001137852668762207, 0.000118255615234375, 0.0001227259635925293, 0.0001271963119506836, 0.0001316666603088379, 0.0001361370086669922, 0.00014060735702514648, 0.00014507770538330078, 0.00014954805374145508, 0.00015401840209960938, 0.00015848875045776367, 0.00016295909881591797, 0.00016742944717407227, 0.00017189979553222656, 0.00017637014389038086, 0.00018084049224853516]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 4.0, 6.0, 6.0, 3.0, 11.0, 8.0, 10.0, 24.0, 30.0, 34.0, 48.0, 65.0, 103.0, 176.0, 338.0, 573.0, 2753.0, 996935.0, 45371.0, 971.0, 397.0, 234.0, 144.0, 99.0, 55.0, 36.0, 27.0, 17.0, 12.0, 13.0, 7.0, 14.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.003032684326171875, -0.0029523074626922607, -0.0028719305992126465, -0.0027915537357330322, -0.002711176872253418, -0.0026308000087738037, -0.0025504231452941895, -0.002470046281814575, -0.002389669418334961, -0.0023092925548553467, -0.0022289156913757324, -0.002148538827896118, -0.002068161964416504, -0.0019877851009368896, -0.0019074082374572754, -0.0018270313739776611, -0.0017466545104980469, -0.0016662776470184326, -0.0015859007835388184, -0.001505523920059204, -0.0014251470565795898, -0.0013447701930999756, -0.0012643933296203613, -0.001184016466140747, -0.0011036396026611328, -0.0010232627391815186, -0.0009428858757019043, -0.00086250901222229, -0.0007821321487426758, -0.0007017552852630615, -0.0006213784217834473, -0.000541001558303833, -0.00046062469482421875, -0.0003802478313446045, -0.00029987096786499023, -0.00021949410438537598, -0.00013911724090576172, -5.874037742614746e-05, 2.1636486053466797e-05, 0.00010201334953308105, 0.0001823902130126953, 0.00026276707649230957, 0.00034314393997192383, 0.0004235208034515381, 0.0005038976669311523, 0.0005842745304107666, 0.0006646513938903809, 0.0007450282573699951, 0.0008254051208496094, 0.0009057819843292236, 0.0009861588478088379, 0.0010665357112884521, 0.0011469125747680664, 0.0012272894382476807, 0.001307666301727295, 0.0013880431652069092, 0.0014684200286865234, 0.0015487968921661377, 0.001629173755645752, 0.0017095506191253662, 0.0017899274826049805, 0.0018703043460845947, 0.001950681209564209, 0.0020310580730438232, 0.0021114349365234375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 48.0, 143.0, 282.0, 263.0, 176.0, 68.0, 12.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.282000246457756e-05, -8.704788342583925e-05, -8.127576438710093e-05, -7.550364534836262e-05, -6.973153358558193e-05, -6.395941454684362e-05, -5.818729550810531e-05, -5.2415180107345805e-05, -4.6643061068607494e-05, -4.0870942029869184e-05, -3.509882662910968e-05, -2.932670759037137e-05, -2.3554590370622464e-05, -1.7782473150873557e-05, -1.2010354112135246e-05, -6.238238711375743e-06, -4.661196726374328e-07, 5.305998001858825e-06, 1.1078115676355083e-05, 1.685023380559869e-05, 2.2622351025347598e-05, 2.8394468245096505e-05, 3.4166587283834815e-05, 3.993870268459432e-05, 4.571082172333263e-05, 5.148294076207094e-05, 5.725505616283044e-05, 6.302717520156875e-05, 6.879929424030706e-05, 7.457140600308776e-05, 8.034352504182607e-05, 8.611564408056438e-05, 9.188776311930269e-05, 9.7659882158041e-05, 0.00010343200119677931, 0.00010920412023551762, 0.00011497623199829832, 0.00012074835103703663, 0.00012652046279981732, 0.00013229258183855563, 0.00013806470087729394, 0.00014383681991603225, 0.00014960893895477057, 0.00015538105799350888, 0.00016115317703224719, 0.00016692528151907027, 0.0001726974151097238, 0.0001784695195965469, 0.00018424165318720043, 0.00019001377222593874, 0.00019578589126467705, 0.00020155801030341536, 0.00020733012934215367, 0.00021310223382897675, 0.0002188743674196303, 0.00022464647190645337, 0.00023041859094519168, 0.00023619070998393, 0.0002419628290226683, 0.0002477349480614066, 0.0002535070525482297, 0.00025927918613888323, 0.0002650512906257063, 0.00027082342421635985, 0.00027659552870318294]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 10.0, 13.0, 11.0, 16.0, 16.0, 15.0, 15.0, 26.0, 24.0, 32.0, 27.0, 33.0, 38.0, 35.0, 37.0, 42.0, 53.0, 42.0, 38.0, 44.0, 34.0, 43.0, 34.0, 41.0, 35.0, 34.0, 38.0, 25.0, 28.0, 18.0, 19.0, 13.0, 9.0, 11.0, 9.0, 8.0, 6.0, 6.0, 7.0, 0.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.252527236938477e-05, -6.053224205970764e-05, -5.853921175003052e-05, -5.6546181440353394e-05, -5.455315113067627e-05, -5.2560120820999146e-05, -5.056709051132202e-05, -4.85740602016449e-05, -4.6581029891967773e-05, -4.458799958229065e-05, -4.2594969272613525e-05, -4.06019389629364e-05, -3.860890865325928e-05, -3.661587834358215e-05, -3.462284803390503e-05, -3.2629817724227905e-05, -3.063678741455078e-05, -2.8643757104873657e-05, -2.6650726795196533e-05, -2.465769648551941e-05, -2.2664666175842285e-05, -2.067163586616516e-05, -1.8678605556488037e-05, -1.6685575246810913e-05, -1.4692544937133789e-05, -1.2699514627456665e-05, -1.0706484317779541e-05, -8.713454008102417e-06, -6.720423698425293e-06, -4.727393388748169e-06, -2.734363079071045e-06, -7.413327693939209e-07, 1.2516975402832031e-06, 3.244727849960327e-06, 5.237758159637451e-06, 7.230788469314575e-06, 9.2238187789917e-06, 1.1216849088668823e-05, 1.3209879398345947e-05, 1.5202909708023071e-05, 1.7195940017700195e-05, 1.918897032737732e-05, 2.1182000637054443e-05, 2.3175030946731567e-05, 2.516806125640869e-05, 2.7161091566085815e-05, 2.915412187576294e-05, 3.1147152185440063e-05, 3.314018249511719e-05, 3.513321280479431e-05, 3.7126243114471436e-05, 3.911927342414856e-05, 4.1112303733825684e-05, 4.310533404350281e-05, 4.509836435317993e-05, 4.7091394662857056e-05, 4.908442497253418e-05, 5.1077455282211304e-05, 5.307048559188843e-05, 5.506351590156555e-05, 5.7056546211242676e-05, 5.90495765209198e-05, 6.104260683059692e-05, 6.303563714027405e-05, 6.502866744995117e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 5.0, 15.0, 10.0, 14.0, 10.0, 14.0, 19.0, 22.0, 22.0, 28.0, 33.0, 48.0, 43.0, 47.0, 46.0, 34.0, 47.0, 47.0, 50.0, 45.0, 53.0, 45.0, 33.0, 31.0, 26.0, 30.0, 25.0, 34.0, 18.0, 17.0, 22.0, 21.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.9296875, -3.831787109375, -3.73388671875, -3.635986328125, -3.5380859375, -3.440185546875, -3.34228515625, -3.244384765625, -3.146484375, -3.048583984375, -2.95068359375, -2.852783203125, -2.7548828125, -2.656982421875, -2.55908203125, -2.461181640625, -2.36328125, -2.265380859375, -2.16748046875, -2.069580078125, -1.9716796875, -1.873779296875, -1.77587890625, -1.677978515625, -1.580078125, -1.482177734375, -1.38427734375, -1.286376953125, -1.1884765625, -1.090576171875, -0.99267578125, -0.894775390625, -0.796875, -0.698974609375, -0.60107421875, -0.503173828125, -0.4052734375, -0.307373046875, -0.20947265625, -0.111572265625, -0.013671875, 0.084228515625, 0.18212890625, 0.280029296875, 0.3779296875, 0.475830078125, 0.57373046875, 0.671630859375, 0.76953125, 0.867431640625, 0.96533203125, 1.063232421875, 1.1611328125, 1.259033203125, 1.35693359375, 1.454833984375, 1.552734375, 1.650634765625, 1.74853515625, 1.846435546875, 1.9443359375, 2.042236328125, 2.14013671875, 2.238037109375, 2.3359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 12.0, 15.0, 19.0, 19.0, 36.0, 57.0, 77.0, 157.0, 247.0, 469.0, 861.0, 1831.0, 3604.0, 7369.0, 14911.0, 31104.0, 67229.0, 163699.0, 383447.0, 215767.0, 83685.0, 37819.0, 18380.0, 8952.0, 4323.0, 2157.0, 1074.0, 504.0, 279.0, 168.0, 86.0, 55.0, 39.0, 33.0, 24.0, 11.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.150482177734375, -2.06658935546875, -1.982696533203125, -1.8988037109375, -1.814910888671875, -1.73101806640625, -1.647125244140625, -1.563232421875, -1.479339599609375, -1.39544677734375, -1.311553955078125, -1.2276611328125, -1.143768310546875, -1.05987548828125, -0.975982666015625, -0.89208984375, -0.808197021484375, -0.72430419921875, -0.640411376953125, -0.5565185546875, -0.472625732421875, -0.38873291015625, -0.304840087890625, -0.220947265625, -0.137054443359375, -0.05316162109375, 0.030731201171875, 0.1146240234375, 0.198516845703125, 0.28240966796875, 0.366302490234375, 0.4501953125, 0.534088134765625, 0.61798095703125, 0.701873779296875, 0.7857666015625, 0.869659423828125, 0.95355224609375, 1.037445068359375, 1.121337890625, 1.205230712890625, 1.28912353515625, 1.373016357421875, 1.4569091796875, 1.540802001953125, 1.62469482421875, 1.708587646484375, 1.79248046875, 1.876373291015625, 1.96026611328125, 2.044158935546875, 2.1280517578125, 2.211944580078125, 2.29583740234375, 2.379730224609375, 2.463623046875, 2.547515869140625, 2.63140869140625, 2.715301513671875, 2.7991943359375, 2.883087158203125, 2.96697998046875, 3.050872802734375, 3.134765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 5.0, 12.0, 4.0, 7.0, 19.0, 17.0, 28.0, 31.0, 45.0, 39.0, 52.0, 52.0, 56.0, 74.0, 184.0, 1578.0, 280.0, 105.0, 56.0, 52.0, 47.0, 45.0, 29.0, 48.0, 30.0, 22.0, 19.0, 16.0, 21.0, 11.0, 6.0, 16.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.9296875, -12.5455322265625, -12.161376953125, -11.7772216796875, -11.39306640625, -11.0089111328125, -10.624755859375, -10.2406005859375, -9.8564453125, -9.4722900390625, -9.088134765625, -8.7039794921875, -8.31982421875, -7.9356689453125, -7.551513671875, -7.1673583984375, -6.783203125, -6.3990478515625, -6.014892578125, -5.6307373046875, -5.24658203125, -4.8624267578125, -4.478271484375, -4.0941162109375, -3.7099609375, -3.3258056640625, -2.941650390625, -2.5574951171875, -2.17333984375, -1.7891845703125, -1.405029296875, -1.0208740234375, -0.63671875, -0.2525634765625, 0.131591796875, 0.5157470703125, 0.89990234375, 1.2840576171875, 1.668212890625, 2.0523681640625, 2.4365234375, 2.8206787109375, 3.204833984375, 3.5889892578125, 3.97314453125, 4.3572998046875, 4.741455078125, 5.1256103515625, 5.509765625, 5.8939208984375, 6.278076171875, 6.6622314453125, 7.04638671875, 7.4305419921875, 7.814697265625, 8.1988525390625, 8.5830078125, 8.9671630859375, 9.351318359375, 9.7354736328125, 10.11962890625, 10.5037841796875, 10.887939453125, 11.2720947265625, 11.65625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 14.0, 18.0, 27.0, 52.0, 64.0, 93.0, 156.0, 327.0, 758.0, 19809.0, 3120747.0, 2531.0, 491.0, 230.0, 117.0, 71.0, 55.0, 37.0, 28.0, 17.0, 12.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.03125, -61.34228515625, -59.6533203125, -57.96435546875, -56.275390625, -54.58642578125, -52.8974609375, -51.20849609375, -49.51953125, -47.83056640625, -46.1416015625, -44.45263671875, -42.763671875, -41.07470703125, -39.3857421875, -37.69677734375, -36.0078125, -34.31884765625, -32.6298828125, -30.94091796875, -29.251953125, -27.56298828125, -25.8740234375, -24.18505859375, -22.49609375, -20.80712890625, -19.1181640625, -17.42919921875, -15.740234375, -14.05126953125, -12.3623046875, -10.67333984375, -8.984375, -7.29541015625, -5.6064453125, -3.91748046875, -2.228515625, -0.53955078125, 1.1494140625, 2.83837890625, 4.52734375, 6.21630859375, 7.9052734375, 9.59423828125, 11.283203125, 12.97216796875, 14.6611328125, 16.35009765625, 18.0390625, 19.72802734375, 21.4169921875, 23.10595703125, 24.794921875, 26.48388671875, 28.1728515625, 29.86181640625, 31.55078125, 33.23974609375, 34.9287109375, 36.61767578125, 38.306640625, 39.99560546875, 41.6845703125, 43.37353515625, 45.0625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [725.0, 293.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.27552604675293, 0.7519025802612305, 10.77933120727539, 20.806760787963867, 30.83418846130371, 40.86161804199219, 50.88904571533203, 60.916473388671875, 70.94390106201172, 80.97132873535156, 90.9987564086914, 101.02618408203125, 111.05361938476562, 121.08103942871094, 131.1084747314453, 141.13589477539062, 151.163330078125, 161.19076538085938, 171.2181854248047, 181.24562072753906, 191.27304077148438, 201.30047607421875, 211.32791137695312, 221.35533142089844, 231.3827667236328, 241.4102020263672, 251.4376220703125, 261.4650573730469, 271.49249267578125, 281.5198974609375, 291.5473327636719, 301.57476806640625, 311.6022033691406, 321.629638671875, 331.6570739746094, 341.6844787597656, 351.7119140625, 361.7393493652344, 371.76678466796875, 381.794189453125, 391.8216247558594, 401.84906005859375, 411.8764953613281, 421.9039001464844, 431.93133544921875, 441.9587707519531, 451.9862060546875, 462.01361083984375, 472.04107666015625, 482.0685119628906, 492.095947265625, 502.12335205078125, 512.1508178710938, 522.17822265625, 532.2056274414062, 542.2330932617188, 552.260498046875, 562.2879028320312, 572.3153686523438, 582.3427734375, 592.3702392578125, 602.3976440429688, 612.425048828125, 622.4525146484375, 632.4799194335938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 6.0, 15.0, 9.0, 16.0, 15.0, 23.0, 23.0, 32.0, 26.0, 33.0, 37.0, 39.0, 42.0, 49.0, 42.0, 33.0, 30.0, 53.0, 32.0, 39.0, 39.0, 39.0, 43.0, 27.0, 30.0, 23.0, 33.0, 26.0, 17.0, 14.0, 16.0, 12.0, 9.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-38.100563049316406, -37.094482421875, -36.088401794433594, -35.08232116699219, -34.07624053955078, -33.070159912109375, -32.06407928466797, -31.05799674987793, -30.05191421508789, -29.045833587646484, -28.039752960205078, -27.033672332763672, -26.027589797973633, -25.021509170532227, -24.01542854309082, -23.009347915649414, -22.003267288208008, -20.9971866607666, -19.991106033325195, -18.985023498535156, -17.97894287109375, -16.972862243652344, -15.966781616210938, -14.960700988769531, -13.954619407653809, -12.948538780212402, -11.94245719909668, -10.936376571655273, -9.930295944213867, -8.924214363098145, -7.918133735656738, -6.912052631378174, -5.905971527099609, -4.899890422821045, -3.8938095569610596, -2.887728691101074, -1.8816475868225098, -0.8755664825439453, 0.13051414489746094, 1.1365952491760254, 2.14267635345459, 3.1487574577331543, 4.154838562011719, 5.160919189453125, 6.1670002937316895, 7.173081398010254, 8.17916202545166, 9.185243606567383, 10.191324234008789, 11.197404861450195, 12.203486442565918, 13.209567070007324, 14.215648651123047, 15.221729278564453, 16.22780990600586, 17.233890533447266, 18.239971160888672, 19.246051788330078, 20.252132415771484, 21.25821304321289, 22.26429557800293, 23.270376205444336, 24.276456832885742, 25.28253746032715, 26.288619995117188]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 3.0, 18.0, 10.0, 13.0, 11.0, 14.0, 19.0, 23.0, 24.0, 28.0, 35.0, 43.0, 48.0, 50.0, 46.0, 46.0, 36.0, 47.0, 41.0, 44.0, 44.0, 41.0, 37.0, 39.0, 29.0, 27.0, 25.0, 29.0, 26.0, 23.0, 16.0, 15.0, 13.0, 12.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0, -3.892120361328125, -3.78424072265625, -3.676361083984375, -3.5684814453125, -3.460601806640625, -3.35272216796875, -3.244842529296875, -3.136962890625, -3.029083251953125, -2.92120361328125, -2.813323974609375, -2.7054443359375, -2.597564697265625, -2.48968505859375, -2.381805419921875, -2.27392578125, -2.166046142578125, -2.05816650390625, -1.950286865234375, -1.8424072265625, -1.734527587890625, -1.62664794921875, -1.518768310546875, -1.410888671875, -1.303009033203125, -1.19512939453125, -1.087249755859375, -0.9793701171875, -0.871490478515625, -0.76361083984375, -0.655731201171875, -0.5478515625, -0.439971923828125, -0.33209228515625, -0.224212646484375, -0.1163330078125, -0.008453369140625, 0.09942626953125, 0.207305908203125, 0.315185546875, 0.423065185546875, 0.53094482421875, 0.638824462890625, 0.7467041015625, 0.854583740234375, 0.96246337890625, 1.070343017578125, 1.17822265625, 1.286102294921875, 1.39398193359375, 1.501861572265625, 1.6097412109375, 1.717620849609375, 1.82550048828125, 1.933380126953125, 2.041259765625, 2.149139404296875, 2.25701904296875, 2.364898681640625, 2.4727783203125, 2.580657958984375, 2.68853759765625, 2.796417236328125, 2.904296875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 10.0, 12.0, 9.0, 9.0, 15.0, 12.0, 18.0, 28.0, 26.0, 48.0, 56.0, 93.0, 164.0, 271.0, 424.0, 868.0, 2014.0, 6708.0, 29587.0, 165876.0, 919522.0, 1908192.0, 932550.0, 185288.0, 31737.0, 6888.0, 1962.0, 771.0, 402.0, 242.0, 128.0, 98.0, 61.0, 33.0, 31.0, 28.0, 19.0, 16.0, 13.0, 18.0, 4.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0], "bins": [-5.8203125, -5.6651611328125, -5.510009765625, -5.3548583984375, -5.19970703125, -5.0445556640625, -4.889404296875, -4.7342529296875, -4.5791015625, -4.4239501953125, -4.268798828125, -4.1136474609375, -3.95849609375, -3.8033447265625, -3.648193359375, -3.4930419921875, -3.337890625, -3.1827392578125, -3.027587890625, -2.8724365234375, -2.71728515625, -2.5621337890625, -2.406982421875, -2.2518310546875, -2.0966796875, -1.9415283203125, -1.786376953125, -1.6312255859375, -1.47607421875, -1.3209228515625, -1.165771484375, -1.0106201171875, -0.85546875, -0.7003173828125, -0.545166015625, -0.3900146484375, -0.23486328125, -0.0797119140625, 0.075439453125, 0.2305908203125, 0.3857421875, 0.5408935546875, 0.696044921875, 0.8511962890625, 1.00634765625, 1.1614990234375, 1.316650390625, 1.4718017578125, 1.626953125, 1.7821044921875, 1.937255859375, 2.0924072265625, 2.24755859375, 2.4027099609375, 2.557861328125, 2.7130126953125, 2.8681640625, 3.0233154296875, 3.178466796875, 3.3336181640625, 3.48876953125, 3.6439208984375, 3.799072265625, 3.9542236328125, 4.109375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 9.0, 19.0, 40.0, 56.0, 91.0, 124.0, 218.0, 313.0, 504.0, 637.0, 647.0, 485.0, 337.0, 228.0, 127.0, 97.0, 64.0, 34.0, 24.0, 10.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.002197265625, -7.66845703125, -7.334716796875, -7.0009765625, -6.667236328125, -6.33349609375, -5.999755859375, -5.666015625, -5.332275390625, -4.99853515625, -4.664794921875, -4.3310546875, -3.997314453125, -3.66357421875, -3.329833984375, -2.99609375, -2.662353515625, -2.32861328125, -1.994873046875, -1.6611328125, -1.327392578125, -0.99365234375, -0.659912109375, -0.326171875, 0.007568359375, 0.34130859375, 0.675048828125, 1.0087890625, 1.342529296875, 1.67626953125, 2.010009765625, 2.34375, 2.677490234375, 3.01123046875, 3.344970703125, 3.6787109375, 4.012451171875, 4.34619140625, 4.679931640625, 5.013671875, 5.347412109375, 5.68115234375, 6.014892578125, 6.3486328125, 6.682373046875, 7.01611328125, 7.349853515625, 7.68359375, 8.017333984375, 8.35107421875, 8.684814453125, 9.0185546875, 9.352294921875, 9.68603515625, 10.019775390625, 10.353515625, 10.687255859375, 11.02099609375, 11.354736328125, 11.6884765625, 12.022216796875, 12.35595703125, 12.689697265625, 13.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 10.0, 13.0, 28.0, 25.0, 45.0, 50.0, 70.0, 115.0, 166.0, 245.0, 350.0, 689.0, 2849.0, 89844.0, 3610989.0, 478946.0, 7464.0, 1033.0, 481.0, 287.0, 165.0, 123.0, 88.0, 59.0, 49.0, 28.0, 21.0, 9.0, 9.0, 7.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-25.046875, -24.4156494140625, -23.784423828125, -23.1531982421875, -22.52197265625, -21.8907470703125, -21.259521484375, -20.6282958984375, -19.9970703125, -19.3658447265625, -18.734619140625, -18.1033935546875, -17.47216796875, -16.8409423828125, -16.209716796875, -15.5784912109375, -14.947265625, -14.3160400390625, -13.684814453125, -13.0535888671875, -12.42236328125, -11.7911376953125, -11.159912109375, -10.5286865234375, -9.8974609375, -9.2662353515625, -8.635009765625, -8.0037841796875, -7.37255859375, -6.7413330078125, -6.110107421875, -5.4788818359375, -4.84765625, -4.2164306640625, -3.585205078125, -2.9539794921875, -2.32275390625, -1.6915283203125, -1.060302734375, -0.4290771484375, 0.2021484375, 0.8333740234375, 1.464599609375, 2.0958251953125, 2.72705078125, 3.3582763671875, 3.989501953125, 4.6207275390625, 5.251953125, 5.8831787109375, 6.514404296875, 7.1456298828125, 7.77685546875, 8.4080810546875, 9.039306640625, 9.6705322265625, 10.3017578125, 10.9329833984375, 11.564208984375, 12.1954345703125, 12.82666015625, 13.4578857421875, 14.089111328125, 14.7203369140625, 15.3515625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 66.0, 197.0, 318.0, 278.0, 108.0, 33.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.41168975830078, -69.58451080322266, -66.75733184814453, -63.93014907836914, -61.102970123291016, -58.275787353515625, -55.4486083984375, -52.621429443359375, -49.79425048828125, -46.967071533203125, -44.139888763427734, -41.31270980834961, -38.485530853271484, -35.658348083496094, -32.83116912841797, -30.003990173339844, -27.176807403564453, -24.349626541137695, -21.52244758605957, -18.695266723632812, -15.868086814880371, -13.04090690612793, -10.213726043701172, -7.386547088623047, -4.559366226196289, -1.7321860790252686, 1.094994068145752, 3.9221744537353516, 6.749354362487793, 9.576534271240234, 12.403715133666992, 15.230894088745117, 18.058074951171875, 20.885255813598633, 23.712434768676758, 26.539615631103516, 29.36679458618164, 32.19397735595703, 35.021156311035156, 37.84833526611328, 40.675514221191406, 43.50269317626953, 46.32987594604492, 49.15705490112305, 51.98423385620117, 54.81141662597656, 57.63859558105469, 60.46577453613281, 63.2929573059082, 66.1201400756836, 68.94731903076172, 71.77449798583984, 74.60167694091797, 77.4288558959961, 80.25604248046875, 83.08322143554688, 85.910400390625, 88.73757934570312, 91.56475830078125, 94.39193725585938, 97.21912384033203, 100.04630279541016, 102.87348175048828, 105.7006607055664, 108.52783966064453]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 4.0, 8.0, 17.0, 21.0, 11.0, 18.0, 19.0, 30.0, 26.0, 23.0, 21.0, 34.0, 27.0, 32.0, 36.0, 42.0, 31.0, 34.0, 36.0, 39.0, 38.0, 50.0, 48.0, 30.0, 24.0, 24.0, 33.0, 16.0, 26.0, 21.0, 28.0, 26.0, 16.0, 10.0, 14.0, 12.0, 5.0, 9.0, 13.0, 7.0, 1.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0], "bins": [-22.092737197875977, -21.41645622253418, -20.74017333984375, -20.063892364501953, -19.387609481811523, -18.711328506469727, -18.035045623779297, -17.3587646484375, -16.682483673095703, -16.006202697753906, -15.329919815063477, -14.65363883972168, -13.97735595703125, -13.301074981689453, -12.62479305267334, -11.948511123657227, -11.272228240966797, -10.595946311950684, -9.91966438293457, -9.243383407592773, -8.567100524902344, -7.890819072723389, -7.214537620544434, -6.53825569152832, -5.861973762512207, -5.185691833496094, -4.5094099044799805, -3.8331284523010254, -3.156846523284912, -2.480564594268799, -1.8042831420898438, -1.1280012130737305, -0.4517173767089844, 0.22456443309783936, 0.9008462429046631, 1.5771279335021973, 2.2534098625183105, 2.929691791534424, 3.605973243713379, 4.282255172729492, 4.9585371017456055, 5.634819030761719, 6.311100959777832, 6.987382411956787, 7.6636643409729, 8.339946746826172, 9.016227722167969, 9.692509651184082, 10.368791580200195, 11.045073509216309, 11.721355438232422, 12.397636413574219, 13.073919296264648, 13.750200271606445, 14.426482200622559, 15.102764129638672, 15.779046058654785, 16.4553279876709, 17.131608963012695, 17.807891845703125, 18.484172821044922, 19.16045570373535, 19.83673667907715, 20.513019561767578, 21.189300537109375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 14.0, 21.0, 15.0, 27.0, 24.0, 34.0, 22.0, 33.0, 39.0, 45.0, 39.0, 47.0, 50.0, 48.0, 50.0, 41.0, 31.0, 61.0, 37.0, 36.0, 35.0, 28.0, 24.0, 35.0, 26.0, 20.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.00390625, -3.896942138671875, -3.78997802734375, -3.683013916015625, -3.5760498046875, -3.469085693359375, -3.36212158203125, -3.255157470703125, -3.148193359375, -3.041229248046875, -2.93426513671875, -2.827301025390625, -2.7203369140625, -2.613372802734375, -2.50640869140625, -2.399444580078125, -2.29248046875, -2.185516357421875, -2.07855224609375, -1.971588134765625, -1.8646240234375, -1.757659912109375, -1.65069580078125, -1.543731689453125, -1.436767578125, -1.329803466796875, -1.22283935546875, -1.115875244140625, -1.0089111328125, -0.901947021484375, -0.79498291015625, -0.688018798828125, -0.5810546875, -0.474090576171875, -0.36712646484375, -0.260162353515625, -0.1531982421875, -0.046234130859375, 0.06072998046875, 0.167694091796875, 0.274658203125, 0.381622314453125, 0.48858642578125, 0.595550537109375, 0.7025146484375, 0.809478759765625, 0.91644287109375, 1.023406982421875, 1.13037109375, 1.237335205078125, 1.34429931640625, 1.451263427734375, 1.5582275390625, 1.665191650390625, 1.77215576171875, 1.879119873046875, 1.986083984375, 2.093048095703125, 2.20001220703125, 2.306976318359375, 2.4139404296875, 2.520904541015625, 2.62786865234375, 2.734832763671875, 2.841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 23.0, 32.0, 30.0, 42.0, 91.0, 123.0, 165.0, 240.0, 348.0, 542.0, 793.0, 1244.0, 1866.0, 2963.0, 4587.0, 7052.0, 10931.0, 17860.0, 28486.0, 47724.0, 86013.0, 174728.0, 314658.0, 153931.0, 77851.0, 44371.0, 26491.0, 16290.0, 10296.0, 6503.0, 4280.0, 2723.0, 1759.0, 1137.0, 810.0, 538.0, 332.0, 238.0, 154.0, 95.0, 64.0, 49.0, 31.0, 21.0, 8.0, 5.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5859375, -0.5684051513671875, -0.550872802734375, -0.5333404541015625, -0.51580810546875, -0.4982757568359375, -0.480743408203125, -0.4632110595703125, -0.4456787109375, -0.4281463623046875, -0.410614013671875, -0.3930816650390625, -0.37554931640625, -0.3580169677734375, -0.340484619140625, -0.3229522705078125, -0.305419921875, -0.2878875732421875, -0.270355224609375, -0.2528228759765625, -0.23529052734375, -0.2177581787109375, -0.200225830078125, -0.1826934814453125, -0.1651611328125, -0.1476287841796875, -0.130096435546875, -0.1125640869140625, -0.09503173828125, -0.0774993896484375, -0.059967041015625, -0.0424346923828125, -0.02490234375, -0.0073699951171875, 0.010162353515625, 0.0276947021484375, 0.04522705078125, 0.0627593994140625, 0.080291748046875, 0.0978240966796875, 0.1153564453125, 0.1328887939453125, 0.150421142578125, 0.1679534912109375, 0.18548583984375, 0.2030181884765625, 0.220550537109375, 0.2380828857421875, 0.255615234375, 0.2731475830078125, 0.290679931640625, 0.3082122802734375, 0.32574462890625, 0.3432769775390625, 0.360809326171875, 0.3783416748046875, 0.3958740234375, 0.4134063720703125, 0.430938720703125, 0.4484710693359375, 0.46600341796875, 0.4835357666015625, 0.501068115234375, 0.5186004638671875, 0.5361328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 12.0, 6.0, 9.0, 10.0, 9.0, 13.0, 9.0, 14.0, 26.0, 26.0, 15.0, 29.0, 25.0, 36.0, 24.0, 37.0, 42.0, 42.0, 40.0, 1057.0, 46.0, 42.0, 40.0, 34.0, 34.0, 41.0, 46.0, 38.0, 21.0, 34.0, 25.0, 22.0, 26.0, 14.0, 12.0, 12.0, 10.0, 6.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0078125, -1.946502685546875, -1.88519287109375, -1.823883056640625, -1.7625732421875, -1.701263427734375, -1.63995361328125, -1.578643798828125, -1.517333984375, -1.456024169921875, -1.39471435546875, -1.333404541015625, -1.2720947265625, -1.210784912109375, -1.14947509765625, -1.088165283203125, -1.02685546875, -0.965545654296875, -0.90423583984375, -0.842926025390625, -0.7816162109375, -0.720306396484375, -0.65899658203125, -0.597686767578125, -0.536376953125, -0.475067138671875, -0.41375732421875, -0.352447509765625, -0.2911376953125, -0.229827880859375, -0.16851806640625, -0.107208251953125, -0.0458984375, 0.015411376953125, 0.07672119140625, 0.138031005859375, 0.1993408203125, 0.260650634765625, 0.32196044921875, 0.383270263671875, 0.444580078125, 0.505889892578125, 0.56719970703125, 0.628509521484375, 0.6898193359375, 0.751129150390625, 0.81243896484375, 0.873748779296875, 0.93505859375, 0.996368408203125, 1.05767822265625, 1.118988037109375, 1.1802978515625, 1.241607666015625, 1.30291748046875, 1.364227294921875, 1.425537109375, 1.486846923828125, 1.54815673828125, 1.609466552734375, 1.6707763671875, 1.732086181640625, 1.79339599609375, 1.854705810546875, 1.916015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 7.0, 14.0, 12.0, 20.0, 23.0, 43.0, 60.0, 91.0, 136.0, 186.0, 264.0, 366.0, 512.0, 684.0, 991.0, 1339.0, 1912.0, 2622.0, 3713.0, 5144.0, 7206.0, 10272.0, 14764.0, 21578.0, 31931.0, 48479.0, 78792.0, 141772.0, 1304729.0, 165472.0, 88323.0, 53985.0, 34884.0, 23131.0, 15901.0, 10951.0, 7489.0, 5463.0, 3944.0, 2739.0, 1970.0, 1441.0, 1039.0, 788.0, 541.0, 418.0, 283.0, 204.0, 152.0, 98.0, 83.0, 51.0, 54.0, 31.0, 23.0, 7.0, 7.0, 9.0, 2.0, 0.0, 1.0], "bins": [-0.42041015625, -0.40711212158203125, -0.3938140869140625, -0.38051605224609375, -0.367218017578125, -0.35391998291015625, -0.3406219482421875, -0.32732391357421875, -0.31402587890625, -0.30072784423828125, -0.2874298095703125, -0.27413177490234375, -0.260833740234375, -0.24753570556640625, -0.2342376708984375, -0.22093963623046875, -0.2076416015625, -0.19434356689453125, -0.1810455322265625, -0.16774749755859375, -0.154449462890625, -0.14115142822265625, -0.1278533935546875, -0.11455535888671875, -0.10125732421875, -0.08795928955078125, -0.0746612548828125, -0.06136322021484375, -0.048065185546875, -0.03476715087890625, -0.0214691162109375, -0.00817108154296875, 0.005126953125, 0.01842498779296875, 0.0317230224609375, 0.04502105712890625, 0.058319091796875, 0.07161712646484375, 0.0849151611328125, 0.09821319580078125, 0.11151123046875, 0.12480926513671875, 0.1381072998046875, 0.15140533447265625, 0.164703369140625, 0.17800140380859375, 0.1912994384765625, 0.20459747314453125, 0.2178955078125, 0.23119354248046875, 0.2444915771484375, 0.25778961181640625, 0.271087646484375, 0.28438568115234375, 0.2976837158203125, 0.31098175048828125, 0.32427978515625, 0.33757781982421875, 0.3508758544921875, 0.36417388916015625, 0.377471923828125, 0.39076995849609375, 0.4040679931640625, 0.41736602783203125, 0.4306640625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 8.0, 3.0, 9.0, 4.0, 10.0, 11.0, 10.0, 20.0, 14.0, 23.0, 29.0, 37.0, 44.0, 45.0, 40.0, 53.0, 59.0, 54.0, 66.0, 59.0, 60.0, 48.0, 49.0, 40.0, 30.0, 31.0, 15.0, 19.0, 18.0, 27.0, 5.0, 11.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620189666748047e-05, -9.30512323975563e-05, -8.990056812763214e-05, -8.674990385770798e-05, -8.359923958778381e-05, -8.044857531785965e-05, -7.729791104793549e-05, -7.414724677801132e-05, -7.099658250808716e-05, -6.7845918238163e-05, -6.469525396823883e-05, -6.154458969831467e-05, -5.83939254283905e-05, -5.524326115846634e-05, -5.2092596888542175e-05, -4.894193261861801e-05, -4.579126834869385e-05, -4.2640604078769684e-05, -3.948993980884552e-05, -3.6339275538921356e-05, -3.318861126899719e-05, -3.003794699907303e-05, -2.6887282729148865e-05, -2.37366184592247e-05, -2.0585954189300537e-05, -1.7435289919376373e-05, -1.428462564945221e-05, -1.1133961379528046e-05, -7.983297109603882e-06, -4.832632839679718e-06, -1.6819685697555542e-06, 1.4686957001686096e-06, 4.6193599700927734e-06, 7.770024240016937e-06, 1.0920688509941101e-05, 1.4071352779865265e-05, 1.722201704978943e-05, 2.0372681319713593e-05, 2.3523345589637756e-05, 2.667400985956192e-05, 2.9824674129486084e-05, 3.297533839941025e-05, 3.612600266933441e-05, 3.9276666939258575e-05, 4.242733120918274e-05, 4.55779954791069e-05, 4.872865974903107e-05, 5.187932401895523e-05, 5.5029988288879395e-05, 5.818065255880356e-05, 6.133131682872772e-05, 6.448198109865189e-05, 6.763264536857605e-05, 7.078330963850021e-05, 7.393397390842438e-05, 7.708463817834854e-05, 8.02353024482727e-05, 8.338596671819687e-05, 8.653663098812103e-05, 8.96872952580452e-05, 9.283795952796936e-05, 9.598862379789352e-05, 9.913928806781769e-05, 0.00010228995233774185, 0.00010544061660766602]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 11.0, 3.0, 10.0, 16.0, 19.0, 14.0, 25.0, 49.0, 41.0, 64.0, 107.0, 148.0, 267.0, 469.0, 1124.0, 61887.0, 977988.0, 4480.0, 708.0, 382.0, 230.0, 134.0, 106.0, 56.0, 43.0, 33.0, 29.0, 19.0, 10.0, 17.0, 14.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002185821533203125, -0.0021201670169830322, -0.0020545125007629395, -0.0019888579845428467, -0.001923203468322754, -0.0018575489521026611, -0.0017918944358825684, -0.0017262399196624756, -0.0016605854034423828, -0.00159493088722229, -0.0015292763710021973, -0.0014636218547821045, -0.0013979673385620117, -0.001332312822341919, -0.0012666583061218262, -0.0012010037899017334, -0.0011353492736816406, -0.0010696947574615479, -0.001004040241241455, -0.0009383857250213623, -0.0008727312088012695, -0.0008070766925811768, -0.000741422176361084, -0.0006757676601409912, -0.0006101131439208984, -0.0005444586277008057, -0.0004788041114807129, -0.0004131495952606201, -0.00034749507904052734, -0.00028184056282043457, -0.0002161860466003418, -0.00015053153038024902, -8.487701416015625e-05, -1.9222497940063477e-05, 4.64320182800293e-05, 0.00011208653450012207, 0.00017774105072021484, 0.00024339556694030762, 0.0003090500831604004, 0.00037470459938049316, 0.00044035911560058594, 0.0005060136318206787, 0.0005716681480407715, 0.0006373226642608643, 0.000702977180480957, 0.0007686316967010498, 0.0008342862129211426, 0.0008999407291412354, 0.0009655952453613281, 0.001031249761581421, 0.0010969042778015137, 0.0011625587940216064, 0.0012282133102416992, 0.001293867826461792, 0.0013595223426818848, 0.0014251768589019775, 0.0014908313751220703, 0.001556485891342163, 0.0016221404075622559, 0.0016877949237823486, 0.0017534494400024414, 0.0018191039562225342, 0.001884758472442627, 0.0019504129886627197, 0.0020160675048828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 39.0, 96.0, 225.0, 269.0, 214.0, 111.0, 30.0, 10.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001448805705877021, -0.00013960935757495463, -0.00013433814456220716, -0.0001290669315494597, -0.00012379571853671223, -0.00011852450552396476, -0.00011325328523525968, -0.00010798207222251222, -0.00010271085920976475, -9.743964619701728e-05, -9.216843318426982e-05, -8.689721289556473e-05, -8.162599988281727e-05, -7.63547868700698e-05, -7.108357385732234e-05, -6.581236084457487e-05, -6.05411478318274e-05, -5.5269934819079936e-05, -4.999872180633247e-05, -4.4727505155606195e-05, -3.945629214285873e-05, -3.418507913011126e-05, -2.891386247938499e-05, -2.3642649466637522e-05, -1.8371436453890055e-05, -1.3100222531647887e-05, -7.829008609405719e-06, -2.5577937776688486e-06, 2.713419235078618e-06, 7.984632247826084e-06, 1.3255848898552358e-05, 1.8527061911299825e-05, 2.379828947596252e-05, 2.9069502488709986e-05, 3.434071550145745e-05, 3.9611932152183726e-05, 4.488314516493119e-05, 5.015435817767866e-05, 5.542557482840493e-05, 6.06967878411524e-05, 6.596800085389987e-05, 7.123921386664733e-05, 7.65104268793948e-05, 8.178164716809988e-05, 8.705286018084735e-05, 9.232407319359481e-05, 9.759528620634228e-05, 0.00010286649921908975, 0.00010813771223183721, 0.00011340892524458468, 0.00011868013825733215, 0.0001239513512700796, 0.00012922256428282708, 0.00013449377729557455, 0.00013976500486023724, 0.00014503620332106948, 0.00015030743088573217, 0.00015557864389847964, 0.0001608498569112271, 0.00016612106992397457, 0.00017139228293672204, 0.0001766634959494695, 0.00018193470896221697, 0.00018720593652687967, 0.0001924771349877119]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 30.0, 23.0, 26.0, 22.0, 28.0, 33.0, 38.0, 46.0, 39.0, 45.0, 48.0, 59.0, 40.0, 53.0, 44.0, 42.0, 50.0, 34.0, 29.0, 25.0, 30.0, 27.0, 20.0, 16.0, 14.0, 13.0, 8.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9664249420166016e-05, -5.783233791589737e-05, -5.600042641162872e-05, -5.416851490736008e-05, -5.233660340309143e-05, -5.0504691898822784e-05, -4.867278039455414e-05, -4.684086889028549e-05, -4.5008957386016846e-05, -4.31770458817482e-05, -4.134513437747955e-05, -3.951322287321091e-05, -3.768131136894226e-05, -3.5849399864673615e-05, -3.401748836040497e-05, -3.218557685613632e-05, -3.0353665351867676e-05, -2.852175384759903e-05, -2.6689842343330383e-05, -2.4857930839061737e-05, -2.302601933479309e-05, -2.1194107830524445e-05, -1.93621963262558e-05, -1.7530284821987152e-05, -1.5698373317718506e-05, -1.386646181344986e-05, -1.2034550309181213e-05, -1.0202638804912567e-05, -8.370727300643921e-06, -6.538815796375275e-06, -4.706904292106628e-06, -2.874992787837982e-06, -1.043081283569336e-06, 7.888302206993103e-07, 2.6207417249679565e-06, 4.452653229236603e-06, 6.284564733505249e-06, 8.116476237773895e-06, 9.948387742042542e-06, 1.1780299246311188e-05, 1.3612210750579834e-05, 1.544412225484848e-05, 1.7276033759117126e-05, 1.9107945263385773e-05, 2.093985676765442e-05, 2.2771768271923065e-05, 2.460367977619171e-05, 2.6435591280460358e-05, 2.8267502784729004e-05, 3.009941428899765e-05, 3.1931325793266296e-05, 3.376323729753494e-05, 3.559514880180359e-05, 3.7427060306072235e-05, 3.925897181034088e-05, 4.109088331460953e-05, 4.2922794818878174e-05, 4.475470632314682e-05, 4.6586617827415466e-05, 4.841852933168411e-05, 5.025044083595276e-05, 5.2082352340221405e-05, 5.391426384449005e-05, 5.57461753487587e-05, 5.7578086853027344e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 14.0, 21.0, 15.0, 27.0, 24.0, 34.0, 22.0, 32.0, 40.0, 45.0, 39.0, 47.0, 50.0, 48.0, 50.0, 41.0, 31.0, 61.0, 37.0, 36.0, 35.0, 28.0, 24.0, 35.0, 26.0, 20.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.00390625, -3.896942138671875, -3.78997802734375, -3.683013916015625, -3.5760498046875, -3.469085693359375, -3.36212158203125, -3.255157470703125, -3.148193359375, -3.041229248046875, -2.93426513671875, -2.827301025390625, -2.7203369140625, -2.613372802734375, -2.50640869140625, -2.399444580078125, -2.29248046875, -2.185516357421875, -2.07855224609375, -1.971588134765625, -1.8646240234375, -1.757659912109375, -1.65069580078125, -1.543731689453125, -1.436767578125, -1.329803466796875, -1.22283935546875, -1.115875244140625, -1.0089111328125, -0.901947021484375, -0.79498291015625, -0.688018798828125, -0.5810546875, -0.474090576171875, -0.36712646484375, -0.260162353515625, -0.1531982421875, -0.046234130859375, 0.06072998046875, 0.167694091796875, 0.274658203125, 0.381622314453125, 0.48858642578125, 0.595550537109375, 0.7025146484375, 0.809478759765625, 0.91644287109375, 1.023406982421875, 1.13037109375, 1.237335205078125, 1.34429931640625, 1.451263427734375, 1.5582275390625, 1.665191650390625, 1.77215576171875, 1.879119873046875, 1.986083984375, 2.093048095703125, 2.20001220703125, 2.306976318359375, 2.4139404296875, 2.520904541015625, 2.62786865234375, 2.734832763671875, 2.841796875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 16.0, 18.0, 30.0, 45.0, 66.0, 89.0, 114.0, 157.0, 235.0, 346.0, 605.0, 949.0, 1706.0, 3073.0, 5700.0, 11007.0, 20918.0, 40590.0, 76829.0, 147774.0, 255466.0, 225896.0, 122654.0, 63646.0, 33139.0, 17450.0, 8958.0, 4799.0, 2557.0, 1406.0, 809.0, 511.0, 315.0, 214.0, 142.0, 104.0, 58.0, 50.0, 41.0, 13.0, 14.0, 16.0, 4.0, 9.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.520477294921875, -2.44134521484375, -2.362213134765625, -2.2830810546875, -2.203948974609375, -2.12481689453125, -2.045684814453125, -1.966552734375, -1.887420654296875, -1.80828857421875, -1.729156494140625, -1.6500244140625, -1.570892333984375, -1.49176025390625, -1.412628173828125, -1.33349609375, -1.254364013671875, -1.17523193359375, -1.096099853515625, -1.0169677734375, -0.937835693359375, -0.85870361328125, -0.779571533203125, -0.700439453125, -0.621307373046875, -0.54217529296875, -0.463043212890625, -0.3839111328125, -0.304779052734375, -0.22564697265625, -0.146514892578125, -0.0673828125, 0.011749267578125, 0.09088134765625, 0.170013427734375, 0.2491455078125, 0.328277587890625, 0.40740966796875, 0.486541748046875, 0.565673828125, 0.644805908203125, 0.72393798828125, 0.803070068359375, 0.8822021484375, 0.961334228515625, 1.04046630859375, 1.119598388671875, 1.19873046875, 1.277862548828125, 1.35699462890625, 1.436126708984375, 1.5152587890625, 1.594390869140625, 1.67352294921875, 1.752655029296875, 1.831787109375, 1.910919189453125, 1.99005126953125, 2.069183349609375, 2.1483154296875, 2.227447509765625, 2.30657958984375, 2.385711669921875, 2.46484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 13.0, 13.0, 21.0, 23.0, 33.0, 23.0, 51.0, 43.0, 53.0, 67.0, 104.0, 170.0, 1520.0, 345.0, 132.0, 71.0, 59.0, 57.0, 37.0, 36.0, 30.0, 35.0, 20.0, 16.0, 15.0, 11.0, 7.0, 9.0, 3.0, 10.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.484375, -18.9698486328125, -18.455322265625, -17.9407958984375, -17.42626953125, -16.9117431640625, -16.397216796875, -15.8826904296875, -15.3681640625, -14.8536376953125, -14.339111328125, -13.8245849609375, -13.31005859375, -12.7955322265625, -12.281005859375, -11.7664794921875, -11.251953125, -10.7374267578125, -10.222900390625, -9.7083740234375, -9.19384765625, -8.6793212890625, -8.164794921875, -7.6502685546875, -7.1357421875, -6.6212158203125, -6.106689453125, -5.5921630859375, -5.07763671875, -4.5631103515625, -4.048583984375, -3.5340576171875, -3.01953125, -2.5050048828125, -1.990478515625, -1.4759521484375, -0.96142578125, -0.4468994140625, 0.067626953125, 0.5821533203125, 1.0966796875, 1.6112060546875, 2.125732421875, 2.6402587890625, 3.15478515625, 3.6693115234375, 4.183837890625, 4.6983642578125, 5.212890625, 5.7274169921875, 6.241943359375, 6.7564697265625, 7.27099609375, 7.7855224609375, 8.300048828125, 8.8145751953125, 9.3291015625, 9.8436279296875, 10.358154296875, 10.8726806640625, 11.38720703125, 11.9017333984375, 12.416259765625, 12.9307861328125, 13.4453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 12.0, 16.0, 17.0, 19.0, 19.0, 39.0, 51.0, 74.0, 101.0, 135.0, 192.0, 303.0, 579.0, 2800.0, 2409730.0, 728039.0, 2071.0, 541.0, 316.0, 179.0, 101.0, 93.0, 72.0, 50.0, 39.0, 29.0, 15.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.78125, -38.49560546875, -37.2099609375, -35.92431640625, -34.638671875, -33.35302734375, -32.0673828125, -30.78173828125, -29.49609375, -28.21044921875, -26.9248046875, -25.63916015625, -24.353515625, -23.06787109375, -21.7822265625, -20.49658203125, -19.2109375, -17.92529296875, -16.6396484375, -15.35400390625, -14.068359375, -12.78271484375, -11.4970703125, -10.21142578125, -8.92578125, -7.64013671875, -6.3544921875, -5.06884765625, -3.783203125, -2.49755859375, -1.2119140625, 0.07373046875, 1.359375, 2.64501953125, 3.9306640625, 5.21630859375, 6.501953125, 7.78759765625, 9.0732421875, 10.35888671875, 11.64453125, 12.93017578125, 14.2158203125, 15.50146484375, 16.787109375, 18.07275390625, 19.3583984375, 20.64404296875, 21.9296875, 23.21533203125, 24.5009765625, 25.78662109375, 27.072265625, 28.35791015625, 29.6435546875, 30.92919921875, 32.21484375, 33.50048828125, 34.7861328125, 36.07177734375, 37.357421875, 38.64306640625, 39.9287109375, 41.21435546875, 42.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 12.0, 660.0, 344.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.052346229553223, -9.838336944580078, -4.62432861328125, 0.5896806716918945, 5.803689002990723, 11.01769733428955, 16.231708526611328, 21.445716857910156, 26.659725189208984, 31.873733520507812, 37.08774185180664, 42.30175018310547, 47.51576232910156, 52.729766845703125, 57.94377899169922, 63.15778732299805, 68.37179565429688, 73.58580780029297, 78.79981231689453, 84.01382446289062, 89.22782897949219, 94.44184112548828, 99.65585327148438, 104.86985778808594, 110.0838623046875, 115.2978744506836, 120.51187896728516, 125.72589111328125, 130.9398956298828, 136.15390014648438, 141.367919921875, 146.58192443847656, 151.7959442138672, 157.00994873046875, 162.22396850585938, 167.43797302246094, 172.6519775390625, 177.86598205566406, 183.0800018310547, 188.29400634765625, 193.5080108642578, 198.72201538085938, 203.93603515625, 209.15003967285156, 214.36404418945312, 219.5780487060547, 224.7920684814453, 230.00607299804688, 235.2200927734375, 240.43409729003906, 245.6481170654297, 250.86212158203125, 256.0761413574219, 261.2901306152344, 266.504150390625, 271.7181396484375, 276.9321594238281, 282.14617919921875, 287.36016845703125, 292.5741882324219, 297.7882080078125, 303.002197265625, 308.2162170410156, 313.43023681640625, 318.64422607421875]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 1.0, 9.0, 8.0, 4.0, 14.0, 12.0, 11.0, 22.0, 12.0, 20.0, 13.0, 20.0, 23.0, 33.0, 34.0, 33.0, 30.0, 31.0, 28.0, 38.0, 43.0, 28.0, 31.0, 42.0, 50.0, 33.0, 31.0, 39.0, 28.0, 34.0, 29.0, 23.0, 27.0, 19.0, 18.0, 17.0, 13.0, 10.0, 11.0, 21.0, 10.0, 6.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-26.892616271972656, -26.06068229675293, -25.228750228881836, -24.39681625366211, -23.564882278442383, -22.732948303222656, -21.901016235351562, -21.069082260131836, -20.23714828491211, -19.405214309692383, -18.57328224182129, -17.741348266601562, -16.909414291381836, -16.07748031616211, -15.245548248291016, -14.413614273071289, -13.581681251525879, -12.749748229980469, -11.917814254760742, -11.085881233215332, -10.253947257995605, -9.422014236450195, -8.590080261230469, -7.758147239685059, -6.92621374130249, -6.094280242919922, -5.2623467445373535, -4.430413246154785, -3.598479986190796, -2.7665467262268066, -1.9346132278442383, -1.10267972946167, -0.27074623107910156, 0.561187207698822, 1.3931206464767456, 2.2250540256500244, 3.0569875240325928, 3.888920783996582, 4.72085428237915, 5.552787780761719, 6.384721279144287, 7.2166547775268555, 8.048587799072266, 8.880521774291992, 9.712454795837402, 10.544387817382812, 11.376321792602539, 12.208255767822266, 13.040188789367676, 13.872121810913086, 14.704055786132812, 15.535988807678223, 16.367921829223633, 17.19985580444336, 18.031789779663086, 18.863723754882812, 19.695655822753906, 20.527589797973633, 21.359521865844727, 22.191455841064453, 23.02338981628418, 23.855323791503906, 24.687255859375, 25.519189834594727, 26.351123809814453]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 7.0, 11.0, 14.0, 16.0, 13.0, 20.0, 12.0, 30.0, 28.0, 35.0, 37.0, 39.0, 34.0, 46.0, 42.0, 41.0, 55.0, 50.0, 50.0, 39.0, 31.0, 37.0, 37.0, 38.0, 31.0, 24.0, 19.0, 28.0, 23.0, 11.0, 22.0, 18.0, 9.0, 11.0, 6.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.955078125, -3.84149169921875, -3.7279052734375, -3.61431884765625, -3.500732421875, -3.38714599609375, -3.2735595703125, -3.15997314453125, -3.04638671875, -2.93280029296875, -2.8192138671875, -2.70562744140625, -2.592041015625, -2.47845458984375, -2.3648681640625, -2.25128173828125, -2.1376953125, -2.02410888671875, -1.9105224609375, -1.79693603515625, -1.683349609375, -1.56976318359375, -1.4561767578125, -1.34259033203125, -1.22900390625, -1.11541748046875, -1.0018310546875, -0.88824462890625, -0.774658203125, -0.66107177734375, -0.5474853515625, -0.43389892578125, -0.3203125, -0.20672607421875, -0.0931396484375, 0.02044677734375, 0.134033203125, 0.24761962890625, 0.3612060546875, 0.47479248046875, 0.58837890625, 0.70196533203125, 0.8155517578125, 0.92913818359375, 1.042724609375, 1.15631103515625, 1.2698974609375, 1.38348388671875, 1.4970703125, 1.61065673828125, 1.7242431640625, 1.83782958984375, 1.951416015625, 2.06500244140625, 2.1785888671875, 2.29217529296875, 2.40576171875, 2.51934814453125, 2.6329345703125, 2.74652099609375, 2.860107421875, 2.97369384765625, 3.0872802734375, 3.20086669921875, 3.314453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 2.0, 5.0, 8.0, 11.0, 8.0, 17.0, 17.0, 14.0, 19.0, 16.0, 25.0, 30.0, 39.0, 53.0, 79.0, 167.0, 342.0, 1341.0, 11334.0, 493605.0, 3344308.0, 332975.0, 8046.0, 1031.0, 307.0, 123.0, 78.0, 38.0, 33.0, 27.0, 17.0, 27.0, 26.0, 20.0, 21.0, 14.0, 13.0, 14.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.255126953125, -11.87744140625, -11.499755859375, -11.1220703125, -10.744384765625, -10.36669921875, -9.989013671875, -9.611328125, -9.233642578125, -8.85595703125, -8.478271484375, -8.1005859375, -7.722900390625, -7.34521484375, -6.967529296875, -6.58984375, -6.212158203125, -5.83447265625, -5.456787109375, -5.0791015625, -4.701416015625, -4.32373046875, -3.946044921875, -3.568359375, -3.190673828125, -2.81298828125, -2.435302734375, -2.0576171875, -1.679931640625, -1.30224609375, -0.924560546875, -0.546875, -0.169189453125, 0.20849609375, 0.586181640625, 0.9638671875, 1.341552734375, 1.71923828125, 2.096923828125, 2.474609375, 2.852294921875, 3.22998046875, 3.607666015625, 3.9853515625, 4.363037109375, 4.74072265625, 5.118408203125, 5.49609375, 5.873779296875, 6.25146484375, 6.629150390625, 7.0068359375, 7.384521484375, 7.76220703125, 8.139892578125, 8.517578125, 8.895263671875, 9.27294921875, 9.650634765625, 10.0283203125, 10.406005859375, 10.78369140625, 11.161376953125, 11.5390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 18.0, 26.0, 25.0, 47.0, 57.0, 68.0, 116.0, 173.0, 236.0, 315.0, 384.0, 476.0, 467.0, 398.0, 356.0, 239.0, 189.0, 112.0, 92.0, 75.0, 50.0, 42.0, 31.0, 18.0, 10.0, 6.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84765625, -6.60382080078125, -6.3599853515625, -6.11614990234375, -5.872314453125, -5.62847900390625, -5.3846435546875, -5.14080810546875, -4.89697265625, -4.65313720703125, -4.4093017578125, -4.16546630859375, -3.921630859375, -3.67779541015625, -3.4339599609375, -3.19012451171875, -2.9462890625, -2.70245361328125, -2.4586181640625, -2.21478271484375, -1.970947265625, -1.72711181640625, -1.4832763671875, -1.23944091796875, -0.99560546875, -0.75177001953125, -0.5079345703125, -0.26409912109375, -0.020263671875, 0.22357177734375, 0.4674072265625, 0.71124267578125, 0.955078125, 1.19891357421875, 1.4427490234375, 1.68658447265625, 1.930419921875, 2.17425537109375, 2.4180908203125, 2.66192626953125, 2.90576171875, 3.14959716796875, 3.3934326171875, 3.63726806640625, 3.881103515625, 4.12493896484375, 4.3687744140625, 4.61260986328125, 4.8564453125, 5.10028076171875, 5.3441162109375, 5.58795166015625, 5.831787109375, 6.07562255859375, 6.3194580078125, 6.56329345703125, 6.80712890625, 7.05096435546875, 7.2947998046875, 7.53863525390625, 7.782470703125, 8.02630615234375, 8.2701416015625, 8.51397705078125, 8.7578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 10.0, 7.0, 11.0, 15.0, 21.0, 20.0, 33.0, 44.0, 63.0, 90.0, 97.0, 131.0, 155.0, 271.0, 441.0, 926.0, 6117.0, 230831.0, 3673553.0, 272325.0, 6704.0, 1010.0, 456.0, 253.0, 168.0, 136.0, 94.0, 67.0, 46.0, 43.0, 27.0, 31.0, 21.0, 16.0, 11.0, 7.0, 7.0, 9.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.484375, -18.903076171875, -18.32177734375, -17.740478515625, -17.1591796875, -16.577880859375, -15.99658203125, -15.415283203125, -14.833984375, -14.252685546875, -13.67138671875, -13.090087890625, -12.5087890625, -11.927490234375, -11.34619140625, -10.764892578125, -10.18359375, -9.602294921875, -9.02099609375, -8.439697265625, -7.8583984375, -7.277099609375, -6.69580078125, -6.114501953125, -5.533203125, -4.951904296875, -4.37060546875, -3.789306640625, -3.2080078125, -2.626708984375, -2.04541015625, -1.464111328125, -0.8828125, -0.301513671875, 0.27978515625, 0.861083984375, 1.4423828125, 2.023681640625, 2.60498046875, 3.186279296875, 3.767578125, 4.348876953125, 4.93017578125, 5.511474609375, 6.0927734375, 6.674072265625, 7.25537109375, 7.836669921875, 8.41796875, 8.999267578125, 9.58056640625, 10.161865234375, 10.7431640625, 11.324462890625, 11.90576171875, 12.487060546875, 13.068359375, 13.649658203125, 14.23095703125, 14.812255859375, 15.3935546875, 15.974853515625, 16.55615234375, 17.137451171875, 17.71875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 16.0, 66.0, 167.0, 278.0, 277.0, 141.0, 49.0, 12.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.045875549316406, -29.544979095458984, -27.04408073425293, -24.543182373046875, -22.042285919189453, -19.54138946533203, -17.040491104125977, -14.539592742919922, -12.0386962890625, -9.537798881530762, -7.036901473999023, -4.536004066467285, -2.035106658935547, 0.4657907485961914, 2.9666881561279297, 5.467586517333984, 7.968482971191406, 10.469380378723145, 12.970277786254883, 15.471175193786621, 17.97207260131836, 20.47296905517578, 22.973867416381836, 25.47476577758789, 27.975662231445312, 30.476558685302734, 32.977455139160156, 35.478355407714844, 37.979251861572266, 40.48014831542969, 42.981048583984375, 45.4819450378418, 47.98283386230469, 50.48373031616211, 52.98462677001953, 55.48552703857422, 57.98642349243164, 60.48731994628906, 62.98822021484375, 65.48912048339844, 67.9900131225586, 70.49091339111328, 72.99180603027344, 75.49270629882812, 77.99360656738281, 80.49449920654297, 82.99539947509766, 85.49629211425781, 87.9971923828125, 90.49809265136719, 92.99898529052734, 95.49988555908203, 98.00077819824219, 100.50167846679688, 103.00257873535156, 105.50347900390625, 108.0043716430664, 110.5052719116211, 113.00616455078125, 115.50706481933594, 118.00796508789062, 120.50885772705078, 123.00975799560547, 125.51065063476562, 128.0115509033203]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 2.0, 9.0, 14.0, 11.0, 11.0, 19.0, 13.0, 24.0, 20.0, 22.0, 30.0, 24.0, 35.0, 29.0, 41.0, 30.0, 30.0, 32.0, 45.0, 49.0, 43.0, 42.0, 40.0, 35.0, 31.0, 35.0, 18.0, 24.0, 33.0, 27.0, 31.0, 19.0, 23.0, 15.0, 17.0, 8.0, 19.0, 9.0, 12.0, 7.0, 3.0, 2.0, 9.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.791484832763672, -20.0788631439209, -19.366241455078125, -18.65361976623535, -17.940998077392578, -17.228376388549805, -16.51575469970703, -15.803133964538574, -15.0905122756958, -14.377890586853027, -13.665268898010254, -12.952648162841797, -12.240026473999023, -11.52740478515625, -10.814783096313477, -10.102161407470703, -9.38953971862793, -8.676918029785156, -7.964296340942383, -7.251675128936768, -6.539053440093994, -5.826431751251221, -5.1138105392456055, -4.401188850402832, -3.6885671615600586, -2.975945472717285, -2.263324022293091, -1.5507025718688965, -0.838080883026123, -0.1254591941833496, 0.5871620178222656, 1.299783706665039, 2.0124073028564453, 2.7250289916992188, 3.437650442123413, 4.150271892547607, 4.862893581390381, 5.575515270233154, 6.2881364822387695, 7.000758171081543, 7.713379859924316, 8.42600154876709, 9.138623237609863, 9.85124397277832, 10.563865661621094, 11.276487350463867, 11.98910903930664, 12.701730728149414, 13.414352416992188, 14.126974105834961, 14.839595794677734, 15.552217483520508, 16.26483917236328, 16.977460861206055, 17.690082550048828, 18.40270233154297, 19.115325927734375, 19.82794761657715, 20.540569305419922, 21.253190994262695, 21.96581268310547, 22.678434371948242, 23.391056060791016, 24.103675842285156, 24.81629753112793]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 12.0, 8.0, 19.0, 18.0, 23.0, 27.0, 22.0, 30.0, 34.0, 29.0, 38.0, 44.0, 49.0, 49.0, 33.0, 42.0, 53.0, 44.0, 50.0, 37.0, 44.0, 26.0, 37.0, 27.0, 24.0, 34.0, 20.0, 25.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.47906494140625, -3.3663330078125, -3.25360107421875, -3.140869140625, -3.02813720703125, -2.9154052734375, -2.80267333984375, -2.68994140625, -2.57720947265625, -2.4644775390625, -2.35174560546875, -2.239013671875, -2.12628173828125, -2.0135498046875, -1.90081787109375, -1.7880859375, -1.67535400390625, -1.5626220703125, -1.44989013671875, -1.337158203125, -1.22442626953125, -1.1116943359375, -0.99896240234375, -0.88623046875, -0.77349853515625, -0.6607666015625, -0.54803466796875, -0.435302734375, -0.32257080078125, -0.2098388671875, -0.09710693359375, 0.015625, 0.12835693359375, 0.2410888671875, 0.35382080078125, 0.466552734375, 0.57928466796875, 0.6920166015625, 0.80474853515625, 0.91748046875, 1.03021240234375, 1.1429443359375, 1.25567626953125, 1.368408203125, 1.48114013671875, 1.5938720703125, 1.70660400390625, 1.8193359375, 1.93206787109375, 2.0447998046875, 2.15753173828125, 2.270263671875, 2.38299560546875, 2.4957275390625, 2.60845947265625, 2.72119140625, 2.83392333984375, 2.9466552734375, 3.05938720703125, 3.172119140625, 3.28485107421875, 3.3975830078125, 3.51031494140625, 3.623046875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 2.0, 13.0, 18.0, 21.0, 37.0, 41.0, 68.0, 99.0, 155.0, 228.0, 328.0, 484.0, 685.0, 1046.0, 1520.0, 2301.0, 3405.0, 5078.0, 7474.0, 11643.0, 17644.0, 27880.0, 44875.0, 77510.0, 151498.0, 291996.0, 177524.0, 87259.0, 50113.0, 30731.0, 19319.0, 12444.0, 8348.0, 5438.0, 3704.0, 2450.0, 1670.0, 1156.0, 739.0, 512.0, 340.0, 240.0, 184.0, 112.0, 81.0, 41.0, 31.0, 20.0, 20.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56103515625, -0.5427017211914062, -0.5243682861328125, -0.5060348510742188, -0.487701416015625, -0.46936798095703125, -0.4510345458984375, -0.43270111083984375, -0.41436767578125, -0.39603424072265625, -0.3777008056640625, -0.35936737060546875, -0.341033935546875, -0.32270050048828125, -0.3043670654296875, -0.28603363037109375, -0.2677001953125, -0.24936676025390625, -0.2310333251953125, -0.21269989013671875, -0.194366455078125, -0.17603302001953125, -0.1576995849609375, -0.13936614990234375, -0.12103271484375, -0.10269927978515625, -0.0843658447265625, -0.06603240966796875, -0.047698974609375, -0.02936553955078125, -0.0110321044921875, 0.00730133056640625, 0.025634765625, 0.04396820068359375, 0.0623016357421875, 0.08063507080078125, 0.098968505859375, 0.11730194091796875, 0.1356353759765625, 0.15396881103515625, 0.17230224609375, 0.19063568115234375, 0.2089691162109375, 0.22730255126953125, 0.245635986328125, 0.26396942138671875, 0.2823028564453125, 0.30063629150390625, 0.3189697265625, 0.33730316162109375, 0.3556365966796875, 0.37397003173828125, 0.392303466796875, 0.41063690185546875, 0.4289703369140625, 0.44730377197265625, 0.46563720703125, 0.48397064208984375, 0.5023040771484375, 0.5206375122070312, 0.538970947265625, 0.5573043823242188, 0.5756378173828125, 0.5939712524414062, 0.6123046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 10.0, 7.0, 10.0, 14.0, 19.0, 16.0, 24.0, 22.0, 27.0, 33.0, 28.0, 31.0, 27.0, 34.0, 45.0, 37.0, 38.0, 35.0, 1071.0, 53.0, 35.0, 35.0, 32.0, 37.0, 40.0, 22.0, 44.0, 25.0, 27.0, 19.0, 22.0, 16.0, 24.0, 12.0, 8.0, 7.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.8905792236328125, -1.823150634765625, -1.7557220458984375, -1.68829345703125, -1.6208648681640625, -1.553436279296875, -1.4860076904296875, -1.4185791015625, -1.3511505126953125, -1.283721923828125, -1.2162933349609375, -1.14886474609375, -1.0814361572265625, -1.014007568359375, -0.9465789794921875, -0.879150390625, -0.8117218017578125, -0.744293212890625, -0.6768646240234375, -0.60943603515625, -0.5420074462890625, -0.474578857421875, -0.4071502685546875, -0.3397216796875, -0.2722930908203125, -0.204864501953125, -0.1374359130859375, -0.07000732421875, -0.0025787353515625, 0.064849853515625, 0.1322784423828125, 0.19970703125, 0.2671356201171875, 0.334564208984375, 0.4019927978515625, 0.46942138671875, 0.5368499755859375, 0.604278564453125, 0.6717071533203125, 0.7391357421875, 0.8065643310546875, 0.873992919921875, 0.9414215087890625, 1.00885009765625, 1.0762786865234375, 1.143707275390625, 1.2111358642578125, 1.278564453125, 1.3459930419921875, 1.413421630859375, 1.4808502197265625, 1.54827880859375, 1.6157073974609375, 1.683135986328125, 1.7505645751953125, 1.8179931640625, 1.8854217529296875, 1.952850341796875, 2.0202789306640625, 2.08770751953125, 2.1551361083984375, 2.222564697265625, 2.2899932861328125, 2.357421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 10.0, 8.0, 18.0, 19.0, 32.0, 36.0, 60.0, 88.0, 153.0, 208.0, 296.0, 439.0, 598.0, 921.0, 1348.0, 2080.0, 3006.0, 4395.0, 6460.0, 9573.0, 14339.0, 21239.0, 32352.0, 49679.0, 81903.0, 156438.0, 1326280.0, 156362.0, 81740.0, 49621.0, 32315.0, 21433.0, 14119.0, 9565.0, 6470.0, 4300.0, 2940.0, 1967.0, 1348.0, 966.0, 674.0, 418.0, 299.0, 206.0, 135.0, 95.0, 65.0, 47.0, 25.0, 22.0, 12.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.50537109375, -0.4898223876953125, -0.474273681640625, -0.4587249755859375, -0.44317626953125, -0.4276275634765625, -0.412078857421875, -0.3965301513671875, -0.3809814453125, -0.3654327392578125, -0.349884033203125, -0.3343353271484375, -0.31878662109375, -0.3032379150390625, -0.287689208984375, -0.2721405029296875, -0.256591796875, -0.2410430908203125, -0.225494384765625, -0.2099456787109375, -0.19439697265625, -0.1788482666015625, -0.163299560546875, -0.1477508544921875, -0.1322021484375, -0.1166534423828125, -0.101104736328125, -0.0855560302734375, -0.07000732421875, -0.0544586181640625, -0.038909912109375, -0.0233612060546875, -0.0078125, 0.0077362060546875, 0.023284912109375, 0.0388336181640625, 0.05438232421875, 0.0699310302734375, 0.085479736328125, 0.1010284423828125, 0.1165771484375, 0.1321258544921875, 0.147674560546875, 0.1632232666015625, 0.17877197265625, 0.1943206787109375, 0.209869384765625, 0.2254180908203125, 0.240966796875, 0.2565155029296875, 0.272064208984375, 0.2876129150390625, 0.30316162109375, 0.3187103271484375, 0.334259033203125, 0.3498077392578125, 0.3653564453125, 0.3809051513671875, 0.396453857421875, 0.4120025634765625, 0.42755126953125, 0.4430999755859375, 0.458648681640625, 0.4741973876953125, 0.48974609375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 11.0, 15.0, 21.0, 24.0, 31.0, 39.0, 60.0, 69.0, 75.0, 70.0, 88.0, 74.0, 86.0, 60.0, 55.0, 42.0, 29.0, 39.0, 17.0, 19.0, 14.0, 8.0, 6.0, 11.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001627206802368164, -0.0001574549823999405, -0.00015218928456306458, -0.00014692358672618866, -0.00014165788888931274, -0.00013639219105243683, -0.0001311264932155609, -0.000125860795378685, -0.00012059509754180908, -0.00011532939970493317, -0.00011006370186805725, -0.00010479800403118134, -9.953230619430542e-05, -9.42666083574295e-05, -8.900091052055359e-05, -8.373521268367767e-05, -7.846951484680176e-05, -7.320381700992584e-05, -6.793811917304993e-05, -6.267242133617401e-05, -5.7406723499298096e-05, -5.214102566242218e-05, -4.6875327825546265e-05, -4.160962998867035e-05, -3.6343932151794434e-05, -3.107823431491852e-05, -2.5812536478042603e-05, -2.0546838641166687e-05, -1.528114080429077e-05, -1.0015442967414856e-05, -4.7497451305389404e-06, 5.159527063369751e-07, 5.781650543212891e-06, 1.1047348380088806e-05, 1.631304621696472e-05, 2.1578744053840637e-05, 2.6844441890716553e-05, 3.211013972759247e-05, 3.7375837564468384e-05, 4.26415354013443e-05, 4.7907233238220215e-05, 5.317293107509613e-05, 5.8438628911972046e-05, 6.370432674884796e-05, 6.897002458572388e-05, 7.423572242259979e-05, 7.950142025947571e-05, 8.476711809635162e-05, 9.003281593322754e-05, 9.529851377010345e-05, 0.00010056421160697937, 0.00010582990944385529, 0.0001110956072807312, 0.00011636130511760712, 0.00012162700295448303, 0.00012689270079135895, 0.00013215839862823486, 0.00013742409646511078, 0.0001426897943019867, 0.0001479554921388626, 0.00015322118997573853, 0.00015848688781261444, 0.00016375258564949036, 0.00016901828348636627, 0.0001742839813232422]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 16.0, 22.0, 35.0, 50.0, 54.0, 89.0, 153.0, 262.0, 713.0, 7543.0, 1035717.0, 2586.0, 586.0, 268.0, 130.0, 88.0, 61.0, 43.0, 28.0, 34.0, 15.0, 8.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0037899017333984375, -0.0036764442920684814, -0.0035629868507385254, -0.0034495294094085693, -0.0033360719680786133, -0.0032226145267486572, -0.003109157085418701, -0.002995699644088745, -0.002882242202758789, -0.002768784761428833, -0.002655327320098877, -0.002541869878768921, -0.002428412437438965, -0.002314954996109009, -0.0022014975547790527, -0.0020880401134490967, -0.0019745826721191406, -0.0018611252307891846, -0.0017476677894592285, -0.0016342103481292725, -0.0015207529067993164, -0.0014072954654693604, -0.0012938380241394043, -0.0011803805828094482, -0.0010669231414794922, -0.0009534657001495361, -0.0008400082588195801, -0.000726550817489624, -0.000613093376159668, -0.0004996359348297119, -0.00038617849349975586, -0.0002727210521697998, -0.00015926361083984375, -4.5806169509887695e-05, 6.765127182006836e-05, 0.00018110871315002441, 0.00029456615447998047, 0.0004080235958099365, 0.0005214810371398926, 0.0006349384784698486, 0.0007483959197998047, 0.0008618533611297607, 0.0009753108024597168, 0.0010887682437896729, 0.001202225685119629, 0.001315683126449585, 0.001429140567779541, 0.001542598009109497, 0.0016560554504394531, 0.0017695128917694092, 0.0018829703330993652, 0.0019964277744293213, 0.0021098852157592773, 0.0022233426570892334, 0.0023368000984191895, 0.0024502575397491455, 0.0025637149810791016, 0.0026771724224090576, 0.0027906298637390137, 0.0029040873050689697, 0.0030175447463989258, 0.003131002187728882, 0.003244459629058838, 0.003357917070388794, 0.00347137451171875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 22.0, 99.0, 228.0, 302.0, 239.0, 99.0, 15.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.797560202656314e-05, -3.105178984696977e-05, -2.41279776673764e-05, -1.7204167306772433e-05, -1.0280355127179064e-05, -3.356544766575098e-06, 3.5672674130182713e-06, 1.049107959261164e-05, 1.741489177220501e-05, 2.433870395179838e-05, 3.126251613139175e-05, 3.818632831098512e-05, 4.511013685259968e-05, 5.203394903219305e-05, 5.895776121178642e-05, 6.588156975340098e-05, 7.280538557097316e-05, 7.972919411258772e-05, 8.66530099301599e-05, 9.357681847177446e-05, 0.00010050063428934664, 0.0001074244428309612, 0.00011434825137257576, 0.00012127206719014794, 0.0001281958830077201, 0.0001351196988252923, 0.00014204350009094924, 0.00014896731590852141, 0.0001558911317260936, 0.00016281494754366577, 0.00016973874880932271, 0.0001766625646268949, 0.00018358636589255184, 0.00019051018171012402, 0.00019743398297578096, 0.00020435779879335314, 0.00021128161461092532, 0.00021820541587658226, 0.00022512923169415444, 0.00023205304751172662, 0.0002389768633292988, 0.00024590067914687097, 0.0002528244804125279, 0.0002597483107820153, 0.00026667211204767227, 0.0002735959133133292, 0.0002805197436828166, 0.00028744354494847357, 0.0002943673462141305, 0.00030129114747978747, 0.0003082149778492749, 0.0003151387791149318, 0.00032206258038058877, 0.0003289864107500762, 0.0003359102120157331, 0.00034283404238522053, 0.0003497578436508775, 0.0003566816449165344, 0.00036360547528602183, 0.0003705292765516788, 0.0003774530778173357, 0.00038437690818682313, 0.0003913007094524801, 0.000398224510718137, 0.00040514834108762443]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 8.0, 7.0, 7.0, 12.0, 7.0, 16.0, 10.0, 6.0, 13.0, 15.0, 17.0, 26.0, 21.0, 27.0, 45.0, 43.0, 34.0, 40.0, 42.0, 42.0, 33.0, 51.0, 32.0, 41.0, 22.0, 44.0, 39.0, 39.0, 35.0, 35.0, 32.0, 28.0, 20.0, 23.0, 20.0, 12.0, 10.0, 14.0, 10.0, 6.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.047023296356201e-05, -4.836916923522949e-05, -4.626810550689697e-05, -4.416704177856445e-05, -4.2065978050231934e-05, -3.9964914321899414e-05, -3.7863850593566895e-05, -3.5762786865234375e-05, -3.3661723136901855e-05, -3.1560659408569336e-05, -2.9459595680236816e-05, -2.7358531951904297e-05, -2.5257468223571777e-05, -2.3156404495239258e-05, -2.1055340766906738e-05, -1.895427703857422e-05, -1.68532133102417e-05, -1.475214958190918e-05, -1.265108585357666e-05, -1.055002212524414e-05, -8.448958396911621e-06, -6.3478946685791016e-06, -4.246830940246582e-06, -2.1457672119140625e-06, -4.470348358154297e-08, 2.0563602447509766e-06, 4.157423973083496e-06, 6.258487701416016e-06, 8.359551429748535e-06, 1.0460615158081055e-05, 1.2561678886413574e-05, 1.4662742614746094e-05, 1.6763806343078613e-05, 1.8864870071411133e-05, 2.0965933799743652e-05, 2.3066997528076172e-05, 2.516806125640869e-05, 2.726912498474121e-05, 2.937018871307373e-05, 3.147125244140625e-05, 3.357231616973877e-05, 3.567337989807129e-05, 3.777444362640381e-05, 3.987550735473633e-05, 4.197657108306885e-05, 4.407763481140137e-05, 4.617869853973389e-05, 4.8279762268066406e-05, 5.0380825996398926e-05, 5.2481889724731445e-05, 5.4582953453063965e-05, 5.6684017181396484e-05, 5.8785080909729004e-05, 6.0886144638061523e-05, 6.298720836639404e-05, 6.508827209472656e-05, 6.718933582305908e-05, 6.92903995513916e-05, 7.139146327972412e-05, 7.349252700805664e-05, 7.559359073638916e-05, 7.769465446472168e-05, 7.97957181930542e-05, 8.189678192138672e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 12.0, 8.0, 19.0, 18.0, 23.0, 27.0, 22.0, 30.0, 34.0, 29.0, 38.0, 44.0, 49.0, 49.0, 33.0, 42.0, 53.0, 44.0, 50.0, 37.0, 44.0, 26.0, 37.0, 27.0, 24.0, 34.0, 20.0, 25.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.47906494140625, -3.3663330078125, -3.25360107421875, -3.140869140625, -3.02813720703125, -2.9154052734375, -2.80267333984375, -2.68994140625, -2.57720947265625, -2.4644775390625, -2.35174560546875, -2.239013671875, -2.12628173828125, -2.0135498046875, -1.90081787109375, -1.7880859375, -1.67535400390625, -1.5626220703125, -1.44989013671875, -1.337158203125, -1.22442626953125, -1.1116943359375, -0.99896240234375, -0.88623046875, -0.77349853515625, -0.6607666015625, -0.54803466796875, -0.435302734375, -0.32257080078125, -0.2098388671875, -0.09710693359375, 0.015625, 0.12835693359375, 0.2410888671875, 0.35382080078125, 0.466552734375, 0.57928466796875, 0.6920166015625, 0.80474853515625, 0.91748046875, 1.03021240234375, 1.1429443359375, 1.25567626953125, 1.368408203125, 1.48114013671875, 1.5938720703125, 1.70660400390625, 1.8193359375, 1.93206787109375, 2.0447998046875, 2.15753173828125, 2.270263671875, 2.38299560546875, 2.4957275390625, 2.60845947265625, 2.72119140625, 2.83392333984375, 2.9466552734375, 3.05938720703125, 3.172119140625, 3.28485107421875, 3.3975830078125, 3.51031494140625, 3.623046875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 13.0, 16.0, 32.0, 41.0, 56.0, 89.0, 136.0, 217.0, 379.0, 672.0, 1432.0, 3494.0, 9328.0, 25098.0, 66703.0, 179319.0, 394431.0, 230284.0, 84595.0, 32163.0, 11969.0, 4402.0, 1778.0, 822.0, 409.0, 239.0, 149.0, 93.0, 59.0, 44.0, 33.0, 14.0, 13.0, 7.0, 7.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5, -3.373291015625, -3.24658203125, -3.119873046875, -2.9931640625, -2.866455078125, -2.73974609375, -2.613037109375, -2.486328125, -2.359619140625, -2.23291015625, -2.106201171875, -1.9794921875, -1.852783203125, -1.72607421875, -1.599365234375, -1.47265625, -1.345947265625, -1.21923828125, -1.092529296875, -0.9658203125, -0.839111328125, -0.71240234375, -0.585693359375, -0.458984375, -0.332275390625, -0.20556640625, -0.078857421875, 0.0478515625, 0.174560546875, 0.30126953125, 0.427978515625, 0.5546875, 0.681396484375, 0.80810546875, 0.934814453125, 1.0615234375, 1.188232421875, 1.31494140625, 1.441650390625, 1.568359375, 1.695068359375, 1.82177734375, 1.948486328125, 2.0751953125, 2.201904296875, 2.32861328125, 2.455322265625, 2.58203125, 2.708740234375, 2.83544921875, 2.962158203125, 3.0888671875, 3.215576171875, 3.34228515625, 3.468994140625, 3.595703125, 3.722412109375, 3.84912109375, 3.975830078125, 4.1025390625, 4.229248046875, 4.35595703125, 4.482666015625, 4.609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 13.0, 12.0, 21.0, 20.0, 28.0, 39.0, 32.0, 45.0, 47.0, 57.0, 103.0, 273.0, 1613.0, 222.0, 88.0, 70.0, 49.0, 44.0, 47.0, 39.0, 38.0, 26.0, 20.0, 15.0, 11.0, 10.0, 10.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.5408935546875, -13.081787109375, -12.6226806640625, -12.16357421875, -11.7044677734375, -11.245361328125, -10.7862548828125, -10.3271484375, -9.8680419921875, -9.408935546875, -8.9498291015625, -8.49072265625, -8.0316162109375, -7.572509765625, -7.1134033203125, -6.654296875, -6.1951904296875, -5.736083984375, -5.2769775390625, -4.81787109375, -4.3587646484375, -3.899658203125, -3.4405517578125, -2.9814453125, -2.5223388671875, -2.063232421875, -1.6041259765625, -1.14501953125, -0.6859130859375, -0.226806640625, 0.2322998046875, 0.69140625, 1.1505126953125, 1.609619140625, 2.0687255859375, 2.52783203125, 2.9869384765625, 3.446044921875, 3.9051513671875, 4.3642578125, 4.8233642578125, 5.282470703125, 5.7415771484375, 6.20068359375, 6.6597900390625, 7.118896484375, 7.5780029296875, 8.037109375, 8.4962158203125, 8.955322265625, 9.4144287109375, 9.87353515625, 10.3326416015625, 10.791748046875, 11.2508544921875, 11.7099609375, 12.1690673828125, 12.628173828125, 13.0872802734375, 13.54638671875, 14.0054931640625, 14.464599609375, 14.9237060546875, 15.3828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 8.0, 10.0, 14.0, 23.0, 22.0, 39.0, 41.0, 70.0, 94.0, 138.0, 210.0, 462.0, 1612.0, 2845950.0, 294976.0, 1109.0, 362.0, 173.0, 111.0, 71.0, 59.0, 42.0, 31.0, 17.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.6875, -51.0859375, -49.484375, -47.8828125, -46.28125, -44.6796875, -43.078125, -41.4765625, -39.875, -38.2734375, -36.671875, -35.0703125, -33.46875, -31.8671875, -30.265625, -28.6640625, -27.0625, -25.4609375, -23.859375, -22.2578125, -20.65625, -19.0546875, -17.453125, -15.8515625, -14.25, -12.6484375, -11.046875, -9.4453125, -7.84375, -6.2421875, -4.640625, -3.0390625, -1.4375, 0.1640625, 1.765625, 3.3671875, 4.96875, 6.5703125, 8.171875, 9.7734375, 11.375, 12.9765625, 14.578125, 16.1796875, 17.78125, 19.3828125, 20.984375, 22.5859375, 24.1875, 25.7890625, 27.390625, 28.9921875, 30.59375, 32.1953125, 33.796875, 35.3984375, 37.0, 38.6015625, 40.203125, 41.8046875, 43.40625, 45.0078125, 46.609375, 48.2109375, 49.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [242.0, 773.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.701264381408691, -1.5497503280639648, 5.601763725280762, 12.753277778625488, 19.90479278564453, 27.056304931640625, 34.207820892333984, 41.359336853027344, 48.51084899902344, 55.66236114501953, 62.81387710571289, 69.96539306640625, 77.11690521240234, 84.26841735839844, 91.41993713378906, 98.57144927978516, 105.72296142578125, 112.87447357177734, 120.02598571777344, 127.17750549316406, 134.32901000976562, 141.48052978515625, 148.63204956054688, 155.7835693359375, 162.93507385253906, 170.0865936279297, 177.23809814453125, 184.38961791992188, 191.5411376953125, 198.69264221191406, 205.8441619873047, 212.99566650390625, 220.14718627929688, 227.2987060546875, 234.45021057128906, 241.6017303466797, 248.75323486328125, 255.90475463867188, 263.0562744140625, 270.2077941894531, 277.35931396484375, 284.5108337402344, 291.662353515625, 298.8138427734375, 305.9653625488281, 313.11688232421875, 320.2684020996094, 327.419921875, 334.5714111328125, 341.7229309082031, 348.87445068359375, 356.02593994140625, 363.1774597167969, 370.3289794921875, 377.4804992675781, 384.63201904296875, 391.78350830078125, 398.9350280761719, 406.0865478515625, 413.238037109375, 420.3895568847656, 427.54107666015625, 434.6925964355469, 441.8441162109375, 448.9956359863281]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 11.0, 5.0, 14.0, 14.0, 15.0, 21.0, 27.0, 21.0, 28.0, 22.0, 32.0, 37.0, 26.0, 41.0, 50.0, 41.0, 53.0, 33.0, 43.0, 37.0, 34.0, 26.0, 34.0, 43.0, 40.0, 41.0, 30.0, 28.0, 19.0, 19.0, 14.0, 11.0, 16.0, 17.0, 12.0, 10.0, 12.0, 5.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.32056427001953, -38.190773010253906, -37.06098175048828, -35.93118667602539, -34.801395416259766, -33.67160415649414, -32.541812896728516, -31.41202163696289, -30.282228469848633, -29.152437210083008, -28.02264404296875, -26.892852783203125, -25.7630615234375, -24.633268356323242, -23.503477096557617, -22.37368392944336, -21.243892669677734, -20.11410140991211, -18.98430824279785, -17.854516983032227, -16.72472381591797, -15.594932556152344, -14.465141296386719, -13.335349082946777, -12.205556869506836, -11.075764656066895, -9.945972442626953, -8.816181182861328, -7.686388969421387, -6.556596755981445, -5.426805019378662, -4.297013282775879, -3.167217254638672, -2.0374252796173096, -0.9076333045959473, 0.22215867042541504, 1.3519506454467773, 2.4817428588867188, 3.611534595489502, 4.741326332092285, 5.871118545532227, 7.000910758972168, 8.13070297241211, 9.260494232177734, 10.390286445617676, 11.520078659057617, 12.649869918823242, 13.779662132263184, 14.909454345703125, 16.03924560546875, 17.169038772583008, 18.298830032348633, 19.42862319946289, 20.558414459228516, 21.68820571899414, 22.817996978759766, 23.947790145874023, 25.07758140563965, 26.207374572753906, 27.33716583251953, 28.466957092285156, 29.596750259399414, 30.72654151916504, 31.856334686279297, 32.98612594604492]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 7.0, 4.0, 9.0, 15.0, 13.0, 21.0, 16.0, 21.0, 21.0, 21.0, 32.0, 41.0, 44.0, 43.0, 43.0, 35.0, 35.0, 43.0, 48.0, 39.0, 47.0, 30.0, 49.0, 39.0, 36.0, 35.0, 31.0, 33.0, 28.0, 16.0, 14.0, 12.0, 17.0, 14.0, 7.0, 6.0, 11.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.998046875, -3.87109375, -3.744140625, -3.6171875, -3.490234375, -3.36328125, -3.236328125, -3.109375, -2.982421875, -2.85546875, -2.728515625, -2.6015625, -2.474609375, -2.34765625, -2.220703125, -2.09375, -1.966796875, -1.83984375, -1.712890625, -1.5859375, -1.458984375, -1.33203125, -1.205078125, -1.078125, -0.951171875, -0.82421875, -0.697265625, -0.5703125, -0.443359375, -0.31640625, -0.189453125, -0.0625, 0.064453125, 0.19140625, 0.318359375, 0.4453125, 0.572265625, 0.69921875, 0.826171875, 0.953125, 1.080078125, 1.20703125, 1.333984375, 1.4609375, 1.587890625, 1.71484375, 1.841796875, 1.96875, 2.095703125, 2.22265625, 2.349609375, 2.4765625, 2.603515625, 2.73046875, 2.857421875, 2.984375, 3.111328125, 3.23828125, 3.365234375, 3.4921875, 3.619140625, 3.74609375, 3.873046875, 4.0]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 10.0, 15.0, 18.0, 15.0, 22.0, 25.0, 18.0, 33.0, 48.0, 48.0, 76.0, 131.0, 381.0, 1410.0, 11417.0, 523601.0, 3307037.0, 340126.0, 7977.0, 1084.0, 301.0, 131.0, 58.0, 51.0, 31.0, 26.0, 20.0, 26.0, 23.0, 13.0, 13.0, 17.0, 8.0, 3.0, 10.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.125, -12.720458984375, -12.31591796875, -11.911376953125, -11.5068359375, -11.102294921875, -10.69775390625, -10.293212890625, -9.888671875, -9.484130859375, -9.07958984375, -8.675048828125, -8.2705078125, -7.865966796875, -7.46142578125, -7.056884765625, -6.65234375, -6.247802734375, -5.84326171875, -5.438720703125, -5.0341796875, -4.629638671875, -4.22509765625, -3.820556640625, -3.416015625, -3.011474609375, -2.60693359375, -2.202392578125, -1.7978515625, -1.393310546875, -0.98876953125, -0.584228515625, -0.1796875, 0.224853515625, 0.62939453125, 1.033935546875, 1.4384765625, 1.843017578125, 2.24755859375, 2.652099609375, 3.056640625, 3.461181640625, 3.86572265625, 4.270263671875, 4.6748046875, 5.079345703125, 5.48388671875, 5.888427734375, 6.29296875, 6.697509765625, 7.10205078125, 7.506591796875, 7.9111328125, 8.315673828125, 8.72021484375, 9.124755859375, 9.529296875, 9.933837890625, 10.33837890625, 10.742919921875, 11.1474609375, 11.552001953125, 11.95654296875, 12.361083984375, 12.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 7.0, 6.0, 12.0, 22.0, 42.0, 62.0, 83.0, 130.0, 198.0, 286.0, 365.0, 538.0, 559.0, 515.0, 372.0, 266.0, 202.0, 123.0, 78.0, 70.0, 36.0, 35.0, 16.0, 11.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4124755859375, -8.106201171875, -7.7999267578125, -7.49365234375, -7.1873779296875, -6.881103515625, -6.5748291015625, -6.2685546875, -5.9622802734375, -5.656005859375, -5.3497314453125, -5.04345703125, -4.7371826171875, -4.430908203125, -4.1246337890625, -3.818359375, -3.5120849609375, -3.205810546875, -2.8995361328125, -2.59326171875, -2.2869873046875, -1.980712890625, -1.6744384765625, -1.3681640625, -1.0618896484375, -0.755615234375, -0.4493408203125, -0.14306640625, 0.1632080078125, 0.469482421875, 0.7757568359375, 1.08203125, 1.3883056640625, 1.694580078125, 2.0008544921875, 2.30712890625, 2.6134033203125, 2.919677734375, 3.2259521484375, 3.5322265625, 3.8385009765625, 4.144775390625, 4.4510498046875, 4.75732421875, 5.0635986328125, 5.369873046875, 5.6761474609375, 5.982421875, 6.2886962890625, 6.594970703125, 6.9012451171875, 7.20751953125, 7.5137939453125, 7.820068359375, 8.1263427734375, 8.4326171875, 8.7388916015625, 9.045166015625, 9.3514404296875, 9.65771484375, 9.9639892578125, 10.270263671875, 10.5765380859375, 10.8828125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 6.0, 14.0, 21.0, 16.0, 37.0, 58.0, 90.0, 114.0, 162.0, 273.0, 385.0, 777.0, 9814.0, 3827696.0, 351404.0, 1916.0, 515.0, 302.0, 200.0, 169.0, 104.0, 67.0, 46.0, 27.0, 17.0, 15.0, 9.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.5146484375, -36.435546875, -35.3564453125, -34.27734375, -33.1982421875, -32.119140625, -31.0400390625, -29.9609375, -28.8818359375, -27.802734375, -26.7236328125, -25.64453125, -24.5654296875, -23.486328125, -22.4072265625, -21.328125, -20.2490234375, -19.169921875, -18.0908203125, -17.01171875, -15.9326171875, -14.853515625, -13.7744140625, -12.6953125, -11.6162109375, -10.537109375, -9.4580078125, -8.37890625, -7.2998046875, -6.220703125, -5.1416015625, -4.0625, -2.9833984375, -1.904296875, -0.8251953125, 0.25390625, 1.3330078125, 2.412109375, 3.4912109375, 4.5703125, 5.6494140625, 6.728515625, 7.8076171875, 8.88671875, 9.9658203125, 11.044921875, 12.1240234375, 13.203125, 14.2822265625, 15.361328125, 16.4404296875, 17.51953125, 18.5986328125, 19.677734375, 20.7568359375, 21.8359375, 22.9150390625, 23.994140625, 25.0732421875, 26.15234375, 27.2314453125, 28.310546875, 29.3896484375, 30.46875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 232.0, 594.0, 172.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.4194793701172, -152.83926391601562, -147.25904846191406, -141.6788330078125, -136.09861755371094, -130.51840209960938, -124.93819427490234, -119.35797882080078, -113.77776336669922, -108.19754791259766, -102.6173324584961, -97.03712463378906, -91.4569091796875, -85.87669372558594, -80.29647827148438, -74.71626281738281, -69.13604736328125, -63.55583190917969, -57.975616455078125, -52.39540481567383, -46.815189361572266, -41.2349739074707, -35.654762268066406, -30.074546813964844, -24.49433135986328, -18.91411590576172, -13.333902359008789, -7.753688812255859, -2.173473358154297, 3.4067420959472656, 8.986953735351562, 14.567169189453125, 20.147369384765625, 25.727584838867188, 31.307798385620117, 36.88801193237305, 42.46822738647461, 48.04844284057617, 53.62865447998047, 59.20886993408203, 64.7890853881836, 70.36930084228516, 75.94951629638672, 81.52972412109375, 87.10993957519531, 92.69015502929688, 98.27037048339844, 103.8505859375, 109.43080139160156, 115.01101684570312, 120.59123229980469, 126.17144775390625, 131.7516632080078, 137.33187866210938, 142.91207885742188, 148.4923095703125, 154.072509765625, 159.65272521972656, 165.23294067382812, 170.8131561279297, 176.39337158203125, 181.9735870361328, 187.55380249023438, 193.13400268554688, 198.7142333984375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 7.0, 12.0, 8.0, 9.0, 16.0, 13.0, 17.0, 18.0, 26.0, 24.0, 26.0, 30.0, 27.0, 41.0, 40.0, 36.0, 39.0, 37.0, 45.0, 50.0, 47.0, 38.0, 37.0, 42.0, 40.0, 34.0, 27.0, 28.0, 25.0, 23.0, 23.0, 23.0, 10.0, 11.0, 15.0, 10.0, 14.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.617599487304688, -24.805749893188477, -23.993900299072266, -23.182048797607422, -22.37019920349121, -21.558349609375, -20.74650001525879, -19.934650421142578, -19.122798919677734, -18.310949325561523, -17.499099731445312, -16.68724822998047, -15.875398635864258, -15.063549041748047, -14.251699447631836, -13.439849853515625, -12.628000259399414, -11.816150665283203, -11.004300117492676, -10.192450523376465, -9.380599975585938, -8.568750381469727, -7.756900787353516, -6.9450507164001465, -6.133200645446777, -5.321350574493408, -4.509500503540039, -3.697650909423828, -2.885800838470459, -2.07395076751709, -1.262101173400879, -0.45025110244750977, 0.3616008758544922, 1.1734508275985718, 1.9853007793426514, 2.7971506118774414, 3.6090006828308105, 4.42085075378418, 5.232700347900391, 6.04455041885376, 6.856400489807129, 7.668250560760498, 8.480100631713867, 9.291950225830078, 10.103799819946289, 10.915650367736816, 11.727499961853027, 12.539350509643555, 13.351200103759766, 14.163049697875977, 14.974900245666504, 15.786749839782715, 16.598600387573242, 17.410449981689453, 18.222299575805664, 19.034149169921875, 19.84600067138672, 20.65785026550293, 21.46969985961914, 22.281551361083984, 23.093400955200195, 23.905250549316406, 24.717100143432617, 25.528949737548828, 26.34079933166504]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 18.0, 10.0, 15.0, 23.0, 23.0, 23.0, 24.0, 30.0, 29.0, 33.0, 38.0, 46.0, 40.0, 30.0, 54.0, 46.0, 43.0, 38.0, 45.0, 43.0, 33.0, 37.0, 39.0, 38.0, 26.0, 19.0, 9.0, 16.0, 21.0, 15.0, 11.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.78204345703125, -3.6656494140625, -3.54925537109375, -3.432861328125, -3.31646728515625, -3.2000732421875, -3.08367919921875, -2.96728515625, -2.85089111328125, -2.7344970703125, -2.61810302734375, -2.501708984375, -2.38531494140625, -2.2689208984375, -2.15252685546875, -2.0361328125, -1.91973876953125, -1.8033447265625, -1.68695068359375, -1.570556640625, -1.45416259765625, -1.3377685546875, -1.22137451171875, -1.10498046875, -0.98858642578125, -0.8721923828125, -0.75579833984375, -0.639404296875, -0.52301025390625, -0.4066162109375, -0.29022216796875, -0.173828125, -0.05743408203125, 0.0589599609375, 0.17535400390625, 0.291748046875, 0.40814208984375, 0.5245361328125, 0.64093017578125, 0.75732421875, 0.87371826171875, 0.9901123046875, 1.10650634765625, 1.222900390625, 1.33929443359375, 1.4556884765625, 1.57208251953125, 1.6884765625, 1.80487060546875, 1.9212646484375, 2.03765869140625, 2.154052734375, 2.27044677734375, 2.3868408203125, 2.50323486328125, 2.61962890625, 2.73602294921875, 2.8524169921875, 2.96881103515625, 3.085205078125, 3.20159912109375, 3.3179931640625, 3.43438720703125, 3.55078125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 11.0, 22.0, 31.0, 36.0, 54.0, 74.0, 113.0, 163.0, 230.0, 352.0, 511.0, 711.0, 992.0, 1471.0, 2058.0, 3092.0, 4357.0, 6194.0, 9273.0, 13450.0, 20537.0, 31857.0, 51407.0, 89186.0, 176059.0, 283937.0, 144756.0, 76359.0, 45400.0, 28111.0, 18476.0, 12333.0, 8357.0, 5685.0, 3894.0, 2703.0, 1873.0, 1284.0, 922.0, 686.0, 468.0, 345.0, 220.0, 149.0, 114.0, 78.0, 46.0, 42.0, 31.0, 7.0, 14.0, 8.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.6064453125, -0.5882720947265625, -0.570098876953125, -0.5519256591796875, -0.53375244140625, -0.5155792236328125, -0.497406005859375, -0.4792327880859375, -0.4610595703125, -0.4428863525390625, -0.424713134765625, -0.4065399169921875, -0.38836669921875, -0.3701934814453125, -0.352020263671875, -0.3338470458984375, -0.315673828125, -0.2975006103515625, -0.279327392578125, -0.2611541748046875, -0.24298095703125, -0.2248077392578125, -0.206634521484375, -0.1884613037109375, -0.1702880859375, -0.1521148681640625, -0.133941650390625, -0.1157684326171875, -0.09759521484375, -0.0794219970703125, -0.061248779296875, -0.0430755615234375, -0.02490234375, -0.0067291259765625, 0.011444091796875, 0.0296173095703125, 0.04779052734375, 0.0659637451171875, 0.084136962890625, 0.1023101806640625, 0.1204833984375, 0.1386566162109375, 0.156829833984375, 0.1750030517578125, 0.19317626953125, 0.2113494873046875, 0.229522705078125, 0.2476959228515625, 0.265869140625, 0.2840423583984375, 0.302215576171875, 0.3203887939453125, 0.33856201171875, 0.3567352294921875, 0.374908447265625, 0.3930816650390625, 0.4112548828125, 0.4294281005859375, 0.447601318359375, 0.4657745361328125, 0.48394775390625, 0.5021209716796875, 0.520294189453125, 0.5384674072265625, 0.556640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 13.0, 6.0, 15.0, 12.0, 24.0, 16.0, 19.0, 17.0, 28.0, 22.0, 39.0, 25.0, 28.0, 34.0, 43.0, 41.0, 38.0, 1061.0, 36.0, 40.0, 46.0, 31.0, 44.0, 35.0, 26.0, 42.0, 38.0, 22.0, 21.0, 18.0, 21.0, 15.0, 21.0, 9.0, 10.0, 13.0, 11.0, 2.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.088470458984375, -2.01873779296875, -1.949005126953125, -1.8792724609375, -1.809539794921875, -1.73980712890625, -1.670074462890625, -1.600341796875, -1.530609130859375, -1.46087646484375, -1.391143798828125, -1.3214111328125, -1.251678466796875, -1.18194580078125, -1.112213134765625, -1.04248046875, -0.972747802734375, -0.90301513671875, -0.833282470703125, -0.7635498046875, -0.693817138671875, -0.62408447265625, -0.554351806640625, -0.484619140625, -0.414886474609375, -0.34515380859375, -0.275421142578125, -0.2056884765625, -0.135955810546875, -0.06622314453125, 0.003509521484375, 0.0732421875, 0.142974853515625, 0.21270751953125, 0.282440185546875, 0.3521728515625, 0.421905517578125, 0.49163818359375, 0.561370849609375, 0.631103515625, 0.700836181640625, 0.77056884765625, 0.840301513671875, 0.9100341796875, 0.979766845703125, 1.04949951171875, 1.119232177734375, 1.18896484375, 1.258697509765625, 1.32843017578125, 1.398162841796875, 1.4678955078125, 1.537628173828125, 1.60736083984375, 1.677093505859375, 1.746826171875, 1.816558837890625, 1.88629150390625, 1.956024169921875, 2.0257568359375, 2.095489501953125, 2.16522216796875, 2.234954833984375, 2.3046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 14.0, 11.0, 10.0, 22.0, 28.0, 49.0, 57.0, 99.0, 122.0, 168.0, 248.0, 354.0, 539.0, 728.0, 1063.0, 1507.0, 2031.0, 2870.0, 4194.0, 5664.0, 8085.0, 11297.0, 16352.0, 23637.0, 34971.0, 53150.0, 87596.0, 163476.0, 1304221.0, 142133.0, 77933.0, 48841.0, 32228.0, 21839.0, 14966.0, 10609.0, 7468.0, 5277.0, 3740.0, 2751.0, 1903.0, 1414.0, 997.0, 704.0, 522.0, 362.0, 264.0, 184.0, 139.0, 89.0, 72.0, 41.0, 32.0, 33.0, 13.0, 10.0, 6.0, 2.0, 5.0, 3.0], "bins": [-0.494384765625, -0.4791259765625, -0.4638671875, -0.4486083984375, -0.433349609375, -0.4180908203125, -0.40283203125, -0.3875732421875, -0.372314453125, -0.3570556640625, -0.341796875, -0.3265380859375, -0.311279296875, -0.2960205078125, -0.28076171875, -0.2655029296875, -0.250244140625, -0.2349853515625, -0.2197265625, -0.2044677734375, -0.189208984375, -0.1739501953125, -0.15869140625, -0.1434326171875, -0.128173828125, -0.1129150390625, -0.09765625, -0.0823974609375, -0.067138671875, -0.0518798828125, -0.03662109375, -0.0213623046875, -0.006103515625, 0.0091552734375, 0.0244140625, 0.0396728515625, 0.054931640625, 0.0701904296875, 0.08544921875, 0.1007080078125, 0.115966796875, 0.1312255859375, 0.146484375, 0.1617431640625, 0.177001953125, 0.1922607421875, 0.20751953125, 0.2227783203125, 0.238037109375, 0.2532958984375, 0.2685546875, 0.2838134765625, 0.299072265625, 0.3143310546875, 0.32958984375, 0.3448486328125, 0.360107421875, 0.3753662109375, 0.390625, 0.4058837890625, 0.421142578125, 0.4364013671875, 0.45166015625, 0.4669189453125, 0.482177734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 5.0, 5.0, 7.0, 8.0, 16.0, 17.0, 23.0, 46.0, 32.0, 43.0, 49.0, 51.0, 63.0, 60.0, 80.0, 62.0, 59.0, 63.0, 53.0, 50.0, 38.0, 28.0, 29.0, 23.0, 20.0, 12.0, 8.0, 10.0, 5.0, 4.0, 1.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012958049774169922, -0.00012500397861003876, -0.0001204274594783783, -0.00011585094034671783, -0.00011127442121505737, -0.00010669790208339691, -0.00010212138295173645, -9.754486382007599e-05, -9.296834468841553e-05, -8.839182555675507e-05, -8.38153064250946e-05, -7.923878729343414e-05, -7.466226816177368e-05, -7.008574903011322e-05, -6.550922989845276e-05, -6.09327107667923e-05, -5.6356191635131836e-05, -5.1779672503471375e-05, -4.720315337181091e-05, -4.262663424015045e-05, -3.805011510848999e-05, -3.347359597682953e-05, -2.8897076845169067e-05, -2.4320557713508606e-05, -1.9744038581848145e-05, -1.5167519450187683e-05, -1.0591000318527222e-05, -6.01448118686676e-06, -1.4379620552062988e-06, 3.1385570764541626e-06, 7.715076208114624e-06, 1.2291595339775085e-05, 1.6868114471435547e-05, 2.1444633603096008e-05, 2.602115273475647e-05, 3.059767186641693e-05, 3.517419099807739e-05, 3.9750710129737854e-05, 4.4327229261398315e-05, 4.890374839305878e-05, 5.348026752471924e-05, 5.80567866563797e-05, 6.263330578804016e-05, 6.720982491970062e-05, 7.178634405136108e-05, 7.636286318302155e-05, 8.093938231468201e-05, 8.551590144634247e-05, 9.009242057800293e-05, 9.466893970966339e-05, 9.924545884132385e-05, 0.00010382197797298431, 0.00010839849710464478, 0.00011297501623630524, 0.0001175515353679657, 0.00012212805449962616, 0.00012670457363128662, 0.00013128109276294708, 0.00013585761189460754, 0.000140434131026268, 0.00014501065015792847, 0.00014958716928958893, 0.0001541636884212494, 0.00015874020755290985, 0.0001633167266845703]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 8.0, 16.0, 16.0, 27.0, 26.0, 32.0, 41.0, 70.0, 99.0, 131.0, 217.0, 368.0, 1119.0, 209194.0, 834384.0, 1637.0, 467.0, 229.0, 120.0, 86.0, 56.0, 58.0, 32.0, 24.0, 18.0, 16.0, 12.0, 4.0, 8.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0035247802734375, -0.00342714786529541, -0.0033295154571533203, -0.0032318830490112305, -0.0031342506408691406, -0.0030366182327270508, -0.002938985824584961, -0.002841353416442871, -0.0027437210083007812, -0.0026460886001586914, -0.0025484561920166016, -0.0024508237838745117, -0.002353191375732422, -0.002255558967590332, -0.002157926559448242, -0.0020602941513061523, -0.0019626617431640625, -0.0018650293350219727, -0.0017673969268798828, -0.001669764518737793, -0.0015721321105957031, -0.0014744997024536133, -0.0013768672943115234, -0.0012792348861694336, -0.0011816024780273438, -0.001083970069885254, -0.000986337661743164, -0.0008887052536010742, -0.0007910728454589844, -0.0006934404373168945, -0.0005958080291748047, -0.0004981756210327148, -0.000400543212890625, -0.00030291080474853516, -0.0002052783966064453, -0.00010764598846435547, -1.0013580322265625e-05, 8.761882781982422e-05, 0.00018525123596191406, 0.0002828836441040039, 0.00038051605224609375, 0.0004781484603881836, 0.0005757808685302734, 0.0006734132766723633, 0.0007710456848144531, 0.000868678092956543, 0.0009663105010986328, 0.0010639429092407227, 0.0011615753173828125, 0.0012592077255249023, 0.0013568401336669922, 0.001454472541809082, 0.0015521049499511719, 0.0016497373580932617, 0.0017473697662353516, 0.0018450021743774414, 0.0019426345825195312, 0.002040266990661621, 0.002137899398803711, 0.0022355318069458008, 0.0023331642150878906, 0.0024307966232299805, 0.0025284290313720703, 0.00262606143951416, 0.00272369384765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 38.0, 159.0, 275.0, 277.0, 157.0, 70.0, 16.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016755824617575854, -0.00016060580674093217, -0.0001536533673061058, -0.00014670092787127942, -0.00013974847388453782, -0.00013279603444971144, -0.00012584359501488507, -0.0001188911555800587, -0.00011193871614523232, -0.00010498627671040595, -9.803383727557957e-05, -9.108139056479558e-05, -8.412895112996921e-05, -7.717651169514284e-05, -7.022406498435885e-05, -6.327162554953247e-05, -5.63191861147061e-05, -4.9366746679879725e-05, -4.2414303607074544e-05, -3.546186053426936e-05, -2.850942109944299e-05, -2.1556981664616615e-05, -1.4604538591811433e-05, -7.652095519006252e-06, -6.996560841798782e-07, 6.252785169635899e-06, 1.3205226423451677e-05, 2.0157667677267455e-05, 2.7110108931083232e-05, 3.4062548365909606e-05, 4.101499143871479e-05, 4.796743451151997e-05, 5.491988849826157e-05, 6.187232793308794e-05, 6.882476736791432e-05, 7.577721407869831e-05, 8.272965351352468e-05, 8.968209294835106e-05, 9.663453965913504e-05, 0.00010358697909396142, 0.00011053941852878779, 0.00011749185796361417, 0.00012444429739844054, 0.00013139673683326691, 0.00013834919082000852, 0.0001453016302548349, 0.00015225406968966126, 0.00015920650912448764, 0.000166158948559314, 0.0001731113879941404, 0.00018006382742896676, 0.00018701626686379313, 0.0001939687062986195, 0.00020092114573344588, 0.00020787359972018749, 0.00021482603915501386, 0.00022177847858984023, 0.0002287309180246666, 0.00023568335745949298, 0.00024263579689431936, 0.00024958825088106096, 0.00025654069031588733, 0.0002634931297507137, 0.0002704455691855401, 0.00027739800862036645]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 4.0, 6.0, 3.0, 10.0, 7.0, 18.0, 14.0, 12.0, 19.0, 38.0, 17.0, 25.0, 24.0, 33.0, 39.0, 48.0, 32.0, 38.0, 31.0, 37.0, 50.0, 47.0, 40.0, 36.0, 32.0, 29.0, 31.0, 33.0, 25.0, 28.0, 26.0, 19.0, 17.0, 22.0, 12.0, 9.0, 18.0, 13.0, 7.0, 8.0, 3.0, 8.0, 5.0, 11.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.538629531860352e-05, -6.334111094474792e-05, -6.129592657089233e-05, -5.925074219703674e-05, -5.720555782318115e-05, -5.516037344932556e-05, -5.311518907546997e-05, -5.107000470161438e-05, -4.902482032775879e-05, -4.69796359539032e-05, -4.493445158004761e-05, -4.2889267206192017e-05, -4.0844082832336426e-05, -3.8798898458480835e-05, -3.6753714084625244e-05, -3.470852971076965e-05, -3.266334533691406e-05, -3.061816096305847e-05, -2.857297658920288e-05, -2.652779221534729e-05, -2.44826078414917e-05, -2.243742346763611e-05, -2.0392239093780518e-05, -1.8347054719924927e-05, -1.6301870346069336e-05, -1.4256685972213745e-05, -1.2211501598358154e-05, -1.0166317224502563e-05, -8.121132850646973e-06, -6.075948476791382e-06, -4.030764102935791e-06, -1.9855797290802e-06, 5.960464477539063e-08, 2.1047890186309814e-06, 4.149973392486572e-06, 6.195157766342163e-06, 8.240342140197754e-06, 1.0285526514053345e-05, 1.2330710887908936e-05, 1.4375895261764526e-05, 1.6421079635620117e-05, 1.8466264009475708e-05, 2.05114483833313e-05, 2.255663275718689e-05, 2.460181713104248e-05, 2.664700150489807e-05, 2.8692185878753662e-05, 3.073737025260925e-05, 3.2782554626464844e-05, 3.4827739000320435e-05, 3.6872923374176025e-05, 3.8918107748031616e-05, 4.096329212188721e-05, 4.30084764957428e-05, 4.505366086959839e-05, 4.709884524345398e-05, 4.914402961730957e-05, 5.118921399116516e-05, 5.323439836502075e-05, 5.527958273887634e-05, 5.7324767112731934e-05, 5.9369951486587524e-05, 6.141513586044312e-05, 6.34603202342987e-05, 6.55055046081543e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 18.0, 10.0, 15.0, 23.0, 23.0, 23.0, 24.0, 30.0, 29.0, 33.0, 38.0, 46.0, 40.0, 30.0, 54.0, 46.0, 43.0, 38.0, 45.0, 43.0, 33.0, 37.0, 39.0, 38.0, 26.0, 19.0, 9.0, 16.0, 21.0, 15.0, 11.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.78204345703125, -3.6656494140625, -3.54925537109375, -3.432861328125, -3.31646728515625, -3.2000732421875, -3.08367919921875, -2.96728515625, -2.85089111328125, -2.7344970703125, -2.61810302734375, -2.501708984375, -2.38531494140625, -2.2689208984375, -2.15252685546875, -2.0361328125, -1.91973876953125, -1.8033447265625, -1.68695068359375, -1.570556640625, -1.45416259765625, -1.3377685546875, -1.22137451171875, -1.10498046875, -0.98858642578125, -0.8721923828125, -0.75579833984375, -0.639404296875, -0.52301025390625, -0.4066162109375, -0.29022216796875, -0.173828125, -0.05743408203125, 0.0589599609375, 0.17535400390625, 0.291748046875, 0.40814208984375, 0.5245361328125, 0.64093017578125, 0.75732421875, 0.87371826171875, 0.9901123046875, 1.10650634765625, 1.222900390625, 1.33929443359375, 1.4556884765625, 1.57208251953125, 1.6884765625, 1.80487060546875, 1.9212646484375, 2.03765869140625, 2.154052734375, 2.27044677734375, 2.3868408203125, 2.50323486328125, 2.61962890625, 2.73602294921875, 2.8524169921875, 2.96881103515625, 3.085205078125, 3.20159912109375, 3.3179931640625, 3.43438720703125, 3.55078125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 17.0, 10.0, 20.0, 25.0, 37.0, 55.0, 57.0, 89.0, 121.0, 197.0, 308.0, 460.0, 873.0, 1687.0, 3702.0, 8564.0, 20025.0, 48135.0, 115888.0, 271075.0, 327819.0, 144160.0, 60278.0, 25085.0, 10444.0, 4628.0, 2077.0, 1074.0, 581.0, 334.0, 213.0, 130.0, 119.0, 70.0, 55.0, 43.0, 33.0, 25.0, 7.0, 13.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.68359375, -3.568939208984375, -3.45428466796875, -3.339630126953125, -3.2249755859375, -3.110321044921875, -2.99566650390625, -2.881011962890625, -2.766357421875, -2.651702880859375, -2.53704833984375, -2.422393798828125, -2.3077392578125, -2.193084716796875, -2.07843017578125, -1.963775634765625, -1.84912109375, -1.734466552734375, -1.61981201171875, -1.505157470703125, -1.3905029296875, -1.275848388671875, -1.16119384765625, -1.046539306640625, -0.931884765625, -0.817230224609375, -0.70257568359375, -0.587921142578125, -0.4732666015625, -0.358612060546875, -0.24395751953125, -0.129302978515625, -0.0146484375, 0.100006103515625, 0.21466064453125, 0.329315185546875, 0.4439697265625, 0.558624267578125, 0.67327880859375, 0.787933349609375, 0.902587890625, 1.017242431640625, 1.13189697265625, 1.246551513671875, 1.3612060546875, 1.475860595703125, 1.59051513671875, 1.705169677734375, 1.81982421875, 1.934478759765625, 2.04913330078125, 2.163787841796875, 2.2784423828125, 2.393096923828125, 2.50775146484375, 2.622406005859375, 2.737060546875, 2.851715087890625, 2.96636962890625, 3.081024169921875, 3.1956787109375, 3.310333251953125, 3.42498779296875, 3.539642333984375, 3.654296875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 6.0, 2.0, 7.0, 14.0, 12.0, 13.0, 13.0, 24.0, 27.0, 28.0, 36.0, 41.0, 39.0, 56.0, 58.0, 60.0, 121.0, 279.0, 1507.0, 210.0, 83.0, 64.0, 50.0, 45.0, 38.0, 30.0, 24.0, 28.0, 21.0, 23.0, 18.0, 17.0, 7.0, 6.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.3604736328125, -11.924072265625, -11.4876708984375, -11.05126953125, -10.6148681640625, -10.178466796875, -9.7420654296875, -9.3056640625, -8.8692626953125, -8.432861328125, -7.9964599609375, -7.56005859375, -7.1236572265625, -6.687255859375, -6.2508544921875, -5.814453125, -5.3780517578125, -4.941650390625, -4.5052490234375, -4.06884765625, -3.6324462890625, -3.196044921875, -2.7596435546875, -2.3232421875, -1.8868408203125, -1.450439453125, -1.0140380859375, -0.57763671875, -0.1412353515625, 0.295166015625, 0.7315673828125, 1.16796875, 1.6043701171875, 2.040771484375, 2.4771728515625, 2.91357421875, 3.3499755859375, 3.786376953125, 4.2227783203125, 4.6591796875, 5.0955810546875, 5.531982421875, 5.9683837890625, 6.40478515625, 6.8411865234375, 7.277587890625, 7.7139892578125, 8.150390625, 8.5867919921875, 9.023193359375, 9.4595947265625, 9.89599609375, 10.3323974609375, 10.768798828125, 11.2052001953125, 11.6416015625, 12.0780029296875, 12.514404296875, 12.9508056640625, 13.38720703125, 13.8236083984375, 14.260009765625, 14.6964111328125, 15.1328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 8.0, 11.0, 11.0, 10.0, 11.0, 11.0, 15.0, 20.0, 25.0, 58.0, 64.0, 107.0, 188.0, 311.0, 653.0, 6130.0, 3131795.0, 4728.0, 625.0, 341.0, 178.0, 109.0, 74.0, 57.0, 38.0, 39.0, 15.0, 21.0, 6.0, 12.0, 5.0, 7.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.1875, -64.1494140625, -62.111328125, -60.0732421875, -58.03515625, -55.9970703125, -53.958984375, -51.9208984375, -49.8828125, -47.8447265625, -45.806640625, -43.7685546875, -41.73046875, -39.6923828125, -37.654296875, -35.6162109375, -33.578125, -31.5400390625, -29.501953125, -27.4638671875, -25.42578125, -23.3876953125, -21.349609375, -19.3115234375, -17.2734375, -15.2353515625, -13.197265625, -11.1591796875, -9.12109375, -7.0830078125, -5.044921875, -3.0068359375, -0.96875, 1.0693359375, 3.107421875, 5.1455078125, 7.18359375, 9.2216796875, 11.259765625, 13.2978515625, 15.3359375, 17.3740234375, 19.412109375, 21.4501953125, 23.48828125, 25.5263671875, 27.564453125, 29.6025390625, 31.640625, 33.6787109375, 35.716796875, 37.7548828125, 39.79296875, 41.8310546875, 43.869140625, 45.9072265625, 47.9453125, 49.9833984375, 52.021484375, 54.0595703125, 56.09765625, 58.1357421875, 60.173828125, 62.2119140625, 64.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 16.0, 110.0, 511.0, 338.0, 38.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.560304641723633, -17.05166244506836, -14.543020248413086, -12.034379005432129, -9.525736808776855, -7.017094612121582, -4.508453369140625, -1.9998111724853516, 0.5088310241699219, 3.017472982406616, 5.5261149406433105, 8.034756660461426, 10.5433988571167, 13.052041053771973, 15.56068229675293, 18.069324493408203, 20.577966690063477, 23.08660888671875, 25.595251083374023, 28.103893280029297, 30.612533569335938, 33.121177673339844, 35.629817962646484, 38.138458251953125, 40.64710235595703, 43.15574264526367, 45.66438674926758, 48.17302703857422, 50.681671142578125, 53.190311431884766, 55.698951721191406, 58.20759582519531, 60.71623992919922, 63.22488021850586, 65.7335205078125, 68.2421646118164, 70.75080871582031, 73.25945281982422, 75.7680892944336, 78.2767333984375, 80.7853775024414, 83.29402160644531, 85.80265808105469, 88.3113021850586, 90.8199462890625, 93.3285903930664, 95.83722686767578, 98.34587097167969, 100.85450744628906, 103.36315155029297, 105.87178802490234, 108.38043212890625, 110.88907623291016, 113.39772033691406, 115.90635681152344, 118.41500091552734, 120.92364501953125, 123.43228912353516, 125.94092559814453, 128.44956970214844, 130.9582061767578, 133.46685791015625, 135.97549438476562, 138.484130859375, 140.99278259277344]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 12.0, 8.0, 8.0, 16.0, 15.0, 14.0, 10.0, 14.0, 23.0, 20.0, 18.0, 25.0, 18.0, 28.0, 37.0, 41.0, 38.0, 38.0, 35.0, 40.0, 29.0, 32.0, 33.0, 37.0, 28.0, 32.0, 29.0, 26.0, 40.0, 25.0, 28.0, 27.0, 30.0, 25.0, 23.0, 11.0, 13.0, 8.0, 13.0, 12.0, 7.0, 4.0, 4.0, 5.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0], "bins": [-32.69915771484375, -31.740915298461914, -30.782670974731445, -29.82442855834961, -28.86618423461914, -27.907941818237305, -26.94969940185547, -25.991455078125, -25.033212661743164, -24.074970245361328, -23.11672592163086, -22.158483505249023, -21.200241088867188, -20.24199676513672, -19.283754348754883, -18.325511932373047, -17.367267608642578, -16.409025192260742, -15.450780868530273, -14.492538452148438, -13.534295082092285, -12.576051712036133, -11.617809295654297, -10.659565925598145, -9.701322555541992, -8.74307918548584, -7.784836292266846, -6.826593399047852, -5.868350028991699, -4.910106658935547, -3.9518637657165527, -2.9936208724975586, -2.0353755950927734, -1.0771324634552002, -0.11888933181762695, 0.8393537998199463, 1.7975969314575195, 2.755840301513672, 3.714083194732666, 4.67232608795166, 5.6305694580078125, 6.588812828063965, 7.547055721282959, 8.505298614501953, 9.463541984558105, 10.421785354614258, 11.380027770996094, 12.338271141052246, 13.296514511108398, 14.25475788116455, 15.213001251220703, 16.17124366760254, 17.129486083984375, 18.087730407714844, 19.04597282409668, 20.004215240478516, 20.962459564208984, 21.92070198059082, 22.87894630432129, 23.837188720703125, 24.795433044433594, 25.75367546081543, 26.711917877197266, 27.670162200927734, 28.62840461730957]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 16.0, 7.0, 8.0, 11.0, 17.0, 16.0, 18.0, 25.0, 22.0, 28.0, 29.0, 41.0, 37.0, 35.0, 52.0, 41.0, 34.0, 44.0, 40.0, 42.0, 51.0, 40.0, 30.0, 38.0, 34.0, 29.0, 36.0, 21.0, 16.0, 18.0, 16.0, 15.0, 13.0, 15.0, 6.0, 8.0, 4.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-4.75390625, -4.62432861328125, -4.4947509765625, -4.36517333984375, -4.235595703125, -4.10601806640625, -3.9764404296875, -3.84686279296875, -3.71728515625, -3.58770751953125, -3.4581298828125, -3.32855224609375, -3.198974609375, -3.06939697265625, -2.9398193359375, -2.81024169921875, -2.6806640625, -2.55108642578125, -2.4215087890625, -2.29193115234375, -2.162353515625, -2.03277587890625, -1.9031982421875, -1.77362060546875, -1.64404296875, -1.51446533203125, -1.3848876953125, -1.25531005859375, -1.125732421875, -0.99615478515625, -0.8665771484375, -0.73699951171875, -0.607421875, -0.47784423828125, -0.3482666015625, -0.21868896484375, -0.089111328125, 0.04046630859375, 0.1700439453125, 0.29962158203125, 0.42919921875, 0.55877685546875, 0.6883544921875, 0.81793212890625, 0.947509765625, 1.07708740234375, 1.2066650390625, 1.33624267578125, 1.4658203125, 1.59539794921875, 1.7249755859375, 1.85455322265625, 1.984130859375, 2.11370849609375, 2.2432861328125, 2.37286376953125, 2.50244140625, 2.63201904296875, 2.7615966796875, 2.89117431640625, 3.020751953125, 3.15032958984375, 3.2799072265625, 3.40948486328125, 3.5390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 8.0, 11.0, 7.0, 15.0, 12.0, 11.0, 20.0, 21.0, 24.0, 37.0, 59.0, 77.0, 106.0, 167.0, 285.0, 676.0, 2834.0, 33418.0, 785883.0, 2789221.0, 553822.0, 23917.0, 2219.0, 581.0, 283.0, 162.0, 99.0, 64.0, 58.0, 34.0, 33.0, 21.0, 15.0, 12.0, 9.0, 10.0, 10.0, 5.0, 9.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0, -10.6895751953125, -10.379150390625, -10.0687255859375, -9.75830078125, -9.4478759765625, -9.137451171875, -8.8270263671875, -8.5166015625, -8.2061767578125, -7.895751953125, -7.5853271484375, -7.27490234375, -6.9644775390625, -6.654052734375, -6.3436279296875, -6.033203125, -5.7227783203125, -5.412353515625, -5.1019287109375, -4.79150390625, -4.4810791015625, -4.170654296875, -3.8602294921875, -3.5498046875, -3.2393798828125, -2.928955078125, -2.6185302734375, -2.30810546875, -1.9976806640625, -1.687255859375, -1.3768310546875, -1.06640625, -0.7559814453125, -0.445556640625, -0.1351318359375, 0.17529296875, 0.4857177734375, 0.796142578125, 1.1065673828125, 1.4169921875, 1.7274169921875, 2.037841796875, 2.3482666015625, 2.65869140625, 2.9691162109375, 3.279541015625, 3.5899658203125, 3.900390625, 4.2108154296875, 4.521240234375, 4.8316650390625, 5.14208984375, 5.4525146484375, 5.762939453125, 6.0733642578125, 6.3837890625, 6.6942138671875, 7.004638671875, 7.3150634765625, 7.62548828125, 7.9359130859375, 8.246337890625, 8.5567626953125, 8.8671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 17.0, 26.0, 20.0, 43.0, 50.0, 74.0, 98.0, 125.0, 148.0, 230.0, 317.0, 371.0, 411.0, 443.0, 401.0, 326.0, 245.0, 185.0, 135.0, 93.0, 60.0, 53.0, 36.0, 37.0, 29.0, 15.0, 8.0, 14.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.41644287109375, -7.1766357421875, -6.93682861328125, -6.697021484375, -6.45721435546875, -6.2174072265625, -5.97760009765625, -5.73779296875, -5.49798583984375, -5.2581787109375, -5.01837158203125, -4.778564453125, -4.53875732421875, -4.2989501953125, -4.05914306640625, -3.8193359375, -3.57952880859375, -3.3397216796875, -3.09991455078125, -2.860107421875, -2.62030029296875, -2.3804931640625, -2.14068603515625, -1.90087890625, -1.66107177734375, -1.4212646484375, -1.18145751953125, -0.941650390625, -0.70184326171875, -0.4620361328125, -0.22222900390625, 0.017578125, 0.25738525390625, 0.4971923828125, 0.73699951171875, 0.976806640625, 1.21661376953125, 1.4564208984375, 1.69622802734375, 1.93603515625, 2.17584228515625, 2.4156494140625, 2.65545654296875, 2.895263671875, 3.13507080078125, 3.3748779296875, 3.61468505859375, 3.8544921875, 4.09429931640625, 4.3341064453125, 4.57391357421875, 4.813720703125, 5.05352783203125, 5.2933349609375, 5.53314208984375, 5.77294921875, 6.01275634765625, 6.2525634765625, 6.49237060546875, 6.732177734375, 6.97198486328125, 7.2117919921875, 7.45159912109375, 7.69140625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 14.0, 18.0, 17.0, 27.0, 39.0, 52.0, 66.0, 78.0, 92.0, 146.0, 190.0, 259.0, 388.0, 556.0, 2700.0, 316918.0, 3824235.0, 45760.0, 1124.0, 464.0, 277.0, 175.0, 154.0, 118.0, 114.0, 73.0, 53.0, 41.0, 24.0, 27.0, 20.0, 14.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.21875, -25.40771484375, -24.5966796875, -23.78564453125, -22.974609375, -22.16357421875, -21.3525390625, -20.54150390625, -19.73046875, -18.91943359375, -18.1083984375, -17.29736328125, -16.486328125, -15.67529296875, -14.8642578125, -14.05322265625, -13.2421875, -12.43115234375, -11.6201171875, -10.80908203125, -9.998046875, -9.18701171875, -8.3759765625, -7.56494140625, -6.75390625, -5.94287109375, -5.1318359375, -4.32080078125, -3.509765625, -2.69873046875, -1.8876953125, -1.07666015625, -0.265625, 0.54541015625, 1.3564453125, 2.16748046875, 2.978515625, 3.78955078125, 4.6005859375, 5.41162109375, 6.22265625, 7.03369140625, 7.8447265625, 8.65576171875, 9.466796875, 10.27783203125, 11.0888671875, 11.89990234375, 12.7109375, 13.52197265625, 14.3330078125, 15.14404296875, 15.955078125, 16.76611328125, 17.5771484375, 18.38818359375, 19.19921875, 20.01025390625, 20.8212890625, 21.63232421875, 22.443359375, 23.25439453125, 24.0654296875, 24.87646484375, 25.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 52.0, 185.0, 376.0, 286.0, 93.0, 12.0, 2.0, 1.0, 0.0, 1.0], "bins": [-181.3253936767578, -178.1287078857422, -174.93203735351562, -171.7353515625, -168.53868103027344, -165.3419952392578, -162.14532470703125, -158.94863891601562, -155.751953125, -152.55526733398438, -149.3585968017578, -146.1619110107422, -142.96524047851562, -139.7685546875, -136.57186889648438, -133.3751983642578, -130.17852783203125, -126.98184967041016, -123.78517150878906, -120.58848571777344, -117.39180755615234, -114.19512939453125, -110.99845123291016, -107.80177307128906, -104.60508728027344, -101.40840911865234, -98.21173095703125, -95.01504516601562, -91.81836700439453, -88.62168884277344, -85.42501068115234, -82.22833251953125, -79.03164672851562, -75.83496856689453, -72.63829040527344, -69.44160461425781, -66.24492645263672, -63.048248291015625, -59.85157012939453, -56.65489196777344, -53.458213806152344, -50.26153564453125, -47.06485366821289, -43.8681755065918, -40.6714973449707, -37.474815368652344, -34.27813720703125, -31.081459045410156, -27.88477897644043, -24.688098907470703, -21.49142074584961, -18.294740676879883, -15.098061561584473, -11.901382446289062, -8.704702377319336, -5.508024215698242, -2.3113441467285156, 0.8853352069854736, 4.082014560699463, 7.278694152832031, 10.475373268127441, 13.672052383422852, 16.868732452392578, 20.065410614013672, 23.2620906829834]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 12.0, 6.0, 13.0, 13.0, 20.0, 18.0, 24.0, 26.0, 30.0, 37.0, 27.0, 47.0, 36.0, 36.0, 37.0, 41.0, 40.0, 42.0, 44.0, 42.0, 42.0, 42.0, 31.0, 39.0, 38.0, 29.0, 27.0, 25.0, 18.0, 22.0, 14.0, 18.0, 16.0, 8.0, 7.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.400285720825195, -26.552488327026367, -25.704692840576172, -24.856895446777344, -24.009098052978516, -23.161300659179688, -22.313505172729492, -21.465707778930664, -20.61791229248047, -19.77011489868164, -18.922319412231445, -18.074522018432617, -17.22672462463379, -16.378929138183594, -15.531131744384766, -14.683334350585938, -13.83553695678711, -12.987740516662598, -12.13994312286377, -11.292146682739258, -10.44434928894043, -9.596552848815918, -8.748756408691406, -7.900959491729736, -7.053162574768066, -6.2053656578063965, -5.357568740844727, -4.509772300720215, -3.661975383758545, -2.814178466796875, -1.9663820266723633, -1.1185851097106934, -0.2707862854003906, 0.5770105123519897, 1.4248073101043701, 2.272603988647461, 3.120400905609131, 3.968197822570801, 4.8159942626953125, 5.663791179656982, 6.511588096618652, 7.359385013580322, 8.207181930541992, 9.054978370666504, 9.902774810791016, 10.750572204589844, 11.598368644714355, 12.446165084838867, 13.293962478637695, 14.141758918762207, 14.989556312561035, 15.837352752685547, 16.685150146484375, 17.532947540283203, 18.3807430267334, 19.228540420532227, 20.076335906982422, 20.92413330078125, 21.771928787231445, 22.619726181030273, 23.4675235748291, 24.315319061279297, 25.163116455078125, 26.010913848876953, 26.85871124267578]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 13.0, 16.0, 21.0, 17.0, 26.0, 20.0, 30.0, 26.0, 29.0, 30.0, 34.0, 41.0, 32.0, 30.0, 55.0, 39.0, 45.0, 36.0, 38.0, 32.0, 41.0, 35.0, 41.0, 32.0, 25.0, 23.0, 19.0, 23.0, 18.0, 15.0, 8.0, 8.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.507965087890625, -3.39288330078125, -3.277801513671875, -3.1627197265625, -3.047637939453125, -2.93255615234375, -2.817474365234375, -2.702392578125, -2.587310791015625, -2.47222900390625, -2.357147216796875, -2.2420654296875, -2.126983642578125, -2.01190185546875, -1.896820068359375, -1.78173828125, -1.666656494140625, -1.55157470703125, -1.436492919921875, -1.3214111328125, -1.206329345703125, -1.09124755859375, -0.976165771484375, -0.861083984375, -0.746002197265625, -0.63092041015625, -0.515838623046875, -0.4007568359375, -0.285675048828125, -0.17059326171875, -0.055511474609375, 0.0595703125, 0.174652099609375, 0.28973388671875, 0.404815673828125, 0.5198974609375, 0.634979248046875, 0.75006103515625, 0.865142822265625, 0.980224609375, 1.095306396484375, 1.21038818359375, 1.325469970703125, 1.4405517578125, 1.555633544921875, 1.67071533203125, 1.785797119140625, 1.90087890625, 2.015960693359375, 2.13104248046875, 2.246124267578125, 2.3612060546875, 2.476287841796875, 2.59136962890625, 2.706451416015625, 2.821533203125, 2.936614990234375, 3.05169677734375, 3.166778564453125, 3.2818603515625, 3.396942138671875, 3.51202392578125, 3.627105712890625, 3.7421875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 13.0, 22.0, 25.0, 43.0, 67.0, 98.0, 129.0, 188.0, 274.0, 402.0, 578.0, 834.0, 1165.0, 1766.0, 2577.0, 3796.0, 5471.0, 8384.0, 12478.0, 19027.0, 29713.0, 47320.0, 78849.0, 146605.0, 282241.0, 170482.0, 89136.0, 52020.0, 32468.0, 20932.0, 13398.0, 9145.0, 5962.0, 3992.0, 2753.0, 1932.0, 1370.0, 925.0, 577.0, 424.0, 326.0, 185.0, 132.0, 125.0, 68.0, 54.0, 23.0, 18.0, 20.0, 11.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.62060546875, -0.6015701293945312, -0.5825347900390625, -0.5634994506835938, -0.544464111328125, -0.5254287719726562, -0.5063934326171875, -0.48735809326171875, -0.46832275390625, -0.44928741455078125, -0.4302520751953125, -0.41121673583984375, -0.392181396484375, -0.37314605712890625, -0.3541107177734375, -0.33507537841796875, -0.3160400390625, -0.29700469970703125, -0.2779693603515625, -0.25893402099609375, -0.239898681640625, -0.22086334228515625, -0.2018280029296875, -0.18279266357421875, -0.16375732421875, -0.14472198486328125, -0.1256866455078125, -0.10665130615234375, -0.087615966796875, -0.06858062744140625, -0.0495452880859375, -0.03050994873046875, -0.011474609375, 0.00756072998046875, 0.0265960693359375, 0.04563140869140625, 0.064666748046875, 0.08370208740234375, 0.1027374267578125, 0.12177276611328125, 0.14080810546875, 0.15984344482421875, 0.1788787841796875, 0.19791412353515625, 0.216949462890625, 0.23598480224609375, 0.2550201416015625, 0.27405548095703125, 0.2930908203125, 0.31212615966796875, 0.3311614990234375, 0.35019683837890625, 0.369232177734375, 0.38826751708984375, 0.4073028564453125, 0.42633819580078125, 0.44537353515625, 0.46440887451171875, 0.4834442138671875, 0.5024795532226562, 0.521514892578125, 0.5405502319335938, 0.5595855712890625, 0.5786209106445312, 0.59765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 6.0, 11.0, 6.0, 16.0, 12.0, 19.0, 21.0, 23.0, 25.0, 24.0, 29.0, 22.0, 28.0, 33.0, 22.0, 42.0, 39.0, 43.0, 1069.0, 45.0, 28.0, 40.0, 36.0, 48.0, 37.0, 37.0, 34.0, 36.0, 32.0, 18.0, 22.0, 23.0, 19.0, 17.0, 8.0, 14.0, 6.0, 5.0, 6.0, 3.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.3487548828125, -2.271728515625, -2.1947021484375, -2.11767578125, -2.0406494140625, -1.963623046875, -1.8865966796875, -1.8095703125, -1.7325439453125, -1.655517578125, -1.5784912109375, -1.50146484375, -1.4244384765625, -1.347412109375, -1.2703857421875, -1.193359375, -1.1163330078125, -1.039306640625, -0.9622802734375, -0.88525390625, -0.8082275390625, -0.731201171875, -0.6541748046875, -0.5771484375, -0.5001220703125, -0.423095703125, -0.3460693359375, -0.26904296875, -0.1920166015625, -0.114990234375, -0.0379638671875, 0.0390625, 0.1160888671875, 0.193115234375, 0.2701416015625, 0.34716796875, 0.4241943359375, 0.501220703125, 0.5782470703125, 0.6552734375, 0.7322998046875, 0.809326171875, 0.8863525390625, 0.96337890625, 1.0404052734375, 1.117431640625, 1.1944580078125, 1.271484375, 1.3485107421875, 1.425537109375, 1.5025634765625, 1.57958984375, 1.6566162109375, 1.733642578125, 1.8106689453125, 1.8876953125, 1.9647216796875, 2.041748046875, 2.1187744140625, 2.19580078125, 2.2728271484375, 2.349853515625, 2.4268798828125, 2.50390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 13.0, 26.0, 47.0, 60.0, 81.0, 124.0, 189.0, 232.0, 306.0, 477.0, 653.0, 944.0, 1371.0, 2014.0, 2689.0, 3915.0, 5623.0, 8057.0, 11734.0, 16563.0, 24304.0, 35424.0, 53516.0, 86596.0, 163923.0, 1307802.0, 140440.0, 77334.0, 48535.0, 32141.0, 21961.0, 15181.0, 10528.0, 7489.0, 5188.0, 3615.0, 2512.0, 1774.0, 1189.0, 783.0, 591.0, 390.0, 268.0, 176.0, 128.0, 61.0, 58.0, 36.0, 15.0, 14.0, 13.0, 11.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.5380859375, -0.5214767456054688, -0.5048675537109375, -0.48825836181640625, -0.471649169921875, -0.45503997802734375, -0.4384307861328125, -0.42182159423828125, -0.40521240234375, -0.38860321044921875, -0.3719940185546875, -0.35538482666015625, -0.338775634765625, -0.32216644287109375, -0.3055572509765625, -0.28894805908203125, -0.2723388671875, -0.25572967529296875, -0.2391204833984375, -0.22251129150390625, -0.205902099609375, -0.18929290771484375, -0.1726837158203125, -0.15607452392578125, -0.13946533203125, -0.12285614013671875, -0.1062469482421875, -0.08963775634765625, -0.073028564453125, -0.05641937255859375, -0.0398101806640625, -0.02320098876953125, -0.006591796875, 0.01001739501953125, 0.0266265869140625, 0.04323577880859375, 0.059844970703125, 0.07645416259765625, 0.0930633544921875, 0.10967254638671875, 0.12628173828125, 0.14289093017578125, 0.1595001220703125, 0.17610931396484375, 0.192718505859375, 0.20932769775390625, 0.2259368896484375, 0.24254608154296875, 0.2591552734375, 0.27576446533203125, 0.2923736572265625, 0.30898284912109375, 0.325592041015625, 0.34220123291015625, 0.3588104248046875, 0.37541961669921875, 0.39202880859375, 0.40863800048828125, 0.4252471923828125, 0.44185638427734375, 0.458465576171875, 0.47507476806640625, 0.4916839599609375, 0.5082931518554688, 0.52490234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 9.0, 5.0, 7.0, 12.0, 18.0, 17.0, 18.0, 24.0, 28.0, 28.0, 39.0, 35.0, 63.0, 68.0, 68.0, 71.0, 70.0, 65.0, 68.0, 55.0, 38.0, 34.0, 42.0, 27.0, 28.0, 11.0, 5.0, 9.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.00014094635844230652, -0.00013621896505355835, -0.00013149157166481018, -0.000126764178276062, -0.00012203678488731384, -0.00011730939149856567, -0.0001125819981098175, -0.00010785460472106934, -0.00010312721133232117, -9.8399817943573e-05, -9.367242455482483e-05, -8.894503116607666e-05, -8.421763777732849e-05, -7.949024438858032e-05, -7.476285099983215e-05, -7.003545761108398e-05, -6.530806422233582e-05, -6.0580670833587646e-05, -5.585327744483948e-05, -5.112588405609131e-05, -4.639849066734314e-05, -4.167109727859497e-05, -3.69437038898468e-05, -3.221631050109863e-05, -2.7488917112350464e-05, -2.2761523723602295e-05, -1.8034130334854126e-05, -1.3306736946105957e-05, -8.579343557357788e-06, -3.851950168609619e-06, 8.754432201385498e-07, 5.602836608886719e-06, 1.0330229997634888e-05, 1.5057623386383057e-05, 1.9785016775131226e-05, 2.4512410163879395e-05, 2.9239803552627563e-05, 3.396719694137573e-05, 3.86945903301239e-05, 4.342198371887207e-05, 4.814937710762024e-05, 5.287677049636841e-05, 5.760416388511658e-05, 6.233155727386475e-05, 6.705895066261292e-05, 7.178634405136108e-05, 7.651373744010925e-05, 8.124113082885742e-05, 8.596852421760559e-05, 9.069591760635376e-05, 9.542331099510193e-05, 0.0001001507043838501, 0.00010487809777259827, 0.00010960549116134644, 0.0001143328845500946, 0.00011906027793884277, 0.00012378767132759094, 0.0001285150647163391, 0.00013324245810508728, 0.00013796985149383545, 0.00014269724488258362, 0.0001474246382713318, 0.00015215203166007996, 0.00015687942504882812]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 5.0, 16.0, 11.0, 16.0, 24.0, 36.0, 50.0, 70.0, 80.0, 119.0, 237.0, 511.0, 2830.0, 1034999.0, 8152.0, 605.0, 266.0, 155.0, 75.0, 58.0, 53.0, 38.0, 27.0, 24.0, 18.0, 13.0, 18.0, 9.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003475189208984375, -0.003368556499481201, -0.0032619237899780273, -0.0031552910804748535, -0.0030486583709716797, -0.002942025661468506, -0.002835392951965332, -0.002728760242462158, -0.0026221275329589844, -0.0025154948234558105, -0.0024088621139526367, -0.002302229404449463, -0.002195596694946289, -0.0020889639854431152, -0.0019823312759399414, -0.0018756985664367676, -0.0017690658569335938, -0.00166243314743042, -0.001555800437927246, -0.0014491677284240723, -0.0013425350189208984, -0.0012359023094177246, -0.0011292695999145508, -0.001022636890411377, -0.0009160041809082031, -0.0008093714714050293, -0.0007027387619018555, -0.0005961060523986816, -0.0004894733428955078, -0.000382840633392334, -0.00027620792388916016, -0.00016957521438598633, -6.29425048828125e-05, 4.369020462036133e-05, 0.00015032291412353516, 0.000256955623626709, 0.0003635883331298828, 0.00047022104263305664, 0.0005768537521362305, 0.0006834864616394043, 0.0007901191711425781, 0.000896751880645752, 0.0010033845901489258, 0.0011100172996520996, 0.0012166500091552734, 0.0013232827186584473, 0.001429915428161621, 0.001536548137664795, 0.0016431808471679688, 0.0017498135566711426, 0.0018564462661743164, 0.0019630789756774902, 0.002069711685180664, 0.002176344394683838, 0.0022829771041870117, 0.0023896098136901855, 0.0024962425231933594, 0.002602875232696533, 0.002709507942199707, 0.002816140651702881, 0.0029227733612060547, 0.0030294060707092285, 0.0031360387802124023, 0.003242671489715576, 0.00334930419921875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 64.0, 330.0, 447.0, 145.0, 23.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005411451566033065, -0.0005305749364197254, -0.0005200047162361443, -0.0005094344960525632, -0.0004988642176613212, -0.00048829399747774, -0.00047772377729415894, -0.0004671535571105778, -0.0004565833369269967, -0.0004460131167434156, -0.000435442867456004, -0.0004248726472724229, -0.0004143024270888418, -0.0004037321778014302, -0.0003931619576178491, -0.000382591737434268, -0.00037202148814685643, -0.0003614512679632753, -0.00035088101867586374, -0.00034031079849228263, -0.0003297405783087015, -0.0003191703581251204, -0.00030860010883770883, -0.0002980298886541277, -0.00028745963936671615, -0.00027688941918313503, -0.00026631916989572346, -0.00025574894971214235, -0.00024517872952856123, -0.0002346084947930649, -0.00022403826005756855, -0.00021346803987398744, -0.00020289779058657587, -0.00019232755585107952, -0.0001817573356674984, -0.00017118710093200207, -0.00016061688074842095, -0.0001500466460129246, -0.00013947641127742827, -0.00012890619109384716, -0.00011833595635835081, -0.00010776572889881209, -9.719550143927336e-05, -8.662526670377702e-05, -7.605503924423829e-05, -6.548481178469956e-05, -5.491457704920322e-05, -4.434434958966449e-05, -3.377412213012576e-05, -2.320389285159763e-05, -1.2633663573069498e-05, -2.063432475551963e-06, 8.506794983986765e-06, 1.9077022443525493e-05, 2.9647257179021835e-05, 4.021748463856056e-05, 5.078771209809929e-05, 6.135793955763802e-05, 7.192816701717675e-05, 8.249840175267309e-05, 9.306862921221182e-05, 0.00010363885667175055, 0.00011420909140724689, 0.00012477932614274323, 0.00013534954632632434]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 12.0, 9.0, 8.0, 13.0, 25.0, 20.0, 16.0, 30.0, 45.0, 33.0, 27.0, 31.0, 47.0, 42.0, 47.0, 48.0, 43.0, 43.0, 51.0, 53.0, 48.0, 39.0, 32.0, 37.0, 27.0, 35.0, 32.0, 17.0, 15.0, 14.0, 10.0, 16.0, 14.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.338689804077148e-05, -8.092913776636124e-05, -7.847137749195099e-05, -7.601361721754074e-05, -7.355585694313049e-05, -7.109809666872025e-05, -6.864033639431e-05, -6.618257611989975e-05, -6.37248158454895e-05, -6.126705557107925e-05, -5.8809295296669006e-05, -5.635153502225876e-05, -5.389377474784851e-05, -5.143601447343826e-05, -4.8978254199028015e-05, -4.652049392461777e-05, -4.406273365020752e-05, -4.160497337579727e-05, -3.9147213101387024e-05, -3.6689452826976776e-05, -3.423169255256653e-05, -3.177393227815628e-05, -2.9316172003746033e-05, -2.6858411729335785e-05, -2.4400651454925537e-05, -2.194289118051529e-05, -1.948513090610504e-05, -1.7027370631694794e-05, -1.4569610357284546e-05, -1.2111850082874298e-05, -9.65408980846405e-06, -7.1963295340538025e-06, -4.738569259643555e-06, -2.280808985233307e-06, 1.7695128917694092e-07, 2.6347115635871887e-06, 5.0924718379974365e-06, 7.550232112407684e-06, 1.0007992386817932e-05, 1.246575266122818e-05, 1.4923512935638428e-05, 1.7381273210048676e-05, 1.9839033484458923e-05, 2.229679375886917e-05, 2.475455403327942e-05, 2.7212314307689667e-05, 2.9670074582099915e-05, 3.212783485651016e-05, 3.458559513092041e-05, 3.704335540533066e-05, 3.9501115679740906e-05, 4.1958875954151154e-05, 4.44166362285614e-05, 4.687439650297165e-05, 4.93321567773819e-05, 5.1789917051792145e-05, 5.424767732620239e-05, 5.670543760061264e-05, 5.916319787502289e-05, 6.162095814943314e-05, 6.407871842384338e-05, 6.653647869825363e-05, 6.899423897266388e-05, 7.145199924707413e-05, 7.390975952148438e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 13.0, 16.0, 21.0, 17.0, 26.0, 20.0, 30.0, 26.0, 29.0, 30.0, 34.0, 41.0, 32.0, 30.0, 55.0, 39.0, 45.0, 36.0, 38.0, 32.0, 41.0, 35.0, 41.0, 32.0, 25.0, 23.0, 19.0, 23.0, 18.0, 15.0, 8.0, 8.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.507965087890625, -3.39288330078125, -3.277801513671875, -3.1627197265625, -3.047637939453125, -2.93255615234375, -2.817474365234375, -2.702392578125, -2.587310791015625, -2.47222900390625, -2.357147216796875, -2.2420654296875, -2.126983642578125, -2.01190185546875, -1.896820068359375, -1.78173828125, -1.666656494140625, -1.55157470703125, -1.436492919921875, -1.3214111328125, -1.206329345703125, -1.09124755859375, -0.976165771484375, -0.861083984375, -0.746002197265625, -0.63092041015625, -0.515838623046875, -0.4007568359375, -0.285675048828125, -0.17059326171875, -0.055511474609375, 0.0595703125, 0.174652099609375, 0.28973388671875, 0.404815673828125, 0.5198974609375, 0.634979248046875, 0.75006103515625, 0.865142822265625, 0.980224609375, 1.095306396484375, 1.21038818359375, 1.325469970703125, 1.4405517578125, 1.555633544921875, 1.67071533203125, 1.785797119140625, 1.90087890625, 2.015960693359375, 2.13104248046875, 2.246124267578125, 2.3612060546875, 2.476287841796875, 2.59136962890625, 2.706451416015625, 2.821533203125, 2.936614990234375, 3.05169677734375, 3.166778564453125, 3.2818603515625, 3.396942138671875, 3.51202392578125, 3.627105712890625, 3.7421875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 10.0, 11.0, 16.0, 24.0, 21.0, 34.0, 40.0, 44.0, 90.0, 117.0, 176.0, 231.0, 372.0, 676.0, 1407.0, 2775.0, 6289.0, 14848.0, 34883.0, 84010.0, 196458.0, 371859.0, 191496.0, 81830.0, 34303.0, 14367.0, 6225.0, 2749.0, 1333.0, 702.0, 374.0, 220.0, 145.0, 102.0, 77.0, 57.0, 42.0, 25.0, 23.0, 22.0, 11.0, 13.0, 12.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.411529541015625, -3.29962158203125, -3.187713623046875, -3.0758056640625, -2.963897705078125, -2.85198974609375, -2.740081787109375, -2.628173828125, -2.516265869140625, -2.40435791015625, -2.292449951171875, -2.1805419921875, -2.068634033203125, -1.95672607421875, -1.844818115234375, -1.73291015625, -1.621002197265625, -1.50909423828125, -1.397186279296875, -1.2852783203125, -1.173370361328125, -1.06146240234375, -0.949554443359375, -0.837646484375, -0.725738525390625, -0.61383056640625, -0.501922607421875, -0.3900146484375, -0.278106689453125, -0.16619873046875, -0.054290771484375, 0.0576171875, 0.169525146484375, 0.28143310546875, 0.393341064453125, 0.5052490234375, 0.617156982421875, 0.72906494140625, 0.840972900390625, 0.952880859375, 1.064788818359375, 1.17669677734375, 1.288604736328125, 1.4005126953125, 1.512420654296875, 1.62432861328125, 1.736236572265625, 1.84814453125, 1.960052490234375, 2.07196044921875, 2.183868408203125, 2.2957763671875, 2.407684326171875, 2.51959228515625, 2.631500244140625, 2.743408203125, 2.855316162109375, 2.96722412109375, 3.079132080078125, 3.1910400390625, 3.302947998046875, 3.41485595703125, 3.526763916015625, 3.638671875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 14.0, 15.0, 15.0, 16.0, 15.0, 13.0, 22.0, 26.0, 18.0, 27.0, 35.0, 33.0, 40.0, 35.0, 54.0, 90.0, 174.0, 1505.0, 344.0, 124.0, 73.0, 48.0, 45.0, 34.0, 34.0, 17.0, 27.0, 23.0, 21.0, 18.0, 15.0, 14.0, 15.0, 13.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8359375, -11.3946533203125, -10.953369140625, -10.5120849609375, -10.07080078125, -9.6295166015625, -9.188232421875, -8.7469482421875, -8.3056640625, -7.8643798828125, -7.423095703125, -6.9818115234375, -6.54052734375, -6.0992431640625, -5.657958984375, -5.2166748046875, -4.775390625, -4.3341064453125, -3.892822265625, -3.4515380859375, -3.01025390625, -2.5689697265625, -2.127685546875, -1.6864013671875, -1.2451171875, -0.8038330078125, -0.362548828125, 0.0787353515625, 0.52001953125, 0.9613037109375, 1.402587890625, 1.8438720703125, 2.28515625, 2.7264404296875, 3.167724609375, 3.6090087890625, 4.05029296875, 4.4915771484375, 4.932861328125, 5.3741455078125, 5.8154296875, 6.2567138671875, 6.697998046875, 7.1392822265625, 7.58056640625, 8.0218505859375, 8.463134765625, 8.9044189453125, 9.345703125, 9.7869873046875, 10.228271484375, 10.6695556640625, 11.11083984375, 11.5521240234375, 11.993408203125, 12.4346923828125, 12.8759765625, 13.3172607421875, 13.758544921875, 14.1998291015625, 14.64111328125, 15.0823974609375, 15.523681640625, 15.9649658203125, 16.40625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 7.0, 9.0, 9.0, 23.0, 32.0, 25.0, 71.0, 102.0, 161.0, 331.0, 790.0, 15921.0, 3124723.0, 2358.0, 476.0, 226.0, 141.0, 95.0, 69.0, 39.0, 29.0, 15.0, 8.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.375, -68.9365234375, -66.498046875, -64.0595703125, -61.62109375, -59.1826171875, -56.744140625, -54.3056640625, -51.8671875, -49.4287109375, -46.990234375, -44.5517578125, -42.11328125, -39.6748046875, -37.236328125, -34.7978515625, -32.359375, -29.9208984375, -27.482421875, -25.0439453125, -22.60546875, -20.1669921875, -17.728515625, -15.2900390625, -12.8515625, -10.4130859375, -7.974609375, -5.5361328125, -3.09765625, -0.6591796875, 1.779296875, 4.2177734375, 6.65625, 9.0947265625, 11.533203125, 13.9716796875, 16.41015625, 18.8486328125, 21.287109375, 23.7255859375, 26.1640625, 28.6025390625, 31.041015625, 33.4794921875, 35.91796875, 38.3564453125, 40.794921875, 43.2333984375, 45.671875, 48.1103515625, 50.548828125, 52.9873046875, 55.42578125, 57.8642578125, 60.302734375, 62.7412109375, 65.1796875, 67.6181640625, 70.056640625, 72.4951171875, 74.93359375, 77.3720703125, 79.810546875, 82.2490234375, 84.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 713.0, 301.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.10687255859375, -18.36716079711914, -13.627450942993164, -8.887740135192871, -4.148029327392578, 0.5916824340820312, 5.331392288208008, 10.071102142333984, 14.810813903808594, 19.550525665283203, 24.29023551940918, 29.029945373535156, 33.769657135009766, 38.509368896484375, 43.24907684326172, 47.98878860473633, 52.72850036621094, 57.46821212768555, 62.207923889160156, 66.9476318359375, 71.68734741210938, 76.42705535888672, 81.16676330566406, 85.90647888183594, 90.64618682861328, 95.38589477539062, 100.1256103515625, 104.86531829833984, 109.60502624511719, 114.34474182128906, 119.0844497680664, 123.82415771484375, 128.56387329101562, 133.3035888671875, 138.0432891845703, 142.7830047607422, 147.52272033691406, 152.26242065429688, 157.00213623046875, 161.74185180664062, 166.4815673828125, 171.22128295898438, 175.9609832763672, 180.70069885253906, 185.44041442871094, 190.18011474609375, 194.91983032226562, 199.6595458984375, 204.3992462158203, 209.1389617919922, 213.878662109375, 218.61837768554688, 223.35809326171875, 228.09780883789062, 232.83750915527344, 237.5772247314453, 242.31692504882812, 247.056640625, 251.7963409423828, 256.53607177734375, 261.2757568359375, 266.0154724121094, 270.75518798828125, 275.4949035644531, 280.234619140625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 2.0, 5.0, 10.0, 13.0, 12.0, 14.0, 16.0, 15.0, 19.0, 14.0, 21.0, 24.0, 26.0, 42.0, 43.0, 30.0, 36.0, 43.0, 38.0, 35.0, 44.0, 56.0, 50.0, 37.0, 30.0, 41.0, 31.0, 28.0, 29.0, 30.0, 31.0, 20.0, 22.0, 22.0, 18.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.92547607421875, -33.87828063964844, -32.831085205078125, -31.78388786315918, -30.736690521240234, -29.689495086669922, -28.64229965209961, -27.595104217529297, -26.54790687561035, -25.50071144104004, -24.453514099121094, -23.40631866455078, -22.35912322998047, -21.311925888061523, -20.26473045349121, -19.217533111572266, -18.170337677001953, -17.12314224243164, -16.075944900512695, -15.028749465942383, -13.981553077697754, -12.934356689453125, -11.887161254882812, -10.839964866638184, -9.792768478393555, -8.745572090148926, -7.698376178741455, -6.651180267333984, -5.6039838790893555, -4.556787490844727, -3.509591579437256, -2.462395668029785, -1.4151992797851562, -0.36800312995910645, 0.6791930198669434, 1.7263891696929932, 2.773585319519043, 3.820781707763672, 4.867977619171143, 5.915173530578613, 6.962369918823242, 8.009566307067871, 9.0567626953125, 10.103958129882812, 11.151154518127441, 12.19835090637207, 13.245546340942383, 14.292742729187012, 15.33993911743164, 16.387134552001953, 17.4343318939209, 18.48152732849121, 19.528724670410156, 20.57592010498047, 21.62311553955078, 22.670310974121094, 23.71750831604004, 24.76470375061035, 25.811901092529297, 26.85909652709961, 27.906291961669922, 28.953489303588867, 30.00068473815918, 31.047882080078125, 32.09507751464844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 12.0, 10.0, 9.0, 20.0, 17.0, 20.0, 17.0, 18.0, 31.0, 38.0, 23.0, 28.0, 38.0, 48.0, 41.0, 37.0, 37.0, 34.0, 43.0, 46.0, 51.0, 45.0, 43.0, 23.0, 46.0, 39.0, 27.0, 16.0, 20.0, 24.0, 9.0, 15.0, 8.0, 11.0, 12.0, 5.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.1005859375, -3.966796875, -3.8330078125, -3.69921875, -3.5654296875, -3.431640625, -3.2978515625, -3.1640625, -3.0302734375, -2.896484375, -2.7626953125, -2.62890625, -2.4951171875, -2.361328125, -2.2275390625, -2.09375, -1.9599609375, -1.826171875, -1.6923828125, -1.55859375, -1.4248046875, -1.291015625, -1.1572265625, -1.0234375, -0.8896484375, -0.755859375, -0.6220703125, -0.48828125, -0.3544921875, -0.220703125, -0.0869140625, 0.046875, 0.1806640625, 0.314453125, 0.4482421875, 0.58203125, 0.7158203125, 0.849609375, 0.9833984375, 1.1171875, 1.2509765625, 1.384765625, 1.5185546875, 1.65234375, 1.7861328125, 1.919921875, 2.0537109375, 2.1875, 2.3212890625, 2.455078125, 2.5888671875, 2.72265625, 2.8564453125, 2.990234375, 3.1240234375, 3.2578125, 3.3916015625, 3.525390625, 3.6591796875, 3.79296875, 3.9267578125, 4.060546875, 4.1943359375, 4.328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 2.0, 8.0, 9.0, 12.0, 20.0, 16.0, 18.0, 35.0, 25.0, 39.0, 43.0, 37.0, 57.0, 59.0, 90.0, 127.0, 147.0, 336.0, 791.0, 3354.0, 37166.0, 707376.0, 2696852.0, 704982.0, 37445.0, 3324.0, 850.0, 318.0, 155.0, 109.0, 88.0, 68.0, 53.0, 35.0, 44.0, 27.0, 31.0, 25.0, 24.0, 19.0, 9.0, 16.0, 12.0, 2.0, 8.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.453369140625, -8.15673828125, -7.860107421875, -7.5634765625, -7.266845703125, -6.97021484375, -6.673583984375, -6.376953125, -6.080322265625, -5.78369140625, -5.487060546875, -5.1904296875, -4.893798828125, -4.59716796875, -4.300537109375, -4.00390625, -3.707275390625, -3.41064453125, -3.114013671875, -2.8173828125, -2.520751953125, -2.22412109375, -1.927490234375, -1.630859375, -1.334228515625, -1.03759765625, -0.740966796875, -0.4443359375, -0.147705078125, 0.14892578125, 0.445556640625, 0.7421875, 1.038818359375, 1.33544921875, 1.632080078125, 1.9287109375, 2.225341796875, 2.52197265625, 2.818603515625, 3.115234375, 3.411865234375, 3.70849609375, 4.005126953125, 4.3017578125, 4.598388671875, 4.89501953125, 5.191650390625, 5.48828125, 5.784912109375, 6.08154296875, 6.378173828125, 6.6748046875, 6.971435546875, 7.26806640625, 7.564697265625, 7.861328125, 8.157958984375, 8.45458984375, 8.751220703125, 9.0478515625, 9.344482421875, 9.64111328125, 9.937744140625, 10.234375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 19.0, 28.0, 41.0, 45.0, 64.0, 133.0, 221.0, 258.0, 389.0, 493.0, 552.0, 527.0, 410.0, 238.0, 177.0, 121.0, 93.0, 66.0, 49.0, 23.0, 33.0, 17.0, 13.0, 10.0, 6.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.86016845703125, -6.5679931640625, -6.27581787109375, -5.983642578125, -5.69146728515625, -5.3992919921875, -5.10711669921875, -4.81494140625, -4.52276611328125, -4.2305908203125, -3.93841552734375, -3.646240234375, -3.35406494140625, -3.0618896484375, -2.76971435546875, -2.4775390625, -2.18536376953125, -1.8931884765625, -1.60101318359375, -1.308837890625, -1.01666259765625, -0.7244873046875, -0.43231201171875, -0.14013671875, 0.15203857421875, 0.4442138671875, 0.73638916015625, 1.028564453125, 1.32073974609375, 1.6129150390625, 1.90509033203125, 2.197265625, 2.48944091796875, 2.7816162109375, 3.07379150390625, 3.365966796875, 3.65814208984375, 3.9503173828125, 4.24249267578125, 4.53466796875, 4.82684326171875, 5.1190185546875, 5.41119384765625, 5.703369140625, 5.99554443359375, 6.2877197265625, 6.57989501953125, 6.8720703125, 7.16424560546875, 7.4564208984375, 7.74859619140625, 8.040771484375, 8.33294677734375, 8.6251220703125, 8.91729736328125, 9.20947265625, 9.50164794921875, 9.7938232421875, 10.08599853515625, 10.378173828125, 10.67034912109375, 10.9625244140625, 11.25469970703125, 11.546875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 10.0, 11.0, 15.0, 22.0, 20.0, 32.0, 51.0, 89.0, 120.0, 160.0, 263.0, 347.0, 628.0, 8948.0, 4134414.0, 47178.0, 758.0, 363.0, 308.0, 187.0, 122.0, 58.0, 57.0, 32.0, 23.0, 17.0, 14.0, 9.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.6669921875, -51.302734375, -49.9384765625, -48.57421875, -47.2099609375, -45.845703125, -44.4814453125, -43.1171875, -41.7529296875, -40.388671875, -39.0244140625, -37.66015625, -36.2958984375, -34.931640625, -33.5673828125, -32.203125, -30.8388671875, -29.474609375, -28.1103515625, -26.74609375, -25.3818359375, -24.017578125, -22.6533203125, -21.2890625, -19.9248046875, -18.560546875, -17.1962890625, -15.83203125, -14.4677734375, -13.103515625, -11.7392578125, -10.375, -9.0107421875, -7.646484375, -6.2822265625, -4.91796875, -3.5537109375, -2.189453125, -0.8251953125, 0.5390625, 1.9033203125, 3.267578125, 4.6318359375, 5.99609375, 7.3603515625, 8.724609375, 10.0888671875, 11.453125, 12.8173828125, 14.181640625, 15.5458984375, 16.91015625, 18.2744140625, 19.638671875, 21.0029296875, 22.3671875, 23.7314453125, 25.095703125, 26.4599609375, 27.82421875, 29.1884765625, 30.552734375, 31.9169921875, 33.28125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 20.0, 575.0, 409.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.62611389160156, -94.29499816894531, -86.96387481689453, -79.63275909423828, -72.3016357421875, -64.97052001953125, -57.639404296875, -50.308284759521484, -42.97716522216797, -35.64604568481445, -28.31492805480957, -20.983810424804688, -13.652690887451172, -6.321571350097656, 1.0095443725585938, 8.34066390991211, 15.671783447265625, 23.00290298461914, 30.334020614624023, 37.665138244628906, 44.99625778198242, 52.32737731933594, 59.65849304199219, 66.98960876464844, 74.32073211669922, 81.65184783935547, 88.98297119140625, 96.3140869140625, 103.64520263671875, 110.97632598876953, 118.30744171142578, 125.63856506347656, 132.96969604492188, 140.30081176757812, 147.63192749023438, 154.96304321289062, 162.29417419433594, 169.6252899169922, 176.95640563964844, 184.2875213623047, 191.61865234375, 198.94976806640625, 206.2808837890625, 213.61199951171875, 220.94313049316406, 228.2742462158203, 235.60536193847656, 242.9364776611328, 250.26759338378906, 257.5987243652344, 264.9298400878906, 272.2609558105469, 279.5920715332031, 286.9231872558594, 294.2543029785156, 301.5854187011719, 308.9165344238281, 316.2476501464844, 323.5787658691406, 330.9098815917969, 338.2409973144531, 345.5721435546875, 352.90325927734375, 360.234375, 367.56549072265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 19.0, 11.0, 26.0, 20.0, 34.0, 32.0, 46.0, 41.0, 46.0, 46.0, 67.0, 58.0, 49.0, 43.0, 55.0, 43.0, 49.0, 35.0, 43.0, 41.0, 26.0, 31.0, 24.0, 23.0, 14.0, 17.0, 9.0, 10.0, 10.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.49530792236328, -35.49312210083008, -34.49094009399414, -33.48875427246094, -32.486568450927734, -31.484384536743164, -30.482200622558594, -29.48001480102539, -28.477828979492188, -27.475645065307617, -26.473459243774414, -25.471275329589844, -24.46908950805664, -23.46690559387207, -22.4647216796875, -21.462535858154297, -20.460351943969727, -19.458168029785156, -18.455982208251953, -17.453798294067383, -16.45161247253418, -15.44942855834961, -14.447243690490723, -13.445058822631836, -12.44287395477295, -11.440689086914062, -10.438504219055176, -9.436319351196289, -8.434135437011719, -7.431950092315674, -6.429765701293945, -5.427580833435059, -4.425397872924805, -3.423213005065918, -2.4210283756256104, -1.4188437461853027, -0.416658878326416, 0.5855259895324707, 1.5877103805541992, 2.589895248413086, 3.5920801162719727, 4.594264984130859, 5.596449851989746, 6.598634243011475, 7.600819110870361, 8.603004455566406, 9.605188369750977, 10.607373237609863, 11.60955810546875, 12.611742973327637, 13.613927841186523, 14.616111755371094, 15.618297576904297, 16.620481491088867, 17.622665405273438, 18.62485122680664, 19.627037048339844, 20.629220962524414, 21.631406784057617, 22.633590698242188, 23.63577651977539, 24.63796043395996, 25.64014434814453, 26.642330169677734, 27.644514083862305]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 19.0, 18.0, 24.0, 26.0, 21.0, 30.0, 28.0, 29.0, 36.0, 27.0, 46.0, 27.0, 39.0, 47.0, 26.0, 49.0, 49.0, 29.0, 37.0, 29.0, 38.0, 32.0, 33.0, 32.0, 17.0, 18.0, 21.0, 15.0, 18.0, 14.0, 14.0, 16.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.37890625, -3.265045166015625, -3.15118408203125, -3.037322998046875, -2.9234619140625, -2.809600830078125, -2.69573974609375, -2.581878662109375, -2.468017578125, -2.354156494140625, -2.24029541015625, -2.126434326171875, -2.0125732421875, -1.898712158203125, -1.78485107421875, -1.670989990234375, -1.55712890625, -1.443267822265625, -1.32940673828125, -1.215545654296875, -1.1016845703125, -0.987823486328125, -0.87396240234375, -0.760101318359375, -0.646240234375, -0.532379150390625, -0.41851806640625, -0.304656982421875, -0.1907958984375, -0.076934814453125, 0.03692626953125, 0.150787353515625, 0.2646484375, 0.378509521484375, 0.49237060546875, 0.606231689453125, 0.7200927734375, 0.833953857421875, 0.94781494140625, 1.061676025390625, 1.175537109375, 1.289398193359375, 1.40325927734375, 1.517120361328125, 1.6309814453125, 1.744842529296875, 1.85870361328125, 1.972564697265625, 2.08642578125, 2.200286865234375, 2.31414794921875, 2.428009033203125, 2.5418701171875, 2.655731201171875, 2.76959228515625, 2.883453369140625, 2.997314453125, 3.111175537109375, 3.22503662109375, 3.338897705078125, 3.4527587890625, 3.566619873046875, 3.68048095703125, 3.794342041015625, 3.908203125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 5.0, 11.0, 17.0, 31.0, 31.0, 48.0, 83.0, 109.0, 162.0, 276.0, 369.0, 533.0, 753.0, 1158.0, 1675.0, 2504.0, 3786.0, 5457.0, 8135.0, 12154.0, 18980.0, 29231.0, 47959.0, 81060.0, 155117.0, 296223.0, 161728.0, 84145.0, 49041.0, 29948.0, 19412.0, 12772.0, 8241.0, 5558.0, 3798.0, 2645.0, 1752.0, 1146.0, 810.0, 550.0, 372.0, 243.0, 195.0, 110.0, 66.0, 44.0, 39.0, 32.0, 17.0, 12.0, 6.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5665664672851562, -0.5467071533203125, -0.5268478393554688, -0.506988525390625, -0.48712921142578125, -0.4672698974609375, -0.44741058349609375, -0.42755126953125, -0.40769195556640625, -0.3878326416015625, -0.36797332763671875, -0.348114013671875, -0.32825469970703125, -0.3083953857421875, -0.28853607177734375, -0.2686767578125, -0.24881744384765625, -0.2289581298828125, -0.20909881591796875, -0.189239501953125, -0.16938018798828125, -0.1495208740234375, -0.12966156005859375, -0.10980224609375, -0.08994293212890625, -0.0700836181640625, -0.05022430419921875, -0.030364990234375, -0.01050567626953125, 0.0093536376953125, 0.02921295166015625, 0.049072265625, 0.06893157958984375, 0.0887908935546875, 0.10865020751953125, 0.128509521484375, 0.14836883544921875, 0.1682281494140625, 0.18808746337890625, 0.20794677734375, 0.22780609130859375, 0.2476654052734375, 0.26752471923828125, 0.287384033203125, 0.30724334716796875, 0.3271026611328125, 0.34696197509765625, 0.3668212890625, 0.38668060302734375, 0.4065399169921875, 0.42639923095703125, 0.446258544921875, 0.46611785888671875, 0.4859771728515625, 0.5058364868164062, 0.52569580078125, 0.5455551147460938, 0.5654144287109375, 0.5852737426757812, 0.605133056640625, 0.6249923706054688, 0.6448516845703125, 0.6647109985351562, 0.6845703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 9.0, 7.0, 6.0, 12.0, 20.0, 15.0, 6.0, 16.0, 21.0, 16.0, 23.0, 24.0, 37.0, 22.0, 23.0, 32.0, 31.0, 41.0, 33.0, 41.0, 43.0, 1066.0, 38.0, 34.0, 37.0, 32.0, 36.0, 29.0, 21.0, 24.0, 26.0, 24.0, 16.0, 23.0, 21.0, 20.0, 18.0, 15.0, 9.0, 11.0, 8.0, 7.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.1015625, -2.034393310546875, -1.96722412109375, -1.900054931640625, -1.8328857421875, -1.765716552734375, -1.69854736328125, -1.631378173828125, -1.564208984375, -1.497039794921875, -1.42987060546875, -1.362701416015625, -1.2955322265625, -1.228363037109375, -1.16119384765625, -1.094024658203125, -1.02685546875, -0.959686279296875, -0.89251708984375, -0.825347900390625, -0.7581787109375, -0.691009521484375, -0.62384033203125, -0.556671142578125, -0.489501953125, -0.422332763671875, -0.35516357421875, -0.287994384765625, -0.2208251953125, -0.153656005859375, -0.08648681640625, -0.019317626953125, 0.0478515625, 0.115020751953125, 0.18218994140625, 0.249359130859375, 0.3165283203125, 0.383697509765625, 0.45086669921875, 0.518035888671875, 0.585205078125, 0.652374267578125, 0.71954345703125, 0.786712646484375, 0.8538818359375, 0.921051025390625, 0.98822021484375, 1.055389404296875, 1.12255859375, 1.189727783203125, 1.25689697265625, 1.324066162109375, 1.3912353515625, 1.458404541015625, 1.52557373046875, 1.592742919921875, 1.659912109375, 1.727081298828125, 1.79425048828125, 1.861419677734375, 1.9285888671875, 1.995758056640625, 2.06292724609375, 2.130096435546875, 2.197265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 6.0, 5.0, 15.0, 28.0, 28.0, 48.0, 72.0, 96.0, 136.0, 164.0, 274.0, 380.0, 523.0, 765.0, 1030.0, 1468.0, 1982.0, 2885.0, 3905.0, 5385.0, 7296.0, 9876.0, 13859.0, 19375.0, 27337.0, 39882.0, 60306.0, 101560.0, 193780.0, 1272268.0, 116650.0, 67647.0, 43591.0, 29465.0, 20959.0, 15085.0, 10752.0, 7885.0, 5673.0, 4097.0, 3000.0, 2170.0, 1589.0, 1124.0, 805.0, 582.0, 425.0, 284.0, 205.0, 158.0, 90.0, 57.0, 33.0, 31.0, 21.0, 10.0, 7.0, 3.0, 7.0, 1.0, 3.0], "bins": [-0.47607421875, -0.46125030517578125, -0.4464263916015625, -0.43160247802734375, -0.416778564453125, -0.40195465087890625, -0.3871307373046875, -0.37230682373046875, -0.35748291015625, -0.34265899658203125, -0.3278350830078125, -0.31301116943359375, -0.298187255859375, -0.28336334228515625, -0.2685394287109375, -0.25371551513671875, -0.2388916015625, -0.22406768798828125, -0.2092437744140625, -0.19441986083984375, -0.179595947265625, -0.16477203369140625, -0.1499481201171875, -0.13512420654296875, -0.12030029296875, -0.10547637939453125, -0.0906524658203125, -0.07582855224609375, -0.061004638671875, -0.04618072509765625, -0.0313568115234375, -0.01653289794921875, -0.001708984375, 0.01311492919921875, 0.0279388427734375, 0.04276275634765625, 0.057586669921875, 0.07241058349609375, 0.0872344970703125, 0.10205841064453125, 0.11688232421875, 0.13170623779296875, 0.1465301513671875, 0.16135406494140625, 0.176177978515625, 0.19100189208984375, 0.2058258056640625, 0.22064971923828125, 0.2354736328125, 0.25029754638671875, 0.2651214599609375, 0.27994537353515625, 0.294769287109375, 0.30959320068359375, 0.3244171142578125, 0.33924102783203125, 0.35406494140625, 0.36888885498046875, 0.3837127685546875, 0.39853668212890625, 0.413360595703125, 0.42818450927734375, 0.4430084228515625, 0.45783233642578125, 0.47265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 8.0, 16.0, 13.0, 26.0, 27.0, 26.0, 29.0, 41.0, 43.0, 42.0, 39.0, 47.0, 51.0, 51.0, 55.0, 53.0, 42.0, 57.0, 46.0, 28.0, 32.0, 30.0, 22.0, 26.0, 22.0, 21.0, 17.0, 9.0, 12.0, 7.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011676549911499023, -0.0001131836324930191, -0.00010960176587104797, -0.00010601989924907684, -0.00010243803262710571, -9.885616600513458e-05, -9.527429938316345e-05, -9.169243276119232e-05, -8.811056613922119e-05, -8.452869951725006e-05, -8.094683289527893e-05, -7.73649662733078e-05, -7.378309965133667e-05, -7.020123302936554e-05, -6.661936640739441e-05, -6.303749978542328e-05, -5.945563316345215e-05, -5.587376654148102e-05, -5.229189991950989e-05, -4.871003329753876e-05, -4.512816667556763e-05, -4.1546300053596497e-05, -3.7964433431625366e-05, -3.4382566809654236e-05, -3.0800700187683105e-05, -2.7218833565711975e-05, -2.3636966943740845e-05, -2.0055100321769714e-05, -1.6473233699798584e-05, -1.2891367077827454e-05, -9.309500455856323e-06, -5.727633833885193e-06, -2.1457672119140625e-06, 1.4360994100570679e-06, 5.017966032028198e-06, 8.599832653999329e-06, 1.2181699275970459e-05, 1.576356589794159e-05, 1.934543251991272e-05, 2.292729914188385e-05, 2.650916576385498e-05, 3.009103238582611e-05, 3.367289900779724e-05, 3.725476562976837e-05, 4.08366322517395e-05, 4.441849887371063e-05, 4.800036549568176e-05, 5.158223211765289e-05, 5.5164098739624023e-05, 5.8745965361595154e-05, 6.232783198356628e-05, 6.590969860553741e-05, 6.949156522750854e-05, 7.307343184947968e-05, 7.66552984714508e-05, 8.023716509342194e-05, 8.381903171539307e-05, 8.74008983373642e-05, 9.098276495933533e-05, 9.456463158130646e-05, 9.814649820327759e-05, 0.00010172836482524872, 0.00010531023144721985, 0.00010889209806919098, 0.00011247396469116211]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 7.0, 14.0, 17.0, 13.0, 26.0, 29.0, 31.0, 45.0, 71.0, 77.0, 103.0, 150.0, 325.0, 742.0, 12242.0, 1026697.0, 6245.0, 711.0, 318.0, 150.0, 120.0, 89.0, 71.0, 57.0, 47.0, 33.0, 30.0, 12.0, 16.0, 10.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0026607513427734375, -0.0025761425495147705, -0.0024915337562561035, -0.0024069249629974365, -0.0023223161697387695, -0.0022377073764801025, -0.0021530985832214355, -0.0020684897899627686, -0.0019838809967041016, -0.0018992722034454346, -0.0018146634101867676, -0.0017300546169281006, -0.0016454458236694336, -0.0015608370304107666, -0.0014762282371520996, -0.0013916194438934326, -0.0013070106506347656, -0.0012224018573760986, -0.0011377930641174316, -0.0010531842708587646, -0.0009685754776000977, -0.0008839666843414307, -0.0007993578910827637, -0.0007147490978240967, -0.0006301403045654297, -0.0005455315113067627, -0.0004609227180480957, -0.0003763139247894287, -0.0002917051315307617, -0.00020709633827209473, -0.00012248754501342773, -3.787875175476074e-05, 4.673004150390625e-05, 0.00013133883476257324, 0.00021594762802124023, 0.0003005564212799072, 0.0003851652145385742, 0.0004697740077972412, 0.0005543828010559082, 0.0006389915943145752, 0.0007236003875732422, 0.0008082091808319092, 0.0008928179740905762, 0.0009774267673492432, 0.0010620355606079102, 0.0011466443538665771, 0.0012312531471252441, 0.0013158619403839111, 0.0014004707336425781, 0.0014850795269012451, 0.0015696883201599121, 0.001654297113418579, 0.001738905906677246, 0.001823514699935913, 0.00190812349319458, 0.001992732286453247, 0.002077341079711914, 0.002161949872970581, 0.002246558666229248, 0.002331167459487915, 0.002415776252746582, 0.002500385046005249, 0.002584993839263916, 0.002669602632522583, 0.00275421142578125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 30.0, 144.0, 372.0, 365.0, 93.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016670180775690824, -0.00015681717195548117, -0.00014693252160213888, -0.0001370478858007118, -0.00012716324999928474, -0.00011727860692190006, -0.00010739396384451538, -9.750932804308832e-05, -8.762468496570364e-05, -7.774004188831896e-05, -6.785540608689189e-05, -5.797076300950721e-05, -4.8086123570101336e-05, -3.820148413069546e-05, -2.8316841053310782e-05, -1.8432205251883715e-05, -8.547562174499035e-06, 1.3370781744015403e-06, 1.1221718523302115e-05, 2.1106359781697392e-05, 3.0990999221103266e-05, 4.087563866050914e-05, 5.076028173789382e-05, 6.0644917539320886e-05, 7.052956061670557e-05, 8.041420369409025e-05, 9.029883949551731e-05, 0.000100183482572902, 0.00011006812565028667, 0.00011995276145171374, 0.0001298373972531408, 0.0001397220476064831, 0.00014960666885599494, 0.000159491304657422, 0.0001693759550107643, 0.00017926059081219137, 0.00018914522661361843, 0.0001990298624150455, 0.0002089145127683878, 0.00021879914856981486, 0.00022868378437124193, 0.000238568420172669, 0.00024845305597409606, 0.00025833770632743835, 0.00026822235668078065, 0.0002781069779302925, 0.0002879916282836348, 0.0002978762495331466, 0.0003077608998864889, 0.0003176455502398312, 0.00032753017148934305, 0.00033741482184268534, 0.00034729947219602764, 0.0003571840934455395, 0.00036706874379888177, 0.00037695339415222406, 0.00038683804450556636, 0.00039672269485890865, 0.0004066073161084205, 0.0004164919664617628, 0.0004263766168151051, 0.0004362612380646169, 0.0004461458884179592, 0.0004560305387713015, 0.00046591516002081335]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 9.0, 6.0, 10.0, 9.0, 18.0, 17.0, 19.0, 20.0, 20.0, 30.0, 24.0, 31.0, 26.0, 22.0, 34.0, 40.0, 36.0, 48.0, 30.0, 48.0, 30.0, 33.0, 37.0, 36.0, 34.0, 37.0, 40.0, 31.0, 31.0, 22.0, 24.0, 26.0, 18.0, 12.0, 15.0, 15.0, 6.0, 5.0, 12.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-6.645917892456055e-05, -6.452761590480804e-05, -6.259605288505554e-05, -6.066448986530304e-05, -5.873292684555054e-05, -5.6801363825798035e-05, -5.486980080604553e-05, -5.293823778629303e-05, -5.100667476654053e-05, -4.9075111746788025e-05, -4.714354872703552e-05, -4.521198570728302e-05, -4.328042268753052e-05, -4.1348859667778015e-05, -3.941729664802551e-05, -3.748573362827301e-05, -3.555417060852051e-05, -3.3622607588768005e-05, -3.16910445690155e-05, -2.9759481549263e-05, -2.7827918529510498e-05, -2.5896355509757996e-05, -2.3964792490005493e-05, -2.203322947025299e-05, -2.0101666450500488e-05, -1.8170103430747986e-05, -1.6238540410995483e-05, -1.4306977391242981e-05, -1.2375414371490479e-05, -1.0443851351737976e-05, -8.512288331985474e-06, -6.580725312232971e-06, -4.649162292480469e-06, -2.7175992727279663e-06, -7.860362529754639e-07, 1.1455267667770386e-06, 3.077089786529541e-06, 5.0086528062820435e-06, 6.940215826034546e-06, 8.871778845787048e-06, 1.080334186553955e-05, 1.2734904885292053e-05, 1.4666467905044556e-05, 1.6598030924797058e-05, 1.852959394454956e-05, 2.0461156964302063e-05, 2.2392719984054565e-05, 2.4324283003807068e-05, 2.625584602355957e-05, 2.8187409043312073e-05, 3.0118972063064575e-05, 3.205053508281708e-05, 3.398209810256958e-05, 3.591366112232208e-05, 3.7845224142074585e-05, 3.977678716182709e-05, 4.170835018157959e-05, 4.363991320133209e-05, 4.5571476221084595e-05, 4.75030392408371e-05, 4.94346022605896e-05, 5.13661652803421e-05, 5.3297728300094604e-05, 5.522929131984711e-05, 5.716085433959961e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 19.0, 18.0, 24.0, 26.0, 21.0, 30.0, 28.0, 29.0, 36.0, 27.0, 46.0, 27.0, 39.0, 47.0, 26.0, 49.0, 49.0, 29.0, 37.0, 29.0, 38.0, 32.0, 33.0, 32.0, 17.0, 18.0, 21.0, 15.0, 18.0, 14.0, 14.0, 16.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.37890625, -3.265045166015625, -3.15118408203125, -3.037322998046875, -2.9234619140625, -2.809600830078125, -2.69573974609375, -2.581878662109375, -2.468017578125, -2.354156494140625, -2.24029541015625, -2.126434326171875, -2.0125732421875, -1.898712158203125, -1.78485107421875, -1.670989990234375, -1.55712890625, -1.443267822265625, -1.32940673828125, -1.215545654296875, -1.1016845703125, -0.987823486328125, -0.87396240234375, -0.760101318359375, -0.646240234375, -0.532379150390625, -0.41851806640625, -0.304656982421875, -0.1907958984375, -0.076934814453125, 0.03692626953125, 0.150787353515625, 0.2646484375, 0.378509521484375, 0.49237060546875, 0.606231689453125, 0.7200927734375, 0.833953857421875, 0.94781494140625, 1.061676025390625, 1.175537109375, 1.289398193359375, 1.40325927734375, 1.517120361328125, 1.6309814453125, 1.744842529296875, 1.85870361328125, 1.972564697265625, 2.08642578125, 2.200286865234375, 2.31414794921875, 2.428009033203125, 2.5418701171875, 2.655731201171875, 2.76959228515625, 2.883453369140625, 2.997314453125, 3.111175537109375, 3.22503662109375, 3.338897705078125, 3.4527587890625, 3.566619873046875, 3.68048095703125, 3.794342041015625, 3.908203125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 8.0, 12.0, 8.0, 20.0, 12.0, 19.0, 39.0, 52.0, 100.0, 133.0, 274.0, 571.0, 1250.0, 2726.0, 5896.0, 13356.0, 29905.0, 75337.0, 222431.0, 411629.0, 177090.0, 61705.0, 25081.0, 11375.0, 5113.0, 2294.0, 1043.0, 496.0, 231.0, 123.0, 54.0, 39.0, 34.0, 12.0, 24.0, 9.0, 8.0, 9.0, 4.0, 8.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.61907958984375, -3.4959716796875, -3.37286376953125, -3.249755859375, -3.12664794921875, -3.0035400390625, -2.88043212890625, -2.75732421875, -2.63421630859375, -2.5111083984375, -2.38800048828125, -2.264892578125, -2.14178466796875, -2.0186767578125, -1.89556884765625, -1.7724609375, -1.64935302734375, -1.5262451171875, -1.40313720703125, -1.280029296875, -1.15692138671875, -1.0338134765625, -0.91070556640625, -0.78759765625, -0.66448974609375, -0.5413818359375, -0.41827392578125, -0.295166015625, -0.17205810546875, -0.0489501953125, 0.07415771484375, 0.197265625, 0.32037353515625, 0.4434814453125, 0.56658935546875, 0.689697265625, 0.81280517578125, 0.9359130859375, 1.05902099609375, 1.18212890625, 1.30523681640625, 1.4283447265625, 1.55145263671875, 1.674560546875, 1.79766845703125, 1.9207763671875, 2.04388427734375, 2.1669921875, 2.29010009765625, 2.4132080078125, 2.53631591796875, 2.659423828125, 2.78253173828125, 2.9056396484375, 3.02874755859375, 3.15185546875, 3.27496337890625, 3.3980712890625, 3.52117919921875, 3.644287109375, 3.76739501953125, 3.8905029296875, 4.01361083984375, 4.13671875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 3.0, 8.0, 11.0, 9.0, 10.0, 16.0, 15.0, 16.0, 22.0, 23.0, 32.0, 40.0, 31.0, 37.0, 37.0, 63.0, 101.0, 251.0, 1590.0, 243.0, 95.0, 51.0, 51.0, 42.0, 36.0, 36.0, 33.0, 29.0, 24.0, 22.0, 18.0, 15.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.015625, -17.521728515625, -17.02783203125, -16.533935546875, -16.0400390625, -15.546142578125, -15.05224609375, -14.558349609375, -14.064453125, -13.570556640625, -13.07666015625, -12.582763671875, -12.0888671875, -11.594970703125, -11.10107421875, -10.607177734375, -10.11328125, -9.619384765625, -9.12548828125, -8.631591796875, -8.1376953125, -7.643798828125, -7.14990234375, -6.656005859375, -6.162109375, -5.668212890625, -5.17431640625, -4.680419921875, -4.1865234375, -3.692626953125, -3.19873046875, -2.704833984375, -2.2109375, -1.717041015625, -1.22314453125, -0.729248046875, -0.2353515625, 0.258544921875, 0.75244140625, 1.246337890625, 1.740234375, 2.234130859375, 2.72802734375, 3.221923828125, 3.7158203125, 4.209716796875, 4.70361328125, 5.197509765625, 5.69140625, 6.185302734375, 6.67919921875, 7.173095703125, 7.6669921875, 8.160888671875, 8.65478515625, 9.148681640625, 9.642578125, 10.136474609375, 10.63037109375, 11.124267578125, 11.6181640625, 12.112060546875, 12.60595703125, 13.099853515625, 13.59375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 12.0, 6.0, 7.0, 17.0, 26.0, 22.0, 33.0, 49.0, 58.0, 73.0, 94.0, 141.0, 170.0, 259.0, 468.0, 1238.0, 119226.0, 3017997.0, 4016.0, 618.0, 327.0, 242.0, 146.0, 99.0, 69.0, 54.0, 48.0, 30.0, 26.0, 28.0, 19.0, 19.0, 9.0, 13.0, 8.0, 2.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.65625, -37.41796875, -36.1796875, -34.94140625, -33.703125, -32.46484375, -31.2265625, -29.98828125, -28.75, -27.51171875, -26.2734375, -25.03515625, -23.796875, -22.55859375, -21.3203125, -20.08203125, -18.84375, -17.60546875, -16.3671875, -15.12890625, -13.890625, -12.65234375, -11.4140625, -10.17578125, -8.9375, -7.69921875, -6.4609375, -5.22265625, -3.984375, -2.74609375, -1.5078125, -0.26953125, 0.96875, 2.20703125, 3.4453125, 4.68359375, 5.921875, 7.16015625, 8.3984375, 9.63671875, 10.875, 12.11328125, 13.3515625, 14.58984375, 15.828125, 17.06640625, 18.3046875, 19.54296875, 20.78125, 22.01953125, 23.2578125, 24.49609375, 25.734375, 26.97265625, 28.2109375, 29.44921875, 30.6875, 31.92578125, 33.1640625, 34.40234375, 35.640625, 36.87890625, 38.1171875, 39.35546875, 40.59375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 207.0, 796.0, 14.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.495949745178223, -5.851185321807861, -1.2064208984375, 3.4383440017700195, 8.083107948303223, 12.727871894836426, 17.372638702392578, 22.01740264892578, 26.662166595458984, 31.306930541992188, 35.95169448852539, 40.596458435058594, 45.24122619628906, 49.885986328125, 54.53075408935547, 59.17551803588867, 63.820281982421875, 68.46504974365234, 73.10980987548828, 77.75457763671875, 82.39933776855469, 87.04410552978516, 91.68887329101562, 96.33363342285156, 100.9783935546875, 105.62316131591797, 110.2679214477539, 114.91268920898438, 119.55744934082031, 124.20221710205078, 128.84698486328125, 133.4917449951172, 138.1365203857422, 142.78128051757812, 147.42605590820312, 152.07081604003906, 156.715576171875, 161.36033630371094, 166.00511169433594, 170.64987182617188, 175.2946319580078, 179.93939208984375, 184.58416748046875, 189.2289276123047, 193.87368774414062, 198.51844787597656, 203.16322326660156, 207.8079833984375, 212.4527587890625, 217.09751892089844, 221.74229431152344, 226.38705444335938, 231.0318145751953, 235.67657470703125, 240.32135009765625, 244.9661102294922, 249.61087036132812, 254.25563049316406, 258.900390625, 263.545166015625, 268.18994140625, 272.8346862792969, 277.4794616699219, 282.12420654296875, 286.76898193359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 19.0, 14.0, 11.0, 16.0, 20.0, 22.0, 29.0, 26.0, 34.0, 30.0, 29.0, 34.0, 38.0, 44.0, 55.0, 37.0, 36.0, 43.0, 50.0, 35.0, 45.0, 40.0, 38.0, 36.0, 31.0, 19.0, 26.0, 31.0, 12.0, 16.0, 13.0, 16.0, 12.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09455490112305, -34.94756317138672, -33.800575256347656, -32.65358352661133, -31.506591796875, -30.359601974487305, -29.21261215209961, -28.06562042236328, -26.918630599975586, -25.77164077758789, -24.624649047851562, -23.477659225463867, -22.330669403076172, -21.183677673339844, -20.03668785095215, -18.889698028564453, -17.742706298828125, -16.59571647644043, -15.448724746704102, -14.301734924316406, -13.154744148254395, -12.007753372192383, -10.860763549804688, -9.713772773742676, -8.566781997680664, -7.419791221618652, -6.272800922393799, -5.125810623168945, -3.9788198471069336, -2.831829071044922, -1.6848387718200684, -0.5378484725952148, 0.6091384887695312, 1.7561290264129639, 2.9031195640563965, 4.05010986328125, 5.197100639343262, 6.344091415405273, 7.491081714630127, 8.63807201385498, 9.785062789916992, 10.932053565979004, 12.079044342041016, 13.226034164428711, 14.373024940490723, 15.520015716552734, 16.66700553894043, 17.813995361328125, 18.960987091064453, 20.10797691345215, 21.254968643188477, 22.401958465576172, 23.5489501953125, 24.695940017700195, 25.84292984008789, 26.98992156982422, 28.136911392211914, 29.28390121459961, 30.430892944335938, 31.577882766723633, 32.72487258911133, 33.871864318847656, 35.018856048583984, 36.16584396362305, 37.312835693359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 11.0, 7.0, 8.0, 12.0, 11.0, 20.0, 26.0, 29.0, 30.0, 18.0, 25.0, 37.0, 40.0, 26.0, 36.0, 33.0, 41.0, 29.0, 49.0, 42.0, 45.0, 53.0, 28.0, 36.0, 36.0, 30.0, 27.0, 20.0, 31.0, 25.0, 19.0, 22.0, 19.0, 9.0, 6.0, 12.0, 19.0, 7.0, 2.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.0078125, -3.8782958984375, -3.748779296875, -3.6192626953125, -3.48974609375, -3.3602294921875, -3.230712890625, -3.1011962890625, -2.9716796875, -2.8421630859375, -2.712646484375, -2.5831298828125, -2.45361328125, -2.3240966796875, -2.194580078125, -2.0650634765625, -1.935546875, -1.8060302734375, -1.676513671875, -1.5469970703125, -1.41748046875, -1.2879638671875, -1.158447265625, -1.0289306640625, -0.8994140625, -0.7698974609375, -0.640380859375, -0.5108642578125, -0.38134765625, -0.2518310546875, -0.122314453125, 0.0072021484375, 0.13671875, 0.2662353515625, 0.395751953125, 0.5252685546875, 0.65478515625, 0.7843017578125, 0.913818359375, 1.0433349609375, 1.1728515625, 1.3023681640625, 1.431884765625, 1.5614013671875, 1.69091796875, 1.8204345703125, 1.949951171875, 2.0794677734375, 2.208984375, 2.3385009765625, 2.468017578125, 2.5975341796875, 2.72705078125, 2.8565673828125, 2.986083984375, 3.1156005859375, 3.2451171875, 3.3746337890625, 3.504150390625, 3.6336669921875, 3.76318359375, 3.8927001953125, 4.022216796875, 4.1517333984375, 4.28125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 3.0, 6.0, 7.0, 7.0, 12.0, 13.0, 15.0, 17.0, 24.0, 35.0, 39.0, 50.0, 67.0, 68.0, 105.0, 136.0, 288.0, 701.0, 2876.0, 53232.0, 1794337.0, 2254488.0, 82113.0, 3835.0, 835.0, 321.0, 163.0, 103.0, 74.0, 61.0, 56.0, 39.0, 28.0, 23.0, 19.0, 13.0, 16.0, 12.0, 19.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-13.078125, -12.6824951171875, -12.286865234375, -11.8912353515625, -11.49560546875, -11.0999755859375, -10.704345703125, -10.3087158203125, -9.9130859375, -9.5174560546875, -9.121826171875, -8.7261962890625, -8.33056640625, -7.9349365234375, -7.539306640625, -7.1436767578125, -6.748046875, -6.3524169921875, -5.956787109375, -5.5611572265625, -5.16552734375, -4.7698974609375, -4.374267578125, -3.9786376953125, -3.5830078125, -3.1873779296875, -2.791748046875, -2.3961181640625, -2.00048828125, -1.6048583984375, -1.209228515625, -0.8135986328125, -0.41796875, -0.0223388671875, 0.373291015625, 0.7689208984375, 1.16455078125, 1.5601806640625, 1.955810546875, 2.3514404296875, 2.7470703125, 3.1427001953125, 3.538330078125, 3.9339599609375, 4.32958984375, 4.7252197265625, 5.120849609375, 5.5164794921875, 5.912109375, 6.3077392578125, 6.703369140625, 7.0989990234375, 7.49462890625, 7.8902587890625, 8.285888671875, 8.6815185546875, 9.0771484375, 9.4727783203125, 9.868408203125, 10.2640380859375, 10.65966796875, 11.0552978515625, 11.450927734375, 11.8465576171875, 12.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 14.0, 6.0, 29.0, 30.0, 65.0, 86.0, 117.0, 224.0, 364.0, 488.0, 636.0, 648.0, 467.0, 320.0, 200.0, 118.0, 87.0, 49.0, 40.0, 25.0, 16.0, 11.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.59375, -14.2535400390625, -13.913330078125, -13.5731201171875, -13.23291015625, -12.8927001953125, -12.552490234375, -12.2122802734375, -11.8720703125, -11.5318603515625, -11.191650390625, -10.8514404296875, -10.51123046875, -10.1710205078125, -9.830810546875, -9.4906005859375, -9.150390625, -8.8101806640625, -8.469970703125, -8.1297607421875, -7.78955078125, -7.4493408203125, -7.109130859375, -6.7689208984375, -6.4287109375, -6.0885009765625, -5.748291015625, -5.4080810546875, -5.06787109375, -4.7276611328125, -4.387451171875, -4.0472412109375, -3.70703125, -3.3668212890625, -3.026611328125, -2.6864013671875, -2.34619140625, -2.0059814453125, -1.665771484375, -1.3255615234375, -0.9853515625, -0.6451416015625, -0.304931640625, 0.0352783203125, 0.37548828125, 0.7156982421875, 1.055908203125, 1.3961181640625, 1.736328125, 2.0765380859375, 2.416748046875, 2.7569580078125, 3.09716796875, 3.4373779296875, 3.777587890625, 4.1177978515625, 4.4580078125, 4.7982177734375, 5.138427734375, 5.4786376953125, 5.81884765625, 6.1590576171875, 6.499267578125, 6.8394775390625, 7.1796875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 4.0, 8.0, 13.0, 20.0, 42.0, 54.0, 76.0, 115.0, 152.0, 311.0, 433.0, 965.0, 170339.0, 4017374.0, 2785.0, 613.0, 384.0, 197.0, 132.0, 100.0, 61.0, 32.0, 16.0, 14.0, 16.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.25, -28.7548828125, -27.259765625, -25.7646484375, -24.26953125, -22.7744140625, -21.279296875, -19.7841796875, -18.2890625, -16.7939453125, -15.298828125, -13.8037109375, -12.30859375, -10.8134765625, -9.318359375, -7.8232421875, -6.328125, -4.8330078125, -3.337890625, -1.8427734375, -0.34765625, 1.1474609375, 2.642578125, 4.1376953125, 5.6328125, 7.1279296875, 8.623046875, 10.1181640625, 11.61328125, 13.1083984375, 14.603515625, 16.0986328125, 17.59375, 19.0888671875, 20.583984375, 22.0791015625, 23.57421875, 25.0693359375, 26.564453125, 28.0595703125, 29.5546875, 31.0498046875, 32.544921875, 34.0400390625, 35.53515625, 37.0302734375, 38.525390625, 40.0205078125, 41.515625, 43.0107421875, 44.505859375, 46.0009765625, 47.49609375, 48.9912109375, 50.486328125, 51.9814453125, 53.4765625, 54.9716796875, 56.466796875, 57.9619140625, 59.45703125, 60.9521484375, 62.447265625, 63.9423828125, 65.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 32.0, 303.0, 481.0, 182.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.25506591796875, -140.28289794921875, -136.31072998046875, -132.33856201171875, -128.36639404296875, -124.39422607421875, -120.42206573486328, -116.44989776611328, -112.47772979736328, -108.50556182861328, -104.53339385986328, -100.56122589111328, -96.58906555175781, -92.61689758300781, -88.64472961425781, -84.67256164550781, -80.70039367675781, -76.72822570800781, -72.75605773925781, -68.78388977050781, -64.81172180175781, -60.83955764770508, -56.867393493652344, -52.895225524902344, -48.923057556152344, -44.950889587402344, -40.978721618652344, -37.00655746459961, -33.03438949584961, -29.06222152709961, -25.090055465698242, -21.117889404296875, -17.145729064941406, -13.173562049865723, -9.201395034790039, -5.2292280197143555, -1.2570610046386719, 2.715106964111328, 6.687273025512695, 10.659439086914062, 14.631607055664062, 18.603775024414062, 22.57594108581543, 26.548107147216797, 30.520275115966797, 34.4924430847168, 38.46460723876953, 42.43677520751953, 46.40894317626953, 50.38111114501953, 54.35327911376953, 58.325443267822266, 62.297611236572266, 66.269775390625, 70.241943359375, 74.214111328125, 78.186279296875, 82.158447265625, 86.130615234375, 90.102783203125, 94.074951171875, 98.047119140625, 102.01927947998047, 105.99144744873047, 109.96361541748047]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 15.0, 12.0, 18.0, 26.0, 25.0, 28.0, 34.0, 31.0, 37.0, 44.0, 48.0, 53.0, 53.0, 44.0, 53.0, 52.0, 45.0, 46.0, 46.0, 29.0, 33.0, 34.0, 31.0, 23.0, 26.0, 20.0, 14.0, 14.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.145313262939453, -24.26028060913086, -23.375246047973633, -22.49021339416504, -21.605178833007812, -20.72014617919922, -19.835113525390625, -18.95008087158203, -18.065046310424805, -17.18001365661621, -16.294979095458984, -15.40994644165039, -14.52491283416748, -13.63987922668457, -12.754846572875977, -11.869812965393066, -10.984779357910156, -10.099745750427246, -9.214712142944336, -8.329679489135742, -7.444645881652832, -6.559612274169922, -5.67457914352417, -4.789546012878418, -3.904512405395508, -3.0194790363311768, -2.1344456672668457, -1.2494122982025146, -0.3643789291381836, 0.5206546783447266, 1.4056878089904785, 2.2907209396362305, 3.1757545471191406, 4.060788154602051, 4.945821285247803, 5.830854415893555, 6.715888023376465, 7.600921630859375, 8.485954284667969, 9.370987892150879, 10.256021499633789, 11.1410551071167, 12.02608871459961, 12.911121368408203, 13.796154975891113, 14.681188583374023, 15.566221237182617, 16.451255798339844, 17.336288452148438, 18.22132110595703, 19.106355667114258, 19.99138832092285, 20.876422882080078, 21.761455535888672, 22.646488189697266, 23.53152084350586, 24.416555404663086, 25.30158805847168, 26.186622619628906, 27.0716552734375, 27.956687927246094, 28.84172248840332, 29.726755142211914, 30.61178970336914, 31.496822357177734]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 8.0, 14.0, 19.0, 27.0, 24.0, 27.0, 33.0, 17.0, 34.0, 34.0, 30.0, 37.0, 28.0, 43.0, 54.0, 27.0, 39.0, 39.0, 39.0, 37.0, 40.0, 26.0, 31.0, 21.0, 30.0, 23.0, 21.0, 21.0, 25.0, 12.0, 16.0, 21.0, 8.0, 15.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.609375, -3.4932861328125, -3.377197265625, -3.2611083984375, -3.14501953125, -3.0289306640625, -2.912841796875, -2.7967529296875, -2.6806640625, -2.5645751953125, -2.448486328125, -2.3323974609375, -2.21630859375, -2.1002197265625, -1.984130859375, -1.8680419921875, -1.751953125, -1.6358642578125, -1.519775390625, -1.4036865234375, -1.28759765625, -1.1715087890625, -1.055419921875, -0.9393310546875, -0.8232421875, -0.7071533203125, -0.591064453125, -0.4749755859375, -0.35888671875, -0.2427978515625, -0.126708984375, -0.0106201171875, 0.10546875, 0.2215576171875, 0.337646484375, 0.4537353515625, 0.56982421875, 0.6859130859375, 0.802001953125, 0.9180908203125, 1.0341796875, 1.1502685546875, 1.266357421875, 1.3824462890625, 1.49853515625, 1.6146240234375, 1.730712890625, 1.8468017578125, 1.962890625, 2.0789794921875, 2.195068359375, 2.3111572265625, 2.42724609375, 2.5433349609375, 2.659423828125, 2.7755126953125, 2.8916015625, 3.0076904296875, 3.123779296875, 3.2398681640625, 3.35595703125, 3.4720458984375, 3.588134765625, 3.7042236328125, 3.8203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 13.0, 11.0, 8.0, 22.0, 42.0, 56.0, 96.0, 115.0, 200.0, 287.0, 440.0, 656.0, 1028.0, 1582.0, 2501.0, 3961.0, 6218.0, 9851.0, 15990.0, 25709.0, 42736.0, 75367.0, 145311.0, 302290.0, 189327.0, 92738.0, 51379.0, 30403.0, 18373.0, 11559.0, 7348.0, 4567.0, 2996.0, 1805.0, 1195.0, 778.0, 527.0, 370.0, 211.0, 148.0, 110.0, 64.0, 51.0, 30.0, 13.0, 16.0, 15.0, 10.0, 12.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.70166015625, -0.67950439453125, -0.6573486328125, -0.63519287109375, -0.613037109375, -0.59088134765625, -0.5687255859375, -0.54656982421875, -0.5244140625, -0.50225830078125, -0.4801025390625, -0.45794677734375, -0.435791015625, -0.41363525390625, -0.3914794921875, -0.36932373046875, -0.34716796875, -0.32501220703125, -0.3028564453125, -0.28070068359375, -0.258544921875, -0.23638916015625, -0.2142333984375, -0.19207763671875, -0.169921875, -0.14776611328125, -0.1256103515625, -0.10345458984375, -0.081298828125, -0.05914306640625, -0.0369873046875, -0.01483154296875, 0.00732421875, 0.02947998046875, 0.0516357421875, 0.07379150390625, 0.095947265625, 0.11810302734375, 0.1402587890625, 0.16241455078125, 0.1845703125, 0.20672607421875, 0.2288818359375, 0.25103759765625, 0.273193359375, 0.29534912109375, 0.3175048828125, 0.33966064453125, 0.36181640625, 0.38397216796875, 0.4061279296875, 0.42828369140625, 0.450439453125, 0.47259521484375, 0.4947509765625, 0.51690673828125, 0.5390625, 0.56121826171875, 0.5833740234375, 0.60552978515625, 0.627685546875, 0.64984130859375, 0.6719970703125, 0.69415283203125, 0.71630859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 10.0, 11.0, 11.0, 7.0, 14.0, 17.0, 16.0, 20.0, 24.0, 32.0, 27.0, 41.0, 34.0, 29.0, 31.0, 40.0, 45.0, 52.0, 1063.0, 42.0, 33.0, 54.0, 33.0, 24.0, 36.0, 40.0, 31.0, 32.0, 30.0, 29.0, 16.0, 13.0, 16.0, 12.0, 20.0, 12.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.658203125, -2.574371337890625, -2.49053955078125, -2.406707763671875, -2.3228759765625, -2.239044189453125, -2.15521240234375, -2.071380615234375, -1.987548828125, -1.903717041015625, -1.81988525390625, -1.736053466796875, -1.6522216796875, -1.568389892578125, -1.48455810546875, -1.400726318359375, -1.31689453125, -1.233062744140625, -1.14923095703125, -1.065399169921875, -0.9815673828125, -0.897735595703125, -0.81390380859375, -0.730072021484375, -0.646240234375, -0.562408447265625, -0.47857666015625, -0.394744873046875, -0.3109130859375, -0.227081298828125, -0.14324951171875, -0.059417724609375, 0.0244140625, 0.108245849609375, 0.19207763671875, 0.275909423828125, 0.3597412109375, 0.443572998046875, 0.52740478515625, 0.611236572265625, 0.695068359375, 0.778900146484375, 0.86273193359375, 0.946563720703125, 1.0303955078125, 1.114227294921875, 1.19805908203125, 1.281890869140625, 1.36572265625, 1.449554443359375, 1.53338623046875, 1.617218017578125, 1.7010498046875, 1.784881591796875, 1.86871337890625, 1.952545166015625, 2.036376953125, 2.120208740234375, 2.20404052734375, 2.287872314453125, 2.3717041015625, 2.455535888671875, 2.53936767578125, 2.623199462890625, 2.70703125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 7.0, 8.0, 15.0, 19.0, 33.0, 38.0, 75.0, 81.0, 93.0, 125.0, 174.0, 228.0, 298.0, 480.0, 674.0, 931.0, 1338.0, 1886.0, 2751.0, 3921.0, 5811.0, 8560.0, 12294.0, 18036.0, 26877.0, 40322.0, 63808.0, 110094.0, 1283007.0, 224052.0, 107180.0, 61217.0, 39751.0, 26644.0, 17700.0, 12065.0, 8044.0, 5598.0, 3882.0, 2649.0, 1814.0, 1304.0, 939.0, 686.0, 502.0, 324.0, 241.0, 183.0, 100.0, 68.0, 61.0, 32.0, 33.0, 27.0, 23.0, 13.0, 14.0, 4.0, 5.0, 0.0, 4.0], "bins": [-0.587890625, -0.5695037841796875, -0.551116943359375, -0.5327301025390625, -0.51434326171875, -0.4959564208984375, -0.477569580078125, -0.4591827392578125, -0.4407958984375, -0.4224090576171875, -0.404022216796875, -0.3856353759765625, -0.36724853515625, -0.3488616943359375, -0.330474853515625, -0.3120880126953125, -0.293701171875, -0.2753143310546875, -0.256927490234375, -0.2385406494140625, -0.22015380859375, -0.2017669677734375, -0.183380126953125, -0.1649932861328125, -0.1466064453125, -0.1282196044921875, -0.109832763671875, -0.0914459228515625, -0.07305908203125, -0.0546722412109375, -0.036285400390625, -0.0178985595703125, 0.00048828125, 0.0188751220703125, 0.037261962890625, 0.0556488037109375, 0.07403564453125, 0.0924224853515625, 0.110809326171875, 0.1291961669921875, 0.1475830078125, 0.1659698486328125, 0.184356689453125, 0.2027435302734375, 0.22113037109375, 0.2395172119140625, 0.257904052734375, 0.2762908935546875, 0.294677734375, 0.3130645751953125, 0.331451416015625, 0.3498382568359375, 0.36822509765625, 0.3866119384765625, 0.404998779296875, 0.4233856201171875, 0.4417724609375, 0.4601593017578125, 0.478546142578125, 0.4969329833984375, 0.51531982421875, 0.5337066650390625, 0.552093505859375, 0.5704803466796875, 0.5888671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 10.0, 7.0, 10.0, 12.0, 27.0, 24.0, 28.0, 35.0, 36.0, 44.0, 50.0, 56.0, 60.0, 68.0, 67.0, 65.0, 62.0, 61.0, 48.0, 33.0, 39.0, 20.0, 28.0, 24.0, 13.0, 7.0, 6.0, 8.0, 8.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0001659393310546875, -0.00016099214553833008, -0.00015604496002197266, -0.00015109777450561523, -0.0001461505889892578, -0.0001412034034729004, -0.00013625621795654297, -0.00013130903244018555, -0.00012636184692382812, -0.0001214146614074707, -0.00011646747589111328, -0.00011152029037475586, -0.00010657310485839844, -0.00010162591934204102, -9.66787338256836e-05, -9.173154830932617e-05, -8.678436279296875e-05, -8.183717727661133e-05, -7.68899917602539e-05, -7.194280624389648e-05, -6.699562072753906e-05, -6.204843521118164e-05, -5.710124969482422e-05, -5.21540641784668e-05, -4.7206878662109375e-05, -4.225969314575195e-05, -3.731250762939453e-05, -3.236532211303711e-05, -2.7418136596679688e-05, -2.2470951080322266e-05, -1.7523765563964844e-05, -1.2576580047607422e-05, -7.62939453125e-06, -2.682209014892578e-06, 2.2649765014648438e-06, 7.212162017822266e-06, 1.2159347534179688e-05, 1.710653305053711e-05, 2.205371856689453e-05, 2.7000904083251953e-05, 3.1948089599609375e-05, 3.68952751159668e-05, 4.184246063232422e-05, 4.678964614868164e-05, 5.173683166503906e-05, 5.6684017181396484e-05, 6.16312026977539e-05, 6.657838821411133e-05, 7.152557373046875e-05, 7.647275924682617e-05, 8.14199447631836e-05, 8.636713027954102e-05, 9.131431579589844e-05, 9.626150131225586e-05, 0.00010120868682861328, 0.0001061558723449707, 0.00011110305786132812, 0.00011605024337768555, 0.00012099742889404297, 0.0001259446144104004, 0.0001308917999267578, 0.00013583898544311523, 0.00014078617095947266, 0.00014573335647583008, 0.0001506805419921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 3.0, 12.0, 12.0, 8.0, 10.0, 17.0, 33.0, 38.0, 43.0, 64.0, 75.0, 122.0, 215.0, 535.0, 2852.0, 1038074.0, 5030.0, 594.0, 269.0, 126.0, 100.0, 83.0, 47.0, 36.0, 29.0, 29.0, 22.0, 9.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00345611572265625, -0.0033429861068725586, -0.003229856491088867, -0.0031167268753051758, -0.0030035972595214844, -0.002890467643737793, -0.0027773380279541016, -0.00266420841217041, -0.0025510787963867188, -0.0024379491806030273, -0.002324819564819336, -0.0022116899490356445, -0.002098560333251953, -0.0019854307174682617, -0.0018723011016845703, -0.001759171485900879, -0.0016460418701171875, -0.001532912254333496, -0.0014197826385498047, -0.0013066530227661133, -0.0011935234069824219, -0.0010803937911987305, -0.0009672641754150391, -0.0008541345596313477, -0.0007410049438476562, -0.0006278753280639648, -0.0005147457122802734, -0.00040161609649658203, -0.0002884864807128906, -0.00017535686492919922, -6.222724914550781e-05, 5.0902366638183594e-05, 0.000164031982421875, 0.0002771615982055664, 0.0003902912139892578, 0.0005034208297729492, 0.0006165504455566406, 0.000729680061340332, 0.0008428096771240234, 0.0009559392929077148, 0.0010690689086914062, 0.0011821985244750977, 0.001295328140258789, 0.0014084577560424805, 0.0015215873718261719, 0.0016347169876098633, 0.0017478466033935547, 0.001860976219177246, 0.0019741058349609375, 0.002087235450744629, 0.0022003650665283203, 0.0023134946823120117, 0.002426624298095703, 0.0025397539138793945, 0.002652883529663086, 0.0027660131454467773, 0.0028791427612304688, 0.00299227237701416, 0.0031054019927978516, 0.003218531608581543, 0.0033316612243652344, 0.0034447908401489258, 0.003557920455932617, 0.0036710500717163086, 0.0037841796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 19.0, 47.0, 45.0, 97.0, 148.0, 178.0, 164.0, 124.0, 87.0, 44.0, 29.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00017212591774296016, -0.00016852229600772262, -0.0001649186888244003, -0.00016131506708916277, -0.00015771145990584046, -0.00015410783817060292, -0.0001505042309872806, -0.00014690060925204307, -0.00014329700206872076, -0.00013969338033348322, -0.0001360897731501609, -0.00013248615141492337, -0.00012888254423160106, -0.00012527892249636352, -0.00012167531531304121, -0.00011807169357780367, -0.00011446807911852375, -0.00011086446465924382, -0.0001072608501999639, -0.00010365723574068397, -0.00010005362128140405, -9.645000682212412e-05, -9.284638508688658e-05, -8.924277790356427e-05, -8.563915616832674e-05, -8.203554170904681e-05, -7.843192724976689e-05, -7.482831279048696e-05, -7.122469833120704e-05, -6.762108387192711e-05, -6.401746941264719e-05, -6.0413851315388456e-05, -5.6810244132066146e-05, -5.320662967278622e-05, -4.9603015213506296e-05, -4.5999397116247565e-05, -4.239578265696764e-05, -3.8792168197687715e-05, -3.518855373840779e-05, -3.1584939279127866e-05, -2.798132481984794e-05, -2.4377710360568017e-05, -2.0774095901288092e-05, -1.7170479623018764e-05, -1.356686516373884e-05, -9.963250704458915e-06, -6.3596344261895865e-06, -2.756019966909662e-06, 8.475944923702627e-07, 4.451209406397538e-06, 8.054824320424814e-06, 1.165843968919944e-05, 1.5262054148479365e-05, 1.886566860775929e-05, 2.2469284886028618e-05, 2.6072899345308542e-05, 2.9676513804588467e-05, 3.328012826386839e-05, 3.6883742723148316e-05, 4.048735718242824e-05, 4.4090971641708165e-05, 4.769458610098809e-05, 5.129820419824682e-05, 5.4901818657526746e-05, 5.850543311680667e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 10.0, 11.0, 16.0, 15.0, 19.0, 17.0, 21.0, 12.0, 27.0, 38.0, 24.0, 36.0, 31.0, 39.0, 46.0, 40.0, 38.0, 38.0, 45.0, 38.0, 37.0, 39.0, 41.0, 26.0, 32.0, 46.0, 26.0, 36.0, 18.0, 16.0, 22.0, 19.0, 12.0, 11.0, 11.0, 5.0, 8.0, 4.0, 6.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.396936416625977e-05, -7.145106792449951e-05, -6.893277168273926e-05, -6.6414475440979e-05, -6.389617919921875e-05, -6.13778829574585e-05, -5.885958671569824e-05, -5.634129047393799e-05, -5.3822994232177734e-05, -5.130469799041748e-05, -4.8786401748657227e-05, -4.626810550689697e-05, -4.374980926513672e-05, -4.1231513023376465e-05, -3.871321678161621e-05, -3.619492053985596e-05, -3.36766242980957e-05, -3.115832805633545e-05, -2.8640031814575195e-05, -2.612173557281494e-05, -2.3603439331054688e-05, -2.1085143089294434e-05, -1.856684684753418e-05, -1.6048550605773926e-05, -1.3530254364013672e-05, -1.1011958122253418e-05, -8.493661880493164e-06, -5.97536563873291e-06, -3.4570693969726562e-06, -9.387731552124023e-07, 1.5795230865478516e-06, 4.0978193283081055e-06, 6.616115570068359e-06, 9.134411811828613e-06, 1.1652708053588867e-05, 1.4171004295349121e-05, 1.6689300537109375e-05, 1.920759677886963e-05, 2.1725893020629883e-05, 2.4244189262390137e-05, 2.676248550415039e-05, 2.9280781745910645e-05, 3.17990779876709e-05, 3.431737422943115e-05, 3.6835670471191406e-05, 3.935396671295166e-05, 4.1872262954711914e-05, 4.439055919647217e-05, 4.690885543823242e-05, 4.9427151679992676e-05, 5.194544792175293e-05, 5.4463744163513184e-05, 5.698204040527344e-05, 5.950033664703369e-05, 6.201863288879395e-05, 6.45369291305542e-05, 6.705522537231445e-05, 6.957352161407471e-05, 7.209181785583496e-05, 7.461011409759521e-05, 7.712841033935547e-05, 7.964670658111572e-05, 8.216500282287598e-05, 8.468329906463623e-05, 8.720159530639648e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 8.0, 14.0, 19.0, 27.0, 24.0, 27.0, 33.0, 17.0, 34.0, 34.0, 30.0, 37.0, 28.0, 43.0, 54.0, 27.0, 39.0, 39.0, 39.0, 37.0, 40.0, 26.0, 31.0, 21.0, 30.0, 23.0, 21.0, 21.0, 25.0, 12.0, 16.0, 21.0, 8.0, 15.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.609375, -3.4932861328125, -3.377197265625, -3.2611083984375, -3.14501953125, -3.0289306640625, -2.912841796875, -2.7967529296875, -2.6806640625, -2.5645751953125, -2.448486328125, -2.3323974609375, -2.21630859375, -2.1002197265625, -1.984130859375, -1.8680419921875, -1.751953125, -1.6358642578125, -1.519775390625, -1.4036865234375, -1.28759765625, -1.1715087890625, -1.055419921875, -0.9393310546875, -0.8232421875, -0.7071533203125, -0.591064453125, -0.4749755859375, -0.35888671875, -0.2427978515625, -0.126708984375, -0.0106201171875, 0.10546875, 0.2215576171875, 0.337646484375, 0.4537353515625, 0.56982421875, 0.6859130859375, 0.802001953125, 0.9180908203125, 1.0341796875, 1.1502685546875, 1.266357421875, 1.3824462890625, 1.49853515625, 1.6146240234375, 1.730712890625, 1.8468017578125, 1.962890625, 2.0789794921875, 2.195068359375, 2.3111572265625, 2.42724609375, 2.5433349609375, 2.659423828125, 2.7755126953125, 2.8916015625, 3.0076904296875, 3.123779296875, 3.2398681640625, 3.35595703125, 3.4720458984375, 3.588134765625, 3.7042236328125, 3.8203125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 4.0, 7.0, 16.0, 10.0, 11.0, 22.0, 31.0, 50.0, 54.0, 68.0, 93.0, 106.0, 156.0, 250.0, 439.0, 923.0, 2376.0, 6225.0, 16749.0, 45198.0, 115421.0, 278323.0, 347228.0, 143335.0, 56751.0, 21298.0, 7899.0, 2887.0, 1156.0, 494.0, 277.0, 167.0, 117.0, 93.0, 75.0, 47.0, 38.0, 39.0, 23.0, 22.0, 15.0, 12.0, 9.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.84765625, -3.71990966796875, -3.5921630859375, -3.46441650390625, -3.336669921875, -3.20892333984375, -3.0811767578125, -2.95343017578125, -2.82568359375, -2.69793701171875, -2.5701904296875, -2.44244384765625, -2.314697265625, -2.18695068359375, -2.0592041015625, -1.93145751953125, -1.8037109375, -1.67596435546875, -1.5482177734375, -1.42047119140625, -1.292724609375, -1.16497802734375, -1.0372314453125, -0.90948486328125, -0.78173828125, -0.65399169921875, -0.5262451171875, -0.39849853515625, -0.270751953125, -0.14300537109375, -0.0152587890625, 0.11248779296875, 0.240234375, 0.36798095703125, 0.4957275390625, 0.62347412109375, 0.751220703125, 0.87896728515625, 1.0067138671875, 1.13446044921875, 1.26220703125, 1.38995361328125, 1.5177001953125, 1.64544677734375, 1.773193359375, 1.90093994140625, 2.0286865234375, 2.15643310546875, 2.2841796875, 2.41192626953125, 2.5396728515625, 2.66741943359375, 2.795166015625, 2.92291259765625, 3.0506591796875, 3.17840576171875, 3.30615234375, 3.43389892578125, 3.5616455078125, 3.68939208984375, 3.817138671875, 3.94488525390625, 4.0726318359375, 4.20037841796875, 4.328125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 0.0, 4.0, 5.0, 12.0, 11.0, 11.0, 8.0, 16.0, 21.0, 21.0, 20.0, 27.0, 22.0, 37.0, 41.0, 41.0, 57.0, 65.0, 166.0, 1440.0, 415.0, 128.0, 75.0, 50.0, 58.0, 41.0, 42.0, 29.0, 33.0, 35.0, 15.0, 16.0, 9.0, 14.0, 9.0, 10.0, 9.0, 7.0, 9.0, 1.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.421875, -11.0272216796875, -10.632568359375, -10.2379150390625, -9.84326171875, -9.4486083984375, -9.053955078125, -8.6593017578125, -8.2646484375, -7.8699951171875, -7.475341796875, -7.0806884765625, -6.68603515625, -6.2913818359375, -5.896728515625, -5.5020751953125, -5.107421875, -4.7127685546875, -4.318115234375, -3.9234619140625, -3.52880859375, -3.1341552734375, -2.739501953125, -2.3448486328125, -1.9501953125, -1.5555419921875, -1.160888671875, -0.7662353515625, -0.37158203125, 0.0230712890625, 0.417724609375, 0.8123779296875, 1.20703125, 1.6016845703125, 1.996337890625, 2.3909912109375, 2.78564453125, 3.1802978515625, 3.574951171875, 3.9696044921875, 4.3642578125, 4.7589111328125, 5.153564453125, 5.5482177734375, 5.94287109375, 6.3375244140625, 6.732177734375, 7.1268310546875, 7.521484375, 7.9161376953125, 8.310791015625, 8.7054443359375, 9.10009765625, 9.4947509765625, 9.889404296875, 10.2840576171875, 10.6787109375, 11.0733642578125, 11.468017578125, 11.8626708984375, 12.25732421875, 12.6519775390625, 13.046630859375, 13.4412841796875, 13.8359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 7.0, 3.0, 4.0, 13.0, 20.0, 32.0, 25.0, 35.0, 32.0, 59.0, 96.0, 110.0, 187.0, 347.0, 779.0, 3974.0, 3117233.0, 20501.0, 1138.0, 451.0, 198.0, 137.0, 94.0, 67.0, 45.0, 29.0, 16.0, 20.0, 9.0, 13.0, 7.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.4375, -48.7373046875, -47.037109375, -45.3369140625, -43.63671875, -41.9365234375, -40.236328125, -38.5361328125, -36.8359375, -35.1357421875, -33.435546875, -31.7353515625, -30.03515625, -28.3349609375, -26.634765625, -24.9345703125, -23.234375, -21.5341796875, -19.833984375, -18.1337890625, -16.43359375, -14.7333984375, -13.033203125, -11.3330078125, -9.6328125, -7.9326171875, -6.232421875, -4.5322265625, -2.83203125, -1.1318359375, 0.568359375, 2.2685546875, 3.96875, 5.6689453125, 7.369140625, 9.0693359375, 10.76953125, 12.4697265625, 14.169921875, 15.8701171875, 17.5703125, 19.2705078125, 20.970703125, 22.6708984375, 24.37109375, 26.0712890625, 27.771484375, 29.4716796875, 31.171875, 32.8720703125, 34.572265625, 36.2724609375, 37.97265625, 39.6728515625, 41.373046875, 43.0732421875, 44.7734375, 46.4736328125, 48.173828125, 49.8740234375, 51.57421875, 53.2744140625, 54.974609375, 56.6748046875, 58.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 21.0, 55.0, 128.0, 214.0, 257.0, 196.0, 90.0, 35.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.67979621887207, -16.764461517333984, -15.849126815795898, -14.933792114257812, -14.018457412719727, -13.10312271118164, -12.187788009643555, -11.272453308105469, -10.357118606567383, -9.441783905029297, -8.526449203491211, -7.611114501953125, -6.695779800415039, -5.780445098876953, -4.865110397338867, -3.9497756958007812, -3.0344409942626953, -2.1191062927246094, -1.2037715911865234, -0.2884368896484375, 0.6268978118896484, 1.5422325134277344, 2.4575672149658203, 3.3729019165039062, 4.288236618041992, 5.203571319580078, 6.118906021118164, 7.03424072265625, 7.949575424194336, 8.864910125732422, 9.780244827270508, 10.695579528808594, 11.610912322998047, 12.526247024536133, 13.441581726074219, 14.356916427612305, 15.27225112915039, 16.187585830688477, 17.102920532226562, 18.01825523376465, 18.933589935302734, 19.84892463684082, 20.764259338378906, 21.679594039916992, 22.594928741455078, 23.510263442993164, 24.42559814453125, 25.340932846069336, 26.256267547607422, 27.171602249145508, 28.086936950683594, 29.00227165222168, 29.917606353759766, 30.83294105529785, 31.748275756835938, 32.663612365722656, 33.57894515991211, 34.49427795410156, 35.40961456298828, 36.324951171875, 37.24028396606445, 38.155616760253906, 39.070953369140625, 39.986289978027344, 40.9016227722168]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 9.0, 10.0, 12.0, 11.0, 13.0, 14.0, 27.0, 32.0, 27.0, 36.0, 34.0, 46.0, 37.0, 31.0, 28.0, 39.0, 55.0, 42.0, 37.0, 48.0, 44.0, 38.0, 44.0, 37.0, 31.0, 27.0, 24.0, 25.0, 22.0, 26.0, 18.0, 9.0, 13.0, 7.0, 4.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.4241828918457, -31.450801849365234, -30.477420806884766, -29.504039764404297, -28.530658721923828, -27.55727767944336, -26.583898544311523, -25.610517501831055, -24.637136459350586, -23.663755416870117, -22.69037437438965, -21.71699333190918, -20.743614196777344, -19.770233154296875, -18.796852111816406, -17.823471069335938, -16.85009002685547, -15.876708984375, -14.903327941894531, -13.929947853088379, -12.95656681060791, -11.983185768127441, -11.009805679321289, -10.03642463684082, -9.063043594360352, -8.089662551879883, -7.116281986236572, -6.142901420593262, -5.169520378112793, -4.196139335632324, -3.2227587699890137, -2.249378204345703, -1.2759971618652344, -0.3026163578033447, 0.6707644462585449, 1.6441452503204346, 2.617526054382324, 3.590907096862793, 4.5642876625061035, 5.537668228149414, 6.511049270629883, 7.484430313110352, 8.45781135559082, 9.431191444396973, 10.404572486877441, 11.37795352935791, 12.351333618164062, 13.324714660644531, 14.298095703125, 15.271476745605469, 16.244857788085938, 17.218238830566406, 18.191619873046875, 19.165000915527344, 20.13838005065918, 21.11176109313965, 22.085142135620117, 23.058523178100586, 24.031904220581055, 25.005285263061523, 25.97866439819336, 26.952045440673828, 27.925426483154297, 28.898807525634766, 29.872188568115234]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 7.0, 8.0, 8.0, 6.0, 7.0, 10.0, 14.0, 12.0, 24.0, 25.0, 20.0, 26.0, 26.0, 40.0, 22.0, 27.0, 41.0, 33.0, 27.0, 47.0, 39.0, 36.0, 38.0, 26.0, 38.0, 45.0, 40.0, 31.0, 22.0, 33.0, 22.0, 26.0, 26.0, 17.0, 17.0, 12.0, 13.0, 19.0, 13.0, 12.0, 13.0, 8.0, 3.0, 5.0, 6.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.70703125, -3.5831298828125, -3.459228515625, -3.3353271484375, -3.21142578125, -3.0875244140625, -2.963623046875, -2.8397216796875, -2.7158203125, -2.5919189453125, -2.468017578125, -2.3441162109375, -2.22021484375, -2.0963134765625, -1.972412109375, -1.8485107421875, -1.724609375, -1.6007080078125, -1.476806640625, -1.3529052734375, -1.22900390625, -1.1051025390625, -0.981201171875, -0.8572998046875, -0.7333984375, -0.6094970703125, -0.485595703125, -0.3616943359375, -0.23779296875, -0.1138916015625, 0.010009765625, 0.1339111328125, 0.2578125, 0.3817138671875, 0.505615234375, 0.6295166015625, 0.75341796875, 0.8773193359375, 1.001220703125, 1.1251220703125, 1.2490234375, 1.3729248046875, 1.496826171875, 1.6207275390625, 1.74462890625, 1.8685302734375, 1.992431640625, 2.1163330078125, 2.240234375, 2.3641357421875, 2.488037109375, 2.6119384765625, 2.73583984375, 2.8597412109375, 2.983642578125, 3.1075439453125, 3.2314453125, 3.3553466796875, 3.479248046875, 3.6031494140625, 3.72705078125, 3.8509521484375, 3.974853515625, 4.0987548828125, 4.22265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 9.0, 18.0, 19.0, 25.0, 31.0, 29.0, 41.0, 62.0, 66.0, 67.0, 95.0, 118.0, 152.0, 259.0, 923.0, 9554.0, 457803.0, 3304912.0, 409136.0, 8970.0, 924.0, 272.0, 155.0, 121.0, 71.0, 77.0, 56.0, 45.0, 48.0, 35.0, 35.0, 22.0, 15.0, 21.0, 10.0, 18.0, 4.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.359375, -11.9539794921875, -11.548583984375, -11.1431884765625, -10.73779296875, -10.3323974609375, -9.927001953125, -9.5216064453125, -9.1162109375, -8.7108154296875, -8.305419921875, -7.9000244140625, -7.49462890625, -7.0892333984375, -6.683837890625, -6.2784423828125, -5.873046875, -5.4676513671875, -5.062255859375, -4.6568603515625, -4.25146484375, -3.8460693359375, -3.440673828125, -3.0352783203125, -2.6298828125, -2.2244873046875, -1.819091796875, -1.4136962890625, -1.00830078125, -0.6029052734375, -0.197509765625, 0.2078857421875, 0.61328125, 1.0186767578125, 1.424072265625, 1.8294677734375, 2.23486328125, 2.6402587890625, 3.045654296875, 3.4510498046875, 3.8564453125, 4.2618408203125, 4.667236328125, 5.0726318359375, 5.47802734375, 5.8834228515625, 6.288818359375, 6.6942138671875, 7.099609375, 7.5050048828125, 7.910400390625, 8.3157958984375, 8.72119140625, 9.1265869140625, 9.531982421875, 9.9373779296875, 10.3427734375, 10.7481689453125, 11.153564453125, 11.5589599609375, 11.96435546875, 12.3697509765625, 12.775146484375, 13.1805419921875, 13.5859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 6.0, 8.0, 6.0, 8.0, 12.0, 13.0, 23.0, 23.0, 41.0, 56.0, 76.0, 78.0, 139.0, 163.0, 214.0, 248.0, 319.0, 370.0, 382.0, 387.0, 350.0, 257.0, 210.0, 143.0, 115.0, 101.0, 63.0, 54.0, 47.0, 39.0, 29.0, 22.0, 18.0, 11.0, 3.0, 6.0, 10.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.7862548828125, -4.592041015625, -4.3978271484375, -4.20361328125, -4.0093994140625, -3.815185546875, -3.6209716796875, -3.4267578125, -3.2325439453125, -3.038330078125, -2.8441162109375, -2.64990234375, -2.4556884765625, -2.261474609375, -2.0672607421875, -1.873046875, -1.6788330078125, -1.484619140625, -1.2904052734375, -1.09619140625, -0.9019775390625, -0.707763671875, -0.5135498046875, -0.3193359375, -0.1251220703125, 0.069091796875, 0.2633056640625, 0.45751953125, 0.6517333984375, 0.845947265625, 1.0401611328125, 1.234375, 1.4285888671875, 1.622802734375, 1.8170166015625, 2.01123046875, 2.2054443359375, 2.399658203125, 2.5938720703125, 2.7880859375, 2.9822998046875, 3.176513671875, 3.3707275390625, 3.56494140625, 3.7591552734375, 3.953369140625, 4.1475830078125, 4.341796875, 4.5360107421875, 4.730224609375, 4.9244384765625, 5.11865234375, 5.3128662109375, 5.507080078125, 5.7012939453125, 5.8955078125, 6.0897216796875, 6.283935546875, 6.4781494140625, 6.67236328125, 6.8665771484375, 7.060791015625, 7.2550048828125, 7.44921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 3.0, 11.0, 13.0, 24.0, 18.0, 39.0, 43.0, 63.0, 65.0, 110.0, 127.0, 162.0, 198.0, 271.0, 409.0, 836.0, 42163.0, 4076390.0, 70640.0, 975.0, 405.0, 313.0, 243.0, 185.0, 149.0, 110.0, 70.0, 56.0, 40.0, 40.0, 22.0, 13.0, 12.0, 9.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0], "bins": [-39.28125, -38.261962890625, -37.24267578125, -36.223388671875, -35.2041015625, -34.184814453125, -33.16552734375, -32.146240234375, -31.126953125, -30.107666015625, -29.08837890625, -28.069091796875, -27.0498046875, -26.030517578125, -25.01123046875, -23.991943359375, -22.97265625, -21.953369140625, -20.93408203125, -19.914794921875, -18.8955078125, -17.876220703125, -16.85693359375, -15.837646484375, -14.818359375, -13.799072265625, -12.77978515625, -11.760498046875, -10.7412109375, -9.721923828125, -8.70263671875, -7.683349609375, -6.6640625, -5.644775390625, -4.62548828125, -3.606201171875, -2.5869140625, -1.567626953125, -0.54833984375, 0.470947265625, 1.490234375, 2.509521484375, 3.52880859375, 4.548095703125, 5.5673828125, 6.586669921875, 7.60595703125, 8.625244140625, 9.64453125, 10.663818359375, 11.68310546875, 12.702392578125, 13.7216796875, 14.740966796875, 15.76025390625, 16.779541015625, 17.798828125, 18.818115234375, 19.83740234375, 20.856689453125, 21.8759765625, 22.895263671875, 23.91455078125, 24.933837890625, 25.953125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 25.0, 177.0, 391.0, 309.0, 98.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.38491439819336, -19.52646827697754, -16.66802215576172, -13.809574127197266, -10.951128005981445, -8.092681884765625, -5.234233856201172, -2.3757877349853516, 0.48265838623046875, 3.3411049842834473, 6.199551582336426, 9.057998657226562, 11.916444778442383, 14.774890899658203, 17.633338928222656, 20.491785049438477, 23.350231170654297, 26.208677291870117, 29.067123413085938, 31.92557144165039, 34.784019470214844, 37.64246368408203, 40.500911712646484, 43.35935974121094, 46.217803955078125, 49.07625198364258, 51.934696197509766, 54.79314422607422, 57.651588439941406, 60.51003646850586, 63.36848449707031, 66.2269287109375, 69.08537292480469, 71.94381713867188, 74.8022689819336, 77.66071319580078, 80.51915740966797, 83.37760925292969, 86.23605346679688, 89.09449768066406, 91.95294189453125, 94.81138610839844, 97.66983795166016, 100.52828216552734, 103.38672637939453, 106.24517822265625, 109.10362243652344, 111.96206665039062, 114.82051849365234, 117.67896270751953, 120.53741455078125, 123.39585876464844, 126.25430297851562, 129.1127471923828, 131.97119140625, 134.82965087890625, 137.68809509277344, 140.54653930664062, 143.4049835205078, 146.263427734375, 149.12188720703125, 151.98033142089844, 154.83877563476562, 157.6972198486328, 160.5556640625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 4.0, 12.0, 18.0, 19.0, 21.0, 23.0, 19.0, 17.0, 30.0, 24.0, 37.0, 34.0, 39.0, 36.0, 50.0, 43.0, 41.0, 42.0, 53.0, 38.0, 42.0, 38.0, 37.0, 25.0, 30.0, 24.0, 30.0, 24.0, 24.0, 16.0, 9.0, 20.0, 15.0, 10.0, 7.0, 11.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.612600326538086, -23.874149322509766, -23.135698318481445, -22.397247314453125, -21.658796310424805, -20.920345306396484, -20.181894302368164, -19.443443298339844, -18.704992294311523, -17.966541290283203, -17.228090286254883, -16.489639282226562, -15.751188278198242, -15.012737274169922, -14.274286270141602, -13.535835266113281, -12.797384262084961, -12.05893325805664, -11.32048225402832, -10.58203125, -9.84358024597168, -9.10512924194336, -8.366678237915039, -7.628227233886719, -6.889776229858398, -6.151325225830078, -5.412874221801758, -4.6744232177734375, -3.935972213745117, -3.197521209716797, -2.4590702056884766, -1.7206192016601562, -0.9821662902832031, -0.2437152862548828, 0.4947357177734375, 1.2331867218017578, 1.9716377258300781, 2.7100887298583984, 3.4485397338867188, 4.186990737915039, 4.925441741943359, 5.66389274597168, 6.40234375, 7.14079475402832, 7.879245758056641, 8.617696762084961, 9.356147766113281, 10.094598770141602, 10.833049774169922, 11.571500778198242, 12.309951782226562, 13.048402786254883, 13.786853790283203, 14.525304794311523, 15.263755798339844, 16.002206802368164, 16.740657806396484, 17.479108810424805, 18.217559814453125, 18.956010818481445, 19.694461822509766, 20.432912826538086, 21.171363830566406, 21.909814834594727, 22.648265838623047]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 7.0, 18.0, 24.0, 23.0, 19.0, 26.0, 22.0, 24.0, 23.0, 29.0, 32.0, 28.0, 37.0, 42.0, 36.0, 41.0, 39.0, 33.0, 29.0, 33.0, 28.0, 30.0, 33.0, 26.0, 34.0, 21.0, 27.0, 25.0, 25.0, 18.0, 23.0, 15.0, 20.0, 11.0, 11.0, 7.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.7734375, -3.6602783203125, -3.547119140625, -3.4339599609375, -3.32080078125, -3.2076416015625, -3.094482421875, -2.9813232421875, -2.8681640625, -2.7550048828125, -2.641845703125, -2.5286865234375, -2.41552734375, -2.3023681640625, -2.189208984375, -2.0760498046875, -1.962890625, -1.8497314453125, -1.736572265625, -1.6234130859375, -1.51025390625, -1.3970947265625, -1.283935546875, -1.1707763671875, -1.0576171875, -0.9444580078125, -0.831298828125, -0.7181396484375, -0.60498046875, -0.4918212890625, -0.378662109375, -0.2655029296875, -0.15234375, -0.0391845703125, 0.073974609375, 0.1871337890625, 0.30029296875, 0.4134521484375, 0.526611328125, 0.6397705078125, 0.7529296875, 0.8660888671875, 0.979248046875, 1.0924072265625, 1.20556640625, 1.3187255859375, 1.431884765625, 1.5450439453125, 1.658203125, 1.7713623046875, 1.884521484375, 1.9976806640625, 2.11083984375, 2.2239990234375, 2.337158203125, 2.4503173828125, 2.5634765625, 2.6766357421875, 2.789794921875, 2.9029541015625, 3.01611328125, 3.1292724609375, 3.242431640625, 3.3555908203125, 3.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 19.0, 25.0, 42.0, 62.0, 84.0, 120.0, 151.0, 260.0, 352.0, 507.0, 688.0, 1011.0, 1506.0, 2230.0, 3264.0, 4652.0, 7097.0, 10605.0, 15781.0, 23820.0, 35868.0, 54690.0, 88325.0, 152243.0, 249742.0, 148529.0, 85824.0, 54057.0, 35536.0, 23500.0, 15678.0, 10435.0, 7023.0, 4729.0, 3144.0, 2149.0, 1497.0, 1033.0, 669.0, 448.0, 375.0, 242.0, 174.0, 117.0, 79.0, 53.0, 32.0, 33.0, 12.0, 7.0, 13.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.573944091796875, -0.55511474609375, -0.536285400390625, -0.5174560546875, -0.498626708984375, -0.47979736328125, -0.460968017578125, -0.442138671875, -0.423309326171875, -0.40447998046875, -0.385650634765625, -0.3668212890625, -0.347991943359375, -0.32916259765625, -0.310333251953125, -0.29150390625, -0.272674560546875, -0.25384521484375, -0.235015869140625, -0.2161865234375, -0.197357177734375, -0.17852783203125, -0.159698486328125, -0.140869140625, -0.122039794921875, -0.10321044921875, -0.084381103515625, -0.0655517578125, -0.046722412109375, -0.02789306640625, -0.009063720703125, 0.009765625, 0.028594970703125, 0.04742431640625, 0.066253662109375, 0.0850830078125, 0.103912353515625, 0.12274169921875, 0.141571044921875, 0.160400390625, 0.179229736328125, 0.19805908203125, 0.216888427734375, 0.2357177734375, 0.254547119140625, 0.27337646484375, 0.292205810546875, 0.31103515625, 0.329864501953125, 0.34869384765625, 0.367523193359375, 0.3863525390625, 0.405181884765625, 0.42401123046875, 0.442840576171875, 0.461669921875, 0.480499267578125, 0.49932861328125, 0.518157958984375, 0.5369873046875, 0.555816650390625, 0.57464599609375, 0.593475341796875, 0.6123046875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 4.0, 14.0, 15.0, 9.0, 8.0, 23.0, 19.0, 20.0, 34.0, 26.0, 41.0, 44.0, 38.0, 31.0, 52.0, 40.0, 51.0, 1069.0, 46.0, 37.0, 50.0, 39.0, 47.0, 40.0, 40.0, 25.0, 32.0, 17.0, 17.0, 22.0, 12.0, 7.0, 12.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76025390625, -2.6689453125, -2.57763671875, -2.486328125, -2.39501953125, -2.3037109375, -2.21240234375, -2.12109375, -2.02978515625, -1.9384765625, -1.84716796875, -1.755859375, -1.66455078125, -1.5732421875, -1.48193359375, -1.390625, -1.29931640625, -1.2080078125, -1.11669921875, -1.025390625, -0.93408203125, -0.8427734375, -0.75146484375, -0.66015625, -0.56884765625, -0.4775390625, -0.38623046875, -0.294921875, -0.20361328125, -0.1123046875, -0.02099609375, 0.0703125, 0.16162109375, 0.2529296875, 0.34423828125, 0.435546875, 0.52685546875, 0.6181640625, 0.70947265625, 0.80078125, 0.89208984375, 0.9833984375, 1.07470703125, 1.166015625, 1.25732421875, 1.3486328125, 1.43994140625, 1.53125, 1.62255859375, 1.7138671875, 1.80517578125, 1.896484375, 1.98779296875, 2.0791015625, 2.17041015625, 2.26171875, 2.35302734375, 2.4443359375, 2.53564453125, 2.626953125, 2.71826171875, 2.8095703125, 2.90087890625, 2.9921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 8.0, 2.0, 8.0, 5.0, 12.0, 6.0, 30.0, 27.0, 48.0, 76.0, 134.0, 156.0, 272.0, 411.0, 576.0, 837.0, 1210.0, 1838.0, 2604.0, 3868.0, 5675.0, 8281.0, 12679.0, 18822.0, 29571.0, 46929.0, 79271.0, 149763.0, 1339434.0, 166250.0, 85518.0, 50654.0, 31304.0, 20156.0, 13057.0, 8719.0, 6085.0, 4072.0, 2782.0, 1880.0, 1359.0, 888.0, 610.0, 390.0, 281.0, 199.0, 118.0, 98.0, 62.0, 39.0, 21.0, 18.0, 12.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.64208984375, -0.62237548828125, -0.6026611328125, -0.58294677734375, -0.563232421875, -0.54351806640625, -0.5238037109375, -0.50408935546875, -0.484375, -0.46466064453125, -0.4449462890625, -0.42523193359375, -0.405517578125, -0.38580322265625, -0.3660888671875, -0.34637451171875, -0.32666015625, -0.30694580078125, -0.2872314453125, -0.26751708984375, -0.247802734375, -0.22808837890625, -0.2083740234375, -0.18865966796875, -0.1689453125, -0.14923095703125, -0.1295166015625, -0.10980224609375, -0.090087890625, -0.07037353515625, -0.0506591796875, -0.03094482421875, -0.01123046875, 0.00848388671875, 0.0281982421875, 0.04791259765625, 0.067626953125, 0.08734130859375, 0.1070556640625, 0.12677001953125, 0.146484375, 0.16619873046875, 0.1859130859375, 0.20562744140625, 0.225341796875, 0.24505615234375, 0.2647705078125, 0.28448486328125, 0.30419921875, 0.32391357421875, 0.3436279296875, 0.36334228515625, 0.383056640625, 0.40277099609375, 0.4224853515625, 0.44219970703125, 0.4619140625, 0.48162841796875, 0.5013427734375, 0.52105712890625, 0.540771484375, 0.56048583984375, 0.5802001953125, 0.59991455078125, 0.61962890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 5.0, 10.0, 17.0, 22.0, 32.0, 30.0, 44.0, 55.0, 68.0, 63.0, 59.0, 62.0, 63.0, 55.0, 71.0, 63.0, 47.0, 40.0, 32.0, 24.0, 25.0, 23.0, 14.0, 11.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011867284774780273, -0.0001133875921368599, -0.00010810233652591705, -0.00010281708091497421, -9.753182530403137e-05, -9.224656969308853e-05, -8.696131408214569e-05, -8.167605847120285e-05, -7.639080286026001e-05, -7.110554724931717e-05, -6.582029163837433e-05, -6.053503602743149e-05, -5.524978041648865e-05, -4.996452480554581e-05, -4.4679269194602966e-05, -3.9394013583660126e-05, -3.4108757972717285e-05, -2.8823502361774445e-05, -2.3538246750831604e-05, -1.8252991139888763e-05, -1.2967735528945923e-05, -7.682479918003082e-06, -2.3972243070602417e-06, 2.888031303882599e-06, 8.17328691482544e-06, 1.345854252576828e-05, 1.874379813671112e-05, 2.402905374765396e-05, 2.9314309358596802e-05, 3.459956496953964e-05, 3.988482058048248e-05, 4.5170076191425323e-05, 5.0455331802368164e-05, 5.5740587413311005e-05, 6.1025843024253845e-05, 6.631109863519669e-05, 7.159635424613953e-05, 7.688160985708237e-05, 8.216686546802521e-05, 8.745212107896805e-05, 9.273737668991089e-05, 9.802263230085373e-05, 0.00010330788791179657, 0.00010859314352273941, 0.00011387839913368225, 0.00011916365474462509, 0.00012444891035556793, 0.00012973416596651077, 0.0001350194215774536, 0.00014030467718839645, 0.0001455899327993393, 0.00015087518841028214, 0.00015616044402122498, 0.00016144569963216782, 0.00016673095524311066, 0.0001720162108540535, 0.00017730146646499634, 0.00018258672207593918, 0.00018787197768688202, 0.00019315723329782486, 0.0001984424889087677, 0.00020372774451971054, 0.00020901300013065338, 0.00021429825574159622, 0.00021958351135253906]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 9.0, 10.0, 19.0, 17.0, 35.0, 38.0, 50.0, 60.0, 87.0, 123.0, 196.0, 332.0, 818.0, 12382.0, 1030579.0, 2435.0, 602.0, 251.0, 137.0, 90.0, 59.0, 54.0, 40.0, 27.0, 16.0, 14.0, 15.0, 15.0, 13.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.004535675048828125, -0.004423230886459351, -0.004310786724090576, -0.004198342561721802, -0.004085898399353027, -0.003973454236984253, -0.0038610100746154785, -0.003748565912246704, -0.0036361217498779297, -0.0035236775875091553, -0.003411233425140381, -0.0032987892627716064, -0.003186345100402832, -0.0030739009380340576, -0.002961456775665283, -0.002849012613296509, -0.0027365684509277344, -0.00262412428855896, -0.0025116801261901855, -0.002399235963821411, -0.0022867918014526367, -0.0021743476390838623, -0.002061903476715088, -0.0019494593143463135, -0.001837015151977539, -0.0017245709896087646, -0.0016121268272399902, -0.0014996826648712158, -0.0013872385025024414, -0.001274794340133667, -0.0011623501777648926, -0.0010499060153961182, -0.0009374618530273438, -0.0008250176906585693, -0.0007125735282897949, -0.0006001293659210205, -0.0004876852035522461, -0.0003752410411834717, -0.00026279687881469727, -0.00015035271644592285, -3.790855407714844e-05, 7.453560829162598e-05, 0.0001869797706604004, 0.0002994239330291748, 0.0004118680953979492, 0.0005243122577667236, 0.000636756420135498, 0.0007492005825042725, 0.0008616447448730469, 0.0009740889072418213, 0.0010865330696105957, 0.0011989772319793701, 0.0013114213943481445, 0.001423865556716919, 0.0015363097190856934, 0.0016487538814544678, 0.0017611980438232422, 0.0018736422061920166, 0.001986086368560791, 0.0020985305309295654, 0.00221097469329834, 0.0023234188556671143, 0.0024358630180358887, 0.002548307180404663, 0.0026607513427734375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 219.0, 568.0, 200.0, 15.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022592559980694205, -0.00021223867952357978, -0.00019855177379213274, -0.00018486485350877047, -0.0001711779332254082, -0.00015749101294204593, -0.00014380409265868366, -0.00013011718692723662, -0.00011643026664387435, -0.00010274334636051208, -8.905643335310742e-05, -7.536952034570277e-05, -6.16826000623405e-05, -4.799567977897823e-05, -3.430876677157357e-05, -2.0621853764168918e-05, -6.934933480806649e-06, 6.751983164576814e-06, 2.0438899809960276e-05, 3.412581645534374e-05, 4.78127331007272e-05, 6.149965338408947e-05, 7.518656639149413e-05, 8.887347939889878e-05, 0.00010256039968226105, 0.00011624731996562332, 0.00012993422569707036, 0.00014362114598043263, 0.0001573080662637949, 0.00017099498654715717, 0.00018468190683051944, 0.00019836881256196648, 0.00021205574739724398, 0.00022574266768060625, 0.00023942958796396852, 0.0002531165082473308, 0.00026680342853069305, 0.00028049031971022487, 0.00029417723999358714, 0.0003078641602769494, 0.0003215510805603117, 0.00033523800084367394, 0.0003489249211270362, 0.0003626118414103985, 0.0003762987325899303, 0.000389985681977123, 0.00040367257315665483, 0.0004173594934400171, 0.0004310464137233794, 0.00044473333400674164, 0.0004584202542901039, 0.0004721071745734662, 0.00048579409485682845, 0.0004994809860363603, 0.000513167935423553, 0.0005268548266030848, 0.0005405417177826166, 0.0005542286089621484, 0.0005679155583493412, 0.000581602449528873, 0.0005952893989160657, 0.0006089762900955975, 0.0006226632394827902, 0.000636350130662322, 0.0006500370800495148]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 8.0, 9.0, 11.0, 15.0, 12.0, 13.0, 18.0, 15.0, 18.0, 35.0, 33.0, 18.0, 27.0, 36.0, 41.0, 35.0, 39.0, 41.0, 26.0, 37.0, 38.0, 45.0, 29.0, 38.0, 31.0, 45.0, 23.0, 24.0, 20.0, 37.0, 20.0, 29.0, 24.0, 15.0, 15.0, 11.0, 15.0, 9.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-7.963180541992188e-05, -7.73230567574501e-05, -7.501430809497833e-05, -7.270555943250656e-05, -7.039681077003479e-05, -6.808806210756302e-05, -6.577931344509125e-05, -6.347056478261948e-05, -6.11618161201477e-05, -5.8853067457675934e-05, -5.654431879520416e-05, -5.423557013273239e-05, -5.192682147026062e-05, -4.961807280778885e-05, -4.730932414531708e-05, -4.5000575482845306e-05, -4.2691826820373535e-05, -4.0383078157901764e-05, -3.807432949542999e-05, -3.576558083295822e-05, -3.345683217048645e-05, -3.114808350801468e-05, -2.8839334845542908e-05, -2.6530586183071136e-05, -2.4221837520599365e-05, -2.1913088858127594e-05, -1.9604340195655823e-05, -1.729559153318405e-05, -1.498684287071228e-05, -1.2678094208240509e-05, -1.0369345545768738e-05, -8.060596883296967e-06, -5.751848220825195e-06, -3.443099558353424e-06, -1.1343508958816528e-06, 1.1743977665901184e-06, 3.4831464290618896e-06, 5.791895091533661e-06, 8.100643754005432e-06, 1.0409392416477203e-05, 1.2718141078948975e-05, 1.5026889741420746e-05, 1.7335638403892517e-05, 1.964438706636429e-05, 2.195313572883606e-05, 2.426188439130783e-05, 2.6570633053779602e-05, 2.8879381716251373e-05, 3.1188130378723145e-05, 3.3496879041194916e-05, 3.580562770366669e-05, 3.811437636613846e-05, 4.042312502861023e-05, 4.2731873691082e-05, 4.504062235355377e-05, 4.734937101602554e-05, 4.9658119678497314e-05, 5.1966868340969086e-05, 5.427561700344086e-05, 5.658436566591263e-05, 5.88931143283844e-05, 6.120186299085617e-05, 6.351061165332794e-05, 6.581936031579971e-05, 6.812810897827148e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 7.0, 18.0, 24.0, 23.0, 19.0, 26.0, 22.0, 24.0, 23.0, 29.0, 32.0, 28.0, 37.0, 42.0, 36.0, 41.0, 39.0, 33.0, 29.0, 33.0, 28.0, 30.0, 33.0, 26.0, 34.0, 21.0, 27.0, 25.0, 25.0, 18.0, 23.0, 15.0, 20.0, 11.0, 11.0, 7.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.7734375, -3.6602783203125, -3.547119140625, -3.4339599609375, -3.32080078125, -3.2076416015625, -3.094482421875, -2.9813232421875, -2.8681640625, -2.7550048828125, -2.641845703125, -2.5286865234375, -2.41552734375, -2.3023681640625, -2.189208984375, -2.0760498046875, -1.962890625, -1.8497314453125, -1.736572265625, -1.6234130859375, -1.51025390625, -1.3970947265625, -1.283935546875, -1.1707763671875, -1.0576171875, -0.9444580078125, -0.831298828125, -0.7181396484375, -0.60498046875, -0.4918212890625, -0.378662109375, -0.2655029296875, -0.15234375, -0.0391845703125, 0.073974609375, 0.1871337890625, 0.30029296875, 0.4134521484375, 0.526611328125, 0.6397705078125, 0.7529296875, 0.8660888671875, 0.979248046875, 1.0924072265625, 1.20556640625, 1.3187255859375, 1.431884765625, 1.5450439453125, 1.658203125, 1.7713623046875, 1.884521484375, 1.9976806640625, 2.11083984375, 2.2239990234375, 2.337158203125, 2.4503173828125, 2.5634765625, 2.6766357421875, 2.789794921875, 2.9029541015625, 3.01611328125, 3.1292724609375, 3.242431640625, 3.3555908203125, 3.46875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 5.0, 7.0, 18.0, 20.0, 22.0, 18.0, 45.0, 46.0, 54.0, 62.0, 87.0, 156.0, 184.0, 292.0, 449.0, 900.0, 3007.0, 20259.0, 154733.0, 692278.0, 150685.0, 19966.0, 2872.0, 871.0, 501.0, 264.0, 186.0, 125.0, 93.0, 65.0, 54.0, 53.0, 23.0, 31.0, 24.0, 13.0, 16.0, 11.0, 5.0, 13.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.3203125, -8.0718994140625, -7.823486328125, -7.5750732421875, -7.32666015625, -7.0782470703125, -6.829833984375, -6.5814208984375, -6.3330078125, -6.0845947265625, -5.836181640625, -5.5877685546875, -5.33935546875, -5.0909423828125, -4.842529296875, -4.5941162109375, -4.345703125, -4.0972900390625, -3.848876953125, -3.6004638671875, -3.35205078125, -3.1036376953125, -2.855224609375, -2.6068115234375, -2.3583984375, -2.1099853515625, -1.861572265625, -1.6131591796875, -1.36474609375, -1.1163330078125, -0.867919921875, -0.6195068359375, -0.37109375, -0.1226806640625, 0.125732421875, 0.3741455078125, 0.62255859375, 0.8709716796875, 1.119384765625, 1.3677978515625, 1.6162109375, 1.8646240234375, 2.113037109375, 2.3614501953125, 2.60986328125, 2.8582763671875, 3.106689453125, 3.3551025390625, 3.603515625, 3.8519287109375, 4.100341796875, 4.3487548828125, 4.59716796875, 4.8455810546875, 5.093994140625, 5.3424072265625, 5.5908203125, 5.8392333984375, 6.087646484375, 6.3360595703125, 6.58447265625, 6.8328857421875, 7.081298828125, 7.3297119140625, 7.578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 9.0, 5.0, 13.0, 6.0, 9.0, 8.0, 9.0, 14.0, 18.0, 12.0, 36.0, 32.0, 32.0, 28.0, 45.0, 29.0, 39.0, 48.0, 86.0, 200.0, 1520.0, 252.0, 116.0, 61.0, 50.0, 45.0, 40.0, 38.0, 43.0, 33.0, 30.0, 26.0, 15.0, 16.0, 14.0, 20.0, 13.0, 3.0, 9.0, 6.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.8436279296875, -9.460693359375, -9.0777587890625, -8.69482421875, -8.3118896484375, -7.928955078125, -7.5460205078125, -7.1630859375, -6.7801513671875, -6.397216796875, -6.0142822265625, -5.63134765625, -5.2484130859375, -4.865478515625, -4.4825439453125, -4.099609375, -3.7166748046875, -3.333740234375, -2.9508056640625, -2.56787109375, -2.1849365234375, -1.802001953125, -1.4190673828125, -1.0361328125, -0.6531982421875, -0.270263671875, 0.1126708984375, 0.49560546875, 0.8785400390625, 1.261474609375, 1.6444091796875, 2.02734375, 2.4102783203125, 2.793212890625, 3.1761474609375, 3.55908203125, 3.9420166015625, 4.324951171875, 4.7078857421875, 5.0908203125, 5.4737548828125, 5.856689453125, 6.2396240234375, 6.62255859375, 7.0054931640625, 7.388427734375, 7.7713623046875, 8.154296875, 8.5372314453125, 8.920166015625, 9.3031005859375, 9.68603515625, 10.0689697265625, 10.451904296875, 10.8348388671875, 11.2177734375, 11.6007080078125, 11.983642578125, 12.3665771484375, 12.74951171875, 13.1324462890625, 13.515380859375, 13.8983154296875, 14.28125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 10.0, 11.0, 9.0, 17.0, 24.0, 34.0, 28.0, 32.0, 56.0, 52.0, 83.0, 102.0, 124.0, 187.0, 391.0, 914.0, 5363.0, 3092426.0, 43141.0, 1323.0, 525.0, 232.0, 147.0, 101.0, 65.0, 62.0, 50.0, 48.0, 22.0, 25.0, 19.0, 11.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.96533203125, -39.7119140625, -38.45849609375, -37.205078125, -35.95166015625, -34.6982421875, -33.44482421875, -32.19140625, -30.93798828125, -29.6845703125, -28.43115234375, -27.177734375, -25.92431640625, -24.6708984375, -23.41748046875, -22.1640625, -20.91064453125, -19.6572265625, -18.40380859375, -17.150390625, -15.89697265625, -14.6435546875, -13.39013671875, -12.13671875, -10.88330078125, -9.6298828125, -8.37646484375, -7.123046875, -5.86962890625, -4.6162109375, -3.36279296875, -2.109375, -0.85595703125, 0.3974609375, 1.65087890625, 2.904296875, 4.15771484375, 5.4111328125, 6.66455078125, 7.91796875, 9.17138671875, 10.4248046875, 11.67822265625, 12.931640625, 14.18505859375, 15.4384765625, 16.69189453125, 17.9453125, 19.19873046875, 20.4521484375, 21.70556640625, 22.958984375, 24.21240234375, 25.4658203125, 26.71923828125, 27.97265625, 29.22607421875, 30.4794921875, 31.73291015625, 32.986328125, 34.23974609375, 35.4931640625, 36.74658203125, 38.0]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [38.0, 489.0, 461.0, 28.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.029485702514648, -2.5264501571655273, -0.02341461181640625, 2.479620933532715, 4.982656478881836, 7.485692024230957, 9.988727569580078, 12.491762161254883, 14.99479866027832, 17.497833251953125, 20.000869750976562, 22.50390625, 25.006940841674805, 27.50997543334961, 30.013011932373047, 32.51604461669922, 35.019081115722656, 37.522117614746094, 40.02515411376953, 42.5281867980957, 45.03122329711914, 47.53425979614258, 50.03729248046875, 52.54032897949219, 55.043365478515625, 57.54640197753906, 60.0494384765625, 62.55247116088867, 65.05551147460938, 67.55854034423828, 70.06157684326172, 72.56461334228516, 75.06765747070312, 77.57069396972656, 80.07373046875, 82.57676696777344, 85.07980346679688, 87.58283233642578, 90.08586883544922, 92.58890533447266, 95.0919418334961, 97.59497833251953, 100.09801483154297, 102.6010513305664, 105.10408020019531, 107.60711669921875, 110.11015319824219, 112.61318969726562, 115.11622619628906, 117.6192626953125, 120.12229919433594, 122.62533569335938, 125.12837219238281, 127.63140106201172, 130.1344451904297, 132.63748168945312, 135.1405029296875, 137.64353942871094, 140.14657592773438, 142.6496124267578, 145.15264892578125, 147.6556854248047, 150.15872192382812, 152.6617431640625, 155.164794921875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 8.0, 7.0, 9.0, 18.0, 19.0, 22.0, 13.0, 23.0, 20.0, 36.0, 25.0, 35.0, 32.0, 32.0, 30.0, 46.0, 51.0, 38.0, 49.0, 46.0, 39.0, 39.0, 44.0, 41.0, 34.0, 34.0, 24.0, 20.0, 17.0, 12.0, 19.0, 15.0, 16.0, 8.0, 13.0, 9.0, 11.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.94292449951172, -32.890628814697266, -31.838335037231445, -30.786041259765625, -29.733745574951172, -28.68145179748535, -27.62915802001953, -26.576862335205078, -25.524568557739258, -24.472274780273438, -23.419979095458984, -22.367685317993164, -21.315391540527344, -20.26309585571289, -19.21080207824707, -18.15850830078125, -17.106212615966797, -16.053918838500977, -15.001623153686523, -13.949329376220703, -12.897034645080566, -11.84473991394043, -10.79244613647461, -9.740151405334473, -8.687856674194336, -7.635561943054199, -6.583267688751221, -5.530973434448242, -4.4786787033081055, -3.4263839721679688, -2.3740897178649902, -1.3217954635620117, -0.2695045471191406, 0.782789945602417, 1.8350844383239746, 2.8873789310455322, 3.93967342376709, 4.991968154907227, 6.044262409210205, 7.096556663513184, 8.14885139465332, 9.201146125793457, 10.253440856933594, 11.305734634399414, 12.35802936553955, 13.410324096679688, 14.462617874145508, 15.514912605285645, 16.56720733642578, 17.6195011138916, 18.671796798706055, 19.724090576171875, 20.776386260986328, 21.82868003845215, 22.88097381591797, 23.933269500732422, 24.985563278198242, 26.037857055664062, 27.090152740478516, 28.142446517944336, 29.194740295410156, 30.24703598022461, 31.29932975769043, 32.35162353515625, 33.4039192199707]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 6.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 11.0, 7.0, 13.0, 15.0, 17.0, 23.0, 19.0, 26.0, 23.0, 15.0, 29.0, 34.0, 29.0, 39.0, 33.0, 33.0, 32.0, 30.0, 41.0, 27.0, 43.0, 38.0, 34.0, 27.0, 34.0, 37.0, 33.0, 26.0, 20.0, 27.0, 20.0, 36.0, 17.0, 12.0, 14.0, 16.0, 10.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.0625, -3.9361572265625, -3.809814453125, -3.6834716796875, -3.55712890625, -3.4307861328125, -3.304443359375, -3.1781005859375, -3.0517578125, -2.9254150390625, -2.799072265625, -2.6727294921875, -2.54638671875, -2.4200439453125, -2.293701171875, -2.1673583984375, -2.041015625, -1.9146728515625, -1.788330078125, -1.6619873046875, -1.53564453125, -1.4093017578125, -1.282958984375, -1.1566162109375, -1.0302734375, -0.9039306640625, -0.777587890625, -0.6512451171875, -0.52490234375, -0.3985595703125, -0.272216796875, -0.1458740234375, -0.01953125, 0.1068115234375, 0.233154296875, 0.3594970703125, 0.48583984375, 0.6121826171875, 0.738525390625, 0.8648681640625, 0.9912109375, 1.1175537109375, 1.243896484375, 1.3702392578125, 1.49658203125, 1.6229248046875, 1.749267578125, 1.8756103515625, 2.001953125, 2.1282958984375, 2.254638671875, 2.3809814453125, 2.50732421875, 2.6336669921875, 2.760009765625, 2.8863525390625, 3.0126953125, 3.1390380859375, 3.265380859375, 3.3917236328125, 3.51806640625, 3.6444091796875, 3.770751953125, 3.8970947265625, 4.0234375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 6.0, 7.0, 11.0, 8.0, 10.0, 22.0, 24.0, 24.0, 42.0, 53.0, 72.0, 102.0, 155.0, 254.0, 443.0, 745.0, 2124.0, 7306.0, 36950.0, 213098.0, 896093.0, 1688518.0, 1022831.0, 263615.0, 47616.0, 9314.0, 2558.0, 963.0, 465.0, 253.0, 177.0, 117.0, 88.0, 49.0, 32.0, 32.0, 29.0, 20.0, 12.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0], "bins": [-6.16015625, -5.98193359375, -5.8037109375, -5.62548828125, -5.447265625, -5.26904296875, -5.0908203125, -4.91259765625, -4.734375, -4.55615234375, -4.3779296875, -4.19970703125, -4.021484375, -3.84326171875, -3.6650390625, -3.48681640625, -3.30859375, -3.13037109375, -2.9521484375, -2.77392578125, -2.595703125, -2.41748046875, -2.2392578125, -2.06103515625, -1.8828125, -1.70458984375, -1.5263671875, -1.34814453125, -1.169921875, -0.99169921875, -0.8134765625, -0.63525390625, -0.45703125, -0.27880859375, -0.1005859375, 0.07763671875, 0.255859375, 0.43408203125, 0.6123046875, 0.79052734375, 0.96875, 1.14697265625, 1.3251953125, 1.50341796875, 1.681640625, 1.85986328125, 2.0380859375, 2.21630859375, 2.39453125, 2.57275390625, 2.7509765625, 2.92919921875, 3.107421875, 3.28564453125, 3.4638671875, 3.64208984375, 3.8203125, 3.99853515625, 4.1767578125, 4.35498046875, 4.533203125, 4.71142578125, 4.8896484375, 5.06787109375, 5.24609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 20.0, 12.0, 14.0, 23.0, 39.0, 62.0, 74.0, 104.0, 128.0, 182.0, 209.0, 351.0, 443.0, 426.0, 446.0, 325.0, 315.0, 224.0, 144.0, 144.0, 85.0, 67.0, 69.0, 28.0, 39.0, 20.0, 13.0, 10.0, 12.0, 5.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.111572265625, -6.86376953125, -6.615966796875, -6.3681640625, -6.120361328125, -5.87255859375, -5.624755859375, -5.376953125, -5.129150390625, -4.88134765625, -4.633544921875, -4.3857421875, -4.137939453125, -3.89013671875, -3.642333984375, -3.39453125, -3.146728515625, -2.89892578125, -2.651123046875, -2.4033203125, -2.155517578125, -1.90771484375, -1.659912109375, -1.412109375, -1.164306640625, -0.91650390625, -0.668701171875, -0.4208984375, -0.173095703125, 0.07470703125, 0.322509765625, 0.5703125, 0.818115234375, 1.06591796875, 1.313720703125, 1.5615234375, 1.809326171875, 2.05712890625, 2.304931640625, 2.552734375, 2.800537109375, 3.04833984375, 3.296142578125, 3.5439453125, 3.791748046875, 4.03955078125, 4.287353515625, 4.53515625, 4.782958984375, 5.03076171875, 5.278564453125, 5.5263671875, 5.774169921875, 6.02197265625, 6.269775390625, 6.517578125, 6.765380859375, 7.01318359375, 7.260986328125, 7.5087890625, 7.756591796875, 8.00439453125, 8.252197265625, 8.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 9.0, 11.0, 15.0, 21.0, 27.0, 47.0, 60.0, 89.0, 129.0, 163.0, 193.0, 281.0, 388.0, 668.0, 1518.0, 7074.0, 1264850.0, 2902863.0, 11882.0, 1730.0, 711.0, 472.0, 304.0, 204.0, 161.0, 107.0, 77.0, 59.0, 50.0, 26.0, 21.0, 16.0, 6.0, 10.0, 8.0, 5.0, 0.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.625, -27.78515625, -26.9453125, -26.10546875, -25.265625, -24.42578125, -23.5859375, -22.74609375, -21.90625, -21.06640625, -20.2265625, -19.38671875, -18.546875, -17.70703125, -16.8671875, -16.02734375, -15.1875, -14.34765625, -13.5078125, -12.66796875, -11.828125, -10.98828125, -10.1484375, -9.30859375, -8.46875, -7.62890625, -6.7890625, -5.94921875, -5.109375, -4.26953125, -3.4296875, -2.58984375, -1.75, -0.91015625, -0.0703125, 0.76953125, 1.609375, 2.44921875, 3.2890625, 4.12890625, 4.96875, 5.80859375, 6.6484375, 7.48828125, 8.328125, 9.16796875, 10.0078125, 10.84765625, 11.6875, 12.52734375, 13.3671875, 14.20703125, 15.046875, 15.88671875, 16.7265625, 17.56640625, 18.40625, 19.24609375, 20.0859375, 20.92578125, 21.765625, 22.60546875, 23.4453125, 24.28515625, 25.125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 56.0, 759.0, 194.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.14484405517578, -55.700927734375, -49.25700759887695, -42.813087463378906, -36.369171142578125, -29.925254821777344, -23.481334686279297, -17.03741455078125, -10.593498229980469, -4.149580001831055, 2.2943382263183594, 8.738256454467773, 15.182174682617188, 21.62609100341797, 28.070011138916016, 34.51393127441406, 40.957847595214844, 47.401763916015625, 53.84568405151367, 60.28960418701172, 66.7335205078125, 73.17743682861328, 79.62135314941406, 86.06527709960938, 92.50919342041016, 98.95310974121094, 105.39703369140625, 111.84095001220703, 118.28486633300781, 124.7287826538086, 131.17269897460938, 137.6166229248047, 144.060546875, 150.5044708251953, 156.94837951660156, 163.39230346679688, 169.83621215820312, 176.28013610839844, 182.72406005859375, 189.16796875, 195.6118927001953, 202.05581665039062, 208.49972534179688, 214.9436492919922, 221.3875732421875, 227.83148193359375, 234.27540588378906, 240.71932983398438, 247.16323852539062, 253.60716247558594, 260.05108642578125, 266.4949951171875, 272.93890380859375, 279.3828125, 285.8267517089844, 292.2706604003906, 298.714599609375, 305.15850830078125, 311.6024475097656, 318.0463562011719, 324.4902648925781, 330.9342041015625, 337.37811279296875, 343.822021484375, 350.26593017578125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 8.0, 7.0, 12.0, 17.0, 26.0, 21.0, 17.0, 24.0, 20.0, 28.0, 31.0, 32.0, 36.0, 36.0, 39.0, 43.0, 52.0, 36.0, 34.0, 34.0, 42.0, 45.0, 45.0, 33.0, 30.0, 24.0, 27.0, 31.0, 15.0, 26.0, 24.0, 18.0, 16.0, 20.0, 7.0, 10.0, 7.0, 11.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.00054931640625, -26.189193725585938, -25.377838134765625, -24.566482543945312, -23.755126953125, -22.943771362304688, -22.132417678833008, -21.321062088012695, -20.509706497192383, -19.69835090637207, -18.886995315551758, -18.075639724731445, -17.264286041259766, -16.452930450439453, -15.64157485961914, -14.830219268798828, -14.018863677978516, -13.207508087158203, -12.39615249633789, -11.584797859191895, -10.773442268371582, -9.96208667755127, -9.150732040405273, -8.339376449584961, -7.528020858764648, -6.716665267944336, -5.905310153961182, -5.093955039978027, -4.282599449157715, -3.4712438583374023, -2.659888744354248, -1.8485336303710938, -1.0371780395507812, -0.22582268714904785, 0.5855326652526855, 1.396888017654419, 2.2082433700561523, 3.019598960876465, 3.830954074859619, 4.642309188842773, 5.453664779663086, 6.265020370483398, 7.076375484466553, 7.887730598449707, 8.69908618927002, 9.510441780090332, 10.321796417236328, 11.13315200805664, 11.944507598876953, 12.755863189697266, 13.567218780517578, 14.378573417663574, 15.189929008483887, 16.001285552978516, 16.812639236450195, 17.623994827270508, 18.43535041809082, 19.246706008911133, 20.058061599731445, 20.869417190551758, 21.680770874023438, 22.49212646484375, 23.303482055664062, 24.114837646484375, 24.926193237304688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 12.0, 13.0, 16.0, 28.0, 22.0, 27.0, 31.0, 36.0, 38.0, 29.0, 33.0, 43.0, 39.0, 43.0, 43.0, 48.0, 42.0, 41.0, 44.0, 34.0, 40.0, 26.0, 35.0, 36.0, 23.0, 22.0, 23.0, 14.0, 17.0, 19.0, 11.0, 6.0, 7.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.23126220703125, -4.0992431640625, -3.96722412109375, -3.835205078125, -3.70318603515625, -3.5711669921875, -3.43914794921875, -3.30712890625, -3.17510986328125, -3.0430908203125, -2.91107177734375, -2.779052734375, -2.64703369140625, -2.5150146484375, -2.38299560546875, -2.2509765625, -2.11895751953125, -1.9869384765625, -1.85491943359375, -1.722900390625, -1.59088134765625, -1.4588623046875, -1.32684326171875, -1.19482421875, -1.06280517578125, -0.9307861328125, -0.79876708984375, -0.666748046875, -0.53472900390625, -0.4027099609375, -0.27069091796875, -0.138671875, -0.00665283203125, 0.1253662109375, 0.25738525390625, 0.389404296875, 0.52142333984375, 0.6534423828125, 0.78546142578125, 0.91748046875, 1.04949951171875, 1.1815185546875, 1.31353759765625, 1.445556640625, 1.57757568359375, 1.7095947265625, 1.84161376953125, 1.9736328125, 2.10565185546875, 2.2376708984375, 2.36968994140625, 2.501708984375, 2.63372802734375, 2.7657470703125, 2.89776611328125, 3.02978515625, 3.16180419921875, 3.2938232421875, 3.42584228515625, 3.557861328125, 3.68988037109375, 3.8218994140625, 3.95391845703125, 4.0859375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 12.0, 12.0, 26.0, 47.0, 55.0, 99.0, 136.0, 177.0, 248.0, 399.0, 606.0, 890.0, 1254.0, 1811.0, 2903.0, 4249.0, 6536.0, 10035.0, 15318.0, 24244.0, 39754.0, 67255.0, 127335.0, 266843.0, 218477.0, 105644.0, 58215.0, 34381.0, 21679.0, 13657.0, 8706.0, 5826.0, 3851.0, 2616.0, 1762.0, 1104.0, 735.0, 514.0, 372.0, 235.0, 170.0, 110.0, 77.0, 64.0, 30.0, 23.0, 22.0, 12.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6630859375, -0.6416015625, -0.6201171875, -0.5986328125, -0.5771484375, -0.5556640625, -0.5341796875, -0.5126953125, -0.4912109375, -0.4697265625, -0.4482421875, -0.4267578125, -0.4052734375, -0.3837890625, -0.3623046875, -0.3408203125, -0.3193359375, -0.2978515625, -0.2763671875, -0.2548828125, -0.2333984375, -0.2119140625, -0.1904296875, -0.1689453125, -0.1474609375, -0.1259765625, -0.1044921875, -0.0830078125, -0.0615234375, -0.0400390625, -0.0185546875, 0.0029296875, 0.0244140625, 0.0458984375, 0.0673828125, 0.0888671875, 0.1103515625, 0.1318359375, 0.1533203125, 0.1748046875, 0.1962890625, 0.2177734375, 0.2392578125, 0.2607421875, 0.2822265625, 0.3037109375, 0.3251953125, 0.3466796875, 0.3681640625, 0.3896484375, 0.4111328125, 0.4326171875, 0.4541015625, 0.4755859375, 0.4970703125, 0.5185546875, 0.5400390625, 0.5615234375, 0.5830078125, 0.6044921875, 0.6259765625, 0.6474609375, 0.6689453125, 0.6904296875, 0.7119140625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 12.0, 10.0, 12.0, 11.0, 10.0, 10.0, 11.0, 22.0, 26.0, 24.0, 24.0, 29.0, 29.0, 38.0, 28.0, 38.0, 30.0, 35.0, 36.0, 44.0, 1062.0, 34.0, 38.0, 36.0, 29.0, 29.0, 35.0, 32.0, 31.0, 27.0, 24.0, 18.0, 18.0, 24.0, 13.0, 17.0, 12.0, 7.0, 8.0, 8.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.181640625, -2.107940673828125, -2.03424072265625, -1.960540771484375, -1.8868408203125, -1.813140869140625, -1.73944091796875, -1.665740966796875, -1.592041015625, -1.518341064453125, -1.44464111328125, -1.370941162109375, -1.2972412109375, -1.223541259765625, -1.14984130859375, -1.076141357421875, -1.00244140625, -0.928741455078125, -0.85504150390625, -0.781341552734375, -0.7076416015625, -0.633941650390625, -0.56024169921875, -0.486541748046875, -0.412841796875, -0.339141845703125, -0.26544189453125, -0.191741943359375, -0.1180419921875, -0.044342041015625, 0.02935791015625, 0.103057861328125, 0.1767578125, 0.250457763671875, 0.32415771484375, 0.397857666015625, 0.4715576171875, 0.545257568359375, 0.61895751953125, 0.692657470703125, 0.766357421875, 0.840057373046875, 0.91375732421875, 0.987457275390625, 1.0611572265625, 1.134857177734375, 1.20855712890625, 1.282257080078125, 1.35595703125, 1.429656982421875, 1.50335693359375, 1.577056884765625, 1.6507568359375, 1.724456787109375, 1.79815673828125, 1.871856689453125, 1.945556640625, 2.019256591796875, 2.09295654296875, 2.166656494140625, 2.2403564453125, 2.314056396484375, 2.38775634765625, 2.461456298828125, 2.53515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 6.0, 14.0, 20.0, 26.0, 41.0, 70.0, 87.0, 108.0, 172.0, 242.0, 351.0, 448.0, 652.0, 857.0, 1235.0, 1754.0, 2458.0, 3445.0, 4893.0, 6828.0, 9757.0, 14197.0, 20310.0, 30465.0, 46073.0, 72057.0, 126517.0, 1296555.0, 184485.0, 94911.0, 57443.0, 37951.0, 25332.0, 17099.0, 11805.0, 8160.0, 5905.0, 4155.0, 2987.0, 2072.0, 1581.0, 1107.0, 841.0, 530.0, 353.0, 266.0, 157.0, 111.0, 94.0, 65.0, 35.0, 19.0, 16.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5537109375, -0.5362777709960938, -0.5188446044921875, -0.5014114379882812, -0.483978271484375, -0.46654510498046875, -0.4491119384765625, -0.43167877197265625, -0.41424560546875, -0.39681243896484375, -0.3793792724609375, -0.36194610595703125, -0.344512939453125, -0.32707977294921875, -0.3096466064453125, -0.29221343994140625, -0.2747802734375, -0.25734710693359375, -0.2399139404296875, -0.22248077392578125, -0.205047607421875, -0.18761444091796875, -0.1701812744140625, -0.15274810791015625, -0.13531494140625, -0.11788177490234375, -0.1004486083984375, -0.08301544189453125, -0.065582275390625, -0.04814910888671875, -0.0307159423828125, -0.01328277587890625, 0.004150390625, 0.02158355712890625, 0.0390167236328125, 0.05644989013671875, 0.073883056640625, 0.09131622314453125, 0.1087493896484375, 0.12618255615234375, 0.14361572265625, 0.16104888916015625, 0.1784820556640625, 0.19591522216796875, 0.213348388671875, 0.23078155517578125, 0.2482147216796875, 0.26564788818359375, 0.2830810546875, 0.30051422119140625, 0.3179473876953125, 0.33538055419921875, 0.352813720703125, 0.37024688720703125, 0.3876800537109375, 0.40511322021484375, 0.42254638671875, 0.43997955322265625, 0.4574127197265625, 0.47484588623046875, 0.492279052734375, 0.5097122192382812, 0.5271453857421875, 0.5445785522460938, 0.56201171875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 7.0, 5.0, 10.0, 10.0, 15.0, 19.0, 29.0, 22.0, 23.0, 26.0, 21.0, 35.0, 45.0, 40.0, 53.0, 58.0, 57.0, 54.0, 42.0, 46.0, 44.0, 40.0, 39.0, 50.0, 32.0, 29.0, 20.0, 24.0, 19.0, 12.0, 9.0, 7.0, 11.0, 8.0, 10.0, 2.0, 1.0, 1.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011557340621948242, -0.00011192634701728821, -0.000108279287815094, -0.00010463222861289978, -0.00010098516941070557, -9.733811020851135e-05, -9.369105100631714e-05, -9.004399180412292e-05, -8.639693260192871e-05, -8.27498733997345e-05, -7.910281419754028e-05, -7.545575499534607e-05, -7.180869579315186e-05, -6.816163659095764e-05, -6.451457738876343e-05, -6.0867518186569214e-05, -5.7220458984375e-05, -5.3573399782180786e-05, -4.992634057998657e-05, -4.627928137779236e-05, -4.2632222175598145e-05, -3.898516297340393e-05, -3.533810377120972e-05, -3.16910445690155e-05, -2.804398536682129e-05, -2.4396926164627075e-05, -2.074986696243286e-05, -1.7102807760238647e-05, -1.3455748558044434e-05, -9.80868935585022e-06, -6.161630153656006e-06, -2.514570951461792e-06, 1.1324882507324219e-06, 4.779547452926636e-06, 8.42660665512085e-06, 1.2073665857315063e-05, 1.5720725059509277e-05, 1.936778426170349e-05, 2.3014843463897705e-05, 2.666190266609192e-05, 3.0308961868286133e-05, 3.395602107048035e-05, 3.760308027267456e-05, 4.1250139474868774e-05, 4.489719867706299e-05, 4.85442578792572e-05, 5.2191317081451416e-05, 5.583837628364563e-05, 5.9485435485839844e-05, 6.313249468803406e-05, 6.677955389022827e-05, 7.042661309242249e-05, 7.40736722946167e-05, 7.772073149681091e-05, 8.136779069900513e-05, 8.501484990119934e-05, 8.866190910339355e-05, 9.230896830558777e-05, 9.595602750778198e-05, 9.96030867099762e-05, 0.00010325014591217041, 0.00010689720511436462, 0.00011054426431655884, 0.00011419132351875305, 0.00011783838272094727]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 4.0, 11.0, 8.0, 13.0, 11.0, 19.0, 23.0, 42.0, 22.0, 45.0, 47.0, 73.0, 122.0, 151.0, 247.0, 462.0, 1118.0, 73407.0, 968189.0, 2732.0, 716.0, 320.0, 191.0, 130.0, 110.0, 52.0, 57.0, 29.0, 38.0, 32.0, 32.0, 22.0, 13.0, 17.0, 6.0, 9.0, 3.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024871826171875, -0.002407550811767578, -0.0023279190063476562, -0.0022482872009277344, -0.0021686553955078125, -0.0020890235900878906, -0.0020093917846679688, -0.0019297599792480469, -0.001850128173828125, -0.0017704963684082031, -0.0016908645629882812, -0.0016112327575683594, -0.0015316009521484375, -0.0014519691467285156, -0.0013723373413085938, -0.0012927055358886719, -0.00121307373046875, -0.0011334419250488281, -0.0010538101196289062, -0.0009741783142089844, -0.0008945465087890625, -0.0008149147033691406, -0.0007352828979492188, -0.0006556510925292969, -0.000576019287109375, -0.0004963874816894531, -0.00041675567626953125, -0.0003371238708496094, -0.0002574920654296875, -0.00017786026000976562, -9.822845458984375e-05, -1.8596649169921875e-05, 6.103515625e-05, 0.00014066696166992188, 0.00022029876708984375, 0.0002999305725097656, 0.0003795623779296875, 0.0004591941833496094, 0.0005388259887695312, 0.0006184577941894531, 0.000698089599609375, 0.0007777214050292969, 0.0008573532104492188, 0.0009369850158691406, 0.0010166168212890625, 0.0010962486267089844, 0.0011758804321289062, 0.0012555122375488281, 0.00133514404296875, 0.0014147758483886719, 0.0014944076538085938, 0.0015740394592285156, 0.0016536712646484375, 0.0017333030700683594, 0.0018129348754882812, 0.0018925666809082031, 0.001972198486328125, 0.002051830291748047, 0.0021314620971679688, 0.0022110939025878906, 0.0022907257080078125, 0.0023703575134277344, 0.0024499893188476562, 0.002529621124267578, 0.0026092529296875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 102.0, 530.0, 331.0, 44.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026377395261079073, -0.0002510901540517807, -0.00023840635549277067, -0.00022572255693376064, -0.00021303874382283539, -0.00020035494526382536, -0.00018767114670481533, -0.00017498733359389007, -0.00016230353503488004, -0.00014961973647587, -0.00013693593791685998, -0.00012425213935784996, -0.0001115683262469247, -9.888452768791467e-05, -8.620072912890464e-05, -7.3516923293937e-05, -6.083313201088458e-05, -4.814932981389575e-05, -3.546552761690691e-05, -2.2781729057896882e-05, -1.0097926860908046e-05, 2.5858753360807896e-06, 1.526967389509082e-05, 2.795347973005846e-05, 4.063727828906849e-05, 5.3321080486057326e-05, 6.600488268304616e-05, 7.868868124205619e-05, 9.137247980106622e-05, 0.00010405628563603386, 0.00011674008419504389, 0.00012942389003001153, 0.00014210768858902156, 0.0001547914871480316, 0.00016747528570704162, 0.00018015908426605165, 0.0001928428973769769, 0.00020552669593598694, 0.00021821049449499696, 0.00023089430760592222, 0.00024357810616493225, 0.0002562619047239423, 0.0002689457032829523, 0.00028162950184196234, 0.00029431330040097237, 0.0003069970989599824, 0.0003196808975189924, 0.0003323647251818329, 0.0003450484946370125, 0.0003577322931960225, 0.00037041609175503254, 0.00038309989031404257, 0.0003957836888730526, 0.0004084674874320626, 0.00042115128599107265, 0.00043383511365391314, 0.00044651891221292317, 0.0004592027107719332, 0.0004718865093309432, 0.00048457030788995326, 0.0004972541355527937, 0.0005099379341118038, 0.0005226217326708138, 0.0005353055312298238, 0.0005479893297888339]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 9.0, 23.0, 23.0, 23.0, 30.0, 24.0, 26.0, 35.0, 32.0, 31.0, 35.0, 32.0, 40.0, 57.0, 50.0, 38.0, 39.0, 31.0, 42.0, 34.0, 36.0, 46.0, 32.0, 27.0, 27.0, 22.0, 31.0, 17.0, 14.0, 13.0, 10.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.580352783203125e-05, -6.354041397571564e-05, -6.127730011940002e-05, -5.901418626308441e-05, -5.67510724067688e-05, -5.4487958550453186e-05, -5.222484469413757e-05, -4.996173083782196e-05, -4.769861698150635e-05, -4.5435503125190735e-05, -4.317238926887512e-05, -4.090927541255951e-05, -3.8646161556243896e-05, -3.6383047699928284e-05, -3.411993384361267e-05, -3.185681998729706e-05, -2.9593706130981445e-05, -2.7330592274665833e-05, -2.506747841835022e-05, -2.2804364562034607e-05, -2.0541250705718994e-05, -1.827813684940338e-05, -1.601502299308777e-05, -1.3751909136772156e-05, -1.1488795280456543e-05, -9.22568142414093e-06, -6.962567567825317e-06, -4.699453711509705e-06, -2.436339855194092e-06, -1.73225998878479e-07, 2.089887857437134e-06, 4.353001713752747e-06, 6.616115570068359e-06, 8.879229426383972e-06, 1.1142343282699585e-05, 1.3405457139015198e-05, 1.566857099533081e-05, 1.7931684851646423e-05, 2.0194798707962036e-05, 2.245791256427765e-05, 2.4721026420593262e-05, 2.6984140276908875e-05, 2.9247254133224487e-05, 3.15103679895401e-05, 3.377348184585571e-05, 3.6036595702171326e-05, 3.829970955848694e-05, 4.056282341480255e-05, 4.2825937271118164e-05, 4.508905112743378e-05, 4.735216498374939e-05, 4.9615278840065e-05, 5.1878392696380615e-05, 5.414150655269623e-05, 5.640462040901184e-05, 5.8667734265327454e-05, 6.0930848121643066e-05, 6.319396197795868e-05, 6.545707583427429e-05, 6.77201896905899e-05, 6.998330354690552e-05, 7.224641740322113e-05, 7.450953125953674e-05, 7.677264511585236e-05, 7.903575897216797e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 12.0, 13.0, 16.0, 28.0, 22.0, 27.0, 31.0, 36.0, 38.0, 29.0, 33.0, 43.0, 39.0, 43.0, 43.0, 48.0, 42.0, 41.0, 44.0, 34.0, 40.0, 26.0, 35.0, 36.0, 23.0, 22.0, 23.0, 14.0, 17.0, 19.0, 11.0, 6.0, 7.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.23126220703125, -4.0992431640625, -3.96722412109375, -3.835205078125, -3.70318603515625, -3.5711669921875, -3.43914794921875, -3.30712890625, -3.17510986328125, -3.0430908203125, -2.91107177734375, -2.779052734375, -2.64703369140625, -2.5150146484375, -2.38299560546875, -2.2509765625, -2.11895751953125, -1.9869384765625, -1.85491943359375, -1.722900390625, -1.59088134765625, -1.4588623046875, -1.32684326171875, -1.19482421875, -1.06280517578125, -0.9307861328125, -0.79876708984375, -0.666748046875, -0.53472900390625, -0.4027099609375, -0.27069091796875, -0.138671875, -0.00665283203125, 0.1253662109375, 0.25738525390625, 0.389404296875, 0.52142333984375, 0.6534423828125, 0.78546142578125, 0.91748046875, 1.04949951171875, 1.1815185546875, 1.31353759765625, 1.445556640625, 1.57757568359375, 1.7095947265625, 1.84161376953125, 1.9736328125, 2.10565185546875, 2.2376708984375, 2.36968994140625, 2.501708984375, 2.63372802734375, 2.7657470703125, 2.89776611328125, 3.02978515625, 3.16180419921875, 3.2938232421875, 3.42584228515625, 3.557861328125, 3.68988037109375, 3.8218994140625, 3.95391845703125, 4.0859375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 7.0, 14.0, 11.0, 12.0, 25.0, 37.0, 47.0, 68.0, 112.0, 226.0, 531.0, 1334.0, 3906.0, 10967.0, 30497.0, 86200.0, 253510.0, 393450.0, 174426.0, 59552.0, 21470.0, 7690.0, 2683.0, 951.0, 356.0, 166.0, 97.0, 52.0, 25.0, 26.0, 22.0, 15.0, 14.0, 11.0, 6.0, 9.0, 2.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.22265625, -5.07049560546875, -4.9183349609375, -4.76617431640625, -4.614013671875, -4.46185302734375, -4.3096923828125, -4.15753173828125, -4.00537109375, -3.85321044921875, -3.7010498046875, -3.54888916015625, -3.396728515625, -3.24456787109375, -3.0924072265625, -2.94024658203125, -2.7880859375, -2.63592529296875, -2.4837646484375, -2.33160400390625, -2.179443359375, -2.02728271484375, -1.8751220703125, -1.72296142578125, -1.57080078125, -1.41864013671875, -1.2664794921875, -1.11431884765625, -0.962158203125, -0.80999755859375, -0.6578369140625, -0.50567626953125, -0.353515625, -0.20135498046875, -0.0491943359375, 0.10296630859375, 0.255126953125, 0.40728759765625, 0.5594482421875, 0.71160888671875, 0.86376953125, 1.01593017578125, 1.1680908203125, 1.32025146484375, 1.472412109375, 1.62457275390625, 1.7767333984375, 1.92889404296875, 2.0810546875, 2.23321533203125, 2.3853759765625, 2.53753662109375, 2.689697265625, 2.84185791015625, 2.9940185546875, 3.14617919921875, 3.29833984375, 3.45050048828125, 3.6026611328125, 3.75482177734375, 3.906982421875, 4.05914306640625, 4.2113037109375, 4.36346435546875, 4.515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 10.0, 15.0, 26.0, 22.0, 23.0, 25.0, 23.0, 43.0, 40.0, 50.0, 43.0, 71.0, 141.0, 244.0, 1458.0, 245.0, 108.0, 64.0, 57.0, 30.0, 43.0, 27.0, 36.0, 36.0, 37.0, 19.0, 18.0, 12.0, 16.0, 9.0, 8.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 5.0], "bins": [-17.34375, -16.9039306640625, -16.464111328125, -16.0242919921875, -15.58447265625, -15.1446533203125, -14.704833984375, -14.2650146484375, -13.8251953125, -13.3853759765625, -12.945556640625, -12.5057373046875, -12.06591796875, -11.6260986328125, -11.186279296875, -10.7464599609375, -10.306640625, -9.8668212890625, -9.427001953125, -8.9871826171875, -8.54736328125, -8.1075439453125, -7.667724609375, -7.2279052734375, -6.7880859375, -6.3482666015625, -5.908447265625, -5.4686279296875, -5.02880859375, -4.5889892578125, -4.149169921875, -3.7093505859375, -3.26953125, -2.8297119140625, -2.389892578125, -1.9500732421875, -1.51025390625, -1.0704345703125, -0.630615234375, -0.1907958984375, 0.2490234375, 0.6888427734375, 1.128662109375, 1.5684814453125, 2.00830078125, 2.4481201171875, 2.887939453125, 3.3277587890625, 3.767578125, 4.2073974609375, 4.647216796875, 5.0870361328125, 5.52685546875, 5.9666748046875, 6.406494140625, 6.8463134765625, 7.2861328125, 7.7259521484375, 8.165771484375, 8.6055908203125, 9.04541015625, 9.4852294921875, 9.925048828125, 10.3648681640625, 10.8046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 5.0, 9.0, 16.0, 15.0, 17.0, 25.0, 24.0, 45.0, 59.0, 84.0, 107.0, 163.0, 224.0, 371.0, 683.0, 1848.0, 46398.0, 3058544.0, 33674.0, 1589.0, 678.0, 353.0, 228.0, 135.0, 114.0, 70.0, 57.0, 35.0, 29.0, 19.0, 15.0, 11.0, 15.0, 5.0, 10.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0], "bins": [-32.75, -31.82666015625, -30.9033203125, -29.97998046875, -29.056640625, -28.13330078125, -27.2099609375, -26.28662109375, -25.36328125, -24.43994140625, -23.5166015625, -22.59326171875, -21.669921875, -20.74658203125, -19.8232421875, -18.89990234375, -17.9765625, -17.05322265625, -16.1298828125, -15.20654296875, -14.283203125, -13.35986328125, -12.4365234375, -11.51318359375, -10.58984375, -9.66650390625, -8.7431640625, -7.81982421875, -6.896484375, -5.97314453125, -5.0498046875, -4.12646484375, -3.203125, -2.27978515625, -1.3564453125, -0.43310546875, 0.490234375, 1.41357421875, 2.3369140625, 3.26025390625, 4.18359375, 5.10693359375, 6.0302734375, 6.95361328125, 7.876953125, 8.80029296875, 9.7236328125, 10.64697265625, 11.5703125, 12.49365234375, 13.4169921875, 14.34033203125, 15.263671875, 16.18701171875, 17.1103515625, 18.03369140625, 18.95703125, 19.88037109375, 20.8037109375, 21.72705078125, 22.650390625, 23.57373046875, 24.4970703125, 25.42041015625, 26.34375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 94.0, 547.0, 347.0, 22.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.10516357421875, -51.50600814819336, -48.9068489074707, -46.30769348144531, -43.708534240722656, -41.109378814697266, -38.510223388671875, -35.91106414794922, -33.31190872192383, -30.712751388549805, -28.11359405517578, -25.51443862915039, -22.915281295776367, -20.316123962402344, -17.716968536376953, -15.11781120300293, -12.518653869628906, -9.919496536254883, -7.320340156555176, -4.7211833000183105, -2.1220264434814453, 0.4771308898925781, 3.076287269592285, 5.675443649291992, 8.274600982666016, 10.873758316040039, 13.472914695739746, 16.072071075439453, 18.671228408813477, 21.2703857421875, 23.86954116821289, 26.468698501586914, 29.067855834960938, 31.66701316833496, 34.266170501708984, 36.865325927734375, 39.46448516845703, 42.06364059448242, 44.66279602050781, 47.26195526123047, 49.86111068725586, 52.46026611328125, 55.059425354003906, 57.6585807800293, 60.25773620605469, 62.856895446777344, 65.4560546875, 68.05520629882812, 70.65436553955078, 73.25352478027344, 75.85267639160156, 78.45183563232422, 81.05099487304688, 83.650146484375, 86.24930572509766, 88.84846496582031, 91.44761657714844, 94.0467758178711, 96.64592742919922, 99.24508666992188, 101.84424591064453, 104.44340515136719, 107.04255676269531, 109.64171600341797, 112.24087524414062]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 18.0, 7.0, 5.0, 12.0, 15.0, 23.0, 15.0, 18.0, 27.0, 36.0, 31.0, 44.0, 37.0, 37.0, 31.0, 37.0, 42.0, 37.0, 40.0, 39.0, 34.0, 48.0, 22.0, 40.0, 23.0, 23.0, 28.0, 17.0, 26.0, 21.0, 22.0, 16.0, 14.0, 13.0, 11.0, 5.0, 8.0, 8.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-29.64960479736328, -28.7479305267334, -27.84625816345215, -26.944583892822266, -26.042911529541016, -25.141237258911133, -24.23956298828125, -23.337890625, -22.43621826171875, -21.534543991088867, -20.632871627807617, -19.731197357177734, -18.829524993896484, -17.9278507232666, -17.02617645263672, -16.12450408935547, -15.222829818725586, -14.32115650177002, -13.419483184814453, -12.51780891418457, -11.61613655090332, -10.714462280273438, -9.812788963317871, -8.911115646362305, -8.009442329406738, -7.107769012451172, -6.2060956954956055, -5.304421901702881, -4.4027485847473145, -3.501075267791748, -2.5994014739990234, -1.697728157043457, -0.7960567474365234, 0.10561668872833252, 1.0072901248931885, 1.908963680267334, 2.8106369972229004, 3.712310314178467, 4.613984107971191, 5.515657424926758, 6.417330741882324, 7.319004058837891, 8.220677375793457, 9.122350692749023, 10.024024963378906, 10.925697326660156, 11.827371597290039, 12.729044914245605, 13.630718231201172, 14.532391548156738, 15.434064865112305, 16.335739135742188, 17.237411499023438, 18.13908576965332, 19.040760040283203, 19.942432403564453, 20.844104766845703, 21.745779037475586, 22.647451400756836, 23.54912567138672, 24.45079803466797, 25.35247230529785, 26.254146575927734, 27.155818939208984, 28.057493209838867]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 16.0, 13.0, 14.0, 21.0, 27.0, 25.0, 25.0, 24.0, 35.0, 25.0, 42.0, 40.0, 37.0, 35.0, 48.0, 47.0, 45.0, 43.0, 46.0, 48.0, 40.0, 31.0, 42.0, 31.0, 32.0, 28.0, 15.0, 14.0, 17.0, 10.0, 13.0, 5.0, 12.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.65625, -4.51470947265625, -4.3731689453125, -4.23162841796875, -4.090087890625, -3.94854736328125, -3.8070068359375, -3.66546630859375, -3.52392578125, -3.38238525390625, -3.2408447265625, -3.09930419921875, -2.957763671875, -2.81622314453125, -2.6746826171875, -2.53314208984375, -2.3916015625, -2.25006103515625, -2.1085205078125, -1.96697998046875, -1.825439453125, -1.68389892578125, -1.5423583984375, -1.40081787109375, -1.25927734375, -1.11773681640625, -0.9761962890625, -0.83465576171875, -0.693115234375, -0.55157470703125, -0.4100341796875, -0.26849365234375, -0.126953125, 0.01458740234375, 0.1561279296875, 0.29766845703125, 0.439208984375, 0.58074951171875, 0.7222900390625, 0.86383056640625, 1.00537109375, 1.14691162109375, 1.2884521484375, 1.42999267578125, 1.571533203125, 1.71307373046875, 1.8546142578125, 1.99615478515625, 2.1376953125, 2.27923583984375, 2.4207763671875, 2.56231689453125, 2.703857421875, 2.84539794921875, 2.9869384765625, 3.12847900390625, 3.27001953125, 3.41156005859375, 3.5531005859375, 3.69464111328125, 3.836181640625, 3.97772216796875, 4.1192626953125, 4.26080322265625, 4.40234375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 7.0, 15.0, 13.0, 25.0, 11.0, 26.0, 28.0, 35.0, 37.0, 50.0, 58.0, 64.0, 127.0, 225.0, 736.0, 7214.0, 514826.0, 3455447.0, 210064.0, 4025.0, 523.0, 201.0, 132.0, 65.0, 69.0, 48.0, 38.0, 30.0, 23.0, 16.0, 15.0, 12.0, 11.0, 5.0, 4.0, 13.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.6070556640625, -13.159423828125, -12.7117919921875, -12.26416015625, -11.8165283203125, -11.368896484375, -10.9212646484375, -10.4736328125, -10.0260009765625, -9.578369140625, -9.1307373046875, -8.68310546875, -8.2354736328125, -7.787841796875, -7.3402099609375, -6.892578125, -6.4449462890625, -5.997314453125, -5.5496826171875, -5.10205078125, -4.6544189453125, -4.206787109375, -3.7591552734375, -3.3115234375, -2.8638916015625, -2.416259765625, -1.9686279296875, -1.52099609375, -1.0733642578125, -0.625732421875, -0.1781005859375, 0.26953125, 0.7171630859375, 1.164794921875, 1.6124267578125, 2.06005859375, 2.5076904296875, 2.955322265625, 3.4029541015625, 3.8505859375, 4.2982177734375, 4.745849609375, 5.1934814453125, 5.64111328125, 6.0887451171875, 6.536376953125, 6.9840087890625, 7.431640625, 7.8792724609375, 8.326904296875, 8.7745361328125, 9.22216796875, 9.6697998046875, 10.117431640625, 10.5650634765625, 11.0126953125, 11.4603271484375, 11.907958984375, 12.3555908203125, 12.80322265625, 13.2508544921875, 13.698486328125, 14.1461181640625, 14.59375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 13.0, 23.0, 19.0, 36.0, 64.0, 74.0, 113.0, 166.0, 236.0, 354.0, 460.0, 503.0, 512.0, 418.0, 295.0, 236.0, 174.0, 96.0, 83.0, 49.0, 40.0, 25.0, 16.0, 16.0, 7.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0859375, -7.8328857421875, -7.579833984375, -7.3267822265625, -7.07373046875, -6.8206787109375, -6.567626953125, -6.3145751953125, -6.0615234375, -5.8084716796875, -5.555419921875, -5.3023681640625, -5.04931640625, -4.7962646484375, -4.543212890625, -4.2901611328125, -4.037109375, -3.7840576171875, -3.531005859375, -3.2779541015625, -3.02490234375, -2.7718505859375, -2.518798828125, -2.2657470703125, -2.0126953125, -1.7596435546875, -1.506591796875, -1.2535400390625, -1.00048828125, -0.7474365234375, -0.494384765625, -0.2413330078125, 0.01171875, 0.2647705078125, 0.517822265625, 0.7708740234375, 1.02392578125, 1.2769775390625, 1.530029296875, 1.7830810546875, 2.0361328125, 2.2891845703125, 2.542236328125, 2.7952880859375, 3.04833984375, 3.3013916015625, 3.554443359375, 3.8074951171875, 4.060546875, 4.3135986328125, 4.566650390625, 4.8197021484375, 5.07275390625, 5.3258056640625, 5.578857421875, 5.8319091796875, 6.0849609375, 6.3380126953125, 6.591064453125, 6.8441162109375, 7.09716796875, 7.3502197265625, 7.603271484375, 7.8563232421875, 8.109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 13.0, 8.0, 7.0, 18.0, 30.0, 37.0, 47.0, 30.0, 63.0, 130.0, 138.0, 166.0, 223.0, 359.0, 629.0, 1496.0, 30957.0, 3783034.0, 370671.0, 3899.0, 878.0, 415.0, 266.0, 171.0, 143.0, 114.0, 83.0, 70.0, 43.0, 40.0, 24.0, 19.0, 19.0, 9.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.03125, -25.210693359375, -24.39013671875, -23.569580078125, -22.7490234375, -21.928466796875, -21.10791015625, -20.287353515625, -19.466796875, -18.646240234375, -17.82568359375, -17.005126953125, -16.1845703125, -15.364013671875, -14.54345703125, -13.722900390625, -12.90234375, -12.081787109375, -11.26123046875, -10.440673828125, -9.6201171875, -8.799560546875, -7.97900390625, -7.158447265625, -6.337890625, -5.517333984375, -4.69677734375, -3.876220703125, -3.0556640625, -2.235107421875, -1.41455078125, -0.593994140625, 0.2265625, 1.047119140625, 1.86767578125, 2.688232421875, 3.5087890625, 4.329345703125, 5.14990234375, 5.970458984375, 6.791015625, 7.611572265625, 8.43212890625, 9.252685546875, 10.0732421875, 10.893798828125, 11.71435546875, 12.534912109375, 13.35546875, 14.176025390625, 14.99658203125, 15.817138671875, 16.6376953125, 17.458251953125, 18.27880859375, 19.099365234375, 19.919921875, 20.740478515625, 21.56103515625, 22.381591796875, 23.2021484375, 24.022705078125, 24.84326171875, 25.663818359375, 26.484375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 36.0, 342.0, 479.0, 141.0, 12.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.917238235473633, -18.39624786376953, -14.87525749206543, -11.354267120361328, -7.833276748657227, -4.312286376953125, -0.7912960052490234, 2.729694366455078, 6.25068473815918, 9.771675109863281, 13.292665481567383, 16.813655853271484, 20.334646224975586, 23.855636596679688, 27.37662696838379, 30.89761734008789, 34.418609619140625, 37.939598083496094, 41.46059036254883, 44.98158264160156, 48.50257110595703, 52.0235595703125, 55.544551849365234, 59.06554412841797, 62.58653259277344, 66.1075210571289, 69.62850952148438, 73.14950561523438, 76.67049407958984, 80.19148254394531, 83.71247863769531, 87.23346710205078, 90.75445556640625, 94.27544403076172, 97.79643249511719, 101.31742858886719, 104.83841705322266, 108.35940551757812, 111.88040161132812, 115.4013900756836, 118.92237854003906, 122.44336700439453, 125.96435546875, 129.4853515625, 133.00634765625, 136.52732849121094, 140.04832458496094, 143.56930541992188, 147.09030151367188, 150.61129760742188, 154.1322784423828, 157.6532745361328, 161.17425537109375, 164.69525146484375, 168.21624755859375, 171.7372283935547, 175.2582244873047, 178.7792205810547, 182.30020141601562, 185.82119750976562, 189.34219360351562, 192.86317443847656, 196.38417053222656, 199.9051513671875, 203.4261474609375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 8.0, 15.0, 9.0, 16.0, 5.0, 18.0, 14.0, 28.0, 15.0, 25.0, 30.0, 32.0, 20.0, 27.0, 35.0, 38.0, 44.0, 43.0, 36.0, 36.0, 39.0, 27.0, 30.0, 40.0, 36.0, 32.0, 34.0, 35.0, 35.0, 21.0, 21.0, 18.0, 14.0, 15.0, 17.0, 15.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.458660125732422, -19.81545066833496, -19.1722412109375, -18.529033660888672, -17.88582420349121, -17.24261474609375, -16.59940528869629, -15.956195831298828, -15.312986373901367, -14.669776916503906, -14.026568412780762, -13.3833589553833, -12.74014949798584, -12.096940994262695, -11.453731536865234, -10.810522079467773, -10.167313575744629, -9.524104118347168, -8.880895614624023, -8.237686157226562, -7.594476699829102, -6.951267719268799, -6.308058738708496, -5.664849281311035, -5.021640300750732, -4.37843132019043, -3.7352218627929688, -3.092012882232666, -2.448803663253784, -1.8055944442749023, -1.1623854637145996, -0.5191760063171387, 0.12403297424316406, 0.7672421336174011, 1.4104512929916382, 2.0536603927612305, 2.6968696117401123, 3.340078830718994, 3.983287811279297, 4.626497268676758, 5.2697062492370605, 5.912915229797363, 6.556124687194824, 7.199333667755127, 7.84254264831543, 8.48575210571289, 9.128961563110352, 9.772171020507812, 10.415379524230957, 11.058588981628418, 11.701797485351562, 12.345006942749023, 12.988216400146484, 13.631425857543945, 14.27463436126709, 14.91784381866455, 15.561052322387695, 16.204261779785156, 16.847471237182617, 17.490680694580078, 18.133888244628906, 18.777097702026367, 19.420307159423828, 20.06351661682129, 20.70672607421875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 14.0, 13.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 28.0, 43.0, 37.0, 39.0, 51.0, 44.0, 35.0, 38.0, 42.0, 30.0, 47.0, 36.0, 30.0, 43.0, 33.0, 34.0, 28.0, 27.0, 17.0, 22.0, 13.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.45703125, -4.32073974609375, -4.1844482421875, -4.04815673828125, -3.911865234375, -3.77557373046875, -3.6392822265625, -3.50299072265625, -3.36669921875, -3.23040771484375, -3.0941162109375, -2.95782470703125, -2.821533203125, -2.68524169921875, -2.5489501953125, -2.41265869140625, -2.2763671875, -2.14007568359375, -2.0037841796875, -1.86749267578125, -1.731201171875, -1.59490966796875, -1.4586181640625, -1.32232666015625, -1.18603515625, -1.04974365234375, -0.9134521484375, -0.77716064453125, -0.640869140625, -0.50457763671875, -0.3682861328125, -0.23199462890625, -0.095703125, 0.04058837890625, 0.1768798828125, 0.31317138671875, 0.449462890625, 0.58575439453125, 0.7220458984375, 0.85833740234375, 0.99462890625, 1.13092041015625, 1.2672119140625, 1.40350341796875, 1.539794921875, 1.67608642578125, 1.8123779296875, 1.94866943359375, 2.0849609375, 2.22125244140625, 2.3575439453125, 2.49383544921875, 2.630126953125, 2.76641845703125, 2.9027099609375, 3.03900146484375, 3.17529296875, 3.31158447265625, 3.4478759765625, 3.58416748046875, 3.720458984375, 3.85675048828125, 3.9930419921875, 4.12933349609375, 4.265625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 11.0, 9.0, 11.0, 19.0, 38.0, 61.0, 79.0, 114.0, 146.0, 288.0, 398.0, 623.0, 918.0, 1522.0, 2353.0, 3876.0, 6192.0, 10061.0, 16516.0, 27754.0, 49080.0, 89129.0, 176299.0, 307770.0, 160572.0, 82205.0, 45618.0, 26117.0, 15547.0, 9432.0, 5853.0, 3637.0, 2205.0, 1457.0, 932.0, 572.0, 414.0, 259.0, 155.0, 108.0, 78.0, 45.0, 27.0, 17.0, 14.0, 7.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.83154296875, -0.805908203125, -0.7802734375, -0.754638671875, -0.72900390625, -0.703369140625, -0.677734375, -0.652099609375, -0.62646484375, -0.600830078125, -0.5751953125, -0.549560546875, -0.52392578125, -0.498291015625, -0.47265625, -0.447021484375, -0.42138671875, -0.395751953125, -0.3701171875, -0.344482421875, -0.31884765625, -0.293212890625, -0.267578125, -0.241943359375, -0.21630859375, -0.190673828125, -0.1650390625, -0.139404296875, -0.11376953125, -0.088134765625, -0.0625, -0.036865234375, -0.01123046875, 0.014404296875, 0.0400390625, 0.065673828125, 0.09130859375, 0.116943359375, 0.142578125, 0.168212890625, 0.19384765625, 0.219482421875, 0.2451171875, 0.270751953125, 0.29638671875, 0.322021484375, 0.34765625, 0.373291015625, 0.39892578125, 0.424560546875, 0.4501953125, 0.475830078125, 0.50146484375, 0.527099609375, 0.552734375, 0.578369140625, 0.60400390625, 0.629638671875, 0.6552734375, 0.680908203125, 0.70654296875, 0.732177734375, 0.7578125, 0.783447265625, 0.80908203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 0.0, 4.0, 9.0, 10.0, 7.0, 10.0, 6.0, 18.0, 30.0, 22.0, 22.0, 29.0, 38.0, 37.0, 37.0, 30.0, 34.0, 35.0, 43.0, 37.0, 1083.0, 49.0, 44.0, 45.0, 47.0, 39.0, 25.0, 29.0, 33.0, 28.0, 21.0, 15.0, 17.0, 15.0, 13.0, 8.0, 12.0, 16.0, 7.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.92327880859375, -2.8367919921875, -2.75030517578125, -2.663818359375, -2.57733154296875, -2.4908447265625, -2.40435791015625, -2.31787109375, -2.23138427734375, -2.1448974609375, -2.05841064453125, -1.971923828125, -1.88543701171875, -1.7989501953125, -1.71246337890625, -1.6259765625, -1.53948974609375, -1.4530029296875, -1.36651611328125, -1.280029296875, -1.19354248046875, -1.1070556640625, -1.02056884765625, -0.93408203125, -0.84759521484375, -0.7611083984375, -0.67462158203125, -0.588134765625, -0.50164794921875, -0.4151611328125, -0.32867431640625, -0.2421875, -0.15570068359375, -0.0692138671875, 0.01727294921875, 0.103759765625, 0.19024658203125, 0.2767333984375, 0.36322021484375, 0.44970703125, 0.53619384765625, 0.6226806640625, 0.70916748046875, 0.795654296875, 0.88214111328125, 0.9686279296875, 1.05511474609375, 1.1416015625, 1.22808837890625, 1.3145751953125, 1.40106201171875, 1.487548828125, 1.57403564453125, 1.6605224609375, 1.74700927734375, 1.83349609375, 1.91998291015625, 2.0064697265625, 2.09295654296875, 2.179443359375, 2.26593017578125, 2.3524169921875, 2.43890380859375, 2.525390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 13.0, 13.0, 25.0, 30.0, 66.0, 82.0, 118.0, 185.0, 303.0, 466.0, 630.0, 1001.0, 1454.0, 2077.0, 3025.0, 4581.0, 6555.0, 9994.0, 15320.0, 23663.0, 37109.0, 60167.0, 106324.0, 237747.0, 1300611.0, 112307.0, 62186.0, 38409.0, 24360.0, 16066.0, 10575.0, 7176.0, 4752.0, 3138.0, 2116.0, 1446.0, 955.0, 642.0, 452.0, 291.0, 230.0, 159.0, 91.0, 66.0, 44.0, 48.0, 28.0, 9.0, 8.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6352920532226562, -0.6148223876953125, -0.5943527221679688, -0.573883056640625, -0.5534133911132812, -0.5329437255859375, -0.5124740600585938, -0.49200439453125, -0.47153472900390625, -0.4510650634765625, -0.43059539794921875, -0.410125732421875, -0.38965606689453125, -0.3691864013671875, -0.34871673583984375, -0.3282470703125, -0.30777740478515625, -0.2873077392578125, -0.26683807373046875, -0.246368408203125, -0.22589874267578125, -0.2054290771484375, -0.18495941162109375, -0.16448974609375, -0.14402008056640625, -0.1235504150390625, -0.10308074951171875, -0.082611083984375, -0.06214141845703125, -0.0416717529296875, -0.02120208740234375, -0.000732421875, 0.01973724365234375, 0.0402069091796875, 0.06067657470703125, 0.081146240234375, 0.10161590576171875, 0.1220855712890625, 0.14255523681640625, 0.16302490234375, 0.18349456787109375, 0.2039642333984375, 0.22443389892578125, 0.244903564453125, 0.26537322998046875, 0.2858428955078125, 0.30631256103515625, 0.3267822265625, 0.34725189208984375, 0.3677215576171875, 0.38819122314453125, 0.408660888671875, 0.42913055419921875, 0.4496002197265625, 0.47006988525390625, 0.49053955078125, 0.5110092163085938, 0.5314788818359375, 0.5519485473632812, 0.572418212890625, 0.5928878784179688, 0.6133575439453125, 0.6338272094726562, 0.654296875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 16.0, 2.0, 7.0, 7.0, 13.0, 21.0, 24.0, 26.0, 26.0, 50.0, 51.0, 70.0, 67.0, 71.0, 81.0, 68.0, 69.0, 71.0, 63.0, 44.0, 31.0, 18.0, 24.0, 12.0, 15.0, 12.0, 8.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.0001860298216342926, -0.0001801326870918274, -0.00017423555254936218, -0.00016833841800689697, -0.00016244128346443176, -0.00015654414892196655, -0.00015064701437950134, -0.00014474987983703613, -0.00013885274529457092, -0.0001329556107521057, -0.0001270584762096405, -0.00012116134166717529, -0.00011526420712471008, -0.00010936707258224487, -0.00010346993803977966, -9.757280349731445e-05, -9.167566895484924e-05, -8.577853441238403e-05, -7.988139986991882e-05, -7.398426532745361e-05, -6.80871307849884e-05, -6.21899962425232e-05, -5.6292861700057983e-05, -5.0395727157592773e-05, -4.4498592615127563e-05, -3.8601458072662354e-05, -3.2704323530197144e-05, -2.6807188987731934e-05, -2.0910054445266724e-05, -1.5012919902801514e-05, -9.115785360336304e-06, -3.2186508178710938e-06, 2.678483724594116e-06, 8.575618267059326e-06, 1.4472752809524536e-05, 2.0369887351989746e-05, 2.6267021894454956e-05, 3.2164156436920166e-05, 3.8061290979385376e-05, 4.3958425521850586e-05, 4.9855560064315796e-05, 5.5752694606781006e-05, 6.164982914924622e-05, 6.754696369171143e-05, 7.344409823417664e-05, 7.934123277664185e-05, 8.523836731910706e-05, 9.113550186157227e-05, 9.703263640403748e-05, 0.00010292977094650269, 0.0001088269054889679, 0.0001147240400314331, 0.00012062117457389832, 0.00012651830911636353, 0.00013241544365882874, 0.00013831257820129395, 0.00014420971274375916, 0.00015010684728622437, 0.00015600398182868958, 0.00016190111637115479, 0.00016779825091362, 0.0001736953854560852, 0.00017959251999855042, 0.00018548965454101562]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 8.0, 13.0, 23.0, 9.0, 18.0, 29.0, 36.0, 53.0, 82.0, 134.0, 225.0, 459.0, 1338.0, 1010530.0, 33897.0, 818.0, 340.0, 154.0, 124.0, 59.0, 45.0, 35.0, 32.0, 24.0, 13.0, 10.0, 11.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.0040267109870910645, -0.003891587257385254, -0.0037564635276794434, -0.003621339797973633, -0.0034862160682678223, -0.0033510923385620117, -0.003215968608856201, -0.0030808448791503906, -0.00294572114944458, -0.0028105974197387695, -0.002675473690032959, -0.0025403499603271484, -0.002405226230621338, -0.0022701025009155273, -0.002134978771209717, -0.0019998550415039062, -0.0018647313117980957, -0.0017296075820922852, -0.0015944838523864746, -0.001459360122680664, -0.0013242363929748535, -0.001189112663269043, -0.0010539889335632324, -0.0009188652038574219, -0.0007837414741516113, -0.0006486177444458008, -0.0005134940147399902, -0.0003783702850341797, -0.00024324655532836914, -0.0001081228256225586, 2.7000904083251953e-05, 0.0001621246337890625, 0.00029724836349487305, 0.0004323720932006836, 0.0005674958229064941, 0.0007026195526123047, 0.0008377432823181152, 0.0009728670120239258, 0.0011079907417297363, 0.0012431144714355469, 0.0013782382011413574, 0.001513361930847168, 0.0016484856605529785, 0.001783609390258789, 0.0019187331199645996, 0.00205385684967041, 0.0021889805793762207, 0.0023241043090820312, 0.002459228038787842, 0.0025943517684936523, 0.002729475498199463, 0.0028645992279052734, 0.002999722957611084, 0.0031348466873168945, 0.003269970417022705, 0.0034050941467285156, 0.003540217876434326, 0.0036753416061401367, 0.0038104653358459473, 0.003945589065551758, 0.004080712795257568, 0.004215836524963379, 0.0043509602546691895, 0.004486083984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 15.0, 29.0, 64.0, 106.0, 143.0, 172.0, 154.0, 144.0, 94.0, 41.0, 25.0, 14.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010209299944108352, -9.857855911832303e-05, -9.506411879556254e-05, -9.154967847280204e-05, -8.803523815004155e-05, -8.452079782728106e-05, -8.100636478047818e-05, -7.749191718176007e-05, -7.39774841349572e-05, -7.04630438121967e-05, -6.694860348943621e-05, -6.343416316667572e-05, -5.9919722843915224e-05, -5.640528252115473e-05, -5.2890845836373046e-05, -4.9376405513612553e-05, -4.5861961552873254e-05, -4.234752123011276e-05, -3.883308090735227e-05, -3.5318640584591776e-05, -3.1804200261831284e-05, -2.8289761758060195e-05, -2.4775323254289106e-05, -2.1260882931528613e-05, -1.774644260876812e-05, -1.4232002286007628e-05, -1.0717562872741837e-05, -7.203123459476046e-06, -3.6886831367155537e-06, -1.7424281395506114e-07, 3.340195689816028e-06, 6.8546360125765204e-06, 1.0369083611294627e-05, 1.388352393405512e-05, 1.7397964256815612e-05, 2.09124027605867e-05, 2.4426843083347194e-05, 2.7941283406107686e-05, 3.1455721909878775e-05, 3.497016223263927e-05, 3.848460255539976e-05, 4.199904287816025e-05, 4.5513483200920746e-05, 4.902791988570243e-05, 5.2542360208462924e-05, 5.6056800531223416e-05, 5.957124085398391e-05, 6.30856811767444e-05, 6.66001214995049e-05, 7.011456182226539e-05, 7.362900214502588e-05, 7.714344246778637e-05, 8.065788279054686e-05, 8.417232311330736e-05, 8.768675616011024e-05, 9.120120375882834e-05, 9.471563680563122e-05, 9.823007712839171e-05, 0.0001017445174511522, 0.0001052589577739127, 0.00010877339809667319, 0.00011228783841943368, 0.00011580227874219418, 0.00011931671178899705, 0.00012283115938771516]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 6.0, 13.0, 10.0, 18.0, 11.0, 25.0, 13.0, 23.0, 21.0, 31.0, 34.0, 26.0, 32.0, 42.0, 35.0, 33.0, 41.0, 29.0, 44.0, 35.0, 36.0, 31.0, 40.0, 34.0, 38.0, 23.0, 28.0, 33.0, 28.0, 28.0, 17.0, 10.0, 19.0, 15.0, 14.0, 8.0, 8.0, 10.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.575750350952148e-05, -7.341057062149048e-05, -7.106363773345947e-05, -6.871670484542847e-05, -6.636977195739746e-05, -6.402283906936646e-05, -6.167590618133545e-05, -5.932897329330444e-05, -5.698204040527344e-05, -5.463510751724243e-05, -5.2288174629211426e-05, -4.994124174118042e-05, -4.7594308853149414e-05, -4.524737596511841e-05, -4.29004430770874e-05, -4.0553510189056396e-05, -3.820657730102539e-05, -3.5859644412994385e-05, -3.351271152496338e-05, -3.116577863693237e-05, -2.8818845748901367e-05, -2.647191286087036e-05, -2.4124979972839355e-05, -2.177804708480835e-05, -1.9431114196777344e-05, -1.7084181308746338e-05, -1.4737248420715332e-05, -1.2390315532684326e-05, -1.004338264465332e-05, -7.696449756622314e-06, -5.349516868591309e-06, -3.0025839805603027e-06, -6.556510925292969e-07, 1.691281795501709e-06, 4.038214683532715e-06, 6.385147571563721e-06, 8.732080459594727e-06, 1.1079013347625732e-05, 1.3425946235656738e-05, 1.5772879123687744e-05, 1.811981201171875e-05, 2.0466744899749756e-05, 2.2813677787780762e-05, 2.5160610675811768e-05, 2.7507543563842773e-05, 2.985447645187378e-05, 3.2201409339904785e-05, 3.454834222793579e-05, 3.68952751159668e-05, 3.92422080039978e-05, 4.158914089202881e-05, 4.3936073780059814e-05, 4.628300666809082e-05, 4.8629939556121826e-05, 5.097687244415283e-05, 5.332380533218384e-05, 5.5670738220214844e-05, 5.801767110824585e-05, 6.0364603996276855e-05, 6.271153688430786e-05, 6.505846977233887e-05, 6.740540266036987e-05, 6.975233554840088e-05, 7.209926843643188e-05, 7.444620132446289e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 14.0, 13.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 28.0, 43.0, 37.0, 39.0, 51.0, 44.0, 35.0, 38.0, 42.0, 30.0, 47.0, 36.0, 30.0, 43.0, 33.0, 34.0, 28.0, 27.0, 17.0, 22.0, 13.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.45703125, -4.32073974609375, -4.1844482421875, -4.04815673828125, -3.911865234375, -3.77557373046875, -3.6392822265625, -3.50299072265625, -3.36669921875, -3.23040771484375, -3.0941162109375, -2.95782470703125, -2.821533203125, -2.68524169921875, -2.5489501953125, -2.41265869140625, -2.2763671875, -2.14007568359375, -2.0037841796875, -1.86749267578125, -1.731201171875, -1.59490966796875, -1.4586181640625, -1.32232666015625, -1.18603515625, -1.04974365234375, -0.9134521484375, -0.77716064453125, -0.640869140625, -0.50457763671875, -0.3682861328125, -0.23199462890625, -0.095703125, 0.04058837890625, 0.1768798828125, 0.31317138671875, 0.449462890625, 0.58575439453125, 0.7220458984375, 0.85833740234375, 0.99462890625, 1.13092041015625, 1.2672119140625, 1.40350341796875, 1.539794921875, 1.67608642578125, 1.8123779296875, 1.94866943359375, 2.0849609375, 2.22125244140625, 2.3575439453125, 2.49383544921875, 2.630126953125, 2.76641845703125, 2.9027099609375, 3.03900146484375, 3.17529296875, 3.31158447265625, 3.4478759765625, 3.58416748046875, 3.720458984375, 3.85675048828125, 3.9930419921875, 4.12933349609375, 4.265625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 2.0, 8.0, 9.0, 9.0, 19.0, 21.0, 24.0, 36.0, 44.0, 66.0, 97.0, 126.0, 190.0, 276.0, 430.0, 835.0, 2827.0, 13082.0, 65420.0, 489034.0, 406361.0, 54177.0, 10874.0, 2460.0, 807.0, 407.0, 268.0, 184.0, 122.0, 88.0, 64.0, 43.0, 40.0, 33.0, 21.0, 12.0, 7.0, 11.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.296875, -8.0450439453125, -7.793212890625, -7.5413818359375, -7.28955078125, -7.0377197265625, -6.785888671875, -6.5340576171875, -6.2822265625, -6.0303955078125, -5.778564453125, -5.5267333984375, -5.27490234375, -5.0230712890625, -4.771240234375, -4.5194091796875, -4.267578125, -4.0157470703125, -3.763916015625, -3.5120849609375, -3.26025390625, -3.0084228515625, -2.756591796875, -2.5047607421875, -2.2529296875, -2.0010986328125, -1.749267578125, -1.4974365234375, -1.24560546875, -0.9937744140625, -0.741943359375, -0.4901123046875, -0.23828125, 0.0135498046875, 0.265380859375, 0.5172119140625, 0.76904296875, 1.0208740234375, 1.272705078125, 1.5245361328125, 1.7763671875, 2.0281982421875, 2.280029296875, 2.5318603515625, 2.78369140625, 3.0355224609375, 3.287353515625, 3.5391845703125, 3.791015625, 4.0428466796875, 4.294677734375, 4.5465087890625, 4.79833984375, 5.0501708984375, 5.302001953125, 5.5538330078125, 5.8056640625, 6.0574951171875, 6.309326171875, 6.5611572265625, 6.81298828125, 7.0648193359375, 7.316650390625, 7.5684814453125, 7.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 12.0, 12.0, 10.0, 10.0, 18.0, 17.0, 21.0, 23.0, 29.0, 30.0, 43.0, 42.0, 56.0, 58.0, 75.0, 134.0, 391.0, 1411.0, 168.0, 69.0, 52.0, 46.0, 40.0, 41.0, 36.0, 23.0, 28.0, 20.0, 17.0, 12.0, 17.0, 11.0, 14.0, 11.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.5960693359375, -12.176513671875, -11.7569580078125, -11.33740234375, -10.9178466796875, -10.498291015625, -10.0787353515625, -9.6591796875, -9.2396240234375, -8.820068359375, -8.4005126953125, -7.98095703125, -7.5614013671875, -7.141845703125, -6.7222900390625, -6.302734375, -5.8831787109375, -5.463623046875, -5.0440673828125, -4.62451171875, -4.2049560546875, -3.785400390625, -3.3658447265625, -2.9462890625, -2.5267333984375, -2.107177734375, -1.6876220703125, -1.26806640625, -0.8485107421875, -0.428955078125, -0.0093994140625, 0.41015625, 0.8297119140625, 1.249267578125, 1.6688232421875, 2.08837890625, 2.5079345703125, 2.927490234375, 3.3470458984375, 3.7666015625, 4.1861572265625, 4.605712890625, 5.0252685546875, 5.44482421875, 5.8643798828125, 6.283935546875, 6.7034912109375, 7.123046875, 7.5426025390625, 7.962158203125, 8.3817138671875, 8.80126953125, 9.2208251953125, 9.640380859375, 10.0599365234375, 10.4794921875, 10.8990478515625, 11.318603515625, 11.7381591796875, 12.15771484375, 12.5772705078125, 12.996826171875, 13.4163818359375, 13.8359375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 3.0, 9.0, 10.0, 14.0, 23.0, 24.0, 20.0, 21.0, 38.0, 49.0, 49.0, 82.0, 119.0, 192.0, 254.0, 505.0, 1212.0, 7902.0, 2965328.0, 165133.0, 2709.0, 812.0, 384.0, 235.0, 121.0, 83.0, 70.0, 63.0, 41.0, 45.0, 21.0, 24.0, 20.0, 16.0, 10.0, 11.0, 11.0, 9.0, 4.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.08349609375, -28.0732421875, -27.06298828125, -26.052734375, -25.04248046875, -24.0322265625, -23.02197265625, -22.01171875, -21.00146484375, -19.9912109375, -18.98095703125, -17.970703125, -16.96044921875, -15.9501953125, -14.93994140625, -13.9296875, -12.91943359375, -11.9091796875, -10.89892578125, -9.888671875, -8.87841796875, -7.8681640625, -6.85791015625, -5.84765625, -4.83740234375, -3.8271484375, -2.81689453125, -1.806640625, -0.79638671875, 0.2138671875, 1.22412109375, 2.234375, 3.24462890625, 4.2548828125, 5.26513671875, 6.275390625, 7.28564453125, 8.2958984375, 9.30615234375, 10.31640625, 11.32666015625, 12.3369140625, 13.34716796875, 14.357421875, 15.36767578125, 16.3779296875, 17.38818359375, 18.3984375, 19.40869140625, 20.4189453125, 21.42919921875, 22.439453125, 23.44970703125, 24.4599609375, 25.47021484375, 26.48046875, 27.49072265625, 28.5009765625, 29.51123046875, 30.521484375, 31.53173828125, 32.5419921875, 33.55224609375, 34.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 364.0, 639.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.357666015625, -178.4025115966797, -174.44735717773438, -170.49220275878906, -166.53704833984375, -162.58189392089844, -158.62673950195312, -154.6715850830078, -150.7164306640625, -146.7612762451172, -142.80612182617188, -138.85096740722656, -134.89581298828125, -130.94065856933594, -126.98550415039062, -123.03034973144531, -119.0751953125, -115.12004089355469, -111.16488647460938, -107.20973205566406, -103.25457763671875, -99.29942321777344, -95.34426879882812, -91.38911437988281, -87.43396759033203, -83.47881317138672, -79.5236587524414, -75.5685043334961, -71.61334991455078, -67.65819549560547, -63.703041076660156, -59.747886657714844, -55.79273223876953, -51.83757781982422, -47.882423400878906, -43.927268981933594, -39.97211456298828, -36.01696014404297, -32.061805725097656, -28.106653213500977, -24.151498794555664, -20.19634437561035, -16.24118995666504, -12.286036491394043, -8.33088207244873, -4.375728607177734, -0.4205741882324219, 3.5345802307128906, 7.489734649658203, 11.444889068603516, 15.400043487548828, 19.35519790649414, 23.310352325439453, 27.265504837036133, 31.220659255981445, 35.175811767578125, 39.13096618652344, 43.08612060546875, 47.04127502441406, 50.996429443359375, 54.95158386230469, 58.90673828125, 62.86189270019531, 66.81704711914062, 70.77220153808594]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 9.0, 5.0, 9.0, 5.0, 10.0, 14.0, 18.0, 21.0, 35.0, 27.0, 22.0, 31.0, 37.0, 32.0, 45.0, 61.0, 34.0, 42.0, 38.0, 39.0, 28.0, 43.0, 38.0, 33.0, 30.0, 35.0, 23.0, 23.0, 34.0, 22.0, 24.0, 17.0, 11.0, 17.0, 9.0, 7.0, 8.0, 10.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.35193634033203, -27.443452835083008, -26.534971237182617, -25.626487731933594, -24.71800422668457, -23.809520721435547, -22.901039123535156, -21.992555618286133, -21.08407211303711, -20.175588607788086, -19.267107009887695, -18.358623504638672, -17.45013999938965, -16.541656494140625, -15.633174896240234, -14.724691390991211, -13.81620979309082, -12.907727241516113, -11.99924373626709, -11.090761184692383, -10.18227767944336, -9.273795127868652, -8.365312576293945, -7.45682954788208, -6.548346519470215, -5.63986349105835, -4.731380462646484, -3.8228979110717773, -2.914414882659912, -2.005931854248047, -1.0974493026733398, -0.1889662742614746, 0.7195186614990234, 1.6280015707015991, 2.536484479904175, 3.444967269897461, 4.353450298309326, 5.261933326721191, 6.170415878295898, 7.078898906707764, 7.987381935119629, 8.895864486694336, 9.80434799194336, 10.712830543518066, 11.621313095092773, 12.529796600341797, 13.438279151916504, 14.346761703491211, 15.255245208740234, 16.163728713989258, 17.07221031188965, 17.980693817138672, 18.889177322387695, 19.79766082763672, 20.70614242553711, 21.614625930786133, 22.523109436035156, 23.43159294128418, 24.34007453918457, 25.248558044433594, 26.157041549682617, 27.06552505493164, 27.97400665283203, 28.882490158081055, 29.790971755981445]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 9.0, 9.0, 16.0, 9.0, 22.0, 20.0, 28.0, 23.0, 38.0, 31.0, 21.0, 31.0, 33.0, 45.0, 40.0, 40.0, 41.0, 44.0, 44.0, 40.0, 38.0, 38.0, 30.0, 35.0, 36.0, 29.0, 26.0, 22.0, 14.0, 21.0, 13.0, 12.0, 9.0, 11.0, 17.0, 6.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.03515625, -3.90496826171875, -3.7747802734375, -3.64459228515625, -3.514404296875, -3.38421630859375, -3.2540283203125, -3.12384033203125, -2.99365234375, -2.86346435546875, -2.7332763671875, -2.60308837890625, -2.472900390625, -2.34271240234375, -2.2125244140625, -2.08233642578125, -1.9521484375, -1.82196044921875, -1.6917724609375, -1.56158447265625, -1.431396484375, -1.30120849609375, -1.1710205078125, -1.04083251953125, -0.91064453125, -0.78045654296875, -0.6502685546875, -0.52008056640625, -0.389892578125, -0.25970458984375, -0.1295166015625, 0.00067138671875, 0.130859375, 0.26104736328125, 0.3912353515625, 0.52142333984375, 0.651611328125, 0.78179931640625, 0.9119873046875, 1.04217529296875, 1.17236328125, 1.30255126953125, 1.4327392578125, 1.56292724609375, 1.693115234375, 1.82330322265625, 1.9534912109375, 2.08367919921875, 2.2138671875, 2.34405517578125, 2.4742431640625, 2.60443115234375, 2.734619140625, 2.86480712890625, 2.9949951171875, 3.12518310546875, 3.25537109375, 3.38555908203125, 3.5157470703125, 3.64593505859375, 3.776123046875, 3.90631103515625, 4.0364990234375, 4.16668701171875, 4.296875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 9.0, 13.0, 14.0, 16.0, 29.0, 22.0, 24.0, 47.0, 47.0, 61.0, 82.0, 135.0, 203.0, 562.0, 2274.0, 33292.0, 874831.0, 2891512.0, 375191.0, 13414.0, 1408.0, 405.0, 190.0, 109.0, 80.0, 50.0, 47.0, 33.0, 24.0, 22.0, 15.0, 17.0, 16.0, 8.0, 13.0, 7.0, 6.0, 9.0, 3.0, 5.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-11.125, -10.79150390625, -10.4580078125, -10.12451171875, -9.791015625, -9.45751953125, -9.1240234375, -8.79052734375, -8.45703125, -8.12353515625, -7.7900390625, -7.45654296875, -7.123046875, -6.78955078125, -6.4560546875, -6.12255859375, -5.7890625, -5.45556640625, -5.1220703125, -4.78857421875, -4.455078125, -4.12158203125, -3.7880859375, -3.45458984375, -3.12109375, -2.78759765625, -2.4541015625, -2.12060546875, -1.787109375, -1.45361328125, -1.1201171875, -0.78662109375, -0.453125, -0.11962890625, 0.2138671875, 0.54736328125, 0.880859375, 1.21435546875, 1.5478515625, 1.88134765625, 2.21484375, 2.54833984375, 2.8818359375, 3.21533203125, 3.548828125, 3.88232421875, 4.2158203125, 4.54931640625, 4.8828125, 5.21630859375, 5.5498046875, 5.88330078125, 6.216796875, 6.55029296875, 6.8837890625, 7.21728515625, 7.55078125, 7.88427734375, 8.2177734375, 8.55126953125, 8.884765625, 9.21826171875, 9.5517578125, 9.88525390625, 10.21875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 12.0, 9.0, 15.0, 18.0, 17.0, 32.0, 31.0, 66.0, 70.0, 109.0, 145.0, 194.0, 209.0, 297.0, 348.0, 351.0, 408.0, 367.0, 275.0, 223.0, 213.0, 158.0, 106.0, 85.0, 75.0, 50.0, 36.0, 33.0, 16.0, 16.0, 13.0, 13.0, 21.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.10546875, -5.92706298828125, -5.7486572265625, -5.57025146484375, -5.391845703125, -5.21343994140625, -5.0350341796875, -4.85662841796875, -4.67822265625, -4.49981689453125, -4.3214111328125, -4.14300537109375, -3.964599609375, -3.78619384765625, -3.6077880859375, -3.42938232421875, -3.2509765625, -3.07257080078125, -2.8941650390625, -2.71575927734375, -2.537353515625, -2.35894775390625, -2.1805419921875, -2.00213623046875, -1.82373046875, -1.64532470703125, -1.4669189453125, -1.28851318359375, -1.110107421875, -0.93170166015625, -0.7532958984375, -0.57489013671875, -0.396484375, -0.21807861328125, -0.0396728515625, 0.13873291015625, 0.317138671875, 0.49554443359375, 0.6739501953125, 0.85235595703125, 1.03076171875, 1.20916748046875, 1.3875732421875, 1.56597900390625, 1.744384765625, 1.92279052734375, 2.1011962890625, 2.27960205078125, 2.4580078125, 2.63641357421875, 2.8148193359375, 2.99322509765625, 3.171630859375, 3.35003662109375, 3.5284423828125, 3.70684814453125, 3.88525390625, 4.06365966796875, 4.2420654296875, 4.42047119140625, 4.598876953125, 4.77728271484375, 4.9556884765625, 5.13409423828125, 5.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 10.0, 7.0, 16.0, 19.0, 23.0, 26.0, 54.0, 70.0, 77.0, 96.0, 130.0, 176.0, 261.0, 433.0, 759.0, 2264.0, 28945.0, 2603854.0, 1535414.0, 17784.0, 1820.0, 729.0, 416.0, 238.0, 169.0, 123.0, 73.0, 62.0, 56.0, 47.0, 38.0, 30.0, 14.0, 13.0, 12.0, 12.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.423095703125, -16.79931640625, -16.175537109375, -15.5517578125, -14.927978515625, -14.30419921875, -13.680419921875, -13.056640625, -12.432861328125, -11.80908203125, -11.185302734375, -10.5615234375, -9.937744140625, -9.31396484375, -8.690185546875, -8.06640625, -7.442626953125, -6.81884765625, -6.195068359375, -5.5712890625, -4.947509765625, -4.32373046875, -3.699951171875, -3.076171875, -2.452392578125, -1.82861328125, -1.204833984375, -0.5810546875, 0.042724609375, 0.66650390625, 1.290283203125, 1.9140625, 2.537841796875, 3.16162109375, 3.785400390625, 4.4091796875, 5.032958984375, 5.65673828125, 6.280517578125, 6.904296875, 7.528076171875, 8.15185546875, 8.775634765625, 9.3994140625, 10.023193359375, 10.64697265625, 11.270751953125, 11.89453125, 12.518310546875, 13.14208984375, 13.765869140625, 14.3896484375, 15.013427734375, 15.63720703125, 16.260986328125, 16.884765625, 17.508544921875, 18.13232421875, 18.756103515625, 19.3798828125, 20.003662109375, 20.62744140625, 21.251220703125, 21.875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 25.0, 129.0, 367.0, 356.0, 115.0, 22.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.33060455322266, -105.81037902832031, -103.2901611328125, -100.76993560791016, -98.24971008300781, -95.7294921875, -93.20926666259766, -90.68904113769531, -88.1688232421875, -85.64859771728516, -83.12837982177734, -80.608154296875, -78.08793640136719, -75.56771087646484, -73.0474853515625, -70.52726745605469, -68.00704193115234, -65.48681640625, -62.96659851074219, -60.446372985839844, -57.926151275634766, -55.40592956542969, -52.885704040527344, -50.365482330322266, -47.84526062011719, -45.32503890991211, -42.80481719970703, -40.28459167480469, -37.76436996459961, -35.24414825439453, -32.72392272949219, -30.20370101928711, -27.6834716796875, -25.163249969482422, -22.64302635192871, -20.122802734375, -17.602581024169922, -15.082358360290527, -12.562135696411133, -10.041912078857422, -7.521690368652344, -5.001467704772949, -2.4812450408935547, 0.038977622985839844, 2.5592002868652344, 5.079422950744629, 7.599645614624023, 10.119869232177734, 12.640090942382812, 15.160313606262207, 17.6805362701416, 20.200759887695312, 22.72098159790039, 25.24120330810547, 27.76142692565918, 30.28165054321289, 32.80187225341797, 35.32209396362305, 37.842315673828125, 40.36254119873047, 42.88276290893555, 45.402984619140625, 47.92321014404297, 50.44343185424805, 52.963653564453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 7.0, 7.0, 13.0, 10.0, 16.0, 11.0, 13.0, 25.0, 27.0, 25.0, 21.0, 32.0, 41.0, 41.0, 42.0, 30.0, 43.0, 39.0, 42.0, 41.0, 33.0, 30.0, 35.0, 34.0, 35.0, 24.0, 38.0, 32.0, 30.0, 22.0, 25.0, 16.0, 11.0, 15.0, 14.0, 11.0, 14.0, 6.0, 7.0, 5.0, 4.0, 7.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.28722381591797, -19.64261245727539, -18.998001098632812, -18.353389739990234, -17.708778381347656, -17.064167022705078, -16.4195556640625, -15.774945259094238, -15.13033390045166, -14.485722541809082, -13.841111183166504, -13.196499824523926, -12.551889419555664, -11.907278060913086, -11.262666702270508, -10.61805534362793, -9.973443984985352, -9.328832626342773, -8.684221267700195, -8.039609909057617, -7.394999027252197, -6.750387668609619, -6.105776786804199, -5.461165428161621, -4.816554069519043, -4.171942710876465, -3.527331590652466, -2.882720470428467, -2.2381091117858887, -1.5934977531433105, -0.9488866329193115, -0.3042755126953125, 0.3403358459472656, 0.9849470853805542, 1.6295583248138428, 2.274169445037842, 2.91878080368042, 3.563392162322998, 4.208003044128418, 4.852614402770996, 5.497225761413574, 6.141837120056152, 6.7864484786987305, 7.43105936050415, 8.07567024230957, 8.720281600952148, 9.364892959594727, 10.009504318237305, 10.654115676879883, 11.298727035522461, 11.943338394165039, 12.587949752807617, 13.232561111450195, 13.877172470092773, 14.521782875061035, 15.166394233703613, 15.811005592346191, 16.455615997314453, 17.10022735595703, 17.74483871459961, 18.389450073242188, 19.034061431884766, 19.678672790527344, 20.323284149169922, 20.9678955078125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 8.0, 3.0, 7.0, 11.0, 11.0, 14.0, 23.0, 22.0, 19.0, 20.0, 29.0, 26.0, 24.0, 30.0, 39.0, 40.0, 42.0, 30.0, 36.0, 41.0, 50.0, 54.0, 43.0, 37.0, 44.0, 25.0, 30.0, 44.0, 20.0, 20.0, 25.0, 22.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93505859375, -3.7998046875, -3.66455078125, -3.529296875, -3.39404296875, -3.2587890625, -3.12353515625, -2.98828125, -2.85302734375, -2.7177734375, -2.58251953125, -2.447265625, -2.31201171875, -2.1767578125, -2.04150390625, -1.90625, -1.77099609375, -1.6357421875, -1.50048828125, -1.365234375, -1.22998046875, -1.0947265625, -0.95947265625, -0.82421875, -0.68896484375, -0.5537109375, -0.41845703125, -0.283203125, -0.14794921875, -0.0126953125, 0.12255859375, 0.2578125, 0.39306640625, 0.5283203125, 0.66357421875, 0.798828125, 0.93408203125, 1.0693359375, 1.20458984375, 1.33984375, 1.47509765625, 1.6103515625, 1.74560546875, 1.880859375, 2.01611328125, 2.1513671875, 2.28662109375, 2.421875, 2.55712890625, 2.6923828125, 2.82763671875, 2.962890625, 3.09814453125, 3.2333984375, 3.36865234375, 3.50390625, 3.63916015625, 3.7744140625, 3.90966796875, 4.044921875, 4.18017578125, 4.3154296875, 4.45068359375, 4.5859375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 22.0, 33.0, 35.0, 53.0, 77.0, 88.0, 145.0, 197.0, 299.0, 445.0, 591.0, 846.0, 1119.0, 1700.0, 2478.0, 3691.0, 5147.0, 7644.0, 11462.0, 16878.0, 25331.0, 39336.0, 63173.0, 111476.0, 227193.0, 232062.0, 113448.0, 64365.0, 39703.0, 26063.0, 17163.0, 11343.0, 7709.0, 5298.0, 3700.0, 2454.0, 1723.0, 1136.0, 876.0, 596.0, 449.0, 273.0, 205.0, 157.0, 112.0, 92.0, 47.0, 26.0, 32.0, 19.0, 8.0, 3.0, 8.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.63818359375, -0.6176071166992188, -0.5970306396484375, -0.5764541625976562, -0.555877685546875, -0.5353012084960938, -0.5147247314453125, -0.49414825439453125, -0.47357177734375, -0.45299530029296875, -0.4324188232421875, -0.41184234619140625, -0.391265869140625, -0.37068939208984375, -0.3501129150390625, -0.32953643798828125, -0.3089599609375, -0.28838348388671875, -0.2678070068359375, -0.24723052978515625, -0.226654052734375, -0.20607757568359375, -0.1855010986328125, -0.16492462158203125, -0.14434814453125, -0.12377166748046875, -0.1031951904296875, -0.08261871337890625, -0.062042236328125, -0.04146575927734375, -0.0208892822265625, -0.00031280517578125, 0.020263671875, 0.04084014892578125, 0.0614166259765625, 0.08199310302734375, 0.102569580078125, 0.12314605712890625, 0.1437225341796875, 0.16429901123046875, 0.18487548828125, 0.20545196533203125, 0.2260284423828125, 0.24660491943359375, 0.267181396484375, 0.28775787353515625, 0.3083343505859375, 0.32891082763671875, 0.3494873046875, 0.37006378173828125, 0.3906402587890625, 0.41121673583984375, 0.431793212890625, 0.45236968994140625, 0.4729461669921875, 0.49352264404296875, 0.51409912109375, 0.5346755981445312, 0.5552520751953125, 0.5758285522460938, 0.596405029296875, 0.6169815063476562, 0.6375579833984375, 0.6581344604492188, 0.6787109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 6.0, 12.0, 13.0, 6.0, 18.0, 15.0, 20.0, 19.0, 29.0, 27.0, 32.0, 29.0, 28.0, 34.0, 32.0, 43.0, 32.0, 43.0, 34.0, 1062.0, 33.0, 42.0, 31.0, 27.0, 44.0, 32.0, 31.0, 32.0, 29.0, 26.0, 14.0, 19.0, 14.0, 19.0, 18.0, 9.0, 6.0, 10.0, 7.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55078125, -2.46875, -2.38671875, -2.3046875, -2.22265625, -2.140625, -2.05859375, -1.9765625, -1.89453125, -1.8125, -1.73046875, -1.6484375, -1.56640625, -1.484375, -1.40234375, -1.3203125, -1.23828125, -1.15625, -1.07421875, -0.9921875, -0.91015625, -0.828125, -0.74609375, -0.6640625, -0.58203125, -0.5, -0.41796875, -0.3359375, -0.25390625, -0.171875, -0.08984375, -0.0078125, 0.07421875, 0.15625, 0.23828125, 0.3203125, 0.40234375, 0.484375, 0.56640625, 0.6484375, 0.73046875, 0.8125, 0.89453125, 0.9765625, 1.05859375, 1.140625, 1.22265625, 1.3046875, 1.38671875, 1.46875, 1.55078125, 1.6328125, 1.71484375, 1.796875, 1.87890625, 1.9609375, 2.04296875, 2.125, 2.20703125, 2.2890625, 2.37109375, 2.453125, 2.53515625, 2.6171875, 2.69921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 8.0, 9.0, 15.0, 27.0, 35.0, 47.0, 90.0, 96.0, 161.0, 230.0, 350.0, 457.0, 631.0, 919.0, 1223.0, 1695.0, 2372.0, 3250.0, 4538.0, 6129.0, 8601.0, 12288.0, 17421.0, 24979.0, 36658.0, 55438.0, 88723.0, 162438.0, 1294168.0, 136133.0, 78001.0, 49088.0, 32632.0, 22693.0, 15733.0, 11342.0, 8061.0, 5804.0, 4123.0, 2940.0, 2132.0, 1559.0, 1095.0, 827.0, 595.0, 421.0, 274.0, 210.0, 155.0, 101.0, 74.0, 56.0, 38.0, 23.0, 17.0, 8.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.5810546875, -0.5631027221679688, -0.5451507568359375, -0.5271987915039062, -0.509246826171875, -0.49129486083984375, -0.4733428955078125, -0.45539093017578125, -0.43743896484375, -0.41948699951171875, -0.4015350341796875, -0.38358306884765625, -0.365631103515625, -0.34767913818359375, -0.3297271728515625, -0.31177520751953125, -0.2938232421875, -0.27587127685546875, -0.2579193115234375, -0.23996734619140625, -0.222015380859375, -0.20406341552734375, -0.1861114501953125, -0.16815948486328125, -0.15020751953125, -0.13225555419921875, -0.1143035888671875, -0.09635162353515625, -0.078399658203125, -0.06044769287109375, -0.0424957275390625, -0.02454376220703125, -0.006591796875, 0.01136016845703125, 0.0293121337890625, 0.04726409912109375, 0.065216064453125, 0.08316802978515625, 0.1011199951171875, 0.11907196044921875, 0.13702392578125, 0.15497589111328125, 0.1729278564453125, 0.19087982177734375, 0.208831787109375, 0.22678375244140625, 0.2447357177734375, 0.26268768310546875, 0.2806396484375, 0.29859161376953125, 0.3165435791015625, 0.33449554443359375, 0.352447509765625, 0.37039947509765625, 0.3883514404296875, 0.40630340576171875, 0.42425537109375, 0.44220733642578125, 0.4601593017578125, 0.47811126708984375, 0.496063232421875, 0.5140151977539062, 0.5319671630859375, 0.5499191284179688, 0.56787109375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 10.0, 8.0, 10.0, 11.0, 16.0, 18.0, 15.0, 29.0, 26.0, 42.0, 50.0, 44.0, 58.0, 76.0, 51.0, 65.0, 56.0, 64.0, 51.0, 49.0, 60.0, 46.0, 27.0, 26.0, 17.0, 11.0, 10.0, 9.0, 9.0, 5.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018531642854213715, -0.00017942115664482117, -0.0001735258847475052, -0.0001676306128501892, -0.00016173534095287323, -0.00015584006905555725, -0.00014994479715824127, -0.0001440495252609253, -0.00013815425336360931, -0.00013225898146629333, -0.00012636370956897736, -0.00012046843767166138, -0.0001145731657743454, -0.00010867789387702942, -0.00010278262197971344, -9.688735008239746e-05, -9.099207818508148e-05, -8.50968062877655e-05, -7.920153439044952e-05, -7.330626249313354e-05, -6.741099059581757e-05, -6.151571869850159e-05, -5.562044680118561e-05, -4.972517490386963e-05, -4.382990300655365e-05, -3.793463110923767e-05, -3.203935921192169e-05, -2.6144087314605713e-05, -2.0248815417289734e-05, -1.4353543519973755e-05, -8.458271622657776e-06, -2.562999725341797e-06, 3.332272171974182e-06, 9.227544069290161e-06, 1.512281596660614e-05, 2.101808786392212e-05, 2.6913359761238098e-05, 3.280863165855408e-05, 3.8703903555870056e-05, 4.4599175453186035e-05, 5.0494447350502014e-05, 5.638971924781799e-05, 6.228499114513397e-05, 6.818026304244995e-05, 7.407553493976593e-05, 7.997080683708191e-05, 8.586607873439789e-05, 9.176135063171387e-05, 9.765662252902985e-05, 0.00010355189442634583, 0.0001094471663236618, 0.00011534243822097778, 0.00012123771011829376, 0.00012713298201560974, 0.00013302825391292572, 0.0001389235258102417, 0.00014481879770755768, 0.00015071406960487366, 0.00015660934150218964, 0.00016250461339950562, 0.0001683998852968216, 0.00017429515719413757, 0.00018019042909145355, 0.00018608570098876953]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 7.0, 12.0, 17.0, 17.0, 24.0, 26.0, 39.0, 57.0, 91.0, 147.0, 224.0, 341.0, 674.0, 2570.0, 1036095.0, 6239.0, 818.0, 396.0, 214.0, 162.0, 76.0, 73.0, 50.0, 33.0, 37.0, 23.0, 19.0, 22.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.004034161567687988, -0.0039064884185791016, -0.003778815269470215, -0.003651142120361328, -0.0035234689712524414, -0.0033957958221435547, -0.003268122673034668, -0.0031404495239257812, -0.0030127763748168945, -0.002885103225708008, -0.002757430076599121, -0.0026297569274902344, -0.0025020837783813477, -0.002374410629272461, -0.0022467374801635742, -0.0021190643310546875, -0.0019913911819458008, -0.001863718032836914, -0.0017360448837280273, -0.0016083717346191406, -0.001480698585510254, -0.0013530254364013672, -0.0012253522872924805, -0.0010976791381835938, -0.000970005989074707, -0.0008423328399658203, -0.0007146596908569336, -0.0005869865417480469, -0.00045931339263916016, -0.00033164024353027344, -0.00020396709442138672, -7.62939453125e-05, 5.137920379638672e-05, 0.00017905235290527344, 0.00030672550201416016, 0.0004343986511230469, 0.0005620718002319336, 0.0006897449493408203, 0.000817418098449707, 0.0009450912475585938, 0.0010727643966674805, 0.0012004375457763672, 0.001328110694885254, 0.0014557838439941406, 0.0015834569931030273, 0.001711130142211914, 0.0018388032913208008, 0.0019664764404296875, 0.0020941495895385742, 0.002221822738647461, 0.0023494958877563477, 0.0024771690368652344, 0.002604842185974121, 0.002732515335083008, 0.0028601884841918945, 0.0029878616333007812, 0.003115534782409668, 0.0032432079315185547, 0.0033708810806274414, 0.003498554229736328, 0.003626227378845215, 0.0037539005279541016, 0.0038815736770629883, 0.004009246826171875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 34.0, 154.0, 245.0, 302.0, 182.0, 71.0, 16.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027681791107170284, -0.0002701149496715516, -0.0002634120173752308, -0.00025670905597507954, -0.00025000612367875874, -0.0002433031622786075, -0.00023660021543037146, -0.00022989726858213544, -0.00022319432173389941, -0.0002164913748856634, -0.00020978842803742737, -0.00020308548118919134, -0.0001963825197890401, -0.0001896795874927193, -0.00018297662609256804, -0.00017627367924433202, -0.000169570732396096, -0.00016286778554785997, -0.00015616483869962394, -0.00014946189185138792, -0.0001427589450031519, -0.00013605598360300064, -0.00012935303675476462, -0.0001226500899065286, -0.00011594714305829257, -0.00010924419621005654, -0.00010254124936182052, -9.583829523762688e-05, -8.913534838939086e-05, -8.243240154115483e-05, -7.572944741696119e-05, -6.902650056872517e-05, -6.232355372048914e-05, -5.562060687225312e-05, -4.891765638603829e-05, -4.221470589982346e-05, -3.551175905158743e-05, -2.8808812203351408e-05, -2.2105861717136577e-05, -1.5402911230921745e-05, -8.699964382685721e-06, -1.997015715460293e-06, 4.705932951765135e-06, 1.1408881618990563e-05, 1.811183028621599e-05, 2.4814777134452015e-05, 3.151772762066685e-05, 3.822067810688168e-05, 4.49236249551177e-05, 5.162657180335373e-05, 5.832952228956856e-05, 6.503247277578339e-05, 7.173541962401941e-05, 7.843836647225544e-05, 8.514132059644908e-05, 9.18442674446851e-05, 9.854721429292113e-05, 0.00010525016114115715, 0.00011195310798939317, 0.00011865606211358681, 0.00012535901623778045, 0.00013206194853410125, 0.0001387649099342525, 0.00014546785678248852, 0.00015217080363072455]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 20.0, 14.0, 26.0, 27.0, 29.0, 22.0, 35.0, 35.0, 35.0, 48.0, 56.0, 47.0, 59.0, 45.0, 54.0, 52.0, 43.0, 42.0, 50.0, 38.0, 26.0, 37.0, 31.0, 20.0, 20.0, 16.0, 10.0, 14.0, 6.0, 2.0, 6.0, 5.0, 1.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011771917343139648, -0.00011443905532360077, -0.00011115893721580505, -0.00010787881910800934, -0.00010459870100021362, -0.00010131858289241791, -9.803846478462219e-05, -9.475834667682648e-05, -9.147822856903076e-05, -8.819811046123505e-05, -8.491799235343933e-05, -8.163787424564362e-05, -7.83577561378479e-05, -7.507763803005219e-05, -7.179751992225647e-05, -6.851740181446075e-05, -6.523728370666504e-05, -6.195716559886932e-05, -5.867704749107361e-05, -5.539692938327789e-05, -5.211681127548218e-05, -4.883669316768646e-05, -4.555657505989075e-05, -4.227645695209503e-05, -3.8996338844299316e-05, -3.57162207365036e-05, -3.2436102628707886e-05, -2.915598452091217e-05, -2.5875866413116455e-05, -2.259574830532074e-05, -1.9315630197525024e-05, -1.603551208972931e-05, -1.2755393981933594e-05, -9.475275874137878e-06, -6.195157766342163e-06, -2.9150396585464478e-06, 3.650784492492676e-07, 3.645196557044983e-06, 6.925314664840698e-06, 1.0205432772636414e-05, 1.3485550880432129e-05, 1.6765668988227844e-05, 2.004578709602356e-05, 2.3325905203819275e-05, 2.660602331161499e-05, 2.9886141419410706e-05, 3.316625952720642e-05, 3.6446377635002136e-05, 3.972649574279785e-05, 4.300661385059357e-05, 4.628673195838928e-05, 4.9566850066185e-05, 5.284696817398071e-05, 5.612708628177643e-05, 5.9407204389572144e-05, 6.268732249736786e-05, 6.596744060516357e-05, 6.924755871295929e-05, 7.2527676820755e-05, 7.580779492855072e-05, 7.908791303634644e-05, 8.236803114414215e-05, 8.564814925193787e-05, 8.892826735973358e-05, 9.22083854675293e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 8.0, 3.0, 7.0, 11.0, 11.0, 14.0, 23.0, 22.0, 19.0, 20.0, 29.0, 26.0, 24.0, 30.0, 39.0, 40.0, 42.0, 30.0, 36.0, 41.0, 50.0, 54.0, 43.0, 37.0, 44.0, 25.0, 30.0, 44.0, 20.0, 20.0, 25.0, 22.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93505859375, -3.7998046875, -3.66455078125, -3.529296875, -3.39404296875, -3.2587890625, -3.12353515625, -2.98828125, -2.85302734375, -2.7177734375, -2.58251953125, -2.447265625, -2.31201171875, -2.1767578125, -2.04150390625, -1.90625, -1.77099609375, -1.6357421875, -1.50048828125, -1.365234375, -1.22998046875, -1.0947265625, -0.95947265625, -0.82421875, -0.68896484375, -0.5537109375, -0.41845703125, -0.283203125, -0.14794921875, -0.0126953125, 0.12255859375, 0.2578125, 0.39306640625, 0.5283203125, 0.66357421875, 0.798828125, 0.93408203125, 1.0693359375, 1.20458984375, 1.33984375, 1.47509765625, 1.6103515625, 1.74560546875, 1.880859375, 2.01611328125, 2.1513671875, 2.28662109375, 2.421875, 2.55712890625, 2.6923828125, 2.82763671875, 2.962890625, 3.09814453125, 3.2333984375, 3.36865234375, 3.50390625, 3.63916015625, 3.7744140625, 3.90966796875, 4.044921875, 4.18017578125, 4.3154296875, 4.45068359375, 4.5859375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 2.0, 2.0, 13.0, 3.0, 8.0, 26.0, 20.0, 39.0, 57.0, 76.0, 88.0, 104.0, 149.0, 189.0, 258.0, 351.0, 503.0, 707.0, 1485.0, 5258.0, 28272.0, 287266.0, 658501.0, 51419.0, 8833.0, 2008.0, 821.0, 571.0, 387.0, 292.0, 219.0, 134.0, 122.0, 93.0, 70.0, 48.0, 41.0, 26.0, 22.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.887451171875, -9.54833984375, -9.209228515625, -8.8701171875, -8.531005859375, -8.19189453125, -7.852783203125, -7.513671875, -7.174560546875, -6.83544921875, -6.496337890625, -6.1572265625, -5.818115234375, -5.47900390625, -5.139892578125, -4.80078125, -4.461669921875, -4.12255859375, -3.783447265625, -3.4443359375, -3.105224609375, -2.76611328125, -2.427001953125, -2.087890625, -1.748779296875, -1.40966796875, -1.070556640625, -0.7314453125, -0.392333984375, -0.05322265625, 0.285888671875, 0.625, 0.964111328125, 1.30322265625, 1.642333984375, 1.9814453125, 2.320556640625, 2.65966796875, 2.998779296875, 3.337890625, 3.677001953125, 4.01611328125, 4.355224609375, 4.6943359375, 5.033447265625, 5.37255859375, 5.711669921875, 6.05078125, 6.389892578125, 6.72900390625, 7.068115234375, 7.4072265625, 7.746337890625, 8.08544921875, 8.424560546875, 8.763671875, 9.102783203125, 9.44189453125, 9.781005859375, 10.1201171875, 10.459228515625, 10.79833984375, 11.137451171875, 11.4765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 3.0, 4.0, 7.0, 10.0, 5.0, 12.0, 17.0, 25.0, 32.0, 38.0, 45.0, 56.0, 59.0, 68.0, 91.0, 315.0, 1663.0, 153.0, 72.0, 65.0, 57.0, 37.0, 41.0, 30.0, 33.0, 22.0, 16.0, 17.0, 10.0, 9.0, 11.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.734375, -19.158447265625, -18.58251953125, -18.006591796875, -17.4306640625, -16.854736328125, -16.27880859375, -15.702880859375, -15.126953125, -14.551025390625, -13.97509765625, -13.399169921875, -12.8232421875, -12.247314453125, -11.67138671875, -11.095458984375, -10.51953125, -9.943603515625, -9.36767578125, -8.791748046875, -8.2158203125, -7.639892578125, -7.06396484375, -6.488037109375, -5.912109375, -5.336181640625, -4.76025390625, -4.184326171875, -3.6083984375, -3.032470703125, -2.45654296875, -1.880615234375, -1.3046875, -0.728759765625, -0.15283203125, 0.423095703125, 0.9990234375, 1.574951171875, 2.15087890625, 2.726806640625, 3.302734375, 3.878662109375, 4.45458984375, 5.030517578125, 5.6064453125, 6.182373046875, 6.75830078125, 7.334228515625, 7.91015625, 8.486083984375, 9.06201171875, 9.637939453125, 10.2138671875, 10.789794921875, 11.36572265625, 11.941650390625, 12.517578125, 13.093505859375, 13.66943359375, 14.245361328125, 14.8212890625, 15.397216796875, 15.97314453125, 16.549072265625, 17.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 13.0, 17.0, 28.0, 56.0, 50.0, 85.0, 160.0, 344.0, 1796.0, 2785039.0, 355834.0, 1523.0, 324.0, 157.0, 102.0, 49.0, 38.0, 24.0, 19.0, 9.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.625, -92.3232421875, -89.021484375, -85.7197265625, -82.41796875, -79.1162109375, -75.814453125, -72.5126953125, -69.2109375, -65.9091796875, -62.607421875, -59.3056640625, -56.00390625, -52.7021484375, -49.400390625, -46.0986328125, -42.796875, -39.4951171875, -36.193359375, -32.8916015625, -29.58984375, -26.2880859375, -22.986328125, -19.6845703125, -16.3828125, -13.0810546875, -9.779296875, -6.4775390625, -3.17578125, 0.1259765625, 3.427734375, 6.7294921875, 10.03125, 13.3330078125, 16.634765625, 19.9365234375, 23.23828125, 26.5400390625, 29.841796875, 33.1435546875, 36.4453125, 39.7470703125, 43.048828125, 46.3505859375, 49.65234375, 52.9541015625, 56.255859375, 59.5576171875, 62.859375, 66.1611328125, 69.462890625, 72.7646484375, 76.06640625, 79.3681640625, 82.669921875, 85.9716796875, 89.2734375, 92.5751953125, 95.876953125, 99.1787109375, 102.48046875, 105.7822265625, 109.083984375, 112.3857421875, 115.6875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 57.0, 283.0, 473.0, 155.0, 32.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.85395812988281, -62.91175079345703, -60.969547271728516, -59.027339935302734, -57.08513259887695, -55.14292907714844, -53.200721740722656, -51.258514404296875, -49.316307067871094, -47.37409973144531, -45.4318962097168, -43.489688873291016, -41.547481536865234, -39.60527801513672, -37.66307067871094, -35.720863342285156, -33.77865982055664, -31.836454391479492, -29.89424705505371, -27.952041625976562, -26.00983428955078, -24.067628860473633, -22.125423431396484, -20.183216094970703, -18.241010665893555, -16.298805236816406, -14.356597900390625, -12.414392471313477, -10.472186088562012, -8.529979705810547, -6.587774276733398, -4.645567893981934, -2.703357696533203, -0.7611515522003174, 1.1810545921325684, 3.123260498046875, 5.06546688079834, 7.007673263549805, 8.949878692626953, 10.892085075378418, 12.834291458129883, 14.776497840881348, 16.718704223632812, 18.66090965270996, 20.60311508178711, 22.54532241821289, 24.48752784729004, 26.429733276367188, 28.37194061279297, 30.314146041870117, 32.256351470947266, 34.19855880737305, 36.14076614379883, 38.082969665527344, 40.025177001953125, 41.967384338378906, 43.90959167480469, 45.85179901123047, 47.794002532958984, 49.736209869384766, 51.67841720581055, 53.62062072753906, 55.562828063964844, 57.505035400390625, 59.44723892211914]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 4.0, 12.0, 8.0, 5.0, 15.0, 14.0, 15.0, 17.0, 23.0, 25.0, 20.0, 35.0, 37.0, 38.0, 37.0, 31.0, 37.0, 38.0, 48.0, 41.0, 40.0, 45.0, 38.0, 41.0, 51.0, 40.0, 23.0, 23.0, 24.0, 22.0, 31.0, 20.0, 25.0, 10.0, 8.0, 12.0, 14.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.744325637817383, -28.76934242248535, -27.794361114501953, -26.819377899169922, -25.84439468383789, -24.869413375854492, -23.89443016052246, -22.919448852539062, -21.94446563720703, -20.969482421875, -19.9945011138916, -19.01951789855957, -18.044536590576172, -17.06955337524414, -16.09457015991211, -15.119587898254395, -14.14460563659668, -13.169623374938965, -12.19464111328125, -11.219657897949219, -10.244675636291504, -9.269693374633789, -8.294710159301758, -7.319727897644043, -6.344745635986328, -5.369763374328613, -4.39478063583374, -3.4197981357574463, -2.4448156356811523, -1.4698333740234375, -0.49485063552856445, 0.4801321029663086, 1.4551162719726562, 2.43009877204895, 3.405081272125244, 4.380064010620117, 5.355046272277832, 6.330028533935547, 7.30501127243042, 8.279994010925293, 9.254976272583008, 10.229958534240723, 11.204940795898438, 12.179924011230469, 13.154906272888184, 14.129888534545898, 15.10487174987793, 16.079853057861328, 17.05483627319336, 18.02981948852539, 19.00480079650879, 19.97978401184082, 20.95476531982422, 21.92974853515625, 22.90473175048828, 23.879714965820312, 24.85469627380371, 25.829679489135742, 26.80466079711914, 27.779644012451172, 28.754627227783203, 29.7296085357666, 30.704591751098633, 31.67957305908203, 32.65455627441406]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 6.0, 6.0, 4.0, 6.0, 11.0, 12.0, 13.0, 17.0, 14.0, 19.0, 39.0, 24.0, 27.0, 31.0, 22.0, 46.0, 45.0, 42.0, 49.0, 45.0, 52.0, 49.0, 36.0, 33.0, 41.0, 34.0, 34.0, 27.0, 20.0, 26.0, 25.0, 18.0, 20.0, 19.0, 13.0, 16.0, 16.0, 6.0, 8.0, 8.0, 4.0, 8.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.24755859375, -4.1044921875, -3.96142578125, -3.818359375, -3.67529296875, -3.5322265625, -3.38916015625, -3.24609375, -3.10302734375, -2.9599609375, -2.81689453125, -2.673828125, -2.53076171875, -2.3876953125, -2.24462890625, -2.1015625, -1.95849609375, -1.8154296875, -1.67236328125, -1.529296875, -1.38623046875, -1.2431640625, -1.10009765625, -0.95703125, -0.81396484375, -0.6708984375, -0.52783203125, -0.384765625, -0.24169921875, -0.0986328125, 0.04443359375, 0.1875, 0.33056640625, 0.4736328125, 0.61669921875, 0.759765625, 0.90283203125, 1.0458984375, 1.18896484375, 1.33203125, 1.47509765625, 1.6181640625, 1.76123046875, 1.904296875, 2.04736328125, 2.1904296875, 2.33349609375, 2.4765625, 2.61962890625, 2.7626953125, 2.90576171875, 3.048828125, 3.19189453125, 3.3349609375, 3.47802734375, 3.62109375, 3.76416015625, 3.9072265625, 4.05029296875, 4.193359375, 4.33642578125, 4.4794921875, 4.62255859375, 4.765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 11.0, 12.0, 21.0, 30.0, 38.0, 32.0, 53.0, 66.0, 74.0, 102.0, 119.0, 182.0, 253.0, 381.0, 704.0, 1891.0, 9696.0, 113570.0, 1128531.0, 2375736.0, 515372.0, 39855.0, 4585.0, 1121.0, 559.0, 320.0, 211.0, 184.0, 122.0, 94.0, 71.0, 48.0, 49.0, 45.0, 32.0, 23.0, 16.0, 16.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.37615966796875, -7.1156005859375, -6.85504150390625, -6.594482421875, -6.33392333984375, -6.0733642578125, -5.81280517578125, -5.55224609375, -5.29168701171875, -5.0311279296875, -4.77056884765625, -4.510009765625, -4.24945068359375, -3.9888916015625, -3.72833251953125, -3.4677734375, -3.20721435546875, -2.9466552734375, -2.68609619140625, -2.425537109375, -2.16497802734375, -1.9044189453125, -1.64385986328125, -1.38330078125, -1.12274169921875, -0.8621826171875, -0.60162353515625, -0.341064453125, -0.08050537109375, 0.1800537109375, 0.44061279296875, 0.701171875, 0.96173095703125, 1.2222900390625, 1.48284912109375, 1.743408203125, 2.00396728515625, 2.2645263671875, 2.52508544921875, 2.78564453125, 3.04620361328125, 3.3067626953125, 3.56732177734375, 3.827880859375, 4.08843994140625, 4.3489990234375, 4.60955810546875, 4.8701171875, 5.13067626953125, 5.3912353515625, 5.65179443359375, 5.912353515625, 6.17291259765625, 6.4334716796875, 6.69403076171875, 6.95458984375, 7.21514892578125, 7.4757080078125, 7.73626708984375, 7.996826171875, 8.25738525390625, 8.5179443359375, 8.77850341796875, 9.0390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 19.0, 21.0, 26.0, 41.0, 49.0, 99.0, 107.0, 166.0, 224.0, 327.0, 407.0, 457.0, 444.0, 406.0, 332.0, 236.0, 197.0, 122.0, 96.0, 76.0, 61.0, 34.0, 31.0, 20.0, 17.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53515625, -5.33050537109375, -5.1258544921875, -4.92120361328125, -4.716552734375, -4.51190185546875, -4.3072509765625, -4.10260009765625, -3.89794921875, -3.69329833984375, -3.4886474609375, -3.28399658203125, -3.079345703125, -2.87469482421875, -2.6700439453125, -2.46539306640625, -2.2607421875, -2.05609130859375, -1.8514404296875, -1.64678955078125, -1.442138671875, -1.23748779296875, -1.0328369140625, -0.82818603515625, -0.62353515625, -0.41888427734375, -0.2142333984375, -0.00958251953125, 0.195068359375, 0.39971923828125, 0.6043701171875, 0.80902099609375, 1.013671875, 1.21832275390625, 1.4229736328125, 1.62762451171875, 1.832275390625, 2.03692626953125, 2.2415771484375, 2.44622802734375, 2.65087890625, 2.85552978515625, 3.0601806640625, 3.26483154296875, 3.469482421875, 3.67413330078125, 3.8787841796875, 4.08343505859375, 4.2880859375, 4.49273681640625, 4.6973876953125, 4.90203857421875, 5.106689453125, 5.31134033203125, 5.5159912109375, 5.72064208984375, 5.92529296875, 6.12994384765625, 6.3345947265625, 6.53924560546875, 6.743896484375, 6.94854736328125, 7.1531982421875, 7.35784912109375, 7.5625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 8.0, 18.0, 11.0, 22.0, 28.0, 37.0, 46.0, 62.0, 60.0, 87.0, 141.0, 180.0, 284.0, 431.0, 739.0, 1584.0, 6721.0, 88911.0, 3037941.0, 1020543.0, 29854.0, 3638.0, 1121.0, 569.0, 373.0, 240.0, 148.0, 125.0, 73.0, 61.0, 54.0, 41.0, 27.0, 29.0, 14.0, 14.0, 9.0, 4.0, 4.0, 3.0, 8.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6484375, -15.1566162109375, -14.664794921875, -14.1729736328125, -13.68115234375, -13.1893310546875, -12.697509765625, -12.2056884765625, -11.7138671875, -11.2220458984375, -10.730224609375, -10.2384033203125, -9.74658203125, -9.2547607421875, -8.762939453125, -8.2711181640625, -7.779296875, -7.2874755859375, -6.795654296875, -6.3038330078125, -5.81201171875, -5.3201904296875, -4.828369140625, -4.3365478515625, -3.8447265625, -3.3529052734375, -2.861083984375, -2.3692626953125, -1.87744140625, -1.3856201171875, -0.893798828125, -0.4019775390625, 0.08984375, 0.5816650390625, 1.073486328125, 1.5653076171875, 2.05712890625, 2.5489501953125, 3.040771484375, 3.5325927734375, 4.0244140625, 4.5162353515625, 5.008056640625, 5.4998779296875, 5.99169921875, 6.4835205078125, 6.975341796875, 7.4671630859375, 7.958984375, 8.4508056640625, 8.942626953125, 9.4344482421875, 9.92626953125, 10.4180908203125, 10.909912109375, 11.4017333984375, 11.8935546875, 12.3853759765625, 12.877197265625, 13.3690185546875, 13.86083984375, 14.3526611328125, 14.844482421875, 15.3363037109375, 15.828125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 56.0, 401.0, 436.0, 111.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4868392944336, -84.95323181152344, -81.41963195800781, -77.88602447509766, -74.35242462158203, -70.81881713867188, -67.28521728515625, -63.751609802246094, -60.2180061340332, -56.68440246582031, -53.15079879760742, -49.61719512939453, -46.083587646484375, -42.54998779296875, -39.016380310058594, -35.4827766418457, -31.949172973632812, -28.415569305419922, -24.88196563720703, -21.348360061645508, -17.814756393432617, -14.281152725219727, -10.747547149658203, -7.2139434814453125, -3.680339813232422, -0.14673566818237305, 3.386868476867676, 6.920473098754883, 10.454076766967773, 13.987680435180664, 17.521286010742188, 21.054889678955078, 24.5885009765625, 28.12210464477539, 31.65570831298828, 35.18931579589844, 38.72291564941406, 42.25652313232422, 45.79012680053711, 49.32373046875, 52.85733413696289, 56.39093780517578, 59.92454147338867, 63.45814514160156, 66.99175262451172, 70.52535247802734, 74.0589599609375, 77.59255981445312, 81.12616729736328, 84.65977478027344, 88.19337463378906, 91.72698211669922, 95.26058197021484, 98.794189453125, 102.32778930664062, 105.86139678955078, 109.39500427246094, 112.9286117553711, 116.46221160888672, 119.99581909179688, 123.5294189453125, 127.06302642822266, 130.5966339111328, 134.13023376464844, 137.66383361816406]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 12.0, 7.0, 4.0, 8.0, 13.0, 10.0, 12.0, 14.0, 23.0, 16.0, 26.0, 24.0, 21.0, 20.0, 29.0, 33.0, 40.0, 34.0, 45.0, 37.0, 36.0, 42.0, 33.0, 42.0, 37.0, 38.0, 41.0, 36.0, 32.0, 34.0, 39.0, 19.0, 28.0, 10.0, 14.0, 22.0, 13.0, 10.0, 9.0, 7.0, 3.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.181427001953125, -20.560644149780273, -19.93985939025879, -19.319076538085938, -18.698291778564453, -18.0775089263916, -17.456724166870117, -16.835941314697266, -16.21515655517578, -15.594372749328613, -14.973588943481445, -14.352805137634277, -13.73202133178711, -13.111237525939941, -12.490453720092773, -11.869670867919922, -11.248887062072754, -10.628103256225586, -10.007319450378418, -9.38653564453125, -8.765751838684082, -8.144968032836914, -7.524184703826904, -6.903400897979736, -6.282617092132568, -5.6618332862854, -5.041049480438232, -4.420266151428223, -3.7994821071624756, -3.1786983013153076, -2.5579147338867188, -1.9371309280395508, -1.3163471221923828, -0.6955633759498596, -0.07477962970733643, 0.546004056930542, 1.16678786277771, 1.787571668624878, 2.408355236053467, 3.0291390419006348, 3.6499228477478027, 4.270706653594971, 4.891490459442139, 5.512273788452148, 6.133057594299316, 6.753841400146484, 7.374625205993652, 7.99540901184082, 8.616192817687988, 9.236976623535156, 9.857760429382324, 10.478544235229492, 11.09932804107666, 11.720111846923828, 12.34089469909668, 12.961679458618164, 13.582462310791016, 14.203246116638184, 14.824029922485352, 15.44481372833252, 16.065597534179688, 16.68638038635254, 17.307165145874023, 17.927947998046875, 18.54873275756836]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 10.0, 12.0, 13.0, 12.0, 14.0, 18.0, 15.0, 20.0, 22.0, 28.0, 25.0, 25.0, 31.0, 40.0, 41.0, 39.0, 44.0, 43.0, 46.0, 51.0, 50.0, 31.0, 38.0, 29.0, 40.0, 23.0, 31.0, 20.0, 19.0, 22.0, 22.0, 12.0, 16.0, 13.0, 6.0, 12.0, 10.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.998046875, -3.866058349609375, -3.73406982421875, -3.602081298828125, -3.4700927734375, -3.338104248046875, -3.20611572265625, -3.074127197265625, -2.942138671875, -2.810150146484375, -2.67816162109375, -2.546173095703125, -2.4141845703125, -2.282196044921875, -2.15020751953125, -2.018218994140625, -1.88623046875, -1.754241943359375, -1.62225341796875, -1.490264892578125, -1.3582763671875, -1.226287841796875, -1.09429931640625, -0.962310791015625, -0.830322265625, -0.698333740234375, -0.56634521484375, -0.434356689453125, -0.3023681640625, -0.170379638671875, -0.03839111328125, 0.093597412109375, 0.2255859375, 0.357574462890625, 0.48956298828125, 0.621551513671875, 0.7535400390625, 0.885528564453125, 1.01751708984375, 1.149505615234375, 1.281494140625, 1.413482666015625, 1.54547119140625, 1.677459716796875, 1.8094482421875, 1.941436767578125, 2.07342529296875, 2.205413818359375, 2.33740234375, 2.469390869140625, 2.60137939453125, 2.733367919921875, 2.8653564453125, 2.997344970703125, 3.12933349609375, 3.261322021484375, 3.393310546875, 3.525299072265625, 3.65728759765625, 3.789276123046875, 3.9212646484375, 4.053253173828125, 4.18524169921875, 4.317230224609375, 4.44921875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 10.0, 15.0, 10.0, 18.0, 28.0, 62.0, 65.0, 95.0, 116.0, 193.0, 272.0, 386.0, 555.0, 808.0, 1175.0, 1706.0, 2307.0, 3343.0, 4906.0, 6985.0, 10183.0, 14410.0, 21493.0, 32622.0, 51399.0, 88973.0, 173683.0, 273284.0, 144206.0, 77320.0, 45575.0, 29187.0, 19608.0, 13146.0, 9155.0, 6410.0, 4516.0, 3137.0, 2180.0, 1536.0, 1033.0, 763.0, 527.0, 369.0, 263.0, 153.0, 120.0, 75.0, 64.0, 36.0, 27.0, 17.0, 13.0, 7.0, 6.0, 7.0, 2.0], "bins": [-0.7099609375, -0.6893081665039062, -0.6686553955078125, -0.6480026245117188, -0.627349853515625, -0.6066970825195312, -0.5860443115234375, -0.5653915405273438, -0.54473876953125, -0.5240859985351562, -0.5034332275390625, -0.48278045654296875, -0.462127685546875, -0.44147491455078125, -0.4208221435546875, -0.40016937255859375, -0.3795166015625, -0.35886383056640625, -0.3382110595703125, -0.31755828857421875, -0.296905517578125, -0.27625274658203125, -0.2555999755859375, -0.23494720458984375, -0.21429443359375, -0.19364166259765625, -0.1729888916015625, -0.15233612060546875, -0.131683349609375, -0.11103057861328125, -0.0903778076171875, -0.06972503662109375, -0.049072265625, -0.02841949462890625, -0.0077667236328125, 0.01288604736328125, 0.033538818359375, 0.05419158935546875, 0.0748443603515625, 0.09549713134765625, 0.11614990234375, 0.13680267333984375, 0.1574554443359375, 0.17810821533203125, 0.198760986328125, 0.21941375732421875, 0.2400665283203125, 0.26071929931640625, 0.2813720703125, 0.30202484130859375, 0.3226776123046875, 0.34333038330078125, 0.363983154296875, 0.38463592529296875, 0.4052886962890625, 0.42594146728515625, 0.44659423828125, 0.46724700927734375, 0.4878997802734375, 0.5085525512695312, 0.529205322265625, 0.5498580932617188, 0.5705108642578125, 0.5911636352539062, 0.61181640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 6.0, 10.0, 7.0, 13.0, 15.0, 15.0, 16.0, 15.0, 21.0, 36.0, 24.0, 27.0, 32.0, 21.0, 28.0, 29.0, 39.0, 39.0, 43.0, 1066.0, 48.0, 41.0, 40.0, 35.0, 33.0, 37.0, 40.0, 24.0, 34.0, 24.0, 26.0, 17.0, 15.0, 15.0, 17.0, 10.0, 13.0, 7.0, 5.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.65234375, -2.57147216796875, -2.4906005859375, -2.40972900390625, -2.328857421875, -2.24798583984375, -2.1671142578125, -2.08624267578125, -2.00537109375, -1.92449951171875, -1.8436279296875, -1.76275634765625, -1.681884765625, -1.60101318359375, -1.5201416015625, -1.43927001953125, -1.3583984375, -1.27752685546875, -1.1966552734375, -1.11578369140625, -1.034912109375, -0.95404052734375, -0.8731689453125, -0.79229736328125, -0.71142578125, -0.63055419921875, -0.5496826171875, -0.46881103515625, -0.387939453125, -0.30706787109375, -0.2261962890625, -0.14532470703125, -0.064453125, 0.01641845703125, 0.0972900390625, 0.17816162109375, 0.259033203125, 0.33990478515625, 0.4207763671875, 0.50164794921875, 0.58251953125, 0.66339111328125, 0.7442626953125, 0.82513427734375, 0.906005859375, 0.98687744140625, 1.0677490234375, 1.14862060546875, 1.2294921875, 1.31036376953125, 1.3912353515625, 1.47210693359375, 1.552978515625, 1.63385009765625, 1.7147216796875, 1.79559326171875, 1.87646484375, 1.95733642578125, 2.0382080078125, 2.11907958984375, 2.199951171875, 2.28082275390625, 2.3616943359375, 2.44256591796875, 2.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 5.0, 5.0, 11.0, 24.0, 33.0, 48.0, 70.0, 95.0, 155.0, 196.0, 304.0, 406.0, 589.0, 830.0, 1164.0, 1562.0, 2259.0, 3053.0, 4276.0, 5930.0, 8246.0, 11620.0, 16549.0, 23908.0, 34651.0, 51949.0, 83824.0, 156674.0, 1299881.0, 147336.0, 79667.0, 50167.0, 33188.0, 22601.0, 15993.0, 11285.0, 8066.0, 5751.0, 4084.0, 3018.0, 2191.0, 1529.0, 1165.0, 782.0, 565.0, 440.0, 301.0, 202.0, 161.0, 114.0, 77.0, 41.0, 27.0, 28.0, 17.0, 9.0, 10.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.54638671875, -0.5290145874023438, -0.5116424560546875, -0.49427032470703125, -0.476898193359375, -0.45952606201171875, -0.4421539306640625, -0.42478179931640625, -0.40740966796875, -0.39003753662109375, -0.3726654052734375, -0.35529327392578125, -0.337921142578125, -0.32054901123046875, -0.3031768798828125, -0.28580474853515625, -0.2684326171875, -0.25106048583984375, -0.2336883544921875, -0.21631622314453125, -0.198944091796875, -0.18157196044921875, -0.1641998291015625, -0.14682769775390625, -0.12945556640625, -0.11208343505859375, -0.0947113037109375, -0.07733917236328125, -0.059967041015625, -0.04259490966796875, -0.0252227783203125, -0.00785064697265625, 0.009521484375, 0.02689361572265625, 0.0442657470703125, 0.06163787841796875, 0.079010009765625, 0.09638214111328125, 0.1137542724609375, 0.13112640380859375, 0.14849853515625, 0.16587066650390625, 0.1832427978515625, 0.20061492919921875, 0.217987060546875, 0.23535919189453125, 0.2527313232421875, 0.27010345458984375, 0.2874755859375, 0.30484771728515625, 0.3222198486328125, 0.33959197998046875, 0.356964111328125, 0.37433624267578125, 0.3917083740234375, 0.40908050537109375, 0.42645263671875, 0.44382476806640625, 0.4611968994140625, 0.47856903076171875, 0.495941162109375, 0.5133132934570312, 0.5306854248046875, 0.5480575561523438, 0.5654296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 6.0, 9.0, 11.0, 16.0, 6.0, 18.0, 12.0, 31.0, 28.0, 35.0, 32.0, 46.0, 63.0, 47.0, 61.0, 85.0, 79.0, 64.0, 72.0, 41.0, 44.0, 37.0, 33.0, 22.0, 12.0, 20.0, 17.0, 9.0, 8.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020456314086914062, -0.00019867345690727234, -0.00019278377294540405, -0.00018689408898353577, -0.00018100440502166748, -0.0001751147210597992, -0.0001692250370979309, -0.00016333535313606262, -0.00015744566917419434, -0.00015155598521232605, -0.00014566630125045776, -0.00013977661728858948, -0.0001338869333267212, -0.0001279972493648529, -0.00012210756540298462, -0.00011621788144111633, -0.00011032819747924805, -0.00010443851351737976, -9.854882955551147e-05, -9.265914559364319e-05, -8.67694616317749e-05, -8.087977766990662e-05, -7.499009370803833e-05, -6.910040974617004e-05, -6.321072578430176e-05, -5.732104182243347e-05, -5.1431357860565186e-05, -4.55416738986969e-05, -3.965198993682861e-05, -3.376230597496033e-05, -2.787262201309204e-05, -2.1982938051223755e-05, -1.609325408935547e-05, -1.0203570127487183e-05, -4.3138861656188965e-06, 1.5757977962493896e-06, 7.465481758117676e-06, 1.3355165719985962e-05, 1.9244849681854248e-05, 2.5134533643722534e-05, 3.102421760559082e-05, 3.6913901567459106e-05, 4.280358552932739e-05, 4.869326949119568e-05, 5.4582953453063965e-05, 6.047263741493225e-05, 6.636232137680054e-05, 7.225200533866882e-05, 7.814168930053711e-05, 8.40313732624054e-05, 8.992105722427368e-05, 9.581074118614197e-05, 0.00010170042514801025, 0.00010759010910987854, 0.00011347979307174683, 0.00011936947703361511, 0.0001252591609954834, 0.00013114884495735168, 0.00013703852891921997, 0.00014292821288108826, 0.00014881789684295654, 0.00015470758080482483, 0.00016059726476669312, 0.0001664869487285614, 0.0001723766326904297]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 8.0, 11.0, 12.0, 21.0, 33.0, 34.0, 34.0, 44.0, 76.0, 102.0, 128.0, 169.0, 326.0, 570.0, 1350.0, 642215.0, 400605.0, 1194.0, 552.0, 284.0, 192.0, 134.0, 104.0, 79.0, 48.0, 33.0, 40.0, 25.0, 22.0, 13.0, 17.0, 15.0, 11.0, 12.0, 6.0, 9.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032215118408203125, -0.0031140148639678955, -0.0030065178871154785, -0.0028990209102630615, -0.0027915239334106445, -0.0026840269565582275, -0.0025765299797058105, -0.0024690330028533936, -0.0023615360260009766, -0.0022540390491485596, -0.0021465420722961426, -0.0020390450954437256, -0.0019315481185913086, -0.0018240511417388916, -0.0017165541648864746, -0.0016090571880340576, -0.0015015602111816406, -0.0013940632343292236, -0.0012865662574768066, -0.0011790692806243896, -0.0010715723037719727, -0.0009640753269195557, -0.0008565783500671387, -0.0007490813732147217, -0.0006415843963623047, -0.0005340874195098877, -0.0004265904426574707, -0.0003190934658050537, -0.00021159648895263672, -0.00010409951210021973, 3.3974647521972656e-06, 0.00011089444160461426, 0.00021839141845703125, 0.00032588839530944824, 0.00043338537216186523, 0.0005408823490142822, 0.0006483793258666992, 0.0007558763027191162, 0.0008633732795715332, 0.0009708702564239502, 0.0010783672332763672, 0.0011858642101287842, 0.0012933611869812012, 0.0014008581638336182, 0.0015083551406860352, 0.0016158521175384521, 0.0017233490943908691, 0.0018308460712432861, 0.0019383430480957031, 0.00204584002494812, 0.002153337001800537, 0.002260833978652954, 0.002368330955505371, 0.002475827932357788, 0.002583324909210205, 0.002690821886062622, 0.002798318862915039, 0.002905815839767456, 0.003013312816619873, 0.00312080979347229, 0.003228306770324707, 0.003335803747177124, 0.003443300724029541, 0.003550797700881958, 0.003658294677734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 14.0, 402.0, 562.0, 32.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0011356903705745935, -0.0011161316651850939, -0.0010965729597955942, -0.0010770141379907727, -0.001057455432601273, -0.0010378967272117734, -0.0010183380218222737, -0.0009987792000174522, -0.0009792204946279526, -0.0009596617892384529, -0.0009401030256412923, -0.0009205443202517927, -0.0009009855566546321, -0.0008814268512651324, -0.0008618680876679718, -0.0008423093822784722, -0.0008227506186813116, -0.0008031919132918119, -0.0007836331496946514, -0.0007640744443051517, -0.0007445156807079911, -0.0007249569753184915, -0.0007053982117213309, -0.0006858395063318312, -0.0006662808009423316, -0.0006467220955528319, -0.0006271633319556713, -0.0006076046265661716, -0.0005880458629690111, -0.0005684871575795114, -0.0005489283939823508, -0.0005293696885928512, -0.0005098109249956906, -0.0004902522196061909, -0.00047069345600903034, -0.0004511347215157002, -0.0004315759870223701, -0.00041201725252904, -0.00039245851803570986, -0.0003728998126462102, -0.00035334107815288007, -0.00033378234365954995, -0.00031422360916621983, -0.0002946648746728897, -0.0002751061401795596, -0.00025554740568622947, -0.00023598868574481457, -0.00021642995125148445, -0.00019687121675815433, -0.0001773124822648242, -0.0001577537477714941, -0.0001381950278300792, -0.00011863628606079146, -9.907755156746134e-05, -7.951882435008883e-05, -5.9960089856758714e-05, -4.040135536342859e-05, -2.0842622689087875e-05, -1.2838900147471577e-06, 1.8274840840604156e-05, 3.783357533393428e-05, 5.73923098272644e-05, 7.69510370446369e-05, 9.650977153796703e-05, 0.00011606850603129715]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 2.0, 10.0, 8.0, 14.0, 14.0, 10.0, 14.0, 24.0, 17.0, 29.0, 14.0, 39.0, 35.0, 27.0, 28.0, 32.0, 44.0, 44.0, 37.0, 31.0, 34.0, 39.0, 43.0, 28.0, 41.0, 26.0, 41.0, 23.0, 38.0, 28.0, 16.0, 21.0, 21.0, 24.0, 14.0, 19.0, 11.0, 10.0, 12.0, 11.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.445978164672852e-05, -8.176174014806747e-05, -7.906369864940643e-05, -7.636565715074539e-05, -7.366761565208435e-05, -7.096957415342331e-05, -6.827153265476227e-05, -6.557349115610123e-05, -6.287544965744019e-05, -6.0177408158779144e-05, -5.74793666601181e-05, -5.478132516145706e-05, -5.208328366279602e-05, -4.938524216413498e-05, -4.668720066547394e-05, -4.39891591668129e-05, -4.1291117668151855e-05, -3.8593076169490814e-05, -3.589503467082977e-05, -3.319699317216873e-05, -3.049895167350769e-05, -2.780091017484665e-05, -2.5102868676185608e-05, -2.2404827177524567e-05, -1.9706785678863525e-05, -1.7008744180202484e-05, -1.4310702681541443e-05, -1.1612661182880402e-05, -8.91461968421936e-06, -6.216578185558319e-06, -3.518536686897278e-06, -8.204951882362366e-07, 1.8775463104248047e-06, 4.575587809085846e-06, 7.273629307746887e-06, 9.971670806407928e-06, 1.266971230506897e-05, 1.536775380373001e-05, 1.8065795302391052e-05, 2.0763836801052094e-05, 2.3461878299713135e-05, 2.6159919798374176e-05, 2.8857961297035217e-05, 3.155600279569626e-05, 3.42540442943573e-05, 3.695208579301834e-05, 3.965012729167938e-05, 4.2348168790340424e-05, 4.5046210289001465e-05, 4.7744251787662506e-05, 5.044229328632355e-05, 5.314033478498459e-05, 5.583837628364563e-05, 5.853641778230667e-05, 6.123445928096771e-05, 6.393250077962875e-05, 6.66305422782898e-05, 6.932858377695084e-05, 7.202662527561188e-05, 7.472466677427292e-05, 7.742270827293396e-05, 8.0120749771595e-05, 8.281879127025604e-05, 8.551683276891708e-05, 8.821487426757812e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 10.0, 12.0, 13.0, 12.0, 14.0, 18.0, 15.0, 20.0, 22.0, 28.0, 25.0, 25.0, 31.0, 40.0, 41.0, 39.0, 44.0, 43.0, 46.0, 51.0, 50.0, 31.0, 38.0, 29.0, 40.0, 23.0, 31.0, 20.0, 19.0, 22.0, 22.0, 12.0, 16.0, 13.0, 6.0, 12.0, 10.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.998046875, -3.866058349609375, -3.73406982421875, -3.602081298828125, -3.4700927734375, -3.338104248046875, -3.20611572265625, -3.074127197265625, -2.942138671875, -2.810150146484375, -2.67816162109375, -2.546173095703125, -2.4141845703125, -2.282196044921875, -2.15020751953125, -2.018218994140625, -1.88623046875, -1.754241943359375, -1.62225341796875, -1.490264892578125, -1.3582763671875, -1.226287841796875, -1.09429931640625, -0.962310791015625, -0.830322265625, -0.698333740234375, -0.56634521484375, -0.434356689453125, -0.3023681640625, -0.170379638671875, -0.03839111328125, 0.093597412109375, 0.2255859375, 0.357574462890625, 0.48956298828125, 0.621551513671875, 0.7535400390625, 0.885528564453125, 1.01751708984375, 1.149505615234375, 1.281494140625, 1.413482666015625, 1.54547119140625, 1.677459716796875, 1.8094482421875, 1.941436767578125, 2.07342529296875, 2.205413818359375, 2.33740234375, 2.469390869140625, 2.60137939453125, 2.733367919921875, 2.8653564453125, 2.997344970703125, 3.12933349609375, 3.261322021484375, 3.393310546875, 3.525299072265625, 3.65728759765625, 3.789276123046875, 3.9212646484375, 4.053253173828125, 4.18524169921875, 4.317230224609375, 4.44921875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 6.0, 16.0, 16.0, 27.0, 38.0, 42.0, 46.0, 73.0, 88.0, 119.0, 166.0, 261.0, 383.0, 617.0, 1319.0, 2698.0, 6302.0, 15533.0, 39812.0, 104766.0, 293639.0, 360212.0, 136816.0, 50866.0, 19676.0, 7780.0, 3447.0, 1536.0, 803.0, 467.0, 256.0, 189.0, 137.0, 102.0, 74.0, 46.0, 39.0, 37.0, 29.0, 18.0, 13.0, 7.0, 10.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.171875, -5.0057373046875, -4.839599609375, -4.6734619140625, -4.50732421875, -4.3411865234375, -4.175048828125, -4.0089111328125, -3.8427734375, -3.6766357421875, -3.510498046875, -3.3443603515625, -3.17822265625, -3.0120849609375, -2.845947265625, -2.6798095703125, -2.513671875, -2.3475341796875, -2.181396484375, -2.0152587890625, -1.84912109375, -1.6829833984375, -1.516845703125, -1.3507080078125, -1.1845703125, -1.0184326171875, -0.852294921875, -0.6861572265625, -0.52001953125, -0.3538818359375, -0.187744140625, -0.0216064453125, 0.14453125, 0.3106689453125, 0.476806640625, 0.6429443359375, 0.80908203125, 0.9752197265625, 1.141357421875, 1.3074951171875, 1.4736328125, 1.6397705078125, 1.805908203125, 1.9720458984375, 2.13818359375, 2.3043212890625, 2.470458984375, 2.6365966796875, 2.802734375, 2.9688720703125, 3.135009765625, 3.3011474609375, 3.46728515625, 3.6334228515625, 3.799560546875, 3.9656982421875, 4.1318359375, 4.2979736328125, 4.464111328125, 4.6302490234375, 4.79638671875, 4.9625244140625, 5.128662109375, 5.2947998046875, 5.4609375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 12.0, 8.0, 17.0, 15.0, 34.0, 23.0, 25.0, 34.0, 28.0, 33.0, 54.0, 59.0, 64.0, 91.0, 244.0, 1514.0, 264.0, 127.0, 73.0, 56.0, 42.0, 31.0, 36.0, 42.0, 25.0, 16.0, 23.0, 11.0, 8.0, 7.0, 4.0, 9.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.6475830078125, -11.193603515625, -10.7396240234375, -10.28564453125, -9.8316650390625, -9.377685546875, -8.9237060546875, -8.4697265625, -8.0157470703125, -7.561767578125, -7.1077880859375, -6.65380859375, -6.1998291015625, -5.745849609375, -5.2918701171875, -4.837890625, -4.3839111328125, -3.929931640625, -3.4759521484375, -3.02197265625, -2.5679931640625, -2.114013671875, -1.6600341796875, -1.2060546875, -0.7520751953125, -0.298095703125, 0.1558837890625, 0.60986328125, 1.0638427734375, 1.517822265625, 1.9718017578125, 2.42578125, 2.8797607421875, 3.333740234375, 3.7877197265625, 4.24169921875, 4.6956787109375, 5.149658203125, 5.6036376953125, 6.0576171875, 6.5115966796875, 6.965576171875, 7.4195556640625, 7.87353515625, 8.3275146484375, 8.781494140625, 9.2354736328125, 9.689453125, 10.1434326171875, 10.597412109375, 11.0513916015625, 11.50537109375, 11.9593505859375, 12.413330078125, 12.8673095703125, 13.3212890625, 13.7752685546875, 14.229248046875, 14.6832275390625, 15.13720703125, 15.5911865234375, 16.045166015625, 16.4991455078125, 16.953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 7.0, 14.0, 17.0, 21.0, 27.0, 34.0, 54.0, 92.0, 127.0, 217.0, 349.0, 636.0, 1489.0, 24383.0, 2959476.0, 153736.0, 2895.0, 881.0, 425.0, 275.0, 184.0, 119.0, 73.0, 43.0, 27.0, 23.0, 10.0, 12.0, 7.0, 12.0, 9.0, 2.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.265625, -28.39697265625, -27.5283203125, -26.65966796875, -25.791015625, -24.92236328125, -24.0537109375, -23.18505859375, -22.31640625, -21.44775390625, -20.5791015625, -19.71044921875, -18.841796875, -17.97314453125, -17.1044921875, -16.23583984375, -15.3671875, -14.49853515625, -13.6298828125, -12.76123046875, -11.892578125, -11.02392578125, -10.1552734375, -9.28662109375, -8.41796875, -7.54931640625, -6.6806640625, -5.81201171875, -4.943359375, -4.07470703125, -3.2060546875, -2.33740234375, -1.46875, -0.60009765625, 0.2685546875, 1.13720703125, 2.005859375, 2.87451171875, 3.7431640625, 4.61181640625, 5.48046875, 6.34912109375, 7.2177734375, 8.08642578125, 8.955078125, 9.82373046875, 10.6923828125, 11.56103515625, 12.4296875, 13.29833984375, 14.1669921875, 15.03564453125, 15.904296875, 16.77294921875, 17.6416015625, 18.51025390625, 19.37890625, 20.24755859375, 21.1162109375, 21.98486328125, 22.853515625, 23.72216796875, 24.5908203125, 25.45947265625, 26.328125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 22.0, 102.0, 259.0, 361.0, 198.0, 52.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.3653564453125, -27.031261444091797, -25.69716453552246, -24.363067626953125, -23.028972625732422, -21.69487762451172, -20.360780715942383, -19.026683807373047, -17.692588806152344, -16.35849380493164, -15.024396896362305, -13.690300941467285, -12.356204986572266, -11.022109031677246, -9.688013076782227, -8.353917121887207, -7.0198211669921875, -5.685725212097168, -4.351629257202148, -3.017533302307129, -1.6834373474121094, -0.34934139251708984, 0.9847545623779297, 2.318850517272949, 3.6529464721679688, 4.987042427062988, 6.321138381958008, 7.655234336853027, 8.989330291748047, 10.323426246643066, 11.657522201538086, 12.991618156433105, 14.32571029663086, 15.659806251525879, 16.9939022064209, 18.327999114990234, 19.662094116210938, 20.99618911743164, 22.330286026000977, 23.664382934570312, 24.998477935791016, 26.33257293701172, 27.666669845581055, 29.00076675415039, 30.334861755371094, 31.668956756591797, 33.0030517578125, 34.33715057373047, 35.67124557495117, 37.005340576171875, 38.339439392089844, 39.67353439331055, 41.00762939453125, 42.34172439575195, 43.675819396972656, 45.009918212890625, 46.34401321411133, 47.67810821533203, 49.01220703125, 50.3463020324707, 51.680397033691406, 53.01449203491211, 54.34858703613281, 55.68268585205078, 57.016780853271484]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 10.0, 9.0, 13.0, 12.0, 19.0, 21.0, 25.0, 30.0, 26.0, 24.0, 25.0, 34.0, 34.0, 55.0, 29.0, 27.0, 44.0, 42.0, 41.0, 44.0, 44.0, 34.0, 32.0, 32.0, 23.0, 33.0, 28.0, 17.0, 22.0, 16.0, 17.0, 14.0, 17.0, 19.0, 12.0, 12.0, 6.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.375974655151367, -25.584087371826172, -24.79220199584961, -24.000316619873047, -23.20842933654785, -22.416542053222656, -21.624656677246094, -20.83277130126953, -20.040884017944336, -19.24899673461914, -18.457111358642578, -17.665225982666016, -16.87333869934082, -16.081451416015625, -15.289566040039062, -14.497679710388184, -13.705793380737305, -12.913907051086426, -12.122020721435547, -11.330134391784668, -10.538248062133789, -9.74636173248291, -8.954475402832031, -8.162589073181152, -7.370702743530273, -6.5788164138793945, -5.786930084228516, -4.995043754577637, -4.203157424926758, -3.411271095275879, -2.619384765625, -1.827498435974121, -1.035614013671875, -0.2437276840209961, 0.5481586456298828, 1.3400449752807617, 2.1319313049316406, 2.9238176345825195, 3.7157039642333984, 4.507590293884277, 5.299476623535156, 6.091362953186035, 6.883249282836914, 7.675135612487793, 8.467021942138672, 9.25890827178955, 10.05079460144043, 10.842680931091309, 11.634567260742188, 12.426453590393066, 13.218339920043945, 14.010226249694824, 14.802112579345703, 15.593998908996582, 16.38588523864746, 17.177772521972656, 17.96965789794922, 18.76154327392578, 19.553430557250977, 20.345317840576172, 21.137203216552734, 21.929088592529297, 22.720975875854492, 23.512863159179688, 24.30474853515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 17.0, 13.0, 19.0, 14.0, 17.0, 21.0, 18.0, 26.0, 23.0, 24.0, 39.0, 39.0, 46.0, 49.0, 40.0, 51.0, 47.0, 42.0, 41.0, 34.0, 34.0, 30.0, 34.0, 32.0, 27.0, 20.0, 23.0, 22.0, 17.0, 16.0, 17.0, 17.0, 4.0, 8.0, 11.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.873779296875, -3.73974609375, -3.605712890625, -3.4716796875, -3.337646484375, -3.20361328125, -3.069580078125, -2.935546875, -2.801513671875, -2.66748046875, -2.533447265625, -2.3994140625, -2.265380859375, -2.13134765625, -1.997314453125, -1.86328125, -1.729248046875, -1.59521484375, -1.461181640625, -1.3271484375, -1.193115234375, -1.05908203125, -0.925048828125, -0.791015625, -0.656982421875, -0.52294921875, -0.388916015625, -0.2548828125, -0.120849609375, 0.01318359375, 0.147216796875, 0.28125, 0.415283203125, 0.54931640625, 0.683349609375, 0.8173828125, 0.951416015625, 1.08544921875, 1.219482421875, 1.353515625, 1.487548828125, 1.62158203125, 1.755615234375, 1.8896484375, 2.023681640625, 2.15771484375, 2.291748046875, 2.42578125, 2.559814453125, 2.69384765625, 2.827880859375, 2.9619140625, 3.095947265625, 3.22998046875, 3.364013671875, 3.498046875, 3.632080078125, 3.76611328125, 3.900146484375, 4.0341796875, 4.168212890625, 4.30224609375, 4.436279296875, 4.5703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 6.0, 5.0, 8.0, 5.0, 10.0, 8.0, 14.0, 18.0, 26.0, 37.0, 40.0, 65.0, 114.0, 180.0, 349.0, 854.0, 3003.0, 23423.0, 317797.0, 2213932.0, 1476141.0, 143437.0, 11528.0, 1891.0, 614.0, 279.0, 135.0, 89.0, 65.0, 40.0, 22.0, 20.0, 29.0, 17.0, 19.0, 9.0, 7.0, 7.0, 4.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.734375, -9.46282958984375, -9.1912841796875, -8.91973876953125, -8.648193359375, -8.37664794921875, -8.1051025390625, -7.83355712890625, -7.56201171875, -7.29046630859375, -7.0189208984375, -6.74737548828125, -6.475830078125, -6.20428466796875, -5.9327392578125, -5.66119384765625, -5.3896484375, -5.11810302734375, -4.8465576171875, -4.57501220703125, -4.303466796875, -4.03192138671875, -3.7603759765625, -3.48883056640625, -3.21728515625, -2.94573974609375, -2.6741943359375, -2.40264892578125, -2.131103515625, -1.85955810546875, -1.5880126953125, -1.31646728515625, -1.044921875, -0.77337646484375, -0.5018310546875, -0.23028564453125, 0.041259765625, 0.31280517578125, 0.5843505859375, 0.85589599609375, 1.12744140625, 1.39898681640625, 1.6705322265625, 1.94207763671875, 2.213623046875, 2.48516845703125, 2.7567138671875, 3.02825927734375, 3.2998046875, 3.57135009765625, 3.8428955078125, 4.11444091796875, 4.385986328125, 4.65753173828125, 4.9290771484375, 5.20062255859375, 5.47216796875, 5.74371337890625, 6.0152587890625, 6.28680419921875, 6.558349609375, 6.82989501953125, 7.1014404296875, 7.37298583984375, 7.64453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 7.0, 5.0, 9.0, 12.0, 16.0, 26.0, 36.0, 58.0, 68.0, 89.0, 143.0, 193.0, 311.0, 387.0, 521.0, 501.0, 453.0, 372.0, 262.0, 187.0, 139.0, 79.0, 57.0, 44.0, 27.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.81640625, -7.6064453125, -7.396484375, -7.1865234375, -6.9765625, -6.7666015625, -6.556640625, -6.3466796875, -6.13671875, -5.9267578125, -5.716796875, -5.5068359375, -5.296875, -5.0869140625, -4.876953125, -4.6669921875, -4.45703125, -4.2470703125, -4.037109375, -3.8271484375, -3.6171875, -3.4072265625, -3.197265625, -2.9873046875, -2.77734375, -2.5673828125, -2.357421875, -2.1474609375, -1.9375, -1.7275390625, -1.517578125, -1.3076171875, -1.09765625, -0.8876953125, -0.677734375, -0.4677734375, -0.2578125, -0.0478515625, 0.162109375, 0.3720703125, 0.58203125, 0.7919921875, 1.001953125, 1.2119140625, 1.421875, 1.6318359375, 1.841796875, 2.0517578125, 2.26171875, 2.4716796875, 2.681640625, 2.8916015625, 3.1015625, 3.3115234375, 3.521484375, 3.7314453125, 3.94140625, 4.1513671875, 4.361328125, 4.5712890625, 4.78125, 4.9912109375, 5.201171875, 5.4111328125, 5.62109375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 15.0, 12.0, 15.0, 20.0, 19.0, 31.0, 52.0, 58.0, 86.0, 148.0, 272.0, 433.0, 831.0, 1994.0, 6699.0, 34452.0, 300883.0, 2794559.0, 952082.0, 82890.0, 12979.0, 3232.0, 1144.0, 512.0, 281.0, 171.0, 129.0, 75.0, 47.0, 33.0, 18.0, 19.0, 20.0, 19.0, 2.0, 14.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.6796875, -9.37451171875, -9.0693359375, -8.76416015625, -8.458984375, -8.15380859375, -7.8486328125, -7.54345703125, -7.23828125, -6.93310546875, -6.6279296875, -6.32275390625, -6.017578125, -5.71240234375, -5.4072265625, -5.10205078125, -4.796875, -4.49169921875, -4.1865234375, -3.88134765625, -3.576171875, -3.27099609375, -2.9658203125, -2.66064453125, -2.35546875, -2.05029296875, -1.7451171875, -1.43994140625, -1.134765625, -0.82958984375, -0.5244140625, -0.21923828125, 0.0859375, 0.39111328125, 0.6962890625, 1.00146484375, 1.306640625, 1.61181640625, 1.9169921875, 2.22216796875, 2.52734375, 2.83251953125, 3.1376953125, 3.44287109375, 3.748046875, 4.05322265625, 4.3583984375, 4.66357421875, 4.96875, 5.27392578125, 5.5791015625, 5.88427734375, 6.189453125, 6.49462890625, 6.7998046875, 7.10498046875, 7.41015625, 7.71533203125, 8.0205078125, 8.32568359375, 8.630859375, 8.93603515625, 9.2412109375, 9.54638671875, 9.8515625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 16.0, 49.0, 76.0, 154.0, 205.0, 198.0, 148.0, 95.0, 43.0, 13.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.798091888427734, -50.645545959472656, -49.49299621582031, -48.34044647216797, -47.18790054321289, -46.03535461425781, -44.88280487060547, -43.730255126953125, -42.57770919799805, -41.42516326904297, -40.272613525390625, -39.12006378173828, -37.9675178527832, -36.814971923828125, -35.66242218017578, -34.50987243652344, -33.35732650756836, -32.20478057861328, -31.052230834960938, -29.899682998657227, -28.747135162353516, -27.594587326049805, -26.442039489746094, -25.289491653442383, -24.136943817138672, -22.98439598083496, -21.83184814453125, -20.67930030822754, -19.526752471923828, -18.374204635620117, -17.221656799316406, -16.069108963012695, -14.916557312011719, -13.764009475708008, -12.611461639404297, -11.458913803100586, -10.306365966796875, -9.153818130493164, -8.001270294189453, -6.848722457885742, -5.696174621582031, -4.54362678527832, -3.3910789489746094, -2.2385311126708984, -1.0859832763671875, 0.06656455993652344, 1.2191123962402344, 2.3716602325439453, 3.5242080688476562, 4.676755905151367, 5.829303741455078, 6.981851577758789, 8.1343994140625, 9.286947250366211, 10.439495086669922, 11.592042922973633, 12.744590759277344, 13.897138595581055, 15.049686431884766, 16.202234268188477, 17.354782104492188, 18.5073299407959, 19.65987777709961, 20.81242561340332, 21.96497344970703]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 3.0, 9.0, 5.0, 10.0, 13.0, 13.0, 10.0, 16.0, 17.0, 22.0, 19.0, 21.0, 43.0, 26.0, 27.0, 35.0, 38.0, 30.0, 32.0, 41.0, 43.0, 31.0, 55.0, 45.0, 30.0, 36.0, 28.0, 32.0, 24.0, 29.0, 22.0, 27.0, 27.0, 20.0, 17.0, 20.0, 14.0, 11.0, 12.0, 13.0, 7.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.560039520263672, -16.944480895996094, -16.328920364379883, -15.713360786437988, -15.097801208496094, -14.4822416305542, -13.866682052612305, -13.25112247467041, -12.635562896728516, -12.020003318786621, -11.404443740844727, -10.788884162902832, -10.173324584960938, -9.557765007019043, -8.942205429077148, -8.326645851135254, -7.711086273193359, -7.095526695251465, -6.47996711730957, -5.864407539367676, -5.248847961425781, -4.633288383483887, -4.017728805541992, -3.4021692276000977, -2.786609649658203, -2.1710500717163086, -1.555490493774414, -0.9399309158325195, -0.324371337890625, 0.29118824005126953, 0.9067478179931641, 1.5223073959350586, 2.1378650665283203, 2.753424644470215, 3.3689842224121094, 3.984543800354004, 4.600103378295898, 5.215662956237793, 5.8312225341796875, 6.446782112121582, 7.062341690063477, 7.677901268005371, 8.293460845947266, 8.90902042388916, 9.524580001831055, 10.14013957977295, 10.755699157714844, 11.371258735656738, 11.986818313598633, 12.602377891540527, 13.217937469482422, 13.833497047424316, 14.449056625366211, 15.064616203308105, 15.68017578125, 16.295734405517578, 16.91129493713379, 17.52685546875, 18.142414093017578, 18.757972717285156, 19.373533248901367, 19.989093780517578, 20.604652404785156, 21.220211029052734, 21.835771560668945]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 8.0, 11.0, 9.0, 7.0, 11.0, 12.0, 16.0, 12.0, 21.0, 22.0, 26.0, 24.0, 21.0, 33.0, 40.0, 35.0, 35.0, 52.0, 45.0, 52.0, 42.0, 44.0, 55.0, 32.0, 31.0, 28.0, 30.0, 33.0, 23.0, 32.0, 27.0, 25.0, 23.0, 14.0, 13.0, 7.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817779541015625, -3.67657470703125, -3.535369873046875, -3.3941650390625, -3.252960205078125, -3.11175537109375, -2.970550537109375, -2.829345703125, -2.688140869140625, -2.54693603515625, -2.405731201171875, -2.2645263671875, -2.123321533203125, -1.98211669921875, -1.840911865234375, -1.69970703125, -1.558502197265625, -1.41729736328125, -1.276092529296875, -1.1348876953125, -0.993682861328125, -0.85247802734375, -0.711273193359375, -0.570068359375, -0.428863525390625, -0.28765869140625, -0.146453857421875, -0.0052490234375, 0.135955810546875, 0.27716064453125, 0.418365478515625, 0.5595703125, 0.700775146484375, 0.84197998046875, 0.983184814453125, 1.1243896484375, 1.265594482421875, 1.40679931640625, 1.548004150390625, 1.689208984375, 1.830413818359375, 1.97161865234375, 2.112823486328125, 2.2540283203125, 2.395233154296875, 2.53643798828125, 2.677642822265625, 2.81884765625, 2.960052490234375, 3.10125732421875, 3.242462158203125, 3.3836669921875, 3.524871826171875, 3.66607666015625, 3.807281494140625, 3.948486328125, 4.089691162109375, 4.23089599609375, 4.372100830078125, 4.5133056640625, 4.654510498046875, 4.79571533203125, 4.936920166015625, 5.078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 13.0, 9.0, 34.0, 37.0, 53.0, 66.0, 104.0, 124.0, 197.0, 284.0, 407.0, 639.0, 980.0, 1485.0, 2391.0, 3576.0, 5662.0, 8590.0, 13762.0, 22120.0, 37738.0, 68805.0, 146387.0, 338385.0, 195465.0, 85335.0, 45172.0, 26877.0, 16042.0, 9828.0, 6109.0, 4041.0, 2577.0, 1662.0, 1168.0, 813.0, 542.0, 361.0, 262.0, 149.0, 113.0, 67.0, 36.0, 31.0, 20.0, 12.0, 6.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.723358154296875, -0.69720458984375, -0.671051025390625, -0.6448974609375, -0.618743896484375, -0.59259033203125, -0.566436767578125, -0.540283203125, -0.514129638671875, -0.48797607421875, -0.461822509765625, -0.4356689453125, -0.409515380859375, -0.38336181640625, -0.357208251953125, -0.3310546875, -0.304901123046875, -0.27874755859375, -0.252593994140625, -0.2264404296875, -0.200286865234375, -0.17413330078125, -0.147979736328125, -0.121826171875, -0.095672607421875, -0.06951904296875, -0.043365478515625, -0.0172119140625, 0.008941650390625, 0.03509521484375, 0.061248779296875, 0.08740234375, 0.113555908203125, 0.13970947265625, 0.165863037109375, 0.1920166015625, 0.218170166015625, 0.24432373046875, 0.270477294921875, 0.296630859375, 0.322784423828125, 0.34893798828125, 0.375091552734375, 0.4012451171875, 0.427398681640625, 0.45355224609375, 0.479705810546875, 0.505859375, 0.532012939453125, 0.55816650390625, 0.584320068359375, 0.6104736328125, 0.636627197265625, 0.66278076171875, 0.688934326171875, 0.715087890625, 0.741241455078125, 0.76739501953125, 0.793548583984375, 0.8197021484375, 0.845855712890625, 0.87200927734375, 0.898162841796875, 0.92431640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 5.0, 8.0, 14.0, 19.0, 15.0, 14.0, 24.0, 16.0, 28.0, 30.0, 23.0, 29.0, 36.0, 36.0, 39.0, 42.0, 47.0, 35.0, 1059.0, 42.0, 43.0, 42.0, 34.0, 43.0, 28.0, 29.0, 27.0, 32.0, 21.0, 27.0, 19.0, 17.0, 14.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.771484375, -2.683319091796875, -2.59515380859375, -2.506988525390625, -2.4188232421875, -2.330657958984375, -2.24249267578125, -2.154327392578125, -2.066162109375, -1.977996826171875, -1.88983154296875, -1.801666259765625, -1.7135009765625, -1.625335693359375, -1.53717041015625, -1.449005126953125, -1.36083984375, -1.272674560546875, -1.18450927734375, -1.096343994140625, -1.0081787109375, -0.920013427734375, -0.83184814453125, -0.743682861328125, -0.655517578125, -0.567352294921875, -0.47918701171875, -0.391021728515625, -0.3028564453125, -0.214691162109375, -0.12652587890625, -0.038360595703125, 0.0498046875, 0.137969970703125, 0.22613525390625, 0.314300537109375, 0.4024658203125, 0.490631103515625, 0.57879638671875, 0.666961669921875, 0.755126953125, 0.843292236328125, 0.93145751953125, 1.019622802734375, 1.1077880859375, 1.195953369140625, 1.28411865234375, 1.372283935546875, 1.46044921875, 1.548614501953125, 1.63677978515625, 1.724945068359375, 1.8131103515625, 1.901275634765625, 1.98944091796875, 2.077606201171875, 2.165771484375, 2.253936767578125, 2.34210205078125, 2.430267333984375, 2.5184326171875, 2.606597900390625, 2.69476318359375, 2.782928466796875, 2.87109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 7.0, 5.0, 18.0, 25.0, 31.0, 44.0, 71.0, 108.0, 145.0, 173.0, 276.0, 438.0, 538.0, 840.0, 1106.0, 1594.0, 2130.0, 3022.0, 4334.0, 5965.0, 8396.0, 11791.0, 17051.0, 24694.0, 36409.0, 56100.0, 93852.0, 178821.0, 1294533.0, 133273.0, 73839.0, 45952.0, 30884.0, 20708.0, 14551.0, 10255.0, 7274.0, 5114.0, 3603.0, 2629.0, 1942.0, 1343.0, 943.0, 628.0, 486.0, 354.0, 278.0, 167.0, 124.0, 96.0, 61.0, 42.0, 23.0, 18.0, 12.0, 8.0, 4.0, 3.0, 0.0, 6.0], "bins": [-0.61572265625, -0.596649169921875, -0.57757568359375, -0.558502197265625, -0.5394287109375, -0.520355224609375, -0.50128173828125, -0.482208251953125, -0.463134765625, -0.444061279296875, -0.42498779296875, -0.405914306640625, -0.3868408203125, -0.367767333984375, -0.34869384765625, -0.329620361328125, -0.310546875, -0.291473388671875, -0.27239990234375, -0.253326416015625, -0.2342529296875, -0.215179443359375, -0.19610595703125, -0.177032470703125, -0.157958984375, -0.138885498046875, -0.11981201171875, -0.100738525390625, -0.0816650390625, -0.062591552734375, -0.04351806640625, -0.024444580078125, -0.00537109375, 0.013702392578125, 0.03277587890625, 0.051849365234375, 0.0709228515625, 0.089996337890625, 0.10906982421875, 0.128143310546875, 0.147216796875, 0.166290283203125, 0.18536376953125, 0.204437255859375, 0.2235107421875, 0.242584228515625, 0.26165771484375, 0.280731201171875, 0.2998046875, 0.318878173828125, 0.33795166015625, 0.357025146484375, 0.3760986328125, 0.395172119140625, 0.41424560546875, 0.433319091796875, 0.452392578125, 0.471466064453125, 0.49053955078125, 0.509613037109375, 0.5286865234375, 0.547760009765625, 0.56683349609375, 0.585906982421875, 0.60498046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 4.0, 10.0, 8.0, 5.0, 8.0, 20.0, 17.0, 24.0, 20.0, 20.0, 32.0, 31.0, 44.0, 45.0, 54.0, 55.0, 62.0, 75.0, 58.0, 66.0, 49.0, 39.0, 44.0, 42.0, 36.0, 22.0, 20.0, 18.0, 12.0, 11.0, 9.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015115737915039062, -0.0001463666558265686, -0.00014157593250274658, -0.00013678520917892456, -0.00013199448585510254, -0.00012720376253128052, -0.0001224130392074585, -0.00011762231588363647, -0.00011283159255981445, -0.00010804086923599243, -0.00010325014591217041, -9.845942258834839e-05, -9.366869926452637e-05, -8.887797594070435e-05, -8.408725261688232e-05, -7.92965292930603e-05, -7.450580596923828e-05, -6.971508264541626e-05, -6.492435932159424e-05, -6.013363599777222e-05, -5.5342912673950195e-05, -5.0552189350128174e-05, -4.576146602630615e-05, -4.097074270248413e-05, -3.618001937866211e-05, -3.138929605484009e-05, -2.6598572731018066e-05, -2.1807849407196045e-05, -1.7017126083374023e-05, -1.2226402759552002e-05, -7.4356794357299805e-06, -2.644956111907959e-06, 2.1457672119140625e-06, 6.936490535736084e-06, 1.1727213859558105e-05, 1.6517937183380127e-05, 2.130866050720215e-05, 2.609938383102417e-05, 3.089010715484619e-05, 3.568083047866821e-05, 4.0471553802490234e-05, 4.5262277126312256e-05, 5.005300045013428e-05, 5.48437237739563e-05, 5.963444709777832e-05, 6.442517042160034e-05, 6.921589374542236e-05, 7.400661706924438e-05, 7.87973403930664e-05, 8.358806371688843e-05, 8.837878704071045e-05, 9.316951036453247e-05, 9.796023368835449e-05, 0.00010275095701217651, 0.00010754168033599854, 0.00011233240365982056, 0.00011712312698364258, 0.0001219138503074646, 0.00012670457363128662, 0.00013149529695510864, 0.00013628602027893066, 0.00014107674360275269, 0.0001458674669265747, 0.00015065819025039673, 0.00015544891357421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 7.0, 9.0, 21.0, 18.0, 33.0, 30.0, 53.0, 63.0, 104.0, 114.0, 202.0, 276.0, 526.0, 1109.0, 119431.0, 922748.0, 1920.0, 683.0, 350.0, 230.0, 137.0, 86.0, 86.0, 60.0, 42.0, 45.0, 31.0, 24.0, 10.0, 19.0, 12.0, 13.0, 6.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.003078460693359375, -0.002985656261444092, -0.0028928518295288086, -0.0028000473976135254, -0.002707242965698242, -0.002614438533782959, -0.0025216341018676758, -0.0024288296699523926, -0.0023360252380371094, -0.002243220806121826, -0.002150416374206543, -0.0020576119422912598, -0.0019648075103759766, -0.0018720030784606934, -0.0017791986465454102, -0.001686394214630127, -0.0015935897827148438, -0.0015007853507995605, -0.0014079809188842773, -0.0013151764869689941, -0.001222372055053711, -0.0011295676231384277, -0.0010367631912231445, -0.0009439587593078613, -0.0008511543273925781, -0.0007583498954772949, -0.0006655454635620117, -0.0005727410316467285, -0.0004799365997314453, -0.0003871321678161621, -0.0002943277359008789, -0.0002015233039855957, -0.0001087188720703125, -1.5914440155029297e-05, 7.68899917602539e-05, 0.0001696944236755371, 0.0002624988555908203, 0.0003553032875061035, 0.0004481077194213867, 0.0005409121513366699, 0.0006337165832519531, 0.0007265210151672363, 0.0008193254470825195, 0.0009121298789978027, 0.001004934310913086, 0.0010977387428283691, 0.0011905431747436523, 0.0012833476066589355, 0.0013761520385742188, 0.001468956470489502, 0.0015617609024047852, 0.0016545653343200684, 0.0017473697662353516, 0.0018401741981506348, 0.001932978630065918, 0.002025783061981201, 0.0021185874938964844, 0.0022113919258117676, 0.0023041963577270508, 0.002397000789642334, 0.002489805221557617, 0.0025826096534729004, 0.0026754140853881836, 0.002768218517303467, 0.00286102294921875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 43.0, 173.0, 395.0, 281.0, 103.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014769290282856673, -0.0001383087655995041, -0.00012892464292235672, -0.00011954050569329411, -0.00011015638301614672, -0.0001007722457870841, -9.13881158339791e-05, -8.20039858808741e-05, -7.26198559277691e-05, -6.323572597466409e-05, -5.385159602155909e-05, -4.446746243047528e-05, -3.508333247737028e-05, -2.5699202524265274e-05, -1.6315068933181465e-05, -6.930938980076462e-06, 2.4531909730285406e-06, 1.1837321835628245e-05, 2.122145269822795e-05, 3.0605584470322356e-05, 3.998971442342736e-05, 4.937384437653236e-05, 5.875797796761617e-05, 6.814210792072117e-05, 7.752623787382618e-05, 8.691036782693118e-05, 9.629449778003618e-05, 0.00010567862773314118, 0.0001150627649622038, 0.0001244468876393512, 0.0001338310248684138, 0.0001432151475455612, 0.00015259927022270858, 0.0001619834074517712, 0.0001713675301289186, 0.0001807516673579812, 0.0001901357900351286, 0.0001995199272641912, 0.00020890406449325383, 0.00021828818717040122, 0.0002276723098475486, 0.00023705644707661122, 0.00024644058430567384, 0.0002558247069828212, 0.0002652088296599686, 0.000274592952337116, 0.00028397710411809385, 0.00029336122679524124, 0.0003027453785762191, 0.00031212950125336647, 0.0003215136530343443, 0.0003308977757114917, 0.0003402818983886391, 0.0003496660210657865, 0.0003590501728467643, 0.0003684342955239117, 0.0003778184182010591, 0.0003872025408782065, 0.00039658669265918434, 0.0004059708153363317, 0.0004153549380134791, 0.0004247390606906265, 0.00043412321247160435, 0.00044350733514875174, 0.0004528914578258991]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 16.0, 10.0, 11.0, 14.0, 17.0, 11.0, 23.0, 22.0, 25.0, 22.0, 27.0, 26.0, 36.0, 51.0, 40.0, 42.0, 49.0, 41.0, 44.0, 38.0, 36.0, 35.0, 33.0, 34.0, 35.0, 42.0, 36.0, 24.0, 32.0, 27.0, 18.0, 16.0, 16.0, 6.0, 6.0, 11.0, 13.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.143352508544922e-05, -8.877180516719818e-05, -8.611008524894714e-05, -8.34483653306961e-05, -8.078664541244507e-05, -7.812492549419403e-05, -7.546320557594299e-05, -7.280148565769196e-05, -7.013976573944092e-05, -6.747804582118988e-05, -6.481632590293884e-05, -6.21546059846878e-05, -5.949288606643677e-05, -5.683116614818573e-05, -5.416944622993469e-05, -5.1507726311683655e-05, -4.884600639343262e-05, -4.618428647518158e-05, -4.352256655693054e-05, -4.0860846638679504e-05, -3.819912672042847e-05, -3.553740680217743e-05, -3.287568688392639e-05, -3.0213966965675354e-05, -2.7552247047424316e-05, -2.489052712917328e-05, -2.222880721092224e-05, -1.9567087292671204e-05, -1.6905367374420166e-05, -1.4243647456169128e-05, -1.158192753791809e-05, -8.920207619667053e-06, -6.258487701416016e-06, -3.596767783164978e-06, -9.350478649139404e-07, 1.7266720533370972e-06, 4.388391971588135e-06, 7.050111889839172e-06, 9.71183180809021e-06, 1.2373551726341248e-05, 1.5035271644592285e-05, 1.7696991562843323e-05, 2.035871148109436e-05, 2.3020431399345398e-05, 2.5682151317596436e-05, 2.8343871235847473e-05, 3.100559115409851e-05, 3.366731107234955e-05, 3.6329030990600586e-05, 3.8990750908851624e-05, 4.165247082710266e-05, 4.43141907453537e-05, 4.6975910663604736e-05, 4.9637630581855774e-05, 5.229935050010681e-05, 5.496107041835785e-05, 5.762279033660889e-05, 6.0284510254859924e-05, 6.294623017311096e-05, 6.5607950091362e-05, 6.826967000961304e-05, 7.093138992786407e-05, 7.359310984611511e-05, 7.625482976436615e-05, 7.891654968261719e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 8.0, 11.0, 9.0, 7.0, 11.0, 12.0, 16.0, 12.0, 21.0, 22.0, 26.0, 24.0, 21.0, 33.0, 40.0, 35.0, 35.0, 52.0, 45.0, 52.0, 42.0, 44.0, 55.0, 32.0, 31.0, 28.0, 30.0, 33.0, 23.0, 32.0, 27.0, 25.0, 23.0, 14.0, 13.0, 7.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817779541015625, -3.67657470703125, -3.535369873046875, -3.3941650390625, -3.252960205078125, -3.11175537109375, -2.970550537109375, -2.829345703125, -2.688140869140625, -2.54693603515625, -2.405731201171875, -2.2645263671875, -2.123321533203125, -1.98211669921875, -1.840911865234375, -1.69970703125, -1.558502197265625, -1.41729736328125, -1.276092529296875, -1.1348876953125, -0.993682861328125, -0.85247802734375, -0.711273193359375, -0.570068359375, -0.428863525390625, -0.28765869140625, -0.146453857421875, -0.0052490234375, 0.135955810546875, 0.27716064453125, 0.418365478515625, 0.5595703125, 0.700775146484375, 0.84197998046875, 0.983184814453125, 1.1243896484375, 1.265594482421875, 1.40679931640625, 1.548004150390625, 1.689208984375, 1.830413818359375, 1.97161865234375, 2.112823486328125, 2.2540283203125, 2.395233154296875, 2.53643798828125, 2.677642822265625, 2.81884765625, 2.960052490234375, 3.10125732421875, 3.242462158203125, 3.3836669921875, 3.524871826171875, 3.66607666015625, 3.807281494140625, 3.948486328125, 4.089691162109375, 4.23089599609375, 4.372100830078125, 4.5133056640625, 4.654510498046875, 4.79571533203125, 4.936920166015625, 5.078125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 10.0, 17.0, 26.0, 33.0, 33.0, 53.0, 70.0, 112.0, 152.0, 164.0, 228.0, 289.0, 473.0, 762.0, 1406.0, 3040.0, 8072.0, 27515.0, 97773.0, 301902.0, 389639.0, 152294.0, 43365.0, 12243.0, 4185.0, 1858.0, 904.0, 542.0, 357.0, 245.0, 226.0, 145.0, 112.0, 69.0, 57.0, 57.0, 30.0, 22.0, 11.0, 13.0, 12.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-6.8046875, -6.61126708984375, -6.4178466796875, -6.22442626953125, -6.031005859375, -5.83758544921875, -5.6441650390625, -5.45074462890625, -5.25732421875, -5.06390380859375, -4.8704833984375, -4.67706298828125, -4.483642578125, -4.29022216796875, -4.0968017578125, -3.90338134765625, -3.7099609375, -3.51654052734375, -3.3231201171875, -3.12969970703125, -2.936279296875, -2.74285888671875, -2.5494384765625, -2.35601806640625, -2.16259765625, -1.96917724609375, -1.7757568359375, -1.58233642578125, -1.388916015625, -1.19549560546875, -1.0020751953125, -0.80865478515625, -0.615234375, -0.42181396484375, -0.2283935546875, -0.03497314453125, 0.158447265625, 0.35186767578125, 0.5452880859375, 0.73870849609375, 0.93212890625, 1.12554931640625, 1.3189697265625, 1.51239013671875, 1.705810546875, 1.89923095703125, 2.0926513671875, 2.28607177734375, 2.4794921875, 2.67291259765625, 2.8663330078125, 3.05975341796875, 3.253173828125, 3.44659423828125, 3.6400146484375, 3.83343505859375, 4.02685546875, 4.22027587890625, 4.4136962890625, 4.60711669921875, 4.800537109375, 4.99395751953125, 5.1873779296875, 5.38079833984375, 5.57421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 11.0, 18.0, 29.0, 25.0, 21.0, 45.0, 40.0, 36.0, 74.0, 92.0, 157.0, 358.0, 1460.0, 173.0, 90.0, 70.0, 53.0, 46.0, 43.0, 35.0, 27.0, 19.0, 23.0, 12.0, 8.0, 12.0, 6.0, 17.0, 5.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.1263427734375, -12.674560546875, -12.2227783203125, -11.77099609375, -11.3192138671875, -10.867431640625, -10.4156494140625, -9.9638671875, -9.5120849609375, -9.060302734375, -8.6085205078125, -8.15673828125, -7.7049560546875, -7.253173828125, -6.8013916015625, -6.349609375, -5.8978271484375, -5.446044921875, -4.9942626953125, -4.54248046875, -4.0906982421875, -3.638916015625, -3.1871337890625, -2.7353515625, -2.2835693359375, -1.831787109375, -1.3800048828125, -0.92822265625, -0.4764404296875, -0.024658203125, 0.4271240234375, 0.87890625, 1.3306884765625, 1.782470703125, 2.2342529296875, 2.68603515625, 3.1378173828125, 3.589599609375, 4.0413818359375, 4.4931640625, 4.9449462890625, 5.396728515625, 5.8485107421875, 6.30029296875, 6.7520751953125, 7.203857421875, 7.6556396484375, 8.107421875, 8.5592041015625, 9.010986328125, 9.4627685546875, 9.91455078125, 10.3663330078125, 10.818115234375, 11.2698974609375, 11.7216796875, 12.1734619140625, 12.625244140625, 13.0770263671875, 13.52880859375, 13.9805908203125, 14.432373046875, 14.8841552734375, 15.3359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 12.0, 15.0, 25.0, 27.0, 41.0, 41.0, 93.0, 75.0, 104.0, 146.0, 204.0, 309.0, 434.0, 716.0, 1402.0, 11715.0, 2271148.0, 848604.0, 7320.0, 1223.0, 643.0, 361.0, 269.0, 210.0, 132.0, 123.0, 61.0, 35.0, 42.0, 29.0, 30.0, 24.0, 9.0, 8.0, 8.0, 8.0, 8.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-26.03125, -25.306640625, -24.58203125, -23.857421875, -23.1328125, -22.408203125, -21.68359375, -20.958984375, -20.234375, -19.509765625, -18.78515625, -18.060546875, -17.3359375, -16.611328125, -15.88671875, -15.162109375, -14.4375, -13.712890625, -12.98828125, -12.263671875, -11.5390625, -10.814453125, -10.08984375, -9.365234375, -8.640625, -7.916015625, -7.19140625, -6.466796875, -5.7421875, -5.017578125, -4.29296875, -3.568359375, -2.84375, -2.119140625, -1.39453125, -0.669921875, 0.0546875, 0.779296875, 1.50390625, 2.228515625, 2.953125, 3.677734375, 4.40234375, 5.126953125, 5.8515625, 6.576171875, 7.30078125, 8.025390625, 8.75, 9.474609375, 10.19921875, 10.923828125, 11.6484375, 12.373046875, 13.09765625, 13.822265625, 14.546875, 15.271484375, 15.99609375, 16.720703125, 17.4453125, 18.169921875, 18.89453125, 19.619140625, 20.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 41.0, 79.0, 191.0, 248.0, 255.0, 125.0, 54.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.88557243347168, -22.83837127685547, -21.79117202758789, -20.74397087097168, -19.69676971435547, -18.649568557739258, -17.602367401123047, -16.55516815185547, -15.507966995239258, -14.460765838623047, -13.413565635681152, -12.366365432739258, -11.319164276123047, -10.271963119506836, -9.224762916564941, -8.177562713623047, -7.130361557006836, -6.083160877227783, -5.0359601974487305, -3.9887595176696777, -2.941558837890625, -1.8943581581115723, -0.8471574783325195, 0.2000432014465332, 1.247243881225586, 2.2944445610046387, 3.3416452407836914, 4.388845920562744, 5.436046600341797, 6.48324728012085, 7.530447959899902, 8.577648162841797, 9.624847412109375, 10.672048568725586, 11.71924877166748, 12.766448974609375, 13.813650131225586, 14.860851287841797, 15.908051490783691, 16.955251693725586, 18.002452850341797, 19.049654006958008, 20.09685516357422, 21.144054412841797, 22.191255569458008, 23.23845672607422, 24.285655975341797, 25.332857131958008, 26.38005828857422, 27.42725944519043, 28.47446060180664, 29.52165985107422, 30.56886100769043, 31.61606216430664, 32.66326141357422, 33.71046447753906, 34.75766372680664, 35.80486297607422, 36.85206604003906, 37.89926528930664, 38.94646453857422, 39.99366760253906, 41.04086685180664, 42.088069915771484, 43.13526916503906]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 3.0, 7.0, 7.0, 10.0, 10.0, 8.0, 13.0, 17.0, 20.0, 23.0, 23.0, 25.0, 27.0, 25.0, 30.0, 31.0, 40.0, 45.0, 38.0, 39.0, 31.0, 30.0, 35.0, 33.0, 38.0, 27.0, 41.0, 34.0, 31.0, 21.0, 23.0, 20.0, 20.0, 23.0, 16.0, 19.0, 22.0, 8.0, 15.0, 10.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.802602767944336, -21.121204376220703, -20.43980598449707, -19.758407592773438, -19.077009201049805, -18.395610809326172, -17.714214324951172, -17.03281593322754, -16.351417541503906, -15.670019149780273, -14.98862075805664, -14.307222366333008, -13.625824928283691, -12.944426536560059, -12.263028144836426, -11.58163070678711, -10.90023136138916, -10.218832969665527, -9.537434577941895, -8.856037139892578, -8.174638748168945, -7.4932403564453125, -6.81184196472168, -6.130444049835205, -5.449045658111572, -4.7676472663879395, -4.086249351501465, -3.404850959777832, -2.7234528064727783, -2.0420546531677246, -1.3606562614440918, -0.6792583465576172, 0.002140045166015625, 0.6835382580757141, 1.3649364709854126, 2.046334743499756, 2.7277328968048096, 3.4091310501098633, 4.090529441833496, 4.771927356719971, 5.4533257484436035, 6.134724140167236, 6.816122055053711, 7.497520446777344, 8.178918838500977, 8.86031723022461, 9.541715621948242, 10.223113059997559, 10.904511451721191, 11.585909843444824, 12.267308235168457, 12.948705673217773, 13.630104064941406, 14.311502456665039, 14.992900848388672, 15.674299240112305, 16.355697631835938, 17.03709602355957, 17.718494415283203, 18.399892807006836, 19.08129119873047, 19.76268768310547, 20.444087982177734, 21.125484466552734, 21.806882858276367]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 4.0, 7.0, 7.0, 1.0, 11.0, 10.0, 10.0, 20.0, 13.0, 14.0, 19.0, 12.0, 19.0, 22.0, 29.0, 25.0, 31.0, 40.0, 39.0, 54.0, 30.0, 37.0, 35.0, 57.0, 38.0, 37.0, 36.0, 28.0, 26.0, 34.0, 33.0, 31.0, 14.0, 33.0, 15.0, 17.0, 18.0, 18.0, 11.0, 14.0, 10.0, 7.0, 6.0, 7.0, 3.0, 5.0, 1.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.0078125, -3.874267578125, -3.74072265625, -3.607177734375, -3.4736328125, -3.340087890625, -3.20654296875, -3.072998046875, -2.939453125, -2.805908203125, -2.67236328125, -2.538818359375, -2.4052734375, -2.271728515625, -2.13818359375, -2.004638671875, -1.87109375, -1.737548828125, -1.60400390625, -1.470458984375, -1.3369140625, -1.203369140625, -1.06982421875, -0.936279296875, -0.802734375, -0.669189453125, -0.53564453125, -0.402099609375, -0.2685546875, -0.135009765625, -0.00146484375, 0.132080078125, 0.265625, 0.399169921875, 0.53271484375, 0.666259765625, 0.7998046875, 0.933349609375, 1.06689453125, 1.200439453125, 1.333984375, 1.467529296875, 1.60107421875, 1.734619140625, 1.8681640625, 2.001708984375, 2.13525390625, 2.268798828125, 2.40234375, 2.535888671875, 2.66943359375, 2.802978515625, 2.9365234375, 3.070068359375, 3.20361328125, 3.337158203125, 3.470703125, 3.604248046875, 3.73779296875, 3.871337890625, 4.0048828125, 4.138427734375, 4.27197265625, 4.405517578125, 4.5390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 7.0, 7.0, 12.0, 3.0, 8.0, 12.0, 21.0, 26.0, 30.0, 40.0, 43.0, 65.0, 93.0, 115.0, 135.0, 185.0, 280.0, 382.0, 532.0, 4753.0, 4183987.0, 1605.0, 469.0, 369.0, 257.0, 216.0, 149.0, 106.0, 83.0, 70.0, 38.0, 29.0, 26.0, 28.0, 24.0, 15.0, 11.0, 10.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-80.0625, -77.80078125, -75.5390625, -73.27734375, -71.015625, -68.75390625, -66.4921875, -64.23046875, -61.96875, -59.70703125, -57.4453125, -55.18359375, -52.921875, -50.66015625, -48.3984375, -46.13671875, -43.875, -41.61328125, -39.3515625, -37.08984375, -34.828125, -32.56640625, -30.3046875, -28.04296875, -25.78125, -23.51953125, -21.2578125, -18.99609375, -16.734375, -14.47265625, -12.2109375, -9.94921875, -7.6875, -5.42578125, -3.1640625, -0.90234375, 1.359375, 3.62109375, 5.8828125, 8.14453125, 10.40625, 12.66796875, 14.9296875, 17.19140625, 19.453125, 21.71484375, 23.9765625, 26.23828125, 28.5, 30.76171875, 33.0234375, 35.28515625, 37.546875, 39.80859375, 42.0703125, 44.33203125, 46.59375, 48.85546875, 51.1171875, 53.37890625, 55.640625, 57.90234375, 60.1640625, 62.42578125, 64.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 11.0, 11.0, 9.0, 22.0, 36.0, 36.0, 52.0, 57.0, 86.0, 118.0, 180.0, 231.0, 352.0, 456.0, 513.0, 487.0, 402.0, 273.0, 214.0, 130.0, 87.0, 69.0, 48.0, 47.0, 26.0, 30.0, 8.0, 13.0, 13.0, 6.0, 4.0, 10.0, 2.0, 4.0, 0.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.23046875, -7.021484375, -6.8125, -6.603515625, -6.39453125, -6.185546875, -5.9765625, -5.767578125, -5.55859375, -5.349609375, -5.140625, -4.931640625, -4.72265625, -4.513671875, -4.3046875, -4.095703125, -3.88671875, -3.677734375, -3.46875, -3.259765625, -3.05078125, -2.841796875, -2.6328125, -2.423828125, -2.21484375, -2.005859375, -1.796875, -1.587890625, -1.37890625, -1.169921875, -0.9609375, -0.751953125, -0.54296875, -0.333984375, -0.125, 0.083984375, 0.29296875, 0.501953125, 0.7109375, 0.919921875, 1.12890625, 1.337890625, 1.546875, 1.755859375, 1.96484375, 2.173828125, 2.3828125, 2.591796875, 2.80078125, 3.009765625, 3.21875, 3.427734375, 3.63671875, 3.845703125, 4.0546875, 4.263671875, 4.47265625, 4.681640625, 4.890625, 5.099609375, 5.30859375, 5.517578125, 5.7265625, 5.935546875, 6.14453125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 11.0, 7.0, 19.0, 26.0, 31.0, 35.0, 47.0, 63.0, 82.0, 159.0, 603.0, 57261.0, 4132131.0, 3075.0, 334.0, 117.0, 75.0, 44.0, 36.0, 42.0, 24.0, 25.0, 16.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-68.4375, -66.7392578125, -65.041015625, -63.3427734375, -61.64453125, -59.9462890625, -58.248046875, -56.5498046875, -54.8515625, -53.1533203125, -51.455078125, -49.7568359375, -48.05859375, -46.3603515625, -44.662109375, -42.9638671875, -41.265625, -39.5673828125, -37.869140625, -36.1708984375, -34.47265625, -32.7744140625, -31.076171875, -29.3779296875, -27.6796875, -25.9814453125, -24.283203125, -22.5849609375, -20.88671875, -19.1884765625, -17.490234375, -15.7919921875, -14.09375, -12.3955078125, -10.697265625, -8.9990234375, -7.30078125, -5.6025390625, -3.904296875, -2.2060546875, -0.5078125, 1.1904296875, 2.888671875, 4.5869140625, 6.28515625, 7.9833984375, 9.681640625, 11.3798828125, 13.078125, 14.7763671875, 16.474609375, 18.1728515625, 19.87109375, 21.5693359375, 23.267578125, 24.9658203125, 26.6640625, 28.3623046875, 30.060546875, 31.7587890625, 33.45703125, 35.1552734375, 36.853515625, 38.5517578125, 40.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 33.0, 90.0, 174.0, 269.0, 257.0, 123.0, 41.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.711305618286133, -30.176977157592773, -28.642648696899414, -27.108318328857422, -25.573989868164062, -24.039661407470703, -22.505332946777344, -20.971004486083984, -19.436676025390625, -17.902347564697266, -16.368019104003906, -14.83368968963623, -13.299361228942871, -11.765032768249512, -10.230703353881836, -8.696374893188477, -7.162046432495117, -5.627717971801758, -4.09338903427124, -2.5590600967407227, -1.0247316360473633, 0.5095968246459961, 2.043926239013672, 3.5782546997070312, 5.112583160400391, 6.64691162109375, 8.18124008178711, 9.715569496154785, 11.249897956848145, 12.784226417541504, 14.31855583190918, 15.852884292602539, 17.38721466064453, 18.92154312133789, 20.45587158203125, 21.99020004272461, 23.52452850341797, 25.058856964111328, 26.59318733215332, 28.12751579284668, 29.66184425354004, 31.1961727142334, 32.73050308227539, 34.26483154296875, 35.79916000366211, 37.33348846435547, 38.86781692504883, 40.40214538574219, 41.93647384643555, 43.470802307128906, 45.005130767822266, 46.539459228515625, 48.073787689208984, 49.608116149902344, 51.14244842529297, 52.67677307128906, 54.21110534667969, 55.74543380737305, 57.279762268066406, 58.814090728759766, 60.348419189453125, 61.882747650146484, 63.417076110839844, 64.95140838623047, 66.48573303222656]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 2.0, 1.0, 7.0, 5.0, 11.0, 14.0, 14.0, 12.0, 13.0, 17.0, 32.0, 18.0, 23.0, 21.0, 37.0, 40.0, 40.0, 43.0, 41.0, 31.0, 44.0, 38.0, 44.0, 38.0, 36.0, 39.0, 33.0, 38.0, 35.0, 30.0, 26.0, 29.0, 24.0, 20.0, 17.0, 19.0, 14.0, 14.0, 6.0, 5.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.36933135986328, -19.69687271118164, -19.024415969848633, -18.351957321166992, -17.679500579833984, -17.007041931152344, -16.334583282470703, -15.662125587463379, -14.989667892456055, -14.31721019744873, -13.644752502441406, -12.972293853759766, -12.299836158752441, -11.627378463745117, -10.954919815063477, -10.282462120056152, -9.610004425048828, -8.937546730041504, -8.26508903503418, -7.592630386352539, -6.920172691345215, -6.247714996337891, -5.575256824493408, -4.902798652648926, -4.230340957641602, -3.5578830242156982, -2.885425090789795, -2.2129671573638916, -1.5405092239379883, -0.868051290512085, -0.19559335708618164, 0.4768648147583008, 1.1493244171142578, 1.8217823505401611, 2.4942402839660645, 3.1666982173919678, 3.839156150817871, 4.511613845825195, 5.184072017669678, 5.85653018951416, 6.528987884521484, 7.201445579528809, 7.873903751373291, 8.546361923217773, 9.218819618225098, 9.891277313232422, 10.563735961914062, 11.236193656921387, 11.908651351928711, 12.581109046936035, 13.25356674194336, 13.926025390625, 14.598483085632324, 15.270940780639648, 15.943399429321289, 16.615856170654297, 17.288314819335938, 17.960773468017578, 18.633230209350586, 19.305688858032227, 19.978145599365234, 20.650604248046875, 21.323062896728516, 21.995521545410156, 22.667978286743164]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 29.0, 28.0, 41.0, 49.0, 37.0, 41.0, 45.0, 49.0, 48.0, 56.0, 45.0, 43.0, 37.0, 27.0, 28.0, 40.0, 28.0, 23.0, 24.0, 35.0, 23.0, 18.0, 8.0, 11.0, 20.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5816650390625, -4.432861328125, -4.2840576171875, -4.13525390625, -3.9864501953125, -3.837646484375, -3.6888427734375, -3.5400390625, -3.3912353515625, -3.242431640625, -3.0936279296875, -2.94482421875, -2.7960205078125, -2.647216796875, -2.4984130859375, -2.349609375, -2.2008056640625, -2.052001953125, -1.9031982421875, -1.75439453125, -1.6055908203125, -1.456787109375, -1.3079833984375, -1.1591796875, -1.0103759765625, -0.861572265625, -0.7127685546875, -0.56396484375, -0.4151611328125, -0.266357421875, -0.1175537109375, 0.03125, 0.1800537109375, 0.328857421875, 0.4776611328125, 0.62646484375, 0.7752685546875, 0.924072265625, 1.0728759765625, 1.2216796875, 1.3704833984375, 1.519287109375, 1.6680908203125, 1.81689453125, 1.9656982421875, 2.114501953125, 2.2633056640625, 2.412109375, 2.5609130859375, 2.709716796875, 2.8585205078125, 3.00732421875, 3.1561279296875, 3.304931640625, 3.4537353515625, 3.6025390625, 3.7513427734375, 3.900146484375, 4.0489501953125, 4.19775390625, 4.3465576171875, 4.495361328125, 4.6441650390625, 4.79296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 13.0, 16.0, 20.0, 20.0, 42.0, 61.0, 107.0, 176.0, 287.0, 441.0, 682.0, 1094.0, 1808.0, 2872.0, 4967.0, 8218.0, 14205.0, 24703.0, 45471.0, 88549.0, 211727.0, 355444.0, 140102.0, 65701.0, 34644.0, 19234.0, 11110.0, 6573.0, 3967.0, 2435.0, 1484.0, 880.0, 510.0, 345.0, 229.0, 162.0, 92.0, 52.0, 37.0, 15.0, 20.0, 18.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8867340087890625, -0.857452392578125, -0.8281707763671875, -0.79888916015625, -0.7696075439453125, -0.740325927734375, -0.7110443115234375, -0.6817626953125, -0.6524810791015625, -0.623199462890625, -0.5939178466796875, -0.56463623046875, -0.5353546142578125, -0.506072998046875, -0.4767913818359375, -0.447509765625, -0.4182281494140625, -0.388946533203125, -0.3596649169921875, -0.33038330078125, -0.3011016845703125, -0.271820068359375, -0.2425384521484375, -0.2132568359375, -0.1839752197265625, -0.154693603515625, -0.1254119873046875, -0.09613037109375, -0.0668487548828125, -0.037567138671875, -0.0082855224609375, 0.02099609375, 0.0502777099609375, 0.079559326171875, 0.1088409423828125, 0.13812255859375, 0.1674041748046875, 0.196685791015625, 0.2259674072265625, 0.2552490234375, 0.2845306396484375, 0.313812255859375, 0.3430938720703125, 0.37237548828125, 0.4016571044921875, 0.430938720703125, 0.4602203369140625, 0.489501953125, 0.5187835693359375, 0.548065185546875, 0.5773468017578125, 0.60662841796875, 0.6359100341796875, 0.665191650390625, 0.6944732666015625, 0.7237548828125, 0.7530364990234375, 0.782318115234375, 0.8115997314453125, 0.84088134765625, 0.8701629638671875, 0.899444580078125, 0.9287261962890625, 0.9580078125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 12.0, 11.0, 13.0, 21.0, 11.0, 15.0, 22.0, 24.0, 17.0, 30.0, 36.0, 29.0, 31.0, 40.0, 19.0, 27.0, 36.0, 35.0, 1063.0, 27.0, 34.0, 47.0, 40.0, 24.0, 23.0, 29.0, 20.0, 32.0, 26.0, 30.0, 26.0, 18.0, 17.0, 12.0, 24.0, 13.0, 7.0, 8.0, 7.0, 9.0, 4.0, 5.0, 5.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.453125, -2.380157470703125, -2.30718994140625, -2.234222412109375, -2.1612548828125, -2.088287353515625, -2.01531982421875, -1.942352294921875, -1.869384765625, -1.796417236328125, -1.72344970703125, -1.650482177734375, -1.5775146484375, -1.504547119140625, -1.43157958984375, -1.358612060546875, -1.28564453125, -1.212677001953125, -1.13970947265625, -1.066741943359375, -0.9937744140625, -0.920806884765625, -0.84783935546875, -0.774871826171875, -0.701904296875, -0.628936767578125, -0.55596923828125, -0.483001708984375, -0.4100341796875, -0.337066650390625, -0.26409912109375, -0.191131591796875, -0.1181640625, -0.045196533203125, 0.02777099609375, 0.100738525390625, 0.1737060546875, 0.246673583984375, 0.31964111328125, 0.392608642578125, 0.465576171875, 0.538543701171875, 0.61151123046875, 0.684478759765625, 0.7574462890625, 0.830413818359375, 0.90338134765625, 0.976348876953125, 1.04931640625, 1.122283935546875, 1.19525146484375, 1.268218994140625, 1.3411865234375, 1.414154052734375, 1.48712158203125, 1.560089111328125, 1.633056640625, 1.706024169921875, 1.77899169921875, 1.851959228515625, 1.9249267578125, 1.997894287109375, 2.07086181640625, 2.143829345703125, 2.216796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 8.0, 8.0, 14.0, 12.0, 25.0, 47.0, 70.0, 103.0, 147.0, 209.0, 294.0, 399.0, 607.0, 792.0, 1069.0, 1427.0, 2007.0, 2809.0, 3647.0, 5212.0, 7164.0, 9896.0, 13937.0, 19318.0, 28089.0, 40646.0, 60953.0, 98211.0, 185831.0, 1271084.0, 118985.0, 70079.0, 45654.0, 31314.0, 21984.0, 15521.0, 10995.0, 7936.0, 5678.0, 4133.0, 2934.0, 2211.0, 1576.0, 1152.0, 789.0, 616.0, 443.0, 286.0, 237.0, 180.0, 110.0, 88.0, 70.0, 48.0, 38.0, 17.0, 15.0, 10.0, 6.0, 3.0, 2.0], "bins": [-0.541015625, -0.5241928100585938, -0.5073699951171875, -0.49054718017578125, -0.473724365234375, -0.45690155029296875, -0.4400787353515625, -0.42325592041015625, -0.40643310546875, -0.38961029052734375, -0.3727874755859375, -0.35596466064453125, -0.339141845703125, -0.32231903076171875, -0.3054962158203125, -0.28867340087890625, -0.2718505859375, -0.25502777099609375, -0.2382049560546875, -0.22138214111328125, -0.204559326171875, -0.18773651123046875, -0.1709136962890625, -0.15409088134765625, -0.13726806640625, -0.12044525146484375, -0.1036224365234375, -0.08679962158203125, -0.069976806640625, -0.05315399169921875, -0.0363311767578125, -0.01950836181640625, -0.002685546875, 0.01413726806640625, 0.0309600830078125, 0.04778289794921875, 0.064605712890625, 0.08142852783203125, 0.0982513427734375, 0.11507415771484375, 0.13189697265625, 0.14871978759765625, 0.1655426025390625, 0.18236541748046875, 0.199188232421875, 0.21601104736328125, 0.2328338623046875, 0.24965667724609375, 0.2664794921875, 0.28330230712890625, 0.3001251220703125, 0.31694793701171875, 0.333770751953125, 0.35059356689453125, 0.3674163818359375, 0.38423919677734375, 0.40106201171875, 0.41788482666015625, 0.4347076416015625, 0.45153045654296875, 0.468353271484375, 0.48517608642578125, 0.5019989013671875, 0.5188217163085938, 0.53564453125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 11.0, 8.0, 14.0, 14.0, 11.0, 18.0, 27.0, 43.0, 44.0, 52.0, 42.0, 69.0, 70.0, 54.0, 68.0, 60.0, 66.0, 54.0, 49.0, 42.0, 49.0, 33.0, 19.0, 15.0, 18.0, 8.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013589859008789062, -0.00013083219528198242, -0.00012576580047607422, -0.00012069940567016602, -0.00011563301086425781, -0.00011056661605834961, -0.0001055002212524414, -0.0001004338264465332, -9.5367431640625e-05, -9.03010368347168e-05, -8.52346420288086e-05, -8.016824722290039e-05, -7.510185241699219e-05, -7.003545761108398e-05, -6.496906280517578e-05, -5.990266799926758e-05, -5.4836273193359375e-05, -4.976987838745117e-05, -4.470348358154297e-05, -3.9637088775634766e-05, -3.457069396972656e-05, -2.950429916381836e-05, -2.4437904357910156e-05, -1.9371509552001953e-05, -1.430511474609375e-05, -9.238719940185547e-06, -4.172325134277344e-06, 8.940696716308594e-07, 5.9604644775390625e-06, 1.1026859283447266e-05, 1.609325408935547e-05, 2.1159648895263672e-05, 2.6226043701171875e-05, 3.129243850708008e-05, 3.635883331298828e-05, 4.1425228118896484e-05, 4.649162292480469e-05, 5.155801773071289e-05, 5.6624412536621094e-05, 6.16908073425293e-05, 6.67572021484375e-05, 7.18235969543457e-05, 7.68899917602539e-05, 8.195638656616211e-05, 8.702278137207031e-05, 9.208917617797852e-05, 9.715557098388672e-05, 0.00010222196578979492, 0.00010728836059570312, 0.00011235475540161133, 0.00011742115020751953, 0.00012248754501342773, 0.00012755393981933594, 0.00013262033462524414, 0.00013768672943115234, 0.00014275312423706055, 0.00014781951904296875, 0.00015288591384887695, 0.00015795230865478516, 0.00016301870346069336, 0.00016808509826660156, 0.00017315149307250977, 0.00017821788787841797, 0.00018328428268432617, 0.00018835067749023438]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 11.0, 7.0, 10.0, 8.0, 17.0, 15.0, 27.0, 29.0, 36.0, 67.0, 97.0, 128.0, 195.0, 258.0, 432.0, 774.0, 1519.0, 472519.0, 568710.0, 1632.0, 766.0, 413.0, 274.0, 195.0, 104.0, 75.0, 54.0, 37.0, 30.0, 30.0, 21.0, 11.0, 10.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030765533447265625, -0.0029861032962799072, -0.002895653247833252, -0.0028052031993865967, -0.0027147531509399414, -0.002624303102493286, -0.002533853054046631, -0.0024434030055999756, -0.0023529529571533203, -0.002262502908706665, -0.0021720528602600098, -0.0020816028118133545, -0.0019911527633666992, -0.001900702714920044, -0.0018102526664733887, -0.0017198026180267334, -0.0016293525695800781, -0.0015389025211334229, -0.0014484524726867676, -0.0013580024242401123, -0.001267552375793457, -0.0011771023273468018, -0.0010866522789001465, -0.0009962022304534912, -0.0009057521820068359, -0.0008153021335601807, -0.0007248520851135254, -0.0006344020366668701, -0.0005439519882202148, -0.00045350193977355957, -0.0003630518913269043, -0.000272601842880249, -0.00018215179443359375, -9.170174598693848e-05, -1.2516975402832031e-06, 8.919835090637207e-05, 0.00017964839935302734, 0.0002700984477996826, 0.0003605484962463379, 0.00045099854469299316, 0.0005414485931396484, 0.0006318986415863037, 0.000722348690032959, 0.0008127987384796143, 0.0009032487869262695, 0.0009936988353729248, 0.00108414888381958, 0.0011745989322662354, 0.0012650489807128906, 0.001355499029159546, 0.0014459490776062012, 0.0015363991260528564, 0.0016268491744995117, 0.001717299222946167, 0.0018077492713928223, 0.0018981993198394775, 0.001988649368286133, 0.002079099416732788, 0.0021695494651794434, 0.0022599995136260986, 0.002350449562072754, 0.002440899610519409, 0.0025313496589660645, 0.0026217997074127197, 0.002712249755859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 25.0, 100.0, 281.0, 348.0, 175.0, 59.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003797558892983943, -0.00037220411468297243, -0.00036465234006755054, -0.00035710056545212865, -0.00034954879083670676, -0.00034199701622128487, -0.000334445241605863, -0.0003268934669904411, -0.0003193416923750192, -0.0003117899177595973, -0.0003042381431441754, -0.0002966863685287535, -0.00028913459391333163, -0.00028158281929790974, -0.00027403104468248785, -0.00026647927006706595, -0.0002589275245554745, -0.00025137574994005263, -0.00024382397532463074, -0.00023627220070920885, -0.00022872042609378695, -0.00022116865147836506, -0.00021361687686294317, -0.00020606510224752128, -0.0001985133276320994, -0.0001909615530166775, -0.0001834097784012556, -0.00017585800378583372, -0.00016830622917041183, -0.00016075445455498993, -0.00015320267993956804, -0.00014565090532414615, -0.0001380991452606395, -0.0001305473706452176, -0.0001229955960297957, -0.00011544382141437382, -0.00010789204679895192, -0.00010034027218353003, -9.278850484406576e-05, -8.523673022864386e-05, -7.768495561322197e-05, -7.013318099780008e-05, -6.258140638237819e-05, -5.502963540493511e-05, -4.7477860789513215e-05, -3.9926086174091324e-05, -3.237431519664824e-05, -2.482254058122635e-05, -1.7270765965804458e-05, -9.718992259877268e-06, -2.1672185539500788e-06, 5.384554242482409e-06, 1.29363288579043e-05, 2.048810347332619e-05, 2.8039874450769275e-05, 3.559164906619117e-05, 4.314342368161306e-05, 5.069519829703495e-05, 5.824697291245684e-05, 6.579874025192112e-05, 7.335051486734301e-05, 8.09022894827649e-05, 8.845406409818679e-05, 9.600583871360868e-05, 0.00010355761332903057]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 5.0, 6.0, 8.0, 2.0, 6.0, 11.0, 12.0, 12.0, 22.0, 21.0, 24.0, 28.0, 28.0, 32.0, 27.0, 46.0, 37.0, 42.0, 48.0, 41.0, 49.0, 40.0, 38.0, 51.0, 39.0, 41.0, 46.0, 39.0, 34.0, 38.0, 22.0, 26.0, 19.0, 11.0, 10.0, 13.0, 4.0, 7.0, 8.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.176399230957031e-05, -6.916001439094543e-05, -6.655603647232056e-05, -6.395205855369568e-05, -6.13480806350708e-05, -5.874410271644592e-05, -5.6140124797821045e-05, -5.353614687919617e-05, -5.093216896057129e-05, -4.832819104194641e-05, -4.572421312332153e-05, -4.3120235204696655e-05, -4.051625728607178e-05, -3.79122793674469e-05, -3.530830144882202e-05, -3.2704323530197144e-05, -3.0100345611572266e-05, -2.7496367692947388e-05, -2.489238977432251e-05, -2.2288411855697632e-05, -1.9684433937072754e-05, -1.7080456018447876e-05, -1.4476478099822998e-05, -1.187250018119812e-05, -9.268522262573242e-06, -6.664544343948364e-06, -4.060566425323486e-06, -1.4565885066986084e-06, 1.1473894119262695e-06, 3.7513673305511475e-06, 6.355345249176025e-06, 8.959323167800903e-06, 1.1563301086425781e-05, 1.416727900505066e-05, 1.6771256923675537e-05, 1.9375234842300415e-05, 2.1979212760925293e-05, 2.458319067955017e-05, 2.718716859817505e-05, 2.9791146516799927e-05, 3.2395124435424805e-05, 3.499910235404968e-05, 3.760308027267456e-05, 4.020705819129944e-05, 4.2811036109924316e-05, 4.5415014028549194e-05, 4.801899194717407e-05, 5.062296986579895e-05, 5.322694778442383e-05, 5.5830925703048706e-05, 5.8434903621673584e-05, 6.103888154029846e-05, 6.364285945892334e-05, 6.624683737754822e-05, 6.88508152961731e-05, 7.145479321479797e-05, 7.405877113342285e-05, 7.666274905204773e-05, 7.926672697067261e-05, 8.187070488929749e-05, 8.447468280792236e-05, 8.707866072654724e-05, 8.968263864517212e-05, 9.2286616563797e-05, 9.489059448242188e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 29.0, 28.0, 41.0, 49.0, 37.0, 41.0, 45.0, 49.0, 48.0, 56.0, 45.0, 43.0, 37.0, 27.0, 28.0, 40.0, 28.0, 23.0, 24.0, 35.0, 23.0, 18.0, 8.0, 11.0, 20.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5816650390625, -4.432861328125, -4.2840576171875, -4.13525390625, -3.9864501953125, -3.837646484375, -3.6888427734375, -3.5400390625, -3.3912353515625, -3.242431640625, -3.0936279296875, -2.94482421875, -2.7960205078125, -2.647216796875, -2.4984130859375, -2.349609375, -2.2008056640625, -2.052001953125, -1.9031982421875, -1.75439453125, -1.6055908203125, -1.456787109375, -1.3079833984375, -1.1591796875, -1.0103759765625, -0.861572265625, -0.7127685546875, -0.56396484375, -0.4151611328125, -0.266357421875, -0.1175537109375, 0.03125, 0.1800537109375, 0.328857421875, 0.4776611328125, 0.62646484375, 0.7752685546875, 0.924072265625, 1.0728759765625, 1.2216796875, 1.3704833984375, 1.519287109375, 1.6680908203125, 1.81689453125, 1.9656982421875, 2.114501953125, 2.2633056640625, 2.412109375, 2.5609130859375, 2.709716796875, 2.8585205078125, 3.00732421875, 3.1561279296875, 3.304931640625, 3.4537353515625, 3.6025390625, 3.7513427734375, 3.900146484375, 4.0489501953125, 4.19775390625, 4.3465576171875, 4.495361328125, 4.6441650390625, 4.79296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 12.0, 16.0, 19.0, 19.0, 18.0, 26.0, 43.0, 62.0, 68.0, 90.0, 122.0, 179.0, 239.0, 318.0, 472.0, 610.0, 846.0, 1183.0, 1632.0, 3414.0, 18014.0, 152932.0, 598307.0, 230494.0, 28526.0, 4403.0, 1937.0, 1221.0, 888.0, 654.0, 446.0, 360.0, 257.0, 190.0, 135.0, 95.0, 99.0, 58.0, 47.0, 23.0, 25.0, 15.0, 12.0, 12.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.4609375, -9.1707763671875, -8.880615234375, -8.5904541015625, -8.30029296875, -8.0101318359375, -7.719970703125, -7.4298095703125, -7.1396484375, -6.8494873046875, -6.559326171875, -6.2691650390625, -5.97900390625, -5.6888427734375, -5.398681640625, -5.1085205078125, -4.818359375, -4.5281982421875, -4.238037109375, -3.9478759765625, -3.65771484375, -3.3675537109375, -3.077392578125, -2.7872314453125, -2.4970703125, -2.2069091796875, -1.916748046875, -1.6265869140625, -1.33642578125, -1.0462646484375, -0.756103515625, -0.4659423828125, -0.17578125, 0.1143798828125, 0.404541015625, 0.6947021484375, 0.98486328125, 1.2750244140625, 1.565185546875, 1.8553466796875, 2.1455078125, 2.4356689453125, 2.725830078125, 3.0159912109375, 3.30615234375, 3.5963134765625, 3.886474609375, 4.1766357421875, 4.466796875, 4.7569580078125, 5.047119140625, 5.3372802734375, 5.62744140625, 5.9176025390625, 6.207763671875, 6.4979248046875, 6.7880859375, 7.0782470703125, 7.368408203125, 7.6585693359375, 7.94873046875, 8.2388916015625, 8.529052734375, 8.8192138671875, 9.109375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 10.0, 11.0, 12.0, 25.0, 16.0, 17.0, 19.0, 25.0, 26.0, 35.0, 46.0, 48.0, 43.0, 45.0, 73.0, 188.0, 1437.0, 354.0, 169.0, 81.0, 54.0, 60.0, 32.0, 29.0, 28.0, 17.0, 11.0, 22.0, 17.0, 16.0, 9.0, 14.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-11.2890625, -10.9656982421875, -10.642333984375, -10.3189697265625, -9.99560546875, -9.6722412109375, -9.348876953125, -9.0255126953125, -8.7021484375, -8.3787841796875, -8.055419921875, -7.7320556640625, -7.40869140625, -7.0853271484375, -6.761962890625, -6.4385986328125, -6.115234375, -5.7918701171875, -5.468505859375, -5.1451416015625, -4.82177734375, -4.4984130859375, -4.175048828125, -3.8516845703125, -3.5283203125, -3.2049560546875, -2.881591796875, -2.5582275390625, -2.23486328125, -1.9114990234375, -1.588134765625, -1.2647705078125, -0.94140625, -0.6180419921875, -0.294677734375, 0.0286865234375, 0.35205078125, 0.6754150390625, 0.998779296875, 1.3221435546875, 1.6455078125, 1.9688720703125, 2.292236328125, 2.6156005859375, 2.93896484375, 3.2623291015625, 3.585693359375, 3.9090576171875, 4.232421875, 4.5557861328125, 4.879150390625, 5.2025146484375, 5.52587890625, 5.8492431640625, 6.172607421875, 6.4959716796875, 6.8193359375, 7.1427001953125, 7.466064453125, 7.7894287109375, 8.11279296875, 8.4361572265625, 8.759521484375, 9.0828857421875, 9.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 9.0, 5.0, 14.0, 19.0, 30.0, 34.0, 55.0, 63.0, 98.0, 131.0, 209.0, 354.0, 569.0, 1210.0, 10126.0, 3127372.0, 2985.0, 980.0, 458.0, 301.0, 194.0, 121.0, 98.0, 59.0, 58.0, 32.0, 16.0, 27.0, 9.0, 11.0, 9.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.107421875, -47.43359375, -45.759765625, -44.0859375, -42.412109375, -40.73828125, -39.064453125, -37.390625, -35.716796875, -34.04296875, -32.369140625, -30.6953125, -29.021484375, -27.34765625, -25.673828125, -24.0, -22.326171875, -20.65234375, -18.978515625, -17.3046875, -15.630859375, -13.95703125, -12.283203125, -10.609375, -8.935546875, -7.26171875, -5.587890625, -3.9140625, -2.240234375, -0.56640625, 1.107421875, 2.78125, 4.455078125, 6.12890625, 7.802734375, 9.4765625, 11.150390625, 12.82421875, 14.498046875, 16.171875, 17.845703125, 19.51953125, 21.193359375, 22.8671875, 24.541015625, 26.21484375, 27.888671875, 29.5625, 31.236328125, 32.91015625, 34.583984375, 36.2578125, 37.931640625, 39.60546875, 41.279296875, 42.953125, 44.626953125, 46.30078125, 47.974609375, 49.6484375, 51.322265625, 52.99609375, 54.669921875, 56.34375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 18.0, 61.0, 138.0, 180.0, 224.0, 186.0, 109.0, 52.0, 17.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.63885498046875, -28.664894104003906, -27.690933227539062, -26.71697425842285, -25.743013381958008, -24.769052505493164, -23.795093536376953, -22.82113265991211, -21.847171783447266, -20.873210906982422, -19.899250030517578, -18.925291061401367, -17.951330184936523, -16.97736930847168, -16.00341033935547, -15.029449462890625, -14.055488586425781, -13.081527709960938, -12.10756778717041, -11.133607864379883, -10.159646987915039, -9.185686111450195, -8.211726188659668, -7.237765789031982, -6.263805389404297, -5.289844989776611, -4.315884590148926, -3.3419241905212402, -2.3679637908935547, -1.3940033912658691, -0.4200429916381836, 0.553917407989502, 1.5278778076171875, 2.501838207244873, 3.4757986068725586, 4.449759006500244, 5.42371940612793, 6.397679805755615, 7.371640205383301, 8.345600128173828, 9.319561004638672, 10.293521881103516, 11.267481803894043, 12.24144172668457, 13.215402603149414, 14.189363479614258, 15.163323402404785, 16.137283325195312, 17.111244201660156, 18.085205078125, 19.059165954589844, 20.033124923706055, 21.0070858001709, 21.981046676635742, 22.955005645751953, 23.928966522216797, 24.90292739868164, 25.876888275146484, 26.850849151611328, 27.82480812072754, 28.798768997192383, 29.772729873657227, 30.746688842773438, 31.72064971923828, 32.694610595703125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 10.0, 9.0, 14.0, 16.0, 26.0, 19.0, 24.0, 31.0, 24.0, 28.0, 27.0, 29.0, 37.0, 55.0, 44.0, 46.0, 51.0, 46.0, 50.0, 48.0, 30.0, 49.0, 26.0, 34.0, 31.0, 23.0, 19.0, 19.0, 26.0, 12.0, 15.0, 14.0, 12.0, 3.0, 8.0, 10.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.97964096069336, -22.160324096679688, -21.341007232666016, -20.521690368652344, -19.702373504638672, -18.883056640625, -18.06374168395996, -17.24442481994629, -16.425107955932617, -15.605791091918945, -14.786474227905273, -13.967158317565918, -13.147841453552246, -12.328524589538574, -11.509208679199219, -10.689891815185547, -9.870574951171875, -9.051258087158203, -8.231941223144531, -7.412625312805176, -6.593308448791504, -5.773991584777832, -4.954675197601318, -4.135358810424805, -3.316041946411133, -2.49672532081604, -1.6774086952209473, -0.8580920696258545, -0.03877544403076172, 0.7805414199829102, 1.5998578071594238, 2.4191741943359375, 3.2384910583496094, 4.057807922363281, 4.877124309539795, 5.696440696716309, 6.5157575607299805, 7.335074424743652, 8.154390335083008, 8.97370719909668, 9.793024063110352, 10.612340927124023, 11.431657791137695, 12.25097370147705, 13.070290565490723, 13.889607429504395, 14.70892333984375, 15.528240203857422, 16.347557067871094, 17.166873931884766, 17.986190795898438, 18.80550765991211, 19.62482452392578, 20.444141387939453, 21.263456344604492, 22.082773208618164, 22.902090072631836, 23.721406936645508, 24.54072380065918, 25.36004066467285, 26.17935562133789, 26.998672485351562, 27.817989349365234, 28.637306213378906, 29.456623077392578]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 19.0, 11.0, 16.0, 26.0, 28.0, 30.0, 32.0, 40.0, 41.0, 37.0, 34.0, 54.0, 43.0, 41.0, 48.0, 44.0, 42.0, 29.0, 39.0, 31.0, 32.0, 38.0, 30.0, 22.0, 17.0, 24.0, 26.0, 12.0, 19.0, 12.0, 6.0, 14.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5714111328125, -4.424072265625, -4.2767333984375, -4.12939453125, -3.9820556640625, -3.834716796875, -3.6873779296875, -3.5400390625, -3.3927001953125, -3.245361328125, -3.0980224609375, -2.95068359375, -2.8033447265625, -2.656005859375, -2.5086669921875, -2.361328125, -2.2139892578125, -2.066650390625, -1.9193115234375, -1.77197265625, -1.6246337890625, -1.477294921875, -1.3299560546875, -1.1826171875, -1.0352783203125, -0.887939453125, -0.7406005859375, -0.59326171875, -0.4459228515625, -0.298583984375, -0.1512451171875, -0.00390625, 0.1434326171875, 0.290771484375, 0.4381103515625, 0.58544921875, 0.7327880859375, 0.880126953125, 1.0274658203125, 1.1748046875, 1.3221435546875, 1.469482421875, 1.6168212890625, 1.76416015625, 1.9114990234375, 2.058837890625, 2.2061767578125, 2.353515625, 2.5008544921875, 2.648193359375, 2.7955322265625, 2.94287109375, 3.0902099609375, 3.237548828125, 3.3848876953125, 3.5322265625, 3.6795654296875, 3.826904296875, 3.9742431640625, 4.12158203125, 4.2689208984375, 4.416259765625, 4.5635986328125, 4.7109375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 14.0, 13.0, 7.0, 17.0, 24.0, 21.0, 21.0, 44.0, 39.0, 45.0, 60.0, 77.0, 113.0, 155.0, 249.0, 479.0, 924.0, 2442.0, 7143.0, 28631.0, 184307.0, 1103989.0, 2109387.0, 638601.0, 92257.0, 16847.0, 4689.0, 1660.0, 765.0, 384.0, 217.0, 150.0, 113.0, 81.0, 68.0, 48.0, 51.0, 32.0, 23.0, 29.0, 11.0, 15.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.64453125, -7.4151611328125, -7.185791015625, -6.9564208984375, -6.72705078125, -6.4976806640625, -6.268310546875, -6.0389404296875, -5.8095703125, -5.5802001953125, -5.350830078125, -5.1214599609375, -4.89208984375, -4.6627197265625, -4.433349609375, -4.2039794921875, -3.974609375, -3.7452392578125, -3.515869140625, -3.2864990234375, -3.05712890625, -2.8277587890625, -2.598388671875, -2.3690185546875, -2.1396484375, -1.9102783203125, -1.680908203125, -1.4515380859375, -1.22216796875, -0.9927978515625, -0.763427734375, -0.5340576171875, -0.3046875, -0.0753173828125, 0.154052734375, 0.3834228515625, 0.61279296875, 0.8421630859375, 1.071533203125, 1.3009033203125, 1.5302734375, 1.7596435546875, 1.989013671875, 2.2183837890625, 2.44775390625, 2.6771240234375, 2.906494140625, 3.1358642578125, 3.365234375, 3.5946044921875, 3.823974609375, 4.0533447265625, 4.28271484375, 4.5120849609375, 4.741455078125, 4.9708251953125, 5.2001953125, 5.4295654296875, 5.658935546875, 5.8883056640625, 6.11767578125, 6.3470458984375, 6.576416015625, 6.8057861328125, 7.03515625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 13.0, 22.0, 33.0, 35.0, 43.0, 65.0, 78.0, 75.0, 94.0, 134.0, 174.0, 237.0, 321.0, 391.0, 468.0, 423.0, 352.0, 292.0, 186.0, 147.0, 88.0, 88.0, 57.0, 46.0, 47.0, 33.0, 26.0, 22.0, 14.0, 14.0, 6.0, 4.0, 6.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.696533203125, -5.48291015625, -5.269287109375, -5.0556640625, -4.842041015625, -4.62841796875, -4.414794921875, -4.201171875, -3.987548828125, -3.77392578125, -3.560302734375, -3.3466796875, -3.133056640625, -2.91943359375, -2.705810546875, -2.4921875, -2.278564453125, -2.06494140625, -1.851318359375, -1.6376953125, -1.424072265625, -1.21044921875, -0.996826171875, -0.783203125, -0.569580078125, -0.35595703125, -0.142333984375, 0.0712890625, 0.284912109375, 0.49853515625, 0.712158203125, 0.92578125, 1.139404296875, 1.35302734375, 1.566650390625, 1.7802734375, 1.993896484375, 2.20751953125, 2.421142578125, 2.634765625, 2.848388671875, 3.06201171875, 3.275634765625, 3.4892578125, 3.702880859375, 3.91650390625, 4.130126953125, 4.34375, 4.557373046875, 4.77099609375, 4.984619140625, 5.1982421875, 5.411865234375, 5.62548828125, 5.839111328125, 6.052734375, 6.266357421875, 6.47998046875, 6.693603515625, 6.9072265625, 7.120849609375, 7.33447265625, 7.548095703125, 7.76171875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 14.0, 30.0, 37.0, 68.0, 99.0, 175.0, 243.0, 477.0, 900.0, 1992.0, 8836.0, 222658.0, 3645602.0, 297902.0, 10776.0, 2266.0, 959.0, 488.0, 302.0, 153.0, 104.0, 69.0, 43.0, 31.0, 14.0, 14.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.84375, -15.307373046875, -14.77099609375, -14.234619140625, -13.6982421875, -13.161865234375, -12.62548828125, -12.089111328125, -11.552734375, -11.016357421875, -10.47998046875, -9.943603515625, -9.4072265625, -8.870849609375, -8.33447265625, -7.798095703125, -7.26171875, -6.725341796875, -6.18896484375, -5.652587890625, -5.1162109375, -4.579833984375, -4.04345703125, -3.507080078125, -2.970703125, -2.434326171875, -1.89794921875, -1.361572265625, -0.8251953125, -0.288818359375, 0.24755859375, 0.783935546875, 1.3203125, 1.856689453125, 2.39306640625, 2.929443359375, 3.4658203125, 4.002197265625, 4.53857421875, 5.074951171875, 5.611328125, 6.147705078125, 6.68408203125, 7.220458984375, 7.7568359375, 8.293212890625, 8.82958984375, 9.365966796875, 9.90234375, 10.438720703125, 10.97509765625, 11.511474609375, 12.0478515625, 12.584228515625, 13.12060546875, 13.656982421875, 14.193359375, 14.729736328125, 15.26611328125, 15.802490234375, 16.3388671875, 16.875244140625, 17.41162109375, 17.947998046875, 18.484375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 26.0, 199.0, 446.0, 270.0, 64.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.316314697265625, -53.8779182434082, -50.43952178955078, -47.00112533569336, -43.56272888183594, -40.124332427978516, -36.685935974121094, -33.24753952026367, -29.80914306640625, -26.370746612548828, -22.932350158691406, -19.493953704833984, -16.055557250976562, -12.61716079711914, -9.178764343261719, -5.740367889404297, -2.301971435546875, 1.1364250183105469, 4.574821472167969, 8.01321792602539, 11.451614379882812, 14.890010833740234, 18.328407287597656, 21.766803741455078, 25.2052001953125, 28.643596649169922, 32.081993103027344, 35.520389556884766, 38.95878601074219, 42.39718246459961, 45.83557891845703, 49.27397537231445, 52.712371826171875, 56.1507682800293, 59.58916473388672, 63.02756118774414, 66.46595764160156, 69.90435791015625, 73.3427505493164, 76.78114318847656, 80.21954345703125, 83.65794372558594, 87.0963363647461, 90.53472900390625, 93.97312927246094, 97.41152954101562, 100.84992218017578, 104.28831481933594, 107.72671508789062, 111.16511535644531, 114.60350799560547, 118.04190063476562, 121.48030090332031, 124.918701171875, 128.35708618164062, 131.7954864501953, 135.23388671875, 138.6722869873047, 142.11068725585938, 145.549072265625, 148.9874725341797, 152.42587280273438, 155.8642578125, 159.3026580810547, 162.74105834960938]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 13.0, 10.0, 19.0, 17.0, 19.0, 25.0, 32.0, 31.0, 34.0, 28.0, 33.0, 31.0, 35.0, 41.0, 36.0, 60.0, 52.0, 45.0, 38.0, 30.0, 51.0, 33.0, 32.0, 27.0, 25.0, 25.0, 29.0, 26.0, 17.0, 16.0, 7.0, 9.0, 14.0, 5.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.326858520507812, -23.46636390686035, -22.605867385864258, -21.745372772216797, -20.884876251220703, -20.024381637573242, -19.16388702392578, -18.303390502929688, -17.442893981933594, -16.582399368286133, -15.721902847290039, -14.861408233642578, -14.000911712646484, -13.140417098999023, -12.279921531677246, -11.419425964355469, -10.558931350708008, -9.69843578338623, -8.837940216064453, -7.977445125579834, -7.116949558258057, -6.256453990936279, -5.39595890045166, -4.535463333129883, -3.6749677658081055, -2.814472198486328, -1.9539768695831299, -1.0934815406799316, -0.2329859733581543, 0.627509593963623, 1.4880046844482422, 2.3485002517700195, 3.208995819091797, 4.069491386413574, 4.929986953735352, 5.790482044219971, 6.650977611541748, 7.511473178863525, 8.371968269348145, 9.232463836669922, 10.0929594039917, 10.953454971313477, 11.813950538635254, 12.674446105957031, 13.534940719604492, 14.395437240600586, 15.255931854248047, 16.11642837524414, 16.9769229888916, 17.837417602539062, 18.697914123535156, 19.558408737182617, 20.41890525817871, 21.279399871826172, 22.139896392822266, 23.000391006469727, 23.860885620117188, 24.72138023376465, 25.581876754760742, 26.442371368408203, 27.302867889404297, 28.163362503051758, 29.02385711669922, 29.884353637695312, 30.744850158691406]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 8.0, 16.0, 17.0, 19.0, 22.0, 22.0, 28.0, 30.0, 38.0, 28.0, 40.0, 32.0, 44.0, 46.0, 43.0, 46.0, 43.0, 39.0, 41.0, 28.0, 33.0, 39.0, 32.0, 29.0, 34.0, 33.0, 28.0, 24.0, 16.0, 11.0, 8.0, 15.0, 9.0, 12.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.75, -3.642120361328125, -3.53424072265625, -3.426361083984375, -3.3184814453125, -3.210601806640625, -3.10272216796875, -2.994842529296875, -2.886962890625, -2.779083251953125, -2.67120361328125, -2.563323974609375, -2.4554443359375, -2.347564697265625, -2.23968505859375, -2.131805419921875, -2.02392578125, -1.916046142578125, -1.80816650390625, -1.700286865234375, -1.5924072265625, -1.484527587890625, -1.37664794921875, -1.268768310546875, -1.160888671875, -1.053009033203125, -0.94512939453125, -0.837249755859375, -0.7293701171875, -0.621490478515625, -0.51361083984375, -0.405731201171875, -0.2978515625, -0.189971923828125, -0.08209228515625, 0.025787353515625, 0.1336669921875, 0.241546630859375, 0.34942626953125, 0.457305908203125, 0.565185546875, 0.673065185546875, 0.78094482421875, 0.888824462890625, 0.9967041015625, 1.104583740234375, 1.21246337890625, 1.320343017578125, 1.42822265625, 1.536102294921875, 1.64398193359375, 1.751861572265625, 1.8597412109375, 1.967620849609375, 2.07550048828125, 2.183380126953125, 2.291259765625, 2.399139404296875, 2.50701904296875, 2.614898681640625, 2.7227783203125, 2.830657958984375, 2.93853759765625, 3.046417236328125, 3.154296875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 13.0, 17.0, 12.0, 27.0, 34.0, 54.0, 72.0, 97.0, 140.0, 200.0, 303.0, 390.0, 618.0, 846.0, 1261.0, 1798.0, 2649.0, 4028.0, 5927.0, 9059.0, 13681.0, 20999.0, 32979.0, 52282.0, 87002.0, 162845.0, 273763.0, 152757.0, 82898.0, 49863.0, 31667.0, 20475.0, 13361.0, 8658.0, 5738.0, 3786.0, 2630.0, 1734.0, 1176.0, 870.0, 586.0, 388.0, 251.0, 187.0, 128.0, 91.0, 63.0, 62.0, 40.0, 14.0, 19.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.53955078125, -0.5229263305664062, -0.5063018798828125, -0.48967742919921875, -0.473052978515625, -0.45642852783203125, -0.4398040771484375, -0.42317962646484375, -0.40655517578125, -0.38993072509765625, -0.3733062744140625, -0.35668182373046875, -0.340057373046875, -0.32343292236328125, -0.3068084716796875, -0.29018402099609375, -0.2735595703125, -0.25693511962890625, -0.2403106689453125, -0.22368621826171875, -0.207061767578125, -0.19043731689453125, -0.1738128662109375, -0.15718841552734375, -0.14056396484375, -0.12393951416015625, -0.1073150634765625, -0.09069061279296875, -0.074066162109375, -0.05744171142578125, -0.0408172607421875, -0.02419281005859375, -0.007568359375, 0.00905609130859375, 0.0256805419921875, 0.04230499267578125, 0.058929443359375, 0.07555389404296875, 0.0921783447265625, 0.10880279541015625, 0.12542724609375, 0.14205169677734375, 0.1586761474609375, 0.17530059814453125, 0.191925048828125, 0.20854949951171875, 0.2251739501953125, 0.24179840087890625, 0.2584228515625, 0.27504730224609375, 0.2916717529296875, 0.30829620361328125, 0.324920654296875, 0.34154510498046875, 0.3581695556640625, 0.37479400634765625, 0.39141845703125, 0.40804290771484375, 0.4246673583984375, 0.44129180908203125, 0.457916259765625, 0.47454071044921875, 0.4911651611328125, 0.5077896118164062, 0.5244140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 5.0, 10.0, 8.0, 10.0, 16.0, 16.0, 25.0, 13.0, 23.0, 31.0, 26.0, 26.0, 32.0, 35.0, 39.0, 26.0, 47.0, 35.0, 26.0, 1057.0, 37.0, 31.0, 39.0, 27.0, 41.0, 28.0, 28.0, 31.0, 32.0, 22.0, 18.0, 24.0, 21.0, 18.0, 9.0, 19.0, 14.0, 8.0, 12.0, 6.0, 6.0, 6.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.8974609375, -1.8379364013671875, -1.778411865234375, -1.7188873291015625, -1.65936279296875, -1.5998382568359375, -1.540313720703125, -1.4807891845703125, -1.4212646484375, -1.3617401123046875, -1.302215576171875, -1.2426910400390625, -1.18316650390625, -1.1236419677734375, -1.064117431640625, -1.0045928955078125, -0.945068359375, -0.8855438232421875, -0.826019287109375, -0.7664947509765625, -0.70697021484375, -0.6474456787109375, -0.587921142578125, -0.5283966064453125, -0.4688720703125, -0.4093475341796875, -0.349822998046875, -0.2902984619140625, -0.23077392578125, -0.1712493896484375, -0.111724853515625, -0.0522003173828125, 0.00732421875, 0.0668487548828125, 0.126373291015625, 0.1858978271484375, 0.24542236328125, 0.3049468994140625, 0.364471435546875, 0.4239959716796875, 0.4835205078125, 0.5430450439453125, 0.602569580078125, 0.6620941162109375, 0.72161865234375, 0.7811431884765625, 0.840667724609375, 0.9001922607421875, 0.959716796875, 1.0192413330078125, 1.078765869140625, 1.1382904052734375, 1.19781494140625, 1.2573394775390625, 1.316864013671875, 1.3763885498046875, 1.4359130859375, 1.4954376220703125, 1.554962158203125, 1.6144866943359375, 1.67401123046875, 1.7335357666015625, 1.793060302734375, 1.8525848388671875, 1.912109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 9.0, 10.0, 10.0, 28.0, 32.0, 56.0, 61.0, 98.0, 129.0, 165.0, 220.0, 311.0, 451.0, 597.0, 867.0, 1146.0, 1628.0, 2249.0, 3137.0, 4200.0, 5771.0, 7903.0, 10796.0, 14930.0, 21391.0, 30365.0, 44537.0, 68000.0, 111024.0, 1249338.0, 194253.0, 108419.0, 66211.0, 43511.0, 30001.0, 20944.0, 14915.0, 10754.0, 7745.0, 5613.0, 4149.0, 3028.0, 2179.0, 1611.0, 1139.0, 887.0, 688.0, 469.0, 365.0, 239.0, 182.0, 112.0, 79.0, 64.0, 37.0, 37.0, 18.0, 15.0, 7.0, 5.0, 2.0, 6.0], "bins": [-0.4130859375, -0.4001655578613281, -0.38724517822265625, -0.3743247985839844, -0.3614044189453125, -0.3484840393066406, -0.33556365966796875, -0.3226432800292969, -0.309722900390625, -0.2968025207519531, -0.28388214111328125, -0.2709617614746094, -0.2580413818359375, -0.24512100219726562, -0.23220062255859375, -0.21928024291992188, -0.20635986328125, -0.19343948364257812, -0.18051910400390625, -0.16759872436523438, -0.1546783447265625, -0.14175796508789062, -0.12883758544921875, -0.11591720581054688, -0.102996826171875, -0.09007644653320312, -0.07715606689453125, -0.06423568725585938, -0.0513153076171875, -0.038394927978515625, -0.02547454833984375, -0.012554168701171875, 0.0003662109375, 0.013286590576171875, 0.02620697021484375, 0.039127349853515625, 0.0520477294921875, 0.06496810913085938, 0.07788848876953125, 0.09080886840820312, 0.103729248046875, 0.11664962768554688, 0.12957000732421875, 0.14249038696289062, 0.1554107666015625, 0.16833114624023438, 0.18125152587890625, 0.19417190551757812, 0.20709228515625, 0.22001266479492188, 0.23293304443359375, 0.24585342407226562, 0.2587738037109375, 0.2716941833496094, 0.28461456298828125, 0.2975349426269531, 0.310455322265625, 0.3233757019042969, 0.33629608154296875, 0.3492164611816406, 0.3621368408203125, 0.3750572204589844, 0.38797760009765625, 0.4008979797363281, 0.413818359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 3.0, 8.0, 12.0, 9.0, 18.0, 29.0, 26.0, 25.0, 29.0, 39.0, 38.0, 46.0, 58.0, 64.0, 54.0, 61.0, 70.0, 38.0, 54.0, 42.0, 39.0, 40.0, 35.0, 37.0, 24.0, 13.0, 20.0, 14.0, 17.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28640365600586e-05, -8.961278945207596e-05, -8.636154234409332e-05, -8.311029523611069e-05, -7.985904812812805e-05, -7.660780102014542e-05, -7.335655391216278e-05, -7.010530680418015e-05, -6.685405969619751e-05, -6.360281258821487e-05, -6.035156548023224e-05, -5.71003183722496e-05, -5.384907126426697e-05, -5.059782415628433e-05, -4.73465770483017e-05, -4.409532994031906e-05, -4.0844082832336426e-05, -3.759283572435379e-05, -3.4341588616371155e-05, -3.109034150838852e-05, -2.7839094400405884e-05, -2.4587847292423248e-05, -2.1336600184440613e-05, -1.8085353076457977e-05, -1.4834105968475342e-05, -1.1582858860492706e-05, -8.33161175251007e-06, -5.080364644527435e-06, -1.8291175365447998e-06, 1.4221295714378357e-06, 4.673376679420471e-06, 7.924623787403107e-06, 1.1175870895385742e-05, 1.4427118003368378e-05, 1.7678365111351013e-05, 2.092961221933365e-05, 2.4180859327316284e-05, 2.743210643529892e-05, 3.0683353543281555e-05, 3.393460065126419e-05, 3.7185847759246826e-05, 4.043709486722946e-05, 4.36883419752121e-05, 4.693958908319473e-05, 5.019083619117737e-05, 5.3442083299160004e-05, 5.669333040714264e-05, 5.9944577515125275e-05, 6.319582462310791e-05, 6.644707173109055e-05, 6.969831883907318e-05, 7.294956594705582e-05, 7.620081305503845e-05, 7.945206016302109e-05, 8.270330727100372e-05, 8.595455437898636e-05, 8.9205801486969e-05, 9.245704859495163e-05, 9.570829570293427e-05, 9.89595428109169e-05, 0.00010221078991889954, 0.00010546203702688217, 0.00010871328413486481, 0.00011196453124284744, 0.00011521577835083008]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 6.0, 6.0, 5.0, 7.0, 16.0, 11.0, 19.0, 28.0, 26.0, 44.0, 52.0, 65.0, 101.0, 135.0, 179.0, 273.0, 409.0, 677.0, 1531.0, 184699.0, 854589.0, 3281.0, 839.0, 486.0, 311.0, 205.0, 127.0, 117.0, 80.0, 65.0, 41.0, 31.0, 24.0, 15.0, 12.0, 9.0, 7.0, 12.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0023288726806640625, -0.0022678375244140625, -0.0022068023681640625, -0.0021457672119140625, -0.0020847320556640625, -0.0020236968994140625, -0.0019626617431640625, -0.0019016265869140625, -0.0018405914306640625, -0.0017795562744140625, -0.0017185211181640625, -0.0016574859619140625, -0.0015964508056640625, -0.0015354156494140625, -0.0014743804931640625, -0.0014133453369140625, -0.0013523101806640625, -0.0012912750244140625, -0.0012302398681640625, -0.0011692047119140625, -0.0011081695556640625, -0.0010471343994140625, -0.0009860992431640625, -0.0009250640869140625, -0.0008640289306640625, -0.0008029937744140625, -0.0007419586181640625, -0.0006809234619140625, -0.0006198883056640625, -0.0005588531494140625, -0.0004978179931640625, -0.0004367828369140625, -0.0003757476806640625, -0.0003147125244140625, -0.0002536773681640625, -0.0001926422119140625, -0.0001316070556640625, -7.05718994140625e-05, -9.5367431640625e-06, 5.14984130859375e-05, 0.0001125335693359375, 0.0001735687255859375, 0.0002346038818359375, 0.0002956390380859375, 0.0003566741943359375, 0.0004177093505859375, 0.0004787445068359375, 0.0005397796630859375, 0.0006008148193359375, 0.0006618499755859375, 0.0007228851318359375, 0.0007839202880859375, 0.0008449554443359375, 0.0009059906005859375, 0.0009670257568359375, 0.0010280609130859375, 0.0010890960693359375, 0.0011501312255859375, 0.0012111663818359375, 0.0012722015380859375, 0.0013332366943359375, 0.0013942718505859375, 0.0014553070068359375, 0.0015163421630859375, 0.0015773773193359375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 26.0, 76.0, 176.0, 256.0, 246.0, 140.0, 58.0, 16.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.349190516630188e-05, -5.8578654716257006e-05, -5.3665404266212136e-05, -4.875215017818846e-05, -4.383889972814359e-05, -3.892564927809872e-05, -3.401239519007504e-05, -2.909914474003017e-05, -2.41858942899853e-05, -1.927264383994043e-05, -1.4359391570906155e-05, -9.446140211366583e-06, -4.5328888518270105e-06, 3.8036159821785986e-07, 5.293613867252134e-06, 1.0206866136286408e-05, 1.5120116586331278e-05, 2.003336703637615e-05, 2.4946619305410422e-05, 2.9859871574444696e-05, 3.477312202448957e-05, 3.968637247453444e-05, 4.4599626562558115e-05, 4.9512877012602985e-05, 5.4426127462647855e-05, 5.9339377912692726e-05, 6.42526283627376e-05, 6.916587881278247e-05, 7.407912926282734e-05, 7.899237971287221e-05, 8.390563743887469e-05, 8.881888788891956e-05, 9.373214561492205e-05, 9.864539606496692e-05, 0.00010355864651501179, 0.00010847189696505666, 0.00011338514741510153, 0.0001182983978651464, 0.00012321164831519127, 0.00012812489876523614, 0.000133038149215281, 0.00013795139966532588, 0.00014286465011537075, 0.00014777790056541562, 0.0001526911510154605, 0.00015760440146550536, 0.00016251765191555023, 0.0001674309023655951, 0.0001723441673675552, 0.00017725741781760007, 0.00018217066826764494, 0.0001870839187176898, 0.00019199716916773468, 0.00019691041961777955, 0.00020182367006782442, 0.00020673693506978452, 0.0002116501855198294, 0.00021656343596987426, 0.00022147668641991913, 0.000226389936869964, 0.00023130318732000887, 0.00023621643777005374, 0.00024112968822009861, 0.0002460429386701435, 0.00025095618912018836]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 2.0, 11.0, 12.0, 14.0, 21.0, 17.0, 18.0, 29.0, 31.0, 19.0, 37.0, 37.0, 32.0, 43.0, 39.0, 50.0, 46.0, 48.0, 42.0, 38.0, 47.0, 40.0, 38.0, 30.0, 34.0, 36.0, 27.0, 26.0, 19.0, 26.0, 12.0, 9.0, 17.0, 11.0, 8.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.0558319091796875e-05, -5.88512048125267e-05, -5.714409053325653e-05, -5.543697625398636e-05, -5.3729861974716187e-05, -5.2022747695446014e-05, -5.031563341617584e-05, -4.860851913690567e-05, -4.69014048576355e-05, -4.5194290578365326e-05, -4.3487176299095154e-05, -4.178006201982498e-05, -4.007294774055481e-05, -3.836583346128464e-05, -3.6658719182014465e-05, -3.495160490274429e-05, -3.324449062347412e-05, -3.153737634420395e-05, -2.9830262064933777e-05, -2.8123147785663605e-05, -2.6416033506393433e-05, -2.470891922712326e-05, -2.300180494785309e-05, -2.1294690668582916e-05, -1.9587576389312744e-05, -1.7880462110042572e-05, -1.61733478307724e-05, -1.4466233551502228e-05, -1.2759119272232056e-05, -1.1052004992961884e-05, -9.344890713691711e-06, -7.63777643442154e-06, -5.930662155151367e-06, -4.223547875881195e-06, -2.516433596611023e-06, -8.093193173408508e-07, 8.977949619293213e-07, 2.6049092411994934e-06, 4.3120235204696655e-06, 6.019137799739838e-06, 7.72625207901001e-06, 9.433366358280182e-06, 1.1140480637550354e-05, 1.2847594916820526e-05, 1.4554709196090698e-05, 1.626182347536087e-05, 1.7968937754631042e-05, 1.9676052033901215e-05, 2.1383166313171387e-05, 2.309028059244156e-05, 2.479739487171173e-05, 2.6504509150981903e-05, 2.8211623430252075e-05, 2.9918737709522247e-05, 3.162585198879242e-05, 3.333296626806259e-05, 3.5040080547332764e-05, 3.6747194826602936e-05, 3.845430910587311e-05, 4.016142338514328e-05, 4.186853766441345e-05, 4.3575651943683624e-05, 4.5282766222953796e-05, 4.698988050222397e-05, 4.869699478149414e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 8.0, 16.0, 17.0, 19.0, 22.0, 22.0, 28.0, 30.0, 38.0, 28.0, 40.0, 32.0, 44.0, 46.0, 43.0, 46.0, 43.0, 39.0, 41.0, 28.0, 33.0, 39.0, 32.0, 29.0, 34.0, 33.0, 28.0, 24.0, 16.0, 11.0, 8.0, 15.0, 9.0, 12.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.75, -3.642120361328125, -3.53424072265625, -3.426361083984375, -3.3184814453125, -3.210601806640625, -3.10272216796875, -2.994842529296875, -2.886962890625, -2.779083251953125, -2.67120361328125, -2.563323974609375, -2.4554443359375, -2.347564697265625, -2.23968505859375, -2.131805419921875, -2.02392578125, -1.916046142578125, -1.80816650390625, -1.700286865234375, -1.5924072265625, -1.484527587890625, -1.37664794921875, -1.268768310546875, -1.160888671875, -1.053009033203125, -0.94512939453125, -0.837249755859375, -0.7293701171875, -0.621490478515625, -0.51361083984375, -0.405731201171875, -0.2978515625, -0.189971923828125, -0.08209228515625, 0.025787353515625, 0.1336669921875, 0.241546630859375, 0.34942626953125, 0.457305908203125, 0.565185546875, 0.673065185546875, 0.78094482421875, 0.888824462890625, 0.9967041015625, 1.104583740234375, 1.21246337890625, 1.320343017578125, 1.42822265625, 1.536102294921875, 1.64398193359375, 1.751861572265625, 1.8597412109375, 1.967620849609375, 2.07550048828125, 2.183380126953125, 2.291259765625, 2.399139404296875, 2.50701904296875, 2.614898681640625, 2.7227783203125, 2.830657958984375, 2.93853759765625, 3.046417236328125, 3.154296875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 5.0, 9.0, 9.0, 14.0, 19.0, 33.0, 34.0, 62.0, 77.0, 82.0, 128.0, 163.0, 227.0, 302.0, 364.0, 536.0, 718.0, 1019.0, 1341.0, 1891.0, 2771.0, 4779.0, 15921.0, 155685.0, 698751.0, 135045.0, 14263.0, 4526.0, 2775.0, 1932.0, 1316.0, 984.0, 734.0, 530.0, 385.0, 265.0, 238.0, 156.0, 111.0, 85.0, 65.0, 53.0, 43.0, 26.0, 20.0, 19.0, 17.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3282470703125, -8.054931640625, -7.7816162109375, -7.50830078125, -7.2349853515625, -6.961669921875, -6.6883544921875, -6.4150390625, -6.1417236328125, -5.868408203125, -5.5950927734375, -5.32177734375, -5.0484619140625, -4.775146484375, -4.5018310546875, -4.228515625, -3.9552001953125, -3.681884765625, -3.4085693359375, -3.13525390625, -2.8619384765625, -2.588623046875, -2.3153076171875, -2.0419921875, -1.7686767578125, -1.495361328125, -1.2220458984375, -0.94873046875, -0.6754150390625, -0.402099609375, -0.1287841796875, 0.14453125, 0.4178466796875, 0.691162109375, 0.9644775390625, 1.23779296875, 1.5111083984375, 1.784423828125, 2.0577392578125, 2.3310546875, 2.6043701171875, 2.877685546875, 3.1510009765625, 3.42431640625, 3.6976318359375, 3.970947265625, 4.2442626953125, 4.517578125, 4.7908935546875, 5.064208984375, 5.3375244140625, 5.61083984375, 5.8841552734375, 6.157470703125, 6.4307861328125, 6.7041015625, 6.9774169921875, 7.250732421875, 7.5240478515625, 7.79736328125, 8.0706787109375, 8.343994140625, 8.6173095703125, 8.890625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 7.0, 9.0, 12.0, 19.0, 15.0, 16.0, 17.0, 32.0, 28.0, 37.0, 56.0, 61.0, 78.0, 119.0, 370.0, 1576.0, 153.0, 85.0, 52.0, 53.0, 41.0, 40.0, 34.0, 29.0, 25.0, 16.0, 11.0, 10.0, 16.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.510498046875, -10.16162109375, -9.812744140625, -9.4638671875, -9.114990234375, -8.76611328125, -8.417236328125, -8.068359375, -7.719482421875, -7.37060546875, -7.021728515625, -6.6728515625, -6.323974609375, -5.97509765625, -5.626220703125, -5.27734375, -4.928466796875, -4.57958984375, -4.230712890625, -3.8818359375, -3.532958984375, -3.18408203125, -2.835205078125, -2.486328125, -2.137451171875, -1.78857421875, -1.439697265625, -1.0908203125, -0.741943359375, -0.39306640625, -0.044189453125, 0.3046875, 0.653564453125, 1.00244140625, 1.351318359375, 1.7001953125, 2.049072265625, 2.39794921875, 2.746826171875, 3.095703125, 3.444580078125, 3.79345703125, 4.142333984375, 4.4912109375, 4.840087890625, 5.18896484375, 5.537841796875, 5.88671875, 6.235595703125, 6.58447265625, 6.933349609375, 7.2822265625, 7.631103515625, 7.97998046875, 8.328857421875, 8.677734375, 9.026611328125, 9.37548828125, 9.724365234375, 10.0732421875, 10.422119140625, 10.77099609375, 11.119873046875, 11.46875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 19.0, 42.0, 33.0, 33.0, 48.0, 72.0, 92.0, 178.0, 222.0, 432.0, 799.0, 2312.0, 249036.0, 2887497.0, 2622.0, 971.0, 425.0, 259.0, 173.0, 100.0, 81.0, 66.0, 47.0, 24.0, 17.0, 16.0, 22.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.07568359375, -37.7763671875, -36.47705078125, -35.177734375, -33.87841796875, -32.5791015625, -31.27978515625, -29.98046875, -28.68115234375, -27.3818359375, -26.08251953125, -24.783203125, -23.48388671875, -22.1845703125, -20.88525390625, -19.5859375, -18.28662109375, -16.9873046875, -15.68798828125, -14.388671875, -13.08935546875, -11.7900390625, -10.49072265625, -9.19140625, -7.89208984375, -6.5927734375, -5.29345703125, -3.994140625, -2.69482421875, -1.3955078125, -0.09619140625, 1.203125, 2.50244140625, 3.8017578125, 5.10107421875, 6.400390625, 7.69970703125, 8.9990234375, 10.29833984375, 11.59765625, 12.89697265625, 14.1962890625, 15.49560546875, 16.794921875, 18.09423828125, 19.3935546875, 20.69287109375, 21.9921875, 23.29150390625, 24.5908203125, 25.89013671875, 27.189453125, 28.48876953125, 29.7880859375, 31.08740234375, 32.38671875, 33.68603515625, 34.9853515625, 36.28466796875, 37.583984375, 38.88330078125, 40.1826171875, 41.48193359375, 42.78125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 24.0, 45.0, 97.0, 208.0, 263.0, 231.0, 86.0, 37.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.93561553955078, -46.724857330322266, -45.514095306396484, -44.30333709716797, -43.09257888793945, -41.88181686401367, -40.671058654785156, -39.460296630859375, -38.24953842163086, -37.038780212402344, -35.82801818847656, -34.61725997924805, -33.40650177001953, -32.19573974609375, -30.984981536865234, -29.774221420288086, -28.56346321105957, -27.352703094482422, -26.141944885253906, -24.931184768676758, -23.72042465209961, -22.509666442871094, -21.298906326293945, -20.088146209716797, -18.87738800048828, -17.666627883911133, -16.455869674682617, -15.245109558105469, -14.03434944152832, -12.823590278625488, -11.612831115722656, -10.402070999145508, -9.19131088256836, -7.980551242828369, -6.769791603088379, -5.559032440185547, -4.348272800445557, -3.1375131607055664, -1.9267539978027344, -0.7159938812255859, 0.4947652816772461, 1.7055248022079468, 2.9162843227386475, 4.127043724060059, 5.337803363800049, 6.548563003540039, 7.759322166442871, 8.97008228302002, 10.180841445922852, 11.391600608825684, 12.602360725402832, 13.813119888305664, 15.023880004882812, 16.234638214111328, 17.445398330688477, 18.656158447265625, 19.86691665649414, 21.07767677307129, 22.288434982299805, 23.499195098876953, 24.7099552154541, 25.92071533203125, 27.131473541259766, 28.342233657836914, 29.552993774414062]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 16.0, 10.0, 11.0, 9.0, 12.0, 12.0, 11.0, 22.0, 16.0, 16.0, 33.0, 28.0, 30.0, 27.0, 27.0, 34.0, 31.0, 41.0, 29.0, 40.0, 40.0, 37.0, 39.0, 29.0, 25.0, 34.0, 25.0, 29.0, 30.0, 36.0, 31.0, 27.0, 30.0, 19.0, 20.0, 8.0, 20.0, 10.0, 11.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.995271682739258, -18.326915740966797, -17.658557891845703, -16.990201950073242, -16.32184600830078, -15.65349006652832, -14.985133171081543, -14.316776275634766, -13.648420333862305, -12.980064392089844, -12.311707496643066, -11.643350601196289, -10.974994659423828, -10.306638717651367, -9.63828182220459, -8.969924926757812, -8.301568984985352, -7.633212566375732, -6.964856147766113, -6.296499729156494, -5.628143310546875, -4.959786891937256, -4.291430473327637, -3.6230740547180176, -2.9547176361083984, -2.2863612174987793, -1.6180047988891602, -0.949648380279541, -0.2812919616699219, 0.38706445693969727, 1.0554208755493164, 1.7237772941589355, 2.392131805419922, 3.060488224029541, 3.72884464263916, 4.397201061248779, 5.065557479858398, 5.733913898468018, 6.402270317077637, 7.070626735687256, 7.738983154296875, 8.407339096069336, 9.075695991516113, 9.74405288696289, 10.412408828735352, 11.080764770507812, 11.74912166595459, 12.417478561401367, 13.085834503173828, 13.754190444946289, 14.422547340393066, 15.090904235839844, 15.759260177612305, 16.427616119384766, 17.09597396850586, 17.76432991027832, 18.43268585205078, 19.101041793823242, 19.769397735595703, 20.437755584716797, 21.106111526489258, 21.77446746826172, 22.442825317382812, 23.111181259155273, 23.779537200927734]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 8.0, 6.0, 5.0, 5.0, 6.0, 12.0, 17.0, 18.0, 16.0, 24.0, 18.0, 26.0, 31.0, 23.0, 38.0, 26.0, 37.0, 43.0, 29.0, 41.0, 30.0, 42.0, 42.0, 48.0, 38.0, 32.0, 32.0, 36.0, 38.0, 35.0, 19.0, 23.0, 26.0, 26.0, 19.0, 13.0, 12.0, 17.0, 13.0, 4.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.40234375, -3.29425048828125, -3.1861572265625, -3.07806396484375, -2.969970703125, -2.86187744140625, -2.7537841796875, -2.64569091796875, -2.53759765625, -2.42950439453125, -2.3214111328125, -2.21331787109375, -2.105224609375, -1.99713134765625, -1.8890380859375, -1.78094482421875, -1.6728515625, -1.56475830078125, -1.4566650390625, -1.34857177734375, -1.240478515625, -1.13238525390625, -1.0242919921875, -0.91619873046875, -0.80810546875, -0.70001220703125, -0.5919189453125, -0.48382568359375, -0.375732421875, -0.26763916015625, -0.1595458984375, -0.05145263671875, 0.056640625, 0.16473388671875, 0.2728271484375, 0.38092041015625, 0.489013671875, 0.59710693359375, 0.7052001953125, 0.81329345703125, 0.92138671875, 1.02947998046875, 1.1375732421875, 1.24566650390625, 1.353759765625, 1.46185302734375, 1.5699462890625, 1.67803955078125, 1.7861328125, 1.89422607421875, 2.0023193359375, 2.11041259765625, 2.218505859375, 2.32659912109375, 2.4346923828125, 2.54278564453125, 2.65087890625, 2.75897216796875, 2.8670654296875, 2.97515869140625, 3.083251953125, 3.19134521484375, 3.2994384765625, 3.40753173828125, 3.515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 18.0, 13.0, 15.0, 20.0, 29.0, 32.0, 36.0, 44.0, 57.0, 74.0, 92.0, 156.0, 370.0, 1081.0, 3979.0, 26213.0, 529249.0, 3153552.0, 450069.0, 23380.0, 3776.0, 1027.0, 340.0, 148.0, 94.0, 82.0, 65.0, 50.0, 29.0, 28.0, 30.0, 31.0, 16.0, 8.0, 15.0, 7.0, 10.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.5390625, -10.2042236328125, -9.869384765625, -9.5345458984375, -9.19970703125, -8.8648681640625, -8.530029296875, -8.1951904296875, -7.8603515625, -7.5255126953125, -7.190673828125, -6.8558349609375, -6.52099609375, -6.1861572265625, -5.851318359375, -5.5164794921875, -5.181640625, -4.8468017578125, -4.511962890625, -4.1771240234375, -3.84228515625, -3.5074462890625, -3.172607421875, -2.8377685546875, -2.5029296875, -2.1680908203125, -1.833251953125, -1.4984130859375, -1.16357421875, -0.8287353515625, -0.493896484375, -0.1590576171875, 0.17578125, 0.5106201171875, 0.845458984375, 1.1802978515625, 1.51513671875, 1.8499755859375, 2.184814453125, 2.5196533203125, 2.8544921875, 3.1893310546875, 3.524169921875, 3.8590087890625, 4.19384765625, 4.5286865234375, 4.863525390625, 5.1983642578125, 5.533203125, 5.8680419921875, 6.202880859375, 6.5377197265625, 6.87255859375, 7.2073974609375, 7.542236328125, 7.8770751953125, 8.2119140625, 8.5467529296875, 8.881591796875, 9.2164306640625, 9.55126953125, 9.8861083984375, 10.220947265625, 10.5557861328125, 10.890625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 10.0, 19.0, 33.0, 148.0, 409.0, 1057.0, 1474.0, 622.0, 193.0, 83.0, 27.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.322509765625, -21.62939453125, -20.936279296875, -20.2431640625, -19.550048828125, -18.85693359375, -18.163818359375, -17.470703125, -16.777587890625, -16.08447265625, -15.391357421875, -14.6982421875, -14.005126953125, -13.31201171875, -12.618896484375, -11.92578125, -11.232666015625, -10.53955078125, -9.846435546875, -9.1533203125, -8.460205078125, -7.76708984375, -7.073974609375, -6.380859375, -5.687744140625, -4.99462890625, -4.301513671875, -3.6083984375, -2.915283203125, -2.22216796875, -1.529052734375, -0.8359375, -0.142822265625, 0.55029296875, 1.243408203125, 1.9365234375, 2.629638671875, 3.32275390625, 4.015869140625, 4.708984375, 5.402099609375, 6.09521484375, 6.788330078125, 7.4814453125, 8.174560546875, 8.86767578125, 9.560791015625, 10.25390625, 10.947021484375, 11.64013671875, 12.333251953125, 13.0263671875, 13.719482421875, 14.41259765625, 15.105712890625, 15.798828125, 16.491943359375, 17.18505859375, 17.878173828125, 18.5712890625, 19.264404296875, 19.95751953125, 20.650634765625, 21.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 25.0, 103.0, 313.0, 1417.0, 24152.0, 4161408.0, 5648.0, 842.0, 225.0, 61.0, 22.0, 15.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.1875, -43.74560546875, -42.3037109375, -40.86181640625, -39.419921875, -37.97802734375, -36.5361328125, -35.09423828125, -33.65234375, -32.21044921875, -30.7685546875, -29.32666015625, -27.884765625, -26.44287109375, -25.0009765625, -23.55908203125, -22.1171875, -20.67529296875, -19.2333984375, -17.79150390625, -16.349609375, -14.90771484375, -13.4658203125, -12.02392578125, -10.58203125, -9.14013671875, -7.6982421875, -6.25634765625, -4.814453125, -3.37255859375, -1.9306640625, -0.48876953125, 0.953125, 2.39501953125, 3.8369140625, 5.27880859375, 6.720703125, 8.16259765625, 9.6044921875, 11.04638671875, 12.48828125, 13.93017578125, 15.3720703125, 16.81396484375, 18.255859375, 19.69775390625, 21.1396484375, 22.58154296875, 24.0234375, 25.46533203125, 26.9072265625, 28.34912109375, 29.791015625, 31.23291015625, 32.6748046875, 34.11669921875, 35.55859375, 37.00048828125, 38.4423828125, 39.88427734375, 41.326171875, 42.76806640625, 44.2099609375, 45.65185546875, 47.09375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 25.0, 98.0, 249.0, 301.0, 227.0, 90.0, 11.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.73889923095703, -73.76427459716797, -71.78964233398438, -69.81501770019531, -67.84038543701172, -65.86576080322266, -63.89113235473633, -61.91650390625, -59.94187545776367, -57.967247009277344, -55.992618560791016, -54.01799011230469, -52.043365478515625, -50.06873321533203, -48.09410858154297, -46.11948013305664, -44.14485168457031, -42.170223236083984, -40.195594787597656, -38.22096633911133, -36.246337890625, -34.27171325683594, -32.29708480834961, -30.32245635986328, -28.347827911376953, -26.373199462890625, -24.398571014404297, -22.4239444732666, -20.449316024780273, -18.474687576293945, -16.50006103515625, -14.525432586669922, -12.550804138183594, -10.576175689697266, -8.601548194885254, -6.626920223236084, -4.652292251586914, -2.677663803100586, -0.7030363082885742, 1.2715911865234375, 3.2462196350097656, 5.2208476066589355, 7.1954755783081055, 9.170103073120117, 11.144731521606445, 13.119359970092773, 15.093987464904785, 17.068614959716797, 19.043243408203125, 21.017871856689453, 22.99250030517578, 24.967126846313477, 26.941755294799805, 28.916383743286133, 30.891010284423828, 32.865638732910156, 34.840267181396484, 36.81489562988281, 38.78952407836914, 40.76415252685547, 42.73877716064453, 44.713409423828125, 46.68803405761719, 48.662662506103516, 50.637290954589844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 8.0, 7.0, 13.0, 11.0, 15.0, 20.0, 22.0, 18.0, 23.0, 26.0, 29.0, 31.0, 39.0, 32.0, 44.0, 40.0, 34.0, 38.0, 45.0, 39.0, 40.0, 36.0, 34.0, 30.0, 50.0, 26.0, 24.0, 23.0, 31.0, 24.0, 20.0, 22.0, 14.0, 11.0, 8.0, 13.0, 10.0, 8.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.18072509765625, -21.426908493041992, -20.6730899810791, -19.919273376464844, -19.165454864501953, -18.411638259887695, -17.657821655273438, -16.904003143310547, -16.15018653869629, -15.396368980407715, -14.64255142211914, -13.888734817504883, -13.134917259216309, -12.381099700927734, -11.62728214263916, -10.873464584350586, -10.119647026062012, -9.365829467773438, -8.612011909484863, -7.858194828033447, -7.104377746582031, -6.350560188293457, -5.596742630004883, -4.842925548553467, -4.089107990264893, -3.3352906703948975, -2.5814733505249023, -1.8276557922363281, -1.073838472366333, -0.3200211524963379, 0.43379640579223633, 1.1876134872436523, 1.9414310455322266, 2.6952483654022217, 3.449065685272217, 4.202883243560791, 4.956700325012207, 5.710517883300781, 6.4643354415893555, 7.2181525230407715, 7.971970081329346, 8.725787162780762, 9.479604721069336, 10.23342227935791, 10.987239837646484, 11.741056442260742, 12.494874954223633, 13.24869155883789, 14.002509117126465, 14.756326675415039, 15.510144233703613, 16.263961791992188, 17.017778396606445, 17.771595001220703, 18.525413513183594, 19.27923011779785, 20.033048629760742, 20.786865234375, 21.54068374633789, 22.29450035095215, 23.04831886291504, 23.802135467529297, 24.555953979492188, 25.309770584106445, 26.063587188720703]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 5.0, 13.0, 16.0, 13.0, 15.0, 14.0, 28.0, 24.0, 29.0, 28.0, 28.0, 31.0, 41.0, 33.0, 39.0, 46.0, 42.0, 39.0, 52.0, 40.0, 39.0, 36.0, 37.0, 40.0, 45.0, 32.0, 19.0, 18.0, 23.0, 25.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62640380859375, -2.5379638671875, -2.44952392578125, -2.361083984375, -2.27264404296875, -2.1842041015625, -2.09576416015625, -2.00732421875, -1.91888427734375, -1.8304443359375, -1.74200439453125, -1.653564453125, -1.56512451171875, -1.4766845703125, -1.38824462890625, -1.2998046875, -1.21136474609375, -1.1229248046875, -1.03448486328125, -0.946044921875, -0.85760498046875, -0.7691650390625, -0.68072509765625, -0.59228515625, -0.50384521484375, -0.4154052734375, -0.32696533203125, -0.238525390625, -0.15008544921875, -0.0616455078125, 0.02679443359375, 0.115234375, 0.20367431640625, 0.2921142578125, 0.38055419921875, 0.468994140625, 0.55743408203125, 0.6458740234375, 0.73431396484375, 0.82275390625, 0.91119384765625, 0.9996337890625, 1.08807373046875, 1.176513671875, 1.26495361328125, 1.3533935546875, 1.44183349609375, 1.5302734375, 1.61871337890625, 1.7071533203125, 1.79559326171875, 1.884033203125, 1.97247314453125, 2.0609130859375, 2.14935302734375, 2.23779296875, 2.32623291015625, 2.4146728515625, 2.50311279296875, 2.591552734375, 2.67999267578125, 2.7684326171875, 2.85687255859375, 2.9453125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 14.0, 19.0, 34.0, 50.0, 85.0, 113.0, 142.0, 244.0, 349.0, 481.0, 759.0, 1043.0, 1478.0, 2217.0, 3054.0, 4492.0, 6541.0, 9466.0, 14099.0, 21297.0, 32713.0, 51102.0, 84628.0, 152448.0, 267379.0, 155269.0, 87134.0, 52010.0, 32948.0, 21476.0, 14252.0, 9725.0, 6584.0, 4666.0, 3179.0, 2149.0, 1536.0, 1031.0, 739.0, 454.0, 384.0, 248.0, 175.0, 104.0, 83.0, 50.0, 31.0, 25.0, 17.0, 16.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.414794921875, -0.4012031555175781, -0.38761138916015625, -0.3740196228027344, -0.3604278564453125, -0.3468360900878906, -0.33324432373046875, -0.3196525573730469, -0.306060791015625, -0.2924690246582031, -0.27887725830078125, -0.2652854919433594, -0.2516937255859375, -0.23810195922851562, -0.22451019287109375, -0.21091842651367188, -0.19732666015625, -0.18373489379882812, -0.17014312744140625, -0.15655136108398438, -0.1429595947265625, -0.12936782836914062, -0.11577606201171875, -0.10218429565429688, -0.088592529296875, -0.07500076293945312, -0.06140899658203125, -0.047817230224609375, -0.0342254638671875, -0.020633697509765625, -0.00704193115234375, 0.006549835205078125, 0.0201416015625, 0.033733367919921875, 0.04732513427734375, 0.060916900634765625, 0.0745086669921875, 0.08810043334960938, 0.10169219970703125, 0.11528396606445312, 0.128875732421875, 0.14246749877929688, 0.15605926513671875, 0.16965103149414062, 0.1832427978515625, 0.19683456420898438, 0.21042633056640625, 0.22401809692382812, 0.23760986328125, 0.2512016296386719, 0.26479339599609375, 0.2783851623535156, 0.2919769287109375, 0.3055686950683594, 0.31916046142578125, 0.3327522277832031, 0.346343994140625, 0.3599357604980469, 0.37352752685546875, 0.3871192932128906, 0.4007110595703125, 0.4143028259277344, 0.42789459228515625, 0.4414863586425781, 0.455078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 8.0, 8.0, 9.0, 15.0, 16.0, 21.0, 23.0, 20.0, 34.0, 27.0, 35.0, 49.0, 41.0, 43.0, 43.0, 51.0, 48.0, 1067.0, 46.0, 46.0, 51.0, 28.0, 36.0, 40.0, 33.0, 24.0, 17.0, 28.0, 14.0, 15.0, 15.0, 9.0, 16.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.078125, -2.0189208984375, -1.959716796875, -1.9005126953125, -1.84130859375, -1.7821044921875, -1.722900390625, -1.6636962890625, -1.6044921875, -1.5452880859375, -1.486083984375, -1.4268798828125, -1.36767578125, -1.3084716796875, -1.249267578125, -1.1900634765625, -1.130859375, -1.0716552734375, -1.012451171875, -0.9532470703125, -0.89404296875, -0.8348388671875, -0.775634765625, -0.7164306640625, -0.6572265625, -0.5980224609375, -0.538818359375, -0.4796142578125, -0.42041015625, -0.3612060546875, -0.302001953125, -0.2427978515625, -0.18359375, -0.1243896484375, -0.065185546875, -0.0059814453125, 0.05322265625, 0.1124267578125, 0.171630859375, 0.2308349609375, 0.2900390625, 0.3492431640625, 0.408447265625, 0.4676513671875, 0.52685546875, 0.5860595703125, 0.645263671875, 0.7044677734375, 0.763671875, 0.8228759765625, 0.882080078125, 0.9412841796875, 1.00048828125, 1.0596923828125, 1.118896484375, 1.1781005859375, 1.2373046875, 1.2965087890625, 1.355712890625, 1.4149169921875, 1.47412109375, 1.5333251953125, 1.592529296875, 1.6517333984375, 1.7109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 15.0, 21.0, 31.0, 44.0, 77.0, 108.0, 149.0, 215.0, 301.0, 476.0, 662.0, 1026.0, 1524.0, 2226.0, 3255.0, 4953.0, 7405.0, 10884.0, 16957.0, 26524.0, 43096.0, 74261.0, 146227.0, 1347372.0, 183777.0, 88480.0, 49971.0, 30054.0, 19195.0, 12542.0, 8164.0, 5553.0, 3660.0, 2634.0, 1704.0, 1120.0, 821.0, 523.0, 397.0, 239.0, 172.0, 112.0, 64.0, 44.0, 29.0, 21.0, 11.0, 12.0, 6.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.4375, -0.4236717224121094, -0.40984344482421875, -0.3960151672363281, -0.3821868896484375, -0.3683586120605469, -0.35453033447265625, -0.3407020568847656, -0.326873779296875, -0.3130455017089844, -0.29921722412109375, -0.2853889465332031, -0.2715606689453125, -0.2577323913574219, -0.24390411376953125, -0.23007583618164062, -0.21624755859375, -0.20241928100585938, -0.18859100341796875, -0.17476272583007812, -0.1609344482421875, -0.14710617065429688, -0.13327789306640625, -0.11944961547851562, -0.105621337890625, -0.09179306030273438, -0.07796478271484375, -0.06413650512695312, -0.0503082275390625, -0.036479949951171875, -0.02265167236328125, -0.008823394775390625, 0.0050048828125, 0.018833160400390625, 0.03266143798828125, 0.046489715576171875, 0.0603179931640625, 0.07414627075195312, 0.08797454833984375, 0.10180282592773438, 0.115631103515625, 0.12945938110351562, 0.14328765869140625, 0.15711593627929688, 0.1709442138671875, 0.18477249145507812, 0.19860076904296875, 0.21242904663085938, 0.22625732421875, 0.24008560180664062, 0.25391387939453125, 0.2677421569824219, 0.2815704345703125, 0.2953987121582031, 0.30922698974609375, 0.3230552673339844, 0.336883544921875, 0.3507118225097656, 0.36454010009765625, 0.3783683776855469, 0.3921966552734375, 0.4060249328613281, 0.41985321044921875, 0.4336814880371094, 0.447509765625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 5.0, 9.0, 6.0, 13.0, 9.0, 11.0, 21.0, 32.0, 44.0, 49.0, 62.0, 56.0, 67.0, 67.0, 82.0, 78.0, 61.0, 63.0, 48.0, 50.0, 33.0, 27.0, 24.0, 23.0, 10.0, 6.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010216236114501953, -9.889528155326843e-05, -9.562820196151733e-05, -9.236112236976624e-05, -8.909404277801514e-05, -8.582696318626404e-05, -8.255988359451294e-05, -7.929280400276184e-05, -7.602572441101074e-05, -7.275864481925964e-05, -6.949156522750854e-05, -6.622448563575745e-05, -6.295740604400635e-05, -5.969032645225525e-05, -5.642324686050415e-05, -5.315616726875305e-05, -4.988908767700195e-05, -4.6622008085250854e-05, -4.3354928493499756e-05, -4.008784890174866e-05, -3.682076930999756e-05, -3.355368971824646e-05, -3.028661012649536e-05, -2.7019530534744263e-05, -2.3752450942993164e-05, -2.0485371351242065e-05, -1.7218291759490967e-05, -1.3951212167739868e-05, -1.068413257598877e-05, -7.417052984237671e-06, -4.149973392486572e-06, -8.828938007354736e-07, 2.384185791015625e-06, 5.651265382766724e-06, 8.918344974517822e-06, 1.2185424566268921e-05, 1.545250415802002e-05, 1.8719583749771118e-05, 2.1986663341522217e-05, 2.5253742933273315e-05, 2.8520822525024414e-05, 3.178790211677551e-05, 3.505498170852661e-05, 3.832206130027771e-05, 4.158914089202881e-05, 4.485622048377991e-05, 4.8123300075531006e-05, 5.1390379667282104e-05, 5.46574592590332e-05, 5.79245388507843e-05, 6.11916184425354e-05, 6.44586980342865e-05, 6.77257776260376e-05, 7.09928572177887e-05, 7.42599368095398e-05, 7.75270164012909e-05, 8.079409599304199e-05, 8.406117558479309e-05, 8.732825517654419e-05, 9.059533476829529e-05, 9.386241436004639e-05, 9.712949395179749e-05, 0.00010039657354354858, 0.00010366365313529968, 0.00010693073272705078]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 3.0, 16.0, 10.0, 15.0, 22.0, 30.0, 35.0, 45.0, 80.0, 102.0, 160.0, 257.0, 453.0, 850.0, 2394.0, 1013478.0, 27970.0, 1150.0, 548.0, 315.0, 198.0, 134.0, 72.0, 44.0, 44.0, 25.0, 16.0, 21.0, 15.0, 11.0, 13.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.0020042061805725098, -0.001938939094543457, -0.0018736720085144043, -0.0018084049224853516, -0.0017431378364562988, -0.001677870750427246, -0.0016126036643981934, -0.0015473365783691406, -0.0014820694923400879, -0.0014168024063110352, -0.0013515353202819824, -0.0012862682342529297, -0.001221001148223877, -0.0011557340621948242, -0.0010904669761657715, -0.0010251998901367188, -0.000959932804107666, -0.0008946657180786133, -0.0008293986320495605, -0.0007641315460205078, -0.0006988644599914551, -0.0006335973739624023, -0.0005683302879333496, -0.0005030632019042969, -0.00043779611587524414, -0.0003725290298461914, -0.00030726194381713867, -0.00024199485778808594, -0.0001767277717590332, -0.00011146068572998047, -4.6193599700927734e-05, 1.9073486328125e-05, 8.434057235717773e-05, 0.00014960765838623047, 0.0002148747444152832, 0.00028014183044433594, 0.00034540891647338867, 0.0004106760025024414, 0.00047594308853149414, 0.0005412101745605469, 0.0006064772605895996, 0.0006717443466186523, 0.0007370114326477051, 0.0008022785186767578, 0.0008675456047058105, 0.0009328126907348633, 0.000998079776763916, 0.0010633468627929688, 0.0011286139488220215, 0.0011938810348510742, 0.001259148120880127, 0.0013244152069091797, 0.0013896822929382324, 0.0014549493789672852, 0.0015202164649963379, 0.0015854835510253906, 0.0016507506370544434, 0.001716017723083496, 0.0017812848091125488, 0.0018465518951416016, 0.0019118189811706543, 0.001977086067199707, 0.0020423531532287598, 0.0021076202392578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 15.0, 488.0, 489.0, 19.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006496733985841274, -0.000637414981611073, -0.0006251565064303577, -0.0006128980894573033, -0.0006006396724842489, -0.0005883811973035336, -0.0005761227803304791, -0.0005638643633574247, -0.0005516059463843703, -0.0005393475294113159, -0.0005270890542306006, -0.0005148306372575462, -0.0005025722202844918, -0.0004903137451037765, -0.00047805532813072205, -0.00046579691115766764, -0.0004535384359769523, -0.00044127998990006745, -0.00042902157292701304, -0.0004167631268501282, -0.00040450470987707376, -0.0003922462638001889, -0.00037998781772330403, -0.0003677294007502496, -0.00035547095467336476, -0.0003432125085964799, -0.0003309540916234255, -0.0003186956455465406, -0.00030643719946965575, -0.00029417878249660134, -0.0002819203364197165, -0.0002696618903428316, -0.00025740344426594675, -0.0002451449981890619, -0.00023288658121600747, -0.0002206281351391226, -0.00020836970361415297, -0.00019611127208918333, -0.00018385282601229846, -0.00017159439448732883, -0.0001593359629623592, -0.00014707753143738955, -0.00013481909991241992, -0.00012256065383553505, -0.00011030222231056541, -9.804379078559577e-05, -8.578535198466852e-05, -7.352691318374127e-05, -6.126848165877163e-05, -4.901004649582319e-05, -3.6751611332874745e-05, -2.44931761699263e-05, -1.2234741006977856e-05, 2.3690517991781235e-08, 1.2282129318919033e-05, 2.4540568119846284e-05, 3.679899964481592e-05, 4.9057434807764366e-05, 6.131586997071281e-05, 7.357430877164006e-05, 8.58327402966097e-05, 9.809117182157934e-05, 0.00011034961062250659, 0.00012260804942343384, 0.00013486648094840348]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 9.0, 6.0, 11.0, 9.0, 9.0, 20.0, 7.0, 20.0, 25.0, 22.0, 36.0, 30.0, 33.0, 20.0, 48.0, 25.0, 35.0, 38.0, 39.0, 50.0, 49.0, 38.0, 41.0, 37.0, 47.0, 38.0, 39.0, 22.0, 27.0, 31.0, 24.0, 27.0, 18.0, 15.0, 15.0, 11.0, 11.0, 4.0, 3.0, 1.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.225224256515503e-05, -4.081428050994873e-05, -3.937631845474243e-05, -3.793835639953613e-05, -3.6500394344329834e-05, -3.5062432289123535e-05, -3.3624470233917236e-05, -3.218650817871094e-05, -3.074854612350464e-05, -2.931058406829834e-05, -2.787262201309204e-05, -2.6434659957885742e-05, -2.4996697902679443e-05, -2.3558735847473145e-05, -2.2120773792266846e-05, -2.0682811737060547e-05, -1.9244849681854248e-05, -1.780688762664795e-05, -1.636892557144165e-05, -1.4930963516235352e-05, -1.3493001461029053e-05, -1.2055039405822754e-05, -1.0617077350616455e-05, -9.179115295410156e-06, -7.741153240203857e-06, -6.303191184997559e-06, -4.86522912979126e-06, -3.427267074584961e-06, -1.989305019378662e-06, -5.513429641723633e-07, 8.866190910339355e-07, 2.3245811462402344e-06, 3.762543201446533e-06, 5.200505256652832e-06, 6.638467311859131e-06, 8.07642936706543e-06, 9.514391422271729e-06, 1.0952353477478027e-05, 1.2390315532684326e-05, 1.3828277587890625e-05, 1.5266239643096924e-05, 1.6704201698303223e-05, 1.814216375350952e-05, 1.958012580871582e-05, 2.101808786392212e-05, 2.2456049919128418e-05, 2.3894011974334717e-05, 2.5331974029541016e-05, 2.6769936084747314e-05, 2.8207898139953613e-05, 2.9645860195159912e-05, 3.108382225036621e-05, 3.252178430557251e-05, 3.395974636077881e-05, 3.539770841598511e-05, 3.6835670471191406e-05, 3.8273632526397705e-05, 3.9711594581604004e-05, 4.11495566368103e-05, 4.25875186920166e-05, 4.40254807472229e-05, 4.54634428024292e-05, 4.69014048576355e-05, 4.83393669128418e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 5.0, 13.0, 16.0, 13.0, 15.0, 14.0, 28.0, 24.0, 29.0, 28.0, 28.0, 31.0, 41.0, 33.0, 39.0, 46.0, 42.0, 39.0, 52.0, 40.0, 39.0, 36.0, 37.0, 40.0, 45.0, 32.0, 19.0, 18.0, 23.0, 25.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62640380859375, -2.5379638671875, -2.44952392578125, -2.361083984375, -2.27264404296875, -2.1842041015625, -2.09576416015625, -2.00732421875, -1.91888427734375, -1.8304443359375, -1.74200439453125, -1.653564453125, -1.56512451171875, -1.4766845703125, -1.38824462890625, -1.2998046875, -1.21136474609375, -1.1229248046875, -1.03448486328125, -0.946044921875, -0.85760498046875, -0.7691650390625, -0.68072509765625, -0.59228515625, -0.50384521484375, -0.4154052734375, -0.32696533203125, -0.238525390625, -0.15008544921875, -0.0616455078125, 0.02679443359375, 0.115234375, 0.20367431640625, 0.2921142578125, 0.38055419921875, 0.468994140625, 0.55743408203125, 0.6458740234375, 0.73431396484375, 0.82275390625, 0.91119384765625, 0.9996337890625, 1.08807373046875, 1.176513671875, 1.26495361328125, 1.3533935546875, 1.44183349609375, 1.5302734375, 1.61871337890625, 1.7071533203125, 1.79559326171875, 1.884033203125, 1.97247314453125, 2.0609130859375, 2.14935302734375, 2.23779296875, 2.32623291015625, 2.4146728515625, 2.50311279296875, 2.591552734375, 2.67999267578125, 2.7684326171875, 2.85687255859375, 2.9453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 17.0, 29.0, 33.0, 44.0, 79.0, 92.0, 122.0, 146.0, 182.0, 265.0, 395.0, 589.0, 952.0, 1611.0, 3097.0, 7088.0, 22185.0, 115969.0, 604598.0, 234183.0, 37133.0, 10169.0, 4086.0, 2049.0, 1138.0, 656.0, 460.0, 317.0, 215.0, 157.0, 113.0, 90.0, 63.0, 49.0, 58.0, 36.0, 15.0, 14.0, 13.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.49072265625, -5.3173828125, -5.14404296875, -4.970703125, -4.79736328125, -4.6240234375, -4.45068359375, -4.27734375, -4.10400390625, -3.9306640625, -3.75732421875, -3.583984375, -3.41064453125, -3.2373046875, -3.06396484375, -2.890625, -2.71728515625, -2.5439453125, -2.37060546875, -2.197265625, -2.02392578125, -1.8505859375, -1.67724609375, -1.50390625, -1.33056640625, -1.1572265625, -0.98388671875, -0.810546875, -0.63720703125, -0.4638671875, -0.29052734375, -0.1171875, 0.05615234375, 0.2294921875, 0.40283203125, 0.576171875, 0.74951171875, 0.9228515625, 1.09619140625, 1.26953125, 1.44287109375, 1.6162109375, 1.78955078125, 1.962890625, 2.13623046875, 2.3095703125, 2.48291015625, 2.65625, 2.82958984375, 3.0029296875, 3.17626953125, 3.349609375, 3.52294921875, 3.6962890625, 3.86962890625, 4.04296875, 4.21630859375, 4.3896484375, 4.56298828125, 4.736328125, 4.90966796875, 5.0830078125, 5.25634765625, 5.4296875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 12.0, 6.0, 11.0, 3.0, 14.0, 18.0, 28.0, 24.0, 40.0, 39.0, 62.0, 62.0, 95.0, 140.0, 394.0, 1517.0, 166.0, 86.0, 60.0, 58.0, 43.0, 34.0, 32.0, 22.0, 22.0, 7.0, 13.0, 9.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.140625, -11.813232421875, -11.48583984375, -11.158447265625, -10.8310546875, -10.503662109375, -10.17626953125, -9.848876953125, -9.521484375, -9.194091796875, -8.86669921875, -8.539306640625, -8.2119140625, -7.884521484375, -7.55712890625, -7.229736328125, -6.90234375, -6.574951171875, -6.24755859375, -5.920166015625, -5.5927734375, -5.265380859375, -4.93798828125, -4.610595703125, -4.283203125, -3.955810546875, -3.62841796875, -3.301025390625, -2.9736328125, -2.646240234375, -2.31884765625, -1.991455078125, -1.6640625, -1.336669921875, -1.00927734375, -0.681884765625, -0.3544921875, -0.027099609375, 0.30029296875, 0.627685546875, 0.955078125, 1.282470703125, 1.60986328125, 1.937255859375, 2.2646484375, 2.592041015625, 2.91943359375, 3.246826171875, 3.57421875, 3.901611328125, 4.22900390625, 4.556396484375, 4.8837890625, 5.211181640625, 5.53857421875, 5.865966796875, 6.193359375, 6.520751953125, 6.84814453125, 7.175537109375, 7.5029296875, 7.830322265625, 8.15771484375, 8.485107421875, 8.8125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 5.0, 15.0, 8.0, 11.0, 24.0, 35.0, 29.0, 64.0, 67.0, 101.0, 132.0, 202.0, 339.0, 778.0, 2494.0, 1414444.0, 1722491.0, 2597.0, 764.0, 371.0, 216.0, 129.0, 117.0, 59.0, 62.0, 31.0, 27.0, 25.0, 13.0, 10.0, 10.0, 11.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.90625, -17.266845703125, -16.62744140625, -15.988037109375, -15.3486328125, -14.709228515625, -14.06982421875, -13.430419921875, -12.791015625, -12.151611328125, -11.51220703125, -10.872802734375, -10.2333984375, -9.593994140625, -8.95458984375, -8.315185546875, -7.67578125, -7.036376953125, -6.39697265625, -5.757568359375, -5.1181640625, -4.478759765625, -3.83935546875, -3.199951171875, -2.560546875, -1.921142578125, -1.28173828125, -0.642333984375, -0.0029296875, 0.636474609375, 1.27587890625, 1.915283203125, 2.5546875, 3.194091796875, 3.83349609375, 4.472900390625, 5.1123046875, 5.751708984375, 6.39111328125, 7.030517578125, 7.669921875, 8.309326171875, 8.94873046875, 9.588134765625, 10.2275390625, 10.866943359375, 11.50634765625, 12.145751953125, 12.78515625, 13.424560546875, 14.06396484375, 14.703369140625, 15.3427734375, 15.982177734375, 16.62158203125, 17.260986328125, 17.900390625, 18.539794921875, 19.17919921875, 19.818603515625, 20.4580078125, 21.097412109375, 21.73681640625, 22.376220703125, 23.015625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 44.0, 489.0, 446.0, 33.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.157018661499023, -27.982383728027344, -25.807750701904297, -23.63311767578125, -21.45848274230957, -19.28384780883789, -17.109214782714844, -14.93458080291748, -12.759946823120117, -10.585312843322754, -8.41067886352539, -6.236044883728027, -4.061410903930664, -1.8867769241333008, 0.2878570556640625, 2.462491035461426, 4.637125015258789, 6.811758995056152, 8.986392974853516, 11.161026954650879, 13.335660934448242, 15.510294914245605, 17.68492889404297, 19.859561920166016, 22.034196853637695, 24.208831787109375, 26.383464813232422, 28.55809783935547, 30.73273277282715, 32.90736770629883, 35.082000732421875, 37.25663375854492, 39.4312744140625, 41.60590744018555, 43.780540466308594, 45.955177307128906, 48.12981033325195, 50.304443359375, 52.47908020019531, 54.65371322631836, 56.828346252441406, 59.00297927856445, 61.1776123046875, 63.35224914550781, 65.52688598632812, 67.7015151977539, 69.87615203857422, 72.05078125, 74.22541809082031, 76.40005493164062, 78.5746841430664, 80.74932098388672, 82.9239501953125, 85.09858703613281, 87.27322387695312, 89.4478530883789, 91.62248992919922, 93.79712677001953, 95.97175598144531, 98.14639282226562, 100.32102966308594, 102.49565887451172, 104.67029571533203, 106.84492492675781, 109.01956176757812]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 6.0, 12.0, 9.0, 7.0, 14.0, 11.0, 25.0, 24.0, 25.0, 31.0, 25.0, 26.0, 31.0, 27.0, 36.0, 34.0, 28.0, 28.0, 43.0, 35.0, 41.0, 43.0, 50.0, 37.0, 34.0, 30.0, 26.0, 30.0, 33.0, 25.0, 24.0, 28.0, 17.0, 13.0, 6.0, 17.0, 10.0, 10.0, 9.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-17.1634521484375, -16.640655517578125, -16.11785888671875, -15.595062255859375, -15.072265625, -14.549468994140625, -14.02667236328125, -13.503875732421875, -12.9810791015625, -12.458282470703125, -11.93548583984375, -11.412689208984375, -10.889892578125, -10.367095947265625, -9.84429931640625, -9.321502685546875, -8.798705101013184, -8.275908470153809, -7.753111839294434, -7.230315208435059, -6.707518577575684, -6.184721946716309, -5.661924839019775, -5.1391282081604, -4.616331577301025, -4.09353494644165, -3.5707383155822754, -3.0479414463043213, -2.5251448154449463, -2.0023481845855713, -1.4795513153076172, -0.9567546844482422, -0.4339580535888672, 0.08883863687515259, 0.6116353273391724, 1.134432077407837, 1.657228708267212, 2.180025339126587, 2.702822208404541, 3.225618839263916, 3.748415470123291, 4.271212100982666, 4.794008731842041, 5.316805839538574, 5.839602470397949, 6.362399101257324, 6.885195732116699, 7.407992362976074, 7.930788993835449, 8.453585624694824, 8.9763822555542, 9.499178886413574, 10.02197551727295, 10.544772148132324, 11.067569732666016, 11.59036636352539, 12.113162994384766, 12.63595962524414, 13.158756256103516, 13.68155288696289, 14.204349517822266, 14.72714614868164, 15.249942779541016, 15.77273941040039, 16.295536041259766]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 11.0, 10.0, 10.0, 14.0, 8.0, 13.0, 12.0, 16.0, 19.0, 26.0, 13.0, 30.0, 26.0, 31.0, 31.0, 39.0, 39.0, 38.0, 44.0, 38.0, 38.0, 36.0, 44.0, 34.0, 48.0, 32.0, 21.0, 26.0, 24.0, 26.0, 24.0, 25.0, 27.0, 19.0, 14.0, 18.0, 14.0, 9.0, 8.0, 2.0, 12.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.7576904296875, -2.663818359375, -2.5699462890625, -2.47607421875, -2.3822021484375, -2.288330078125, -2.1944580078125, -2.1005859375, -2.0067138671875, -1.912841796875, -1.8189697265625, -1.72509765625, -1.6312255859375, -1.537353515625, -1.4434814453125, -1.349609375, -1.2557373046875, -1.161865234375, -1.0679931640625, -0.97412109375, -0.8802490234375, -0.786376953125, -0.6925048828125, -0.5986328125, -0.5047607421875, -0.410888671875, -0.3170166015625, -0.22314453125, -0.1292724609375, -0.035400390625, 0.0584716796875, 0.15234375, 0.2462158203125, 0.340087890625, 0.4339599609375, 0.52783203125, 0.6217041015625, 0.715576171875, 0.8094482421875, 0.9033203125, 0.9971923828125, 1.091064453125, 1.1849365234375, 1.27880859375, 1.3726806640625, 1.466552734375, 1.5604248046875, 1.654296875, 1.7481689453125, 1.842041015625, 1.9359130859375, 2.02978515625, 2.1236572265625, 2.217529296875, 2.3114013671875, 2.4052734375, 2.4991455078125, 2.593017578125, 2.6868896484375, 2.78076171875, 2.8746337890625, 2.968505859375, 3.0623779296875, 3.15625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 8.0, 9.0, 7.0, 12.0, 15.0, 23.0, 23.0, 43.0, 47.0, 66.0, 78.0, 116.0, 130.0, 212.0, 253.0, 356.0, 593.0, 969.0, 1852.0, 5855.0, 135751.0, 3630405.0, 402897.0, 9023.0, 2229.0, 1074.0, 614.0, 423.0, 317.0, 237.0, 156.0, 108.0, 78.0, 64.0, 47.0, 35.0, 39.0, 14.0, 25.0, 16.0, 8.0, 11.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.328125, -15.8115234375, -15.294921875, -14.7783203125, -14.26171875, -13.7451171875, -13.228515625, -12.7119140625, -12.1953125, -11.6787109375, -11.162109375, -10.6455078125, -10.12890625, -9.6123046875, -9.095703125, -8.5791015625, -8.0625, -7.5458984375, -7.029296875, -6.5126953125, -5.99609375, -5.4794921875, -4.962890625, -4.4462890625, -3.9296875, -3.4130859375, -2.896484375, -2.3798828125, -1.86328125, -1.3466796875, -0.830078125, -0.3134765625, 0.203125, 0.7197265625, 1.236328125, 1.7529296875, 2.26953125, 2.7861328125, 3.302734375, 3.8193359375, 4.3359375, 4.8525390625, 5.369140625, 5.8857421875, 6.40234375, 6.9189453125, 7.435546875, 7.9521484375, 8.46875, 8.9853515625, 9.501953125, 10.0185546875, 10.53515625, 11.0517578125, 11.568359375, 12.0849609375, 12.6015625, 13.1181640625, 13.634765625, 14.1513671875, 14.66796875, 15.1845703125, 15.701171875, 16.2177734375, 16.734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 3.0, 15.0, 37.0, 62.0, 159.0, 396.0, 933.0, 1196.0, 737.0, 309.0, 130.0, 41.0, 22.0, 11.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.5001220703125, -13.054931640625, -12.6097412109375, -12.16455078125, -11.7193603515625, -11.274169921875, -10.8289794921875, -10.3837890625, -9.9385986328125, -9.493408203125, -9.0482177734375, -8.60302734375, -8.1578369140625, -7.712646484375, -7.2674560546875, -6.822265625, -6.3770751953125, -5.931884765625, -5.4866943359375, -5.04150390625, -4.5963134765625, -4.151123046875, -3.7059326171875, -3.2607421875, -2.8155517578125, -2.370361328125, -1.9251708984375, -1.47998046875, -1.0347900390625, -0.589599609375, -0.1444091796875, 0.30078125, 0.7459716796875, 1.191162109375, 1.6363525390625, 2.08154296875, 2.5267333984375, 2.971923828125, 3.4171142578125, 3.8623046875, 4.3074951171875, 4.752685546875, 5.1978759765625, 5.64306640625, 6.0882568359375, 6.533447265625, 6.9786376953125, 7.423828125, 7.8690185546875, 8.314208984375, 8.7593994140625, 9.20458984375, 9.6497802734375, 10.094970703125, 10.5401611328125, 10.9853515625, 11.4305419921875, 11.875732421875, 12.3209228515625, 12.76611328125, 13.2113037109375, 13.656494140625, 14.1016845703125, 14.546875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 10.0, 29.0, 36.0, 63.0, 70.0, 124.0, 164.0, 290.0, 402.0, 801.0, 1511.0, 3937.0, 14198.0, 118092.0, 2119326.0, 1816272.0, 99516.0, 12480.0, 3510.0, 1501.0, 742.0, 396.0, 274.0, 157.0, 117.0, 76.0, 60.0, 25.0, 24.0, 17.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-9.4375, -9.17510986328125, -8.9127197265625, -8.65032958984375, -8.387939453125, -8.12554931640625, -7.8631591796875, -7.60076904296875, -7.33837890625, -7.07598876953125, -6.8135986328125, -6.55120849609375, -6.288818359375, -6.02642822265625, -5.7640380859375, -5.50164794921875, -5.2392578125, -4.97686767578125, -4.7144775390625, -4.45208740234375, -4.189697265625, -3.92730712890625, -3.6649169921875, -3.40252685546875, -3.14013671875, -2.87774658203125, -2.6153564453125, -2.35296630859375, -2.090576171875, -1.82818603515625, -1.5657958984375, -1.30340576171875, -1.041015625, -0.77862548828125, -0.5162353515625, -0.25384521484375, 0.008544921875, 0.27093505859375, 0.5333251953125, 0.79571533203125, 1.05810546875, 1.32049560546875, 1.5828857421875, 1.84527587890625, 2.107666015625, 2.37005615234375, 2.6324462890625, 2.89483642578125, 3.1572265625, 3.41961669921875, 3.6820068359375, 3.94439697265625, 4.206787109375, 4.46917724609375, 4.7315673828125, 4.99395751953125, 5.25634765625, 5.51873779296875, 5.7811279296875, 6.04351806640625, 6.305908203125, 6.56829833984375, 6.8306884765625, 7.09307861328125, 7.35546875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 8.0, 13.0, 22.0, 27.0, 21.0, 31.0, 42.0, 50.0, 58.0, 61.0, 71.0, 84.0, 88.0, 75.0, 53.0, 48.0, 55.0, 37.0, 47.0, 23.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.53204345703125, -39.5267219543457, -38.521400451660156, -37.51607894897461, -36.51075744628906, -35.505435943603516, -34.50011444091797, -33.49479293823242, -32.489471435546875, -31.484149932861328, -30.47882843017578, -29.473506927490234, -28.468185424804688, -27.46286392211914, -26.457542419433594, -25.452220916748047, -24.446901321411133, -23.441579818725586, -22.43625831604004, -21.430936813354492, -20.425615310668945, -19.4202938079834, -18.414974212646484, -17.409652709960938, -16.40433120727539, -15.399009704589844, -14.393688201904297, -13.38836669921875, -12.383045196533203, -11.377723693847656, -10.372403144836426, -9.367081642150879, -8.361759185791016, -7.356437683105469, -6.351116180419922, -5.345795154571533, -4.340473651885986, -3.3351521492004395, -2.329831123352051, -1.324509620666504, -0.31918811798095703, 0.6861332654953003, 1.6914546489715576, 2.6967759132385254, 3.7020974159240723, 4.707418918609619, 5.712739944458008, 6.718061447143555, 7.723382949829102, 8.728704452514648, 9.734025955200195, 10.739347457885742, 11.744668960571289, 12.749990463256836, 13.755311012268066, 14.760632514953613, 15.76595401763916, 16.77127456665039, 17.776596069335938, 18.781917572021484, 19.78723907470703, 20.792560577392578, 21.797882080078125, 22.803203582763672, 23.80852508544922]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 10.0, 2.0, 4.0, 9.0, 4.0, 9.0, 11.0, 13.0, 18.0, 21.0, 19.0, 26.0, 21.0, 34.0, 21.0, 32.0, 39.0, 35.0, 46.0, 47.0, 37.0, 43.0, 42.0, 49.0, 55.0, 37.0, 34.0, 26.0, 35.0, 27.0, 22.0, 32.0, 23.0, 22.0, 18.0, 16.0, 11.0, 13.0, 9.0, 11.0, 7.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.17300796508789, -20.441434860229492, -19.70985984802246, -18.978286743164062, -18.24671173095703, -17.515138626098633, -16.783565521240234, -16.051990509033203, -15.320416450500488, -14.588842391967773, -13.857268333435059, -13.125694274902344, -12.394121170043945, -11.662546157836914, -10.930973052978516, -10.1993989944458, -9.467824935913086, -8.736250877380371, -8.004676818847656, -7.2731032371521, -6.541529178619385, -5.80995512008667, -5.078381538391113, -4.346807479858398, -3.6152334213256836, -2.8836593627929688, -2.152085542678833, -1.4205117225646973, -0.6889376640319824, 0.04263639450073242, 0.7742099761962891, 1.505784034729004, 2.2373580932617188, 2.9689321517944336, 3.7005059719085693, 4.432079792022705, 5.16365385055542, 5.895227909088135, 6.626801490783691, 7.358375549316406, 8.089949607849121, 8.821523666381836, 9.55309772491455, 10.284671783447266, 11.016244888305664, 11.747819900512695, 12.479393005371094, 13.210967063903809, 13.942541122436523, 14.674115180969238, 15.405689239501953, 16.13726234436035, 16.868837356567383, 17.60041046142578, 18.331985473632812, 19.06355857849121, 19.79513168334961, 20.526704788208008, 21.25827980041504, 21.989852905273438, 22.72142791748047, 23.453001022338867, 24.184574127197266, 24.916149139404297, 25.647724151611328]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 14.0, 17.0, 9.0, 19.0, 24.0, 17.0, 33.0, 28.0, 39.0, 35.0, 38.0, 42.0, 45.0, 45.0, 44.0, 51.0, 51.0, 47.0, 42.0, 36.0, 39.0, 33.0, 26.0, 24.0, 26.0, 25.0, 24.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.6982421875, -37.365234375, -36.0322265625, -34.69921875, -33.3662109375, -32.033203125, -30.7001953125, -29.3671875, -28.0341796875, -26.701171875, -25.3681640625, -24.03515625, -22.7021484375, -21.369140625, -20.0361328125, -18.703125, -17.3701171875, -16.037109375, -14.7041015625, -13.37109375, -12.0380859375, -10.705078125, -9.3720703125, -8.0390625, -6.7060546875, -5.373046875, -4.0400390625, -2.70703125, -1.3740234375, -0.041015625, 1.2919921875, 2.625, 3.9580078125, 5.291015625, 6.6240234375, 7.95703125, 9.2900390625, 10.623046875, 11.9560546875, 13.2890625, 14.6220703125, 15.955078125, 17.2880859375, 18.62109375, 19.9541015625, 21.287109375, 22.6201171875, 23.953125, 25.2861328125, 26.619140625, 27.9521484375, 29.28515625, 30.6181640625, 31.951171875, 33.2841796875, 34.6171875, 35.9501953125, 37.283203125, 38.6162109375, 39.94921875, 41.2822265625, 42.615234375, 43.9482421875, 45.28125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 14.0, 12.0, 36.0, 36.0, 62.0, 103.0, 129.0, 188.0, 300.0, 398.0, 739.0, 1096.0, 1734.0, 2803.0, 4443.0, 7127.0, 11427.0, 19079.0, 32460.0, 58592.0, 117305.0, 273891.0, 264318.0, 113915.0, 57322.0, 32053.0, 18850.0, 11281.0, 6910.0, 4395.0, 2700.0, 1793.0, 1058.0, 690.0, 398.0, 283.0, 160.0, 143.0, 101.0, 75.0, 43.0, 27.0, 9.0, 13.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-7.54296875, -7.31427001953125, -7.0855712890625, -6.85687255859375, -6.628173828125, -6.39947509765625, -6.1707763671875, -5.94207763671875, -5.71337890625, -5.48468017578125, -5.2559814453125, -5.02728271484375, -4.798583984375, -4.56988525390625, -4.3411865234375, -4.11248779296875, -3.8837890625, -3.65509033203125, -3.4263916015625, -3.19769287109375, -2.968994140625, -2.74029541015625, -2.5115966796875, -2.28289794921875, -2.05419921875, -1.82550048828125, -1.5968017578125, -1.36810302734375, -1.139404296875, -0.91070556640625, -0.6820068359375, -0.45330810546875, -0.224609375, 0.00408935546875, 0.2327880859375, 0.46148681640625, 0.690185546875, 0.91888427734375, 1.1475830078125, 1.37628173828125, 1.60498046875, 1.83367919921875, 2.0623779296875, 2.29107666015625, 2.519775390625, 2.74847412109375, 2.9771728515625, 3.20587158203125, 3.4345703125, 3.66326904296875, 3.8919677734375, 4.12066650390625, 4.349365234375, 4.57806396484375, 4.8067626953125, 5.03546142578125, 5.26416015625, 5.49285888671875, 5.7215576171875, 5.95025634765625, 6.178955078125, 6.40765380859375, 6.6363525390625, 6.86505126953125, 7.09375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 17.0, 13.0, 17.0, 14.0, 22.0, 21.0, 25.0, 32.0, 38.0, 34.0, 44.0, 23.0, 34.0, 51.0, 27.0, 36.0, 1059.0, 35.0, 48.0, 41.0, 33.0, 33.0, 28.0, 31.0, 39.0, 35.0, 21.0, 25.0, 12.0, 18.0, 10.0, 13.0, 10.0, 9.0, 11.0, 4.0, 11.0, 1.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.9375, -23.15625, -22.375, -21.59375, -20.8125, -20.03125, -19.25, -18.46875, -17.6875, -16.90625, -16.125, -15.34375, -14.5625, -13.78125, -13.0, -12.21875, -11.4375, -10.65625, -9.875, -9.09375, -8.3125, -7.53125, -6.75, -5.96875, -5.1875, -4.40625, -3.625, -2.84375, -2.0625, -1.28125, -0.5, 0.28125, 1.0625, 1.84375, 2.625, 3.40625, 4.1875, 4.96875, 5.75, 6.53125, 7.3125, 8.09375, 8.875, 9.65625, 10.4375, 11.21875, 12.0, 12.78125, 13.5625, 14.34375, 15.125, 15.90625, 16.6875, 17.46875, 18.25, 19.03125, 19.8125, 20.59375, 21.375, 22.15625, 22.9375, 23.71875, 24.5, 25.28125, 26.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 18.0, 17.0, 27.0, 42.0, 65.0, 86.0, 145.0, 186.0, 253.0, 356.0, 515.0, 752.0, 955.0, 1461.0, 1942.0, 2662.0, 3878.0, 5390.0, 7601.0, 11165.0, 16238.0, 23634.0, 35329.0, 54334.0, 88722.0, 163968.0, 1301107.0, 142143.0, 79405.0, 49557.0, 33055.0, 21890.0, 14980.0, 10248.0, 7179.0, 5064.0, 3624.0, 2631.0, 1850.0, 1389.0, 904.0, 681.0, 516.0, 356.0, 234.0, 189.0, 101.0, 102.0, 75.0, 43.0, 21.0, 18.0, 16.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.609375, -5.43621826171875, -5.2630615234375, -5.08990478515625, -4.916748046875, -4.74359130859375, -4.5704345703125, -4.39727783203125, -4.22412109375, -4.05096435546875, -3.8778076171875, -3.70465087890625, -3.531494140625, -3.35833740234375, -3.1851806640625, -3.01202392578125, -2.8388671875, -2.66571044921875, -2.4925537109375, -2.31939697265625, -2.146240234375, -1.97308349609375, -1.7999267578125, -1.62677001953125, -1.45361328125, -1.28045654296875, -1.1072998046875, -0.93414306640625, -0.760986328125, -0.58782958984375, -0.4146728515625, -0.24151611328125, -0.068359375, 0.10479736328125, 0.2779541015625, 0.45111083984375, 0.624267578125, 0.79742431640625, 0.9705810546875, 1.14373779296875, 1.31689453125, 1.49005126953125, 1.6632080078125, 1.83636474609375, 2.009521484375, 2.18267822265625, 2.3558349609375, 2.52899169921875, 2.7021484375, 2.87530517578125, 3.0484619140625, 3.22161865234375, 3.394775390625, 3.56793212890625, 3.7410888671875, 3.91424560546875, 4.08740234375, 4.26055908203125, 4.4337158203125, 4.60687255859375, 4.780029296875, 4.95318603515625, 5.1263427734375, 5.29949951171875, 5.47265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 12.0, 19.0, 27.0, 17.0, 30.0, 37.0, 58.0, 59.0, 66.0, 74.0, 77.0, 80.0, 87.0, 60.0, 59.0, 40.0, 29.0, 20.0, 14.0, 21.0, 18.0, 13.0, 6.0, 11.0, 3.0, 10.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0030040740966796875, -0.002924621105194092, -0.002845168113708496, -0.0027657151222229004, -0.0026862621307373047, -0.002606809139251709, -0.0025273561477661133, -0.0024479031562805176, -0.002368450164794922, -0.002288997173309326, -0.0022095441818237305, -0.0021300911903381348, -0.002050638198852539, -0.0019711852073669434, -0.0018917322158813477, -0.001812279224395752, -0.0017328262329101562, -0.0016533732414245605, -0.0015739202499389648, -0.0014944672584533691, -0.0014150142669677734, -0.0013355612754821777, -0.001256108283996582, -0.0011766552925109863, -0.0010972023010253906, -0.001017749309539795, -0.0009382963180541992, -0.0008588433265686035, -0.0007793903350830078, -0.0006999373435974121, -0.0006204843521118164, -0.0005410313606262207, -0.000461578369140625, -0.0003821253776550293, -0.0003026723861694336, -0.0002232193946838379, -0.0001437664031982422, -6.431341171264648e-05, 1.5139579772949219e-05, 9.459257125854492e-05, 0.00017404556274414062, 0.00025349855422973633, 0.00033295154571533203, 0.00041240453720092773, 0.0004918575286865234, 0.0005713105201721191, 0.0006507635116577148, 0.0007302165031433105, 0.0008096694946289062, 0.000889122486114502, 0.0009685754776000977, 0.0010480284690856934, 0.001127481460571289, 0.0012069344520568848, 0.0012863874435424805, 0.0013658404350280762, 0.0014452934265136719, 0.0015247464179992676, 0.0016041994094848633, 0.001683652400970459, 0.0017631053924560547, 0.0018425583839416504, 0.001922011375427246, 0.002001464366912842, 0.0020809173583984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 4.0, 11.0, 14.0, 20.0, 20.0, 48.0, 45.0, 54.0, 92.0, 135.0, 246.0, 368.0, 692.0, 1432.0, 3556.0, 11108.0, 43637.0, 245876.0, 552097.0, 147490.0, 28343.0, 7791.0, 2757.0, 1159.0, 619.0, 302.0, 197.0, 130.0, 79.0, 64.0, 38.0, 31.0, 23.0, 8.0, 21.0, 17.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01285552978515625, -0.012402176856994629, -0.011948823928833008, -0.011495471000671387, -0.011042118072509766, -0.010588765144348145, -0.010135412216186523, -0.009682059288024902, -0.009228706359863281, -0.00877535343170166, -0.008322000503540039, -0.007868647575378418, -0.007415294647216797, -0.006961941719055176, -0.006508588790893555, -0.006055235862731934, -0.0056018829345703125, -0.005148530006408691, -0.00469517707824707, -0.004241824150085449, -0.003788471221923828, -0.003335118293762207, -0.002881765365600586, -0.002428412437438965, -0.0019750595092773438, -0.0015217065811157227, -0.0010683536529541016, -0.0006150007247924805, -0.00016164779663085938, 0.0002917051315307617, 0.0007450580596923828, 0.001198410987854004, 0.001651763916015625, 0.002105116844177246, 0.002558469772338867, 0.0030118227005004883, 0.0034651756286621094, 0.0039185285568237305, 0.0043718814849853516, 0.004825234413146973, 0.005278587341308594, 0.005731940269470215, 0.006185293197631836, 0.006638646125793457, 0.007091999053955078, 0.007545351982116699, 0.00799870491027832, 0.008452057838439941, 0.008905410766601562, 0.009358763694763184, 0.009812116622924805, 0.010265469551086426, 0.010718822479248047, 0.011172175407409668, 0.011625528335571289, 0.01207888126373291, 0.012532234191894531, 0.012985587120056152, 0.013438940048217773, 0.013892292976379395, 0.014345645904541016, 0.014798998832702637, 0.015252351760864258, 0.01570570468902588, 0.0161590576171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 19.0, 37.0, 70.0, 99.0, 142.0, 177.0, 145.0, 126.0, 70.0, 50.0, 18.0, 19.0, 10.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012861154973506927, -0.0011907619191333652, -0.0010954084573313594, -0.0010000548791140318, -0.000904701417312026, -0.0008093478390946984, -0.0007139943190850317, -0.0006186407990753651, -0.0005232872790656984, -0.0004279337590560317, -0.000332580239046365, -0.00023722668993286788, -0.0001418731699232012, -4.651964991353452e-05, 4.8833899199962616e-05, 0.0001441874192096293, 0.00023954093921929598, 0.00033489445922896266, 0.00043024797923862934, 0.0005256015574559569, 0.0006209550192579627, 0.0007163085974752903, 0.000811662117484957, 0.0009070156374946237, 0.0010023692157119513, 0.0010977227939292789, 0.0011930762557312846, 0.0012884298339486122, 0.001383783295750618, 0.0014791368739679456, 0.0015744904521852732, 0.001669843913987279, 0.0017651973757892847, 0.0018605509540066123, 0.00195590453222394, 0.0020512579940259457, 0.0021466114558279514, 0.002241964917629957, 0.0023373186122626066, 0.0024326720740646124, 0.002528025535866618, 0.002623378997668624, 0.0027187326923012733, 0.002814086154103279, 0.002909439615905285, 0.0030047930777072906, 0.00310014677233994, 0.003195500234141946, 0.0032908539287745953, 0.003386207390576601, 0.0034815610852092505, 0.0035769145470112562, 0.003672268008813262, 0.0037676214706152678, 0.003862975165247917, 0.003958328627049923, 0.004053682088851929, 0.0041490355506539345, 0.00424438901245594, 0.004339742474257946, 0.004435096401721239, 0.004530449863523245, 0.004625803325325251, 0.004721156787127256, 0.004816510248929262]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 9.0, 18.0, 17.0, 28.0, 26.0, 23.0, 26.0, 30.0, 38.0, 34.0, 49.0, 58.0, 48.0, 39.0, 36.0, 33.0, 53.0, 41.0, 40.0, 35.0, 32.0, 30.0, 36.0, 30.0, 29.0, 27.0, 26.0, 15.0, 17.0, 12.0, 5.0, 6.0, 4.0, 4.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011513829231262207, -0.0011114394292235374, -0.0010714959353208542, -0.001031552441418171, -0.0009916089475154877, -0.0009516654536128044, -0.0009117219597101212, -0.0008717784658074379, -0.0008318349719047546, -0.0007918914780020714, -0.0007519479840993881, -0.0007120044901967049, -0.0006720609962940216, -0.0006321175023913383, -0.0005921740084886551, -0.0005522305145859718, -0.0005122870206832886, -0.0004723435267806053, -0.00043240003287792206, -0.0003924565389752388, -0.00035251304507255554, -0.0003125695511698723, -0.000272626057267189, -0.00023268256336450577, -0.0001927390694618225, -0.00015279557555913925, -0.000112852081656456, -7.290858775377274e-05, -3.296509385108948e-05, 6.9784000515937805e-06, 4.692189395427704e-05, 8.68653878569603e-05, 0.00012680888175964355, 0.0001667523756623268, 0.00020669586956501007, 0.00024663936346769333, 0.0002865828573703766, 0.00032652635127305984, 0.0003664698451757431, 0.00040641333907842636, 0.0004463568329811096, 0.0004863003268837929, 0.0005262438207864761, 0.0005661873146891594, 0.0006061308085918427, 0.0006460743024945259, 0.0006860177963972092, 0.0007259612902998924, 0.0007659047842025757, 0.0008058482781052589, 0.0008457917720079422, 0.0008857352659106255, 0.0009256787598133087, 0.000965622253715992, 0.0010055657476186752, 0.0010455092415213585, 0.0010854527354240417, 0.001125396229326725, 0.0011653397232294083, 0.0012052832171320915, 0.0012452267110347748, 0.001285170204937458, 0.0013251136988401413, 0.0013650571927428246, 0.0014050006866455078]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 14.0, 17.0, 9.0, 19.0, 24.0, 17.0, 33.0, 28.0, 39.0, 35.0, 38.0, 43.0, 44.0, 45.0, 44.0, 51.0, 51.0, 46.0, 43.0, 36.0, 39.0, 33.0, 26.0, 24.0, 26.0, 25.0, 24.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.6982421875, -37.365234375, -36.0322265625, -34.69921875, -33.3662109375, -32.033203125, -30.7001953125, -29.3671875, -28.0341796875, -26.701171875, -25.3681640625, -24.03515625, -22.7021484375, -21.369140625, -20.0361328125, -18.703125, -17.3701171875, -16.037109375, -14.7041015625, -13.37109375, -12.0380859375, -10.705078125, -9.3720703125, -8.0390625, -6.7060546875, -5.373046875, -4.0400390625, -2.70703125, -1.3740234375, -0.041015625, 1.2919921875, 2.625, 3.9580078125, 5.291015625, 6.6240234375, 7.95703125, 9.2900390625, 10.623046875, 11.9560546875, 13.2890625, 14.6220703125, 15.955078125, 17.2880859375, 18.62109375, 19.9541015625, 21.287109375, 22.6201171875, 23.953125, 25.2861328125, 26.619140625, 27.9521484375, 29.28515625, 30.6181640625, 31.951171875, 33.2841796875, 34.6171875, 35.9501953125, 37.283203125, 38.6162109375, 39.94921875, 41.2822265625, 42.615234375, 43.9482421875, 45.28125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 6.0, 6.0, 20.0, 22.0, 25.0, 52.0, 52.0, 98.0, 142.0, 239.0, 398.0, 684.0, 1265.0, 2582.0, 6308.0, 19585.0, 83851.0, 404437.0, 410750.0, 86228.0, 19923.0, 6230.0, 2633.0, 1224.0, 648.0, 398.0, 241.0, 150.0, 101.0, 74.0, 49.0, 27.0, 40.0, 12.0, 11.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.109375, -8.86322021484375, -8.6170654296875, -8.37091064453125, -8.124755859375, -7.87860107421875, -7.6324462890625, -7.38629150390625, -7.14013671875, -6.89398193359375, -6.6478271484375, -6.40167236328125, -6.155517578125, -5.90936279296875, -5.6632080078125, -5.41705322265625, -5.1708984375, -4.92474365234375, -4.6785888671875, -4.43243408203125, -4.186279296875, -3.94012451171875, -3.6939697265625, -3.44781494140625, -3.20166015625, -2.95550537109375, -2.7093505859375, -2.46319580078125, -2.217041015625, -1.97088623046875, -1.7247314453125, -1.47857666015625, -1.232421875, -0.98626708984375, -0.7401123046875, -0.49395751953125, -0.247802734375, -0.00164794921875, 0.2445068359375, 0.49066162109375, 0.73681640625, 0.98297119140625, 1.2291259765625, 1.47528076171875, 1.721435546875, 1.96759033203125, 2.2137451171875, 2.45989990234375, 2.7060546875, 2.95220947265625, 3.1983642578125, 3.44451904296875, 3.690673828125, 3.93682861328125, 4.1829833984375, 4.42913818359375, 4.67529296875, 4.92144775390625, 5.1676025390625, 5.41375732421875, 5.659912109375, 5.90606689453125, 6.1522216796875, 6.39837646484375, 6.64453125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 5.0, 13.0, 17.0, 16.0, 25.0, 27.0, 35.0, 38.0, 32.0, 48.0, 59.0, 52.0, 66.0, 2113.0, 64.0, 60.0, 57.0, 63.0, 50.0, 37.0, 37.0, 27.0, 22.0, 19.0, 10.0, 14.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.625, -73.0703125, -70.515625, -67.9609375, -65.40625, -62.8515625, -60.296875, -57.7421875, -55.1875, -52.6328125, -50.078125, -47.5234375, -44.96875, -42.4140625, -39.859375, -37.3046875, -34.75, -32.1953125, -29.640625, -27.0859375, -24.53125, -21.9765625, -19.421875, -16.8671875, -14.3125, -11.7578125, -9.203125, -6.6484375, -4.09375, -1.5390625, 1.015625, 3.5703125, 6.125, 8.6796875, 11.234375, 13.7890625, 16.34375, 18.8984375, 21.453125, 24.0078125, 26.5625, 29.1171875, 31.671875, 34.2265625, 36.78125, 39.3359375, 41.890625, 44.4453125, 47.0, 49.5546875, 52.109375, 54.6640625, 57.21875, 59.7734375, 62.328125, 64.8828125, 67.4375, 69.9921875, 72.546875, 75.1015625, 77.65625, 80.2109375, 82.765625, 85.3203125, 87.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 5.0, 4.0, 9.0, 8.0, 20.0, 29.0, 35.0, 66.0, 87.0, 121.0, 171.0, 264.0, 347.0, 582.0, 949.0, 2060.0, 5759.0, 38899.0, 2370507.0, 681233.0, 34807.0, 5205.0, 1840.0, 955.0, 560.0, 376.0, 228.0, 167.0, 127.0, 74.0, 59.0, 40.0, 26.0, 17.0, 8.0, 8.0, 9.0, 8.0, 3.0, 2.0, 10.0, 1.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-12.6875, -12.302734375, -11.91796875, -11.533203125, -11.1484375, -10.763671875, -10.37890625, -9.994140625, -9.609375, -9.224609375, -8.83984375, -8.455078125, -8.0703125, -7.685546875, -7.30078125, -6.916015625, -6.53125, -6.146484375, -5.76171875, -5.376953125, -4.9921875, -4.607421875, -4.22265625, -3.837890625, -3.453125, -3.068359375, -2.68359375, -2.298828125, -1.9140625, -1.529296875, -1.14453125, -0.759765625, -0.375, 0.009765625, 0.39453125, 0.779296875, 1.1640625, 1.548828125, 1.93359375, 2.318359375, 2.703125, 3.087890625, 3.47265625, 3.857421875, 4.2421875, 4.626953125, 5.01171875, 5.396484375, 5.78125, 6.166015625, 6.55078125, 6.935546875, 7.3203125, 7.705078125, 8.08984375, 8.474609375, 8.859375, 9.244140625, 9.62890625, 10.013671875, 10.3984375, 10.783203125, 11.16796875, 11.552734375, 11.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 8.0, 20.0, 27.0, 56.0, 81.0, 108.0, 156.0, 154.0, 127.0, 92.0, 55.0, 34.0, 18.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-111.04193878173828, -107.97674560546875, -104.91155242919922, -101.84636688232422, -98.78117370605469, -95.71598052978516, -92.65078735351562, -89.58560180664062, -86.5204086303711, -83.45521545410156, -80.39002227783203, -77.32483673095703, -74.2596435546875, -71.19445037841797, -68.12925720214844, -65.06407165527344, -61.99887466430664, -58.93368148803711, -55.868492126464844, -52.80329895019531, -49.73810958862305, -46.672916412353516, -43.60772705078125, -40.54253387451172, -37.47734069824219, -34.412147521972656, -31.34695816040039, -28.28176498413086, -25.216575622558594, -22.151382446289062, -19.086191177368164, -16.020999908447266, -12.955810546875, -9.890619277954102, -6.825427532196045, -3.7602357864379883, -0.6950445175170898, 2.3701467514038086, 5.435338973999023, 8.500530242919922, 11.56572151184082, 14.630912780761719, 17.696104049682617, 20.761295318603516, 23.826488494873047, 26.891677856445312, 29.956871032714844, 33.022064208984375, 36.08725357055664, 39.15244674682617, 42.21763610839844, 45.28282928466797, 48.348018646240234, 51.413211822509766, 54.47840118408203, 57.54359436035156, 60.608787536621094, 63.673980712890625, 66.73917388916016, 69.80435943603516, 72.86955261230469, 75.93474578857422, 78.99993896484375, 82.06512451171875, 85.13031768798828]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 8.0, 3.0, 4.0, 8.0, 5.0, 8.0, 16.0, 13.0, 22.0, 34.0, 27.0, 29.0, 33.0, 31.0, 34.0, 55.0, 55.0, 56.0, 51.0, 59.0, 51.0, 55.0, 51.0, 40.0, 41.0, 35.0, 27.0, 29.0, 24.0, 20.0, 18.0, 9.0, 7.0, 11.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.08335876464844, -81.07108306884766, -78.05879974365234, -75.04652404785156, -72.03424072265625, -69.02196502685547, -66.00968933105469, -62.99740982055664, -59.985130310058594, -56.97285079956055, -53.9605712890625, -50.94829559326172, -47.93601608276367, -44.923736572265625, -41.911460876464844, -38.8991813659668, -35.88690185546875, -32.8746223449707, -29.86234474182129, -26.850067138671875, -23.837787628173828, -20.82550811767578, -17.813230514526367, -14.800952911376953, -11.788673400878906, -8.776394844055176, -5.764116287231445, -2.751837730407715, 0.2604408264160156, 3.272719383239746, 6.284997940063477, 9.29727554321289, 12.309555053710938, 15.321833610534668, 18.3341121673584, 21.346389770507812, 24.35866928100586, 27.370948791503906, 30.38322639465332, 33.395503997802734, 36.40778350830078, 39.42006301879883, 42.432342529296875, 45.444618225097656, 48.4568977355957, 51.46917724609375, 54.48145294189453, 57.49373245239258, 60.506011962890625, 63.51829147338867, 66.53057098388672, 69.5428466796875, 72.55513000488281, 75.5674057006836, 78.57968139648438, 81.59196472167969, 84.60424041748047, 87.61651611328125, 90.62879943847656, 93.64107513427734, 96.65335083007812, 99.66563415527344, 102.67790985107422, 105.690185546875, 108.70246887207031]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 18.0, 13.0, 15.0, 30.0, 33.0, 62.0, 79.0, 128.0, 216.0, 364.0, 578.0, 1003.0, 1629.0, 2505.0, 4026.0, 6529.0, 1014182.0, 6573.0, 3903.0, 2553.0, 1560.0, 973.0, 572.0, 330.0, 214.0, 150.0, 105.0, 69.0, 38.0, 37.0, 14.0, 20.0, 10.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.47530746459961, -21.875869750976562, -21.276432037353516, -20.67699432373047, -20.077556610107422, -19.478118896484375, -18.878681182861328, -18.27924346923828, -17.679805755615234, -17.080368041992188, -16.48093032836914, -15.881492614746094, -15.282054901123047, -14.6826171875, -14.083179473876953, -13.483741760253906, -12.884303092956543, -12.284865379333496, -11.68542766571045, -11.085989952087402, -10.486552238464355, -9.887114524841309, -9.287675857543945, -8.688238143920898, -8.088800430297852, -7.489362716674805, -6.889925003051758, -6.290487289428711, -5.691049575805664, -5.091611862182617, -4.492173671722412, -3.8927359580993652, -3.2932987213134766, -2.6938610076904297, -2.094423294067383, -1.4949853420257568, -0.89554762840271, -0.2961099147796631, 0.3033280372619629, 0.9027657508850098, 1.5022034645080566, 2.1016411781311035, 2.7010788917541504, 3.3005168437957764, 3.8999545574188232, 4.499392509460449, 5.098830223083496, 5.698267936706543, 6.29770565032959, 6.897143363952637, 7.496581077575684, 8.09601879119873, 8.695456504821777, 9.294894218444824, 9.894332885742188, 10.493770599365234, 11.093208312988281, 11.692646026611328, 12.292083740234375, 12.891521453857422, 13.490959167480469, 14.090396881103516, 14.689834594726562, 15.28927230834961, 15.888710021972656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 19.0, 23.0, 44.0, 56.0, 61.0, 141.0, 3677.0, 51458920.0, 193.0, 74.0, 31.0, 25.0, 21.0, 29.0, 21.0, 16.0, 18.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2878.673095703125, -2727.9326171875, -2577.192138671875, -2426.45166015625, -2275.71142578125, -2124.970703125, -1974.23046875, -1823.489990234375, -1672.74951171875, -1522.009033203125, -1371.2685546875, -1220.5281982421875, -1069.7877197265625, -919.0472412109375, -768.3068237304688, -617.56640625, -466.825927734375, -316.0854797363281, -165.34503173828125, -14.604583740234375, 136.1358642578125, 286.8763427734375, 437.61676025390625, 588.357177734375, 739.09765625, 889.838134765625, 1040.57861328125, 1191.3189697265625, 1342.0594482421875, 1492.7999267578125, 1643.540283203125, 1794.28076171875, 1945.02099609375, 2095.761474609375, 2246.501953125, 2397.242431640625, 2547.98291015625, 2698.72314453125, 2849.463623046875, 3000.2041015625, 3150.944580078125, 3301.68505859375, 3452.425537109375, 3603.166015625, 3753.90625, 3904.64697265625, 4055.38720703125, 4206.1279296875, 4356.8681640625, 4507.6083984375, 4658.34912109375, 4809.08935546875, 4959.830078125, 5110.5703125, 5261.31103515625, 5412.05126953125, 5562.7919921875, 5713.5322265625, 5864.27294921875, 6015.01318359375, 6165.75390625, 6316.494140625, 6467.23486328125, 6617.97509765625, 6768.71533203125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 3.0, 8.0, 9.0, 17.0, 18.0, 45.0, 66.0, 105.0, 147.0, 197.0, 290.0, 412.0, 640.0, 950.0, 1282.0, 1937.0, 2784.0, 4204.0, 6218.0, 9463.0, 14161.0, 21730.0, 33251.0, 52523.0, 85826.0, 145477.0, 268958.0, 670255.0, 3980681.0, 449581.0, 218233.0, 120667.0, 71686.0, 44560.0, 28543.0, 18471.0, 12185.0, 8070.0, 5657.0, 3669.0, 2647.0, 1753.0, 1293.0, 881.0, 541.0, 471.0, 238.0, 226.0, 104.0, 100.0, 68.0, 43.0, 20.0, 27.0, 19.0, 3.0, 16.0, 6.0, 3.0, 0.0, 6.0], "bins": [-3.53515625, -3.422332763671875, -3.30950927734375, -3.196685791015625, -3.0838623046875, -2.971038818359375, -2.85821533203125, -2.745391845703125, -2.632568359375, -2.519744873046875, -2.40692138671875, -2.294097900390625, -2.1812744140625, -2.068450927734375, -1.95562744140625, -1.842803955078125, -1.72998046875, -1.617156982421875, -1.50433349609375, -1.391510009765625, -1.2786865234375, -1.165863037109375, -1.05303955078125, -0.940216064453125, -0.827392578125, -0.714569091796875, -0.60174560546875, -0.488922119140625, -0.3760986328125, -0.263275146484375, -0.15045166015625, -0.037628173828125, 0.0751953125, 0.188018798828125, 0.30084228515625, 0.413665771484375, 0.5264892578125, 0.639312744140625, 0.75213623046875, 0.864959716796875, 0.977783203125, 1.090606689453125, 1.20343017578125, 1.316253662109375, 1.4290771484375, 1.541900634765625, 1.65472412109375, 1.767547607421875, 1.88037109375, 1.993194580078125, 2.10601806640625, 2.218841552734375, 2.3316650390625, 2.444488525390625, 2.55731201171875, 2.670135498046875, 2.782958984375, 2.895782470703125, 3.00860595703125, 3.121429443359375, 3.2342529296875, 3.347076416015625, 3.45989990234375, 3.572723388671875, 3.685546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 6.0, 1.0, 4.0, 6.0, 4.0, 2.0, 10.0, 10.0, 14.0, 11.0, 8.0, 13.0, 17.0, 16.0, 24.0, 34.0, 27.0, 43.0, 25.0, 34.0, 38.0, 31.0, 52.0, 71.0, 224.0, 702.0, 158.0, 47.0, 41.0, 41.0, 45.0, 32.0, 28.0, 26.0, 24.0, 20.0, 25.0, 23.0, 11.0, 13.0, 14.0, 10.0, 10.0, 6.0, 9.0, 3.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.1484375, -6.877685546875, -6.60693359375, -6.336181640625, -6.0654296875, -5.794677734375, -5.52392578125, -5.253173828125, -4.982421875, -4.711669921875, -4.44091796875, -4.170166015625, -3.8994140625, -3.628662109375, -3.35791015625, -3.087158203125, -2.81640625, -2.545654296875, -2.27490234375, -2.004150390625, -1.7333984375, -1.462646484375, -1.19189453125, -0.921142578125, -0.650390625, -0.379638671875, -0.10888671875, 0.161865234375, 0.4326171875, 0.703369140625, 0.97412109375, 1.244873046875, 1.515625, 1.786376953125, 2.05712890625, 2.327880859375, 2.5986328125, 2.869384765625, 3.14013671875, 3.410888671875, 3.681640625, 3.952392578125, 4.22314453125, 4.493896484375, 4.7646484375, 5.035400390625, 5.30615234375, 5.576904296875, 5.84765625, 6.118408203125, 6.38916015625, 6.659912109375, 6.9306640625, 7.201416015625, 7.47216796875, 7.742919921875, 8.013671875, 8.284423828125, 8.55517578125, 8.825927734375, 9.0966796875, 9.367431640625, 9.63818359375, 9.908935546875, 10.1796875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 9.0, 14.0, 9.0, 6.0, 26.0, 31.0, 32.0, 71.0, 85.0, 131.0, 185.0, 327.0, 462.0, 733.0, 1179.0, 1789.0, 2884.0, 4955.0, 8276.0, 14839.0, 25292.0, 45872.0, 87943.0, 175064.0, 413169.0, 4056166.0, 903253.0, 274324.0, 126114.0, 64995.0, 34977.0, 19790.0, 11287.0, 6506.0, 3972.0, 2333.0, 1562.0, 943.0, 644.0, 409.0, 229.0, 177.0, 117.0, 76.0, 67.0, 38.0, 25.0, 11.0, 14.0, 9.0, 7.0, 1.0, 8.0, 3.0, 0.0, 0.0, 3.0], "bins": [-6.0234375, -5.83966064453125, -5.6558837890625, -5.47210693359375, -5.288330078125, -5.10455322265625, -4.9207763671875, -4.73699951171875, -4.55322265625, -4.36944580078125, -4.1856689453125, -4.00189208984375, -3.818115234375, -3.63433837890625, -3.4505615234375, -3.26678466796875, -3.0830078125, -2.89923095703125, -2.7154541015625, -2.53167724609375, -2.347900390625, -2.16412353515625, -1.9803466796875, -1.79656982421875, -1.61279296875, -1.42901611328125, -1.2452392578125, -1.06146240234375, -0.877685546875, -0.69390869140625, -0.5101318359375, -0.32635498046875, -0.142578125, 0.04119873046875, 0.2249755859375, 0.40875244140625, 0.592529296875, 0.77630615234375, 0.9600830078125, 1.14385986328125, 1.32763671875, 1.51141357421875, 1.6951904296875, 1.87896728515625, 2.062744140625, 2.24652099609375, 2.4302978515625, 2.61407470703125, 2.7978515625, 2.98162841796875, 3.1654052734375, 3.34918212890625, 3.532958984375, 3.71673583984375, 3.9005126953125, 4.08428955078125, 4.26806640625, 4.45184326171875, 4.6356201171875, 4.81939697265625, 5.003173828125, 5.18695068359375, 5.3707275390625, 5.55450439453125, 5.73828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 13.0, 16.0, 7.0, 14.0, 27.0, 20.0, 38.0, 27.0, 26.0, 39.0, 50.0, 59.0, 79.0, 144.0, 560.0, 388.0, 101.0, 61.0, 46.0, 40.0, 40.0, 36.0, 36.0, 33.0, 20.0, 21.0, 19.0, 11.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4537353515625, -8.188720703125, -7.9237060546875, -7.65869140625, -7.3936767578125, -7.128662109375, -6.8636474609375, -6.5986328125, -6.3336181640625, -6.068603515625, -5.8035888671875, -5.53857421875, -5.2735595703125, -5.008544921875, -4.7435302734375, -4.478515625, -4.2135009765625, -3.948486328125, -3.6834716796875, -3.41845703125, -3.1534423828125, -2.888427734375, -2.6234130859375, -2.3583984375, -2.0933837890625, -1.828369140625, -1.5633544921875, -1.29833984375, -1.0333251953125, -0.768310546875, -0.5032958984375, -0.23828125, 0.0267333984375, 0.291748046875, 0.5567626953125, 0.82177734375, 1.0867919921875, 1.351806640625, 1.6168212890625, 1.8818359375, 2.1468505859375, 2.411865234375, 2.6768798828125, 2.94189453125, 3.2069091796875, 3.471923828125, 3.7369384765625, 4.001953125, 4.2669677734375, 4.531982421875, 4.7969970703125, 5.06201171875, 5.3270263671875, 5.592041015625, 5.8570556640625, 6.1220703125, 6.3870849609375, 6.652099609375, 6.9171142578125, 7.18212890625, 7.4471435546875, 7.712158203125, 7.9771728515625, 8.2421875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 7.0, 0.0, 22.0, 32.0, 27.0, 23.0, 37.0, 36.0, 52.0, 110.0, 139.0, 207.0, 201.0, 197.0, 350.0, 550.0, 713.0, 900.0, 1481.0, 2248.0, 3271.0, 6101.0, 11756.0, 26628.0, 86872.0, 5900256.0, 174958.0, 38521.0, 15504.0, 7640.0, 4237.0, 2670.0, 1566.0, 1210.0, 785.0, 505.0, 387.0, 313.0, 244.0, 130.0, 136.0, 88.0, 83.0, 85.0, 39.0, 47.0, 8.0, 12.0, 4.0, 10.0, 23.0, 12.0, 0.0, 0.0, 3.0, 6.0], "bins": [-14.4296875, -14.0013427734375, -13.572998046875, -13.1446533203125, -12.71630859375, -12.2879638671875, -11.859619140625, -11.4312744140625, -11.0029296875, -10.5745849609375, -10.146240234375, -9.7178955078125, -9.28955078125, -8.8612060546875, -8.432861328125, -8.0045166015625, -7.576171875, -7.1478271484375, -6.719482421875, -6.2911376953125, -5.86279296875, -5.4344482421875, -5.006103515625, -4.5777587890625, -4.1494140625, -3.7210693359375, -3.292724609375, -2.8643798828125, -2.43603515625, -2.0076904296875, -1.579345703125, -1.1510009765625, -0.72265625, -0.2943115234375, 0.134033203125, 0.5623779296875, 0.99072265625, 1.4190673828125, 1.847412109375, 2.2757568359375, 2.7041015625, 3.1324462890625, 3.560791015625, 3.9891357421875, 4.41748046875, 4.8458251953125, 5.274169921875, 5.7025146484375, 6.130859375, 6.5592041015625, 6.987548828125, 7.4158935546875, 7.84423828125, 8.2725830078125, 8.700927734375, 9.1292724609375, 9.5576171875, 9.9859619140625, 10.414306640625, 10.8426513671875, 11.27099609375, 11.6993408203125, 12.127685546875, 12.5560302734375, 12.984375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 5.0, 3.0, 10.0, 7.0, 12.0, 17.0, 16.0, 21.0, 16.0, 22.0, 22.0, 23.0, 35.0, 45.0, 41.0, 50.0, 71.0, 103.0, 190.0, 460.0, 251.0, 126.0, 68.0, 50.0, 44.0, 44.0, 37.0, 30.0, 25.0, 21.0, 23.0, 26.0, 21.0, 8.0, 11.0, 13.0, 16.0, 12.0, 9.0, 5.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.18359375, -5.0343017578125, -4.885009765625, -4.7357177734375, -4.58642578125, -4.4371337890625, -4.287841796875, -4.1385498046875, -3.9892578125, -3.8399658203125, -3.690673828125, -3.5413818359375, -3.39208984375, -3.2427978515625, -3.093505859375, -2.9442138671875, -2.794921875, -2.6456298828125, -2.496337890625, -2.3470458984375, -2.19775390625, -2.0484619140625, -1.899169921875, -1.7498779296875, -1.6005859375, -1.4512939453125, -1.302001953125, -1.1527099609375, -1.00341796875, -0.8541259765625, -0.704833984375, -0.5555419921875, -0.40625, -0.2569580078125, -0.107666015625, 0.0416259765625, 0.19091796875, 0.3402099609375, 0.489501953125, 0.6387939453125, 0.7880859375, 0.9373779296875, 1.086669921875, 1.2359619140625, 1.38525390625, 1.5345458984375, 1.683837890625, 1.8331298828125, 1.982421875, 2.1317138671875, 2.281005859375, 2.4302978515625, 2.57958984375, 2.7288818359375, 2.878173828125, 3.0274658203125, 3.1767578125, 3.3260498046875, 3.475341796875, 3.6246337890625, 3.77392578125, 3.9232177734375, 4.072509765625, 4.2218017578125, 4.37109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 16.0, 29.0, 50.0, 69.0, 131.0, 364.0, 170.0, 68.0, 53.0, 20.0, 4.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03418731689453, -19.437789916992188, -18.84139060974121, -18.244993209838867, -17.648595809936523, -17.052196502685547, -16.455799102783203, -15.85940170288086, -15.2630033493042, -14.666604995727539, -14.070207595825195, -13.473809242248535, -12.877410888671875, -12.281013488769531, -11.684615135192871, -11.088216781616211, -10.491819381713867, -9.895421028137207, -9.299023628234863, -8.702625274658203, -8.10622787475586, -7.509829521179199, -6.913431167602539, -6.317033290863037, -5.720635414123535, -5.124237537384033, -4.527839660644531, -3.931441307067871, -3.335043430328369, -2.738645553588867, -2.142247438430786, -1.545849323272705, -0.9494514465332031, -0.3530534505844116, 0.24334454536437988, 0.8397425413131714, 1.436140537261963, 2.032538414001465, 2.628936529159546, 3.225334644317627, 3.821732521057129, 4.418130397796631, 5.014528274536133, 5.610926628112793, 6.207324504852295, 6.803722381591797, 7.400120735168457, 7.996518611907959, 8.592916488647461, 9.189314842224121, 9.785712242126465, 10.382110595703125, 10.978507995605469, 11.574906349182129, 12.171304702758789, 12.767702102661133, 13.364100456237793, 13.960498809814453, 14.556896209716797, 15.153294563293457, 15.749692916870117, 16.34609031677246, 16.942487716674805, 17.53888702392578, 18.135284423828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 6.0, 8.0, 16.0, 20.0, 19.0, 21.0, 22.0, 26.0, 23.0, 30.0, 41.0, 36.0, 42.0, 48.0, 48.0, 42.0, 49.0, 43.0, 32.0, 37.0, 39.0, 40.0, 29.0, 40.0, 24.0, 34.0, 22.0, 26.0, 19.0, 16.0, 20.0, 17.0, 13.0, 13.0, 3.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.480586051940918, -6.259017467498779, -6.037448406219482, -5.815879821777344, -5.594310760498047, -5.372742176055908, -5.151173114776611, -4.929604530334473, -4.708035469055176, -4.486466884613037, -4.26489782333374, -4.043329238891602, -3.8217601776123047, -3.600191593170166, -3.378622531890869, -3.1570539474487305, -2.9354851245880127, -2.713916301727295, -2.492347478866577, -2.2707786560058594, -2.0492098331451416, -1.8276411294937134, -1.6060723066329956, -1.3845034837722778, -1.16293466091156, -0.9413658380508423, -0.7197970151901245, -0.4982282519340515, -0.27665942907333374, -0.05509066581726074, 0.16647815704345703, 0.3880469799041748, 0.6096158027648926, 0.8311846256256104, 1.0527534484863281, 1.274322271347046, 1.4958910942077637, 1.717459797859192, 1.9390286207199097, 2.160597324371338, 2.3821663856506348, 2.6037352085113525, 2.8253040313720703, 3.046872854232788, 3.268441677093506, 3.4900102615356445, 3.7115793228149414, 3.93314790725708, 4.154716491699219, 4.376285076141357, 4.597854137420654, 4.819422721862793, 5.04099178314209, 5.2625603675842285, 5.484129428863525, 5.705698013305664, 5.927267074584961, 6.1488356590271, 6.3704047203063965, 6.591973304748535, 6.813542366027832, 7.035110950469971, 7.256680011749268, 7.478248596191406, 7.699817657470703]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 6.0, 15.0, 9.0, 17.0, 23.0, 26.0, 25.0, 42.0, 84.0, 80.0, 113.0, 164.0, 264.0, 376.0, 535.0, 871.0, 1559.0, 3267.0, 8737.0, 32905.0, 3847217.0, 263781.0, 22978.0, 5919.0, 2298.0, 1127.0, 632.0, 369.0, 265.0, 167.0, 100.0, 83.0, 63.0, 42.0, 26.0, 14.0, 28.0, 12.0, 6.0, 7.0, 4.0, 7.0, 5.0, 5.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0196533203125, -0.01894974708557129, -0.018246173858642578, -0.017542600631713867, -0.016839027404785156, -0.016135454177856445, -0.015431880950927734, -0.014728307723999023, -0.014024734497070312, -0.013321161270141602, -0.01261758804321289, -0.01191401481628418, -0.011210441589355469, -0.010506868362426758, -0.009803295135498047, -0.009099721908569336, -0.008396148681640625, -0.007692575454711914, -0.006989002227783203, -0.006285429000854492, -0.005581855773925781, -0.00487828254699707, -0.004174709320068359, -0.0034711360931396484, -0.0027675628662109375, -0.0020639896392822266, -0.0013604164123535156, -0.0006568431854248047, 4.673004150390625e-05, 0.0007503032684326172, 0.0014538764953613281, 0.002157449722290039, 0.00286102294921875, 0.003564596176147461, 0.004268169403076172, 0.004971742630004883, 0.005675315856933594, 0.006378889083862305, 0.007082462310791016, 0.0077860355377197266, 0.008489608764648438, 0.009193181991577148, 0.00989675521850586, 0.01060032844543457, 0.011303901672363281, 0.012007474899291992, 0.012711048126220703, 0.013414621353149414, 0.014118194580078125, 0.014821767807006836, 0.015525341033935547, 0.016228914260864258, 0.01693248748779297, 0.01763606071472168, 0.01833963394165039, 0.0190432071685791, 0.019746780395507812, 0.020450353622436523, 0.021153926849365234, 0.021857500076293945, 0.022561073303222656, 0.023264646530151367, 0.023968219757080078, 0.02467179298400879, 0.0253753662109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 10.0, 7.0, 12.0, 10.0, 15.0, 13.0, 31.0, 753.0, 22.0, 12.0, 7.0, 14.0, 10.0, 4.0, 6.0, 7.0, 5.0, 4.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014944076538085938, -0.0014466643333435059, -0.001398921012878418, -0.00135117769241333, -0.0013034343719482422, -0.0012556910514831543, -0.0012079477310180664, -0.0011602044105529785, -0.0011124610900878906, -0.0010647177696228027, -0.0010169744491577148, -0.000969231128692627, -0.0009214878082275391, -0.0008737444877624512, -0.0008260011672973633, -0.0007782578468322754, -0.0007305145263671875, -0.0006827712059020996, -0.0006350278854370117, -0.0005872845649719238, -0.0005395412445068359, -0.000491797924041748, -0.00044405460357666016, -0.00039631128311157227, -0.0003485679626464844, -0.0003008246421813965, -0.0002530813217163086, -0.0002053380012512207, -0.0001575946807861328, -0.00010985136032104492, -6.210803985595703e-05, -1.436471939086914e-05, 3.337860107421875e-05, 8.112192153930664e-05, 0.00012886524200439453, 0.00017660856246948242, 0.0002243518829345703, 0.0002720952033996582, 0.0003198385238647461, 0.000367581844329834, 0.0004153251647949219, 0.00046306848526000977, 0.0005108118057250977, 0.0005585551261901855, 0.0006062984466552734, 0.0006540417671203613, 0.0007017850875854492, 0.0007495284080505371, 0.000797271728515625, 0.0008450150489807129, 0.0008927583694458008, 0.0009405016899108887, 0.0009882450103759766, 0.0010359883308410645, 0.0010837316513061523, 0.0011314749717712402, 0.0011792182922363281, 0.001226961612701416, 0.001274704933166504, 0.0013224482536315918, 0.0013701915740966797, 0.0014179348945617676, 0.0014656782150268555, 0.0015134215354919434, 0.0015611648559570312]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 6.0, 11.0, 14.0, 21.0, 26.0, 38.0, 49.0, 58.0, 73.0, 118.0, 179.0, 275.0, 421.0, 762.0, 1422.0, 3273.0, 11801.0, 133313.0, 3877668.0, 145607.0, 12274.0, 3382.0, 1412.0, 754.0, 423.0, 252.0, 188.0, 127.0, 91.0, 68.0, 34.0, 30.0, 25.0, 21.0, 14.0, 9.0, 9.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.024169921875, -0.023448705673217773, -0.022727489471435547, -0.02200627326965332, -0.021285057067871094, -0.020563840866088867, -0.01984262466430664, -0.019121408462524414, -0.018400192260742188, -0.01767897605895996, -0.016957759857177734, -0.016236543655395508, -0.015515327453613281, -0.014794111251831055, -0.014072895050048828, -0.013351678848266602, -0.012630462646484375, -0.011909246444702148, -0.011188030242919922, -0.010466814041137695, -0.009745597839355469, -0.009024381637573242, -0.008303165435791016, -0.007581949234008789, -0.0068607330322265625, -0.006139516830444336, -0.005418300628662109, -0.004697084426879883, -0.003975868225097656, -0.0032546520233154297, -0.002533435821533203, -0.0018122196197509766, -0.00109100341796875, -0.00036978721618652344, 0.0003514289855957031, 0.0010726451873779297, 0.0017938613891601562, 0.002515077590942383, 0.0032362937927246094, 0.003957509994506836, 0.0046787261962890625, 0.005399942398071289, 0.006121158599853516, 0.006842374801635742, 0.007563591003417969, 0.008284807205200195, 0.009006023406982422, 0.009727239608764648, 0.010448455810546875, 0.011169672012329102, 0.011890888214111328, 0.012612104415893555, 0.013333320617675781, 0.014054536819458008, 0.014775753021240234, 0.015496969223022461, 0.016218185424804688, 0.016939401626586914, 0.01766061782836914, 0.018381834030151367, 0.019103050231933594, 0.01982426643371582, 0.020545482635498047, 0.021266698837280273, 0.0219879150390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 9.0, 9.0, 15.0, 12.0, 22.0, 21.0, 36.0, 32.0, 51.0, 66.0, 104.0, 120.0, 167.0, 193.0, 302.0, 570.0, 967.0, 401.0, 239.0, 183.0, 144.0, 79.0, 69.0, 55.0, 51.0, 29.0, 40.0, 22.0, 10.0, 8.0, 9.0, 10.0, 8.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0025920867919921875, -0.0025163888931274414, -0.0024406909942626953, -0.0023649930953979492, -0.002289295196533203, -0.002213597297668457, -0.002137899398803711, -0.002062201499938965, -0.0019865036010742188, -0.0019108057022094727, -0.0018351078033447266, -0.0017594099044799805, -0.0016837120056152344, -0.0016080141067504883, -0.0015323162078857422, -0.001456618309020996, -0.00138092041015625, -0.001305222511291504, -0.0012295246124267578, -0.0011538267135620117, -0.0010781288146972656, -0.0010024309158325195, -0.0009267330169677734, -0.0008510351181030273, -0.0007753372192382812, -0.0006996393203735352, -0.0006239414215087891, -0.000548243522644043, -0.0004725456237792969, -0.0003968477249145508, -0.0003211498260498047, -0.0002454519271850586, -0.0001697540283203125, -9.40561294555664e-05, -1.8358230590820312e-05, 5.733966827392578e-05, 0.00013303756713867188, 0.00020873546600341797, 0.00028443336486816406, 0.00036013126373291016, 0.00043582916259765625, 0.0005115270614624023, 0.0005872249603271484, 0.0006629228591918945, 0.0007386207580566406, 0.0008143186569213867, 0.0008900165557861328, 0.0009657144546508789, 0.001041412353515625, 0.001117110252380371, 0.0011928081512451172, 0.0012685060501098633, 0.0013442039489746094, 0.0014199018478393555, 0.0014955997467041016, 0.0015712976455688477, 0.0016469955444335938, 0.0017226934432983398, 0.001798391342163086, 0.001874089241027832, 0.0019497871398925781, 0.0020254850387573242, 0.0021011829376220703, 0.0021768808364868164, 0.0022525787353515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 21.0, 24.0, 56.0, 145.0, 251.0, 268.0, 123.0, 55.0, 23.0, 12.0, 5.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887498751282692, -0.03776520863175392, -0.036655426025390625, -0.03554564714431763, -0.03443586453795433, -0.03332608565688133, -0.032216303050518036, -0.031106524169445038, -0.02999674342572689, -0.028886962682008743, -0.027777181938290596, -0.02666740119457245, -0.02555762231349945, -0.024447839707136154, -0.023338060826063156, -0.02222828008234501, -0.02111849933862686, -0.020008718594908714, -0.018898937851190567, -0.01778915710747242, -0.016679376363754272, -0.0155695965513587, -0.014459816738963127, -0.01335003599524498, -0.012240255251526833, -0.011130474507808685, -0.010020693764090538, -0.008910913951694965, -0.007801133207976818, -0.006691352464258671, -0.005581572186201811, -0.004471791908144951, -0.003362007439136505, -0.0022522269282490015, -0.0011424464173614979, -3.2665906473994255e-05, 0.0010771146044135094, 0.0021868953481316566, 0.0032966756261885166, 0.004406455904245377, 0.005516236647963524, 0.006626017391681671, 0.007735797669738531, 0.008845577947795391, 0.009955358691513538, 0.011065139435231686, 0.012174919247627258, 0.013284699991345406, 0.014394480735063553, 0.0155042614787817, 0.016614042222499847, 0.017723822966217995, 0.018833603709936142, 0.01994338259100914, 0.021053163334727287, 0.022162944078445435, 0.023272724822163582, 0.02438250556588173, 0.025492286309599876, 0.026602067053318024, 0.02771184593439102, 0.028821628540754318, 0.029931407421827316, 0.031041188165545464, 0.03215096890926361]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 7.0, 5.0, 4.0, 5.0, 7.0, 5.0, 12.0, 14.0, 10.0, 13.0, 12.0, 40.0, 28.0, 28.0, 47.0, 31.0, 49.0, 45.0, 33.0, 45.0, 54.0, 56.0, 47.0, 56.0, 46.0, 38.0, 39.0, 43.0, 29.0, 24.0, 26.0, 25.0, 17.0, 12.0, 8.0, 7.0, 4.0, 14.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010569870471954346, -0.010247211903333664, -0.009924553334712982, -0.0096018947660923, -0.009279236197471619, -0.008956577628850937, -0.008633919060230255, -0.008311260491609573, -0.007988601922988892, -0.00766594335436821, -0.007343284785747528, -0.007020626217126846, -0.0066979676485061646, -0.006375309079885483, -0.006052650511264801, -0.005729991942644119, -0.0054073333740234375, -0.005084674805402756, -0.004762016236782074, -0.004439357668161392, -0.0041166990995407104, -0.0037940405309200287, -0.003471381962299347, -0.003148723393678665, -0.0028260648250579834, -0.0025034062564373016, -0.00218074768781662, -0.0018580891191959381, -0.0015354305505752563, -0.0012127719819545746, -0.0008901134133338928, -0.0005674548447132111, -0.0002447962760925293, 7.786229252815247e-05, 0.00040052086114883423, 0.000723179429769516, 0.0010458379983901978, 0.0013684965670108795, 0.0016911551356315613, 0.002013813704252243, 0.002336472272872925, 0.0026591308414936066, 0.0029817894101142883, 0.00330444797873497, 0.003627106547355652, 0.003949765115976334, 0.004272423684597015, 0.004595082253217697, 0.004917740821838379, 0.005240399390459061, 0.005563057959079742, 0.005885716527700424, 0.006208375096321106, 0.006531033664941788, 0.0068536922335624695, 0.007176350802183151, 0.007499009370803833, 0.007821667939424515, 0.008144326508045197, 0.008466985076665878, 0.00878964364528656, 0.009112302213907242, 0.009434960782527924, 0.009757619351148605, 0.010080277919769287]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 17.0, 14.0, 24.0, 34.0, 38.0, 58.0, 90.0, 117.0, 147.0, 204.0, 290.0, 390.0, 628.0, 902.0, 1330.0, 2223.0, 3608.0, 6576.0, 13349.0, 35932.0, 873521.0, 71017.0, 17790.0, 8226.0, 4489.0, 2699.0, 1569.0, 988.0, 684.0, 476.0, 319.0, 210.0, 131.0, 112.0, 87.0, 64.0, 45.0, 28.0, 27.0, 23.0, 14.0, 12.0, 7.0, 15.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0169677734375, -0.01643204689025879, -0.015896320343017578, -0.015360593795776367, -0.014824867248535156, -0.014289140701293945, -0.013753414154052734, -0.013217687606811523, -0.012681961059570312, -0.012146234512329102, -0.01161050796508789, -0.01107478141784668, -0.010539054870605469, -0.010003328323364258, -0.009467601776123047, -0.008931875228881836, -0.008396148681640625, -0.007860422134399414, -0.007324695587158203, -0.006788969039916992, -0.006253242492675781, -0.00571751594543457, -0.005181789398193359, -0.0046460628509521484, -0.0041103363037109375, -0.0035746097564697266, -0.0030388832092285156, -0.0025031566619873047, -0.0019674301147460938, -0.0014317035675048828, -0.0008959770202636719, -0.00036025047302246094, 0.00017547607421875, 0.0007112026214599609, 0.0012469291687011719, 0.0017826557159423828, 0.0023183822631835938, 0.0028541088104248047, 0.0033898353576660156, 0.0039255619049072266, 0.0044612884521484375, 0.0049970149993896484, 0.005532741546630859, 0.00606846809387207, 0.006604194641113281, 0.007139921188354492, 0.007675647735595703, 0.008211374282836914, 0.008747100830078125, 0.009282827377319336, 0.009818553924560547, 0.010354280471801758, 0.010890007019042969, 0.01142573356628418, 0.01196146011352539, 0.012497186660766602, 0.013032913208007812, 0.013568639755249023, 0.014104366302490234, 0.014640092849731445, 0.015175819396972656, 0.015711545944213867, 0.016247272491455078, 0.01678299903869629, 0.0173187255859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 7.0, 4.0, 6.0, 8.0, 4.0, 7.0, 7.0, 12.0, 16.0, 29.0, 131.0, 377.0, 245.0, 45.0, 21.0, 14.0, 7.0, 9.0, 5.0, 2.0, 9.0, 4.0, 1.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015516281127929688, -0.0015009045600891113, -0.001450181007385254, -0.0013994574546813965, -0.001348733901977539, -0.0012980103492736816, -0.0012472867965698242, -0.0011965632438659668, -0.0011458396911621094, -0.001095116138458252, -0.0010443925857543945, -0.0009936690330505371, -0.0009429454803466797, -0.0008922219276428223, -0.0008414983749389648, -0.0007907748222351074, -0.00074005126953125, -0.0006893277168273926, -0.0006386041641235352, -0.0005878806114196777, -0.0005371570587158203, -0.0004864335060119629, -0.00043570995330810547, -0.00038498640060424805, -0.0003342628479003906, -0.0002835392951965332, -0.00023281574249267578, -0.00018209218978881836, -0.00013136863708496094, -8.064508438110352e-05, -2.9921531677246094e-05, 2.0802021026611328e-05, 7.152557373046875e-05, 0.00012224912643432617, 0.0001729726791381836, 0.00022369623184204102, 0.00027441978454589844, 0.00032514333724975586, 0.0003758668899536133, 0.0004265904426574707, 0.0004773139953613281, 0.0005280375480651855, 0.000578761100769043, 0.0006294846534729004, 0.0006802082061767578, 0.0007309317588806152, 0.0007816553115844727, 0.0008323788642883301, 0.0008831024169921875, 0.0009338259696960449, 0.0009845495223999023, 0.0010352730751037598, 0.0010859966278076172, 0.0011367201805114746, 0.001187443733215332, 0.0012381672859191895, 0.0012888908386230469, 0.0013396143913269043, 0.0013903379440307617, 0.0014410614967346191, 0.0014917850494384766, 0.001542508602142334, 0.0015932321548461914, 0.0016439557075500488, 0.0016946792602539062]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 8.0, 9.0, 15.0, 17.0, 18.0, 34.0, 50.0, 48.0, 88.0, 93.0, 164.0, 252.0, 342.0, 531.0, 761.0, 1231.0, 2167.0, 4180.0, 10363.0, 50879.0, 840122.0, 110396.0, 14726.0, 5235.0, 2656.0, 1446.0, 863.0, 535.0, 386.0, 271.0, 187.0, 141.0, 92.0, 67.0, 48.0, 41.0, 25.0, 17.0, 14.0, 10.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0266876220703125, -0.025870084762573242, -0.025052547454833984, -0.024235010147094727, -0.02341747283935547, -0.02259993553161621, -0.021782398223876953, -0.020964860916137695, -0.020147323608398438, -0.01932978630065918, -0.018512248992919922, -0.017694711685180664, -0.016877174377441406, -0.01605963706970215, -0.01524209976196289, -0.014424562454223633, -0.013607025146484375, -0.012789487838745117, -0.01197195053100586, -0.011154413223266602, -0.010336875915527344, -0.009519338607788086, -0.008701801300048828, -0.00788426399230957, -0.0070667266845703125, -0.006249189376831055, -0.005431652069091797, -0.004614114761352539, -0.0037965774536132812, -0.0029790401458740234, -0.0021615028381347656, -0.0013439655303955078, -0.00052642822265625, 0.0002911090850830078, 0.0011086463928222656, 0.0019261837005615234, 0.0027437210083007812, 0.003561258316040039, 0.004378795623779297, 0.005196332931518555, 0.0060138702392578125, 0.00683140754699707, 0.007648944854736328, 0.008466482162475586, 0.009284019470214844, 0.010101556777954102, 0.01091909408569336, 0.011736631393432617, 0.012554168701171875, 0.013371706008911133, 0.01418924331665039, 0.015006780624389648, 0.015824317932128906, 0.016641855239868164, 0.017459392547607422, 0.01827692985534668, 0.019094467163085938, 0.019912004470825195, 0.020729541778564453, 0.02154707908630371, 0.02236461639404297, 0.023182153701782227, 0.023999691009521484, 0.024817228317260742, 0.025634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 2.0, 6.0, 11.0, 24.0, 17.0, 24.0, 20.0, 17.0, 35.0, 29.0, 30.0, 35.0, 37.0, 41.0, 40.0, 32.0, 44.0, 27.0, 46.0, 43.0, 45.0, 48.0, 50.0, 37.0, 31.0, 32.0, 27.0, 26.0, 20.0, 10.0, 25.0, 15.0, 11.0, 11.0, 4.0, 7.0, 3.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006847381591796875, -0.006637156009674072, -0.0064269304275512695, -0.006216704845428467, -0.006006479263305664, -0.005796253681182861, -0.005586028099060059, -0.005375802516937256, -0.005165576934814453, -0.00495535135269165, -0.004745125770568848, -0.004534900188446045, -0.004324674606323242, -0.0041144490242004395, -0.0039042234420776367, -0.003693997859954834, -0.0034837722778320312, -0.0032735466957092285, -0.0030633211135864258, -0.002853095531463623, -0.0026428699493408203, -0.0024326443672180176, -0.002222418785095215, -0.002012193202972412, -0.0018019676208496094, -0.0015917420387268066, -0.001381516456604004, -0.0011712908744812012, -0.0009610652923583984, -0.0007508397102355957, -0.000540614128112793, -0.00033038854598999023, -0.0001201629638671875, 9.006261825561523e-05, 0.00030028820037841797, 0.0005105137825012207, 0.0007207393646240234, 0.0009309649467468262, 0.001141190528869629, 0.0013514161109924316, 0.0015616416931152344, 0.0017718672752380371, 0.00198209285736084, 0.0021923184394836426, 0.0024025440216064453, 0.002612769603729248, 0.0028229951858520508, 0.0030332207679748535, 0.0032434463500976562, 0.003453671932220459, 0.0036638975143432617, 0.0038741230964660645, 0.004084348678588867, 0.00429457426071167, 0.004504799842834473, 0.004715025424957275, 0.004925251007080078, 0.005135476589202881, 0.005345702171325684, 0.005555927753448486, 0.005766153335571289, 0.005976378917694092, 0.0061866044998168945, 0.006396830081939697, 0.0066070556640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 11.0, 21.0, 33.0, 49.0, 82.0, 126.0, 235.0, 591.0, 1517.0, 6355.0, 153795.0, 872177.0, 10137.0, 2012.0, 735.0, 309.0, 154.0, 78.0, 45.0, 25.0, 27.0, 11.0, 7.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03720664978027344, -0.036083221435546875, -0.03495979309082031, -0.03383636474609375, -0.03271293640136719, -0.031589508056640625, -0.030466079711914062, -0.0293426513671875, -0.028219223022460938, -0.027095794677734375, -0.025972366333007812, -0.02484893798828125, -0.023725509643554688, -0.022602081298828125, -0.021478652954101562, -0.020355224609375, -0.019231796264648438, -0.018108367919921875, -0.016984939575195312, -0.01586151123046875, -0.014738082885742188, -0.013614654541015625, -0.012491226196289062, -0.0113677978515625, -0.010244369506835938, -0.009120941162109375, -0.007997512817382812, -0.00687408447265625, -0.0057506561279296875, -0.004627227783203125, -0.0035037994384765625, -0.00238037109375, -0.0012569427490234375, -0.000133514404296875, 0.0009899139404296875, 0.00211334228515625, 0.0032367706298828125, 0.004360198974609375, 0.0054836273193359375, 0.0066070556640625, 0.0077304840087890625, 0.008853912353515625, 0.009977340698242188, 0.01110076904296875, 0.012224197387695312, 0.013347625732421875, 0.014471054077148438, 0.015594482421875, 0.016717910766601562, 0.017841339111328125, 0.018964767456054688, 0.02008819580078125, 0.021211624145507812, 0.022335052490234375, 0.023458480834960938, 0.0245819091796875, 0.025705337524414062, 0.026828765869140625, 0.027952194213867188, 0.02907562255859375, 0.030199050903320312, 0.031322479248046875, 0.03244590759277344, 0.0335693359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 8.0, 2.0, 9.0, 6.0, 18.0, 15.0, 30.0, 24.0, 34.0, 38.0, 54.0, 80.0, 148.0, 154.0, 83.0, 63.0, 50.0, 45.0, 30.0, 21.0, 21.0, 8.0, 15.0, 9.0, 4.0, 7.0, 0.0, 3.0, 5.0, 3.0, 1.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003353118896484375, -0.0032486021518707275, -0.00314408540725708, -0.0030395686626434326, -0.002935051918029785, -0.0028305351734161377, -0.0027260184288024902, -0.0026215016841888428, -0.0025169849395751953, -0.002412468194961548, -0.0023079514503479004, -0.002203434705734253, -0.0020989179611206055, -0.001994401216506958, -0.0018898844718933105, -0.001785367727279663, -0.0016808509826660156, -0.0015763342380523682, -0.0014718174934387207, -0.0013673007488250732, -0.0012627840042114258, -0.0011582672595977783, -0.0010537505149841309, -0.0009492337703704834, -0.0008447170257568359, -0.0007402002811431885, -0.000635683536529541, -0.0005311667919158936, -0.0004266500473022461, -0.00032213330268859863, -0.00021761655807495117, -0.00011309981346130371, -8.58306884765625e-06, 9.593367576599121e-05, 0.00020045042037963867, 0.00030496716499328613, 0.0004094839096069336, 0.0005140006542205811, 0.0006185173988342285, 0.000723034143447876, 0.0008275508880615234, 0.0009320676326751709, 0.0010365843772888184, 0.0011411011219024658, 0.0012456178665161133, 0.0013501346111297607, 0.0014546513557434082, 0.0015591681003570557, 0.0016636848449707031, 0.0017682015895843506, 0.001872718334197998, 0.0019772350788116455, 0.002081751823425293, 0.0021862685680389404, 0.002290785312652588, 0.0023953020572662354, 0.002499818801879883, 0.0026043355464935303, 0.0027088522911071777, 0.002813369035720825, 0.0029178857803344727, 0.00302240252494812, 0.0031269192695617676, 0.003231436014175415, 0.0033359527587890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 13.0, 25.0, 28.0, 35.0, 58.0, 83.0, 104.0, 178.0, 455.0, 806.0, 2521.0, 12330.0, 904569.0, 116749.0, 7190.0, 1893.0, 641.0, 331.0, 179.0, 119.0, 78.0, 38.0, 24.0, 14.0, 19.0, 15.0, 21.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.039581298828125, -0.03805065155029297, -0.03652000427246094, -0.034989356994628906, -0.033458709716796875, -0.031928062438964844, -0.030397415161132812, -0.02886676788330078, -0.02733612060546875, -0.02580547332763672, -0.024274826049804688, -0.022744178771972656, -0.021213531494140625, -0.019682884216308594, -0.018152236938476562, -0.01662158966064453, -0.0150909423828125, -0.013560295104980469, -0.012029647827148438, -0.010499000549316406, -0.008968353271484375, -0.007437705993652344, -0.0059070587158203125, -0.004376411437988281, -0.00284576416015625, -0.0013151168823242188, 0.0002155303955078125, 0.0017461776733398438, 0.003276824951171875, 0.004807472229003906, 0.0063381195068359375, 0.007868766784667969, 0.0093994140625, 0.010930061340332031, 0.012460708618164062, 0.013991355895996094, 0.015522003173828125, 0.017052650451660156, 0.018583297729492188, 0.02011394500732422, 0.02164459228515625, 0.02317523956298828, 0.024705886840820312, 0.026236534118652344, 0.027767181396484375, 0.029297828674316406, 0.030828475952148438, 0.03235912322998047, 0.0338897705078125, 0.03542041778564453, 0.03695106506347656, 0.038481712341308594, 0.040012359619140625, 0.041543006896972656, 0.04307365417480469, 0.04460430145263672, 0.04613494873046875, 0.04766559600830078, 0.04919624328613281, 0.050726890563964844, 0.052257537841796875, 0.053788185119628906, 0.05531883239746094, 0.05684947967529297, 0.058380126953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 9.0, 18.0, 20.0, 42.0, 152.0, 334.0, 206.0, 78.0, 29.0, 22.0, 16.0, 13.0, 14.0, 5.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271453857421875, -0.026406288146972656, -0.025667190551757812, -0.02492809295654297, -0.024188995361328125, -0.02344989776611328, -0.022710800170898438, -0.021971702575683594, -0.02123260498046875, -0.020493507385253906, -0.019754409790039062, -0.01901531219482422, -0.018276214599609375, -0.01753711700439453, -0.016798019409179688, -0.016058921813964844, -0.01531982421875, -0.014580726623535156, -0.013841629028320312, -0.013102531433105469, -0.012363433837890625, -0.011624336242675781, -0.010885238647460938, -0.010146141052246094, -0.00940704345703125, -0.008667945861816406, -0.007928848266601562, -0.007189750671386719, -0.006450653076171875, -0.005711555480957031, -0.0049724578857421875, -0.004233360290527344, -0.0034942626953125, -0.0027551651000976562, -0.0020160675048828125, -0.0012769699096679688, -0.000537872314453125, 0.00020122528076171875, 0.0009403228759765625, 0.0016794204711914062, 0.00241851806640625, 0.0031576156616210938, 0.0038967132568359375, 0.004635810852050781, 0.005374908447265625, 0.006114006042480469, 0.0068531036376953125, 0.007592201232910156, 0.008331298828125, 0.009070396423339844, 0.009809494018554688, 0.010548591613769531, 0.011287689208984375, 0.012026786804199219, 0.012765884399414062, 0.013504981994628906, 0.01424407958984375, 0.014983177185058594, 0.015722274780273438, 0.01646137237548828, 0.017200469970703125, 0.01793956756591797, 0.018678665161132812, 0.019417762756347656, 0.0201568603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 26.0, 59.0, 207.0, 542.0, 93.0, 22.0, 12.0, 5.0, 4.0, 0.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.38651442527770996, -0.3774142563343048, -0.36831408739089966, -0.3592139184474945, -0.35011374950408936, -0.3410135805606842, -0.33191341161727905, -0.3228132426738739, -0.31371307373046875, -0.3046129047870636, -0.29551273584365845, -0.2864125669002533, -0.27731239795684814, -0.268212229013443, -0.25911206007003784, -0.2500118911266327, -0.24091173708438873, -0.23181156814098358, -0.22271139919757843, -0.21361123025417328, -0.20451106131076813, -0.19541089236736298, -0.18631073832511902, -0.17721056938171387, -0.16811040043830872, -0.15901023149490356, -0.1499100625514984, -0.14080989360809326, -0.1317097246646881, -0.12260955572128296, -0.1135093942284584, -0.10440922528505325, -0.0953090488910675, -0.08620887994766235, -0.0771087110042572, -0.06800854206085205, -0.0589083768427372, -0.049808207899332047, -0.040708042681217194, -0.03160787373781204, -0.02250770479440689, -0.013407536782324314, -0.004307368770241737, 0.004792798310518265, 0.013892967253923416, 0.022993136197328568, 0.03209330141544342, 0.04119347035884857, 0.05029363930225372, 0.059393808245658875, 0.06849397718906403, 0.07759414613246918, 0.08669431507587433, 0.09579448401927948, 0.10489464551210403, 0.11399481445550919, 0.12309498339891434, 0.1321951448917389, 0.14129531383514404, 0.1503954827785492, 0.15949565172195435, 0.1685958206653595, 0.17769598960876465, 0.1867961585521698, 0.19589632749557495]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 2.0, 4.0, 7.0, 9.0, 7.0, 17.0, 21.0, 33.0, 59.0, 73.0, 107.0, 105.0, 139.0, 118.0, 65.0, 72.0, 20.0, 38.0, 17.0, 11.0, 9.0, 12.0, 4.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12486505508422852, -0.12102162837982178, -0.11717820912599564, -0.1133347824215889, -0.10949136316776276, -0.10564793646335602, -0.10180450975894928, -0.09796108305454254, -0.0941176638007164, -0.09027423709630966, -0.08643081784248352, -0.08258739113807678, -0.07874396443367004, -0.0749005451798439, -0.07105711847543716, -0.06721369922161102, -0.06337027251720428, -0.059526849538087845, -0.055683426558971405, -0.05183999985456467, -0.04799657687544823, -0.04415315389633179, -0.04030972719192505, -0.03646630421280861, -0.03262288123369217, -0.02877945825457573, -0.02493603341281414, -0.02109260857105255, -0.01724918559193611, -0.013405762612819672, -0.009562337771058083, -0.0057189129292964935, -0.0018754899501800537, 0.0019679339602589607, 0.005811357870697975, 0.00965478178113699, 0.013498205691576004, 0.017341628670692444, 0.021185053512454033, 0.025028478354215622, 0.028871901333332062, 0.0327153243124485, 0.03655874729156494, 0.04040217399597168, 0.04424559697508812, 0.04808901995420456, 0.0519324466586113, 0.05577586963772774, 0.05961929261684418, 0.06346271932125092, 0.06730613857507706, 0.0711495652794838, 0.07499298453330994, 0.07883641123771667, 0.08267983794212341, 0.08652326464653015, 0.09036668390035629, 0.09421011060476303, 0.09805352985858917, 0.10189695656299591, 0.10574038326740265, 0.10958380252122879, 0.11342722922563553, 0.11727064847946167, 0.12111407518386841]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 9.0, 10.0, 17.0, 19.0, 21.0, 26.0, 47.0, 169.0, 2220.0, 4129894.0, 60744.0, 791.0, 112.0, 47.0, 37.0, 17.0, 18.0, 21.0, 8.0, 3.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.962127685546875, -1.88909912109375, -1.816070556640625, -1.7430419921875, -1.670013427734375, -1.59698486328125, -1.523956298828125, -1.450927734375, -1.377899169921875, -1.30487060546875, -1.231842041015625, -1.1588134765625, -1.085784912109375, -1.01275634765625, -0.939727783203125, -0.86669921875, -0.793670654296875, -0.72064208984375, -0.647613525390625, -0.5745849609375, -0.501556396484375, -0.42852783203125, -0.355499267578125, -0.282470703125, -0.209442138671875, -0.13641357421875, -0.063385009765625, 0.0096435546875, 0.082672119140625, 0.15570068359375, 0.228729248046875, 0.3017578125, 0.374786376953125, 0.44781494140625, 0.520843505859375, 0.5938720703125, 0.666900634765625, 0.73992919921875, 0.812957763671875, 0.885986328125, 0.959014892578125, 1.03204345703125, 1.105072021484375, 1.1781005859375, 1.251129150390625, 1.32415771484375, 1.397186279296875, 1.47021484375, 1.543243408203125, 1.61627197265625, 1.689300537109375, 1.7623291015625, 1.835357666015625, 1.90838623046875, 1.981414794921875, 2.054443359375, 2.127471923828125, 2.20050048828125, 2.273529052734375, 2.3465576171875, 2.419586181640625, 2.49261474609375, 2.565643310546875, 2.638671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 0.0, 6.0, 6.0, 7.0, 5.0, 4.0, 15.0, 17.0, 30.0, 54.0, 124.0, 178.0, 217.0, 109.0, 71.0, 46.0, 18.0, 17.0, 5.0, 7.0, 7.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010204315185546875, -0.0009855031967163086, -0.0009505748748779297, -0.0009156465530395508, -0.0008807182312011719, -0.000845789909362793, -0.0008108615875244141, -0.0007759332656860352, -0.0007410049438476562, -0.0007060766220092773, -0.0006711483001708984, -0.0006362199783325195, -0.0006012916564941406, -0.0005663633346557617, -0.0005314350128173828, -0.0004965066909790039, -0.000461578369140625, -0.0004266500473022461, -0.0003917217254638672, -0.0003567934036254883, -0.0003218650817871094, -0.00028693675994873047, -0.00025200843811035156, -0.00021708011627197266, -0.00018215179443359375, -0.00014722347259521484, -0.00011229515075683594, -7.736682891845703e-05, -4.2438507080078125e-05, -7.510185241699219e-06, 2.7418136596679688e-05, 6.23464584350586e-05, 9.72747802734375e-05, 0.0001322031021118164, 0.0001671314239501953, 0.00020205974578857422, 0.00023698806762695312, 0.00027191638946533203, 0.00030684471130371094, 0.00034177303314208984, 0.00037670135498046875, 0.00041162967681884766, 0.00044655799865722656, 0.00048148632049560547, 0.0005164146423339844, 0.0005513429641723633, 0.0005862712860107422, 0.0006211996078491211, 0.0006561279296875, 0.0006910562515258789, 0.0007259845733642578, 0.0007609128952026367, 0.0007958412170410156, 0.0008307695388793945, 0.0008656978607177734, 0.0009006261825561523, 0.0009355545043945312, 0.0009704828262329102, 0.001005411148071289, 0.001040339469909668, 0.0010752677917480469, 0.0011101961135864258, 0.0011451244354248047, 0.0011800527572631836, 0.0012149810791015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 8.0, 16.0, 21.0, 22.0, 29.0, 42.0, 54.0, 72.0, 85.0, 133.0, 201.0, 2060.0, 4170460.0, 19588.0, 565.0, 182.0, 139.0, 124.0, 86.0, 78.0, 63.0, 55.0, 46.0, 36.0, 28.0, 19.0, 17.0, 9.0, 4.0, 9.0, 5.0, 3.0, 1.0, 6.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3271484375, -0.31390380859375, -0.3006591796875, -0.28741455078125, -0.274169921875, -0.26092529296875, -0.2476806640625, -0.23443603515625, -0.22119140625, -0.20794677734375, -0.1947021484375, -0.18145751953125, -0.168212890625, -0.15496826171875, -0.1417236328125, -0.12847900390625, -0.115234375, -0.10198974609375, -0.0887451171875, -0.07550048828125, -0.062255859375, -0.04901123046875, -0.0357666015625, -0.02252197265625, -0.00927734375, 0.00396728515625, 0.0172119140625, 0.03045654296875, 0.043701171875, 0.05694580078125, 0.0701904296875, 0.08343505859375, 0.0966796875, 0.10992431640625, 0.1231689453125, 0.13641357421875, 0.149658203125, 0.16290283203125, 0.1761474609375, 0.18939208984375, 0.20263671875, 0.21588134765625, 0.2291259765625, 0.24237060546875, 0.255615234375, 0.26885986328125, 0.2821044921875, 0.29534912109375, 0.30859375, 0.32183837890625, 0.3350830078125, 0.34832763671875, 0.361572265625, 0.37481689453125, 0.3880615234375, 0.40130615234375, 0.41455078125, 0.42779541015625, 0.4410400390625, 0.45428466796875, 0.467529296875, 0.48077392578125, 0.4940185546875, 0.50726318359375, 0.5205078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 13.0, 19.0, 28.0, 30.0, 45.0, 72.0, 81.0, 106.0, 150.0, 220.0, 289.0, 1346.0, 479.0, 242.0, 168.0, 143.0, 118.0, 97.0, 78.0, 68.0, 59.0, 47.0, 37.0, 29.0, 25.0, 12.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002529144287109375, -0.0024268031120300293, -0.0023244619369506836, -0.002222120761871338, -0.002119779586791992, -0.0020174384117126465, -0.0019150972366333008, -0.001812756061553955, -0.0017104148864746094, -0.0016080737113952637, -0.001505732536315918, -0.0014033913612365723, -0.0013010501861572266, -0.0011987090110778809, -0.0010963678359985352, -0.0009940266609191895, -0.0008916854858398438, -0.000789344310760498, -0.0006870031356811523, -0.0005846619606018066, -0.00048232078552246094, -0.00037997961044311523, -0.00027763843536376953, -0.00017529726028442383, -7.295608520507812e-05, 2.9385089874267578e-05, 0.00013172626495361328, 0.00023406744003295898, 0.0003364086151123047, 0.0004387497901916504, 0.0005410909652709961, 0.0006434321403503418, 0.0007457733154296875, 0.0008481144905090332, 0.0009504556655883789, 0.0010527968406677246, 0.0011551380157470703, 0.001257479190826416, 0.0013598203659057617, 0.0014621615409851074, 0.0015645027160644531, 0.0016668438911437988, 0.0017691850662231445, 0.0018715262413024902, 0.001973867416381836, 0.0020762085914611816, 0.0021785497665405273, 0.002280890941619873, 0.0023832321166992188, 0.0024855732917785645, 0.00258791446685791, 0.002690255641937256, 0.0027925968170166016, 0.0028949379920959473, 0.002997279167175293, 0.0030996203422546387, 0.0032019615173339844, 0.00330430269241333, 0.0034066438674926758, 0.0035089850425720215, 0.003611326217651367, 0.003713667392730713, 0.0038160085678100586, 0.003918349742889404, 0.00402069091796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 734.0, 249.0, 25.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09924425184726715, -0.06409721076488495, -0.028950177133083344, 0.006196856498718262, 0.041343897581100464, 0.07649093866348267, 0.11163796484470367, 0.14678500592708588, 0.18193204700946808, 0.21707908809185028, 0.2522261142730713, 0.2873731553554535, 0.3225201964378357, 0.3576672375202179, 0.3928142786026001, 0.4279612898826599, 0.4631083607673645, 0.4982554018497467, 0.5334024429321289, 0.5685494542121887, 0.6036965250968933, 0.6388435363769531, 0.6739906072616577, 0.7091376185417175, 0.7442846298217773, 0.7794316411018372, 0.8145787119865417, 0.8497257232666016, 0.8848727941513062, 0.920019805431366, 0.9551668167114258, 0.9903138875961304, 1.0254608392715454, 1.06060791015625, 1.095754861831665, 1.1309019327163696, 1.1660490036010742, 1.2011960744857788, 1.2363430261611938, 1.2714900970458984, 1.306637167930603, 1.3417842388153076, 1.3769311904907227, 1.4120782613754272, 1.4472253322601318, 1.4823724031448364, 1.5175193548202515, 1.552666425704956, 1.587813377380371, 1.6229604482650757, 1.6581073999404907, 1.6932544708251953, 1.7284015417099, 1.7635486125946045, 1.7986955642700195, 1.8338426351547241, 1.8689897060394287, 1.9041367769241333, 1.9392837285995483, 1.974430799484253, 2.009577751159668, 2.044724941253662, 2.079871892929077, 2.115018844604492, 2.1501660346984863]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 11.0, 12.0, 16.0, 14.0, 36.0, 46.0, 65.0, 84.0, 106.0, 100.0, 121.0, 92.0, 82.0, 69.0, 56.0, 39.0, 17.0, 11.0, 5.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771322250366211, -0.07387250661849976, -0.07061278820037842, -0.06735306978225708, -0.06409335136413574, -0.060833629220724106, -0.05757390707731247, -0.05431418865919113, -0.051054470241069794, -0.047794751822948456, -0.04453503340482712, -0.04127531126141548, -0.038015592843294144, -0.034755874425172806, -0.03149615228176117, -0.02823643386363983, -0.024976715445518494, -0.021716997027397156, -0.01845727674663067, -0.015197557397186756, -0.011937838047742844, -0.008678119629621506, -0.005418399348855019, -0.0021586790680885315, 0.0011010393500328064, 0.004360758699476719, 0.007620478048920631, 0.010880197398364544, 0.014139916747808456, 0.017399635165929794, 0.02065935544669628, 0.02391907572746277, 0.027178794145584106, 0.030438512563705444, 0.03369823098182678, 0.03695795312523842, 0.040217671543359756, 0.043477389961481094, 0.04673711210489273, 0.04999683052301407, 0.053256548941135406, 0.056516267359256744, 0.05977598577737808, 0.06303570419549942, 0.06629543006420135, 0.06955514848232269, 0.07281486690044403, 0.07607458531856537, 0.0793343037366867, 0.08259402215480804, 0.08585374057292938, 0.08911345899105072, 0.09237317740917206, 0.0956328958272934, 0.09889262169599533, 0.10215234011411667, 0.105412058532238, 0.10867177695035934, 0.11193149536848068, 0.11519121378660202, 0.11845093965530396, 0.12171065807342529, 0.12497037649154663, 0.12823009490966797, 0.1314898133277893]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 9.0, 8.0, 13.0, 14.0, 27.0, 28.0, 28.0, 52.0, 76.0, 92.0, 107.0, 196.0, 235.0, 315.0, 458.0, 673.0, 990.0, 1485.0, 2446.0, 4091.0, 7072.0, 14600.0, 48956.0, 818299.0, 106689.0, 19515.0, 8881.0, 4802.0, 2794.0, 1767.0, 1146.0, 750.0, 505.0, 413.0, 253.0, 192.0, 155.0, 113.0, 67.0, 70.0, 51.0, 31.0, 18.0, 17.0, 22.0, 10.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0219268798828125, -0.0212554931640625, -0.0205841064453125, -0.0199127197265625, -0.0192413330078125, -0.0185699462890625, -0.0178985595703125, -0.0172271728515625, -0.0165557861328125, -0.0158843994140625, -0.0152130126953125, -0.0145416259765625, -0.0138702392578125, -0.0131988525390625, -0.0125274658203125, -0.0118560791015625, -0.0111846923828125, -0.0105133056640625, -0.0098419189453125, -0.0091705322265625, -0.0084991455078125, -0.0078277587890625, -0.0071563720703125, -0.0064849853515625, -0.0058135986328125, -0.0051422119140625, -0.0044708251953125, -0.0037994384765625, -0.0031280517578125, -0.0024566650390625, -0.0017852783203125, -0.0011138916015625, -0.0004425048828125, 0.0002288818359375, 0.0009002685546875, 0.0015716552734375, 0.0022430419921875, 0.0029144287109375, 0.0035858154296875, 0.0042572021484375, 0.0049285888671875, 0.0055999755859375, 0.0062713623046875, 0.0069427490234375, 0.0076141357421875, 0.0082855224609375, 0.0089569091796875, 0.0096282958984375, 0.0102996826171875, 0.0109710693359375, 0.0116424560546875, 0.0123138427734375, 0.0129852294921875, 0.0136566162109375, 0.0143280029296875, 0.0149993896484375, 0.0156707763671875, 0.0163421630859375, 0.0170135498046875, 0.0176849365234375, 0.0183563232421875, 0.0190277099609375, 0.0196990966796875, 0.0203704833984375, 0.0210418701171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 3.0, 5.0, 7.0, 8.0, 8.0, 8.0, 11.0, 18.0, 33.0, 67.0, 130.0, 213.0, 200.0, 114.0, 55.0, 25.0, 11.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011262893676757812, -0.0010872185230255127, -0.0010481476783752441, -0.0010090768337249756, -0.000970005989074707, -0.0009309351444244385, -0.0008918642997741699, -0.0008527934551239014, -0.0008137226104736328, -0.0007746517658233643, -0.0007355809211730957, -0.0006965100765228271, -0.0006574392318725586, -0.00061836838722229, -0.0005792975425720215, -0.0005402266979217529, -0.0005011558532714844, -0.0004620850086212158, -0.00042301416397094727, -0.0003839433193206787, -0.00034487247467041016, -0.0003058016300201416, -0.00026673078536987305, -0.0002276599407196045, -0.00018858909606933594, -0.00014951825141906738, -0.00011044740676879883, -7.137656211853027e-05, -3.230571746826172e-05, 6.765127182006836e-06, 4.583597183227539e-05, 8.490681648254395e-05, 0.0001239776611328125, 0.00016304850578308105, 0.0002021193504333496, 0.00024119019508361816, 0.0002802610397338867, 0.0003193318843841553, 0.00035840272903442383, 0.0003974735736846924, 0.00043654441833496094, 0.0004756152629852295, 0.000514686107635498, 0.0005537569522857666, 0.0005928277969360352, 0.0006318986415863037, 0.0006709694862365723, 0.0007100403308868408, 0.0007491111755371094, 0.0007881820201873779, 0.0008272528648376465, 0.000866323709487915, 0.0009053945541381836, 0.0009444653987884521, 0.0009835362434387207, 0.0010226070880889893, 0.0010616779327392578, 0.0011007487773895264, 0.001139819622039795, 0.0011788904666900635, 0.001217961311340332, 0.0012570321559906006, 0.0012961030006408691, 0.0013351738452911377, 0.0013742446899414062]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 16.0, 16.0, 16.0, 11.0, 13.0, 23.0, 24.0, 30.0, 35.0, 39.0, 40.0, 122.0, 627.0, 4079.0, 196423.0, 838584.0, 7055.0, 855.0, 176.0, 59.0, 34.0, 33.0, 25.0, 20.0, 17.0, 24.0, 11.0, 17.0, 13.0, 8.0, 12.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.05023193359375, -0.04856395721435547, -0.04689598083496094, -0.045228004455566406, -0.043560028076171875, -0.041892051696777344, -0.04022407531738281, -0.03855609893798828, -0.03688812255859375, -0.03522014617919922, -0.03355216979980469, -0.031884193420410156, -0.030216217041015625, -0.028548240661621094, -0.026880264282226562, -0.02521228790283203, -0.0235443115234375, -0.02187633514404297, -0.020208358764648438, -0.018540382385253906, -0.016872406005859375, -0.015204429626464844, -0.013536453247070312, -0.011868476867675781, -0.01020050048828125, -0.008532524108886719, -0.0068645477294921875, -0.005196571350097656, -0.003528594970703125, -0.0018606185913085938, -0.0001926422119140625, 0.0014753341674804688, 0.003143310546875, 0.004811286926269531, 0.0064792633056640625, 0.008147239685058594, 0.009815216064453125, 0.011483192443847656, 0.013151168823242188, 0.014819145202636719, 0.01648712158203125, 0.01815509796142578, 0.019823074340820312, 0.021491050720214844, 0.023159027099609375, 0.024827003479003906, 0.026494979858398438, 0.02816295623779297, 0.0298309326171875, 0.03149890899658203, 0.03316688537597656, 0.034834861755371094, 0.036502838134765625, 0.038170814514160156, 0.03983879089355469, 0.04150676727294922, 0.04317474365234375, 0.04484272003173828, 0.04651069641113281, 0.048178672790527344, 0.049846649169921875, 0.051514625549316406, 0.05318260192871094, 0.05485057830810547, 0.0565185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 11.0, 11.0, 11.0, 18.0, 20.0, 15.0, 19.0, 28.0, 31.0, 24.0, 20.0, 27.0, 29.0, 31.0, 38.0, 36.0, 36.0, 35.0, 42.0, 32.0, 41.0, 38.0, 41.0, 49.0, 34.0, 30.0, 30.0, 22.0, 30.0, 22.0, 22.0, 18.0, 21.0, 4.0, 9.0, 9.0, 8.0, 13.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.004161834716796875, -0.004039019346237183, -0.00391620397567749, -0.003793388605117798, -0.0036705732345581055, -0.003547757863998413, -0.0034249424934387207, -0.0033021271228790283, -0.003179311752319336, -0.0030564963817596436, -0.002933681011199951, -0.002810865640640259, -0.0026880502700805664, -0.002565234899520874, -0.0024424195289611816, -0.0023196041584014893, -0.002196788787841797, -0.0020739734172821045, -0.0019511580467224121, -0.0018283426761627197, -0.0017055273056030273, -0.001582711935043335, -0.0014598965644836426, -0.0013370811939239502, -0.0012142658233642578, -0.0010914504528045654, -0.000968635082244873, -0.0008458197116851807, -0.0007230043411254883, -0.0006001889705657959, -0.0004773736000061035, -0.00035455822944641113, -0.00023174285888671875, -0.00010892748832702637, 1.3887882232666016e-05, 0.0001367032527923584, 0.0002595186233520508, 0.00038233399391174316, 0.0005051493644714355, 0.0006279647350311279, 0.0007507801055908203, 0.0008735954761505127, 0.000996410846710205, 0.0011192262172698975, 0.0012420415878295898, 0.0013648569583892822, 0.0014876723289489746, 0.001610487699508667, 0.0017333030700683594, 0.0018561184406280518, 0.001978933811187744, 0.0021017491817474365, 0.002224564552307129, 0.0023473799228668213, 0.0024701952934265137, 0.002593010663986206, 0.0027158260345458984, 0.002838641405105591, 0.002961456775665283, 0.0030842721462249756, 0.003207087516784668, 0.0033299028873443604, 0.0034527182579040527, 0.003575533628463745, 0.0036983489990234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 17.0, 30.0, 29.0, 59.0, 140.0, 508.0, 2911.0, 123239.0, 915083.0, 5427.0, 684.0, 215.0, 77.0, 35.0, 22.0, 10.0, 15.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038360595703125, -0.03694629669189453, -0.03553199768066406, -0.034117698669433594, -0.032703399658203125, -0.031289100646972656, -0.029874801635742188, -0.02846050262451172, -0.02704620361328125, -0.02563190460205078, -0.024217605590820312, -0.022803306579589844, -0.021389007568359375, -0.019974708557128906, -0.018560409545898438, -0.01714611053466797, -0.0157318115234375, -0.014317512512207031, -0.012903213500976562, -0.011488914489746094, -0.010074615478515625, -0.008660316467285156, -0.0072460174560546875, -0.005831718444824219, -0.00441741943359375, -0.0030031204223632812, -0.0015888214111328125, -0.00017452239990234375, 0.001239776611328125, 0.0026540756225585938, 0.0040683746337890625, 0.005482673645019531, 0.00689697265625, 0.008311271667480469, 0.009725570678710938, 0.011139869689941406, 0.012554168701171875, 0.013968467712402344, 0.015382766723632812, 0.01679706573486328, 0.01821136474609375, 0.01962566375732422, 0.021039962768554688, 0.022454261779785156, 0.023868560791015625, 0.025282859802246094, 0.026697158813476562, 0.02811145782470703, 0.0295257568359375, 0.03094005584716797, 0.03235435485839844, 0.033768653869628906, 0.035182952880859375, 0.036597251892089844, 0.03801155090332031, 0.03942584991455078, 0.04084014892578125, 0.04225444793701172, 0.04366874694824219, 0.045083045959472656, 0.046497344970703125, 0.047911643981933594, 0.04932594299316406, 0.05074024200439453, 0.052154541015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 4.0, 6.0, 3.0, 4.0, 10.0, 8.0, 18.0, 16.0, 27.0, 56.0, 158.0, 359.0, 162.0, 52.0, 18.0, 16.0, 11.0, 14.0, 8.0, 11.0, 2.0, 5.0, 3.0, 3.0, 5.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008607730269432068, -0.0008208006620407104, -0.0007808282971382141, -0.0007408559322357178, -0.0007008835673332214, -0.0006609112024307251, -0.0006209388375282288, -0.0005809664726257324, -0.0005409941077232361, -0.0005010217428207397, -0.0004610493779182434, -0.00042107701301574707, -0.00038110464811325073, -0.0003411322832107544, -0.00030115991830825806, -0.0002611875534057617, -0.00022121518850326538, -0.00018124282360076904, -0.0001412704586982727, -0.00010129809379577637, -6.132572889328003e-05, -2.135336399078369e-05, 1.8619000911712646e-05, 5.8591365814208984e-05, 9.856373071670532e-05, 0.00013853609561920166, 0.000178508460521698, 0.00021848082542419434, 0.0002584531903266907, 0.000298425555229187, 0.00033839792013168335, 0.0003783702850341797, 0.000418342649936676, 0.00045831501483917236, 0.0004982873797416687, 0.000538259744644165, 0.0005782321095466614, 0.0006182044744491577, 0.000658176839351654, 0.0006981492042541504, 0.0007381215691566467, 0.0007780939340591431, 0.0008180662989616394, 0.0008580386638641357, 0.0008980110287666321, 0.0009379833936691284, 0.0009779557585716248, 0.001017928123474121, 0.0010579004883766174, 0.0010978728532791138, 0.00113784521818161, 0.0011778175830841064, 0.0012177899479866028, 0.0012577623128890991, 0.0012977346777915955, 0.0013377070426940918, 0.0013776794075965881, 0.0014176517724990845, 0.0014576241374015808, 0.0014975965023040771, 0.0015375688672065735, 0.0015775412321090698, 0.0016175135970115662, 0.0016574859619140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 8.0, 13.0, 9.0, 23.0, 24.0, 51.0, 126.0, 473.0, 3267.0, 823387.0, 218284.0, 2304.0, 339.0, 117.0, 50.0, 27.0, 22.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031158447265625, -0.02973794937133789, -0.02831745147705078, -0.026896953582763672, -0.025476455688476562, -0.024055957794189453, -0.022635459899902344, -0.021214962005615234, -0.019794464111328125, -0.018373966217041016, -0.016953468322753906, -0.015532970428466797, -0.014112472534179688, -0.012691974639892578, -0.011271476745605469, -0.00985097885131836, -0.00843048095703125, -0.007009983062744141, -0.005589485168457031, -0.004168987274169922, -0.0027484893798828125, -0.0013279914855957031, 9.250640869140625e-05, 0.0015130043029785156, 0.002933502197265625, 0.004354000091552734, 0.005774497985839844, 0.007194995880126953, 0.008615493774414062, 0.010035991668701172, 0.011456489562988281, 0.01287698745727539, 0.0142974853515625, 0.01571798324584961, 0.01713848114013672, 0.018558979034423828, 0.019979476928710938, 0.021399974822998047, 0.022820472717285156, 0.024240970611572266, 0.025661468505859375, 0.027081966400146484, 0.028502464294433594, 0.029922962188720703, 0.03134346008300781, 0.03276395797729492, 0.03418445587158203, 0.03560495376586914, 0.03702545166015625, 0.03844594955444336, 0.03986644744873047, 0.04128694534301758, 0.04270744323730469, 0.0441279411315918, 0.045548439025878906, 0.046968936920166016, 0.048389434814453125, 0.049809932708740234, 0.051230430603027344, 0.05265092849731445, 0.05407142639160156, 0.05549192428588867, 0.05691242218017578, 0.05833292007446289, 0.05975341796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 16.0, 18.0, 18.0, 34.0, 36.0, 68.0, 71.0, 121.0, 164.0, 124.0, 102.0, 54.0, 37.0, 26.0, 22.0, 20.0, 8.0, 6.0, 9.0, 4.0, 2.0, 8.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004147708415985107, -0.003984808921813965, -0.0038219094276428223, -0.0036590099334716797, -0.003496110439300537, -0.0033332109451293945, -0.003170311450958252, -0.0030074119567871094, -0.002844512462615967, -0.0026816129684448242, -0.0025187134742736816, -0.002355813980102539, -0.0021929144859313965, -0.002030014991760254, -0.0018671154975891113, -0.0017042160034179688, -0.0015413165092468262, -0.0013784170150756836, -0.001215517520904541, -0.0010526180267333984, -0.0008897185325622559, -0.0007268190383911133, -0.0005639195442199707, -0.0004010200500488281, -0.00023812055587768555, -7.522106170654297e-05, 8.767843246459961e-05, 0.0002505779266357422, 0.00041347742080688477, 0.0005763769149780273, 0.0007392764091491699, 0.0009021759033203125, 0.001065075397491455, 0.0012279748916625977, 0.0013908743858337402, 0.0015537738800048828, 0.0017166733741760254, 0.001879572868347168, 0.0020424723625183105, 0.002205371856689453, 0.0023682713508605957, 0.0025311708450317383, 0.002694070339202881, 0.0028569698333740234, 0.003019869327545166, 0.0031827688217163086, 0.003345668315887451, 0.0035085678100585938, 0.0036714673042297363, 0.003834366798400879, 0.0039972662925720215, 0.004160165786743164, 0.004323065280914307, 0.004485964775085449, 0.004648864269256592, 0.004811763763427734, 0.004974663257598877, 0.0051375627517700195, 0.005300462245941162, 0.005463361740112305, 0.005626261234283447, 0.00578916072845459, 0.005952060222625732, 0.006114959716796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 10.0, 3.0, 7.0, 12.0, 37.0, 190.0, 404.0, 219.0, 64.0, 25.0, 11.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14002105593681335, -0.1365664303302765, -0.13311180472373962, -0.12965716421604156, -0.1262025386095047, -0.12274791300296783, -0.11929328739643097, -0.1158386617898941, -0.11238402873277664, -0.10892940312623978, -0.10547477006912231, -0.10202014446258545, -0.09856551885604858, -0.09511088579893112, -0.09165626019239426, -0.0882016271352768, -0.08474700152873993, -0.08129237592220306, -0.0778377428650856, -0.07438311725854874, -0.07092848420143127, -0.06747385859489441, -0.06401923298835754, -0.06056460365653038, -0.05710997432470322, -0.05365534499287605, -0.05020071566104889, -0.046746090054512024, -0.04329146072268486, -0.0398368313908577, -0.03638220578432083, -0.03292757645249367, -0.029472939670085907, -0.026018310338258743, -0.02256368286907673, -0.019109055399894714, -0.01565442606806755, -0.012199796736240387, -0.008745169267058372, -0.005290541797876358, -0.0018359124660491943, 0.0016187159344553947, 0.005073344334959984, 0.008527972735464573, 0.011982601135969162, 0.015437230467796326, 0.01889185793697834, 0.022346485406160355, 0.02580111473798752, 0.029255744069814682, 0.032710373401641846, 0.03616499900817871, 0.039619628340005875, 0.04307425767183304, 0.046528883278369904, 0.04998351261019707, 0.05343814194202423, 0.056892771273851395, 0.06034740060567856, 0.06380202621221542, 0.06725665926933289, 0.07071128487586975, 0.07416591048240662, 0.07762053608894348, 0.08107516914606094]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 11.0, 27.0, 25.0, 44.0, 45.0, 54.0, 57.0, 85.0, 69.0, 80.0, 76.0, 73.0, 57.0, 48.0, 36.0, 35.0, 28.0, 21.0, 20.0, 16.0, 5.0, 8.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04657745361328125, -0.0452071912586689, -0.04383692890405655, -0.0424666702747345, -0.04109640792012215, -0.039726145565509796, -0.038355886936187744, -0.036985624581575394, -0.03561536222696304, -0.03424509987235069, -0.03287483751773834, -0.03150457888841629, -0.03013431653380394, -0.02876405417919159, -0.027393793687224388, -0.026023533195257187, -0.024653270840644836, -0.023283008486032486, -0.021912747994065285, -0.020542487502098083, -0.019172225147485733, -0.017801962792873383, -0.01643170230090618, -0.015061440877616405, -0.01369117945432663, -0.012320918031036854, -0.010950656607747078, -0.009580395184457302, -0.008210133761167526, -0.00683987233787775, -0.0054696109145879745, -0.004099349491298199, -0.002729088068008423, -0.001358826644718647, 1.1434778571128845e-05, 0.0013816962018609047, 0.0027519576251506805, 0.004122219048440456, 0.005492480471730232, 0.006862741895020008, 0.008233003318309784, 0.00960326474159956, 0.010973526164889336, 0.012343787588179111, 0.013714049011468887, 0.015084310434758663, 0.01645457185804844, 0.01782483235001564, 0.01919509470462799, 0.02056535705924034, 0.021935617551207542, 0.023305878043174744, 0.024676140397787094, 0.026046402752399445, 0.027416663244366646, 0.028786923736333847, 0.030157186090946198, 0.03152744844555855, 0.0328977108001709, 0.03426796942949295, 0.0356382317841053, 0.03700849413871765, 0.0383787527680397, 0.039749015122652054, 0.041119277477264404]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 0.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 6.0, 14.0, 13.0, 7.0, 8.0, 16.0, 14.0, 18.0, 32.0, 64.0, 322.0, 4193249.0, 263.0, 54.0, 22.0, 17.0, 33.0, 12.0, 20.0, 16.0, 8.0, 8.0, 14.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.8828125, -0.8495025634765625, -0.816192626953125, -0.7828826904296875, -0.74957275390625, -0.7162628173828125, -0.682952880859375, -0.6496429443359375, -0.6163330078125, -0.5830230712890625, -0.549713134765625, -0.5164031982421875, -0.48309326171875, -0.4497833251953125, -0.416473388671875, -0.3831634521484375, -0.349853515625, -0.3165435791015625, -0.283233642578125, -0.2499237060546875, -0.21661376953125, -0.1833038330078125, -0.149993896484375, -0.1166839599609375, -0.0833740234375, -0.0500640869140625, -0.016754150390625, 0.0165557861328125, 0.04986572265625, 0.0831756591796875, 0.116485595703125, 0.1497955322265625, 0.18310546875, 0.2164154052734375, 0.249725341796875, 0.2830352783203125, 0.31634521484375, 0.3496551513671875, 0.382965087890625, 0.4162750244140625, 0.4495849609375, 0.4828948974609375, 0.516204833984375, 0.5495147705078125, 0.58282470703125, 0.6161346435546875, 0.649444580078125, 0.6827545166015625, 0.716064453125, 0.7493743896484375, 0.782684326171875, 0.8159942626953125, 0.84930419921875, 0.8826141357421875, 0.915924072265625, 0.9492340087890625, 0.9825439453125, 1.0158538818359375, 1.049163818359375, 1.0824737548828125, 1.11578369140625, 1.1490936279296875, 1.182403564453125, 1.2157135009765625, 1.2490234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 13.0, 22.0, 25.0, 33.0, 83.0, 122.0, 171.0, 148.0, 107.0, 88.0, 43.0, 26.0, 12.0, 9.0, 7.0, 6.0, 12.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00107574462890625, -0.0010420680046081543, -0.0010083913803100586, -0.0009747147560119629, -0.0009410381317138672, -0.0009073615074157715, -0.0008736848831176758, -0.0008400082588195801, -0.0008063316345214844, -0.0007726550102233887, -0.000738978385925293, -0.0007053017616271973, -0.0006716251373291016, -0.0006379485130310059, -0.0006042718887329102, -0.0005705952644348145, -0.0005369186401367188, -0.000503242015838623, -0.00046956539154052734, -0.00043588876724243164, -0.00040221214294433594, -0.00036853551864624023, -0.00033485889434814453, -0.00030118227005004883, -0.0002675056457519531, -0.00023382902145385742, -0.00020015239715576172, -0.00016647577285766602, -0.0001327991485595703, -9.912252426147461e-05, -6.54458999633789e-05, -3.17692756652832e-05, 1.9073486328125e-06, 3.55839729309082e-05, 6.92605972290039e-05, 0.00010293722152709961, 0.0001366138458251953, 0.00017029047012329102, 0.00020396709442138672, 0.00023764371871948242, 0.0002713203430175781, 0.00030499696731567383, 0.00033867359161376953, 0.00037235021591186523, 0.00040602684020996094, 0.00043970346450805664, 0.00047338008880615234, 0.000507056713104248, 0.0005407333374023438, 0.0005744099617004395, 0.0006080865859985352, 0.0006417632102966309, 0.0006754398345947266, 0.0007091164588928223, 0.000742793083190918, 0.0007764697074890137, 0.0008101463317871094, 0.0008438229560852051, 0.0008774995803833008, 0.0009111762046813965, 0.0009448528289794922, 0.0009785294532775879, 0.0010122060775756836, 0.0010458827018737793, 0.001079559326171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 17.0, 39.0, 138.0, 23876.0, 4170048.0, 122.0, 24.0, 7.0, 7.0, 3.0, 1.0, 4.0], "bins": [-1.498046875, -1.4713134765625, -1.444580078125, -1.4178466796875, -1.39111328125, -1.3643798828125, -1.337646484375, -1.3109130859375, -1.2841796875, -1.2574462890625, -1.230712890625, -1.2039794921875, -1.17724609375, -1.1505126953125, -1.123779296875, -1.0970458984375, -1.0703125, -1.0435791015625, -1.016845703125, -0.9901123046875, -0.96337890625, -0.9366455078125, -0.909912109375, -0.8831787109375, -0.8564453125, -0.8297119140625, -0.802978515625, -0.7762451171875, -0.74951171875, -0.7227783203125, -0.696044921875, -0.6693115234375, -0.642578125, -0.6158447265625, -0.589111328125, -0.5623779296875, -0.53564453125, -0.5089111328125, -0.482177734375, -0.4554443359375, -0.4287109375, -0.4019775390625, -0.375244140625, -0.3485107421875, -0.32177734375, -0.2950439453125, -0.268310546875, -0.2415771484375, -0.21484375, -0.1881103515625, -0.161376953125, -0.1346435546875, -0.10791015625, -0.0811767578125, -0.054443359375, -0.0277099609375, -0.0009765625, 0.0257568359375, 0.052490234375, 0.0792236328125, 0.10595703125, 0.1326904296875, 0.159423828125, 0.1861572265625, 0.212890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 32.0, 108.0, 412.0, 2929.0, 461.0, 83.0, 20.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0138397216796875, -0.013581395149230957, -0.013323068618774414, -0.013064742088317871, -0.012806415557861328, -0.012548089027404785, -0.012289762496948242, -0.0120314359664917, -0.011773109436035156, -0.011514782905578613, -0.01125645637512207, -0.010998129844665527, -0.010739803314208984, -0.010481476783752441, -0.010223150253295898, -0.009964823722839355, -0.009706497192382812, -0.00944817066192627, -0.009189844131469727, -0.008931517601013184, -0.00867319107055664, -0.008414864540100098, -0.008156538009643555, -0.007898211479187012, -0.007639884948730469, -0.007381558418273926, -0.007123231887817383, -0.00686490535736084, -0.006606578826904297, -0.006348252296447754, -0.006089925765991211, -0.005831599235534668, -0.005573272705078125, -0.005314946174621582, -0.005056619644165039, -0.004798293113708496, -0.004539966583251953, -0.00428164005279541, -0.004023313522338867, -0.0037649869918823242, -0.0035066604614257812, -0.0032483339309692383, -0.0029900074005126953, -0.0027316808700561523, -0.0024733543395996094, -0.0022150278091430664, -0.0019567012786865234, -0.0016983747482299805, -0.0014400482177734375, -0.0011817216873168945, -0.0009233951568603516, -0.0006650686264038086, -0.0004067420959472656, -0.00014841556549072266, 0.00010991096496582031, 0.0003682374954223633, 0.0006265640258789062, 0.0008848905563354492, 0.0011432170867919922, 0.0014015436172485352, 0.0016598701477050781, 0.001918196678161621, 0.002176523208618164, 0.002434849739074707, 0.00269317626953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1002.0, 18.0, 1.0], "bins": [-3.636082410812378, -3.577230930328369, -3.5183792114257812, -3.4595277309417725, -3.4006762504577637, -3.341824531555176, -3.282973051071167, -3.224121332168579, -3.1652698516845703, -3.1064183712005615, -3.0475666522979736, -2.988715171813965, -2.929863452911377, -2.871011972427368, -2.8121604919433594, -2.7533087730407715, -2.6944572925567627, -2.635605812072754, -2.576754093170166, -2.5179026126861572, -2.4590511322021484, -2.4001994132995605, -2.3413479328155518, -2.282496213912964, -2.223644733428955, -2.1647932529449463, -2.1059415340423584, -2.0470900535583496, -1.9882384538650513, -1.929386854171753, -1.8705353736877441, -1.8116837739944458, -1.7528321743011475, -1.6939805746078491, -1.6351289749145508, -1.576277494430542, -1.5174258947372437, -1.4585742950439453, -1.3997228145599365, -1.3408712148666382, -1.2820196151733398, -1.2231680154800415, -1.1643164157867432, -1.1054649353027344, -1.046613335609436, -0.9877617359161377, -0.9289101958274841, -0.8700586557388306, -0.811207115650177, -0.7523555755615234, -0.6935039758682251, -0.6346523761749268, -0.5758008360862732, -0.5169492959976196, -0.4580976963043213, -0.39924612641334534, -0.3403945565223694, -0.28154298663139343, -0.22269141674041748, -0.16383984684944153, -0.10498827695846558, -0.046136707067489624, 0.012714862823486328, 0.07156643271446228, 0.13041800260543823]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 11.0, 25.0, 66.0, 151.0, 254.0, 238.0, 161.0, 69.0, 28.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28930211067199707, -0.28349003195762634, -0.2776779532432556, -0.2718658745288849, -0.26605379581451416, -0.26024168729782104, -0.2544296383857727, -0.24861754477024078, -0.24280545115470886, -0.23699337244033813, -0.2311812937259674, -0.22536921501159668, -0.21955712139606476, -0.21374504268169403, -0.2079329639673233, -0.20212088525295258, -0.19630880653858185, -0.19049672782421112, -0.1846846491098404, -0.17887255549430847, -0.17306047677993774, -0.16724839806556702, -0.1614363193511963, -0.15562424063682556, -0.14981216192245483, -0.1440000832080841, -0.13818800449371338, -0.13237592577934265, -0.12656383216381073, -0.12075175344944, -0.11493967473506927, -0.10912759602069855, -0.10331550240516663, -0.0975034236907959, -0.09169133752584457, -0.08587925881147385, -0.08006717264652252, -0.0742550939321518, -0.06844301521778107, -0.06263093650341034, -0.056818850338459015, -0.05100676789879799, -0.04519468545913696, -0.039382606744766235, -0.03357052430510521, -0.027758441865444183, -0.021946363151073456, -0.01613428071141243, -0.010322198271751404, -0.004510116763412952, 0.001301964744925499, 0.007114045321941376, 0.012926127761602402, 0.018738210201263428, 0.024550288915634155, 0.03036237135529518, 0.03617445379495621, 0.04198653623461723, 0.04779861867427826, 0.05361069738864899, 0.05942277982831001, 0.06523486226797104, 0.07104694098234177, 0.07685902714729309, 0.08267110586166382]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 14.0, 18.0, 14.0, 21.0, 26.0, 39.0, 43.0, 39.0, 36.0, 59.0, 44.0, 73.0, 3148.0, 1043755.0, 780.0, 58.0, 55.0, 43.0, 49.0, 44.0, 30.0, 35.0, 16.0, 15.0, 17.0, 14.0, 9.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26618194580078125, -0.2577056884765625, -0.24922943115234375, -0.240753173828125, -0.23227691650390625, -0.2238006591796875, -0.21532440185546875, -0.20684814453125, -0.19837188720703125, -0.1898956298828125, -0.18141937255859375, -0.172943115234375, -0.16446685791015625, -0.1559906005859375, -0.14751434326171875, -0.1390380859375, -0.13056182861328125, -0.1220855712890625, -0.11360931396484375, -0.105133056640625, -0.09665679931640625, -0.0881805419921875, -0.07970428466796875, -0.07122802734375, -0.06275177001953125, -0.0542755126953125, -0.04579925537109375, -0.037322998046875, -0.02884674072265625, -0.0203704833984375, -0.01189422607421875, -0.00341796875, 0.00505828857421875, 0.0135345458984375, 0.02201080322265625, 0.030487060546875, 0.03896331787109375, 0.0474395751953125, 0.05591583251953125, 0.06439208984375, 0.07286834716796875, 0.0813446044921875, 0.08982086181640625, 0.098297119140625, 0.10677337646484375, 0.1152496337890625, 0.12372589111328125, 0.1322021484375, 0.14067840576171875, 0.1491546630859375, 0.15763092041015625, 0.166107177734375, 0.17458343505859375, 0.1830596923828125, 0.19153594970703125, 0.20001220703125, 0.20848846435546875, 0.2169647216796875, 0.22544097900390625, 0.233917236328125, 0.24239349365234375, 0.2508697509765625, 0.25934600830078125, 0.267822265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 118.0, 565.0, 306.0, 24.0, 3.0], "bins": [-0.07366943359375, -0.07245504856109619, -0.07124066352844238, -0.07002627849578857, -0.06881189346313477, -0.06759750843048096, -0.06638312339782715, -0.06516873836517334, -0.06395435333251953, -0.06273996829986572, -0.061525583267211914, -0.060311198234558105, -0.0590968132019043, -0.05788242816925049, -0.05666804313659668, -0.05545365810394287, -0.05423927307128906, -0.053024888038635254, -0.051810503005981445, -0.05059611797332764, -0.04938173294067383, -0.04816734790802002, -0.04695296287536621, -0.0457385778427124, -0.044524192810058594, -0.043309807777404785, -0.04209542274475098, -0.04088103771209717, -0.03966665267944336, -0.03845226764678955, -0.03723788261413574, -0.036023497581481934, -0.034809112548828125, -0.033594727516174316, -0.03238034248352051, -0.0311659574508667, -0.02995157241821289, -0.028737187385559082, -0.027522802352905273, -0.026308417320251465, -0.025094032287597656, -0.023879647254943848, -0.02266526222229004, -0.02145087718963623, -0.020236492156982422, -0.019022107124328613, -0.017807722091674805, -0.016593337059020996, -0.015378952026367188, -0.014164566993713379, -0.01295018196105957, -0.011735796928405762, -0.010521411895751953, -0.009307026863098145, -0.008092641830444336, -0.006878256797790527, -0.005663871765136719, -0.00444948673248291, -0.0032351016998291016, -0.002020716667175293, -0.0008063316345214844, 0.0004080533981323242, 0.0016224384307861328, 0.0028368234634399414, 0.00405120849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 6.0, 2.0, 8.0, 10.0, 13.0, 14.0, 17.0, 27.0, 35.0, 39.0, 45.0, 79.0, 110.0, 176.0, 269.0, 861.0, 4597.0, 67812.0, 922823.0, 46351.0, 3672.0, 750.0, 283.0, 163.0, 111.0, 76.0, 47.0, 36.0, 23.0, 30.0, 16.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10801887512207031, -0.10422134399414062, -0.10042381286621094, -0.09662628173828125, -0.09282875061035156, -0.08903121948242188, -0.08523368835449219, -0.0814361572265625, -0.07763862609863281, -0.07384109497070312, -0.07004356384277344, -0.06624603271484375, -0.06244850158691406, -0.058650970458984375, -0.05485343933105469, -0.051055908203125, -0.04725837707519531, -0.043460845947265625, -0.03966331481933594, -0.03586578369140625, -0.03206825256347656, -0.028270721435546875, -0.024473190307617188, -0.0206756591796875, -0.016878128051757812, -0.013080596923828125, -0.009283065795898438, -0.00548553466796875, -0.0016880035400390625, 0.002109527587890625, 0.0059070587158203125, 0.00970458984375, 0.013502120971679688, 0.017299652099609375, 0.021097183227539062, 0.02489471435546875, 0.028692245483398438, 0.032489776611328125, 0.03628730773925781, 0.0400848388671875, 0.04388236999511719, 0.047679901123046875, 0.05147743225097656, 0.05527496337890625, 0.05907249450683594, 0.06287002563476562, 0.06666755676269531, 0.070465087890625, 0.07426261901855469, 0.07806015014648438, 0.08185768127441406, 0.08565521240234375, 0.08945274353027344, 0.09325027465820312, 0.09704780578613281, 0.1008453369140625, 0.10464286804199219, 0.10844039916992188, 0.11223793029785156, 0.11603546142578125, 0.11983299255371094, 0.12363052368164062, 0.1274280548095703, 0.1312255859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 7.0, 13.0, 21.0, 14.0, 17.0, 23.0, 24.0, 40.0, 40.0, 54.0, 54.0, 60.0, 73.0, 59.0, 59.0, 65.0, 73.0, 46.0, 41.0, 49.0, 39.0, 29.0, 19.0, 18.0, 12.0, 12.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0494384765625, -0.04771757125854492, -0.045996665954589844, -0.044275760650634766, -0.04255485534667969, -0.04083395004272461, -0.03911304473876953, -0.03739213943481445, -0.035671234130859375, -0.0339503288269043, -0.03222942352294922, -0.03050851821899414, -0.028787612915039062, -0.027066707611083984, -0.025345802307128906, -0.023624897003173828, -0.02190399169921875, -0.020183086395263672, -0.018462181091308594, -0.016741275787353516, -0.015020370483398438, -0.01329946517944336, -0.011578559875488281, -0.009857654571533203, -0.008136749267578125, -0.006415843963623047, -0.004694938659667969, -0.0029740333557128906, -0.0012531280517578125, 0.0004677772521972656, 0.0021886825561523438, 0.003909587860107422, 0.0056304931640625, 0.007351398468017578, 0.009072303771972656, 0.010793209075927734, 0.012514114379882812, 0.01423501968383789, 0.01595592498779297, 0.017676830291748047, 0.019397735595703125, 0.021118640899658203, 0.02283954620361328, 0.02456045150756836, 0.026281356811523438, 0.028002262115478516, 0.029723167419433594, 0.03144407272338867, 0.03316497802734375, 0.03488588333129883, 0.036606788635253906, 0.038327693939208984, 0.04004859924316406, 0.04176950454711914, 0.04349040985107422, 0.0452113151550293, 0.046932220458984375, 0.04865312576293945, 0.05037403106689453, 0.05209493637084961, 0.05381584167480469, 0.055536746978759766, 0.057257652282714844, 0.05897855758666992, 0.060699462890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 6.0, 4.0, 12.0, 10.0, 18.0, 22.0, 24.0, 34.0, 43.0, 97.0, 181.0, 523.0, 2548.0, 27013.0, 1006834.0, 9064.0, 1322.0, 361.0, 147.0, 72.0, 32.0, 33.0, 23.0, 20.0, 19.0, 5.0, 8.0, 12.0, 4.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.41650390625, -0.4040031433105469, -0.39150238037109375, -0.3790016174316406, -0.3665008544921875, -0.3540000915527344, -0.34149932861328125, -0.3289985656738281, -0.316497802734375, -0.3039970397949219, -0.29149627685546875, -0.2789955139160156, -0.2664947509765625, -0.2539939880371094, -0.24149322509765625, -0.22899246215820312, -0.21649169921875, -0.20399093627929688, -0.19149017333984375, -0.17898941040039062, -0.1664886474609375, -0.15398788452148438, -0.14148712158203125, -0.12898635864257812, -0.116485595703125, -0.10398483276367188, -0.09148406982421875, -0.07898330688476562, -0.0664825439453125, -0.053981781005859375, -0.04148101806640625, -0.028980255126953125, -0.0164794921875, -0.003978729248046875, 0.00852203369140625, 0.021022796630859375, 0.0335235595703125, 0.046024322509765625, 0.05852508544921875, 0.07102584838867188, 0.083526611328125, 0.09602737426757812, 0.10852813720703125, 0.12102890014648438, 0.1335296630859375, 0.14603042602539062, 0.15853118896484375, 0.17103195190429688, 0.18353271484375, 0.19603347778320312, 0.20853424072265625, 0.22103500366210938, 0.2335357666015625, 0.24603652954101562, 0.25853729248046875, 0.2710380554199219, 0.283538818359375, 0.2960395812988281, 0.30854034423828125, 0.3210411071777344, 0.3335418701171875, 0.3460426330566406, 0.35854339599609375, 0.3710441589355469, 0.383544921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 13.0, 14.0, 10.0, 8.0, 11.0, 10.0, 21.0, 19.0, 31.0, 51.0, 63.0, 74.0, 111.0, 165.0, 92.0, 78.0, 55.0, 41.0, 20.0, 27.0, 18.0, 9.0, 12.0, 5.0, 8.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003249645233154297, -0.00031453371047973633, -0.00030410289764404297, -0.0002936720848083496, -0.00028324127197265625, -0.0002728104591369629, -0.00026237964630126953, -0.00025194883346557617, -0.0002415180206298828, -0.00023108720779418945, -0.0002206563949584961, -0.00021022558212280273, -0.00019979476928710938, -0.00018936395645141602, -0.00017893314361572266, -0.0001685023307800293, -0.00015807151794433594, -0.00014764070510864258, -0.00013720989227294922, -0.00012677907943725586, -0.0001163482666015625, -0.00010591745376586914, -9.548664093017578e-05, -8.505582809448242e-05, -7.462501525878906e-05, -6.41942024230957e-05, -5.3763389587402344e-05, -4.3332576751708984e-05, -3.2901763916015625e-05, -2.2470951080322266e-05, -1.2040138244628906e-05, -1.6093254089355469e-06, 8.821487426757812e-06, 1.9252300262451172e-05, 2.968311309814453e-05, 4.011392593383789e-05, 5.054473876953125e-05, 6.097555160522461e-05, 7.140636444091797e-05, 8.183717727661133e-05, 9.226799011230469e-05, 0.00010269880294799805, 0.0001131296157836914, 0.00012356042861938477, 0.00013399124145507812, 0.00014442205429077148, 0.00015485286712646484, 0.0001652836799621582, 0.00017571449279785156, 0.00018614530563354492, 0.00019657611846923828, 0.00020700693130493164, 0.000217437744140625, 0.00022786855697631836, 0.00023829936981201172, 0.0002487301826477051, 0.00025916099548339844, 0.0002695918083190918, 0.00028002262115478516, 0.0002904534339904785, 0.0003008842468261719, 0.00031131505966186523, 0.0003217458724975586, 0.00033217668533325195, 0.0003426074981689453]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 6.0, 8.0, 10.0, 12.0, 31.0, 78.0, 282.0, 1410.0, 10726.0, 981798.0, 49198.0, 3969.0, 687.0, 185.0, 52.0, 20.0, 19.0, 14.0, 4.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4586982727050781, -0.44425201416015625, -0.4298057556152344, -0.4153594970703125, -0.4009132385253906, -0.38646697998046875, -0.3720207214355469, -0.357574462890625, -0.3431282043457031, -0.32868194580078125, -0.3142356872558594, -0.2997894287109375, -0.2853431701660156, -0.27089691162109375, -0.2564506530761719, -0.24200439453125, -0.22755813598632812, -0.21311187744140625, -0.19866561889648438, -0.1842193603515625, -0.16977310180664062, -0.15532684326171875, -0.14088058471679688, -0.126434326171875, -0.11198806762695312, -0.09754180908203125, -0.08309555053710938, -0.0686492919921875, -0.054203033447265625, -0.03975677490234375, -0.025310516357421875, -0.0108642578125, 0.003582000732421875, 0.01802825927734375, 0.032474517822265625, 0.0469207763671875, 0.061367034912109375, 0.07581329345703125, 0.09025955200195312, 0.104705810546875, 0.11915206909179688, 0.13359832763671875, 0.14804458618164062, 0.1624908447265625, 0.17693710327148438, 0.19138336181640625, 0.20582962036132812, 0.22027587890625, 0.23472213745117188, 0.24916839599609375, 0.2636146545410156, 0.2780609130859375, 0.2925071716308594, 0.30695343017578125, 0.3213996887207031, 0.335845947265625, 0.3502922058105469, 0.36473846435546875, 0.3791847229003906, 0.3936309814453125, 0.4080772399902344, 0.42252349853515625, 0.4369697570800781, 0.451416015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 7.0, 13.0, 16.0, 32.0, 39.0, 124.0, 455.0, 142.0, 45.0, 28.0, 18.0, 14.0, 2.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1637554168701172, -0.15856552124023438, -0.15337562561035156, -0.14818572998046875, -0.14299583435058594, -0.13780593872070312, -0.1326160430908203, -0.1274261474609375, -0.12223625183105469, -0.11704635620117188, -0.11185646057128906, -0.10666656494140625, -0.10147666931152344, -0.09628677368164062, -0.09109687805175781, -0.085906982421875, -0.08071708679199219, -0.07552719116210938, -0.07033729553222656, -0.06514739990234375, -0.05995750427246094, -0.054767608642578125, -0.04957771301269531, -0.0443878173828125, -0.03919792175292969, -0.034008026123046875, -0.028818130493164062, -0.02362823486328125, -0.018438339233398438, -0.013248443603515625, -0.008058547973632812, -0.00286865234375, 0.0023212432861328125, 0.007511138916015625, 0.012701034545898438, 0.01789093017578125, 0.023080825805664062, 0.028270721435546875, 0.03346061706542969, 0.0386505126953125, 0.04384040832519531, 0.049030303955078125, 0.05422019958496094, 0.05941009521484375, 0.06459999084472656, 0.06978988647460938, 0.07497978210449219, 0.080169677734375, 0.08535957336425781, 0.09054946899414062, 0.09573936462402344, 0.10092926025390625, 0.10611915588378906, 0.11130905151367188, 0.11649894714355469, 0.1216888427734375, 0.1268787384033203, 0.13206863403320312, 0.13725852966308594, 0.14244842529296875, 0.14763832092285156, 0.15282821655273438, 0.1580181121826172, 0.1632080078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 984.0, 28.0, 4.0, 1.0], "bins": [-35.275917053222656, -34.69390106201172, -34.11188888549805, -33.52987289428711, -32.94785690307617, -32.3658447265625, -31.783828735351562, -31.201814651489258, -30.619800567626953, -30.03778648376465, -29.45577049255371, -28.873756408691406, -28.2917423248291, -27.709728240966797, -27.12771224975586, -26.545698165893555, -25.96368408203125, -25.381669998168945, -24.799654006958008, -24.217639923095703, -23.6356258392334, -23.053611755371094, -22.471595764160156, -21.88958168029785, -21.307565689086914, -20.72555160522461, -20.143535614013672, -19.561521530151367, -18.979507446289062, -18.397493362426758, -17.81547737121582, -17.233463287353516, -16.65144920349121, -16.069435119628906, -15.487420082092285, -14.905405044555664, -14.32339096069336, -13.741375923156738, -13.159360885620117, -12.577346801757812, -11.995332717895508, -11.413317680358887, -10.831303596496582, -10.249288558959961, -9.667274475097656, -9.085259437561035, -8.503244400024414, -7.921230316162109, -7.339215278625488, -6.757200717926025, -6.1751861572265625, -5.593171119689941, -5.011157035827637, -4.429141998291016, -3.8471274375915527, -3.26511287689209, -2.683098316192627, -2.101083755493164, -1.5190690755844116, -0.9370543956756592, -0.3550398349761963, 0.2269747257232666, 0.8089895248413086, 1.3910040855407715, 1.9730185270309448]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 25.0, 50.0, 115.0, 184.0, 179.0, 199.0, 131.0, 77.0, 33.0, 12.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587221622467041, -2.5386786460876465, -2.490135431289673, -2.4415924549102783, -2.3930492401123047, -2.34450626373291, -2.2959632873535156, -2.247420072555542, -2.1988770961761475, -2.150334119796753, -2.1017909049987793, -2.0532479286193848, -2.004704713821411, -1.9561617374420166, -1.9076186418533325, -1.8590755462646484, -1.8105324506759644, -1.7619893550872803, -1.7134462594985962, -1.664903163909912, -1.6163601875305176, -1.5678170919418335, -1.5192739963531494, -1.4707309007644653, -1.4221878051757812, -1.3736447095870972, -1.325101613998413, -1.2765586376190186, -1.2280155420303345, -1.1794724464416504, -1.1309293508529663, -1.0823862552642822, -1.0338433980941772, -0.9853003025054932, -0.9367572665214539, -0.8882141709327698, -0.8396711349487305, -0.7911280393600464, -0.7425849437713623, -0.6940418481826782, -0.6454988121986389, -0.5969557166099548, -0.5484126806259155, -0.49986958503723145, -0.45132651925086975, -0.40278345346450806, -0.354240357875824, -0.3056972920894623, -0.2571542263031006, -0.2086111605167389, -0.160068079829216, -0.11152499914169312, -0.06298193335533142, -0.014438867568969727, 0.034104228019714355, 0.08264729380607605, 0.13119035959243774, 0.17973342537879944, 0.22827650606632233, 0.2768195867538452, 0.3253626525402069, 0.3739057183265686, 0.4224488139152527, 0.4709918797016144, 0.5195349454879761]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 18.0, 38.0, 75.0, 150.0, 498.0, 42257.0, 4150998.0, 205.0, 41.0, 6.0, 1.0], "bins": [-3.6875, -3.625072479248047, -3.5626449584960938, -3.5002174377441406, -3.4377899169921875, -3.3753623962402344, -3.3129348754882812, -3.250507354736328, -3.188079833984375, -3.125652313232422, -3.0632247924804688, -3.0007972717285156, -2.9383697509765625, -2.8759422302246094, -2.8135147094726562, -2.751087188720703, -2.68865966796875, -2.626232147216797, -2.5638046264648438, -2.5013771057128906, -2.4389495849609375, -2.3765220642089844, -2.3140945434570312, -2.251667022705078, -2.189239501953125, -2.126811981201172, -2.0643844604492188, -2.0019569396972656, -1.9395294189453125, -1.8771018981933594, -1.8146743774414062, -1.7522468566894531, -1.6898193359375, -1.6273918151855469, -1.5649642944335938, -1.5025367736816406, -1.4401092529296875, -1.3776817321777344, -1.3152542114257812, -1.2528266906738281, -1.190399169921875, -1.1279716491699219, -1.0655441284179688, -1.0031166076660156, -0.9406890869140625, -0.8782615661621094, -0.8158340454101562, -0.7534065246582031, -0.69097900390625, -0.6285514831542969, -0.5661239624023438, -0.5036964416503906, -0.4412689208984375, -0.3788414001464844, -0.31641387939453125, -0.2539863586425781, -0.191558837890625, -0.12913131713867188, -0.06670379638671875, -0.004276275634765625, 0.0581512451171875, 0.12057876586914062, 0.18300628662109375, 0.24543380737304688, 0.307861328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 58.0, 247.0, 377.0, 234.0, 76.0, 14.0, 3.0, 1.0], "bins": [-0.0992431640625, -0.09754598140716553, -0.09584879875183105, -0.09415161609649658, -0.09245443344116211, -0.09075725078582764, -0.08906006813049316, -0.08736288547515869, -0.08566570281982422, -0.08396852016448975, -0.08227133750915527, -0.0805741548538208, -0.07887697219848633, -0.07717978954315186, -0.07548260688781738, -0.07378542423248291, -0.07208824157714844, -0.07039105892181396, -0.06869387626647949, -0.06699669361114502, -0.06529951095581055, -0.06360232830047607, -0.0619051456451416, -0.06020796298980713, -0.058510780334472656, -0.056813597679138184, -0.05511641502380371, -0.05341923236846924, -0.051722049713134766, -0.05002486705780029, -0.04832768440246582, -0.04663050174713135, -0.044933319091796875, -0.0432361364364624, -0.04153895378112793, -0.03984177112579346, -0.038144588470458984, -0.03644740581512451, -0.03475022315979004, -0.033053040504455566, -0.031355857849121094, -0.02965867519378662, -0.02796149253845215, -0.026264309883117676, -0.024567127227783203, -0.02286994457244873, -0.021172761917114258, -0.019475579261779785, -0.017778396606445312, -0.01608121395111084, -0.014384031295776367, -0.012686848640441895, -0.010989665985107422, -0.00929248332977295, -0.0075953006744384766, -0.005898118019104004, -0.004200935363769531, -0.0025037527084350586, -0.0008065700531005859, 0.0008906126022338867, 0.0025877952575683594, 0.004284977912902832, 0.005982160568237305, 0.007679343223571777, 0.00937652587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 18.0, 38.0, 79.0, 202.0, 237.0, 382.0, 4186524.0, 6212.0, 304.0, 154.0, 85.0, 37.0, 5.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.015625, -4.91497802734375, -4.8143310546875, -4.71368408203125, -4.613037109375, -4.51239013671875, -4.4117431640625, -4.31109619140625, -4.21044921875, -4.10980224609375, -4.0091552734375, -3.90850830078125, -3.807861328125, -3.70721435546875, -3.6065673828125, -3.50592041015625, -3.4052734375, -3.30462646484375, -3.2039794921875, -3.10333251953125, -3.002685546875, -2.90203857421875, -2.8013916015625, -2.70074462890625, -2.60009765625, -2.49945068359375, -2.3988037109375, -2.29815673828125, -2.197509765625, -2.09686279296875, -1.9962158203125, -1.89556884765625, -1.794921875, -1.69427490234375, -1.5936279296875, -1.49298095703125, -1.392333984375, -1.29168701171875, -1.1910400390625, -1.09039306640625, -0.98974609375, -0.88909912109375, -0.7884521484375, -0.68780517578125, -0.587158203125, -0.48651123046875, -0.3858642578125, -0.28521728515625, -0.1845703125, -0.08392333984375, 0.0167236328125, 0.11737060546875, 0.218017578125, 0.31866455078125, 0.4193115234375, 0.51995849609375, 0.62060546875, 0.72125244140625, 0.8218994140625, 0.92254638671875, 1.023193359375, 1.12384033203125, 1.2244873046875, 1.32513427734375, 1.42578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 112.0, 3858.0, 88.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47607421875, -0.46661949157714844, -0.4571647644042969, -0.4477100372314453, -0.43825531005859375, -0.4288005828857422, -0.4193458557128906, -0.40989112854003906, -0.4004364013671875, -0.39098167419433594, -0.3815269470214844, -0.3720722198486328, -0.36261749267578125, -0.3531627655029297, -0.3437080383300781, -0.33425331115722656, -0.324798583984375, -0.31534385681152344, -0.3058891296386719, -0.2964344024658203, -0.28697967529296875, -0.2775249481201172, -0.2680702209472656, -0.25861549377441406, -0.2491607666015625, -0.23970603942871094, -0.23025131225585938, -0.2207965850830078, -0.21134185791015625, -0.2018871307373047, -0.19243240356445312, -0.18297767639160156, -0.17352294921875, -0.16406822204589844, -0.15461349487304688, -0.1451587677001953, -0.13570404052734375, -0.1262493133544922, -0.11679458618164062, -0.10733985900878906, -0.0978851318359375, -0.08843040466308594, -0.07897567749023438, -0.06952095031738281, -0.06006622314453125, -0.05061149597167969, -0.041156768798828125, -0.03170204162597656, -0.022247314453125, -0.012792587280273438, -0.003337860107421875, 0.0061168670654296875, 0.01557159423828125, 0.025026321411132812, 0.034481048583984375, 0.04393577575683594, 0.0533905029296875, 0.06284523010253906, 0.07229995727539062, 0.08175468444824219, 0.09120941162109375, 0.10066413879394531, 0.11011886596679688, 0.11957359313964844, 0.1290283203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 15.0, 38.0, 736.0, 185.0, 27.0, 8.0, 3.0, 2.0], "bins": [-5.6812028884887695, -5.584517002105713, -5.487830638885498, -5.391144752502441, -5.294458389282227, -5.19777250289917, -5.101086139678955, -5.004400253295898, -4.907713890075684, -4.811028003692627, -4.714341640472412, -4.6176557540893555, -4.520969390869141, -4.424283504486084, -4.327597141265869, -4.2309112548828125, -4.134225368499756, -4.037539482116699, -3.9408531188964844, -3.8441669940948486, -3.747480869293213, -3.6507949829101562, -3.5541088581085205, -3.4574227333068848, -3.360736608505249, -3.2640504837036133, -3.1673643589019775, -3.070678234100342, -2.973992347717285, -2.8773062229156494, -2.7806200981140137, -2.683933973312378, -2.587247848510742, -2.4905617237091064, -2.3938755989074707, -2.297189474105835, -2.200503349304199, -2.1038174629211426, -2.007131338119507, -1.910445213317871, -1.8137590885162354, -1.7170729637145996, -1.6203868389129639, -1.5237008333206177, -1.427014708518982, -1.3303285837173462, -1.233642578125, -1.1369564533233643, -1.0402703285217285, -0.9435842037200928, -0.8468981385231018, -0.7502120733261108, -0.6535259485244751, -0.5568398237228394, -0.4601537585258484, -0.3634676933288574, -0.2667815685272217, -0.17009547352790833, -0.07340937852859497, 0.023276716470718384, 0.11996281147003174, 0.2166489064693451, 0.31333500146865845, 0.4100210666656494, 0.5067071914672852]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 21.0, 38.0, 58.0, 122.0, 144.0, 158.0, 164.0, 108.0, 82.0, 57.0, 19.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633592128753662, -1.581588864326477, -1.5295854806900024, -1.4775822162628174, -1.4255788326263428, -1.3735755681991577, -1.3215723037719727, -1.269568920135498, -1.217565655708313, -1.165562391281128, -1.1135590076446533, -1.0615557432174683, -1.0095523595809937, -0.9575490951538086, -0.9055457711219788, -0.8535424470901489, -0.8015391230583191, -0.7495357990264893, -0.6975324749946594, -0.6455291509628296, -0.5935258865356445, -0.5415225625038147, -0.48951923847198486, -0.4375159442424774, -0.3855126202106476, -0.33350929617881775, -0.2815060019493103, -0.22950267791748047, -0.17749936878681183, -0.1254960596561432, -0.07349273562431335, -0.021489441394805908, 0.030513882637023926, 0.08251719176769257, 0.1345205008983612, 0.18652382493019104, 0.23852713406085968, 0.2905304431915283, 0.34253376722335815, 0.3945370614528656, 0.44654038548469543, 0.49854370951652527, 0.5505470037460327, 0.6025503277778625, 0.6545536518096924, 0.7065569162368774, 0.758560299873352, 0.8105635643005371, 0.8625668883323669, 0.9145702123641968, 0.9665735363960266, 1.0185768604278564, 1.0705801248550415, 1.1225833892822266, 1.1745867729187012, 1.2265900373458862, 1.2785934209823608, 1.330596685409546, 1.3826000690460205, 1.4346033334732056, 1.4866067171096802, 1.5386099815368652, 1.5906133651733398, 1.642616629600525, 1.69461989402771]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 15.0, 28.0, 27.0, 49.0, 85.0, 202.0, 603.0, 2058.0, 23305.0, 974635.0, 43625.0, 2660.0, 740.0, 248.0, 83.0, 52.0, 39.0, 30.0, 16.0, 9.0, 10.0, 9.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212890625, -0.7975387573242188, -0.7737884521484375, -0.7500381469726562, -0.726287841796875, -0.7025375366210938, -0.6787872314453125, -0.6550369262695312, -0.63128662109375, -0.6075363159179688, -0.5837860107421875, -0.5600357055664062, -0.536285400390625, -0.5125350952148438, -0.4887847900390625, -0.46503448486328125, -0.4412841796875, -0.41753387451171875, -0.3937835693359375, -0.37003326416015625, -0.346282958984375, -0.32253265380859375, -0.2987823486328125, -0.27503204345703125, -0.25128173828125, -0.22753143310546875, -0.2037811279296875, -0.18003082275390625, -0.156280517578125, -0.13253021240234375, -0.1087799072265625, -0.08502960205078125, -0.061279296875, -0.03752899169921875, -0.0137786865234375, 0.00997161865234375, 0.033721923828125, 0.05747222900390625, 0.0812225341796875, 0.10497283935546875, 0.12872314453125, 0.15247344970703125, 0.1762237548828125, 0.19997406005859375, 0.223724365234375, 0.24747467041015625, 0.2712249755859375, 0.29497528076171875, 0.3187255859375, 0.34247589111328125, 0.3662261962890625, 0.38997650146484375, 0.413726806640625, 0.43747711181640625, 0.4612274169921875, 0.48497772216796875, 0.50872802734375, 0.5324783325195312, 0.5562286376953125, 0.5799789428710938, 0.603729248046875, 0.6274795532226562, 0.6512298583984375, 0.6749801635742188, 0.69873046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 25.0, 41.0, 75.0, 139.0, 174.0, 188.0, 151.0, 87.0, 71.0, 27.0, 14.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.1394186019897461, -0.1362590789794922, -0.13309955596923828, -0.12994003295898438, -0.12678050994873047, -0.12362098693847656, -0.12046146392822266, -0.11730194091796875, -0.11414241790771484, -0.11098289489746094, -0.10782337188720703, -0.10466384887695312, -0.10150432586669922, -0.09834480285644531, -0.0951852798461914, -0.0920257568359375, -0.0888662338256836, -0.08570671081542969, -0.08254718780517578, -0.07938766479492188, -0.07622814178466797, -0.07306861877441406, -0.06990909576416016, -0.06674957275390625, -0.06359004974365234, -0.06043052673339844, -0.05727100372314453, -0.054111480712890625, -0.05095195770263672, -0.04779243469238281, -0.044632911682128906, -0.041473388671875, -0.038313865661621094, -0.03515434265136719, -0.03199481964111328, -0.028835296630859375, -0.02567577362060547, -0.022516250610351562, -0.019356727600097656, -0.01619720458984375, -0.013037681579589844, -0.009878158569335938, -0.006718635559082031, -0.003559112548828125, -0.00039958953857421875, 0.0027599334716796875, 0.005919456481933594, 0.0090789794921875, 0.012238502502441406, 0.015398025512695312, 0.01855754852294922, 0.021717071533203125, 0.02487659454345703, 0.028036117553710938, 0.031195640563964844, 0.03435516357421875, 0.037514686584472656, 0.04067420959472656, 0.04383373260498047, 0.046993255615234375, 0.05015277862548828, 0.05331230163574219, 0.056471824645996094, 0.05963134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 19.0, 15.0, 22.0, 34.0, 35.0, 46.0, 87.0, 180.0, 420.0, 2552.0, 62169.0, 961949.0, 19033.0, 1308.0, 283.0, 109.0, 67.0, 50.0, 39.0, 17.0, 25.0, 18.0, 8.0, 13.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.4306373596191406, -0.41645050048828125, -0.4022636413574219, -0.3880767822265625, -0.3738899230957031, -0.35970306396484375, -0.3455162048339844, -0.331329345703125, -0.3171424865722656, -0.30295562744140625, -0.2887687683105469, -0.2745819091796875, -0.2603950500488281, -0.24620819091796875, -0.23202133178710938, -0.21783447265625, -0.20364761352539062, -0.18946075439453125, -0.17527389526367188, -0.1610870361328125, -0.14690017700195312, -0.13271331787109375, -0.11852645874023438, -0.104339599609375, -0.09015274047851562, -0.07596588134765625, -0.061779022216796875, -0.0475921630859375, -0.033405303955078125, -0.01921844482421875, -0.005031585693359375, 0.0091552734375, 0.023342132568359375, 0.03752899169921875, 0.051715850830078125, 0.0659027099609375, 0.08008956909179688, 0.09427642822265625, 0.10846328735351562, 0.122650146484375, 0.13683700561523438, 0.15102386474609375, 0.16521072387695312, 0.1793975830078125, 0.19358444213867188, 0.20777130126953125, 0.22195816040039062, 0.23614501953125, 0.2503318786621094, 0.26451873779296875, 0.2787055969238281, 0.2928924560546875, 0.3070793151855469, 0.32126617431640625, 0.3354530334472656, 0.349639892578125, 0.3638267517089844, 0.37801361083984375, 0.3922004699707031, 0.4063873291015625, 0.4205741882324219, 0.43476104736328125, 0.4489479064941406, 0.463134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 10.0, 12.0, 15.0, 26.0, 24.0, 36.0, 26.0, 39.0, 48.0, 61.0, 58.0, 63.0, 56.0, 69.0, 67.0, 49.0, 58.0, 41.0, 40.0, 34.0, 31.0, 25.0, 29.0, 11.0, 11.0, 13.0, 11.0, 3.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1636638641357422, -0.15838241577148438, -0.15310096740722656, -0.14781951904296875, -0.14253807067871094, -0.13725662231445312, -0.1319751739501953, -0.1266937255859375, -0.12141227722167969, -0.11613082885742188, -0.11084938049316406, -0.10556793212890625, -0.10028648376464844, -0.09500503540039062, -0.08972358703613281, -0.084442138671875, -0.07916069030761719, -0.07387924194335938, -0.06859779357910156, -0.06331634521484375, -0.05803489685058594, -0.052753448486328125, -0.04747200012207031, -0.0421905517578125, -0.03690910339355469, -0.031627655029296875, -0.026346206665039062, -0.02106475830078125, -0.015783309936523438, -0.010501861572265625, -0.0052204132080078125, 6.103515625e-05, 0.0053424835205078125, 0.010623931884765625, 0.015905380249023438, 0.02118682861328125, 0.026468276977539062, 0.031749725341796875, 0.03703117370605469, 0.0423126220703125, 0.04759407043457031, 0.052875518798828125, 0.05815696716308594, 0.06343841552734375, 0.06871986389160156, 0.07400131225585938, 0.07928276062011719, 0.084564208984375, 0.08984565734863281, 0.09512710571289062, 0.10040855407714844, 0.10569000244140625, 0.11097145080566406, 0.11625289916992188, 0.12153434753417969, 0.1268157958984375, 0.1320972442626953, 0.13737869262695312, 0.14266014099121094, 0.14794158935546875, 0.15322303771972656, 0.15850448608398438, 0.1637859344482422, 0.1690673828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 34.0, 46.0, 121.0, 237.0, 489.0, 1250.0, 5862.0, 152218.0, 873167.0, 11871.0, 1927.0, 638.0, 296.0, 140.0, 86.0, 41.0, 22.0, 16.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24560546875, -0.23917007446289062, -0.23273468017578125, -0.22629928588867188, -0.2198638916015625, -0.21342849731445312, -0.20699310302734375, -0.20055770874023438, -0.194122314453125, -0.18768692016601562, -0.18125152587890625, -0.17481613159179688, -0.1683807373046875, -0.16194534301757812, -0.15550994873046875, -0.14907455444335938, -0.14263916015625, -0.13620376586914062, -0.12976837158203125, -0.12333297729492188, -0.1168975830078125, -0.11046218872070312, -0.10402679443359375, -0.09759140014648438, -0.091156005859375, -0.08472061157226562, -0.07828521728515625, -0.07184982299804688, -0.0654144287109375, -0.058979034423828125, -0.05254364013671875, -0.046108245849609375, -0.0396728515625, -0.033237457275390625, -0.02680206298828125, -0.020366668701171875, -0.0139312744140625, -0.007495880126953125, -0.00106048583984375, 0.005374908447265625, 0.011810302734375, 0.018245697021484375, 0.02468109130859375, 0.031116485595703125, 0.0375518798828125, 0.043987274169921875, 0.05042266845703125, 0.056858062744140625, 0.06329345703125, 0.06972885131835938, 0.07616424560546875, 0.08259963989257812, 0.0890350341796875, 0.09547042846679688, 0.10190582275390625, 0.10834121704101562, 0.114776611328125, 0.12121200561523438, 0.12764739990234375, 0.13408279418945312, 0.1405181884765625, 0.14695358276367188, 0.15338897705078125, 0.15982437133789062, 0.166259765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 1.0, 3.0, 6.0, 8.0, 8.0, 17.0, 14.0, 12.0, 16.0, 29.0, 34.0, 60.0, 66.0, 95.0, 132.0, 113.0, 73.0, 71.0, 41.0, 39.0, 28.0, 32.0, 16.0, 13.0, 20.0, 6.0, 8.0, 11.0, 2.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002493858337402344, -0.00024043768644332886, -0.00023148953914642334, -0.00022254139184951782, -0.0002135932445526123, -0.0002046450972557068, -0.00019569694995880127, -0.00018674880266189575, -0.00017780065536499023, -0.00016885250806808472, -0.0001599043607711792, -0.00015095621347427368, -0.00014200806617736816, -0.00013305991888046265, -0.00012411177158355713, -0.00011516362428665161, -0.0001062154769897461, -9.726732969284058e-05, -8.831918239593506e-05, -7.937103509902954e-05, -7.042288780212402e-05, -6.14747405052185e-05, -5.252659320831299e-05, -4.357844591140747e-05, -3.463029861450195e-05, -2.5682151317596436e-05, -1.6734004020690918e-05, -7.7858567237854e-06, 1.1622905731201172e-06, 1.0110437870025635e-05, 1.9058585166931152e-05, 2.800673246383667e-05, 3.695487976074219e-05, 4.5903027057647705e-05, 5.485117435455322e-05, 6.379932165145874e-05, 7.274746894836426e-05, 8.169561624526978e-05, 9.064376354217529e-05, 9.959191083908081e-05, 0.00010854005813598633, 0.00011748820543289185, 0.00012643635272979736, 0.00013538450002670288, 0.0001443326473236084, 0.00015328079462051392, 0.00016222894191741943, 0.00017117708921432495, 0.00018012523651123047, 0.00018907338380813599, 0.0001980215311050415, 0.00020696967840194702, 0.00021591782569885254, 0.00022486597299575806, 0.00023381412029266357, 0.0002427622675895691, 0.0002517104148864746, 0.0002606585621833801, 0.00026960670948028564, 0.00027855485677719116, 0.0002875030040740967, 0.0002964511513710022, 0.0003053992986679077, 0.00031434744596481323, 0.00032329559326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 16.0, 20.0, 38.0, 54.0, 147.0, 380.0, 1668.0, 20007.0, 1003969.0, 19747.0, 1692.0, 419.0, 172.0, 75.0, 41.0, 18.0, 21.0, 13.0, 13.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28125, -0.2723197937011719, -0.26338958740234375, -0.2544593811035156, -0.2455291748046875, -0.23659896850585938, -0.22766876220703125, -0.21873855590820312, -0.209808349609375, -0.20087814331054688, -0.19194793701171875, -0.18301773071289062, -0.1740875244140625, -0.16515731811523438, -0.15622711181640625, -0.14729690551757812, -0.13836669921875, -0.12943649291992188, -0.12050628662109375, -0.11157608032226562, -0.1026458740234375, -0.09371566772460938, -0.08478546142578125, -0.07585525512695312, -0.066925048828125, -0.057994842529296875, -0.04906463623046875, -0.040134429931640625, -0.0312042236328125, -0.022274017333984375, -0.01334381103515625, -0.004413604736328125, 0.0045166015625, 0.013446807861328125, 0.02237701416015625, 0.031307220458984375, 0.0402374267578125, 0.049167633056640625, 0.05809783935546875, 0.06702804565429688, 0.075958251953125, 0.08488845825195312, 0.09381866455078125, 0.10274887084960938, 0.1116790771484375, 0.12060928344726562, 0.12953948974609375, 0.13846969604492188, 0.14739990234375, 0.15633010864257812, 0.16526031494140625, 0.17419052124023438, 0.1831207275390625, 0.19205093383789062, 0.20098114013671875, 0.20991134643554688, 0.218841552734375, 0.22777175903320312, 0.23670196533203125, 0.24563217163085938, 0.2545623779296875, 0.2634925842285156, 0.27242279052734375, 0.2813529968261719, 0.290283203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 16.0, 22.0, 19.0, 39.0, 59.0, 122.0, 169.0, 190.0, 131.0, 78.0, 39.0, 32.0, 21.0, 12.0, 8.0, 9.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1055908203125, -0.10196685791015625, -0.0983428955078125, -0.09471893310546875, -0.091094970703125, -0.08747100830078125, -0.0838470458984375, -0.08022308349609375, -0.07659912109375, -0.07297515869140625, -0.0693511962890625, -0.06572723388671875, -0.062103271484375, -0.05847930908203125, -0.0548553466796875, -0.05123138427734375, -0.047607421875, -0.04398345947265625, -0.0403594970703125, -0.03673553466796875, -0.033111572265625, -0.02948760986328125, -0.0258636474609375, -0.02223968505859375, -0.01861572265625, -0.01499176025390625, -0.0113677978515625, -0.00774383544921875, -0.004119873046875, -0.00049591064453125, 0.0031280517578125, 0.00675201416015625, 0.0103759765625, 0.01399993896484375, 0.0176239013671875, 0.02124786376953125, 0.024871826171875, 0.02849578857421875, 0.0321197509765625, 0.03574371337890625, 0.03936767578125, 0.04299163818359375, 0.0466156005859375, 0.05023956298828125, 0.053863525390625, 0.05748748779296875, 0.0611114501953125, 0.06473541259765625, 0.068359375, 0.07198333740234375, 0.0756072998046875, 0.07923126220703125, 0.082855224609375, 0.08647918701171875, 0.0901031494140625, 0.09372711181640625, 0.09735107421875, 0.10097503662109375, 0.1045989990234375, 0.10822296142578125, 0.111846923828125, 0.11547088623046875, 0.1190948486328125, 0.12271881103515625, 0.1263427734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 84.0, 755.0, 124.0, 27.0, 10.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53749942779541, -5.410022258758545, -5.28254508972168, -5.155067443847656, -5.027590274810791, -4.900113105773926, -4.772635459899902, -4.645158290863037, -4.517681121826172, -4.390203952789307, -4.262726783752441, -4.135249137878418, -4.007771968841553, -3.8802947998046875, -3.752817392349243, -3.625339984893799, -3.4978628158569336, -3.3703856468200684, -3.242908239364624, -3.1154308319091797, -2.9879536628723145, -2.860476493835449, -2.732999086380005, -2.6055216789245605, -2.4780445098876953, -2.35056734085083, -2.2230899333953857, -2.0956125259399414, -1.9681353569030762, -1.8406580686569214, -1.7131807804107666, -1.5857034921646118, -1.458226203918457, -1.3307489156723022, -1.2032716274261475, -1.0757943391799927, -0.9483170509338379, -0.8208397626876831, -0.6933624744415283, -0.5658851861953735, -0.43840789794921875, -0.31093060970306396, -0.18345332145690918, -0.055976033210754395, 0.07150125503540039, 0.19897854328155518, 0.32645583152770996, 0.45393311977386475, 0.5814104080200195, 0.7088876962661743, 0.8363649845123291, 0.9638422727584839, 1.0913195610046387, 1.2187968492507935, 1.3462741374969482, 1.473751425743103, 1.6012287139892578, 1.7287060022354126, 1.8561832904815674, 1.9836605787277222, 2.111137866973877, 2.238615036010742, 2.3660924434661865, 2.493569850921631, 2.621047019958496]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 13.0, 7.0, 17.0, 18.0, 22.0, 19.0, 33.0, 38.0, 48.0, 42.0, 49.0, 66.0, 74.0, 69.0, 55.0, 69.0, 49.0, 48.0, 50.0, 37.0, 32.0, 28.0, 26.0, 20.0, 19.0, 14.0, 9.0, 12.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9222455024719238, -0.8873699307441711, -0.8524943590164185, -0.8176187872886658, -0.7827432155609131, -0.7478677034378052, -0.7129921317100525, -0.6781165599822998, -0.6432409882545471, -0.6083654165267944, -0.5734898447990417, -0.5386142730712891, -0.5037387609481812, -0.4688631594181061, -0.4339876174926758, -0.3991120457649231, -0.3642364740371704, -0.3293609023094177, -0.29448533058166504, -0.25960978865623474, -0.22473421692848206, -0.18985864520072937, -0.15498308837413788, -0.12010753154754639, -0.0852319598197937, -0.05035639554262161, -0.015480831265449524, 0.019394733011722565, 0.05427029728889465, 0.08914586901664734, 0.12402142584323883, 0.15889698266983032, 0.19377243518829346, 0.22864800691604614, 0.26352357864379883, 0.2983991205692291, 0.3332746922969818, 0.3681502640247345, 0.4030258059501648, 0.4379013776779175, 0.47277694940567017, 0.5076525211334229, 0.5425280928611755, 0.5774036645889282, 0.6122791767120361, 0.6471548080444336, 0.6820303201675415, 0.7169058918952942, 0.7517814636230469, 0.7866570353507996, 0.8215326070785522, 0.8564081788063049, 0.8912837505340576, 0.9261592626571655, 0.9610348343849182, 0.9959104061126709, 1.0307860374450684, 1.0656615495681763, 1.1005371809005737, 1.1354126930236816, 1.170288324356079, 1.205163836479187, 1.2400394678115845, 1.2749149799346924, 1.3097904920578003]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 2.0, 3.0, 3.0, 6.0, 12.0, 7.0, 8.0, 11.0, 17.0, 22.0, 19.0, 23.0, 30.0, 48.0, 56.0, 79.0, 125.0, 152.0, 268.0, 535.0, 1258.0, 4077.0, 25681.0, 3612346.0, 526275.0, 18891.0, 3099.0, 787.0, 280.0, 94.0, 34.0, 20.0, 13.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.9873046875, -0.9679145812988281, -0.9485244750976562, -0.9291343688964844, -0.9097442626953125, -0.8903541564941406, -0.8709640502929688, -0.8515739440917969, -0.832183837890625, -0.8127937316894531, -0.7934036254882812, -0.7740135192871094, -0.7546234130859375, -0.7352333068847656, -0.7158432006835938, -0.6964530944824219, -0.67706298828125, -0.6576728820800781, -0.6382827758789062, -0.6188926696777344, -0.5995025634765625, -0.5801124572753906, -0.5607223510742188, -0.5413322448730469, -0.521942138671875, -0.5025520324707031, -0.48316192626953125, -0.4637718200683594, -0.4443817138671875, -0.4249916076660156, -0.40560150146484375, -0.3862113952636719, -0.3668212890625, -0.3474311828613281, -0.32804107666015625, -0.3086509704589844, -0.2892608642578125, -0.2698707580566406, -0.25048065185546875, -0.23109054565429688, -0.211700439453125, -0.19231033325195312, -0.17292022705078125, -0.15353012084960938, -0.1341400146484375, -0.11474990844726562, -0.09535980224609375, -0.07596969604492188, -0.05657958984375, -0.037189483642578125, -0.01779937744140625, 0.001590728759765625, 0.0209808349609375, 0.040370941162109375, 0.05976104736328125, 0.07915115356445312, 0.098541259765625, 0.11793136596679688, 0.13732147216796875, 0.15671157836914062, 0.1761016845703125, 0.19549179077148438, 0.21488189697265625, 0.23427200317382812, 0.253662109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 33.0, 61.0, 102.0, 123.0, 178.0, 157.0, 132.0, 79.0, 50.0, 34.0, 19.0, 8.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.149658203125, -0.14671659469604492, -0.14377498626708984, -0.14083337783813477, -0.1378917694091797, -0.1349501609802246, -0.13200855255126953, -0.12906694412231445, -0.12612533569335938, -0.1231837272644043, -0.12024211883544922, -0.11730051040649414, -0.11435890197753906, -0.11141729354858398, -0.1084756851196289, -0.10553407669067383, -0.10259246826171875, -0.09965085983276367, -0.0967092514038086, -0.09376764297485352, -0.09082603454589844, -0.08788442611694336, -0.08494281768798828, -0.0820012092590332, -0.07905960083007812, -0.07611799240112305, -0.07317638397216797, -0.07023477554321289, -0.06729316711425781, -0.06435155868530273, -0.061409950256347656, -0.05846834182739258, -0.0555267333984375, -0.05258512496948242, -0.049643516540527344, -0.046701908111572266, -0.04376029968261719, -0.04081869125366211, -0.03787708282470703, -0.03493547439575195, -0.031993865966796875, -0.029052257537841797, -0.02611064910888672, -0.02316904067993164, -0.020227432250976562, -0.017285823822021484, -0.014344215393066406, -0.011402606964111328, -0.00846099853515625, -0.005519390106201172, -0.0025777816772460938, 0.0003638267517089844, 0.0033054351806640625, 0.006247043609619141, 0.009188652038574219, 0.012130260467529297, 0.015071868896484375, 0.018013477325439453, 0.02095508575439453, 0.02389669418334961, 0.026838302612304688, 0.029779911041259766, 0.032721519470214844, 0.03566312789916992, 0.038604736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 22.0, 70.0, 151.0, 544.0, 105600.0, 4087409.0, 346.0, 89.0, 34.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.6368865966796875, -6.504241943359375, -6.3715972900390625, -6.23895263671875, -6.1063079833984375, -5.973663330078125, -5.8410186767578125, -5.7083740234375, -5.5757293701171875, -5.443084716796875, -5.3104400634765625, -5.17779541015625, -5.0451507568359375, -4.912506103515625, -4.7798614501953125, -4.647216796875, -4.5145721435546875, -4.381927490234375, -4.2492828369140625, -4.11663818359375, -3.9839935302734375, -3.851348876953125, -3.7187042236328125, -3.5860595703125, -3.4534149169921875, -3.320770263671875, -3.1881256103515625, -3.05548095703125, -2.9228363037109375, -2.790191650390625, -2.6575469970703125, -2.52490234375, -2.3922576904296875, -2.259613037109375, -2.1269683837890625, -1.99432373046875, -1.8616790771484375, -1.729034423828125, -1.5963897705078125, -1.4637451171875, -1.3311004638671875, -1.198455810546875, -1.0658111572265625, -0.93316650390625, -0.8005218505859375, -0.667877197265625, -0.5352325439453125, -0.402587890625, -0.2699432373046875, -0.137298583984375, -0.0046539306640625, 0.12799072265625, 0.2606353759765625, 0.393280029296875, 0.5259246826171875, 0.6585693359375, 0.7912139892578125, 0.923858642578125, 1.0565032958984375, 1.18914794921875, 1.3217926025390625, 1.454437255859375, 1.5870819091796875, 1.7197265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 16.0, 53.0, 467.0, 3381.0, 112.0, 31.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.62646484375, -0.6151199340820312, -0.6037750244140625, -0.5924301147460938, -0.581085205078125, -0.5697402954101562, -0.5583953857421875, -0.5470504760742188, -0.53570556640625, -0.5243606567382812, -0.5130157470703125, -0.5016708374023438, -0.490325927734375, -0.47898101806640625, -0.4676361083984375, -0.45629119873046875, -0.4449462890625, -0.43360137939453125, -0.4222564697265625, -0.41091156005859375, -0.399566650390625, -0.38822174072265625, -0.3768768310546875, -0.36553192138671875, -0.35418701171875, -0.34284210205078125, -0.3314971923828125, -0.32015228271484375, -0.308807373046875, -0.29746246337890625, -0.2861175537109375, -0.27477264404296875, -0.263427734375, -0.25208282470703125, -0.2407379150390625, -0.22939300537109375, -0.218048095703125, -0.20670318603515625, -0.1953582763671875, -0.18401336669921875, -0.17266845703125, -0.16132354736328125, -0.1499786376953125, -0.13863372802734375, -0.127288818359375, -0.11594390869140625, -0.1045989990234375, -0.09325408935546875, -0.0819091796875, -0.07056427001953125, -0.0592193603515625, -0.04787445068359375, -0.036529541015625, -0.02518463134765625, -0.0138397216796875, -0.00249481201171875, 0.00885009765625, 0.02019500732421875, 0.0315399169921875, 0.04288482666015625, 0.054229736328125, 0.06557464599609375, 0.0769195556640625, 0.08826446533203125, 0.099609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 6.0, 24.0, 128.0, 780.0, 60.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548156499862671, -3.4421892166137695, -3.3362221717834473, -3.230254888534546, -3.1242876052856445, -3.0183205604553223, -2.912353277206421, -2.8063859939575195, -2.7004189491271973, -2.594451665878296, -2.4884846210479736, -2.3825173377990723, -2.27655029296875, -2.1705830097198486, -2.0646157264709473, -1.9586485624313354, -1.8526813983917236, -1.7467142343521118, -1.6407470703125, -1.5347797870635986, -1.4288126230239868, -1.322845458984375, -1.2168781757354736, -1.1109110116958618, -1.00494384765625, -0.8989766836166382, -0.7930094599723816, -0.687042236328125, -0.5810750722885132, -0.47510790824890137, -0.3691406846046448, -0.2631734609603882, -0.15720605850219727, -0.05123886466026306, 0.05472832918167114, 0.16069552302360535, 0.26666271686553955, 0.37262988090515137, 0.47859710454940796, 0.5845643281936646, 0.6905314922332764, 0.7964986562728882, 0.9024658799171448, 1.0084331035614014, 1.1144002676010132, 1.220367431640625, 1.3263347148895264, 1.4323018789291382, 1.53826904296875, 1.6442362070083618, 1.7502033710479736, 1.856170654296875, 1.9621378183364868, 2.0681049823760986, 2.174072265625, 2.2800393104553223, 2.3860065937042236, 2.491973876953125, 2.5979409217834473, 2.7039082050323486, 2.80987548828125, 2.9158425331115723, 3.0218098163604736, 3.127777099609375, 3.2337441444396973]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 8.0, 13.0, 28.0, 41.0, 53.0, 78.0, 95.0, 106.0, 129.0, 100.0, 96.0, 94.0, 70.0, 35.0, 19.0, 21.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.502690315246582, -1.4595664739608765, -1.4164427518844604, -1.3733189105987549, -1.3301951885223389, -1.2870713472366333, -1.2439475059509277, -1.2008237838745117, -1.1576999425888062, -1.1145761013031006, -1.0714523792266846, -1.028328537940979, -0.9852047562599182, -0.9420809745788574, -0.8989571928977966, -0.8558334112167358, -0.812709629535675, -0.7695858478546143, -0.7264620661735535, -0.6833382844924927, -0.6402144432067871, -0.5970906615257263, -0.5539668798446655, -0.51084303855896, -0.46771928668022156, -0.42459550499916077, -0.3814716935157776, -0.3383479118347168, -0.295224130153656, -0.2521003186702728, -0.20897653698921204, -0.16585272550582886, -0.12272894382476807, -0.07960514724254608, -0.036481358110904694, 0.006642431020736694, 0.04976622760295868, 0.09289002418518066, 0.13601380586624146, 0.17913761734962463, 0.22226139903068542, 0.2653851807117462, 0.3085089921951294, 0.3516327738761902, 0.394756555557251, 0.43788036704063416, 0.48100414872169495, 0.5241279602050781, 0.5672517418861389, 0.6103755235671997, 0.6534993052482605, 0.6966230869293213, 0.7397469282150269, 0.7828707098960876, 0.8259944915771484, 0.869118332862854, 0.91224205493927, 0.9553658366203308, 0.9984896183013916, 1.0416134595870972, 1.0847371816635132, 1.1278610229492188, 1.1709847450256348, 1.2141085863113403, 1.257232427597046]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 7.0, 11.0, 12.0, 18.0, 20.0, 23.0, 40.0, 40.0, 53.0, 90.0, 102.0, 178.0, 303.0, 487.0, 975.0, 2264.0, 6958.0, 27766.0, 171432.0, 717394.0, 93601.0, 18000.0, 4936.0, 1749.0, 762.0, 403.0, 274.0, 177.0, 142.0, 90.0, 67.0, 38.0, 40.0, 28.0, 23.0, 11.0, 8.0, 11.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.34521484375, -0.33516693115234375, -0.3251190185546875, -0.31507110595703125, -0.305023193359375, -0.29497528076171875, -0.2849273681640625, -0.27487945556640625, -0.26483154296875, -0.25478363037109375, -0.2447357177734375, -0.23468780517578125, -0.224639892578125, -0.21459197998046875, -0.2045440673828125, -0.19449615478515625, -0.1844482421875, -0.17440032958984375, -0.1643524169921875, -0.15430450439453125, -0.144256591796875, -0.13420867919921875, -0.1241607666015625, -0.11411285400390625, -0.10406494140625, -0.09401702880859375, -0.0839691162109375, -0.07392120361328125, -0.063873291015625, -0.05382537841796875, -0.0437774658203125, -0.03372955322265625, -0.023681640625, -0.01363372802734375, -0.0035858154296875, 0.00646209716796875, 0.016510009765625, 0.02655792236328125, 0.0366058349609375, 0.04665374755859375, 0.05670166015625, 0.06674957275390625, 0.0767974853515625, 0.08684539794921875, 0.096893310546875, 0.10694122314453125, 0.1169891357421875, 0.12703704833984375, 0.1370849609375, 0.14713287353515625, 0.1571807861328125, 0.16722869873046875, 0.177276611328125, 0.18732452392578125, 0.1973724365234375, 0.20742034912109375, 0.21746826171875, 0.22751617431640625, 0.2375640869140625, 0.24761199951171875, 0.257659912109375, 0.26770782470703125, 0.2777557373046875, 0.28780364990234375, 0.2978515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 8.0, 17.0, 28.0, 38.0, 57.0, 83.0, 80.0, 95.0, 124.0, 112.0, 93.0, 84.0, 52.0, 45.0, 37.0, 22.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.14599609375, -0.14256668090820312, -0.13913726806640625, -0.13570785522460938, -0.1322784423828125, -0.12884902954101562, -0.12541961669921875, -0.12199020385742188, -0.118560791015625, -0.11513137817382812, -0.11170196533203125, -0.10827255249023438, -0.1048431396484375, -0.10141372680664062, -0.09798431396484375, -0.09455490112304688, -0.09112548828125, -0.08769607543945312, -0.08426666259765625, -0.08083724975585938, -0.0774078369140625, -0.07397842407226562, -0.07054901123046875, -0.06711959838867188, -0.063690185546875, -0.060260772705078125, -0.05683135986328125, -0.053401947021484375, -0.0499725341796875, -0.046543121337890625, -0.04311370849609375, -0.039684295654296875, -0.0362548828125, -0.032825469970703125, -0.02939605712890625, -0.025966644287109375, -0.0225372314453125, -0.019107818603515625, -0.01567840576171875, -0.012248992919921875, -0.008819580078125, -0.005390167236328125, -0.00196075439453125, 0.001468658447265625, 0.0048980712890625, 0.008327484130859375, 0.01175689697265625, 0.015186309814453125, 0.01861572265625, 0.022045135498046875, 0.02547454833984375, 0.028903961181640625, 0.0323333740234375, 0.035762786865234375, 0.03919219970703125, 0.042621612548828125, 0.046051025390625, 0.049480438232421875, 0.05290985107421875, 0.056339263916015625, 0.0597686767578125, 0.06319808959960938, 0.06662750244140625, 0.07005691528320312, 0.073486328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 2.0, 13.0, 14.0, 8.0, 13.0, 31.0, 35.0, 32.0, 57.0, 89.0, 178.0, 338.0, 1403.0, 8092.0, 109582.0, 876361.0, 46058.0, 4629.0, 899.0, 292.0, 122.0, 81.0, 51.0, 47.0, 30.0, 19.0, 17.0, 19.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.399658203125, -0.3864936828613281, -0.37332916259765625, -0.3601646423339844, -0.3470001220703125, -0.3338356018066406, -0.32067108154296875, -0.3075065612792969, -0.294342041015625, -0.2811775207519531, -0.26801300048828125, -0.2548484802246094, -0.2416839599609375, -0.22851943969726562, -0.21535491943359375, -0.20219039916992188, -0.18902587890625, -0.17586135864257812, -0.16269683837890625, -0.14953231811523438, -0.1363677978515625, -0.12320327758789062, -0.11003875732421875, -0.09687423706054688, -0.083709716796875, -0.07054519653320312, -0.05738067626953125, -0.044216156005859375, -0.0310516357421875, -0.017887115478515625, -0.00472259521484375, 0.008441925048828125, 0.0216064453125, 0.034770965576171875, 0.04793548583984375, 0.061100006103515625, 0.0742645263671875, 0.08742904663085938, 0.10059356689453125, 0.11375808715820312, 0.126922607421875, 0.14008712768554688, 0.15325164794921875, 0.16641616821289062, 0.1795806884765625, 0.19274520874023438, 0.20590972900390625, 0.21907424926757812, 0.23223876953125, 0.24540328979492188, 0.25856781005859375, 0.2717323303222656, 0.2848968505859375, 0.2980613708496094, 0.31122589111328125, 0.3243904113769531, 0.337554931640625, 0.3507194519042969, 0.36388397216796875, 0.3770484924316406, 0.3902130126953125, 0.4033775329589844, 0.41654205322265625, 0.4297065734863281, 0.44287109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 10.0, 14.0, 18.0, 24.0, 21.0, 28.0, 41.0, 47.0, 44.0, 64.0, 65.0, 58.0, 64.0, 69.0, 51.0, 63.0, 57.0, 37.0, 38.0, 28.0, 29.0, 24.0, 21.0, 11.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2578125, -0.24934005737304688, -0.24086761474609375, -0.23239517211914062, -0.2239227294921875, -0.21545028686523438, -0.20697784423828125, -0.19850540161132812, -0.190032958984375, -0.18156051635742188, -0.17308807373046875, -0.16461563110351562, -0.1561431884765625, -0.14767074584960938, -0.13919830322265625, -0.13072586059570312, -0.12225341796875, -0.11378097534179688, -0.10530853271484375, -0.09683609008789062, -0.0883636474609375, -0.07989120483398438, -0.07141876220703125, -0.06294631958007812, -0.054473876953125, -0.046001434326171875, -0.03752899169921875, -0.029056549072265625, -0.0205841064453125, -0.012111663818359375, -0.00363922119140625, 0.004833221435546875, 0.0133056640625, 0.021778106689453125, 0.03025054931640625, 0.038722991943359375, 0.0471954345703125, 0.055667877197265625, 0.06414031982421875, 0.07261276245117188, 0.081085205078125, 0.08955764770507812, 0.09803009033203125, 0.10650253295898438, 0.1149749755859375, 0.12344741821289062, 0.13191986083984375, 0.14039230346679688, 0.14886474609375, 0.15733718872070312, 0.16580963134765625, 0.17428207397460938, 0.1827545166015625, 0.19122695922851562, 0.19969940185546875, 0.20817184448242188, 0.216644287109375, 0.22511672973632812, 0.23358917236328125, 0.24206161499023438, 0.2505340576171875, 0.2590065002441406, 0.26747894287109375, 0.2759513854980469, 0.284423828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 27.0, 41.0, 75.0, 133.0, 370.0, 992.0, 3711.0, 27125.0, 937379.0, 70653.0, 5676.0, 1451.0, 464.0, 158.0, 76.0, 50.0, 35.0, 10.0, 17.0, 7.0, 6.0, 11.0, 4.0, 9.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1434326171875, -0.13916778564453125, -0.1349029541015625, -0.13063812255859375, -0.126373291015625, -0.12210845947265625, -0.1178436279296875, -0.11357879638671875, -0.10931396484375, -0.10504913330078125, -0.1007843017578125, -0.09651947021484375, -0.092254638671875, -0.08798980712890625, -0.0837249755859375, -0.07946014404296875, -0.0751953125, -0.07093048095703125, -0.0666656494140625, -0.06240081787109375, -0.058135986328125, -0.05387115478515625, -0.0496063232421875, -0.04534149169921875, -0.04107666015625, -0.03681182861328125, -0.0325469970703125, -0.02828216552734375, -0.024017333984375, -0.01975250244140625, -0.0154876708984375, -0.01122283935546875, -0.0069580078125, -0.00269317626953125, 0.0015716552734375, 0.00583648681640625, 0.010101318359375, 0.01436614990234375, 0.0186309814453125, 0.02289581298828125, 0.02716064453125, 0.03142547607421875, 0.0356903076171875, 0.03995513916015625, 0.044219970703125, 0.04848480224609375, 0.0527496337890625, 0.05701446533203125, 0.061279296875, 0.06554412841796875, 0.0698089599609375, 0.07407379150390625, 0.078338623046875, 0.08260345458984375, 0.0868682861328125, 0.09113311767578125, 0.09539794921875, 0.09966278076171875, 0.1039276123046875, 0.10819244384765625, 0.112457275390625, 0.11672210693359375, 0.1209869384765625, 0.12525177001953125, 0.1295166015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 11.0, 24.0, 29.0, 37.0, 50.0, 54.0, 68.0, 96.0, 102.0, 89.0, 85.0, 77.0, 56.0, 50.0, 30.0, 23.0, 35.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.361002594232559e-05, -8.98856669664383e-05, -8.6161307990551e-05, -8.24369490146637e-05, -7.87125900387764e-05, -7.49882310628891e-05, -7.12638720870018e-05, -6.75395131111145e-05, -6.38151541352272e-05, -6.0090795159339905e-05, -5.6366436183452606e-05, -5.264207720756531e-05, -4.891771823167801e-05, -4.519335925579071e-05, -4.146900027990341e-05, -3.774464130401611e-05, -3.4020282328128815e-05, -3.0295923352241516e-05, -2.6571564376354218e-05, -2.284720540046692e-05, -1.912284642457962e-05, -1.5398487448692322e-05, -1.1674128472805023e-05, -7.949769496917725e-06, -4.225410521030426e-06, -5.010515451431274e-07, 3.223307430744171e-06, 6.94766640663147e-06, 1.0672025382518768e-05, 1.4396384358406067e-05, 1.8120743334293365e-05, 2.1845102310180664e-05, 2.5569461286067963e-05, 2.929382026195526e-05, 3.301817923784256e-05, 3.674253821372986e-05, 4.046689718961716e-05, 4.4191256165504456e-05, 4.7915615141391754e-05, 5.163997411727905e-05, 5.536433309316635e-05, 5.908869206905365e-05, 6.281305104494095e-05, 6.653741002082825e-05, 7.026176899671555e-05, 7.398612797260284e-05, 7.771048694849014e-05, 8.143484592437744e-05, 8.515920490026474e-05, 8.888356387615204e-05, 9.260792285203934e-05, 9.633228182792664e-05, 0.00010005664080381393, 0.00010378099977970123, 0.00010750535875558853, 0.00011122971773147583, 0.00011495407670736313, 0.00011867843568325043, 0.00012240279465913773, 0.00012612715363502502, 0.00012985151261091232, 0.00013357587158679962, 0.00013730023056268692, 0.00014102458953857422]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 3.0, 10.0, 12.0, 28.0, 47.0, 86.0, 139.0, 281.0, 809.0, 3284.0, 21482.0, 757184.0, 251412.0, 10706.0, 1973.0, 537.0, 249.0, 110.0, 73.0, 40.0, 21.0, 13.0, 16.0, 7.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.1130533218383789, -0.10971260070800781, -0.10637187957763672, -0.10303115844726562, -0.09969043731689453, -0.09634971618652344, -0.09300899505615234, -0.08966827392578125, -0.08632755279541016, -0.08298683166503906, -0.07964611053466797, -0.07630538940429688, -0.07296466827392578, -0.06962394714355469, -0.0662832260131836, -0.0629425048828125, -0.059601783752441406, -0.05626106262207031, -0.05292034149169922, -0.049579620361328125, -0.04623889923095703, -0.04289817810058594, -0.039557456970214844, -0.03621673583984375, -0.032876014709472656, -0.029535293579101562, -0.02619457244873047, -0.022853851318359375, -0.01951313018798828, -0.016172409057617188, -0.012831687927246094, -0.009490966796875, -0.006150245666503906, -0.0028095245361328125, 0.0005311965942382812, 0.003871917724609375, 0.007212638854980469, 0.010553359985351562, 0.013894081115722656, 0.01723480224609375, 0.020575523376464844, 0.023916244506835938, 0.02725696563720703, 0.030597686767578125, 0.03393840789794922, 0.03727912902832031, 0.040619850158691406, 0.0439605712890625, 0.047301292419433594, 0.05064201354980469, 0.05398273468017578, 0.057323455810546875, 0.06066417694091797, 0.06400489807128906, 0.06734561920166016, 0.07068634033203125, 0.07402706146240234, 0.07736778259277344, 0.08070850372314453, 0.08404922485351562, 0.08738994598388672, 0.09073066711425781, 0.0940713882446289, 0.097412109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 7.0, 18.0, 25.0, 31.0, 59.0, 85.0, 123.0, 142.0, 137.0, 123.0, 78.0, 48.0, 34.0, 16.0, 17.0, 8.0, 6.0, 8.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07315254211425781, -0.07092666625976562, -0.06870079040527344, -0.06647491455078125, -0.06424903869628906, -0.062023162841796875, -0.05979728698730469, -0.0575714111328125, -0.05534553527832031, -0.053119659423828125, -0.05089378356933594, -0.04866790771484375, -0.04644203186035156, -0.044216156005859375, -0.04199028015136719, -0.039764404296875, -0.03753852844238281, -0.035312652587890625, -0.03308677673339844, -0.03086090087890625, -0.028635025024414062, -0.026409149169921875, -0.024183273315429688, -0.0219573974609375, -0.019731521606445312, -0.017505645751953125, -0.015279769897460938, -0.01305389404296875, -0.010828018188476562, -0.008602142333984375, -0.0063762664794921875, -0.004150390625, -0.0019245147705078125, 0.000301361083984375, 0.0025272369384765625, 0.00475311279296875, 0.0069789886474609375, 0.009204864501953125, 0.011430740356445312, 0.0136566162109375, 0.015882492065429688, 0.018108367919921875, 0.020334243774414062, 0.02256011962890625, 0.024785995483398438, 0.027011871337890625, 0.029237747192382812, 0.031463623046875, 0.03368949890136719, 0.035915374755859375, 0.03814125061035156, 0.04036712646484375, 0.04259300231933594, 0.044818878173828125, 0.04704475402832031, 0.0492706298828125, 0.05149650573730469, 0.053722381591796875, 0.05594825744628906, 0.05817413330078125, 0.06040000915527344, 0.06262588500976562, 0.06485176086425781, 0.06707763671875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 13.0, 31.0, 74.0, 333.0, 378.0, 108.0, 36.0, 20.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3696460723876953, -3.2929718494415283, -3.2162978649139404, -3.1396236419677734, -3.0629496574401855, -2.9862754344940186, -2.9096014499664307, -2.8329272270202637, -2.756253242492676, -2.679579019546509, -2.602905035018921, -2.526230812072754, -2.449556827545166, -2.372882604598999, -2.296208620071411, -2.219534397125244, -2.142860174179077, -2.06618595123291, -1.9895119667053223, -1.9128378629684448, -1.8361637592315674, -1.7594895362854004, -1.682815432548523, -1.6061413288116455, -1.529467225074768, -1.4527931213378906, -1.3761190176010132, -1.2994449138641357, -1.2227706909179688, -1.1460967063903809, -1.0694224834442139, -0.9927483797073364, -0.9160740375518799, -0.8393999338150024, -0.762725830078125, -0.6860516667366028, -0.6093775629997253, -0.5327034592628479, -0.45602932572364807, -0.37935519218444824, -0.3026810884475708, -0.22600696980953217, -0.14933285117149353, -0.0726587325334549, 0.00401538610458374, 0.08068948984146118, 0.157363623380661, 0.23403775691986084, 0.3107118606567383, 0.3873859643936157, 0.46406009793281555, 0.5407342314720154, 0.6174083352088928, 0.6940824389457703, 0.7707566022872925, 0.8474307060241699, 0.9241048097610474, 1.0007789134979248, 1.0774530172348022, 1.1541271209716797, 1.2308013439178467, 1.3074753284454346, 1.3841495513916016, 1.460823655128479, 1.5374977588653564]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 9.0, 14.0, 7.0, 15.0, 25.0, 17.0, 27.0, 27.0, 26.0, 32.0, 43.0, 52.0, 40.0, 56.0, 59.0, 45.0, 73.0, 59.0, 60.0, 42.0, 44.0, 37.0, 35.0, 23.0, 22.0, 20.0, 14.0, 18.0, 6.0, 16.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.36531400680542, -1.323684573173523, -1.282055139541626, -1.2404258251190186, -1.1987963914871216, -1.1571669578552246, -1.1155375242233276, -1.0739080905914307, -1.0322786569595337, -0.9906492233276367, -0.9490198493003845, -0.9073904156684875, -0.8657609820365906, -0.8241316080093384, -0.7825021743774414, -0.7408727407455444, -0.6992433667182922, -0.6576139330863953, -0.6159845590591431, -0.5743551254272461, -0.5327256917953491, -0.49109628796577454, -0.44946688413619995, -0.407837450504303, -0.3662080466747284, -0.3245786428451538, -0.28294920921325684, -0.24131980538368225, -0.19969038665294647, -0.1580609679222107, -0.11643156409263611, -0.07480213046073914, -0.03317272663116455, 0.00845668837428093, 0.05008610337972641, 0.09171551465988159, 0.13334493339061737, 0.17497435212135315, 0.21660375595092773, 0.2582331895828247, 0.2998625934123993, 0.3414919972419739, 0.38312143087387085, 0.42475083470344543, 0.46638023853302, 0.508009672164917, 0.549639105796814, 0.5912685394287109, 0.6328979134559631, 0.6745273470878601, 0.7161567211151123, 0.7577861547470093, 0.7994155883789062, 0.8410450220108032, 0.8826743960380554, 0.9243038296699524, 0.9659332036972046, 1.0075626373291016, 1.0491920709609985, 1.0908215045928955, 1.132450819015503, 1.1740802526474, 1.2157096862792969, 1.2573391199111938, 1.2989685535430908]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 6.0, 4.0, 10.0, 14.0, 21.0, 26.0, 24.0, 39.0, 51.0, 65.0, 81.0, 115.0, 165.0, 265.0, 403.0, 747.0, 1616.0, 4115.0, 13727.0, 88205.0, 3905189.0, 153854.0, 18077.0, 4543.0, 1523.0, 671.0, 337.0, 172.0, 85.0, 46.0, 29.0, 13.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.548828125, -0.5362358093261719, -0.5236434936523438, -0.5110511779785156, -0.4984588623046875, -0.4858665466308594, -0.47327423095703125, -0.4606819152832031, -0.448089599609375, -0.4354972839355469, -0.42290496826171875, -0.4103126525878906, -0.3977203369140625, -0.3851280212402344, -0.37253570556640625, -0.3599433898925781, -0.34735107421875, -0.3347587585449219, -0.32216644287109375, -0.3095741271972656, -0.2969818115234375, -0.2843894958496094, -0.27179718017578125, -0.2592048645019531, -0.246612548828125, -0.23402023315429688, -0.22142791748046875, -0.20883560180664062, -0.1962432861328125, -0.18365097045898438, -0.17105865478515625, -0.15846633911132812, -0.1458740234375, -0.13328170776367188, -0.12068939208984375, -0.10809707641601562, -0.0955047607421875, -0.08291244506835938, -0.07032012939453125, -0.057727813720703125, -0.045135498046875, -0.032543182373046875, -0.01995086669921875, -0.007358551025390625, 0.0052337646484375, 0.017826080322265625, 0.03041839599609375, 0.043010711669921875, 0.05560302734375, 0.06819534301757812, 0.08078765869140625, 0.09337997436523438, 0.1059722900390625, 0.11856460571289062, 0.13115692138671875, 0.14374923706054688, 0.156341552734375, 0.16893386840820312, 0.18152618408203125, 0.19411849975585938, 0.2067108154296875, 0.21930313110351562, 0.23189544677734375, 0.24448776245117188, 0.257080078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 10.0, 23.0, 21.0, 50.0, 63.0, 70.0, 99.0, 97.0, 113.0, 89.0, 80.0, 79.0, 77.0, 46.0, 32.0, 16.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.1444253921508789, -0.1410236358642578, -0.13762187957763672, -0.13422012329101562, -0.13081836700439453, -0.12741661071777344, -0.12401485443115234, -0.12061309814453125, -0.11721134185791016, -0.11380958557128906, -0.11040782928466797, -0.10700607299804688, -0.10360431671142578, -0.10020256042480469, -0.0968008041381836, -0.0933990478515625, -0.0899972915649414, -0.08659553527832031, -0.08319377899169922, -0.07979202270507812, -0.07639026641845703, -0.07298851013183594, -0.06958675384521484, -0.06618499755859375, -0.06278324127197266, -0.05938148498535156, -0.05597972869873047, -0.052577972412109375, -0.04917621612548828, -0.04577445983886719, -0.042372703552246094, -0.038970947265625, -0.035569190979003906, -0.03216743469238281, -0.02876567840576172, -0.025363922119140625, -0.02196216583251953, -0.018560409545898438, -0.015158653259277344, -0.01175689697265625, -0.008355140686035156, -0.0049533843994140625, -0.0015516281127929688, 0.001850128173828125, 0.005251884460449219, 0.008653640747070312, 0.012055397033691406, 0.0154571533203125, 0.018858909606933594, 0.022260665893554688, 0.02566242218017578, 0.029064178466796875, 0.03246593475341797, 0.03586769104003906, 0.039269447326660156, 0.04267120361328125, 0.046072959899902344, 0.04947471618652344, 0.05287647247314453, 0.056278228759765625, 0.05967998504638672, 0.06308174133300781, 0.0664834976196289, 0.06988525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 17.0, 61.0, 107.0, 275.0, 898.0, 4101483.0, 90266.0, 759.0, 271.0, 92.0, 26.0, 13.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9515228271484375, -1.897186279296875, -1.8428497314453125, -1.78851318359375, -1.7341766357421875, -1.679840087890625, -1.6255035400390625, -1.5711669921875, -1.5168304443359375, -1.462493896484375, -1.4081573486328125, -1.35382080078125, -1.2994842529296875, -1.245147705078125, -1.1908111572265625, -1.136474609375, -1.0821380615234375, -1.027801513671875, -0.9734649658203125, -0.91912841796875, -0.8647918701171875, -0.810455322265625, -0.7561187744140625, -0.7017822265625, -0.6474456787109375, -0.593109130859375, -0.5387725830078125, -0.48443603515625, -0.4300994873046875, -0.375762939453125, -0.3214263916015625, -0.26708984375, -0.2127532958984375, -0.158416748046875, -0.1040802001953125, -0.04974365234375, 0.0045928955078125, 0.058929443359375, 0.1132659912109375, 0.1676025390625, 0.2219390869140625, 0.276275634765625, 0.3306121826171875, 0.38494873046875, 0.4392852783203125, 0.493621826171875, 0.5479583740234375, 0.602294921875, 0.6566314697265625, 0.710968017578125, 0.7653045654296875, 0.81964111328125, 0.8739776611328125, 0.928314208984375, 0.9826507568359375, 1.0369873046875, 1.0913238525390625, 1.145660400390625, 1.1999969482421875, 1.25433349609375, 1.3086700439453125, 1.363006591796875, 1.4173431396484375, 1.4716796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 22.0, 77.0, 735.0, 3081.0, 125.0, 23.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.32141876220703125, -0.3122711181640625, -0.30312347412109375, -0.293975830078125, -0.28482818603515625, -0.2756805419921875, -0.26653289794921875, -0.25738525390625, -0.24823760986328125, -0.2390899658203125, -0.22994232177734375, -0.220794677734375, -0.21164703369140625, -0.2024993896484375, -0.19335174560546875, -0.1842041015625, -0.17505645751953125, -0.1659088134765625, -0.15676116943359375, -0.147613525390625, -0.13846588134765625, -0.1293182373046875, -0.12017059326171875, -0.11102294921875, -0.10187530517578125, -0.0927276611328125, -0.08358001708984375, -0.074432373046875, -0.06528472900390625, -0.0561370849609375, -0.04698944091796875, -0.037841796875, -0.02869415283203125, -0.0195465087890625, -0.01039886474609375, -0.001251220703125, 0.00789642333984375, 0.0170440673828125, 0.02619171142578125, 0.03533935546875, 0.04448699951171875, 0.0536346435546875, 0.06278228759765625, 0.071929931640625, 0.08107757568359375, 0.0902252197265625, 0.09937286376953125, 0.1085205078125, 0.11766815185546875, 0.1268157958984375, 0.13596343994140625, 0.145111083984375, 0.15425872802734375, 0.1634063720703125, 0.17255401611328125, 0.18170166015625, 0.19084930419921875, 0.1999969482421875, 0.20914459228515625, 0.218292236328125, 0.22743988037109375, 0.2365875244140625, 0.24573516845703125, 0.2548828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 26.0, 779.0, 192.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.393536329269409, -3.316080093383789, -3.23862361907959, -3.1611673831939697, -3.0837111473083496, -3.0062546730041504, -2.9287984371185303, -2.85134220123291, -2.773885726928711, -2.696429491043091, -2.6189730167388916, -2.5415167808532715, -2.4640605449676514, -2.3866043090820312, -2.309147834777832, -2.231691598892212, -2.154235363006592, -2.0767791271209717, -1.999322772026062, -1.9218664169311523, -1.8444101810455322, -1.7669538259506226, -1.689497470855713, -1.6120412349700928, -1.534584879875183, -1.4571285247802734, -1.3796722888946533, -1.3022159337997437, -1.224759578704834, -1.1473033428192139, -1.0698469877243042, -0.9923906922340393, -0.9149341583251953, -0.8374778628349304, -0.7600215673446655, -0.6825652122497559, -0.605108916759491, -0.5276526212692261, -0.4501962959766388, -0.3727399706840515, -0.2952836751937866, -0.21782736480236053, -0.14037105441093445, -0.06291474401950836, 0.014541566371917725, 0.09199786186218262, 0.1694541871547699, 0.24691051244735718, 0.32436680793762207, 0.40182310342788696, 0.47927942872047424, 0.5567357540130615, 0.6341920495033264, 0.7116483449935913, 0.789104700088501, 0.8665609955787659, 0.9440172910690308, 1.0214736461639404, 1.0989298820495605, 1.1763862371444702, 1.2538425922393799, 1.331298828125, 1.4087551832199097, 1.4862115383148193, 1.5636677742004395]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 17.0, 20.0, 28.0, 30.0, 42.0, 61.0, 59.0, 81.0, 74.0, 91.0, 79.0, 81.0, 63.0, 47.0, 41.0, 31.0, 48.0, 29.0, 16.0, 8.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4426233172416687, -0.4294520616531372, -0.4162808060646057, -0.4031095504760742, -0.3899383246898651, -0.3767670691013336, -0.3635958135128021, -0.35042455792427063, -0.3372533321380615, -0.32408207654953003, -0.31091082096099854, -0.29773956537246704, -0.28456833958625793, -0.27139708399772644, -0.25822582840919495, -0.24505457282066345, -0.23188331723213196, -0.21871206164360046, -0.20554082095623016, -0.19236956536769867, -0.17919832468032837, -0.16602706909179688, -0.15285581350326538, -0.1396845579147339, -0.1265133172273636, -0.11334206908941269, -0.10017082095146179, -0.0869995653629303, -0.0738283172249794, -0.0606570690870285, -0.04748581349849701, -0.03431456536054611, -0.021143317222595215, -0.007972067221999168, 0.005199182778596878, 0.018370434641838074, 0.03154168277978897, 0.04471293091773987, 0.05788418650627136, 0.07105543464422226, 0.08422668278217316, 0.09739793092012405, 0.11056917905807495, 0.12374043464660645, 0.13691169023513794, 0.15008293092250824, 0.16325418651103973, 0.17642542719841003, 0.18959668278694153, 0.20276793837547302, 0.21593917906284332, 0.22911043465137482, 0.24228167533874512, 0.2554529309272766, 0.2686241865158081, 0.2817954421043396, 0.2949666976928711, 0.3081379532814026, 0.3213092088699341, 0.3344804644584656, 0.3476516902446747, 0.3608229458332062, 0.37399420142173767, 0.38716545701026917, 0.40033668279647827]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 7.0, 14.0, 15.0, 20.0, 40.0, 64.0, 87.0, 136.0, 163.0, 290.0, 463.0, 783.0, 1835.0, 5165.0, 20206.0, 120450.0, 722843.0, 143078.0, 23003.0, 5635.0, 2030.0, 902.0, 472.0, 261.0, 184.0, 113.0, 74.0, 64.0, 26.0, 32.0, 16.0, 22.0, 16.0, 8.0, 5.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0], "bins": [-0.37255859375, -0.36313629150390625, -0.3537139892578125, -0.34429168701171875, -0.334869384765625, -0.32544708251953125, -0.3160247802734375, -0.30660247802734375, -0.29718017578125, -0.28775787353515625, -0.2783355712890625, -0.26891326904296875, -0.259490966796875, -0.25006866455078125, -0.2406463623046875, -0.23122406005859375, -0.2218017578125, -0.21237945556640625, -0.2029571533203125, -0.19353485107421875, -0.184112548828125, -0.17469024658203125, -0.1652679443359375, -0.15584564208984375, -0.14642333984375, -0.13700103759765625, -0.1275787353515625, -0.11815643310546875, -0.108734130859375, -0.09931182861328125, -0.0898895263671875, -0.08046722412109375, -0.071044921875, -0.06162261962890625, -0.0522003173828125, -0.04277801513671875, -0.033355712890625, -0.02393341064453125, -0.0145111083984375, -0.00508880615234375, 0.00433349609375, 0.01375579833984375, 0.0231781005859375, 0.03260040283203125, 0.042022705078125, 0.05144500732421875, 0.0608673095703125, 0.07028961181640625, 0.0797119140625, 0.08913421630859375, 0.0985565185546875, 0.10797882080078125, 0.117401123046875, 0.12682342529296875, 0.1362457275390625, 0.14566802978515625, 0.15509033203125, 0.16451263427734375, 0.1739349365234375, 0.18335723876953125, 0.192779541015625, 0.20220184326171875, 0.2116241455078125, 0.22104644775390625, 0.23046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 8.0, 15.0, 25.0, 43.0, 41.0, 56.0, 74.0, 86.0, 86.0, 95.0, 95.0, 68.0, 66.0, 73.0, 54.0, 32.0, 30.0, 17.0, 17.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.1339111328125, -0.13083744049072266, -0.1277637481689453, -0.12469005584716797, -0.12161636352539062, -0.11854267120361328, -0.11546897888183594, -0.1123952865600586, -0.10932159423828125, -0.1062479019165039, -0.10317420959472656, -0.10010051727294922, -0.09702682495117188, -0.09395313262939453, -0.09087944030761719, -0.08780574798583984, -0.0847320556640625, -0.08165836334228516, -0.07858467102050781, -0.07551097869873047, -0.07243728637695312, -0.06936359405517578, -0.06628990173339844, -0.0632162094116211, -0.06014251708984375, -0.057068824768066406, -0.05399513244628906, -0.05092144012451172, -0.047847747802734375, -0.04477405548095703, -0.04170036315917969, -0.038626670837402344, -0.035552978515625, -0.032479286193847656, -0.029405593872070312, -0.02633190155029297, -0.023258209228515625, -0.02018451690673828, -0.017110824584960938, -0.014037132263183594, -0.01096343994140625, -0.007889747619628906, -0.0048160552978515625, -0.0017423629760742188, 0.001331329345703125, 0.004405021667480469, 0.0074787139892578125, 0.010552406311035156, 0.0136260986328125, 0.016699790954589844, 0.019773483276367188, 0.02284717559814453, 0.025920867919921875, 0.02899456024169922, 0.03206825256347656, 0.035141944885253906, 0.03821563720703125, 0.041289329528808594, 0.04436302185058594, 0.04743671417236328, 0.050510406494140625, 0.05358409881591797, 0.05665779113769531, 0.059731483459472656, 0.06280517578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 10.0, 13.0, 26.0, 41.0, 52.0, 101.0, 212.0, 493.0, 1785.0, 10293.0, 232058.0, 778949.0, 20526.0, 2649.0, 745.0, 265.0, 126.0, 59.0, 45.0, 28.0, 12.0, 12.0, 10.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65625, -0.6394844055175781, -0.6227188110351562, -0.6059532165527344, -0.5891876220703125, -0.5724220275878906, -0.5556564331054688, -0.5388908386230469, -0.522125244140625, -0.5053596496582031, -0.48859405517578125, -0.4718284606933594, -0.4550628662109375, -0.4382972717285156, -0.42153167724609375, -0.4047660827636719, -0.38800048828125, -0.3712348937988281, -0.35446929931640625, -0.3377037048339844, -0.3209381103515625, -0.3041725158691406, -0.28740692138671875, -0.2706413269042969, -0.253875732421875, -0.23711013793945312, -0.22034454345703125, -0.20357894897460938, -0.1868133544921875, -0.17004776000976562, -0.15328216552734375, -0.13651657104492188, -0.1197509765625, -0.10298538208007812, -0.08621978759765625, -0.06945419311523438, -0.0526885986328125, -0.035923004150390625, -0.01915740966796875, -0.002391815185546875, 0.014373779296875, 0.031139373779296875, 0.04790496826171875, 0.06467056274414062, 0.0814361572265625, 0.09820175170898438, 0.11496734619140625, 0.13173294067382812, 0.14849853515625, 0.16526412963867188, 0.18202972412109375, 0.19879531860351562, 0.2155609130859375, 0.23232650756835938, 0.24909210205078125, 0.2658576965332031, 0.282623291015625, 0.2993888854980469, 0.31615447998046875, 0.3329200744628906, 0.3496856689453125, 0.3664512634277344, 0.38321685791015625, 0.3999824523925781, 0.416748046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 5.0, 12.0, 21.0, 30.0, 36.0, 36.0, 53.0, 67.0, 85.0, 95.0, 102.0, 81.0, 74.0, 69.0, 60.0, 42.0, 21.0, 30.0, 19.0, 9.0, 7.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5166015625, -0.5034751892089844, -0.49034881591796875, -0.4772224426269531, -0.4640960693359375, -0.4509696960449219, -0.43784332275390625, -0.4247169494628906, -0.411590576171875, -0.3984642028808594, -0.38533782958984375, -0.3722114562988281, -0.3590850830078125, -0.3459587097167969, -0.33283233642578125, -0.3197059631347656, -0.30657958984375, -0.2934532165527344, -0.28032684326171875, -0.2672004699707031, -0.2540740966796875, -0.24094772338867188, -0.22782135009765625, -0.21469497680664062, -0.201568603515625, -0.18844223022460938, -0.17531585693359375, -0.16218948364257812, -0.1490631103515625, -0.13593673706054688, -0.12281036376953125, -0.10968399047851562, -0.0965576171875, -0.08343124389648438, -0.07030487060546875, -0.057178497314453125, -0.0440521240234375, -0.030925750732421875, -0.01779937744140625, -0.004673004150390625, 0.008453369140625, 0.021579742431640625, 0.03470611572265625, 0.047832489013671875, 0.0609588623046875, 0.07408523559570312, 0.08721160888671875, 0.10033798217773438, 0.11346435546875, 0.12659072875976562, 0.13971710205078125, 0.15284347534179688, 0.1659698486328125, 0.17909622192382812, 0.19222259521484375, 0.20534896850585938, 0.218475341796875, 0.23160171508789062, 0.24472808837890625, 0.2578544616699219, 0.2709808349609375, 0.2841072082519531, 0.29723358154296875, 0.3103599548339844, 0.323486328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 12.0, 8.0, 11.0, 27.0, 32.0, 45.0, 86.0, 145.0, 272.0, 579.0, 1224.0, 3774.0, 22868.0, 785909.0, 219029.0, 10277.0, 2364.0, 861.0, 429.0, 213.0, 132.0, 81.0, 57.0, 26.0, 21.0, 11.0, 8.0, 6.0, 7.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.0994415283203125, -0.095733642578125, -0.0920257568359375, -0.08831787109375, -0.0846099853515625, -0.080902099609375, -0.0771942138671875, -0.073486328125, -0.0697784423828125, -0.066070556640625, -0.0623626708984375, -0.05865478515625, -0.0549468994140625, -0.051239013671875, -0.0475311279296875, -0.0438232421875, -0.0401153564453125, -0.036407470703125, -0.0326995849609375, -0.02899169921875, -0.0252838134765625, -0.021575927734375, -0.0178680419921875, -0.01416015625, -0.0104522705078125, -0.006744384765625, -0.0030364990234375, 0.00067138671875, 0.0043792724609375, 0.008087158203125, 0.0117950439453125, 0.0155029296875, 0.0192108154296875, 0.022918701171875, 0.0266265869140625, 0.03033447265625, 0.0340423583984375, 0.037750244140625, 0.0414581298828125, 0.045166015625, 0.0488739013671875, 0.052581787109375, 0.0562896728515625, 0.05999755859375, 0.0637054443359375, 0.067413330078125, 0.0711212158203125, 0.0748291015625, 0.0785369873046875, 0.082244873046875, 0.0859527587890625, 0.08966064453125, 0.0933685302734375, 0.097076416015625, 0.1007843017578125, 0.1044921875, 0.1082000732421875, 0.111907958984375, 0.1156158447265625, 0.11932373046875, 0.1230316162109375, 0.126739501953125, 0.1304473876953125, 0.1341552734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 13.0, 17.0, 29.0, 40.0, 50.0, 75.0, 97.0, 95.0, 146.0, 111.0, 93.0, 69.0, 54.0, 39.0, 20.0, 17.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001747608184814453, -0.00017011724412441254, -0.00016547366976737976, -0.00016083009541034698, -0.0001561865210533142, -0.00015154294669628143, -0.00014689937233924866, -0.00014225579798221588, -0.0001376122236251831, -0.00013296864926815033, -0.00012832507491111755, -0.00012368150055408478, -0.000119037926197052, -0.00011439435184001923, -0.00010975077748298645, -0.00010510720312595367, -0.0001004636287689209, -9.582005441188812e-05, -9.117648005485535e-05, -8.653290569782257e-05, -8.18893313407898e-05, -7.724575698375702e-05, -7.260218262672424e-05, -6.795860826969147e-05, -6.331503391265869e-05, -5.8671459555625916e-05, -5.402788519859314e-05, -4.9384310841560364e-05, -4.474073648452759e-05, -4.009716212749481e-05, -3.5453587770462036e-05, -3.081001341342926e-05, -2.6166439056396484e-05, -2.152286469936371e-05, -1.6879290342330933e-05, -1.2235715985298157e-05, -7.592141628265381e-06, -2.948567271232605e-06, 1.695007085800171e-06, 6.338581442832947e-06, 1.0982155799865723e-05, 1.56257301568985e-05, 2.0269304513931274e-05, 2.491287887096405e-05, 2.9556453227996826e-05, 3.42000275850296e-05, 3.884360194206238e-05, 4.3487176299095154e-05, 4.813075065612793e-05, 5.2774325013160706e-05, 5.741789937019348e-05, 6.206147372722626e-05, 6.670504808425903e-05, 7.134862244129181e-05, 7.599219679832458e-05, 8.063577115535736e-05, 8.527934551239014e-05, 8.992291986942291e-05, 9.456649422645569e-05, 9.921006858348846e-05, 0.00010385364294052124, 0.00010849721729755402, 0.00011314079165458679, 0.00011778436601161957, 0.00012242794036865234]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 16.0, 33.0, 68.0, 160.0, 449.0, 1396.0, 10040.0, 781470.0, 248022.0, 5270.0, 982.0, 353.0, 131.0, 61.0, 29.0, 20.0, 13.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0999755859375, -0.09494590759277344, -0.08991622924804688, -0.08488655090332031, -0.07985687255859375, -0.07482719421386719, -0.06979751586914062, -0.06476783752441406, -0.0597381591796875, -0.05470848083496094, -0.049678802490234375, -0.04464912414550781, -0.03961944580078125, -0.03458976745605469, -0.029560089111328125, -0.024530410766601562, -0.019500732421875, -0.014471054077148438, -0.009441375732421875, -0.0044116973876953125, 0.00061798095703125, 0.0056476593017578125, 0.010677337646484375, 0.015707015991210938, 0.0207366943359375, 0.025766372680664062, 0.030796051025390625, 0.03582572937011719, 0.04085540771484375, 0.04588508605957031, 0.050914764404296875, 0.05594444274902344, 0.06097412109375, 0.06600379943847656, 0.07103347778320312, 0.07606315612792969, 0.08109283447265625, 0.08612251281738281, 0.09115219116210938, 0.09618186950683594, 0.1012115478515625, 0.10624122619628906, 0.11127090454101562, 0.11630058288574219, 0.12133026123046875, 0.1263599395751953, 0.13138961791992188, 0.13641929626464844, 0.141448974609375, 0.14647865295410156, 0.15150833129882812, 0.1565380096435547, 0.16156768798828125, 0.1665973663330078, 0.17162704467773438, 0.17665672302246094, 0.1816864013671875, 0.18671607971191406, 0.19174575805664062, 0.1967754364013672, 0.20180511474609375, 0.2068347930908203, 0.21186447143554688, 0.21689414978027344, 0.221923828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 31.0, 49.0, 107.0, 148.0, 222.0, 180.0, 105.0, 51.0, 32.0, 18.0, 11.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08183860778808594, -0.07822799682617188, -0.07461738586425781, -0.07100677490234375, -0.06739616394042969, -0.06378555297851562, -0.06017494201660156, -0.0565643310546875, -0.05295372009277344, -0.049343109130859375, -0.04573249816894531, -0.04212188720703125, -0.03851127624511719, -0.034900665283203125, -0.03129005432128906, -0.027679443359375, -0.024068832397460938, -0.020458221435546875, -0.016847610473632812, -0.01323699951171875, -0.009626388549804688, -0.006015777587890625, -0.0024051666259765625, 0.0012054443359375, 0.0048160552978515625, 0.008426666259765625, 0.012037277221679688, 0.01564788818359375, 0.019258499145507812, 0.022869110107421875, 0.026479721069335938, 0.03009033203125, 0.03370094299316406, 0.037311553955078125, 0.04092216491699219, 0.04453277587890625, 0.04814338684082031, 0.051753997802734375, 0.05536460876464844, 0.0589752197265625, 0.06258583068847656, 0.06619644165039062, 0.06980705261230469, 0.07341766357421875, 0.07702827453613281, 0.08063888549804688, 0.08424949645996094, 0.087860107421875, 0.09147071838378906, 0.09508132934570312, 0.09869194030761719, 0.10230255126953125, 0.10591316223144531, 0.10952377319335938, 0.11313438415527344, 0.1167449951171875, 0.12035560607910156, 0.12396621704101562, 0.1275768280029297, 0.13118743896484375, 0.1347980499267578, 0.13840866088867188, 0.14201927185058594, 0.1456298828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 10.0, 32.0, 129.0, 630.0, 181.0, 25.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594270706176758, -8.424546241760254, -8.254822731018066, -8.085098266601562, -7.915374755859375, -7.745650768280029, -7.575926780700684, -7.406202793121338, -7.236478805541992, -7.0667548179626465, -6.897030830383301, -6.727306842803955, -6.557582855224609, -6.387858867645264, -6.218134880065918, -6.048410892486572, -5.878686904907227, -5.708962917327881, -5.539238929748535, -5.3695149421691895, -5.199790954589844, -5.030066967010498, -4.860342979431152, -4.690618991851807, -4.520894527435303, -4.351170539855957, -4.181446552276611, -4.011722564697266, -3.84199857711792, -3.672274589538574, -3.5025506019592285, -3.332826614379883, -3.163102388381958, -2.9933784008026123, -2.8236544132232666, -2.653930425643921, -2.484206438064575, -2.3144824504852295, -2.1447582244873047, -1.9750343561172485, -1.8053103685379028, -1.6355863809585571, -1.4658623933792114, -1.2961382865905762, -1.1264142990112305, -0.9566903710365295, -0.7869663238525391, -0.6172423362731934, -0.44751834869384766, -0.27779436111450195, -0.10807034373283386, 0.06165367364883423, 0.23137766122817993, 0.40110164880752563, 0.5708256959915161, 0.7405496835708618, 0.9102736711502075, 1.0799976587295532, 1.249721646308899, 1.4194457530975342, 1.5891697406768799, 1.7588937282562256, 1.9286177158355713, 2.098341703414917, 2.2680656909942627]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 9.0, 9.0, 10.0, 18.0, 24.0, 18.0, 24.0, 27.0, 29.0, 35.0, 36.0, 34.0, 45.0, 39.0, 44.0, 61.0, 56.0, 37.0, 52.0, 44.0, 44.0, 35.0, 28.0, 33.0, 32.0, 22.0, 31.0, 19.0, 23.0, 9.0, 14.0, 4.0, 8.0, 5.0, 7.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4786643981933594, -1.433106541633606, -1.3875486850738525, -1.3419908285140991, -1.2964329719543457, -1.2508751153945923, -1.2053172588348389, -1.1597594022750854, -1.114201545715332, -1.0686436891555786, -1.0230858325958252, -0.9775279760360718, -0.9319701194763184, -0.8864122629165649, -0.8408544063568115, -0.7952965497970581, -0.7497387528419495, -0.704180896282196, -0.6586230397224426, -0.6130651831626892, -0.5675073266029358, -0.5219494700431824, -0.47639164328575134, -0.4308337867259979, -0.3852759301662445, -0.3397180736064911, -0.29416021704673767, -0.24860237538814545, -0.20304451882839203, -0.1574866622686386, -0.11192882061004639, -0.06637096405029297, -0.02081310749053955, 0.02474474534392357, 0.07030259817838669, 0.11586044728755951, 0.16141830384731293, 0.20697616040706635, 0.25253400206565857, 0.298091858625412, 0.3436497151851654, 0.3892075717449188, 0.43476542830467224, 0.48032325506210327, 0.5258811116218567, 0.5714389681816101, 0.6169968247413635, 0.6625546813011169, 0.7081125378608704, 0.7536703944206238, 0.7992282509803772, 0.8447861075401306, 0.890343964099884, 0.9359018206596375, 0.9814596176147461, 1.0270174741744995, 1.072575330734253, 1.1181331872940063, 1.1636910438537598, 1.2092489004135132, 1.2548067569732666, 1.30036461353302, 1.3459224700927734, 1.3914803266525269, 1.4370381832122803]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 6.0, 1.0, 9.0, 9.0, 5.0, 6.0, 8.0, 10.0, 13.0, 24.0, 25.0, 36.0, 64.0, 85.0, 122.0, 209.0, 347.0, 615.0, 1304.0, 2743.0, 7491.0, 36287.0, 3054392.0, 1047091.0, 32023.0, 6908.0, 2353.0, 1023.0, 479.0, 274.0, 132.0, 63.0, 52.0, 22.0, 17.0, 19.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.72998046875, -0.7133750915527344, -0.6967697143554688, -0.6801643371582031, -0.6635589599609375, -0.6469535827636719, -0.6303482055664062, -0.6137428283691406, -0.597137451171875, -0.5805320739746094, -0.5639266967773438, -0.5473213195800781, -0.5307159423828125, -0.5141105651855469, -0.49750518798828125, -0.4808998107910156, -0.46429443359375, -0.4476890563964844, -0.43108367919921875, -0.4144783020019531, -0.3978729248046875, -0.3812675476074219, -0.36466217041015625, -0.3480567932128906, -0.331451416015625, -0.3148460388183594, -0.29824066162109375, -0.2816352844238281, -0.2650299072265625, -0.24842453002929688, -0.23181915283203125, -0.21521377563476562, -0.1986083984375, -0.18200302124023438, -0.16539764404296875, -0.14879226684570312, -0.1321868896484375, -0.11558151245117188, -0.09897613525390625, -0.08237075805664062, -0.065765380859375, -0.049160003662109375, -0.03255462646484375, -0.015949249267578125, 0.0006561279296875, 0.017261505126953125, 0.03386688232421875, 0.050472259521484375, 0.06707763671875, 0.08368301391601562, 0.10028839111328125, 0.11689376831054688, 0.1334991455078125, 0.15010452270507812, 0.16670989990234375, 0.18331527709960938, 0.199920654296875, 0.21652603149414062, 0.23313140869140625, 0.24973678588867188, 0.2663421630859375, 0.2829475402832031, 0.29955291748046875, 0.3161582946777344, 0.332763671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 9.0, 21.0, 26.0, 47.0, 45.0, 46.0, 69.0, 95.0, 94.0, 91.0, 79.0, 90.0, 68.0, 58.0, 44.0, 41.0, 19.0, 15.0, 14.0, 11.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.1396484375, -0.13650083541870117, -0.13335323333740234, -0.13020563125610352, -0.1270580291748047, -0.12391042709350586, -0.12076282501220703, -0.1176152229309082, -0.11446762084960938, -0.11132001876831055, -0.10817241668701172, -0.10502481460571289, -0.10187721252441406, -0.09872961044311523, -0.0955820083618164, -0.09243440628051758, -0.08928680419921875, -0.08613920211791992, -0.0829916000366211, -0.07984399795532227, -0.07669639587402344, -0.07354879379272461, -0.07040119171142578, -0.06725358963012695, -0.06410598754882812, -0.0609583854675293, -0.05781078338623047, -0.05466318130493164, -0.05151557922363281, -0.048367977142333984, -0.045220375061035156, -0.04207277297973633, -0.0389251708984375, -0.03577756881713867, -0.032629966735839844, -0.029482364654541016, -0.026334762573242188, -0.02318716049194336, -0.02003955841064453, -0.016891956329345703, -0.013744354248046875, -0.010596752166748047, -0.007449150085449219, -0.004301548004150391, -0.0011539459228515625, 0.0019936561584472656, 0.005141258239746094, 0.008288860321044922, 0.01143646240234375, 0.014584064483642578, 0.017731666564941406, 0.020879268646240234, 0.024026870727539062, 0.02717447280883789, 0.03032207489013672, 0.03346967697143555, 0.036617279052734375, 0.0397648811340332, 0.04291248321533203, 0.04606008529663086, 0.04920768737792969, 0.052355289459228516, 0.055502891540527344, 0.05865049362182617, 0.061798095703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 13.0, 19.0, 28.0, 37.0, 72.0, 125.0, 275.0, 1075.0, 10511.0, 4162900.0, 17565.0, 1213.0, 241.0, 103.0, 47.0, 20.0, 15.0, 9.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -2.0066909790039062, -1.9606475830078125, -1.9146041870117188, -1.868560791015625, -1.8225173950195312, -1.7764739990234375, -1.7304306030273438, -1.68438720703125, -1.6383438110351562, -1.5923004150390625, -1.5462570190429688, -1.500213623046875, -1.4541702270507812, -1.4081268310546875, -1.3620834350585938, -1.3160400390625, -1.2699966430664062, -1.2239532470703125, -1.1779098510742188, -1.131866455078125, -1.0858230590820312, -1.0397796630859375, -0.9937362670898438, -0.94769287109375, -0.9016494750976562, -0.8556060791015625, -0.8095626831054688, -0.763519287109375, -0.7174758911132812, -0.6714324951171875, -0.6253890991210938, -0.579345703125, -0.5333023071289062, -0.4872589111328125, -0.44121551513671875, -0.395172119140625, -0.34912872314453125, -0.3030853271484375, -0.25704193115234375, -0.21099853515625, -0.16495513916015625, -0.1189117431640625, -0.07286834716796875, -0.026824951171875, 0.01921844482421875, 0.0652618408203125, 0.11130523681640625, 0.1573486328125, 0.20339202880859375, 0.2494354248046875, 0.29547882080078125, 0.341522216796875, 0.38756561279296875, 0.4336090087890625, 0.47965240478515625, 0.52569580078125, 0.5717391967773438, 0.6177825927734375, 0.6638259887695312, 0.709869384765625, 0.7559127807617188, 0.8019561767578125, 0.8479995727539062, 0.89404296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 13.0, 40.0, 151.0, 2782.0, 907.0, 84.0, 38.0, 13.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.6329746246337891, -0.6194648742675781, -0.6059551239013672, -0.5924453735351562, -0.5789356231689453, -0.5654258728027344, -0.5519161224365234, -0.5384063720703125, -0.5248966217041016, -0.5113868713378906, -0.4978771209716797, -0.48436737060546875, -0.4708576202392578, -0.4573478698730469, -0.44383811950683594, -0.430328369140625, -0.41681861877441406, -0.4033088684082031, -0.3897991180419922, -0.37628936767578125, -0.3627796173095703, -0.3492698669433594, -0.33576011657714844, -0.3222503662109375, -0.30874061584472656, -0.2952308654785156, -0.2817211151123047, -0.26821136474609375, -0.2547016143798828, -0.24119186401367188, -0.22768211364746094, -0.21417236328125, -0.20066261291503906, -0.18715286254882812, -0.1736431121826172, -0.16013336181640625, -0.1466236114501953, -0.13311386108398438, -0.11960411071777344, -0.1060943603515625, -0.09258460998535156, -0.07907485961914062, -0.06556510925292969, -0.05205535888671875, -0.03854560852050781, -0.025035858154296875, -0.011526107788085938, 0.001983642578125, 0.015493392944335938, 0.029003143310546875, 0.04251289367675781, 0.05602264404296875, 0.06953239440917969, 0.08304214477539062, 0.09655189514160156, 0.1100616455078125, 0.12357139587402344, 0.13708114624023438, 0.1505908966064453, 0.16410064697265625, 0.1776103973388672, 0.19112014770507812, 0.20462989807128906, 0.2181396484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 35.0, 179.0, 538.0, 179.0, 31.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.164594888687134, -3.105350971221924, -3.046107292175293, -2.986863613128662, -2.927619695663452, -2.868375778198242, -2.8091320991516113, -2.7498884201049805, -2.6906445026397705, -2.6314005851745605, -2.5721569061279297, -2.512913227081299, -2.453669309616089, -2.394425392150879, -2.335181713104248, -2.275938034057617, -2.2166941165924072, -2.1574501991271973, -2.0982065200805664, -2.0389628410339355, -1.9797189235687256, -1.9204751253128052, -1.8612313270568848, -1.8019875288009644, -1.742743730545044, -1.6834999322891235, -1.6242561340332031, -1.5650123357772827, -1.5057685375213623, -1.446524739265442, -1.3872809410095215, -1.328037142753601, -1.2687932252883911, -1.2095494270324707, -1.1503056287765503, -1.0910618305206299, -1.0318180322647095, -0.9725742340087891, -0.9133304357528687, -0.8540866374969482, -0.7948428392410278, -0.7355990409851074, -0.676355242729187, -0.6171114444732666, -0.5578676462173462, -0.4986238479614258, -0.43938004970550537, -0.38013625144958496, -0.32089245319366455, -0.26164865493774414, -0.20240485668182373, -0.14316105842590332, -0.08391726016998291, -0.0246734619140625, 0.03457033634185791, 0.09381413459777832, 0.15305793285369873, 0.21230173110961914, 0.27154552936553955, 0.33078932762145996, 0.39003312587738037, 0.4492769241333008, 0.5085207223892212, 0.5677645206451416, 0.627008318901062]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 16.0, 31.0, 43.0, 70.0, 103.0, 131.0, 129.0, 111.0, 112.0, 85.0, 56.0, 54.0, 19.0, 18.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5089569091796875, -1.4624419212341309, -1.4159269332885742, -1.3694119453430176, -1.322896957397461, -1.2763819694519043, -1.2298669815063477, -1.183351993560791, -1.1368370056152344, -1.0903220176696777, -1.043807029724121, -0.9972920417785645, -0.9507770538330078, -0.9042620658874512, -0.8577470183372498, -0.8112320303916931, -0.7647169828414917, -0.7182019948959351, -0.6716870069503784, -0.6251720190048218, -0.5786570310592651, -0.5321420431137085, -0.4856269955635071, -0.43911200761795044, -0.3925970196723938, -0.34608203172683716, -0.2995670437812805, -0.2530520260334015, -0.20653703808784485, -0.1600220501422882, -0.11350703239440918, -0.06699204444885254, -0.020476937294006348, 0.02603805810213089, 0.07255305349826813, 0.11906805634498596, 0.1655830442905426, 0.21209803223609924, 0.25861304998397827, 0.3051280379295349, 0.35164302587509155, 0.3981580138206482, 0.44467300176620483, 0.49118801951408386, 0.5377030372619629, 0.5842180252075195, 0.6307330131530762, 0.6772480010986328, 0.7237629890441895, 0.7702779769897461, 0.8167929649353027, 0.8633079528808594, 0.909822940826416, 0.9563379287719727, 1.0028529167175293, 1.049367904663086, 1.0958828926086426, 1.1423978805541992, 1.1889128684997559, 1.2354278564453125, 1.2819428443908691, 1.3284578323364258, 1.3749728202819824, 1.421487808227539, 1.4680029153823853]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 10.0, 10.0, 15.0, 22.0, 24.0, 51.0, 66.0, 106.0, 172.0, 314.0, 604.0, 1590.0, 5636.0, 43905.0, 757039.0, 217950.0, 16196.0, 2872.0, 953.0, 408.0, 223.0, 110.0, 82.0, 65.0, 24.0, 33.0, 18.0, 10.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5045356750488281, -0.49002838134765625, -0.4755210876464844, -0.4610137939453125, -0.4465065002441406, -0.43199920654296875, -0.4174919128417969, -0.402984619140625, -0.3884773254394531, -0.37397003173828125, -0.3594627380371094, -0.3449554443359375, -0.3304481506347656, -0.31594085693359375, -0.3014335632324219, -0.28692626953125, -0.2724189758300781, -0.25791168212890625, -0.24340438842773438, -0.2288970947265625, -0.21438980102539062, -0.19988250732421875, -0.18537521362304688, -0.170867919921875, -0.15636062622070312, -0.14185333251953125, -0.12734603881835938, -0.1128387451171875, -0.09833145141601562, -0.08382415771484375, -0.06931686401367188, -0.0548095703125, -0.040302276611328125, -0.02579498291015625, -0.011287689208984375, 0.0032196044921875, 0.017726898193359375, 0.03223419189453125, 0.046741485595703125, 0.061248779296875, 0.07575607299804688, 0.09026336669921875, 0.10477066040039062, 0.1192779541015625, 0.13378524780273438, 0.14829254150390625, 0.16279983520507812, 0.17730712890625, 0.19181442260742188, 0.20632171630859375, 0.22082901000976562, 0.2353363037109375, 0.24984359741210938, 0.26435089111328125, 0.2788581848144531, 0.293365478515625, 0.3078727722167969, 0.32238006591796875, 0.3368873596191406, 0.3513946533203125, 0.3659019470214844, 0.38040924072265625, 0.3949165344238281, 0.409423828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 10.0, 8.0, 22.0, 43.0, 65.0, 100.0, 107.0, 129.0, 137.0, 122.0, 106.0, 65.0, 45.0, 25.0, 11.0, 5.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.20030498504638672, -0.19565391540527344, -0.19100284576416016, -0.18635177612304688, -0.1817007064819336, -0.1770496368408203, -0.17239856719970703, -0.16774749755859375, -0.16309642791748047, -0.1584453582763672, -0.1537942886352539, -0.14914321899414062, -0.14449214935302734, -0.13984107971191406, -0.13519001007080078, -0.1305389404296875, -0.12588787078857422, -0.12123680114746094, -0.11658573150634766, -0.11193466186523438, -0.1072835922241211, -0.10263252258300781, -0.09798145294189453, -0.09333038330078125, -0.08867931365966797, -0.08402824401855469, -0.0793771743774414, -0.07472610473632812, -0.07007503509521484, -0.06542396545410156, -0.06077289581298828, -0.056121826171875, -0.05147075653076172, -0.04681968688964844, -0.042168617248535156, -0.037517547607421875, -0.032866477966308594, -0.028215408325195312, -0.02356433868408203, -0.01891326904296875, -0.014262199401855469, -0.009611129760742188, -0.004960060119628906, -0.000308990478515625, 0.004342079162597656, 0.008993148803710938, 0.013644218444824219, 0.0182952880859375, 0.02294635772705078, 0.027597427368164062, 0.032248497009277344, 0.036899566650390625, 0.041550636291503906, 0.04620170593261719, 0.05085277557373047, 0.05550384521484375, 0.06015491485595703, 0.06480598449707031, 0.0694570541381836, 0.07410812377929688, 0.07875919342041016, 0.08341026306152344, 0.08806133270263672, 0.09271240234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 20.0, 20.0, 37.0, 40.0, 66.0, 96.0, 149.0, 283.0, 481.0, 1049.0, 2470.0, 6880.0, 23034.0, 93815.0, 537750.0, 304715.0, 54966.0, 14380.0, 4669.0, 1773.0, 781.0, 397.0, 254.0, 132.0, 91.0, 46.0, 31.0, 27.0, 24.0, 7.0, 14.0, 11.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1915283203125, -0.18551063537597656, -0.17949295043945312, -0.1734752655029297, -0.16745758056640625, -0.1614398956298828, -0.15542221069335938, -0.14940452575683594, -0.1433868408203125, -0.13736915588378906, -0.13135147094726562, -0.1253337860107422, -0.11931610107421875, -0.11329841613769531, -0.10728073120117188, -0.10126304626464844, -0.095245361328125, -0.08922767639160156, -0.08320999145507812, -0.07719230651855469, -0.07117462158203125, -0.06515693664550781, -0.059139251708984375, -0.05312156677246094, -0.0471038818359375, -0.04108619689941406, -0.035068511962890625, -0.029050827026367188, -0.02303314208984375, -0.017015457153320312, -0.010997772216796875, -0.0049800872802734375, 0.00103759765625, 0.0070552825927734375, 0.013072967529296875, 0.019090652465820312, 0.02510833740234375, 0.031126022338867188, 0.037143707275390625, 0.04316139221191406, 0.0491790771484375, 0.05519676208496094, 0.061214447021484375, 0.06723213195800781, 0.07324981689453125, 0.07926750183105469, 0.08528518676757812, 0.09130287170410156, 0.097320556640625, 0.10333824157714844, 0.10935592651367188, 0.11537361145019531, 0.12139129638671875, 0.1274089813232422, 0.13342666625976562, 0.13944435119628906, 0.1454620361328125, 0.15147972106933594, 0.15749740600585938, 0.1635150909423828, 0.16953277587890625, 0.1755504608154297, 0.18156814575195312, 0.18758583068847656, 0.193603515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 17.0, 19.0, 23.0, 17.0, 22.0, 34.0, 41.0, 31.0, 46.0, 51.0, 41.0, 53.0, 55.0, 42.0, 46.0, 52.0, 46.0, 43.0, 43.0, 29.0, 47.0, 32.0, 27.0, 34.0, 21.0, 14.0, 17.0, 11.0, 8.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210693359375, -0.20326614379882812, -0.19583892822265625, -0.18841171264648438, -0.1809844970703125, -0.17355728149414062, -0.16613006591796875, -0.15870285034179688, -0.151275634765625, -0.14384841918945312, -0.13642120361328125, -0.12899398803710938, -0.1215667724609375, -0.11413955688476562, -0.10671234130859375, -0.09928512573242188, -0.09185791015625, -0.08443069458007812, -0.07700347900390625, -0.06957626342773438, -0.0621490478515625, -0.054721832275390625, -0.04729461669921875, -0.039867401123046875, -0.032440185546875, -0.025012969970703125, -0.01758575439453125, -0.010158538818359375, -0.0027313232421875, 0.004695892333984375, 0.01212310791015625, 0.019550323486328125, 0.0269775390625, 0.034404754638671875, 0.04183197021484375, 0.049259185791015625, 0.0566864013671875, 0.06411361694335938, 0.07154083251953125, 0.07896804809570312, 0.086395263671875, 0.09382247924804688, 0.10124969482421875, 0.10867691040039062, 0.1161041259765625, 0.12353134155273438, 0.13095855712890625, 0.13838577270507812, 0.14581298828125, 0.15324020385742188, 0.16066741943359375, 0.16809463500976562, 0.1755218505859375, 0.18294906616210938, 0.19037628173828125, 0.19780349731445312, 0.205230712890625, 0.21265792846679688, 0.22008514404296875, 0.22751235961914062, 0.2349395751953125, 0.24236679077148438, 0.24979400634765625, 0.2572212219238281, 0.2646484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 11.0, 21.0, 16.0, 17.0, 21.0, 26.0, 34.0, 51.0, 68.0, 94.0, 173.0, 310.0, 706.0, 1747.0, 5656.0, 37510.0, 752021.0, 231332.0, 13307.0, 3211.0, 1062.0, 472.0, 222.0, 119.0, 82.0, 52.0, 29.0, 26.0, 41.0, 16.0, 18.0, 14.0, 7.0, 6.0, 9.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08026123046875, -0.07726287841796875, -0.0742645263671875, -0.07126617431640625, -0.068267822265625, -0.06526947021484375, -0.0622711181640625, -0.05927276611328125, -0.0562744140625, -0.05327606201171875, -0.0502777099609375, -0.04727935791015625, -0.044281005859375, -0.04128265380859375, -0.0382843017578125, -0.03528594970703125, -0.03228759765625, -0.02928924560546875, -0.0262908935546875, -0.02329254150390625, -0.020294189453125, -0.01729583740234375, -0.0142974853515625, -0.01129913330078125, -0.00830078125, -0.00530242919921875, -0.0023040771484375, 0.00069427490234375, 0.003692626953125, 0.00669097900390625, 0.0096893310546875, 0.01268768310546875, 0.01568603515625, 0.01868438720703125, 0.0216827392578125, 0.02468109130859375, 0.027679443359375, 0.03067779541015625, 0.0336761474609375, 0.03667449951171875, 0.0396728515625, 0.04267120361328125, 0.0456695556640625, 0.04866790771484375, 0.051666259765625, 0.05466461181640625, 0.0576629638671875, 0.06066131591796875, 0.06365966796875, 0.06665802001953125, 0.0696563720703125, 0.07265472412109375, 0.075653076171875, 0.07865142822265625, 0.0816497802734375, 0.08464813232421875, 0.087646484375, 0.09064483642578125, 0.0936431884765625, 0.09664154052734375, 0.099639892578125, 0.10263824462890625, 0.1056365966796875, 0.10863494873046875, 0.11163330078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 13.0, 24.0, 34.0, 66.0, 141.0, 245.0, 207.0, 129.0, 59.0, 33.0, 17.0, 17.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00043272972106933594, -0.0004240460693836212, -0.0004153624176979065, -0.00040667876601219177, -0.00039799511432647705, -0.00038931146264076233, -0.0003806278109550476, -0.0003719441592693329, -0.00036326050758361816, -0.00035457685589790344, -0.0003458932042121887, -0.000337209552526474, -0.0003285259008407593, -0.00031984224915504456, -0.00031115859746932983, -0.0003024749457836151, -0.0002937912940979004, -0.00028510764241218567, -0.00027642399072647095, -0.0002677403390407562, -0.0002590566873550415, -0.0002503730356693268, -0.00024168938398361206, -0.00023300573229789734, -0.00022432208061218262, -0.0002156384289264679, -0.00020695477724075317, -0.00019827112555503845, -0.00018958747386932373, -0.000180903822183609, -0.0001722201704978943, -0.00016353651881217957, -0.00015485286712646484, -0.00014616921544075012, -0.0001374855637550354, -0.00012880191206932068, -0.00012011826038360596, -0.00011143460869789124, -0.00010275095701217651, -9.406730532646179e-05, -8.538365364074707e-05, -7.670000195503235e-05, -6.801635026931763e-05, -5.9332698583602905e-05, -5.0649046897888184e-05, -4.196539521217346e-05, -3.328174352645874e-05, -2.459809184074402e-05, -1.5914440155029297e-05, -7.230788469314575e-06, 1.4528632164001465e-06, 1.0136514902114868e-05, 1.882016658782959e-05, 2.750381827354431e-05, 3.618746995925903e-05, 4.4871121644973755e-05, 5.3554773330688477e-05, 6.22384250164032e-05, 7.092207670211792e-05, 7.960572838783264e-05, 8.828938007354736e-05, 9.697303175926208e-05, 0.0001056566834449768, 0.00011434033513069153, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 14.0, 19.0, 35.0, 86.0, 187.0, 958.0, 88151.0, 954967.0, 3542.0, 319.0, 123.0, 71.0, 41.0, 25.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.354736328125, -0.346710205078125, -0.33868408203125, -0.330657958984375, -0.3226318359375, -0.314605712890625, -0.30657958984375, -0.298553466796875, -0.29052734375, -0.282501220703125, -0.27447509765625, -0.266448974609375, -0.2584228515625, -0.250396728515625, -0.24237060546875, -0.234344482421875, -0.226318359375, -0.218292236328125, -0.21026611328125, -0.202239990234375, -0.1942138671875, -0.186187744140625, -0.17816162109375, -0.170135498046875, -0.162109375, -0.154083251953125, -0.14605712890625, -0.138031005859375, -0.1300048828125, -0.121978759765625, -0.11395263671875, -0.105926513671875, -0.097900390625, -0.089874267578125, -0.08184814453125, -0.073822021484375, -0.0657958984375, -0.057769775390625, -0.04974365234375, -0.041717529296875, -0.03369140625, -0.025665283203125, -0.01763916015625, -0.009613037109375, -0.0015869140625, 0.006439208984375, 0.01446533203125, 0.022491455078125, 0.030517578125, 0.038543701171875, 0.04656982421875, 0.054595947265625, 0.0626220703125, 0.070648193359375, 0.07867431640625, 0.086700439453125, 0.0947265625, 0.102752685546875, 0.11077880859375, 0.118804931640625, 0.1268310546875, 0.134857177734375, 0.14288330078125, 0.150909423828125, 0.158935546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 9.0, 13.0, 21.0, 20.0, 75.0, 175.0, 263.0, 222.0, 114.0, 49.0, 20.0, 15.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2851533889770508, -0.27953529357910156, -0.27391719818115234, -0.2682991027832031, -0.2626810073852539, -0.2570629119873047, -0.25144481658935547, -0.24582672119140625, -0.24020862579345703, -0.2345905303955078, -0.2289724349975586, -0.22335433959960938, -0.21773624420166016, -0.21211814880371094, -0.20650005340576172, -0.2008819580078125, -0.19526386260986328, -0.18964576721191406, -0.18402767181396484, -0.17840957641601562, -0.1727914810180664, -0.1671733856201172, -0.16155529022216797, -0.15593719482421875, -0.15031909942626953, -0.1447010040283203, -0.1390829086303711, -0.13346481323242188, -0.12784671783447266, -0.12222862243652344, -0.11661052703857422, -0.110992431640625, -0.10537433624267578, -0.09975624084472656, -0.09413814544677734, -0.08852005004882812, -0.0829019546508789, -0.07728385925292969, -0.07166576385498047, -0.06604766845703125, -0.06042957305908203, -0.05481147766113281, -0.049193382263183594, -0.043575286865234375, -0.037957191467285156, -0.03233909606933594, -0.02672100067138672, -0.0211029052734375, -0.015484809875488281, -0.009866714477539062, -0.004248619079589844, 0.001369476318359375, 0.006987571716308594, 0.012605667114257812, 0.01822376251220703, 0.02384185791015625, 0.02945995330810547, 0.03507804870605469, 0.040696144104003906, 0.046314239501953125, 0.051932334899902344, 0.05755043029785156, 0.06316852569580078, 0.06878662109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 16.0, 51.0, 289.0, 497.0, 109.0, 36.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4458900690078735, -1.3271595239639282, -1.2084288597106934, -1.089698314666748, -0.9709676504135132, -0.8522371053695679, -0.7335065007209778, -0.6147758960723877, -0.4960452914237976, -0.3773146867752075, -0.25858408212661743, -0.13985350728034973, -0.021122902631759644, 0.09760767221450806, 0.21633827686309814, 0.33506888151168823, 0.4537994861602783, 0.5725300908088684, 0.6912606954574585, 0.8099912405014038, 0.9287219047546387, 1.047452449798584, 1.1661829948425293, 1.2849136590957642, 1.403644323348999, 1.5223748683929443, 1.6411055326461792, 1.7598360776901245, 1.8785667419433594, 1.9972972869873047, 2.11602783203125, 2.2347583770751953, 2.3534891605377197, 2.472219705581665, 2.5909502506256104, 2.7096810340881348, 2.82841157913208, 2.9471421241760254, 3.0658726692199707, 3.184603214263916, 3.3033339977264404, 3.4220645427703857, 3.540795087814331, 3.6595258712768555, 3.778256416320801, 3.896986961364746, 4.015717506408691, 4.134448051452637, 4.253178596496582, 4.371909141540527, 4.490639686584473, 4.609370231628418, 4.728100776672363, 4.846831321716309, 4.965562343597412, 5.084292888641357, 5.203023433685303, 5.321753978729248, 5.440484523773193, 5.559215068817139, 5.677945613861084, 5.7966766357421875, 5.915407180786133, 6.034137725830078, 6.152868270874023]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 4.0, 14.0, 9.0, 20.0, 21.0, 29.0, 30.0, 29.0, 22.0, 23.0, 37.0, 40.0, 37.0, 35.0, 34.0, 51.0, 57.0, 39.0, 52.0, 58.0, 38.0, 41.0, 49.0, 35.0, 37.0, 27.0, 28.0, 21.0, 10.0, 12.0, 9.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.4333292245864868, -1.3927112817764282, -1.3520934581756592, -1.3114755153656006, -1.270857572555542, -1.2302396297454834, -1.1896216869354248, -1.1490038633346558, -1.1083859205245972, -1.0677679777145386, -1.0271501541137695, -0.9865322113037109, -0.9459142684936523, -0.9052963256835938, -0.8646784424781799, -0.8240605592727661, -0.7834426164627075, -0.7428246736526489, -0.7022067904472351, -0.6615889072418213, -0.6209709644317627, -0.5803530216217041, -0.5397351384162903, -0.4991172254085541, -0.45849931240081787, -0.41788139939308167, -0.37726348638534546, -0.33664557337760925, -0.29602766036987305, -0.25540974736213684, -0.21479183435440063, -0.17417392134666443, -0.13355612754821777, -0.09293821454048157, -0.05232030153274536, -0.011702388525009155, 0.02891552448272705, 0.06953343749046326, 0.11015135049819946, 0.15076926350593567, 0.19138717651367188, 0.23200508952140808, 0.2726230025291443, 0.3132409155368805, 0.3538588285446167, 0.3944767415523529, 0.4350946545600891, 0.4757125675678253, 0.5163304805755615, 0.5569484233856201, 0.5975663065910339, 0.6381841897964478, 0.6788021326065063, 0.7194200754165649, 0.7600379586219788, 0.8006558418273926, 0.8412737846374512, 0.8818917274475098, 0.9225096106529236, 0.9631274938583374, 1.003745436668396, 1.0443633794784546, 1.0849812030792236, 1.1255991458892822, 1.1662170886993408]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 0.0, 1.0, 8.0, 2.0, 4.0, 3.0, 9.0, 7.0, 14.0, 9.0, 15.0, 17.0, 21.0, 32.0, 40.0, 55.0, 72.0, 86.0, 142.0, 178.0, 336.0, 493.0, 1107.0, 2482.0, 7372.0, 31182.0, 627146.0, 3462332.0, 46805.0, 9338.0, 2823.0, 1070.0, 482.0, 275.0, 131.0, 79.0, 33.0, 35.0, 13.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.35498046875, -0.3471088409423828, -0.3392372131347656, -0.33136558532714844, -0.32349395751953125, -0.31562232971191406, -0.3077507019042969, -0.2998790740966797, -0.2920074462890625, -0.2841358184814453, -0.2762641906738281, -0.26839256286621094, -0.26052093505859375, -0.25264930725097656, -0.24477767944335938, -0.2369060516357422, -0.229034423828125, -0.2211627960205078, -0.21329116821289062, -0.20541954040527344, -0.19754791259765625, -0.18967628479003906, -0.18180465698242188, -0.1739330291748047, -0.1660614013671875, -0.1581897735595703, -0.15031814575195312, -0.14244651794433594, -0.13457489013671875, -0.12670326232910156, -0.11883163452148438, -0.11096000671386719, -0.10308837890625, -0.09521675109863281, -0.08734512329101562, -0.07947349548339844, -0.07160186767578125, -0.06373023986816406, -0.055858612060546875, -0.04798698425292969, -0.0401153564453125, -0.03224372863769531, -0.024372100830078125, -0.016500473022460938, -0.00862884521484375, -0.0007572174072265625, 0.007114410400390625, 0.014986038208007812, 0.022857666015625, 0.030729293823242188, 0.038600921630859375, 0.04647254943847656, 0.05434417724609375, 0.06221580505371094, 0.07008743286132812, 0.07795906066894531, 0.0858306884765625, 0.09370231628417969, 0.10157394409179688, 0.10944557189941406, 0.11731719970703125, 0.12518882751464844, 0.13306045532226562, 0.1409320831298828, 0.1488037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 8.0, 12.0, 29.0, 47.0, 78.0, 80.0, 100.0, 123.0, 121.0, 120.0, 110.0, 65.0, 53.0, 26.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.1969614028930664, -0.1923847198486328, -0.18780803680419922, -0.18323135375976562, -0.17865467071533203, -0.17407798767089844, -0.16950130462646484, -0.16492462158203125, -0.16034793853759766, -0.15577125549316406, -0.15119457244873047, -0.14661788940429688, -0.14204120635986328, -0.1374645233154297, -0.1328878402709961, -0.1283111572265625, -0.1237344741821289, -0.11915779113769531, -0.11458110809326172, -0.11000442504882812, -0.10542774200439453, -0.10085105895996094, -0.09627437591552734, -0.09169769287109375, -0.08712100982666016, -0.08254432678222656, -0.07796764373779297, -0.07339096069335938, -0.06881427764892578, -0.06423759460449219, -0.059660911560058594, -0.055084228515625, -0.050507545471191406, -0.04593086242675781, -0.04135417938232422, -0.036777496337890625, -0.03220081329345703, -0.027624130249023438, -0.023047447204589844, -0.01847076416015625, -0.013894081115722656, -0.009317398071289062, -0.004740715026855469, -0.000164031982421875, 0.004412651062011719, 0.008989334106445312, 0.013566017150878906, 0.0181427001953125, 0.022719383239746094, 0.027296066284179688, 0.03187274932861328, 0.036449432373046875, 0.04102611541748047, 0.04560279846191406, 0.050179481506347656, 0.05475616455078125, 0.059332847595214844, 0.06390953063964844, 0.06848621368408203, 0.07306289672851562, 0.07763957977294922, 0.08221626281738281, 0.0867929458618164, 0.09136962890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 12.0, 8.0, 23.0, 24.0, 31.0, 71.0, 156.0, 339.0, 877.0, 2361.0, 7894.0, 52221.0, 3983862.0, 129421.0, 11767.0, 3139.0, 1112.0, 506.0, 206.0, 118.0, 43.0, 28.0, 16.0, 11.0, 4.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.2284717559814453, -0.22049331665039062, -0.21251487731933594, -0.20453643798828125, -0.19655799865722656, -0.18857955932617188, -0.1806011199951172, -0.1726226806640625, -0.1646442413330078, -0.15666580200195312, -0.14868736267089844, -0.14070892333984375, -0.13273048400878906, -0.12475204467773438, -0.11677360534667969, -0.108795166015625, -0.10081672668457031, -0.09283828735351562, -0.08485984802246094, -0.07688140869140625, -0.06890296936035156, -0.060924530029296875, -0.05294609069824219, -0.0449676513671875, -0.03698921203613281, -0.029010772705078125, -0.021032333374023438, -0.01305389404296875, -0.0050754547119140625, 0.002902984619140625, 0.010881423950195312, 0.01885986328125, 0.026838302612304688, 0.034816741943359375, 0.04279518127441406, 0.05077362060546875, 0.05875205993652344, 0.06673049926757812, 0.07470893859863281, 0.0826873779296875, 0.09066581726074219, 0.09864425659179688, 0.10662269592285156, 0.11460113525390625, 0.12257957458496094, 0.13055801391601562, 0.1385364532470703, 0.146514892578125, 0.1544933319091797, 0.16247177124023438, 0.17045021057128906, 0.17842864990234375, 0.18640708923339844, 0.19438552856445312, 0.2023639678955078, 0.2103424072265625, 0.2183208465576172, 0.22629928588867188, 0.23427772521972656, 0.24225616455078125, 0.25023460388183594, 0.2582130432128906, 0.2661914825439453, 0.274169921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 12.0, 13.0, 15.0, 25.0, 42.0, 81.0, 137.0, 648.0, 2427.0, 360.0, 134.0, 64.0, 25.0, 26.0, 11.0, 10.0, 4.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.0873250961303711, -0.08444023132324219, -0.08155536651611328, -0.07867050170898438, -0.07578563690185547, -0.07290077209472656, -0.07001590728759766, -0.06713104248046875, -0.06424617767333984, -0.06136131286621094, -0.05847644805908203, -0.055591583251953125, -0.05270671844482422, -0.04982185363769531, -0.046936988830566406, -0.0440521240234375, -0.041167259216308594, -0.03828239440917969, -0.03539752960205078, -0.032512664794921875, -0.02962779998779297, -0.026742935180664062, -0.023858070373535156, -0.02097320556640625, -0.018088340759277344, -0.015203475952148438, -0.012318611145019531, -0.009433746337890625, -0.006548881530761719, -0.0036640167236328125, -0.0007791519165039062, 0.002105712890625, 0.004990577697753906, 0.007875442504882812, 0.010760307312011719, 0.013645172119140625, 0.01653003692626953, 0.019414901733398438, 0.022299766540527344, 0.02518463134765625, 0.028069496154785156, 0.030954360961914062, 0.03383922576904297, 0.036724090576171875, 0.03960895538330078, 0.04249382019042969, 0.045378684997558594, 0.0482635498046875, 0.051148414611816406, 0.05403327941894531, 0.05691814422607422, 0.059803009033203125, 0.06268787384033203, 0.06557273864746094, 0.06845760345458984, 0.07134246826171875, 0.07422733306884766, 0.07711219787597656, 0.07999706268310547, 0.08288192749023438, 0.08576679229736328, 0.08865165710449219, 0.0915365219116211, 0.09442138671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 55.0, 261.0, 459.0, 167.0, 33.0, 12.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32473528385162354, -0.29798340797424316, -0.2712315618991852, -0.244479700922966, -0.21772783994674683, -0.19097597897052765, -0.16422411799430847, -0.1374722570180893, -0.11072039604187012, -0.08396853506565094, -0.05721667408943176, -0.030464813113212585, -0.003712952136993408, 0.02303890883922577, 0.049790769815444946, 0.07654263079166412, 0.1032944917678833, 0.13004635274410248, 0.15679821372032166, 0.18355007469654083, 0.21030193567276, 0.2370537966489792, 0.26380565762519836, 0.29055750370025635, 0.3173093795776367, 0.3440612554550171, 0.3708131015300751, 0.39756494760513306, 0.4243168234825134, 0.4510686993598938, 0.4778205454349518, 0.5045723915100098, 0.5313242673873901, 0.5580761432647705, 0.5848280191421509, 0.6115798354148865, 0.6383317112922668, 0.6650835871696472, 0.6918354034423828, 0.7185872793197632, 0.7453391551971436, 0.7720910310745239, 0.7988429069519043, 0.8255947232246399, 0.8523465991020203, 0.8790984749794006, 0.9058502912521362, 0.9326021671295166, 0.959354043006897, 0.9861059188842773, 1.0128577947616577, 1.039609670639038, 1.066361427307129, 1.0931133031845093, 1.1198651790618896, 1.14661705493927, 1.1733689308166504, 1.2001208066940308, 1.2268726825714111, 1.2536245584487915, 1.2803764343261719, 1.3071281909942627, 1.333880066871643, 1.3606319427490234, 1.3873838186264038]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 9.0, 4.0, 6.0, 9.0, 13.0, 9.0, 20.0, 23.0, 29.0, 29.0, 20.0, 44.0, 35.0, 44.0, 46.0, 47.0, 56.0, 48.0, 44.0, 42.0, 41.0, 54.0, 29.0, 46.0, 40.0, 30.0, 25.0, 22.0, 21.0, 13.0, 23.0, 15.0, 7.0, 8.0, 9.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.21170544624328613, -0.20439811050891876, -0.1970907747745514, -0.18978342413902283, -0.18247608840465546, -0.17516875267028809, -0.16786141693592072, -0.16055408120155334, -0.15324673056602478, -0.1459393948316574, -0.13863205909729004, -0.13132470846176147, -0.1240173727273941, -0.11671003699302673, -0.10940270125865936, -0.10209536552429199, -0.09478802978992462, -0.08748069405555725, -0.08017335087060928, -0.07286601513624191, -0.06555867195129395, -0.058251336216926575, -0.050944000482559204, -0.043636661022901535, -0.036329321563243866, -0.029021982103586197, -0.021714644506573677, -0.014407306909561157, -0.007099967449903488, 0.0002073720097541809, 0.0075147077441215515, 0.01482204720377922, 0.02212938666343689, 0.02943672612309456, 0.03674406558275223, 0.0440514013171196, 0.05135874077677727, 0.058666080236434937, 0.06597341597080231, 0.07328075170516968, 0.08058809489011765, 0.08789543062448502, 0.09520277380943298, 0.10251010954380035, 0.10981744527816772, 0.11712478846311569, 0.12443212419748306, 0.13173946738243103, 0.1390468031167984, 0.14635413885116577, 0.15366147458553314, 0.1609688103199005, 0.16827616095542908, 0.17558349668979645, 0.18289083242416382, 0.1901981681585312, 0.19750550389289856, 0.20481283962726593, 0.2121201753616333, 0.21942752599716187, 0.22673486173152924, 0.2340421974658966, 0.24134953320026398, 0.24865686893463135, 0.2559642195701599]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 27.0, 13.0, 15.0, 25.0, 34.0, 76.0, 74.0, 121.0, 216.0, 342.0, 711.0, 1839.0, 6566.0, 34943.0, 345368.0, 588396.0, 55990.0, 9270.0, 2515.0, 913.0, 426.0, 217.0, 145.0, 84.0, 56.0, 34.0, 33.0, 28.0, 9.0, 9.0, 9.0, 6.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23150634765625, -0.2222900390625, -0.21307373046875, -0.203857421875, -0.19464111328125, -0.1854248046875, -0.17620849609375, -0.1669921875, -0.15777587890625, -0.1485595703125, -0.13934326171875, -0.130126953125, -0.12091064453125, -0.1116943359375, -0.10247802734375, -0.09326171875, -0.08404541015625, -0.0748291015625, -0.06561279296875, -0.056396484375, -0.04718017578125, -0.0379638671875, -0.02874755859375, -0.01953125, -0.01031494140625, -0.0010986328125, 0.00811767578125, 0.017333984375, 0.02655029296875, 0.0357666015625, 0.04498291015625, 0.05419921875, 0.06341552734375, 0.0726318359375, 0.08184814453125, 0.091064453125, 0.10028076171875, 0.1094970703125, 0.11871337890625, 0.1279296875, 0.13714599609375, 0.1463623046875, 0.15557861328125, 0.164794921875, 0.17401123046875, 0.1832275390625, 0.19244384765625, 0.20166015625, 0.21087646484375, 0.2200927734375, 0.22930908203125, 0.238525390625, 0.24774169921875, 0.2569580078125, 0.26617431640625, 0.275390625, 0.28460693359375, 0.2938232421875, 0.30303955078125, 0.312255859375, 0.32147216796875, 0.3306884765625, 0.33990478515625, 0.34912109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 17.0, 37.0, 37.0, 67.0, 81.0, 98.0, 115.0, 139.0, 111.0, 105.0, 73.0, 51.0, 35.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18673419952392578, -0.18230628967285156, -0.17787837982177734, -0.17345046997070312, -0.1690225601196289, -0.1645946502685547, -0.16016674041748047, -0.15573883056640625, -0.15131092071533203, -0.1468830108642578, -0.1424551010131836, -0.13802719116210938, -0.13359928131103516, -0.12917137145996094, -0.12474346160888672, -0.1203155517578125, -0.11588764190673828, -0.11145973205566406, -0.10703182220458984, -0.10260391235351562, -0.0981760025024414, -0.09374809265136719, -0.08932018280029297, -0.08489227294921875, -0.08046436309814453, -0.07603645324707031, -0.0716085433959961, -0.06718063354492188, -0.06275272369384766, -0.05832481384277344, -0.05389690399169922, -0.049468994140625, -0.04504108428955078, -0.04061317443847656, -0.036185264587402344, -0.031757354736328125, -0.027329444885253906, -0.022901535034179688, -0.01847362518310547, -0.01404571533203125, -0.009617805480957031, -0.0051898956298828125, -0.0007619857788085938, 0.003665924072265625, 0.008093833923339844, 0.012521743774414062, 0.01694965362548828, 0.0213775634765625, 0.02580547332763672, 0.030233383178710938, 0.034661293029785156, 0.039089202880859375, 0.043517112731933594, 0.04794502258300781, 0.05237293243408203, 0.05680084228515625, 0.06122875213623047, 0.06565666198730469, 0.0700845718383789, 0.07451248168945312, 0.07894039154052734, 0.08336830139160156, 0.08779621124267578, 0.09222412109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 8.0, 5.0, 12.0, 8.0, 20.0, 22.0, 29.0, 34.0, 37.0, 56.0, 70.0, 82.0, 106.0, 131.0, 201.0, 318.0, 574.0, 1164.0, 2380.0, 5627.0, 13819.0, 37207.0, 115464.0, 426185.0, 314018.0, 83049.0, 28068.0, 10952.0, 4478.0, 1939.0, 943.0, 527.0, 311.0, 180.0, 106.0, 83.0, 78.0, 57.0, 42.0, 45.0, 25.0, 25.0, 25.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.127197265625, -0.12320518493652344, -0.11921310424804688, -0.11522102355957031, -0.11122894287109375, -0.10723686218261719, -0.10324478149414062, -0.09925270080566406, -0.0952606201171875, -0.09126853942871094, -0.08727645874023438, -0.08328437805175781, -0.07929229736328125, -0.07530021667480469, -0.07130813598632812, -0.06731605529785156, -0.063323974609375, -0.05933189392089844, -0.055339813232421875, -0.05134773254394531, -0.04735565185546875, -0.04336357116699219, -0.039371490478515625, -0.03537940979003906, -0.0313873291015625, -0.027395248413085938, -0.023403167724609375, -0.019411087036132812, -0.01541900634765625, -0.011426925659179688, -0.007434844970703125, -0.0034427642822265625, 0.00054931640625, 0.0045413970947265625, 0.008533477783203125, 0.012525558471679688, 0.01651763916015625, 0.020509719848632812, 0.024501800537109375, 0.028493881225585938, 0.0324859619140625, 0.03647804260253906, 0.040470123291015625, 0.04446220397949219, 0.04845428466796875, 0.05244636535644531, 0.056438446044921875, 0.06043052673339844, 0.064422607421875, 0.06841468811035156, 0.07240676879882812, 0.07639884948730469, 0.08039093017578125, 0.08438301086425781, 0.08837509155273438, 0.09236717224121094, 0.0963592529296875, 0.10035133361816406, 0.10434341430664062, 0.10833549499511719, 0.11232757568359375, 0.11631965637207031, 0.12031173706054688, 0.12430381774902344, 0.1282958984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 13.0, 6.0, 16.0, 21.0, 20.0, 17.0, 16.0, 30.0, 37.0, 20.0, 30.0, 24.0, 48.0, 35.0, 34.0, 28.0, 41.0, 33.0, 40.0, 39.0, 36.0, 38.0, 35.0, 28.0, 37.0, 30.0, 32.0, 27.0, 23.0, 11.0, 23.0, 14.0, 12.0, 13.0, 10.0, 2.0, 12.0, 13.0, 7.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18722152709960938, -0.18132781982421875, -0.17543411254882812, -0.1695404052734375, -0.16364669799804688, -0.15775299072265625, -0.15185928344726562, -0.145965576171875, -0.14007186889648438, -0.13417816162109375, -0.12828445434570312, -0.1223907470703125, -0.11649703979492188, -0.11060333251953125, -0.10470962524414062, -0.09881591796875, -0.09292221069335938, -0.08702850341796875, -0.08113479614257812, -0.0752410888671875, -0.06934738159179688, -0.06345367431640625, -0.057559967041015625, -0.051666259765625, -0.045772552490234375, -0.03987884521484375, -0.033985137939453125, -0.0280914306640625, -0.022197723388671875, -0.01630401611328125, -0.010410308837890625, -0.0045166015625, 0.001377105712890625, 0.00727081298828125, 0.013164520263671875, 0.0190582275390625, 0.024951934814453125, 0.03084564208984375, 0.036739349365234375, 0.042633056640625, 0.048526763916015625, 0.05442047119140625, 0.060314178466796875, 0.0662078857421875, 0.07210159301757812, 0.07799530029296875, 0.08388900756835938, 0.08978271484375, 0.09567642211914062, 0.10157012939453125, 0.10746383666992188, 0.1133575439453125, 0.11925125122070312, 0.12514495849609375, 0.13103866577148438, 0.136932373046875, 0.14282608032226562, 0.14871978759765625, 0.15461349487304688, 0.1605072021484375, 0.16640090942382812, 0.17229461669921875, 0.17818832397460938, 0.18408203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 23.0, 25.0, 32.0, 71.0, 106.0, 206.0, 394.0, 769.0, 1757.0, 4843.0, 20293.0, 244252.0, 703290.0, 58143.0, 9139.0, 2803.0, 1160.0, 549.0, 275.0, 168.0, 89.0, 38.0, 38.0, 17.0, 10.0, 15.0, 2.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0733642578125, -0.07085609436035156, -0.06834793090820312, -0.06583976745605469, -0.06333160400390625, -0.06082344055175781, -0.058315277099609375, -0.05580711364746094, -0.0532989501953125, -0.05079078674316406, -0.048282623291015625, -0.04577445983886719, -0.04326629638671875, -0.04075813293457031, -0.038249969482421875, -0.03574180603027344, -0.033233642578125, -0.030725479125976562, -0.028217315673828125, -0.025709152221679688, -0.02320098876953125, -0.020692825317382812, -0.018184661865234375, -0.015676498413085938, -0.0131683349609375, -0.010660171508789062, -0.008152008056640625, -0.0056438446044921875, -0.00313568115234375, -0.0006275177001953125, 0.001880645751953125, 0.0043888092041015625, 0.00689697265625, 0.009405136108398438, 0.011913299560546875, 0.014421463012695312, 0.01692962646484375, 0.019437789916992188, 0.021945953369140625, 0.024454116821289062, 0.0269622802734375, 0.029470443725585938, 0.031978607177734375, 0.03448677062988281, 0.03699493408203125, 0.03950309753417969, 0.042011260986328125, 0.04451942443847656, 0.047027587890625, 0.04953575134277344, 0.052043914794921875, 0.05455207824707031, 0.05706024169921875, 0.05956840515136719, 0.062076568603515625, 0.06458473205566406, 0.0670928955078125, 0.06960105895996094, 0.07210922241210938, 0.07461738586425781, 0.07712554931640625, 0.07963371276855469, 0.08214187622070312, 0.08465003967285156, 0.087158203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 6.0, 20.0, 14.0, 15.0, 19.0, 35.0, 37.0, 68.0, 70.0, 108.0, 107.0, 104.0, 75.0, 71.0, 43.0, 40.0, 26.0, 22.0, 16.0, 22.0, 8.0, 8.0, 11.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00011348724365234375, -0.00011000689119100571, -0.00010652653872966766, -0.00010304618626832962, -9.956583380699158e-05, -9.608548134565353e-05, -9.260512888431549e-05, -8.912477642297745e-05, -8.56444239616394e-05, -8.216407150030136e-05, -7.868371903896332e-05, -7.520336657762527e-05, -7.172301411628723e-05, -6.824266165494919e-05, -6.476230919361115e-05, -6.12819567322731e-05, -5.780160427093506e-05, -5.4321251809597015e-05, -5.084089934825897e-05, -4.736054688692093e-05, -4.3880194425582886e-05, -4.039984196424484e-05, -3.69194895029068e-05, -3.3439137041568756e-05, -2.9958784580230713e-05, -2.647843211889267e-05, -2.2998079657554626e-05, -1.9517727196216583e-05, -1.603737473487854e-05, -1.2557022273540497e-05, -9.076669812202454e-06, -5.59631735086441e-06, -2.115964889526367e-06, 1.364387571811676e-06, 4.844740033149719e-06, 8.325092494487762e-06, 1.1805444955825806e-05, 1.528579741716385e-05, 1.8766149878501892e-05, 2.2246502339839935e-05, 2.572685480117798e-05, 2.9207207262516022e-05, 3.2687559723854065e-05, 3.616791218519211e-05, 3.964826464653015e-05, 4.3128617107868195e-05, 4.660896956920624e-05, 5.008932203054428e-05, 5.3569674491882324e-05, 5.705002695322037e-05, 6.053037941455841e-05, 6.401073187589645e-05, 6.74910843372345e-05, 7.097143679857254e-05, 7.445178925991058e-05, 7.793214172124863e-05, 8.141249418258667e-05, 8.489284664392471e-05, 8.837319910526276e-05, 9.18535515666008e-05, 9.533390402793884e-05, 9.881425648927689e-05, 0.00010229460895061493, 0.00010577496141195297, 0.00010925531387329102]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 9.0, 14.0, 24.0, 14.0, 43.0, 55.0, 81.0, 149.0, 266.0, 531.0, 1192.0, 2987.0, 10243.0, 60028.0, 552983.0, 370827.0, 37256.0, 7405.0, 2415.0, 962.0, 450.0, 226.0, 135.0, 76.0, 36.0, 38.0, 23.0, 25.0, 20.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0819091796875, -0.07968854904174805, -0.0774679183959961, -0.07524728775024414, -0.07302665710449219, -0.07080602645874023, -0.06858539581298828, -0.06636476516723633, -0.06414413452148438, -0.06192350387573242, -0.05970287322998047, -0.057482242584228516, -0.05526161193847656, -0.05304098129272461, -0.050820350646972656, -0.0485997200012207, -0.04637908935546875, -0.0441584587097168, -0.041937828063964844, -0.03971719741821289, -0.03749656677246094, -0.035275936126708984, -0.03305530548095703, -0.030834674835205078, -0.028614044189453125, -0.026393413543701172, -0.02417278289794922, -0.021952152252197266, -0.019731521606445312, -0.01751089096069336, -0.015290260314941406, -0.013069629669189453, -0.0108489990234375, -0.008628368377685547, -0.006407737731933594, -0.004187107086181641, -0.0019664764404296875, 0.0002541542053222656, 0.0024747848510742188, 0.004695415496826172, 0.006916046142578125, 0.009136676788330078, 0.011357307434082031, 0.013577938079833984, 0.015798568725585938, 0.01801919937133789, 0.020239830017089844, 0.022460460662841797, 0.02468109130859375, 0.026901721954345703, 0.029122352600097656, 0.03134298324584961, 0.03356361389160156, 0.035784244537353516, 0.03800487518310547, 0.04022550582885742, 0.042446136474609375, 0.04466676712036133, 0.04688739776611328, 0.049108028411865234, 0.05132865905761719, 0.05354928970336914, 0.055769920349121094, 0.05799055099487305, 0.060211181640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 14.0, 13.0, 34.0, 37.0, 50.0, 91.0, 99.0, 96.0, 119.0, 107.0, 95.0, 66.0, 41.0, 26.0, 33.0, 28.0, 9.0, 9.0, 9.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.09991455078125, -0.09750843048095703, -0.09510231018066406, -0.0926961898803711, -0.09029006958007812, -0.08788394927978516, -0.08547782897949219, -0.08307170867919922, -0.08066558837890625, -0.07825946807861328, -0.07585334777832031, -0.07344722747802734, -0.07104110717773438, -0.0686349868774414, -0.06622886657714844, -0.06382274627685547, -0.0614166259765625, -0.05901050567626953, -0.05660438537597656, -0.054198265075683594, -0.051792144775390625, -0.049386024475097656, -0.04697990417480469, -0.04457378387451172, -0.04216766357421875, -0.03976154327392578, -0.03735542297363281, -0.034949302673339844, -0.032543182373046875, -0.030137062072753906, -0.027730941772460938, -0.02532482147216797, -0.022918701171875, -0.02051258087158203, -0.018106460571289062, -0.015700340270996094, -0.013294219970703125, -0.010888099670410156, -0.008481979370117188, -0.006075859069824219, -0.00366973876953125, -0.0012636184692382812, 0.0011425018310546875, 0.0035486221313476562, 0.005954742431640625, 0.008360862731933594, 0.010766983032226562, 0.013173103332519531, 0.0155792236328125, 0.01798534393310547, 0.020391464233398438, 0.022797584533691406, 0.025203704833984375, 0.027609825134277344, 0.030015945434570312, 0.03242206573486328, 0.03482818603515625, 0.03723430633544922, 0.03964042663574219, 0.042046546936035156, 0.044452667236328125, 0.046858787536621094, 0.04926490783691406, 0.05167102813720703, 0.0540771484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 29.0, 245.0, 570.0, 125.0, 26.0, 9.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.828999996185303, -6.695713043212891, -6.56242561340332, -6.429138660430908, -6.295851230621338, -6.162564277648926, -6.0292768478393555, -5.895989894866943, -5.762702941894531, -5.629415988922119, -5.496128559112549, -5.362841606140137, -5.229554176330566, -5.096267223358154, -4.962980270385742, -4.829692840576172, -4.696405410766602, -4.5631184577941895, -4.429831027984619, -4.296544075012207, -4.163256645202637, -4.029969692230225, -3.8966825008392334, -3.763395309448242, -3.63010835647583, -3.496821165084839, -3.3635339736938477, -3.2302470207214355, -3.0969598293304443, -2.963672637939453, -2.830385446548462, -2.6970982551574707, -2.5638108253479004, -2.430523633956909, -2.297236442565918, -2.163949489593506, -2.0306622982025146, -1.8973751068115234, -1.7640879154205322, -1.630800724029541, -1.497513771057129, -1.3642265796661377, -1.230939507484436, -1.0976523160934448, -0.9643651843070984, -0.831078052520752, -0.6977908611297607, -0.5645037293434143, -0.43121659755706787, -0.29792946577072144, -0.1646423041820526, -0.03135514259338379, 0.10193198919296265, 0.23521912097930908, 0.3685063123703003, 0.5017934441566467, 0.6350805759429932, 0.7683677077293396, 0.901654839515686, 1.0349420309066772, 1.168229103088379, 1.3015162944793701, 1.4348034858703613, 1.5680906772613525, 1.7013777494430542]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 6.0, 9.0, 10.0, 14.0, 18.0, 21.0, 24.0, 21.0, 35.0, 34.0, 34.0, 38.0, 33.0, 33.0, 35.0, 42.0, 49.0, 43.0, 50.0, 45.0, 42.0, 38.0, 36.0, 32.0, 29.0, 18.0, 25.0, 27.0, 20.0, 19.0, 23.0, 14.0, 16.0, 8.0, 11.0, 8.0, 4.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0462589263916016, -1.0107876062393188, -0.9753163456916809, -0.939845085144043, -0.9043737649917603, -0.8689024448394775, -0.8334311842918396, -0.7979599237442017, -0.762488603591919, -0.7270172834396362, -0.6915460228919983, -0.6560747623443604, -0.6206034421920776, -0.5851321220397949, -0.549660861492157, -0.514189600944519, -0.47871828079223633, -0.443246990442276, -0.4077757000923157, -0.37230440974235535, -0.336833119392395, -0.3013618290424347, -0.26589053869247437, -0.23041924834251404, -0.1949479579925537, -0.15947666764259338, -0.12400537729263306, -0.08853408694267273, -0.0530627965927124, -0.017591506242752075, 0.017879784107208252, 0.05335107445716858, 0.08882224559783936, 0.12429353594779968, 0.15976482629776, 0.19523611664772034, 0.23070740699768066, 0.266178697347641, 0.3016499876976013, 0.33712127804756165, 0.372592568397522, 0.4080638587474823, 0.4435351490974426, 0.47900643944740295, 0.5144777297973633, 0.549949049949646, 0.5854203104972839, 0.6208915710449219, 0.6563628911972046, 0.6918342113494873, 0.7273054718971252, 0.7627767324447632, 0.7982480525970459, 0.8337193727493286, 0.8691906332969666, 0.9046618938446045, 0.9401332139968872, 0.9756045341491699, 1.011075735092163, 1.0465470552444458, 1.0820183753967285, 1.1174896955490112, 1.152961015701294, 1.188432216644287, 1.2239035367965698]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 10.0, 10.0, 22.0, 23.0, 28.0, 40.0, 52.0, 79.0, 146.0, 242.0, 518.0, 1190.0, 3286.0, 12614.0, 96002.0, 3967201.0, 95484.0, 12129.0, 3224.0, 1097.0, 448.0, 204.0, 94.0, 60.0, 22.0, 18.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4305419921875, -0.420166015625, -0.4097900390625, -0.3994140625, -0.3890380859375, -0.378662109375, -0.3682861328125, -0.35791015625, -0.3475341796875, -0.337158203125, -0.3267822265625, -0.31640625, -0.3060302734375, -0.295654296875, -0.2852783203125, -0.27490234375, -0.2645263671875, -0.254150390625, -0.2437744140625, -0.2333984375, -0.2230224609375, -0.212646484375, -0.2022705078125, -0.19189453125, -0.1815185546875, -0.171142578125, -0.1607666015625, -0.150390625, -0.1400146484375, -0.129638671875, -0.1192626953125, -0.10888671875, -0.0985107421875, -0.088134765625, -0.0777587890625, -0.0673828125, -0.0570068359375, -0.046630859375, -0.0362548828125, -0.02587890625, -0.0155029296875, -0.005126953125, 0.0052490234375, 0.015625, 0.0260009765625, 0.036376953125, 0.0467529296875, 0.05712890625, 0.0675048828125, 0.077880859375, 0.0882568359375, 0.0986328125, 0.1090087890625, 0.119384765625, 0.1297607421875, 0.14013671875, 0.1505126953125, 0.160888671875, 0.1712646484375, 0.181640625, 0.1920166015625, 0.202392578125, 0.2127685546875, 0.22314453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 14.0, 18.0, 35.0, 49.0, 63.0, 80.0, 78.0, 114.0, 107.0, 90.0, 87.0, 94.0, 57.0, 44.0, 26.0, 17.0, 7.0, 6.0, 6.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.1780719757080078, -0.17377090454101562, -0.16946983337402344, -0.16516876220703125, -0.16086769104003906, -0.15656661987304688, -0.1522655487060547, -0.1479644775390625, -0.1436634063720703, -0.13936233520507812, -0.13506126403808594, -0.13076019287109375, -0.12645912170410156, -0.12215805053710938, -0.11785697937011719, -0.113555908203125, -0.10925483703613281, -0.10495376586914062, -0.10065269470214844, -0.09635162353515625, -0.09205055236816406, -0.08774948120117188, -0.08344841003417969, -0.0791473388671875, -0.07484626770019531, -0.07054519653320312, -0.06624412536621094, -0.06194305419921875, -0.05764198303222656, -0.053340911865234375, -0.04903984069824219, -0.04473876953125, -0.04043769836425781, -0.036136627197265625, -0.03183555603027344, -0.02753448486328125, -0.023233413696289062, -0.018932342529296875, -0.014631271362304688, -0.0103302001953125, -0.0060291290283203125, -0.001728057861328125, 0.0025730133056640625, 0.00687408447265625, 0.011175155639648438, 0.015476226806640625, 0.019777297973632812, 0.024078369140625, 0.028379440307617188, 0.032680511474609375, 0.03698158264160156, 0.04128265380859375, 0.04558372497558594, 0.049884796142578125, 0.05418586730957031, 0.0584869384765625, 0.06278800964355469, 0.06708908081054688, 0.07139015197753906, 0.07569122314453125, 0.07999229431152344, 0.08429336547851562, 0.08859443664550781, 0.0928955078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 20.0, 21.0, 33.0, 56.0, 87.0, 183.0, 388.0, 1158.0, 4386.0, 21449.0, 587428.0, 3539031.0, 31787.0, 5737.0, 1552.0, 468.0, 187.0, 101.0, 63.0, 42.0, 33.0, 17.0, 15.0, 12.0, 3.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24746322631835938, -0.23833465576171875, -0.22920608520507812, -0.2200775146484375, -0.21094894409179688, -0.20182037353515625, -0.19269180297851562, -0.183563232421875, -0.17443466186523438, -0.16530609130859375, -0.15617752075195312, -0.1470489501953125, -0.13792037963867188, -0.12879180908203125, -0.11966323852539062, -0.11053466796875, -0.10140609741210938, -0.09227752685546875, -0.08314895629882812, -0.0740203857421875, -0.06489181518554688, -0.05576324462890625, -0.046634674072265625, -0.037506103515625, -0.028377532958984375, -0.01924896240234375, -0.010120391845703125, -0.0009918212890625, 0.008136749267578125, 0.01726531982421875, 0.026393890380859375, 0.0355224609375, 0.044651031494140625, 0.05377960205078125, 0.06290817260742188, 0.0720367431640625, 0.08116531372070312, 0.09029388427734375, 0.09942245483398438, 0.108551025390625, 0.11767959594726562, 0.12680816650390625, 0.13593673706054688, 0.1450653076171875, 0.15419387817382812, 0.16332244873046875, 0.17245101928710938, 0.18157958984375, 0.19070816040039062, 0.19983673095703125, 0.20896530151367188, 0.2180938720703125, 0.22722244262695312, 0.23635101318359375, 0.24547958374023438, 0.254608154296875, 0.2637367248535156, 0.27286529541015625, 0.2819938659667969, 0.2911224365234375, 0.3002510070800781, 0.30937957763671875, 0.3185081481933594, 0.32763671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 6.0, 8.0, 12.0, 29.0, 48.0, 67.0, 145.0, 400.0, 2549.0, 540.0, 129.0, 56.0, 26.0, 21.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09259033203125, -0.0878610610961914, -0.08313179016113281, -0.07840251922607422, -0.07367324829101562, -0.06894397735595703, -0.06421470642089844, -0.059485435485839844, -0.05475616455078125, -0.050026893615722656, -0.04529762268066406, -0.04056835174560547, -0.035839080810546875, -0.03110980987548828, -0.026380538940429688, -0.021651268005371094, -0.0169219970703125, -0.012192726135253906, -0.0074634552001953125, -0.0027341842651367188, 0.001995086669921875, 0.006724357604980469, 0.011453628540039062, 0.016182899475097656, 0.02091217041015625, 0.025641441345214844, 0.030370712280273438, 0.03509998321533203, 0.039829254150390625, 0.04455852508544922, 0.04928779602050781, 0.054017066955566406, 0.058746337890625, 0.0634756088256836, 0.06820487976074219, 0.07293415069580078, 0.07766342163085938, 0.08239269256591797, 0.08712196350097656, 0.09185123443603516, 0.09658050537109375, 0.10130977630615234, 0.10603904724121094, 0.11076831817626953, 0.11549758911132812, 0.12022686004638672, 0.12495613098144531, 0.1296854019165039, 0.1344146728515625, 0.1391439437866211, 0.1438732147216797, 0.14860248565673828, 0.15333175659179688, 0.15806102752685547, 0.16279029846191406, 0.16751956939697266, 0.17224884033203125, 0.17697811126708984, 0.18170738220214844, 0.18643665313720703, 0.19116592407226562, 0.19589519500732422, 0.2006244659423828, 0.2053537368774414, 0.2100830078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 22.0, 110.0, 476.0, 316.0, 55.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0404784679412842, -0.9969796538352966, -0.9534808397293091, -0.9099820852279663, -0.866483211517334, -0.8229844570159912, -0.7794856429100037, -0.7359868288040161, -0.6924880146980286, -0.648989200592041, -0.6054903864860535, -0.5619915723800659, -0.5184928178787231, -0.4749939739704132, -0.43149518966674805, -0.3879963755607605, -0.34449756145477295, -0.3009987473487854, -0.25749993324279785, -0.2140011489391327, -0.17050233483314514, -0.1270035207271576, -0.08350473642349243, -0.04000592231750488, 0.003492891788482666, 0.04699169844388962, 0.09049050509929657, 0.13398930430412292, 0.17748811841011047, 0.22098693251609802, 0.2644857168197632, 0.30798453092575073, 0.3514833450317383, 0.39498215913772583, 0.4384809732437134, 0.48197975754737854, 0.5254786014556885, 0.5689773559570312, 0.6124761700630188, 0.6559749841690063, 0.6994737982749939, 0.7429726123809814, 0.786471426486969, 0.8299702405929565, 0.8734689950942993, 0.9169678688049316, 0.9604666233062744, 1.0039653778076172, 1.0474642515182495, 1.0909630060195923, 1.1344618797302246, 1.1779606342315674, 1.2214595079421997, 1.2649582624435425, 1.3084571361541748, 1.3519558906555176, 1.3954546451568604, 1.4389533996582031, 1.4824522733688354, 1.5259510278701782, 1.5694499015808105, 1.6129486560821533, 1.656447410583496, 1.6999462842941284, 1.7434451580047607]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 11.0, 15.0, 9.0, 13.0, 18.0, 27.0, 20.0, 19.0, 27.0, 41.0, 40.0, 49.0, 31.0, 44.0, 58.0, 51.0, 48.0, 55.0, 47.0, 55.0, 36.0, 46.0, 44.0, 28.0, 26.0, 20.0, 27.0, 15.0, 15.0, 18.0, 13.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301017701625824, -0.29016268253326416, -0.27930769324302673, -0.2684526741504669, -0.2575976550579071, -0.24674266576766968, -0.23588764667510986, -0.22503264248371124, -0.21417763829231262, -0.203322634100914, -0.1924676150083542, -0.18161261081695557, -0.17075760662555695, -0.15990260243415833, -0.1490475833415985, -0.1381925791501999, -0.12733756005764008, -0.11648254841566086, -0.10562754422426224, -0.09477253258228302, -0.0839175283908844, -0.07306251674890518, -0.062207505106925964, -0.051352500915527344, -0.040497489273548126, -0.029642481356859207, -0.01878747157752514, -0.00793246179819107, 0.0029225461184978485, 0.013777554035186768, 0.024632565677165985, 0.035487569868564606, 0.04634258151054382, 0.05719758942723274, 0.06805259734392166, 0.07890760898590088, 0.0897626131772995, 0.10061762481927872, 0.11147263646125793, 0.12232764065265656, 0.13318264484405518, 0.1440376490354538, 0.1548926681280136, 0.16574767231941223, 0.17660267651081085, 0.18745768070220947, 0.1983126997947693, 0.2091677039861679, 0.22002272307872772, 0.23087772727012634, 0.24173274636268616, 0.2525877356529236, 0.2634427547454834, 0.2742977738380432, 0.285152792930603, 0.29600778222084045, 0.30686280131340027, 0.3177178204059601, 0.3285728096961975, 0.3394278287887573, 0.35028284788131714, 0.36113783717155457, 0.3719928562641144, 0.3828478455543518, 0.3937028646469116]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 6.0, 4.0, 1.0, 10.0, 11.0, 17.0, 12.0, 31.0, 44.0, 64.0, 99.0, 189.0, 399.0, 791.0, 1879.0, 5812.0, 25884.0, 272724.0, 674975.0, 51667.0, 9031.0, 2822.0, 1006.0, 481.0, 218.0, 151.0, 61.0, 54.0, 31.0, 31.0, 15.0, 6.0, 5.0, 3.0, 7.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.466796875, -0.4535255432128906, -0.44025421142578125, -0.4269828796386719, -0.4137115478515625, -0.4004402160644531, -0.38716888427734375, -0.3738975524902344, -0.360626220703125, -0.3473548889160156, -0.33408355712890625, -0.3208122253417969, -0.3075408935546875, -0.2942695617675781, -0.28099822998046875, -0.2677268981933594, -0.25445556640625, -0.24118423461914062, -0.22791290283203125, -0.21464157104492188, -0.2013702392578125, -0.18809890747070312, -0.17482757568359375, -0.16155624389648438, -0.148284912109375, -0.13501358032226562, -0.12174224853515625, -0.10847091674804688, -0.0951995849609375, -0.08192825317382812, -0.06865692138671875, -0.055385589599609375, -0.0421142578125, -0.028842926025390625, -0.01557159423828125, -0.002300262451171875, 0.0109710693359375, 0.024242401123046875, 0.03751373291015625, 0.050785064697265625, 0.064056396484375, 0.07732772827148438, 0.09059906005859375, 0.10387039184570312, 0.1171417236328125, 0.13041305541992188, 0.14368438720703125, 0.15695571899414062, 0.17022705078125, 0.18349838256835938, 0.19676971435546875, 0.21004104614257812, 0.2233123779296875, 0.23658370971679688, 0.24985504150390625, 0.2631263732910156, 0.276397705078125, 0.2896690368652344, 0.30294036865234375, 0.3162117004394531, 0.3294830322265625, 0.3427543640136719, 0.35602569580078125, 0.3692970275878906, 0.382568359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 10.0, 37.0, 36.0, 54.0, 62.0, 91.0, 93.0, 113.0, 103.0, 99.0, 82.0, 74.0, 46.0, 45.0, 18.0, 8.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17944908142089844, -0.17506027221679688, -0.1706714630126953, -0.16628265380859375, -0.1618938446044922, -0.15750503540039062, -0.15311622619628906, -0.1487274169921875, -0.14433860778808594, -0.13994979858398438, -0.1355609893798828, -0.13117218017578125, -0.1267833709716797, -0.12239456176757812, -0.11800575256347656, -0.113616943359375, -0.10922813415527344, -0.10483932495117188, -0.10045051574707031, -0.09606170654296875, -0.09167289733886719, -0.08728408813476562, -0.08289527893066406, -0.0785064697265625, -0.07411766052246094, -0.06972885131835938, -0.06534004211425781, -0.06095123291015625, -0.05656242370605469, -0.052173614501953125, -0.04778480529785156, -0.04339599609375, -0.03900718688964844, -0.034618377685546875, -0.030229568481445312, -0.02584075927734375, -0.021451950073242188, -0.017063140869140625, -0.012674331665039062, -0.0082855224609375, -0.0038967132568359375, 0.000492095947265625, 0.0048809051513671875, 0.00926971435546875, 0.013658523559570312, 0.018047332763671875, 0.022436141967773438, 0.026824951171875, 0.031213760375976562, 0.035602569580078125, 0.03999137878417969, 0.04438018798828125, 0.04876899719238281, 0.053157806396484375, 0.05754661560058594, 0.0619354248046875, 0.06632423400878906, 0.07071304321289062, 0.07510185241699219, 0.07949066162109375, 0.08387947082519531, 0.08826828002929688, 0.09265708923339844, 0.0970458984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 4.0, 6.0, 17.0, 17.0, 32.0, 55.0, 75.0, 126.0, 199.0, 349.0, 617.0, 1257.0, 2511.0, 6265.0, 20116.0, 98876.0, 675917.0, 194776.0, 32014.0, 8711.0, 3275.0, 1477.0, 759.0, 403.0, 252.0, 137.0, 97.0, 58.0, 35.0, 37.0, 24.0, 16.0, 7.0, 4.0, 9.0, 5.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.21531295776367188, -0.20723724365234375, -0.19916152954101562, -0.1910858154296875, -0.18301010131835938, -0.17493438720703125, -0.16685867309570312, -0.158782958984375, -0.15070724487304688, -0.14263153076171875, -0.13455581665039062, -0.1264801025390625, -0.11840438842773438, -0.11032867431640625, -0.10225296020507812, -0.09417724609375, -0.08610153198242188, -0.07802581787109375, -0.06995010375976562, -0.0618743896484375, -0.053798675537109375, -0.04572296142578125, -0.037647247314453125, -0.029571533203125, -0.021495819091796875, -0.01342010498046875, -0.005344390869140625, 0.0027313232421875, 0.010807037353515625, 0.01888275146484375, 0.026958465576171875, 0.0350341796875, 0.043109893798828125, 0.05118560791015625, 0.059261322021484375, 0.0673370361328125, 0.07541275024414062, 0.08348846435546875, 0.09156417846679688, 0.099639892578125, 0.10771560668945312, 0.11579132080078125, 0.12386703491210938, 0.1319427490234375, 0.14001846313476562, 0.14809417724609375, 0.15616989135742188, 0.16424560546875, 0.17232131958007812, 0.18039703369140625, 0.18847274780273438, 0.1965484619140625, 0.20462417602539062, 0.21269989013671875, 0.22077560424804688, 0.228851318359375, 0.23692703247070312, 0.24500274658203125, 0.2530784606933594, 0.2611541748046875, 0.2692298889160156, 0.27730560302734375, 0.2853813171386719, 0.29345703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 10.0, 6.0, 17.0, 14.0, 18.0, 23.0, 27.0, 25.0, 33.0, 36.0, 24.0, 35.0, 32.0, 48.0, 54.0, 59.0, 44.0, 55.0, 48.0, 52.0, 43.0, 34.0, 32.0, 26.0, 22.0, 26.0, 24.0, 16.0, 17.0, 13.0, 11.0, 11.0, 5.0, 6.0, 8.0, 3.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.280029296875, -0.27203369140625, -0.2640380859375, -0.25604248046875, -0.248046875, -0.24005126953125, -0.2320556640625, -0.22406005859375, -0.216064453125, -0.20806884765625, -0.2000732421875, -0.19207763671875, -0.18408203125, -0.17608642578125, -0.1680908203125, -0.16009521484375, -0.152099609375, -0.14410400390625, -0.1361083984375, -0.12811279296875, -0.1201171875, -0.11212158203125, -0.1041259765625, -0.09613037109375, -0.088134765625, -0.08013916015625, -0.0721435546875, -0.06414794921875, -0.05615234375, -0.04815673828125, -0.0401611328125, -0.03216552734375, -0.024169921875, -0.01617431640625, -0.0081787109375, -0.00018310546875, 0.0078125, 0.01580810546875, 0.0238037109375, 0.03179931640625, 0.039794921875, 0.04779052734375, 0.0557861328125, 0.06378173828125, 0.07177734375, 0.07977294921875, 0.0877685546875, 0.09576416015625, 0.103759765625, 0.11175537109375, 0.1197509765625, 0.12774658203125, 0.1357421875, 0.14373779296875, 0.1517333984375, 0.15972900390625, 0.167724609375, 0.17572021484375, 0.1837158203125, 0.19171142578125, 0.19970703125, 0.20770263671875, 0.2156982421875, 0.22369384765625, 0.231689453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 19.0, 46.0, 71.0, 139.0, 334.0, 961.0, 7452.0, 1008083.0, 29138.0, 1487.0, 445.0, 191.0, 88.0, 40.0, 33.0, 13.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.22625160217285156, -0.21776199340820312, -0.2092723846435547, -0.20078277587890625, -0.1922931671142578, -0.18380355834960938, -0.17531394958496094, -0.1668243408203125, -0.15833473205566406, -0.14984512329101562, -0.1413555145263672, -0.13286590576171875, -0.12437629699707031, -0.11588668823242188, -0.10739707946777344, -0.098907470703125, -0.09041786193847656, -0.08192825317382812, -0.07343864440917969, -0.06494903564453125, -0.05645942687988281, -0.047969818115234375, -0.03948020935058594, -0.0309906005859375, -0.022500991821289062, -0.014011383056640625, -0.0055217742919921875, 0.00296783447265625, 0.011457443237304688, 0.019947052001953125, 0.028436660766601562, 0.03692626953125, 0.04541587829589844, 0.053905487060546875, 0.06239509582519531, 0.07088470458984375, 0.07937431335449219, 0.08786392211914062, 0.09635353088378906, 0.1048431396484375, 0.11333274841308594, 0.12182235717773438, 0.1303119659423828, 0.13880157470703125, 0.1472911834716797, 0.15578079223632812, 0.16427040100097656, 0.172760009765625, 0.18124961853027344, 0.18973922729492188, 0.1982288360595703, 0.20671844482421875, 0.2152080535888672, 0.22369766235351562, 0.23218727111816406, 0.2406768798828125, 0.24916648864746094, 0.2576560974121094, 0.2661457061767578, 0.27463531494140625, 0.2831249237060547, 0.2916145324707031, 0.30010414123535156, 0.30859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 23.0, 30.0, 58.0, 117.0, 218.0, 247.0, 131.0, 76.0, 47.0, 16.0, 12.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004241466522216797, -0.00041430629789829254, -0.0004044659435749054, -0.00039462558925151825, -0.0003847852349281311, -0.00037494488060474396, -0.0003651045262813568, -0.00035526417195796967, -0.0003454238176345825, -0.0003355834633111954, -0.00032574310898780823, -0.0003159027546644211, -0.00030606240034103394, -0.0002962220460176468, -0.00028638169169425964, -0.0002765413373708725, -0.00026670098304748535, -0.0002568606287240982, -0.00024702027440071106, -0.00023717992007732391, -0.00022733956575393677, -0.00021749921143054962, -0.00020765885710716248, -0.00019781850278377533, -0.00018797814846038818, -0.00017813779413700104, -0.0001682974398136139, -0.00015845708549022675, -0.0001486167311668396, -0.00013877637684345245, -0.0001289360225200653, -0.00011909566819667816, -0.00010925531387329102, -9.941495954990387e-05, -8.957460522651672e-05, -7.973425090312958e-05, -6.989389657974243e-05, -6.0053542256355286e-05, -5.021318793296814e-05, -4.0372833609580994e-05, -3.053247928619385e-05, -2.06921249628067e-05, -1.0851770639419556e-05, -1.0114163160324097e-06, 8.828938007354736e-06, 1.8669292330741882e-05, 2.850964665412903e-05, 3.8350000977516174e-05, 4.819035530090332e-05, 5.8030709624290466e-05, 6.787106394767761e-05, 7.771141827106476e-05, 8.75517725944519e-05, 9.739212691783905e-05, 0.0001072324812412262, 0.00011707283556461334, 0.0001269131898880005, 0.00013675354421138763, 0.00014659389853477478, 0.00015643425285816193, 0.00016627460718154907, 0.00017611496150493622, 0.00018595531582832336, 0.0001957956701517105, 0.00020563602447509766]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 11.0, 39.0, 65.0, 135.0, 386.0, 1537.0, 241195.0, 802309.0, 2206.0, 383.0, 140.0, 78.0, 36.0, 15.0, 13.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3083362579345703, -0.3000221252441406, -0.29170799255371094, -0.28339385986328125, -0.27507972717285156, -0.2667655944824219, -0.2584514617919922, -0.2501373291015625, -0.2418231964111328, -0.23350906372070312, -0.22519493103027344, -0.21688079833984375, -0.20856666564941406, -0.20025253295898438, -0.1919384002685547, -0.183624267578125, -0.1753101348876953, -0.16699600219726562, -0.15868186950683594, -0.15036773681640625, -0.14205360412597656, -0.13373947143554688, -0.1254253387451172, -0.1171112060546875, -0.10879707336425781, -0.10048294067382812, -0.09216880798339844, -0.08385467529296875, -0.07554054260253906, -0.06722640991210938, -0.05891227722167969, -0.05059814453125, -0.04228401184082031, -0.033969879150390625, -0.025655746459960938, -0.01734161376953125, -0.009027481079101562, -0.000713348388671875, 0.0076007843017578125, 0.0159149169921875, 0.024229049682617188, 0.032543182373046875, 0.04085731506347656, 0.04917144775390625, 0.05748558044433594, 0.06579971313476562, 0.07411384582519531, 0.082427978515625, 0.09074211120605469, 0.09905624389648438, 0.10737037658691406, 0.11568450927734375, 0.12399864196777344, 0.13231277465820312, 0.1406269073486328, 0.1489410400390625, 0.1572551727294922, 0.16556930541992188, 0.17388343811035156, 0.18219757080078125, 0.19051170349121094, 0.19882583618164062, 0.2071399688720703, 0.2154541015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 13.0, 10.0, 51.0, 127.0, 253.0, 305.0, 136.0, 69.0, 22.0, 15.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31689453125, -0.31017398834228516, -0.3034534454345703, -0.29673290252685547, -0.2900123596191406, -0.2832918167114258, -0.27657127380371094, -0.2698507308959961, -0.26313018798828125, -0.2564096450805664, -0.24968910217285156, -0.24296855926513672, -0.23624801635742188, -0.22952747344970703, -0.2228069305419922, -0.21608638763427734, -0.2093658447265625, -0.20264530181884766, -0.1959247589111328, -0.18920421600341797, -0.18248367309570312, -0.17576313018798828, -0.16904258728027344, -0.1623220443725586, -0.15560150146484375, -0.1488809585571289, -0.14216041564941406, -0.13543987274169922, -0.12871932983398438, -0.12199878692626953, -0.11527824401855469, -0.10855770111083984, -0.101837158203125, -0.09511661529541016, -0.08839607238769531, -0.08167552947998047, -0.07495498657226562, -0.06823444366455078, -0.06151390075683594, -0.054793357849121094, -0.04807281494140625, -0.041352272033691406, -0.03463172912597656, -0.02791118621826172, -0.021190643310546875, -0.014470100402832031, -0.0077495574951171875, -0.0010290145874023438, 0.0056915283203125, 0.012412071228027344, 0.019132614135742188, 0.02585315704345703, 0.032573699951171875, 0.03929424285888672, 0.04601478576660156, 0.052735328674316406, 0.05945587158203125, 0.0661764144897461, 0.07289695739746094, 0.07961750030517578, 0.08633804321289062, 0.09305858612060547, 0.09977912902832031, 0.10649967193603516, 0.11322021484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 59.0, 330.0, 473.0, 115.0, 16.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.055200576782227, -9.869478225708008, -9.683755874633789, -9.49803352355957, -9.312312126159668, -9.12658977508545, -8.94086742401123, -8.755145072937012, -8.569422721862793, -8.383700370788574, -8.197978019714355, -8.012255668640137, -7.826533794403076, -7.640811443328857, -7.455089569091797, -7.269367218017578, -7.083644866943359, -6.897922515869141, -6.71220064163208, -6.526478290557861, -6.340755939483643, -6.155033588409424, -5.969311714172363, -5.7835893630981445, -5.597867488861084, -5.412145137786865, -5.226423263549805, -5.040700912475586, -4.854978561401367, -4.669256210327148, -4.483534336090088, -4.297811985015869, -4.112089157104492, -3.9263670444488525, -3.740644693374634, -3.554922580718994, -3.3692002296447754, -3.1834781169891357, -2.997756004333496, -2.8120336532592773, -2.626311779022217, -2.440589666366577, -2.2548673152923584, -2.0691452026367188, -1.8834228515625, -1.6977007389068604, -1.5119785070419312, -1.326256275177002, -1.1405339241027832, -0.954811692237854, -0.7690894603729248, -0.5833672881126404, -0.3976450562477112, -0.21192282438278198, -0.02620065212249756, 0.15952157974243164, 0.34524381160736084, 0.53096604347229, 0.7166882753372192, 0.9024104475975037, 1.088132619857788, 1.2738549709320068, 1.4595770835876465, 1.6452993154525757, 1.8310215473175049]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 6.0, 7.0, 9.0, 9.0, 13.0, 13.0, 26.0, 23.0, 27.0, 24.0, 20.0, 34.0, 35.0, 40.0, 32.0, 27.0, 33.0, 37.0, 46.0, 44.0, 46.0, 34.0, 37.0, 39.0, 33.0, 20.0, 31.0, 27.0, 25.0, 26.0, 18.0, 24.0, 12.0, 21.0, 19.0, 12.0, 6.0, 9.0, 6.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0], "bins": [-1.1482033729553223, -1.113869547843933, -1.079535722732544, -1.0452018976211548, -1.0108680725097656, -0.9765341877937317, -0.9422003626823425, -0.9078665375709534, -0.8735326528549194, -0.8391988277435303, -0.8048650026321411, -0.770531177520752, -0.736197292804718, -0.7018634676933289, -0.6675296425819397, -0.6331958174705505, -0.5988619923591614, -0.5645281672477722, -0.5301943421363831, -0.4958604872226715, -0.46152663230895996, -0.4271928071975708, -0.39285898208618164, -0.3585251569747925, -0.32419130206108093, -0.2898574769496918, -0.2555236220359802, -0.22118979692459106, -0.1868559569120407, -0.15252211689949036, -0.1181882917881012, -0.08385445177555084, -0.04952061176300049, -0.015186775475740433, 0.019147060811519623, 0.05348089337348938, 0.08781473338603973, 0.12214857339859009, 0.15648239850997925, 0.1908162385225296, 0.22515007853507996, 0.2594839036464691, 0.29381775856018066, 0.3281515836715698, 0.362485408782959, 0.39681926369667053, 0.4311530888080597, 0.46548694372177124, 0.4998207688331604, 0.5341545939445496, 0.5684884190559387, 0.6028223037719727, 0.6371561288833618, 0.671489953994751, 0.7058237791061401, 0.7401576042175293, 0.7744914293289185, 0.8088252544403076, 0.8431590795516968, 0.8774929046630859, 0.9118267893791199, 0.946160614490509, 0.9804944396018982, 1.0148283243179321, 1.0491621494293213]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 9.0, 6.0, 15.0, 18.0, 21.0, 36.0, 36.0, 50.0, 60.0, 61.0, 98.0, 102.0, 165.0, 217.0, 316.0, 595.0, 1275.0, 2955.0, 9457.0, 47426.0, 3599948.0, 490952.0, 28807.0, 6702.0, 2362.0, 1037.0, 515.0, 332.0, 178.0, 114.0, 98.0, 66.0, 54.0, 40.0, 36.0, 27.0, 12.0, 16.0, 10.0, 14.0, 7.0, 6.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.275390625, -0.2677116394042969, -0.26003265380859375, -0.2523536682128906, -0.2446746826171875, -0.23699569702148438, -0.22931671142578125, -0.22163772583007812, -0.213958740234375, -0.20627975463867188, -0.19860076904296875, -0.19092178344726562, -0.1832427978515625, -0.17556381225585938, -0.16788482666015625, -0.16020584106445312, -0.15252685546875, -0.14484786987304688, -0.13716888427734375, -0.12948989868164062, -0.1218109130859375, -0.11413192749023438, -0.10645294189453125, -0.09877395629882812, -0.091094970703125, -0.08341598510742188, -0.07573699951171875, -0.06805801391601562, -0.0603790283203125, -0.052700042724609375, -0.04502105712890625, -0.037342071533203125, -0.0296630859375, -0.021984100341796875, -0.01430511474609375, -0.006626129150390625, 0.0010528564453125, 0.008731842041015625, 0.01641082763671875, 0.024089813232421875, 0.031768798828125, 0.039447784423828125, 0.04712677001953125, 0.054805755615234375, 0.0624847412109375, 0.07016372680664062, 0.07784271240234375, 0.08552169799804688, 0.09320068359375, 0.10087966918945312, 0.10855865478515625, 0.11623764038085938, 0.1239166259765625, 0.13159561157226562, 0.13927459716796875, 0.14695358276367188, 0.154632568359375, 0.16231155395507812, 0.16999053955078125, 0.17766952514648438, 0.1853485107421875, 0.19302749633789062, 0.20070648193359375, 0.20838546752929688, 0.216064453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 14.0, 21.0, 20.0, 37.0, 48.0, 71.0, 80.0, 88.0, 106.0, 103.0, 85.0, 79.0, 83.0, 57.0, 32.0, 28.0, 18.0, 11.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197021484375, -0.1923351287841797, -0.18764877319335938, -0.18296241760253906, -0.17827606201171875, -0.17358970642089844, -0.16890335083007812, -0.1642169952392578, -0.1595306396484375, -0.1548442840576172, -0.15015792846679688, -0.14547157287597656, -0.14078521728515625, -0.13609886169433594, -0.13141250610351562, -0.1267261505126953, -0.122039794921875, -0.11735343933105469, -0.11266708374023438, -0.10798072814941406, -0.10329437255859375, -0.09860801696777344, -0.09392166137695312, -0.08923530578613281, -0.0845489501953125, -0.07986259460449219, -0.07517623901367188, -0.07048988342285156, -0.06580352783203125, -0.06111717224121094, -0.056430816650390625, -0.05174446105957031, -0.04705810546875, -0.04237174987792969, -0.037685394287109375, -0.03299903869628906, -0.02831268310546875, -0.023626327514648438, -0.018939971923828125, -0.014253616333007812, -0.0095672607421875, -0.0048809051513671875, -0.000194549560546875, 0.0044918060302734375, 0.00917816162109375, 0.013864517211914062, 0.018550872802734375, 0.023237228393554688, 0.027923583984375, 0.03260993957519531, 0.037296295166015625, 0.04198265075683594, 0.04666900634765625, 0.05135536193847656, 0.056041717529296875, 0.06072807312011719, 0.0654144287109375, 0.07010078430175781, 0.07478713989257812, 0.07947349548339844, 0.08415985107421875, 0.08884620666503906, 0.09353256225585938, 0.09821891784667969, 0.1029052734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 16.0, 20.0, 28.0, 39.0, 64.0, 90.0, 147.0, 240.0, 358.0, 626.0, 1063.0, 2009.0, 4623.0, 14166.0, 83679.0, 3892036.0, 163224.0, 20183.0, 5893.0, 2499.0, 1326.0, 734.0, 430.0, 275.0, 160.0, 117.0, 80.0, 36.0, 26.0, 23.0, 21.0, 6.0, 12.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.201904296875, -0.19402313232421875, -0.1861419677734375, -0.17826080322265625, -0.170379638671875, -0.16249847412109375, -0.1546173095703125, -0.14673614501953125, -0.13885498046875, -0.13097381591796875, -0.1230926513671875, -0.11521148681640625, -0.107330322265625, -0.09944915771484375, -0.0915679931640625, -0.08368682861328125, -0.0758056640625, -0.06792449951171875, -0.0600433349609375, -0.05216217041015625, -0.044281005859375, -0.03639984130859375, -0.0285186767578125, -0.02063751220703125, -0.01275634765625, -0.00487518310546875, 0.0030059814453125, 0.01088714599609375, 0.018768310546875, 0.02664947509765625, 0.0345306396484375, 0.04241180419921875, 0.05029296875, 0.05817413330078125, 0.0660552978515625, 0.07393646240234375, 0.081817626953125, 0.08969879150390625, 0.0975799560546875, 0.10546112060546875, 0.11334228515625, 0.12122344970703125, 0.1291046142578125, 0.13698577880859375, 0.144866943359375, 0.15274810791015625, 0.1606292724609375, 0.16851043701171875, 0.1763916015625, 0.18427276611328125, 0.1921539306640625, 0.20003509521484375, 0.207916259765625, 0.21579742431640625, 0.2236785888671875, 0.23155975341796875, 0.23944091796875, 0.24732208251953125, 0.2552032470703125, 0.26308441162109375, 0.270965576171875, 0.27884674072265625, 0.2867279052734375, 0.29460906982421875, 0.302490234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 28.0, 49.0, 74.0, 188.0, 980.0, 2304.0, 214.0, 90.0, 49.0, 32.0, 10.0, 7.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09460735321044922, -0.09052085876464844, -0.08643436431884766, -0.08234786987304688, -0.0782613754272461, -0.07417488098144531, -0.07008838653564453, -0.06600189208984375, -0.06191539764404297, -0.05782890319824219, -0.053742408752441406, -0.049655914306640625, -0.045569419860839844, -0.04148292541503906, -0.03739643096923828, -0.0333099365234375, -0.02922344207763672, -0.025136947631835938, -0.021050453186035156, -0.016963958740234375, -0.012877464294433594, -0.008790969848632812, -0.004704475402832031, -0.00061798095703125, 0.0034685134887695312, 0.0075550079345703125, 0.011641502380371094, 0.015727996826171875, 0.019814491271972656, 0.023900985717773438, 0.02798748016357422, 0.032073974609375, 0.03616046905517578, 0.04024696350097656, 0.044333457946777344, 0.048419952392578125, 0.052506446838378906, 0.05659294128417969, 0.06067943572998047, 0.06476593017578125, 0.06885242462158203, 0.07293891906738281, 0.0770254135131836, 0.08111190795898438, 0.08519840240478516, 0.08928489685058594, 0.09337139129638672, 0.0974578857421875, 0.10154438018798828, 0.10563087463378906, 0.10971736907958984, 0.11380386352539062, 0.1178903579711914, 0.12197685241699219, 0.12606334686279297, 0.13014984130859375, 0.13423633575439453, 0.1383228302001953, 0.1424093246459961, 0.14649581909179688, 0.15058231353759766, 0.15466880798339844, 0.15875530242919922, 0.162841796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 10.0, 18.0, 65.0, 200.0, 427.0, 212.0, 53.0, 11.0, 6.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2805880308151245, -0.24361862242221832, -0.20664921402931213, -0.16967980563640594, -0.13271039724349976, -0.09574098885059357, -0.05877158045768738, -0.021802186965942383, 0.015167236328125, 0.05213664472103119, 0.08910605311393738, 0.12607546150684357, 0.16304486989974976, 0.20001427829265594, 0.23698368668556213, 0.27395308017730713, 0.3109225034713745, 0.3478919267654419, 0.3848613202571869, 0.4218307137489319, 0.45880013704299927, 0.49576956033706665, 0.5327389240264893, 0.5697083473205566, 0.606677770614624, 0.6436471939086914, 0.6806166172027588, 0.7175859808921814, 0.7545554041862488, 0.7915248274803162, 0.8284941911697388, 0.8654636144638062, 0.902432918548584, 0.9394023418426514, 0.9763717651367188, 1.0133411884307861, 1.0503106117248535, 1.0872799158096313, 1.1242493391036987, 1.1612187623977661, 1.1981881856918335, 1.2351576089859009, 1.2721270322799683, 1.3090964555740356, 1.3460657596588135, 1.3830351829528809, 1.4200046062469482, 1.4569740295410156, 1.493943452835083, 1.5309128761291504, 1.5678822994232178, 1.6048517227172852, 1.6418211460113525, 1.6787904500961304, 1.7157598733901978, 1.7527292966842651, 1.7896987199783325, 1.8266681432724, 1.8636375665664673, 1.9006069898605347, 1.9375762939453125, 1.9745457172393799, 2.0115151405334473, 2.0484845638275146, 2.085453987121582]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 11.0, 20.0, 25.0, 29.0, 35.0, 52.0, 59.0, 62.0, 74.0, 85.0, 85.0, 77.0, 84.0, 61.0, 42.0, 47.0, 43.0, 25.0, 20.0, 16.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4367576241493225, -0.42403900623321533, -0.41132041811943054, -0.39860180020332336, -0.3858831822872162, -0.3731645941734314, -0.3604459762573242, -0.34772735834121704, -0.33500877022743225, -0.3222901523113251, -0.3095715641975403, -0.2968529462814331, -0.2841343283653259, -0.27141574025154114, -0.25869712233543396, -0.24597851932048798, -0.2332599014043808, -0.22054129838943481, -0.20782268047332764, -0.19510407745838165, -0.18238547444343567, -0.1696668565273285, -0.1569482535123825, -0.14422965049743652, -0.13151103258132935, -0.11879242211580276, -0.10607381910085678, -0.0933552086353302, -0.08063660562038422, -0.06791799515485764, -0.055199384689331055, -0.04248078167438507, -0.029762178659439087, -0.017043571919202805, -0.004324963316321373, 0.008393645286560059, 0.02111225202679634, 0.03383085876703262, 0.046549469232559204, 0.05926807224750519, 0.07198668271303177, 0.08470529317855835, 0.09742389619350433, 0.11014250665903091, 0.1228611171245575, 0.13557972013950348, 0.14829832315444946, 0.16101694107055664, 0.17373554408550262, 0.1864541471004486, 0.1991727650165558, 0.21189136803150177, 0.22460997104644775, 0.23732858896255493, 0.2500472068786621, 0.2627657949924469, 0.2754844129085541, 0.28820303082466125, 0.30092161893844604, 0.3136402368545532, 0.3263588547706604, 0.3390774428844452, 0.35179606080055237, 0.36451464891433716, 0.37723326683044434]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 14.0, 21.0, 30.0, 51.0, 116.0, 226.0, 557.0, 1371.0, 4812.0, 21550.0, 181307.0, 722858.0, 96116.0, 14257.0, 3374.0, 1078.0, 397.0, 188.0, 88.0, 55.0, 27.0, 17.0, 6.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.49365234375, -0.481719970703125, -0.46978759765625, -0.457855224609375, -0.4459228515625, -0.433990478515625, -0.42205810546875, -0.410125732421875, -0.398193359375, -0.386260986328125, -0.37432861328125, -0.362396240234375, -0.3504638671875, -0.338531494140625, -0.32659912109375, -0.314666748046875, -0.302734375, -0.290802001953125, -0.27886962890625, -0.266937255859375, -0.2550048828125, -0.243072509765625, -0.23114013671875, -0.219207763671875, -0.207275390625, -0.195343017578125, -0.18341064453125, -0.171478271484375, -0.1595458984375, -0.147613525390625, -0.13568115234375, -0.123748779296875, -0.11181640625, -0.099884033203125, -0.08795166015625, -0.076019287109375, -0.0640869140625, -0.052154541015625, -0.04022216796875, -0.028289794921875, -0.016357421875, -0.004425048828125, 0.00750732421875, 0.019439697265625, 0.0313720703125, 0.043304443359375, 0.05523681640625, 0.067169189453125, 0.0791015625, 0.091033935546875, 0.10296630859375, 0.114898681640625, 0.1268310546875, 0.138763427734375, 0.15069580078125, 0.162628173828125, 0.174560546875, 0.186492919921875, 0.19842529296875, 0.210357666015625, 0.2222900390625, 0.234222412109375, 0.24615478515625, 0.258087158203125, 0.27001953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 19.0, 13.0, 23.0, 35.0, 38.0, 63.0, 72.0, 85.0, 94.0, 100.0, 86.0, 82.0, 80.0, 58.0, 53.0, 29.0, 29.0, 13.0, 6.0, 10.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.188568115234375, -0.18402099609375, -0.179473876953125, -0.1749267578125, -0.170379638671875, -0.16583251953125, -0.161285400390625, -0.15673828125, -0.152191162109375, -0.14764404296875, -0.143096923828125, -0.1385498046875, -0.134002685546875, -0.12945556640625, -0.124908447265625, -0.120361328125, -0.115814208984375, -0.11126708984375, -0.106719970703125, -0.1021728515625, -0.097625732421875, -0.09307861328125, -0.088531494140625, -0.083984375, -0.079437255859375, -0.07489013671875, -0.070343017578125, -0.0657958984375, -0.061248779296875, -0.05670166015625, -0.052154541015625, -0.047607421875, -0.043060302734375, -0.03851318359375, -0.033966064453125, -0.0294189453125, -0.024871826171875, -0.02032470703125, -0.015777587890625, -0.01123046875, -0.006683349609375, -0.00213623046875, 0.002410888671875, 0.0069580078125, 0.011505126953125, 0.01605224609375, 0.020599365234375, 0.025146484375, 0.029693603515625, 0.03424072265625, 0.038787841796875, 0.0433349609375, 0.047882080078125, 0.05242919921875, 0.056976318359375, 0.0615234375, 0.066070556640625, 0.07061767578125, 0.075164794921875, 0.0797119140625, 0.084259033203125, 0.08880615234375, 0.093353271484375, 0.097900390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 8.0, 12.0, 8.0, 12.0, 23.0, 33.0, 50.0, 71.0, 124.0, 215.0, 341.0, 654.0, 1353.0, 2812.0, 6963.0, 19483.0, 68093.0, 331146.0, 474962.0, 99506.0, 26700.0, 8982.0, 3537.0, 1591.0, 784.0, 421.0, 219.0, 152.0, 98.0, 47.0, 30.0, 29.0, 24.0, 20.0, 13.0, 10.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242431640625, -0.23553085327148438, -0.22863006591796875, -0.22172927856445312, -0.2148284912109375, -0.20792770385742188, -0.20102691650390625, -0.19412612915039062, -0.187225341796875, -0.18032455444335938, -0.17342376708984375, -0.16652297973632812, -0.1596221923828125, -0.15272140502929688, -0.14582061767578125, -0.13891983032226562, -0.13201904296875, -0.12511825561523438, -0.11821746826171875, -0.11131668090820312, -0.1044158935546875, -0.09751510620117188, -0.09061431884765625, -0.08371353149414062, -0.076812744140625, -0.06991195678710938, -0.06301116943359375, -0.056110382080078125, -0.0492095947265625, -0.042308807373046875, -0.03540802001953125, -0.028507232666015625, -0.0216064453125, -0.014705657958984375, -0.00780487060546875, -0.000904083251953125, 0.0059967041015625, 0.012897491455078125, 0.01979827880859375, 0.026699066162109375, 0.033599853515625, 0.040500640869140625, 0.04740142822265625, 0.054302215576171875, 0.0612030029296875, 0.06810379028320312, 0.07500457763671875, 0.08190536499023438, 0.08880615234375, 0.09570693969726562, 0.10260772705078125, 0.10950851440429688, 0.1164093017578125, 0.12331008911132812, 0.13021087646484375, 0.13711166381835938, 0.144012451171875, 0.15091323852539062, 0.15781402587890625, 0.16471481323242188, 0.1716156005859375, 0.17851638793945312, 0.18541717529296875, 0.19231796264648438, 0.19921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 9.0, 9.0, 20.0, 22.0, 17.0, 29.0, 27.0, 31.0, 36.0, 32.0, 27.0, 48.0, 43.0, 43.0, 50.0, 38.0, 66.0, 35.0, 37.0, 44.0, 42.0, 48.0, 38.0, 29.0, 30.0, 32.0, 14.0, 20.0, 22.0, 11.0, 12.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.328857421875, -0.31906890869140625, -0.3092803955078125, -0.29949188232421875, -0.289703369140625, -0.27991485595703125, -0.2701263427734375, -0.26033782958984375, -0.25054931640625, -0.24076080322265625, -0.2309722900390625, -0.22118377685546875, -0.211395263671875, -0.20160675048828125, -0.1918182373046875, -0.18202972412109375, -0.1722412109375, -0.16245269775390625, -0.1526641845703125, -0.14287567138671875, -0.133087158203125, -0.12329864501953125, -0.1135101318359375, -0.10372161865234375, -0.09393310546875, -0.08414459228515625, -0.0743560791015625, -0.06456756591796875, -0.054779052734375, -0.04499053955078125, -0.0352020263671875, -0.02541351318359375, -0.015625, -0.00583648681640625, 0.0039520263671875, 0.01374053955078125, 0.023529052734375, 0.03331756591796875, 0.0431060791015625, 0.05289459228515625, 0.06268310546875, 0.07247161865234375, 0.0822601318359375, 0.09204864501953125, 0.101837158203125, 0.11162567138671875, 0.1214141845703125, 0.13120269775390625, 0.1409912109375, 0.15077972412109375, 0.1605682373046875, 0.17035675048828125, 0.180145263671875, 0.18993377685546875, 0.1997222900390625, 0.20951080322265625, 0.21929931640625, 0.22908782958984375, 0.2388763427734375, 0.24866485595703125, 0.258453369140625, 0.26824188232421875, 0.2780303955078125, 0.28781890869140625, 0.297607421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 10.0, 7.0, 5.0, 9.0, 24.0, 36.0, 45.0, 68.0, 132.0, 207.0, 495.0, 1403.0, 4518.0, 19792.0, 213737.0, 755597.0, 40979.0, 7902.0, 2205.0, 696.0, 303.0, 142.0, 86.0, 55.0, 32.0, 26.0, 13.0, 11.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.267333984375, -0.2608451843261719, -0.25435638427734375, -0.24786758422851562, -0.2413787841796875, -0.23488998413085938, -0.22840118408203125, -0.22191238403320312, -0.215423583984375, -0.20893478393554688, -0.20244598388671875, -0.19595718383789062, -0.1894683837890625, -0.18297958374023438, -0.17649078369140625, -0.17000198364257812, -0.16351318359375, -0.15702438354492188, -0.15053558349609375, -0.14404678344726562, -0.1375579833984375, -0.13106918334960938, -0.12458038330078125, -0.11809158325195312, -0.111602783203125, -0.10511398315429688, -0.09862518310546875, -0.09213638305664062, -0.0856475830078125, -0.07915878295898438, -0.07266998291015625, -0.06618118286132812, -0.0596923828125, -0.053203582763671875, -0.04671478271484375, -0.040225982666015625, -0.0337371826171875, -0.027248382568359375, -0.02075958251953125, -0.014270782470703125, -0.007781982421875, -0.001293182373046875, 0.00519561767578125, 0.011684417724609375, 0.0181732177734375, 0.024662017822265625, 0.03115081787109375, 0.037639617919921875, 0.04412841796875, 0.050617218017578125, 0.05710601806640625, 0.06359481811523438, 0.0700836181640625, 0.07657241821289062, 0.08306121826171875, 0.08955001831054688, 0.096038818359375, 0.10252761840820312, 0.10901641845703125, 0.11550521850585938, 0.1219940185546875, 0.12848281860351562, 0.13497161865234375, 0.14146041870117188, 0.14794921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 10.0, 15.0, 38.0, 151.0, 378.0, 276.0, 89.0, 35.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005335807800292969, -0.0005232710391283035, -0.0005129612982273102, -0.0005026515573263168, -0.0004923418164253235, -0.00048203207552433014, -0.0004717223346233368, -0.00046141259372234344, -0.0004511028528213501, -0.00044079311192035675, -0.0004304833710193634, -0.00042017363011837006, -0.0004098638892173767, -0.00039955414831638336, -0.00038924440741539, -0.00037893466651439667, -0.0003686249256134033, -0.00035831518471241, -0.0003480054438114166, -0.0003376957029104233, -0.00032738596200942993, -0.0003170762211084366, -0.00030676648020744324, -0.0002964567393064499, -0.00028614699840545654, -0.0002758372575044632, -0.00026552751660346985, -0.0002552177757024765, -0.00024490803480148315, -0.0002345982939004898, -0.00022428855299949646, -0.0002139788120985031, -0.00020366907119750977, -0.00019335933029651642, -0.00018304958939552307, -0.00017273984849452972, -0.00016243010759353638, -0.00015212036669254303, -0.00014181062579154968, -0.00013150088489055634, -0.00012119114398956299, -0.00011088140308856964, -0.0001005716621875763, -9.026192128658295e-05, -7.99521803855896e-05, -6.964243948459625e-05, -5.9332698583602905e-05, -4.902295768260956e-05, -3.871321678161621e-05, -2.8403475880622864e-05, -1.8093734979629517e-05, -7.78399407863617e-06, 2.5257468223571777e-06, 1.2835487723350525e-05, 2.3145228624343872e-05, 3.345496952533722e-05, 4.3764710426330566e-05, 5.4074451327323914e-05, 6.438419222831726e-05, 7.469393312931061e-05, 8.500367403030396e-05, 9.53134149312973e-05, 0.00010562315583229065, 0.000115932896733284, 0.00012624263763427734]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 24.0, 67.0, 151.0, 385.0, 1278.0, 5440.0, 33291.0, 797426.0, 192295.0, 14252.0, 2827.0, 731.0, 228.0, 93.0, 33.0, 17.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1303882598876953, -0.12344741821289062, -0.11650657653808594, -0.10956573486328125, -0.10262489318847656, -0.09568405151367188, -0.08874320983886719, -0.0818023681640625, -0.07486152648925781, -0.06792068481445312, -0.06097984313964844, -0.05403900146484375, -0.04709815979003906, -0.040157318115234375, -0.03321647644042969, -0.026275634765625, -0.019334793090820312, -0.012393951416015625, -0.0054531097412109375, 0.00148773193359375, 0.008428573608398438, 0.015369415283203125, 0.022310256958007812, 0.0292510986328125, 0.03619194030761719, 0.043132781982421875, 0.05007362365722656, 0.05701446533203125, 0.06395530700683594, 0.07089614868164062, 0.07783699035644531, 0.08477783203125, 0.09171867370605469, 0.09865951538085938, 0.10560035705566406, 0.11254119873046875, 0.11948204040527344, 0.12642288208007812, 0.1333637237548828, 0.1403045654296875, 0.1472454071044922, 0.15418624877929688, 0.16112709045410156, 0.16806793212890625, 0.17500877380371094, 0.18194961547851562, 0.1888904571533203, 0.195831298828125, 0.2027721405029297, 0.20971298217773438, 0.21665382385253906, 0.22359466552734375, 0.23053550720214844, 0.23747634887695312, 0.2444171905517578, 0.2513580322265625, 0.2582988739013672, 0.2652397155761719, 0.27218055725097656, 0.27912139892578125, 0.28606224060058594, 0.2930030822753906, 0.2999439239501953, 0.306884765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 8.0, 6.0, 12.0, 17.0, 21.0, 35.0, 69.0, 114.0, 160.0, 145.0, 129.0, 106.0, 65.0, 47.0, 21.0, 19.0, 12.0, 3.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.09825706481933594, -0.09287643432617188, -0.08749580383300781, -0.08211517333984375, -0.07673454284667969, -0.07135391235351562, -0.06597328186035156, -0.0605926513671875, -0.05521202087402344, -0.049831390380859375, -0.04445075988769531, -0.03907012939453125, -0.03368949890136719, -0.028308868408203125, -0.022928237915039062, -0.017547607421875, -0.012166976928710938, -0.006786346435546875, -0.0014057159423828125, 0.00397491455078125, 0.009355545043945312, 0.014736175537109375, 0.020116806030273438, 0.0254974365234375, 0.030878067016601562, 0.036258697509765625, 0.04163932800292969, 0.04701995849609375, 0.05240058898925781, 0.057781219482421875, 0.06316184997558594, 0.06854248046875, 0.07392311096191406, 0.07930374145507812, 0.08468437194824219, 0.09006500244140625, 0.09544563293457031, 0.10082626342773438, 0.10620689392089844, 0.1115875244140625, 0.11696815490722656, 0.12234878540039062, 0.1277294158935547, 0.13311004638671875, 0.1384906768798828, 0.14387130737304688, 0.14925193786621094, 0.154632568359375, 0.16001319885253906, 0.16539382934570312, 0.1707744598388672, 0.17615509033203125, 0.1815357208251953, 0.18691635131835938, 0.19229698181152344, 0.1976776123046875, 0.20305824279785156, 0.20843887329101562, 0.2138195037841797, 0.21920013427734375, 0.2245807647705078, 0.22996139526367188, 0.23534202575683594, 0.24072265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 21.0, 36.0, 88.0, 185.0, 316.0, 197.0, 102.0, 44.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1654329299926758, -1.063624620437622, -0.9618163108825684, -0.8600080609321594, -0.7581997513771057, -0.656391441822052, -0.5545831918716431, -0.45277488231658936, -0.35096657276153564, -0.24915827810764313, -0.1473499834537506, -0.04554170370101929, 0.056266605854034424, 0.15807491540908813, 0.25988316535949707, 0.3616914749145508, 0.4634997844696045, 0.5653080940246582, 0.6671164035797119, 0.7689246535301208, 0.8707329630851746, 0.9725412726402283, 1.0743495225906372, 1.176157832145691, 1.2779661417007446, 1.3797744512557983, 1.481582760810852, 1.5833909511566162, 1.68519926071167, 1.7870075702667236, 1.8888158798217773, 1.990624189376831, 2.0924324989318848, 2.1942408084869385, 2.296049118041992, 2.397857427597046, 2.4996657371520996, 2.6014740467071533, 2.703282356262207, 2.8050904273986816, 2.9068989753723145, 3.008707284927368, 3.110515594482422, 3.2123239040374756, 3.3141322135925293, 3.415940523147583, 3.5177488327026367, 3.6195569038391113, 3.721365213394165, 3.8231735229492188, 3.9249818325042725, 4.026790142059326, 4.128598213195801, 4.230406761169434, 4.332214832305908, 4.434023380279541, 4.535831451416016, 4.63763952255249, 4.739448070526123, 4.841256141662598, 4.9430646896362305, 5.044872760772705, 5.146681308746338, 5.2484893798828125, 5.350297927856445]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 13.0, 10.0, 12.0, 8.0, 15.0, 14.0, 24.0, 22.0, 23.0, 29.0, 31.0, 32.0, 33.0, 40.0, 43.0, 51.0, 34.0, 49.0, 36.0, 46.0, 37.0, 45.0, 35.0, 35.0, 36.0, 39.0, 27.0, 27.0, 18.0, 27.0, 12.0, 15.0, 13.0, 10.0, 11.0, 13.0, 5.0, 9.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3125150203704834, -1.2703300714492798, -1.2281451225280762, -1.185960292816162, -1.1437753438949585, -1.1015903949737549, -1.0594055652618408, -1.0172206163406372, -0.9750356674194336, -0.93285071849823, -0.8906658291816711, -0.8484809398651123, -0.8062959909439087, -0.7641110420227051, -0.7219261527061462, -0.6797412633895874, -0.6375563144683838, -0.5953713655471802, -0.5531864762306213, -0.5110015869140625, -0.4688166379928589, -0.42663171887397766, -0.38444679975509644, -0.3422618806362152, -0.300076961517334, -0.25789204239845276, -0.21570712327957153, -0.1735222041606903, -0.13133728504180908, -0.08915236592292786, -0.04696744680404663, -0.004782527685165405, 0.03740251064300537, 0.0795874297618866, 0.12177234888076782, 0.16395726799964905, 0.20614218711853027, 0.2483271062374115, 0.2905120253562927, 0.33269694447517395, 0.3748818635940552, 0.4170667827129364, 0.4592517018318176, 0.5014365911483765, 0.5436215400695801, 0.5858064889907837, 0.6279913783073425, 0.6701762676239014, 0.712361216545105, 0.7545461654663086, 0.7967310547828674, 0.8389159440994263, 0.8811008930206299, 0.9232858419418335, 0.9654707312583923, 1.0076556205749512, 1.0498405694961548, 1.0920255184173584, 1.1342103481292725, 1.176395297050476, 1.2185802459716797, 1.2607651948928833, 1.302950143814087, 1.345134973526001, 1.3873199224472046]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 10.0, 7.0, 7.0, 6.0, 8.0, 18.0, 28.0, 27.0, 44.0, 53.0, 81.0, 137.0, 238.0, 465.0, 973.0, 2223.0, 5479.0, 16774.0, 118767.0, 3971166.0, 57651.0, 12024.0, 4364.0, 1863.0, 837.0, 465.0, 223.0, 136.0, 98.0, 50.0, 20.0, 14.0, 9.0, 0.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.405029296875, -0.3956890106201172, -0.3863487243652344, -0.37700843811035156, -0.36766815185546875, -0.35832786560058594, -0.3489875793457031, -0.3396472930908203, -0.3303070068359375, -0.3209667205810547, -0.3116264343261719, -0.30228614807128906, -0.29294586181640625, -0.28360557556152344, -0.2742652893066406, -0.2649250030517578, -0.255584716796875, -0.2462444305419922, -0.23690414428710938, -0.22756385803222656, -0.21822357177734375, -0.20888328552246094, -0.19954299926757812, -0.1902027130126953, -0.1808624267578125, -0.1715221405029297, -0.16218185424804688, -0.15284156799316406, -0.14350128173828125, -0.13416099548339844, -0.12482070922851562, -0.11548042297363281, -0.10614013671875, -0.09679985046386719, -0.08745956420898438, -0.07811927795410156, -0.06877899169921875, -0.05943870544433594, -0.050098419189453125, -0.04075813293457031, -0.0314178466796875, -0.022077560424804688, -0.012737274169921875, -0.0033969879150390625, 0.00594329833984375, 0.015283584594726562, 0.024623870849609375, 0.03396415710449219, 0.043304443359375, 0.05264472961425781, 0.061985015869140625, 0.07132530212402344, 0.08066558837890625, 0.09000587463378906, 0.09934616088867188, 0.10868644714355469, 0.1180267333984375, 0.1273670196533203, 0.13670730590820312, 0.14604759216308594, 0.15538787841796875, 0.16472816467285156, 0.17406845092773438, 0.1834087371826172, 0.1927490234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 12.0, 12.0, 14.0, 19.0, 38.0, 47.0, 36.0, 56.0, 69.0, 77.0, 67.0, 68.0, 76.0, 71.0, 59.0, 67.0, 50.0, 34.0, 37.0, 20.0, 20.0, 16.0, 10.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.17138671875, -0.1673755645751953, -0.16336441040039062, -0.15935325622558594, -0.15534210205078125, -0.15133094787597656, -0.14731979370117188, -0.1433086395263672, -0.1392974853515625, -0.1352863311767578, -0.13127517700195312, -0.12726402282714844, -0.12325286865234375, -0.11924171447753906, -0.11523056030273438, -0.11121940612792969, -0.107208251953125, -0.10319709777832031, -0.09918594360351562, -0.09517478942871094, -0.09116363525390625, -0.08715248107910156, -0.08314132690429688, -0.07913017272949219, -0.0751190185546875, -0.07110786437988281, -0.06709671020507812, -0.06308555603027344, -0.05907440185546875, -0.05506324768066406, -0.051052093505859375, -0.04704093933105469, -0.04302978515625, -0.03901863098144531, -0.035007476806640625, -0.030996322631835938, -0.02698516845703125, -0.022974014282226562, -0.018962860107421875, -0.014951705932617188, -0.0109405517578125, -0.0069293975830078125, -0.002918243408203125, 0.0010929107666015625, 0.00510406494140625, 0.009115219116210938, 0.013126373291015625, 0.017137527465820312, 0.021148681640625, 0.025159835815429688, 0.029170989990234375, 0.03318214416503906, 0.03719329833984375, 0.04120445251464844, 0.045215606689453125, 0.04922676086425781, 0.0532379150390625, 0.05724906921386719, 0.061260223388671875, 0.06527137756347656, 0.06928253173828125, 0.07329368591308594, 0.07730484008789062, 0.08131599426269531, 0.0853271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 7.0, 12.0, 31.0, 39.0, 50.0, 67.0, 110.0, 171.0, 235.0, 482.0, 769.0, 1313.0, 2494.0, 4959.0, 12223.0, 46103.0, 3724894.0, 355081.0, 27429.0, 9063.0, 3963.0, 1990.0, 1085.0, 655.0, 380.0, 230.0, 152.0, 109.0, 49.0, 45.0, 31.0, 19.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.1887664794921875, -0.182220458984375, -0.1756744384765625, -0.16912841796875, -0.1625823974609375, -0.156036376953125, -0.1494903564453125, -0.1429443359375, -0.1363983154296875, -0.129852294921875, -0.1233062744140625, -0.11676025390625, -0.1102142333984375, -0.103668212890625, -0.0971221923828125, -0.090576171875, -0.0840301513671875, -0.077484130859375, -0.0709381103515625, -0.06439208984375, -0.0578460693359375, -0.051300048828125, -0.0447540283203125, -0.0382080078125, -0.0316619873046875, -0.025115966796875, -0.0185699462890625, -0.01202392578125, -0.0054779052734375, 0.001068115234375, 0.0076141357421875, 0.01416015625, 0.0207061767578125, 0.027252197265625, 0.0337982177734375, 0.04034423828125, 0.0468902587890625, 0.053436279296875, 0.0599822998046875, 0.0665283203125, 0.0730743408203125, 0.079620361328125, 0.0861663818359375, 0.09271240234375, 0.0992584228515625, 0.105804443359375, 0.1123504638671875, 0.118896484375, 0.1254425048828125, 0.131988525390625, 0.1385345458984375, 0.14508056640625, 0.1516265869140625, 0.158172607421875, 0.1647186279296875, 0.1712646484375, 0.1778106689453125, 0.184356689453125, 0.1909027099609375, 0.19744873046875, 0.2039947509765625, 0.210540771484375, 0.2170867919921875, 0.2236328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 5.0, 4.0, 6.0, 10.0, 11.0, 6.0, 20.0, 51.0, 94.0, 423.0, 2936.0, 285.0, 83.0, 42.0, 30.0, 16.0, 11.0, 9.0, 7.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.0965127944946289, -0.09311103820800781, -0.08970928192138672, -0.08630752563476562, -0.08290576934814453, -0.07950401306152344, -0.07610225677490234, -0.07270050048828125, -0.06929874420166016, -0.06589698791503906, -0.06249523162841797, -0.059093475341796875, -0.05569171905517578, -0.05228996276855469, -0.048888206481933594, -0.0454864501953125, -0.042084693908691406, -0.03868293762207031, -0.03528118133544922, -0.031879425048828125, -0.02847766876220703, -0.025075912475585938, -0.021674156188964844, -0.01827239990234375, -0.014870643615722656, -0.011468887329101562, -0.008067131042480469, -0.004665374755859375, -0.0012636184692382812, 0.0021381378173828125, 0.005539894104003906, 0.008941650390625, 0.012343406677246094, 0.015745162963867188, 0.01914691925048828, 0.022548675537109375, 0.02595043182373047, 0.029352188110351562, 0.032753944396972656, 0.03615570068359375, 0.039557456970214844, 0.04295921325683594, 0.04636096954345703, 0.049762725830078125, 0.05316448211669922, 0.05656623840332031, 0.059967994689941406, 0.0633697509765625, 0.0667715072631836, 0.07017326354980469, 0.07357501983642578, 0.07697677612304688, 0.08037853240966797, 0.08378028869628906, 0.08718204498291016, 0.09058380126953125, 0.09398555755615234, 0.09738731384277344, 0.10078907012939453, 0.10419082641601562, 0.10759258270263672, 0.11099433898925781, 0.1143960952758789, 0.1177978515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 13.0, 58.0, 174.0, 328.0, 255.0, 111.0, 39.0, 15.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4735005795955658, -0.4494094252586365, -0.42531827092170715, -0.40122711658477783, -0.3771359622478485, -0.3530448079109192, -0.3289536237716675, -0.30486249923706055, -0.28077131509780884, -0.2566801607608795, -0.2325890064239502, -0.20849785208702087, -0.18440669775009155, -0.16031554341316223, -0.13622437417507172, -0.1121332198381424, -0.08804208040237427, -0.06395092606544495, -0.03985976800322533, -0.015768609941005707, 0.008322544395923615, 0.032413698732852936, 0.056504860520362854, 0.08059601485729218, 0.1046871691942215, 0.12877832353115082, 0.15286947786808014, 0.17696064710617065, 0.20105180144309998, 0.2251429557800293, 0.24923411011695862, 0.27332526445388794, 0.2974163889884949, 0.3215075433254242, 0.3455986976623535, 0.36968985199928284, 0.39378100633621216, 0.4178721606731415, 0.4419633150100708, 0.4660544991493225, 0.49014562368392944, 0.5142368078231812, 0.5383279323577881, 0.5624191164970398, 0.5865102410316467, 0.6106014251708984, 0.6346925497055054, 0.6587837338447571, 0.6828749179840088, 0.7069661021232605, 0.7310572266578674, 0.7551484107971191, 0.7792395353317261, 0.8033307194709778, 0.8274218440055847, 0.8515130281448364, 0.8756041526794434, 0.8996953368186951, 0.923786461353302, 0.9478776454925537, 0.9719687700271606, 0.9960599541664124, 1.020151138305664, 1.044242262840271, 1.068333387374878]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 10.0, 10.0, 20.0, 37.0, 36.0, 43.0, 51.0, 63.0, 86.0, 79.0, 91.0, 75.0, 77.0, 71.0, 74.0, 55.0, 25.0, 30.0, 23.0, 15.0, 9.0, 12.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31004977226257324, -0.2992687523365021, -0.2884877026081085, -0.27770668268203735, -0.2669256329536438, -0.25614461302757263, -0.24536357820034027, -0.2345825433731079, -0.22380150854587555, -0.2130204737186432, -0.20223943889141083, -0.19145840406417847, -0.1806773841381073, -0.16989633440971375, -0.15911531448364258, -0.14833427965641022, -0.13755324482917786, -0.1267722100019455, -0.11599117517471313, -0.10521014779806137, -0.09442911297082901, -0.08364807814359665, -0.07286705076694489, -0.062086015939712524, -0.051304981112480164, -0.0405239462852478, -0.02974291518330574, -0.018961884081363678, -0.008180849254131317, 0.0026001855731010437, 0.013381212949752808, 0.02416224777698517, 0.03494328260421753, 0.04572431743144989, 0.05650534853339195, 0.06728637963533401, 0.07806741446256638, 0.08884844928979874, 0.0996294766664505, 0.11041051149368286, 0.12119154632091522, 0.13197258114814758, 0.14275361597537994, 0.1535346508026123, 0.16431567072868347, 0.17509672045707703, 0.1858777403831482, 0.19665877521038055, 0.20743981003761292, 0.21822084486484528, 0.22900187969207764, 0.2397828996181488, 0.25056394934654236, 0.2613449692726135, 0.2721260190010071, 0.28290703892707825, 0.2936880588531494, 0.3044690787792206, 0.31525012850761414, 0.3260311484336853, 0.33681219816207886, 0.34759321808815, 0.3583742380142212, 0.36915528774261475, 0.3799363374710083]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 8.0, 20.0, 28.0, 42.0, 59.0, 85.0, 159.0, 264.0, 488.0, 891.0, 1708.0, 3500.0, 7421.0, 17548.0, 47439.0, 152569.0, 419980.0, 267551.0, 80562.0, 27452.0, 10906.0, 4846.0, 2261.0, 1188.0, 654.0, 366.0, 217.0, 112.0, 75.0, 46.0, 26.0, 17.0, 12.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15387535095214844, -0.14832687377929688, -0.1427783966064453, -0.13722991943359375, -0.1316814422607422, -0.12613296508789062, -0.12058448791503906, -0.1150360107421875, -0.10948753356933594, -0.10393905639648438, -0.09839057922363281, -0.09284210205078125, -0.08729362487792969, -0.08174514770507812, -0.07619667053222656, -0.070648193359375, -0.06509971618652344, -0.059551239013671875, -0.05400276184082031, -0.04845428466796875, -0.04290580749511719, -0.037357330322265625, -0.03180885314941406, -0.0262603759765625, -0.020711898803710938, -0.015163421630859375, -0.009614944458007812, -0.00406646728515625, 0.0014820098876953125, 0.007030487060546875, 0.012578964233398438, 0.01812744140625, 0.023675918579101562, 0.029224395751953125, 0.03477287292480469, 0.04032135009765625, 0.04586982727050781, 0.051418304443359375, 0.05696678161621094, 0.0625152587890625, 0.06806373596191406, 0.07361221313476562, 0.07916069030761719, 0.08470916748046875, 0.09025764465332031, 0.09580612182617188, 0.10135459899902344, 0.106903076171875, 0.11245155334472656, 0.11800003051757812, 0.12354850769042969, 0.12909698486328125, 0.1346454620361328, 0.14019393920898438, 0.14574241638183594, 0.1512908935546875, 0.15683937072753906, 0.16238784790039062, 0.1679363250732422, 0.17348480224609375, 0.1790332794189453, 0.18458175659179688, 0.19013023376464844, 0.1956787109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 15.0, 12.0, 23.0, 28.0, 46.0, 49.0, 60.0, 64.0, 65.0, 79.0, 74.0, 73.0, 65.0, 70.0, 64.0, 44.0, 36.0, 34.0, 19.0, 19.0, 17.0, 14.0, 7.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.175537109375, -0.17142391204833984, -0.1673107147216797, -0.16319751739501953, -0.15908432006835938, -0.15497112274169922, -0.15085792541503906, -0.1467447280883789, -0.14263153076171875, -0.1385183334350586, -0.13440513610839844, -0.13029193878173828, -0.12617874145507812, -0.12206554412841797, -0.11795234680175781, -0.11383914947509766, -0.1097259521484375, -0.10561275482177734, -0.10149955749511719, -0.09738636016845703, -0.09327316284179688, -0.08915996551513672, -0.08504676818847656, -0.0809335708618164, -0.07682037353515625, -0.0727071762084961, -0.06859397888183594, -0.06448078155517578, -0.060367584228515625, -0.05625438690185547, -0.05214118957519531, -0.048027992248535156, -0.043914794921875, -0.039801597595214844, -0.03568840026855469, -0.03157520294189453, -0.027462005615234375, -0.02334880828857422, -0.019235610961914062, -0.015122413635253906, -0.01100921630859375, -0.006896018981933594, -0.0027828216552734375, 0.0013303756713867188, 0.005443572998046875, 0.009556770324707031, 0.013669967651367188, 0.017783164978027344, 0.0218963623046875, 0.026009559631347656, 0.030122756958007812, 0.03423595428466797, 0.038349151611328125, 0.04246234893798828, 0.04657554626464844, 0.050688743591308594, 0.05480194091796875, 0.058915138244628906, 0.06302833557128906, 0.06714153289794922, 0.07125473022460938, 0.07536792755126953, 0.07948112487792969, 0.08359432220458984, 0.08770751953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 15.0, 17.0, 17.0, 25.0, 22.0, 30.0, 36.0, 47.0, 67.0, 103.0, 164.0, 207.0, 389.0, 746.0, 1551.0, 4030.0, 11896.0, 42877.0, 240306.0, 605244.0, 104499.0, 23620.0, 7263.0, 2692.0, 1149.0, 558.0, 338.0, 186.0, 142.0, 77.0, 43.0, 44.0, 29.0, 40.0, 21.0, 14.0, 10.0, 7.0, 7.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.272705078125, -0.26497650146484375, -0.2572479248046875, -0.24951934814453125, -0.241790771484375, -0.23406219482421875, -0.2263336181640625, -0.21860504150390625, -0.21087646484375, -0.20314788818359375, -0.1954193115234375, -0.18769073486328125, -0.179962158203125, -0.17223358154296875, -0.1645050048828125, -0.15677642822265625, -0.1490478515625, -0.14131927490234375, -0.1335906982421875, -0.12586212158203125, -0.118133544921875, -0.11040496826171875, -0.1026763916015625, -0.09494781494140625, -0.08721923828125, -0.07949066162109375, -0.0717620849609375, -0.06403350830078125, -0.056304931640625, -0.04857635498046875, -0.0408477783203125, -0.03311920166015625, -0.025390625, -0.01766204833984375, -0.0099334716796875, -0.00220489501953125, 0.005523681640625, 0.01325225830078125, 0.0209808349609375, 0.02870941162109375, 0.03643798828125, 0.04416656494140625, 0.0518951416015625, 0.05962371826171875, 0.067352294921875, 0.07508087158203125, 0.0828094482421875, 0.09053802490234375, 0.0982666015625, 0.10599517822265625, 0.1137237548828125, 0.12145233154296875, 0.129180908203125, 0.13690948486328125, 0.1446380615234375, 0.15236663818359375, 0.16009521484375, 0.16782379150390625, 0.1755523681640625, 0.18328094482421875, 0.191009521484375, 0.19873809814453125, 0.2064666748046875, 0.21419525146484375, 0.221923828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 5.0, 9.0, 16.0, 12.0, 22.0, 15.0, 18.0, 16.0, 19.0, 17.0, 22.0, 29.0, 40.0, 30.0, 42.0, 31.0, 48.0, 34.0, 54.0, 46.0, 45.0, 29.0, 43.0, 33.0, 28.0, 30.0, 51.0, 37.0, 22.0, 20.0, 28.0, 21.0, 10.0, 11.0, 18.0, 8.0, 8.0, 3.0, 1.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.330810546875, -0.3211669921875, -0.3115234375, -0.3018798828125, -0.292236328125, -0.2825927734375, -0.27294921875, -0.2633056640625, -0.253662109375, -0.2440185546875, -0.234375, -0.2247314453125, -0.215087890625, -0.2054443359375, -0.19580078125, -0.1861572265625, -0.176513671875, -0.1668701171875, -0.1572265625, -0.1475830078125, -0.137939453125, -0.1282958984375, -0.11865234375, -0.1090087890625, -0.099365234375, -0.0897216796875, -0.080078125, -0.0704345703125, -0.060791015625, -0.0511474609375, -0.04150390625, -0.0318603515625, -0.022216796875, -0.0125732421875, -0.0029296875, 0.0067138671875, 0.016357421875, 0.0260009765625, 0.03564453125, 0.0452880859375, 0.054931640625, 0.0645751953125, 0.07421875, 0.0838623046875, 0.093505859375, 0.1031494140625, 0.11279296875, 0.1224365234375, 0.132080078125, 0.1417236328125, 0.1513671875, 0.1610107421875, 0.170654296875, 0.1802978515625, 0.18994140625, 0.1995849609375, 0.209228515625, 0.2188720703125, 0.228515625, 0.2381591796875, 0.247802734375, 0.2574462890625, 0.26708984375, 0.2767333984375, 0.286376953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 12.0, 11.0, 20.0, 23.0, 43.0, 70.0, 92.0, 215.0, 327.0, 666.0, 1409.0, 3569.0, 10264.0, 38001.0, 312376.0, 601746.0, 57441.0, 13933.0, 4665.0, 1831.0, 854.0, 446.0, 212.0, 123.0, 74.0, 33.0, 34.0, 18.0, 13.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12773609161376953, -0.12388038635253906, -0.1200246810913086, -0.11616897583007812, -0.11231327056884766, -0.10845756530761719, -0.10460186004638672, -0.10074615478515625, -0.09689044952392578, -0.09303474426269531, -0.08917903900146484, -0.08532333374023438, -0.0814676284790039, -0.07761192321777344, -0.07375621795654297, -0.0699005126953125, -0.06604480743408203, -0.06218910217285156, -0.058333396911621094, -0.054477691650390625, -0.050621986389160156, -0.04676628112792969, -0.04291057586669922, -0.03905487060546875, -0.03519916534423828, -0.03134346008300781, -0.027487754821777344, -0.023632049560546875, -0.019776344299316406, -0.015920639038085938, -0.012064933776855469, -0.008209228515625, -0.004353523254394531, -0.0004978179931640625, 0.0033578872680664062, 0.007213592529296875, 0.011069297790527344, 0.014925003051757812, 0.01878070831298828, 0.02263641357421875, 0.02649211883544922, 0.030347824096679688, 0.034203529357910156, 0.038059234619140625, 0.041914939880371094, 0.04577064514160156, 0.04962635040283203, 0.0534820556640625, 0.05733776092529297, 0.06119346618652344, 0.0650491714477539, 0.06890487670898438, 0.07276058197021484, 0.07661628723144531, 0.08047199249267578, 0.08432769775390625, 0.08818340301513672, 0.09203910827636719, 0.09589481353759766, 0.09975051879882812, 0.1036062240600586, 0.10746192932128906, 0.11131763458251953, 0.11517333984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 22.0, 9.0, 10.0, 16.0, 24.0, 35.0, 23.0, 31.0, 43.0, 77.0, 114.0, 132.0, 120.0, 75.0, 60.0, 50.0, 38.0, 28.0, 19.0, 20.0, 14.0, 5.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5849552154541016e-05, -5.3017400205135345e-05, -5.0185248255729675e-05, -4.7353096306324005e-05, -4.4520944356918335e-05, -4.1688792407512665e-05, -3.8856640458106995e-05, -3.6024488508701324e-05, -3.3192336559295654e-05, -3.0360184609889984e-05, -2.7528032660484314e-05, -2.4695880711078644e-05, -2.1863728761672974e-05, -1.9031576812267303e-05, -1.6199424862861633e-05, -1.3367272913455963e-05, -1.0535120964050293e-05, -7.702969014644623e-06, -4.870817065238953e-06, -2.0386651158332825e-06, 7.934868335723877e-07, 3.625638782978058e-06, 6.457790732383728e-06, 9.289942681789398e-06, 1.2122094631195068e-05, 1.4954246580600739e-05, 1.778639853000641e-05, 2.061855047941208e-05, 2.345070242881775e-05, 2.628285437822342e-05, 2.911500632762909e-05, 3.194715827703476e-05, 3.477931022644043e-05, 3.76114621758461e-05, 4.044361412525177e-05, 4.327576607465744e-05, 4.610791802406311e-05, 4.894006997346878e-05, 5.177222192287445e-05, 5.460437387228012e-05, 5.743652582168579e-05, 6.026867777109146e-05, 6.310082972049713e-05, 6.59329816699028e-05, 6.876513361930847e-05, 7.159728556871414e-05, 7.442943751811981e-05, 7.726158946752548e-05, 8.009374141693115e-05, 8.292589336633682e-05, 8.575804531574249e-05, 8.859019726514816e-05, 9.142234921455383e-05, 9.42545011639595e-05, 9.708665311336517e-05, 9.991880506277084e-05, 0.00010275095701217651, 0.00010558310896158218, 0.00010841526091098785, 0.00011124741286039352, 0.0001140795648097992, 0.00011691171675920486, 0.00011974386870861053, 0.0001225760206580162, 0.00012540817260742188]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 3.0, 10.0, 10.0, 20.0, 20.0, 35.0, 50.0, 72.0, 96.0, 166.0, 322.0, 606.0, 1293.0, 2860.0, 7074.0, 20673.0, 74122.0, 415575.0, 417245.0, 74435.0, 20885.0, 7341.0, 2836.0, 1280.0, 635.0, 338.0, 189.0, 126.0, 78.0, 45.0, 33.0, 21.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.105712890625, -0.10277652740478516, -0.09984016418457031, -0.09690380096435547, -0.09396743774414062, -0.09103107452392578, -0.08809471130371094, -0.0851583480834961, -0.08222198486328125, -0.0792856216430664, -0.07634925842285156, -0.07341289520263672, -0.07047653198242188, -0.06754016876220703, -0.06460380554199219, -0.061667442321777344, -0.0587310791015625, -0.055794715881347656, -0.05285835266113281, -0.04992198944091797, -0.046985626220703125, -0.04404926300048828, -0.04111289978027344, -0.038176536560058594, -0.03524017333984375, -0.032303810119628906, -0.029367446899414062, -0.02643108367919922, -0.023494720458984375, -0.02055835723876953, -0.017621994018554688, -0.014685630798339844, -0.011749267578125, -0.008812904357910156, -0.0058765411376953125, -0.0029401779174804688, -3.814697265625e-06, 0.0029325485229492188, 0.0058689117431640625, 0.008805274963378906, 0.01174163818359375, 0.014678001403808594, 0.017614364624023438, 0.02055072784423828, 0.023487091064453125, 0.02642345428466797, 0.029359817504882812, 0.032296180725097656, 0.0352325439453125, 0.038168907165527344, 0.04110527038574219, 0.04404163360595703, 0.046977996826171875, 0.04991436004638672, 0.05285072326660156, 0.055787086486816406, 0.05872344970703125, 0.061659812927246094, 0.06459617614746094, 0.06753253936767578, 0.07046890258789062, 0.07340526580810547, 0.07634162902832031, 0.07927799224853516, 0.08221435546875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 4.0, 13.0, 19.0, 28.0, 25.0, 34.0, 52.0, 66.0, 92.0, 110.0, 139.0, 107.0, 80.0, 55.0, 57.0, 30.0, 29.0, 15.0, 9.0, 11.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.0774688720703125, -0.073638916015625, -0.0698089599609375, -0.06597900390625, -0.0621490478515625, -0.058319091796875, -0.0544891357421875, -0.0506591796875, -0.0468292236328125, -0.042999267578125, -0.0391693115234375, -0.03533935546875, -0.0315093994140625, -0.027679443359375, -0.0238494873046875, -0.02001953125, -0.0161895751953125, -0.012359619140625, -0.0085296630859375, -0.00469970703125, -0.0008697509765625, 0.002960205078125, 0.0067901611328125, 0.0106201171875, 0.0144500732421875, 0.018280029296875, 0.0221099853515625, 0.02593994140625, 0.0297698974609375, 0.033599853515625, 0.0374298095703125, 0.041259765625, 0.0450897216796875, 0.048919677734375, 0.0527496337890625, 0.05657958984375, 0.0604095458984375, 0.064239501953125, 0.0680694580078125, 0.0718994140625, 0.0757293701171875, 0.079559326171875, 0.0833892822265625, 0.08721923828125, 0.0910491943359375, 0.094879150390625, 0.0987091064453125, 0.1025390625, 0.1063690185546875, 0.110198974609375, 0.1140289306640625, 0.11785888671875, 0.1216888427734375, 0.125518798828125, 0.1293487548828125, 0.1331787109375, 0.1370086669921875, 0.140838623046875, 0.1446685791015625, 0.14849853515625, 0.1523284912109375, 0.156158447265625, 0.1599884033203125, 0.163818359375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 14.0, 62.0, 150.0, 400.0, 267.0, 94.0, 17.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.028061866760254, -0.8768825531005859, -0.7257032990455627, -0.5745240449905396, -0.4233447313308716, -0.2721654176712036, -0.12098616361618042, 0.030193090438842773, 0.18137240409851074, 0.3325516879558563, 0.4837309718132019, 0.6349102258682251, 0.7860895395278931, 0.937268853187561, 1.0884480476379395, 1.2396273612976074, 1.3908066749572754, 1.5419859886169434, 1.6931653022766113, 1.8443444967269897, 1.9955238103866577, 2.1467032432556152, 2.297882318496704, 2.449061632156372, 2.60024094581604, 2.751420259475708, 2.902599573135376, 3.053778886795044, 3.204957962036133, 3.356137275695801, 3.5073165893554688, 3.6584959030151367, 3.8096752166748047, 3.9608545303344727, 4.112033843994141, 4.263213157653809, 4.414392471313477, 4.5655717849731445, 4.7167510986328125, 4.8679304122924805, 5.019109725952148, 5.170289039611816, 5.321468353271484, 5.472647666931152, 5.62382698059082, 5.775006294250488, 5.926185607910156, 6.077364921569824, 6.228543758392334, 6.379723072052002, 6.53090238571167, 6.682081699371338, 6.833261013031006, 6.984440326690674, 7.135619640350342, 7.286798477172852, 7.4379777908325195, 7.5891571044921875, 7.7403364181518555, 7.891515731811523, 8.042695045471191, 8.19387435913086, 8.345053672790527, 8.496232986450195, 8.647412300109863]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 11.0, 4.0, 10.0, 10.0, 10.0, 12.0, 18.0, 15.0, 22.0, 28.0, 20.0, 28.0, 34.0, 25.0, 49.0, 40.0, 29.0, 37.0, 44.0, 48.0, 38.0, 46.0, 45.0, 30.0, 45.0, 36.0, 35.0, 28.0, 26.0, 39.0, 30.0, 22.0, 17.0, 11.0, 9.0, 17.0, 8.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5384279489517212, -1.4869585037231445, -1.4354890584945679, -1.3840196132659912, -1.3325501680374146, -1.281080722808838, -1.2296111583709717, -1.1781418323516846, -1.1266722679138184, -1.0752028226852417, -1.023733377456665, -0.9722639322280884, -0.9207944869995117, -0.8693250417709351, -0.8178555369377136, -0.766386091709137, -0.7149167060852051, -0.6634472608566284, -0.6119778156280518, -0.5605083703994751, -0.5090389251708984, -0.4575694501399994, -0.40609997510910034, -0.3546305298805237, -0.303161084651947, -0.25169163942337036, -0.2002221792936325, -0.14875271916389465, -0.097283273935318, -0.04581382870674133, 0.005655646324157715, 0.057125091552734375, 0.10859441757202148, 0.16006386280059814, 0.211533322930336, 0.26300278306007385, 0.3144722282886505, 0.3659416735172272, 0.4174111485481262, 0.4688805937767029, 0.5203500390052795, 0.5718194842338562, 0.6232889294624329, 0.6747584342956543, 0.726227879524231, 0.7776973247528076, 0.8291667699813843, 0.8806362152099609, 0.9321056604385376, 0.9835751056671143, 1.035044550895691, 1.0865139961242676, 1.1379834413528442, 1.189452886581421, 1.240922451019287, 1.2923917770385742, 1.3438613414764404, 1.395330786705017, 1.4468002319335938, 1.4982696771621704, 1.549739122390747, 1.6012085676193237, 1.6526780128479004, 1.7041475772857666, 1.7556169033050537]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 13.0, 12.0, 14.0, 13.0, 24.0, 22.0, 28.0, 40.0, 57.0, 79.0, 105.0, 158.0, 194.0, 333.0, 618.0, 1136.0, 1845.0, 3949.0, 9611.0, 33717.0, 3206375.0, 889245.0, 29866.0, 8674.0, 3703.0, 1861.0, 921.0, 575.0, 386.0, 204.0, 135.0, 100.0, 71.0, 45.0, 35.0, 30.0, 22.0, 13.0, 17.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0], "bins": [-0.2939453125, -0.2865886688232422, -0.2792320251464844, -0.27187538146972656, -0.26451873779296875, -0.25716209411621094, -0.24980545043945312, -0.2424488067626953, -0.2350921630859375, -0.2277355194091797, -0.22037887573242188, -0.21302223205566406, -0.20566558837890625, -0.19830894470214844, -0.19095230102539062, -0.1835956573486328, -0.176239013671875, -0.1688823699951172, -0.16152572631835938, -0.15416908264160156, -0.14681243896484375, -0.13945579528808594, -0.13209915161132812, -0.12474250793457031, -0.1173858642578125, -0.11002922058105469, -0.10267257690429688, -0.09531593322753906, -0.08795928955078125, -0.08060264587402344, -0.07324600219726562, -0.06588935852050781, -0.05853271484375, -0.05117607116699219, -0.043819427490234375, -0.03646278381347656, -0.02910614013671875, -0.021749496459960938, -0.014392852783203125, -0.0070362091064453125, 0.0003204345703125, 0.0076770782470703125, 0.015033721923828125, 0.022390365600585938, 0.02974700927734375, 0.03710365295410156, 0.044460296630859375, 0.05181694030761719, 0.059173583984375, 0.06653022766113281, 0.07388687133789062, 0.08124351501464844, 0.08860015869140625, 0.09595680236816406, 0.10331344604492188, 0.11067008972167969, 0.1180267333984375, 0.1253833770751953, 0.13274002075195312, 0.14009666442871094, 0.14745330810546875, 0.15480995178222656, 0.16216659545898438, 0.1695232391357422, 0.1768798828125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 17.0, 24.0, 25.0, 29.0, 40.0, 48.0, 38.0, 58.0, 75.0, 67.0, 69.0, 56.0, 72.0, 85.0, 57.0, 40.0, 51.0, 26.0, 24.0, 16.0, 18.0, 14.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1748046875, -0.17061710357666016, -0.1664295196533203, -0.16224193572998047, -0.15805435180664062, -0.15386676788330078, -0.14967918395996094, -0.1454916000366211, -0.14130401611328125, -0.1371164321899414, -0.13292884826660156, -0.12874126434326172, -0.12455368041992188, -0.12036609649658203, -0.11617851257324219, -0.11199092864990234, -0.1078033447265625, -0.10361576080322266, -0.09942817687988281, -0.09524059295654297, -0.09105300903320312, -0.08686542510986328, -0.08267784118652344, -0.0784902572631836, -0.07430267333984375, -0.0701150894165039, -0.06592750549316406, -0.06173992156982422, -0.057552337646484375, -0.05336475372314453, -0.04917716979980469, -0.044989585876464844, -0.040802001953125, -0.036614418029785156, -0.03242683410644531, -0.02823925018310547, -0.024051666259765625, -0.01986408233642578, -0.015676498413085938, -0.011488914489746094, -0.00730133056640625, -0.0031137466430664062, 0.0010738372802734375, 0.005261421203613281, 0.009449005126953125, 0.013636589050292969, 0.017824172973632812, 0.022011756896972656, 0.0261993408203125, 0.030386924743652344, 0.03457450866699219, 0.03876209259033203, 0.042949676513671875, 0.04713726043701172, 0.05132484436035156, 0.055512428283691406, 0.05970001220703125, 0.0638875961303711, 0.06807518005371094, 0.07226276397705078, 0.07645034790039062, 0.08063793182373047, 0.08482551574707031, 0.08901309967041016, 0.09320068359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 9.0, 13.0, 15.0, 25.0, 52.0, 50.0, 106.0, 156.0, 265.0, 489.0, 859.0, 1601.0, 3082.0, 6960.0, 24987.0, 1295279.0, 2819737.0, 26576.0, 7230.0, 3065.0, 1612.0, 899.0, 493.0, 296.0, 176.0, 81.0, 62.0, 35.0, 15.0, 18.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17724609375, -0.17016220092773438, -0.16307830810546875, -0.15599441528320312, -0.1489105224609375, -0.14182662963867188, -0.13474273681640625, -0.12765884399414062, -0.120574951171875, -0.11349105834960938, -0.10640716552734375, -0.09932327270507812, -0.0922393798828125, -0.08515548706054688, -0.07807159423828125, -0.07098770141601562, -0.06390380859375, -0.056819915771484375, -0.04973602294921875, -0.042652130126953125, -0.0355682373046875, -0.028484344482421875, -0.02140045166015625, -0.014316558837890625, -0.007232666015625, -0.000148773193359375, 0.00693511962890625, 0.014019012451171875, 0.0211029052734375, 0.028186798095703125, 0.03527069091796875, 0.042354583740234375, 0.0494384765625, 0.056522369384765625, 0.06360626220703125, 0.07069015502929688, 0.0777740478515625, 0.08485794067382812, 0.09194183349609375, 0.09902572631835938, 0.106109619140625, 0.11319351196289062, 0.12027740478515625, 0.12736129760742188, 0.1344451904296875, 0.14152908325195312, 0.14861297607421875, 0.15569686889648438, 0.16278076171875, 0.16986465454101562, 0.17694854736328125, 0.18403244018554688, 0.1911163330078125, 0.19820022583007812, 0.20528411865234375, 0.21236801147460938, 0.219451904296875, 0.22653579711914062, 0.23361968994140625, 0.24070358276367188, 0.2477874755859375, 0.2548713684082031, 0.26195526123046875, 0.2690391540527344, 0.276123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 13.0, 14.0, 23.0, 50.0, 89.0, 676.0, 2880.0, 141.0, 60.0, 37.0, 23.0, 13.0, 8.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.14308929443359375, -0.1383514404296875, -0.13361358642578125, -0.128875732421875, -0.12413787841796875, -0.1194000244140625, -0.11466217041015625, -0.10992431640625, -0.10518646240234375, -0.1004486083984375, -0.09571075439453125, -0.090972900390625, -0.08623504638671875, -0.0814971923828125, -0.07675933837890625, -0.072021484375, -0.06728363037109375, -0.0625457763671875, -0.05780792236328125, -0.053070068359375, -0.04833221435546875, -0.0435943603515625, -0.03885650634765625, -0.03411865234375, -0.02938079833984375, -0.0246429443359375, -0.01990509033203125, -0.015167236328125, -0.01042938232421875, -0.0056915283203125, -0.00095367431640625, 0.0037841796875, 0.00852203369140625, 0.0132598876953125, 0.01799774169921875, 0.022735595703125, 0.02747344970703125, 0.0322113037109375, 0.03694915771484375, 0.04168701171875, 0.04642486572265625, 0.0511627197265625, 0.05590057373046875, 0.060638427734375, 0.06537628173828125, 0.0701141357421875, 0.07485198974609375, 0.07958984375, 0.08432769775390625, 0.0890655517578125, 0.09380340576171875, 0.098541259765625, 0.10327911376953125, 0.1080169677734375, 0.11275482177734375, 0.11749267578125, 0.12223052978515625, 0.1269683837890625, 0.13170623779296875, 0.136444091796875, 0.14118194580078125, 0.1459197998046875, 0.15065765380859375, 0.1553955078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 65.0, 778.0, 141.0, 18.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8055806756019592, -0.7213149666786194, -0.6370493173599243, -0.5527836084365845, -0.46851789951324463, -0.3842521905899048, -0.2999865412712097, -0.21572083234786987, -0.13145512342453003, -0.04718942940235138, 0.03707626461982727, 0.12134194374084473, 0.20560765266418457, 0.2898733615875244, 0.3741390109062195, 0.4584047198295593, 0.5426704287528992, 0.626936137676239, 0.7112017869949341, 0.7954674959182739, 0.8797332048416138, 0.9639989137649536, 1.048264503479004, 1.1325302124023438, 1.2167959213256836, 1.3010616302490234, 1.3853273391723633, 1.4695930480957031, 1.553858757019043, 1.6381244659423828, 1.722390055656433, 1.806655764579773, 1.8909215927124023, 1.9751873016357422, 2.059453010559082, 2.143718719482422, 2.2279844284057617, 2.3122501373291016, 2.3965158462524414, 2.4807815551757812, 2.565047264099121, 2.649312973022461, 2.733578681945801, 2.8178443908691406, 2.9021100997924805, 2.9863758087158203, 3.07064151763916, 3.1549072265625, 3.2391726970672607, 3.3234384059906006, 3.4077041149139404, 3.4919698238372803, 3.57623553276062, 3.66050124168396, 3.7447667121887207, 3.8290324211120605, 3.9132981300354004, 3.9975638389587402, 4.08182954788208, 4.16609525680542, 4.25036096572876, 4.3346266746521, 4.4188923835754395, 4.503158092498779, 4.587423801422119]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 10.0, 11.0, 25.0, 31.0, 39.0, 41.0, 60.0, 65.0, 52.0, 75.0, 70.0, 69.0, 77.0, 67.0, 48.0, 63.0, 53.0, 28.0, 29.0, 20.0, 17.0, 11.0, 11.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3940753936767578, -0.3810008764266968, -0.36792638897895813, -0.3548518717288971, -0.34177735447883606, -0.3287028670310974, -0.3156283497810364, -0.30255383253097534, -0.2894793152809143, -0.27640479803085327, -0.2633303105831146, -0.2502557933330536, -0.23718127608299255, -0.2241067737340927, -0.21103227138519287, -0.19795775413513184, -0.1848832666873932, -0.17180876433849335, -0.1587342470884323, -0.14565974473953247, -0.13258522748947144, -0.1195107251405716, -0.10643622279167175, -0.09336171299219131, -0.08028720319271088, -0.06721269339323044, -0.0541381873190403, -0.04106368124485016, -0.02798917144536972, -0.014914661645889282, -0.001840159296989441, 0.011234350502490997, 0.024308860301971436, 0.037383370101451874, 0.050457876175642014, 0.06353238224983215, 0.07660689204931259, 0.08968140184879303, 0.10275590419769287, 0.11583041399717331, 0.12890492379665375, 0.1419794261455536, 0.15505394339561462, 0.16812844574451447, 0.1812029480934143, 0.19427746534347534, 0.20735196769237518, 0.22042647004127502, 0.23350098729133606, 0.2465754896402359, 0.25964999198913574, 0.2727245092391968, 0.2857990264892578, 0.29887354373931885, 0.3119480311870575, 0.32502254843711853, 0.3380970358848572, 0.3511715531349182, 0.36424604058265686, 0.3773205578327179, 0.39039507508277893, 0.4034695625305176, 0.4165440797805786, 0.42961859703063965, 0.4426931142807007]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 9.0, 26.0, 40.0, 55.0, 104.0, 188.0, 463.0, 1272.0, 3900.0, 14619.0, 70514.0, 523064.0, 366492.0, 51584.0, 11346.0, 3079.0, 1028.0, 386.0, 172.0, 79.0, 48.0, 16.0, 17.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.371826171875, -0.36250877380371094, -0.3531913757324219, -0.3438739776611328, -0.33455657958984375, -0.3252391815185547, -0.3159217834472656, -0.30660438537597656, -0.2972869873046875, -0.28796958923339844, -0.2786521911621094, -0.2693347930908203, -0.26001739501953125, -0.2506999969482422, -0.24138259887695312, -0.23206520080566406, -0.222747802734375, -0.21343040466308594, -0.20411300659179688, -0.1947956085205078, -0.18547821044921875, -0.1761608123779297, -0.16684341430664062, -0.15752601623535156, -0.1482086181640625, -0.13889122009277344, -0.12957382202148438, -0.12025642395019531, -0.11093902587890625, -0.10162162780761719, -0.09230422973632812, -0.08298683166503906, -0.07366943359375, -0.06435203552246094, -0.055034637451171875, -0.04571723937988281, -0.03639984130859375, -0.027082443237304688, -0.017765045166015625, -0.008447647094726562, 0.0008697509765625, 0.010187149047851562, 0.019504547119140625, 0.028821945190429688, 0.03813934326171875, 0.04745674133300781, 0.056774139404296875, 0.06609153747558594, 0.075408935546875, 0.08472633361816406, 0.09404373168945312, 0.10336112976074219, 0.11267852783203125, 0.12199592590332031, 0.13131332397460938, 0.14063072204589844, 0.1499481201171875, 0.15926551818847656, 0.16858291625976562, 0.1779003143310547, 0.18721771240234375, 0.1965351104736328, 0.20585250854492188, 0.21516990661621094, 0.2244873046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 5.0, 15.0, 11.0, 35.0, 23.0, 31.0, 34.0, 39.0, 58.0, 51.0, 62.0, 81.0, 67.0, 61.0, 74.0, 77.0, 59.0, 46.0, 27.0, 35.0, 25.0, 14.0, 17.0, 15.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.171142578125, -0.16692733764648438, -0.16271209716796875, -0.15849685668945312, -0.1542816162109375, -0.15006637573242188, -0.14585113525390625, -0.14163589477539062, -0.137420654296875, -0.13320541381835938, -0.12899017333984375, -0.12477493286132812, -0.1205596923828125, -0.11634445190429688, -0.11212921142578125, -0.10791397094726562, -0.10369873046875, -0.09948348999023438, -0.09526824951171875, -0.09105300903320312, -0.0868377685546875, -0.08262252807617188, -0.07840728759765625, -0.07419204711914062, -0.069976806640625, -0.06576156616210938, -0.06154632568359375, -0.057331085205078125, -0.0531158447265625, -0.048900604248046875, -0.04468536376953125, -0.040470123291015625, -0.0362548828125, -0.032039642333984375, -0.02782440185546875, -0.023609161376953125, -0.0193939208984375, -0.015178680419921875, -0.01096343994140625, -0.006748199462890625, -0.002532958984375, 0.001682281494140625, 0.00589752197265625, 0.010112762451171875, 0.0143280029296875, 0.018543243408203125, 0.02275848388671875, 0.026973724365234375, 0.03118896484375, 0.035404205322265625, 0.03961944580078125, 0.043834686279296875, 0.0480499267578125, 0.052265167236328125, 0.05648040771484375, 0.060695648193359375, 0.064910888671875, 0.06912612915039062, 0.07334136962890625, 0.07755661010742188, 0.0817718505859375, 0.08598709106445312, 0.09020233154296875, 0.09441757202148438, 0.0986328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 14.0, 15.0, 24.0, 20.0, 40.0, 52.0, 67.0, 83.0, 95.0, 149.0, 285.0, 487.0, 1242.0, 5165.0, 29484.0, 359840.0, 599026.0, 42496.0, 6896.0, 1537.0, 550.0, 295.0, 186.0, 133.0, 92.0, 62.0, 56.0, 33.0, 27.0, 23.0, 16.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3753776550292969, -0.36525726318359375, -0.3551368713378906, -0.3450164794921875, -0.3348960876464844, -0.32477569580078125, -0.3146553039550781, -0.304534912109375, -0.2944145202636719, -0.28429412841796875, -0.2741737365722656, -0.2640533447265625, -0.2539329528808594, -0.24381256103515625, -0.23369216918945312, -0.22357177734375, -0.21345138549804688, -0.20333099365234375, -0.19321060180664062, -0.1830902099609375, -0.17296981811523438, -0.16284942626953125, -0.15272903442382812, -0.142608642578125, -0.13248825073242188, -0.12236785888671875, -0.11224746704101562, -0.1021270751953125, -0.09200668334960938, -0.08188629150390625, -0.07176589965820312, -0.0616455078125, -0.051525115966796875, -0.04140472412109375, -0.031284332275390625, -0.0211639404296875, -0.011043548583984375, -0.00092315673828125, 0.009197235107421875, 0.019317626953125, 0.029438018798828125, 0.03955841064453125, 0.049678802490234375, 0.0597991943359375, 0.06991958618164062, 0.08003997802734375, 0.09016036987304688, 0.10028076171875, 0.11040115356445312, 0.12052154541015625, 0.13064193725585938, 0.1407623291015625, 0.15088272094726562, 0.16100311279296875, 0.17112350463867188, 0.181243896484375, 0.19136428833007812, 0.20148468017578125, 0.21160507202148438, 0.2217254638671875, 0.23184585571289062, 0.24196624755859375, 0.2520866394042969, 0.26220703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 6.0, 6.0, 5.0, 17.0, 2.0, 10.0, 10.0, 15.0, 15.0, 30.0, 20.0, 24.0, 24.0, 32.0, 28.0, 35.0, 27.0, 40.0, 37.0, 49.0, 32.0, 42.0, 48.0, 42.0, 33.0, 37.0, 24.0, 30.0, 29.0, 24.0, 24.0, 20.0, 28.0, 25.0, 18.0, 14.0, 14.0, 2.0, 12.0, 8.0, 7.0, 8.0, 8.0, 4.0, 7.0, 4.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.328125, -0.3183135986328125, -0.308502197265625, -0.2986907958984375, -0.28887939453125, -0.2790679931640625, -0.269256591796875, -0.2594451904296875, -0.2496337890625, -0.2398223876953125, -0.230010986328125, -0.2201995849609375, -0.21038818359375, -0.2005767822265625, -0.190765380859375, -0.1809539794921875, -0.171142578125, -0.1613311767578125, -0.151519775390625, -0.1417083740234375, -0.13189697265625, -0.1220855712890625, -0.112274169921875, -0.1024627685546875, -0.0926513671875, -0.0828399658203125, -0.073028564453125, -0.0632171630859375, -0.05340576171875, -0.0435943603515625, -0.033782958984375, -0.0239715576171875, -0.01416015625, -0.0043487548828125, 0.005462646484375, 0.0152740478515625, 0.02508544921875, 0.0348968505859375, 0.044708251953125, 0.0545196533203125, 0.0643310546875, 0.0741424560546875, 0.083953857421875, 0.0937652587890625, 0.10357666015625, 0.1133880615234375, 0.123199462890625, 0.1330108642578125, 0.142822265625, 0.1526336669921875, 0.162445068359375, 0.1722564697265625, 0.18206787109375, 0.1918792724609375, 0.201690673828125, 0.2115020751953125, 0.2213134765625, 0.2311248779296875, 0.240936279296875, 0.2507476806640625, 0.26055908203125, 0.2703704833984375, 0.280181884765625, 0.2899932861328125, 0.2998046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 14.0, 17.0, 43.0, 43.0, 43.0, 73.0, 133.0, 212.0, 306.0, 523.0, 759.0, 1376.0, 2532.0, 5005.0, 10865.0, 31268.0, 232107.0, 679824.0, 53790.0, 15404.0, 6683.0, 3149.0, 1724.0, 995.0, 618.0, 363.0, 213.0, 133.0, 108.0, 65.0, 47.0, 34.0, 18.0, 17.0, 10.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10758113861083984, -0.10401725769042969, -0.10045337677001953, -0.09688949584960938, -0.09332561492919922, -0.08976173400878906, -0.0861978530883789, -0.08263397216796875, -0.0790700912475586, -0.07550621032714844, -0.07194232940673828, -0.06837844848632812, -0.06481456756591797, -0.06125068664550781, -0.057686805725097656, -0.0541229248046875, -0.050559043884277344, -0.04699516296386719, -0.04343128204345703, -0.039867401123046875, -0.03630352020263672, -0.03273963928222656, -0.029175758361816406, -0.02561187744140625, -0.022047996520996094, -0.018484115600585938, -0.014920234680175781, -0.011356353759765625, -0.007792472839355469, -0.0042285919189453125, -0.0006647109985351562, 0.002899169921875, 0.006463050842285156, 0.010026931762695312, 0.013590812683105469, 0.017154693603515625, 0.02071857452392578, 0.024282455444335938, 0.027846336364746094, 0.03141021728515625, 0.034974098205566406, 0.03853797912597656, 0.04210186004638672, 0.045665740966796875, 0.04922962188720703, 0.05279350280761719, 0.056357383728027344, 0.0599212646484375, 0.06348514556884766, 0.06704902648925781, 0.07061290740966797, 0.07417678833007812, 0.07774066925048828, 0.08130455017089844, 0.0848684310913086, 0.08843231201171875, 0.0919961929321289, 0.09556007385253906, 0.09912395477294922, 0.10268783569335938, 0.10625171661376953, 0.10981559753417969, 0.11337947845458984, 0.116943359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 2.0, 8.0, 9.0, 10.0, 10.0, 21.0, 19.0, 29.0, 28.0, 38.0, 41.0, 66.0, 70.0, 82.0, 83.0, 101.0, 76.0, 63.0, 52.0, 40.0, 32.0, 28.0, 22.0, 16.0, 10.0, 11.0, 10.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.89897346496582e-05, -8.60951840877533e-05, -8.320063352584839e-05, -8.030608296394348e-05, -7.741153240203857e-05, -7.451698184013367e-05, -7.162243127822876e-05, -6.872788071632385e-05, -6.583333015441895e-05, -6.293877959251404e-05, -6.004422903060913e-05, -5.7149678468704224e-05, -5.4255127906799316e-05, -5.136057734489441e-05, -4.84660267829895e-05, -4.5571476221084595e-05, -4.267692565917969e-05, -3.978237509727478e-05, -3.688782453536987e-05, -3.3993273973464966e-05, -3.109872341156006e-05, -2.820417284965515e-05, -2.5309622287750244e-05, -2.2415071725845337e-05, -1.952052116394043e-05, -1.6625970602035522e-05, -1.3731420040130615e-05, -1.0836869478225708e-05, -7.9423189163208e-06, -5.0477683544158936e-06, -2.1532177925109863e-06, 7.413327693939209e-07, 3.635883331298828e-06, 6.530433893203735e-06, 9.424984455108643e-06, 1.231953501701355e-05, 1.5214085578918457e-05, 1.8108636140823364e-05, 2.100318670272827e-05, 2.389773726463318e-05, 2.6792287826538086e-05, 2.9686838388442993e-05, 3.25813889503479e-05, 3.547593951225281e-05, 3.8370490074157715e-05, 4.126504063606262e-05, 4.415959119796753e-05, 4.7054141759872437e-05, 4.9948692321777344e-05, 5.284324288368225e-05, 5.573779344558716e-05, 5.8632344007492065e-05, 6.152689456939697e-05, 6.442144513130188e-05, 6.731599569320679e-05, 7.02105462551117e-05, 7.31050968170166e-05, 7.599964737892151e-05, 7.889419794082642e-05, 8.178874850273132e-05, 8.468329906463623e-05, 8.757784962654114e-05, 9.047240018844604e-05, 9.336695075035095e-05, 9.626150131225586e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 14.0, 19.0, 16.0, 26.0, 44.0, 79.0, 113.0, 189.0, 305.0, 567.0, 957.0, 1631.0, 3173.0, 7040.0, 20140.0, 110660.0, 778897.0, 92848.0, 18414.0, 6488.0, 3046.0, 1615.0, 917.0, 586.0, 290.0, 171.0, 115.0, 73.0, 53.0, 18.0, 20.0, 12.0, 10.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1376953125, -0.1340198516845703, -0.13034439086914062, -0.12666893005371094, -0.12299346923828125, -0.11931800842285156, -0.11564254760742188, -0.11196708679199219, -0.1082916259765625, -0.10461616516113281, -0.10094070434570312, -0.09726524353027344, -0.09358978271484375, -0.08991432189941406, -0.08623886108398438, -0.08256340026855469, -0.078887939453125, -0.07521247863769531, -0.07153701782226562, -0.06786155700683594, -0.06418609619140625, -0.06051063537597656, -0.056835174560546875, -0.05315971374511719, -0.0494842529296875, -0.04580879211425781, -0.042133331298828125, -0.03845787048339844, -0.03478240966796875, -0.031106948852539062, -0.027431488037109375, -0.023756027221679688, -0.02008056640625, -0.016405105590820312, -0.012729644775390625, -0.009054183959960938, -0.00537872314453125, -0.0017032623291015625, 0.001972198486328125, 0.0056476593017578125, 0.0093231201171875, 0.012998580932617188, 0.016674041748046875, 0.020349502563476562, 0.02402496337890625, 0.027700424194335938, 0.031375885009765625, 0.03505134582519531, 0.038726806640625, 0.04240226745605469, 0.046077728271484375, 0.04975318908691406, 0.05342864990234375, 0.05710411071777344, 0.060779571533203125, 0.06445503234863281, 0.0681304931640625, 0.07180595397949219, 0.07548141479492188, 0.07915687561035156, 0.08283233642578125, 0.08650779724121094, 0.09018325805664062, 0.09385871887207031, 0.0975341796875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 14.0, 15.0, 23.0, 30.0, 56.0, 70.0, 118.0, 153.0, 153.0, 114.0, 82.0, 50.0, 26.0, 16.0, 12.0, 11.0, 3.0, 10.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.13057327270507812, -0.12662506103515625, -0.12267684936523438, -0.1187286376953125, -0.11478042602539062, -0.11083221435546875, -0.10688400268554688, -0.102935791015625, -0.09898757934570312, -0.09503936767578125, -0.09109115600585938, -0.0871429443359375, -0.08319473266601562, -0.07924652099609375, -0.07529830932617188, -0.07135009765625, -0.06740188598632812, -0.06345367431640625, -0.059505462646484375, -0.0555572509765625, -0.051609039306640625, -0.04766082763671875, -0.043712615966796875, -0.039764404296875, -0.035816192626953125, -0.03186798095703125, -0.027919769287109375, -0.0239715576171875, -0.020023345947265625, -0.01607513427734375, -0.012126922607421875, -0.0081787109375, -0.004230499267578125, -0.00028228759765625, 0.003665924072265625, 0.0076141357421875, 0.011562347412109375, 0.01551055908203125, 0.019458770751953125, 0.023406982421875, 0.027355194091796875, 0.03130340576171875, 0.035251617431640625, 0.0391998291015625, 0.043148040771484375, 0.04709625244140625, 0.051044464111328125, 0.05499267578125, 0.058940887451171875, 0.06288909912109375, 0.06683731079101562, 0.0707855224609375, 0.07473373413085938, 0.07868194580078125, 0.08263015747070312, 0.086578369140625, 0.09052658081054688, 0.09447479248046875, 0.09842300415039062, 0.1023712158203125, 0.10631942749023438, 0.11026763916015625, 0.11421585083007812, 0.1181640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 16.0, 60.0, 116.0, 180.0, 221.0, 192.0, 97.0, 59.0, 28.0, 16.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0002601146697998, -0.9190535545349121, -0.8378469944000244, -0.7566404342651367, -0.675433874130249, -0.5942273139953613, -0.5130207538604736, -0.43181419372558594, -0.35060763359069824, -0.26940107345581055, -0.18819451332092285, -0.10698795318603516, -0.02578139305114746, 0.055425167083740234, 0.13663172721862793, 0.21783828735351562, 0.2990448474884033, 0.380251407623291, 0.4614579677581787, 0.5426645278930664, 0.6238710880279541, 0.7050776481628418, 0.7862842082977295, 0.8674907684326172, 0.9486973285675049, 1.0299038887023926, 1.1111104488372803, 1.192317008972168, 1.2735235691070557, 1.3547301292419434, 1.435936689376831, 1.5171432495117188, 1.5983495712280273, 1.679556131362915, 1.7607626914978027, 1.8419692516326904, 1.9231758117675781, 2.004382371902466, 2.0855889320373535, 2.166795492172241, 2.248002052307129, 2.3292086124420166, 2.4104151725769043, 2.491621732711792, 2.5728282928466797, 2.6540348529815674, 2.735241413116455, 2.8164479732513428, 2.8976545333862305, 2.978861093521118, 3.060067653656006, 3.1412742137908936, 3.2224807739257812, 3.303687334060669, 3.3848938941955566, 3.4661004543304443, 3.547307014465332, 3.6285135746002197, 3.7097201347351074, 3.790926694869995, 3.872133255004883, 3.9533398151397705, 4.034546375274658, 4.115753173828125, 4.196959495544434]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 13.0, 19.0, 26.0, 23.0, 25.0, 34.0, 38.0, 43.0, 53.0, 46.0, 54.0, 67.0, 52.0, 64.0, 57.0, 55.0, 57.0, 32.0, 30.0, 43.0, 25.0, 27.0, 17.0, 19.0, 10.0, 13.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.409971237182617, -2.3364856243133545, -2.263000249862671, -2.189514636993408, -2.1160292625427246, -2.042543649673462, -1.9690580368041992, -1.895572543144226, -1.822087049484253, -1.7486015558242798, -1.6751160621643066, -1.601630449295044, -1.5281449556350708, -1.4546594619750977, -1.381173849105835, -1.3076883554458618, -1.2342028617858887, -1.1607173681259155, -1.0872318744659424, -1.0137462615966797, -0.9402607679367065, -0.8667752742767334, -0.7932897210121155, -0.7198041677474976, -0.6463186740875244, -0.5728331804275513, -0.49934762716293335, -0.4258621037006378, -0.3523765802383423, -0.27889105677604675, -0.20540553331375122, -0.1319199800491333, -0.05843472480773926, 0.015050798654556274, 0.0885363221168518, 0.16202184557914734, 0.23550736904144287, 0.3089928925037384, 0.38247841596603394, 0.45596396923065186, 0.529449462890625, 0.6029349565505981, 0.6764205098152161, 0.749906063079834, 0.8233915567398071, 0.8968770503997803, 0.9703626036643982, 1.0438481569290161, 1.1173336505889893, 1.1908191442489624, 1.2643046379089355, 1.3377902507781982, 1.4112757444381714, 1.4847612380981445, 1.5582468509674072, 1.6317323446273804, 1.7052178382873535, 1.7787033319473267, 1.8521888256072998, 1.9256744384765625, 1.9991599321365356, 2.072645425796509, 2.1461310386657715, 2.219616413116455, 2.2931020259857178]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 5.0, 24.0, 36.0, 86.0, 207.0, 704.0, 5970.0, 4136410.0, 48134.0, 2064.0, 378.0, 120.0, 50.0, 27.0, 16.0, 6.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.5380859375, -0.5270500183105469, -0.5160140991210938, -0.5049781799316406, -0.4939422607421875, -0.4829063415527344, -0.47187042236328125, -0.4608345031738281, -0.449798583984375, -0.4387626647949219, -0.42772674560546875, -0.4166908264160156, -0.4056549072265625, -0.3946189880371094, -0.38358306884765625, -0.3725471496582031, -0.36151123046875, -0.3504753112792969, -0.33943939208984375, -0.3284034729003906, -0.3173675537109375, -0.3063316345214844, -0.29529571533203125, -0.2842597961425781, -0.273223876953125, -0.2621879577636719, -0.25115203857421875, -0.24011611938476562, -0.2290802001953125, -0.21804428100585938, -0.20700836181640625, -0.19597244262695312, -0.1849365234375, -0.17390060424804688, -0.16286468505859375, -0.15182876586914062, -0.1407928466796875, -0.12975692749023438, -0.11872100830078125, -0.10768508911132812, -0.096649169921875, -0.08561325073242188, -0.07457733154296875, -0.06354141235351562, -0.0525054931640625, -0.041469573974609375, -0.03043365478515625, -0.019397735595703125, -0.00836181640625, 0.002674102783203125, 0.01371002197265625, 0.024745941162109375, 0.0357818603515625, 0.046817779541015625, 0.05785369873046875, 0.06888961791992188, 0.079925537109375, 0.09096145629882812, 0.10199737548828125, 0.11303329467773438, 0.1240692138671875, 0.13510513305664062, 0.14614105224609375, 0.15717697143554688, 0.168212890625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 13.0, 15.0, 28.0, 25.0, 38.0, 55.0, 44.0, 60.0, 54.0, 73.0, 66.0, 68.0, 56.0, 51.0, 47.0, 51.0, 44.0, 43.0, 27.0, 29.0, 15.0, 18.0, 17.0, 13.0, 6.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.17529296875, -0.17093753814697266, -0.1665821075439453, -0.16222667694091797, -0.15787124633789062, -0.15351581573486328, -0.14916038513183594, -0.1448049545288086, -0.14044952392578125, -0.1360940933227539, -0.13173866271972656, -0.12738323211669922, -0.12302780151367188, -0.11867237091064453, -0.11431694030761719, -0.10996150970458984, -0.1056060791015625, -0.10125064849853516, -0.09689521789550781, -0.09253978729248047, -0.08818435668945312, -0.08382892608642578, -0.07947349548339844, -0.0751180648803711, -0.07076263427734375, -0.0664072036743164, -0.06205177307128906, -0.05769634246826172, -0.053340911865234375, -0.04898548126220703, -0.04463005065917969, -0.040274620056152344, -0.035919189453125, -0.031563758850097656, -0.027208328247070312, -0.02285289764404297, -0.018497467041015625, -0.014142036437988281, -0.009786605834960938, -0.005431175231933594, -0.00107574462890625, 0.0032796859741210938, 0.0076351165771484375, 0.011990547180175781, 0.016345977783203125, 0.02070140838623047, 0.025056838989257812, 0.029412269592285156, 0.0337677001953125, 0.038123130798339844, 0.04247856140136719, 0.04683399200439453, 0.051189422607421875, 0.05554485321044922, 0.05990028381347656, 0.0642557144165039, 0.06861114501953125, 0.0729665756225586, 0.07732200622558594, 0.08167743682861328, 0.08603286743164062, 0.09038829803466797, 0.09474372863769531, 0.09909915924072266, 0.10345458984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 0.0, 8.0, 6.0, 8.0, 14.0, 17.0, 22.0, 23.0, 37.0, 70.0, 79.0, 113.0, 164.0, 276.0, 371.0, 694.0, 1628.0, 5222.0, 28842.0, 3970184.0, 168437.0, 12371.0, 2989.0, 1104.0, 530.0, 340.0, 227.0, 166.0, 112.0, 61.0, 49.0, 29.0, 24.0, 23.0, 15.0, 10.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.124267578125, -0.12122058868408203, -0.11817359924316406, -0.1151266098022461, -0.11207962036132812, -0.10903263092041016, -0.10598564147949219, -0.10293865203857422, -0.09989166259765625, -0.09684467315673828, -0.09379768371582031, -0.09075069427490234, -0.08770370483398438, -0.0846567153930664, -0.08160972595214844, -0.07856273651123047, -0.0755157470703125, -0.07246875762939453, -0.06942176818847656, -0.0663747787475586, -0.06332778930664062, -0.060280799865722656, -0.05723381042480469, -0.05418682098388672, -0.05113983154296875, -0.04809284210205078, -0.04504585266113281, -0.041998863220214844, -0.038951873779296875, -0.035904884338378906, -0.03285789489746094, -0.02981090545654297, -0.026763916015625, -0.02371692657470703, -0.020669937133789062, -0.017622947692871094, -0.014575958251953125, -0.011528968811035156, -0.008481979370117188, -0.005434989929199219, -0.00238800048828125, 0.0006589889526367188, 0.0037059783935546875, 0.006752967834472656, 0.009799957275390625, 0.012846946716308594, 0.015893936157226562, 0.01894092559814453, 0.0219879150390625, 0.02503490447998047, 0.028081893920898438, 0.031128883361816406, 0.034175872802734375, 0.037222862243652344, 0.04026985168457031, 0.04331684112548828, 0.04636383056640625, 0.04941082000732422, 0.05245780944824219, 0.055504798889160156, 0.058551788330078125, 0.061598777770996094, 0.06464576721191406, 0.06769275665283203, 0.07073974609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 8.0, 6.0, 17.0, 40.0, 110.0, 3269.0, 474.0, 79.0, 31.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209503173828125, -0.02013993263244629, -0.019329547882080078, -0.018519163131713867, -0.017708778381347656, -0.016898393630981445, -0.016088008880615234, -0.015277624130249023, -0.014467239379882812, -0.013656854629516602, -0.01284646987915039, -0.01203608512878418, -0.011225700378417969, -0.010415315628051758, -0.009604930877685547, -0.008794546127319336, -0.007984161376953125, -0.007173776626586914, -0.006363391876220703, -0.005553007125854492, -0.004742622375488281, -0.00393223762512207, -0.0031218528747558594, -0.0023114681243896484, -0.0015010833740234375, -0.0006906986236572266, 0.00011968612670898438, 0.0009300708770751953, 0.0017404556274414062, 0.002550840377807617, 0.003361225128173828, 0.004171609878540039, 0.00498199462890625, 0.005792379379272461, 0.006602764129638672, 0.007413148880004883, 0.008223533630371094, 0.009033918380737305, 0.009844303131103516, 0.010654687881469727, 0.011465072631835938, 0.012275457382202148, 0.01308584213256836, 0.01389622688293457, 0.014706611633300781, 0.015516996383666992, 0.016327381134033203, 0.017137765884399414, 0.017948150634765625, 0.018758535385131836, 0.019568920135498047, 0.020379304885864258, 0.02118968963623047, 0.02200007438659668, 0.02281045913696289, 0.0236208438873291, 0.024431228637695312, 0.025241613388061523, 0.026051998138427734, 0.026862382888793945, 0.027672767639160156, 0.028483152389526367, 0.029293537139892578, 0.03010392189025879, 0.030914306640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 13.0, 30.0, 180.0, 415.0, 293.0, 70.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35568585991859436, -0.34867897629737854, -0.3416720926761627, -0.3346652090549469, -0.3276583254337311, -0.32065144181251526, -0.31364455819129944, -0.3066376745700836, -0.2996307909488678, -0.292623907327652, -0.28561702370643616, -0.27861014008522034, -0.2716032564640045, -0.2645963728427887, -0.2575894892215729, -0.25058260560035706, -0.24357573688030243, -0.2365688532590866, -0.2295619696378708, -0.22255508601665497, -0.21554820239543915, -0.20854131877422333, -0.2015344500541687, -0.19452756643295288, -0.18752068281173706, -0.18051379919052124, -0.17350691556930542, -0.1665000319480896, -0.15949314832687378, -0.15248626470565796, -0.14547938108444214, -0.13847249746322632, -0.1314656287431717, -0.12445874512195587, -0.11745186150074005, -0.11044497787952423, -0.10343809425830841, -0.09643121063709259, -0.08942433446645737, -0.08241745084524155, -0.07541056722402573, -0.0684036836028099, -0.061396799981594086, -0.054389920085668564, -0.047383036464452744, -0.04037615284323692, -0.0333692729473114, -0.02636238932609558, -0.01935550570487976, -0.012348623014986515, -0.005341740325093269, 0.0016651414334774017, 0.008672025054693222, 0.015678908675909042, 0.022685788571834564, 0.029692672193050385, 0.036699555814266205, 0.043706439435482025, 0.050713323056697845, 0.05772020295262337, 0.06472708284854889, 0.07173396646976471, 0.07874085009098053, 0.08574773371219635, 0.09275461733341217]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 10.0, 9.0, 15.0, 20.0, 10.0, 15.0, 18.0, 20.0, 27.0, 27.0, 23.0, 38.0, 37.0, 47.0, 48.0, 39.0, 56.0, 50.0, 54.0, 51.0, 56.0, 41.0, 50.0, 38.0, 31.0, 25.0, 25.0, 21.0, 21.0, 15.0, 9.0, 9.0, 12.0, 9.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04060918092727661, -0.03935711085796356, -0.03810504078865051, -0.03685297071933746, -0.035600900650024414, -0.034348830580711365, -0.033096760511398315, -0.031844690442085266, -0.030592620372772217, -0.029340550303459167, -0.028088480234146118, -0.02683641016483307, -0.02558434009552002, -0.02433227002620697, -0.02308019995689392, -0.02182812988758087, -0.020576059818267822, -0.019323989748954773, -0.018071919679641724, -0.016819849610328674, -0.015567779541015625, -0.014315709471702576, -0.013063639402389526, -0.011811569333076477, -0.010559499263763428, -0.009307429194450378, -0.008055359125137329, -0.00680328905582428, -0.0055512189865112305, -0.004299148917198181, -0.003047078847885132, -0.0017950087785720825, -0.0005429387092590332, 0.0007091313600540161, 0.0019612014293670654, 0.0032132714986801147, 0.004465341567993164, 0.005717411637306213, 0.006969481706619263, 0.008221551775932312, 0.009473621845245361, 0.01072569191455841, 0.01197776198387146, 0.01322983205318451, 0.014481902122497559, 0.015733972191810608, 0.016986042261123657, 0.018238112330436707, 0.019490182399749756, 0.020742252469062805, 0.021994322538375854, 0.023246392607688904, 0.024498462677001953, 0.025750532746315002, 0.027002602815628052, 0.0282546728849411, 0.02950674295425415, 0.0307588130235672, 0.03201088309288025, 0.0332629531621933, 0.03451502323150635, 0.0357670933008194, 0.037019163370132446, 0.038271233439445496, 0.039523303508758545]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 5.0, 12.0, 8.0, 16.0, 25.0, 41.0, 82.0, 126.0, 185.0, 357.0, 711.0, 1766.0, 4891.0, 17222.0, 78759.0, 494945.0, 370648.0, 58201.0, 13578.0, 4131.0, 1460.0, 629.0, 302.0, 164.0, 107.0, 59.0, 46.0, 27.0, 18.0, 12.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.3408203125, -0.332489013671875, -0.32415771484375, -0.315826416015625, -0.3074951171875, -0.299163818359375, -0.29083251953125, -0.282501220703125, -0.274169921875, -0.265838623046875, -0.25750732421875, -0.249176025390625, -0.2408447265625, -0.232513427734375, -0.22418212890625, -0.215850830078125, -0.20751953125, -0.199188232421875, -0.19085693359375, -0.182525634765625, -0.1741943359375, -0.165863037109375, -0.15753173828125, -0.149200439453125, -0.140869140625, -0.132537841796875, -0.12420654296875, -0.115875244140625, -0.1075439453125, -0.099212646484375, -0.09088134765625, -0.082550048828125, -0.07421875, -0.065887451171875, -0.05755615234375, -0.049224853515625, -0.0408935546875, -0.032562255859375, -0.02423095703125, -0.015899658203125, -0.007568359375, 0.000762939453125, 0.00909423828125, 0.017425537109375, 0.0257568359375, 0.034088134765625, 0.04241943359375, 0.050750732421875, 0.05908203125, 0.067413330078125, 0.07574462890625, 0.084075927734375, 0.0924072265625, 0.100738525390625, 0.10906982421875, 0.117401123046875, 0.125732421875, 0.134063720703125, 0.14239501953125, 0.150726318359375, 0.1590576171875, 0.167388916015625, 0.17572021484375, 0.184051513671875, 0.1923828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 5.0, 20.0, 11.0, 25.0, 29.0, 38.0, 46.0, 48.0, 46.0, 57.0, 65.0, 70.0, 68.0, 53.0, 46.0, 54.0, 49.0, 44.0, 45.0, 34.0, 34.0, 17.0, 16.0, 17.0, 15.0, 11.0, 6.0, 6.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.1724853515625, -0.1682415008544922, -0.16399765014648438, -0.15975379943847656, -0.15550994873046875, -0.15126609802246094, -0.14702224731445312, -0.1427783966064453, -0.1385345458984375, -0.1342906951904297, -0.13004684448242188, -0.12580299377441406, -0.12155914306640625, -0.11731529235839844, -0.11307144165039062, -0.10882759094238281, -0.104583740234375, -0.10033988952636719, -0.09609603881835938, -0.09185218811035156, -0.08760833740234375, -0.08336448669433594, -0.07912063598632812, -0.07487678527832031, -0.0706329345703125, -0.06638908386230469, -0.062145233154296875, -0.05790138244628906, -0.05365753173828125, -0.04941368103027344, -0.045169830322265625, -0.04092597961425781, -0.03668212890625, -0.03243827819824219, -0.028194427490234375, -0.023950576782226562, -0.01970672607421875, -0.015462875366210938, -0.011219024658203125, -0.0069751739501953125, -0.0027313232421875, 0.0015125274658203125, 0.005756378173828125, 0.010000228881835938, 0.01424407958984375, 0.018487930297851562, 0.022731781005859375, 0.026975631713867188, 0.031219482421875, 0.03546333312988281, 0.039707183837890625, 0.04395103454589844, 0.04819488525390625, 0.05243873596191406, 0.056682586669921875, 0.06092643737792969, 0.0651702880859375, 0.06941413879394531, 0.07365798950195312, 0.07790184020996094, 0.08214569091796875, 0.08638954162597656, 0.09063339233398438, 0.09487724304199219, 0.09912109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 17.0, 17.0, 19.0, 22.0, 37.0, 55.0, 64.0, 92.0, 178.0, 265.0, 497.0, 1279.0, 4871.0, 34055.0, 679603.0, 302323.0, 19794.0, 3279.0, 947.0, 415.0, 255.0, 136.0, 81.0, 82.0, 49.0, 35.0, 26.0, 14.0, 12.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33025360107421875, -0.3174896240234375, -0.30472564697265625, -0.291961669921875, -0.27919769287109375, -0.2664337158203125, -0.25366973876953125, -0.24090576171875, -0.22814178466796875, -0.2153778076171875, -0.20261383056640625, -0.189849853515625, -0.17708587646484375, -0.1643218994140625, -0.15155792236328125, -0.1387939453125, -0.12602996826171875, -0.1132659912109375, -0.10050201416015625, -0.087738037109375, -0.07497406005859375, -0.0622100830078125, -0.04944610595703125, -0.03668212890625, -0.02391815185546875, -0.0111541748046875, 0.00160980224609375, 0.014373779296875, 0.02713775634765625, 0.0399017333984375, 0.05266571044921875, 0.0654296875, 0.07819366455078125, 0.0909576416015625, 0.10372161865234375, 0.116485595703125, 0.12924957275390625, 0.1420135498046875, 0.15477752685546875, 0.16754150390625, 0.18030548095703125, 0.1930694580078125, 0.20583343505859375, 0.218597412109375, 0.23136138916015625, 0.2441253662109375, 0.25688934326171875, 0.2696533203125, 0.28241729736328125, 0.2951812744140625, 0.30794525146484375, 0.320709228515625, 0.33347320556640625, 0.3462371826171875, 0.35900115966796875, 0.37176513671875, 0.38452911376953125, 0.3972930908203125, 0.41005706787109375, 0.422821044921875, 0.43558502197265625, 0.4483489990234375, 0.46111297607421875, 0.473876953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 9.0, 5.0, 18.0, 13.0, 22.0, 20.0, 41.0, 35.0, 39.0, 52.0, 56.0, 70.0, 59.0, 62.0, 78.0, 56.0, 62.0, 60.0, 50.0, 44.0, 30.0, 20.0, 23.0, 18.0, 24.0, 5.0, 10.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6979942321777344, -0.6791915893554688, -0.6603889465332031, -0.6415863037109375, -0.6227836608886719, -0.6039810180664062, -0.5851783752441406, -0.566375732421875, -0.5475730895996094, -0.5287704467773438, -0.5099678039550781, -0.4911651611328125, -0.4723625183105469, -0.45355987548828125, -0.4347572326660156, -0.41595458984375, -0.3971519470214844, -0.37834930419921875, -0.3595466613769531, -0.3407440185546875, -0.3219413757324219, -0.30313873291015625, -0.2843360900878906, -0.265533447265625, -0.24673080444335938, -0.22792816162109375, -0.20912551879882812, -0.1903228759765625, -0.17152023315429688, -0.15271759033203125, -0.13391494750976562, -0.1151123046875, -0.09630966186523438, -0.07750701904296875, -0.058704376220703125, -0.0399017333984375, -0.021099090576171875, -0.00229644775390625, 0.016506195068359375, 0.035308837890625, 0.054111480712890625, 0.07291412353515625, 0.09171676635742188, 0.1105194091796875, 0.12932205200195312, 0.14812469482421875, 0.16692733764648438, 0.18572998046875, 0.20453262329101562, 0.22333526611328125, 0.24213790893554688, 0.2609405517578125, 0.2797431945800781, 0.29854583740234375, 0.3173484802246094, 0.336151123046875, 0.3549537658691406, 0.37375640869140625, 0.3925590515136719, 0.4113616943359375, 0.4301643371582031, 0.44896697998046875, 0.4677696228027344, 0.486572265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 9.0, 20.0, 37.0, 52.0, 102.0, 187.0, 448.0, 1375.0, 6197.0, 74370.0, 932338.0, 28167.0, 3673.0, 872.0, 320.0, 137.0, 80.0, 56.0, 37.0, 14.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33349609375, -0.32349395751953125, -0.3134918212890625, -0.30348968505859375, -0.293487548828125, -0.28348541259765625, -0.2734832763671875, -0.26348114013671875, -0.25347900390625, -0.24347686767578125, -0.2334747314453125, -0.22347259521484375, -0.213470458984375, -0.20346832275390625, -0.1934661865234375, -0.18346405029296875, -0.1734619140625, -0.16345977783203125, -0.1534576416015625, -0.14345550537109375, -0.133453369140625, -0.12345123291015625, -0.1134490966796875, -0.10344696044921875, -0.09344482421875, -0.08344268798828125, -0.0734405517578125, -0.06343841552734375, -0.053436279296875, -0.04343414306640625, -0.0334320068359375, -0.02342987060546875, -0.013427734375, -0.00342559814453125, 0.0065765380859375, 0.01657867431640625, 0.026580810546875, 0.03658294677734375, 0.0465850830078125, 0.05658721923828125, 0.06658935546875, 0.07659149169921875, 0.0865936279296875, 0.09659576416015625, 0.106597900390625, 0.11660003662109375, 0.1266021728515625, 0.13660430908203125, 0.1466064453125, 0.15660858154296875, 0.1666107177734375, 0.17661285400390625, 0.186614990234375, 0.19661712646484375, 0.2066192626953125, 0.21662139892578125, 0.22662353515625, 0.23662567138671875, 0.2466278076171875, 0.25662994384765625, 0.266632080078125, 0.27663421630859375, 0.2866363525390625, 0.29663848876953125, 0.306640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 11.0, 25.0, 15.0, 20.0, 21.0, 37.0, 46.0, 53.0, 72.0, 90.0, 79.0, 100.0, 75.0, 86.0, 48.0, 44.0, 38.0, 21.0, 29.0, 20.0, 11.0, 15.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.246566772460938e-05, -6.01746141910553e-05, -5.788356065750122e-05, -5.5592507123947144e-05, -5.3301453590393066e-05, -5.101040005683899e-05, -4.871934652328491e-05, -4.6428292989730835e-05, -4.413723945617676e-05, -4.184618592262268e-05, -3.9555132389068604e-05, -3.7264078855514526e-05, -3.497302532196045e-05, -3.268197178840637e-05, -3.0390918254852295e-05, -2.8099864721298218e-05, -2.580881118774414e-05, -2.3517757654190063e-05, -2.1226704120635986e-05, -1.893565058708191e-05, -1.6644597053527832e-05, -1.4353543519973755e-05, -1.2062489986419678e-05, -9.7714364528656e-06, -7.4803829193115234e-06, -5.189329385757446e-06, -2.898275852203369e-06, -6.07222318649292e-07, 1.6838312149047852e-06, 3.974884748458862e-06, 6.2659382820129395e-06, 8.556991815567017e-06, 1.0848045349121094e-05, 1.3139098882675171e-05, 1.5430152416229248e-05, 1.7721205949783325e-05, 2.0012259483337402e-05, 2.230331301689148e-05, 2.4594366550445557e-05, 2.6885420083999634e-05, 2.917647361755371e-05, 3.146752715110779e-05, 3.3758580684661865e-05, 3.604963421821594e-05, 3.834068775177002e-05, 4.06317412853241e-05, 4.2922794818878174e-05, 4.521384835243225e-05, 4.750490188598633e-05, 4.9795955419540405e-05, 5.208700895309448e-05, 5.437806248664856e-05, 5.666911602020264e-05, 5.8960169553756714e-05, 6.125122308731079e-05, 6.354227662086487e-05, 6.583333015441895e-05, 6.812438368797302e-05, 7.04154372215271e-05, 7.270649075508118e-05, 7.499754428863525e-05, 7.728859782218933e-05, 7.957965135574341e-05, 8.187070488929749e-05, 8.416175842285156e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 7.0, 7.0, 14.0, 23.0, 55.0, 77.0, 126.0, 314.0, 977.0, 5518.0, 139660.0, 886008.0, 13266.0, 1664.0, 474.0, 155.0, 86.0, 52.0, 26.0, 20.0, 12.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2637672424316406, -0.25238800048828125, -0.24100875854492188, -0.2296295166015625, -0.21825027465820312, -0.20687103271484375, -0.19549179077148438, -0.184112548828125, -0.17273330688476562, -0.16135406494140625, -0.14997482299804688, -0.1385955810546875, -0.12721633911132812, -0.11583709716796875, -0.10445785522460938, -0.09307861328125, -0.08169937133789062, -0.07032012939453125, -0.058940887451171875, -0.0475616455078125, -0.036182403564453125, -0.02480316162109375, -0.013423919677734375, -0.002044677734375, 0.009334564208984375, 0.02071380615234375, 0.032093048095703125, 0.0434722900390625, 0.054851531982421875, 0.06623077392578125, 0.07761001586914062, 0.0889892578125, 0.10036849975585938, 0.11174774169921875, 0.12312698364257812, 0.1345062255859375, 0.14588546752929688, 0.15726470947265625, 0.16864395141601562, 0.180023193359375, 0.19140243530273438, 0.20278167724609375, 0.21416091918945312, 0.2255401611328125, 0.23691940307617188, 0.24829864501953125, 0.2596778869628906, 0.27105712890625, 0.2824363708496094, 0.29381561279296875, 0.3051948547363281, 0.3165740966796875, 0.3279533386230469, 0.33933258056640625, 0.3507118225097656, 0.362091064453125, 0.3734703063964844, 0.38484954833984375, 0.3962287902832031, 0.4076080322265625, 0.4189872741699219, 0.43036651611328125, 0.4417457580566406, 0.453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 28.0, 61.0, 325.0, 473.0, 67.0, 20.0, 10.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.5167236328125, -0.494384765625, -0.4720458984375, -0.44970703125, -0.4273681640625, -0.405029296875, -0.3826904296875, -0.3603515625, -0.3380126953125, -0.315673828125, -0.2933349609375, -0.27099609375, -0.2486572265625, -0.226318359375, -0.2039794921875, -0.181640625, -0.1593017578125, -0.136962890625, -0.1146240234375, -0.09228515625, -0.0699462890625, -0.047607421875, -0.0252685546875, -0.0029296875, 0.0194091796875, 0.041748046875, 0.0640869140625, 0.08642578125, 0.1087646484375, 0.131103515625, 0.1534423828125, 0.17578125, 0.1981201171875, 0.220458984375, 0.2427978515625, 0.26513671875, 0.2874755859375, 0.309814453125, 0.3321533203125, 0.3544921875, 0.3768310546875, 0.399169921875, 0.4215087890625, 0.44384765625, 0.4661865234375, 0.488525390625, 0.5108642578125, 0.533203125, 0.5555419921875, 0.577880859375, 0.6002197265625, 0.62255859375, 0.6448974609375, 0.667236328125, 0.6895751953125, 0.7119140625, 0.7342529296875, 0.756591796875, 0.7789306640625, 0.80126953125, 0.8236083984375, 0.845947265625, 0.8682861328125, 0.890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 10.0, 28.0, 53.0, 100.0, 184.0, 213.0, 187.0, 127.0, 57.0, 20.0, 14.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9101192951202393, -2.815542221069336, -2.7209651470184326, -2.6263880729675293, -2.531810998916626, -2.4372339248657227, -2.3426566123962402, -2.248079776763916, -2.1535024642944336, -2.0589253902435303, -1.964348316192627, -1.8697712421417236, -1.7751941680908203, -1.680617094039917, -1.5860399007797241, -1.4914628267288208, -1.396885871887207, -1.3023087978363037, -1.2077317237854004, -1.113154649734497, -1.0185775756835938, -0.9240004420280457, -0.8294233083724976, -0.7348462343215942, -0.6402691602706909, -0.5456920862197876, -0.4511149823665619, -0.3565378785133362, -0.26196080446243286, -0.16738373041152954, -0.07280659675598145, 0.021770477294921875, 0.1163475513458252, 0.2109246402978897, 0.3055017292499542, 0.40007883310317993, 0.49465590715408325, 0.5892329812049866, 0.6838101148605347, 0.778387188911438, 0.8729642629623413, 0.9675413370132446, 1.062118411064148, 1.1566956043243408, 1.2512726783752441, 1.3458497524261475, 1.4404268264770508, 1.535003900527954, 1.6295809745788574, 1.7241580486297607, 1.818735122680664, 1.9133121967315674, 2.0078892707824707, 2.102466344833374, 2.1970434188842773, 2.2916207313537598, 2.386197566986084, 2.4807746410369873, 2.5753517150878906, 2.669928789138794, 2.7645058631896973, 2.8590829372406006, 2.953660011291504, 3.0482373237609863, 3.1428143978118896]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 3.0, 8.0, 8.0, 10.0, 9.0, 13.0, 21.0, 25.0, 22.0, 18.0, 28.0, 34.0, 29.0, 37.0, 36.0, 30.0, 45.0, 43.0, 36.0, 48.0, 42.0, 43.0, 49.0, 37.0, 37.0, 32.0, 43.0, 37.0, 24.0, 20.0, 21.0, 20.0, 17.0, 10.0, 8.0, 8.0, 5.0, 9.0, 4.0, 14.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-2.24587345123291, -2.182187795639038, -2.118502140045166, -2.054816484451294, -1.9911308288574219, -1.9274451732635498, -1.8637595176696777, -1.8000738620758057, -1.7363882064819336, -1.6727025508880615, -1.6090168952941895, -1.5453312397003174, -1.4816455841064453, -1.4179599285125732, -1.3542742729187012, -1.290588617324829, -1.2269030809402466, -1.1632174253463745, -1.0995317697525024, -1.0358461141586304, -0.9721604585647583, -0.9084748029708862, -0.8447892069816589, -0.7811035513877869, -0.7174178957939148, -0.6537322402000427, -0.5900465846061707, -0.5263609886169434, -0.4626753032207489, -0.39898964762687683, -0.33530402183532715, -0.2716183662414551, -0.207932710647583, -0.14424705505371094, -0.08056141436100006, -0.016875773668289185, 0.046809881925582886, 0.11049553751945496, 0.17418116331100464, 0.2378668189048767, 0.3015524744987488, 0.36523813009262085, 0.4289237856864929, 0.4926094114780426, 0.5562950372695923, 0.6199806928634644, 0.6836663484573364, 0.7473520040512085, 0.8110376596450806, 0.8747233152389526, 0.9384089708328247, 1.0020946264266968, 1.0657802820205688, 1.129465937614441, 1.1931514739990234, 1.2568371295928955, 1.3205227851867676, 1.3842084407806396, 1.4478940963745117, 1.5115797519683838, 1.5752654075622559, 1.638951063156128, 1.70263671875, 1.766322374343872, 1.8300080299377441]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 9.0, 15.0, 16.0, 44.0, 67.0, 136.0, 326.0, 849.0, 3269.0, 25192.0, 4104669.0, 52720.0, 5026.0, 1193.0, 430.0, 158.0, 73.0, 39.0, 21.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.369384765625, -0.3617868423461914, -0.3541889190673828, -0.3465909957885742, -0.3389930725097656, -0.33139514923095703, -0.32379722595214844, -0.31619930267333984, -0.30860137939453125, -0.30100345611572266, -0.29340553283691406, -0.28580760955810547, -0.2782096862792969, -0.2706117630004883, -0.2630138397216797, -0.2554159164428711, -0.2478179931640625, -0.2402200698852539, -0.2326221466064453, -0.22502422332763672, -0.21742630004882812, -0.20982837677001953, -0.20223045349121094, -0.19463253021240234, -0.18703460693359375, -0.17943668365478516, -0.17183876037597656, -0.16424083709716797, -0.15664291381835938, -0.14904499053955078, -0.1414470672607422, -0.1338491439819336, -0.126251220703125, -0.1186532974243164, -0.11105537414550781, -0.10345745086669922, -0.09585952758789062, -0.08826160430908203, -0.08066368103027344, -0.07306575775146484, -0.06546783447265625, -0.057869911193847656, -0.05027198791503906, -0.04267406463623047, -0.035076141357421875, -0.02747821807861328, -0.019880294799804688, -0.012282371520996094, -0.0046844482421875, 0.0029134750366210938, 0.010511398315429688, 0.01810932159423828, 0.025707244873046875, 0.03330516815185547, 0.04090309143066406, 0.048501014709472656, 0.05609893798828125, 0.06369686126708984, 0.07129478454589844, 0.07889270782470703, 0.08649063110351562, 0.09408855438232422, 0.10168647766113281, 0.1092844009399414, 0.11688232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 8.0, 13.0, 22.0, 30.0, 32.0, 42.0, 43.0, 58.0, 54.0, 81.0, 57.0, 61.0, 67.0, 54.0, 66.0, 60.0, 47.0, 42.0, 29.0, 28.0, 20.0, 14.0, 9.0, 10.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16599273681640625, -0.1612091064453125, -0.15642547607421875, -0.151641845703125, -0.14685821533203125, -0.1420745849609375, -0.13729095458984375, -0.13250732421875, -0.12772369384765625, -0.1229400634765625, -0.11815643310546875, -0.113372802734375, -0.10858917236328125, -0.1038055419921875, -0.09902191162109375, -0.09423828125, -0.08945465087890625, -0.0846710205078125, -0.07988739013671875, -0.075103759765625, -0.07032012939453125, -0.0655364990234375, -0.06075286865234375, -0.05596923828125, -0.05118560791015625, -0.0464019775390625, -0.04161834716796875, -0.036834716796875, -0.03205108642578125, -0.0272674560546875, -0.02248382568359375, -0.0177001953125, -0.01291656494140625, -0.0081329345703125, -0.00334930419921875, 0.001434326171875, 0.00621795654296875, 0.0110015869140625, 0.01578521728515625, 0.02056884765625, 0.02535247802734375, 0.0301361083984375, 0.03491973876953125, 0.039703369140625, 0.04448699951171875, 0.0492706298828125, 0.05405426025390625, 0.058837890625, 0.06362152099609375, 0.0684051513671875, 0.07318878173828125, 0.077972412109375, 0.08275604248046875, 0.0875396728515625, 0.09232330322265625, 0.09710693359375, 0.10189056396484375, 0.1066741943359375, 0.11145782470703125, 0.116241455078125, 0.12102508544921875, 0.1258087158203125, 0.13059234619140625, 0.1353759765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 5.0, 10.0, 11.0, 9.0, 13.0, 20.0, 20.0, 25.0, 27.0, 32.0, 47.0, 63.0, 72.0, 74.0, 112.0, 164.0, 232.0, 428.0, 757.0, 1518.0, 3409.0, 12734.0, 237903.0, 3903507.0, 24090.0, 4767.0, 1781.0, 900.0, 506.0, 267.0, 174.0, 111.0, 88.0, 89.0, 57.0, 63.0, 33.0, 29.0, 24.0, 34.0, 12.0, 15.0, 8.0, 12.0, 7.0, 6.0, 9.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1446533203125, -0.1402912139892578, -0.13592910766601562, -0.13156700134277344, -0.12720489501953125, -0.12284278869628906, -0.11848068237304688, -0.11411857604980469, -0.1097564697265625, -0.10539436340332031, -0.10103225708007812, -0.09667015075683594, -0.09230804443359375, -0.08794593811035156, -0.08358383178710938, -0.07922172546386719, -0.074859619140625, -0.07049751281738281, -0.06613540649414062, -0.06177330017089844, -0.05741119384765625, -0.05304908752441406, -0.048686981201171875, -0.04432487487792969, -0.0399627685546875, -0.03560066223144531, -0.031238555908203125, -0.026876449584960938, -0.02251434326171875, -0.018152236938476562, -0.013790130615234375, -0.009428024291992188, -0.00506591796875, -0.0007038116455078125, 0.003658294677734375, 0.008020401000976562, 0.01238250732421875, 0.016744613647460938, 0.021106719970703125, 0.025468826293945312, 0.0298309326171875, 0.03419303894042969, 0.038555145263671875, 0.04291725158691406, 0.04727935791015625, 0.05164146423339844, 0.056003570556640625, 0.06036567687988281, 0.064727783203125, 0.06908988952636719, 0.07345199584960938, 0.07781410217285156, 0.08217620849609375, 0.08653831481933594, 0.09090042114257812, 0.09526252746582031, 0.0996246337890625, 0.10398674011230469, 0.10834884643554688, 0.11271095275878906, 0.11707305908203125, 0.12143516540527344, 0.12579727172851562, 0.1301593780517578, 0.134521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 19.0, 26.0, 64.0, 217.0, 3328.0, 280.0, 70.0, 22.0, 15.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142974853515625, -0.013062238693237305, -0.01182699203491211, -0.010591745376586914, -0.009356498718261719, -0.008121252059936523, -0.006886005401611328, -0.005650758743286133, -0.0044155120849609375, -0.003180265426635742, -0.0019450187683105469, -0.0007097721099853516, 0.0005254745483398438, 0.001760721206665039, 0.0029959678649902344, 0.00423121452331543, 0.005466461181640625, 0.00670170783996582, 0.007936954498291016, 0.009172201156616211, 0.010407447814941406, 0.011642694473266602, 0.012877941131591797, 0.014113187789916992, 0.015348434448242188, 0.016583681106567383, 0.017818927764892578, 0.019054174423217773, 0.02028942108154297, 0.021524667739868164, 0.02275991439819336, 0.023995161056518555, 0.02523040771484375, 0.026465654373168945, 0.02770090103149414, 0.028936147689819336, 0.03017139434814453, 0.03140664100646973, 0.03264188766479492, 0.03387713432312012, 0.03511238098144531, 0.03634762763977051, 0.0375828742980957, 0.0388181209564209, 0.040053367614746094, 0.04128861427307129, 0.042523860931396484, 0.04375910758972168, 0.044994354248046875, 0.04622960090637207, 0.047464847564697266, 0.04870009422302246, 0.049935340881347656, 0.05117058753967285, 0.05240583419799805, 0.05364108085632324, 0.05487632751464844, 0.05611157417297363, 0.05734682083129883, 0.05858206748962402, 0.05981731414794922, 0.061052560806274414, 0.06228780746459961, 0.0635230541229248, 0.06475830078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 11.0, 9.0, 18.0, 27.0, 46.0, 52.0, 72.0, 93.0, 125.0, 111.0, 109.0, 83.0, 60.0, 48.0, 40.0, 23.0, 22.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1159844696521759, -0.11311082541942596, -0.11023718863725662, -0.10736354440450668, -0.10448990017175674, -0.1016162633895874, -0.09874261915683746, -0.09586897492408752, -0.09299533069133759, -0.09012168645858765, -0.0872480496764183, -0.08437440544366837, -0.08150076121091843, -0.07862712442874908, -0.07575348019599915, -0.0728798359632492, -0.07000619918107986, -0.06713255494832993, -0.06425891816616058, -0.061385273933410645, -0.058511629700660706, -0.055637989193201065, -0.052764348685741425, -0.049890704452991486, -0.047017063945531845, -0.044143423438072205, -0.041269779205322266, -0.038396138697862625, -0.035522498190402985, -0.032648853957653046, -0.029775213450193405, -0.026901571080088615, -0.024027928709983826, -0.021154286339879036, -0.018280643969774246, -0.015407003462314606, -0.012533361092209816, -0.009659718722105026, -0.006786078214645386, -0.003912435844540596, -0.0010387934744358063, 0.0018348484300076962, 0.004708490334451199, 0.007582131773233414, 0.010455774143338203, 0.013329416513442993, 0.016203057020902634, 0.019076699391007423, 0.021950341761112213, 0.024823984131217003, 0.027697626501321793, 0.030571267008781433, 0.03344491124153137, 0.03631855174899101, 0.03919219225645065, 0.04206583648920059, 0.04493947699666023, 0.04781311750411987, 0.05068676173686981, 0.05356040224432945, 0.05643404275178909, 0.05930768698453903, 0.06218132749199867, 0.06505496799945831, 0.06792861223220825]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 8.0, 8.0, 11.0, 13.0, 11.0, 20.0, 25.0, 32.0, 23.0, 41.0, 29.0, 35.0, 42.0, 42.0, 56.0, 45.0, 40.0, 46.0, 43.0, 49.0, 51.0, 36.0, 38.0, 33.0, 39.0, 26.0, 31.0, 18.0, 16.0, 15.0, 17.0, 20.0, 9.0, 14.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051313161849975586, -0.04919978976249695, -0.04708641767501831, -0.04497304558753967, -0.042859673500061035, -0.0407463014125824, -0.03863292932510376, -0.03651955723762512, -0.034406185150146484, -0.03229281306266785, -0.03017944097518921, -0.02806606888771057, -0.025952696800231934, -0.023839324712753296, -0.021725952625274658, -0.01961258053779602, -0.017499208450317383, -0.015385836362838745, -0.013272464275360107, -0.01115909218788147, -0.009045720100402832, -0.006932348012924194, -0.004818975925445557, -0.002705603837966919, -0.0005922317504882812, 0.0015211403369903564, 0.003634512424468994, 0.005747884511947632, 0.00786125659942627, 0.009974628686904907, 0.012088000774383545, 0.014201372861862183, 0.01631474494934082, 0.018428117036819458, 0.020541489124298096, 0.022654861211776733, 0.02476823329925537, 0.02688160538673401, 0.028994977474212646, 0.031108349561691284, 0.03322172164916992, 0.03533509373664856, 0.0374484658241272, 0.039561837911605835, 0.04167520999908447, 0.04378858208656311, 0.04590195417404175, 0.048015326261520386, 0.05012869834899902, 0.05224207043647766, 0.0543554425239563, 0.056468814611434937, 0.058582186698913574, 0.06069555878639221, 0.06280893087387085, 0.06492230296134949, 0.06703567504882812, 0.06914904713630676, 0.0712624192237854, 0.07337579131126404, 0.07548916339874268, 0.07760253548622131, 0.07971590757369995, 0.08182927966117859, 0.08394265174865723]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 15.0, 19.0, 21.0, 39.0, 70.0, 116.0, 146.0, 235.0, 427.0, 701.0, 1036.0, 1805.0, 3175.0, 6019.0, 11615.0, 26116.0, 73467.0, 271665.0, 441072.0, 133863.0, 41493.0, 17117.0, 8044.0, 4295.0, 2452.0, 1424.0, 771.0, 483.0, 296.0, 184.0, 130.0, 76.0, 51.0, 36.0, 27.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15576171875, -0.15077590942382812, -0.14579010009765625, -0.14080429077148438, -0.1358184814453125, -0.13083267211914062, -0.12584686279296875, -0.12086105346679688, -0.115875244140625, -0.11088943481445312, -0.10590362548828125, -0.10091781616210938, -0.0959320068359375, -0.09094619750976562, -0.08596038818359375, -0.08097457885742188, -0.07598876953125, -0.07100296020507812, -0.06601715087890625, -0.061031341552734375, -0.0560455322265625, -0.051059722900390625, -0.04607391357421875, -0.041088104248046875, -0.036102294921875, -0.031116485595703125, -0.02613067626953125, -0.021144866943359375, -0.0161590576171875, -0.011173248291015625, -0.00618743896484375, -0.001201629638671875, 0.0037841796875, 0.008769989013671875, 0.01375579833984375, 0.018741607666015625, 0.0237274169921875, 0.028713226318359375, 0.03369903564453125, 0.038684844970703125, 0.043670654296875, 0.048656463623046875, 0.05364227294921875, 0.058628082275390625, 0.0636138916015625, 0.06859970092773438, 0.07358551025390625, 0.07857131958007812, 0.08355712890625, 0.08854293823242188, 0.09352874755859375, 0.09851455688476562, 0.1035003662109375, 0.10848617553710938, 0.11347198486328125, 0.11845779418945312, 0.123443603515625, 0.12842941284179688, 0.13341522216796875, 0.13840103149414062, 0.1433868408203125, 0.14837265014648438, 0.15335845947265625, 0.15834426879882812, 0.163330078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 8.0, 7.0, 9.0, 13.0, 19.0, 25.0, 32.0, 29.0, 51.0, 57.0, 62.0, 54.0, 65.0, 75.0, 57.0, 69.0, 58.0, 66.0, 45.0, 41.0, 38.0, 23.0, 22.0, 18.0, 10.0, 15.0, 6.0, 9.0, 3.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.167724609375, -0.1629486083984375, -0.158172607421875, -0.1533966064453125, -0.14862060546875, -0.1438446044921875, -0.139068603515625, -0.1342926025390625, -0.1295166015625, -0.1247406005859375, -0.119964599609375, -0.1151885986328125, -0.11041259765625, -0.1056365966796875, -0.100860595703125, -0.0960845947265625, -0.09130859375, -0.0865325927734375, -0.081756591796875, -0.0769805908203125, -0.07220458984375, -0.0674285888671875, -0.062652587890625, -0.0578765869140625, -0.0531005859375, -0.0483245849609375, -0.043548583984375, -0.0387725830078125, -0.03399658203125, -0.0292205810546875, -0.024444580078125, -0.0196685791015625, -0.014892578125, -0.0101165771484375, -0.005340576171875, -0.0005645751953125, 0.00421142578125, 0.0089874267578125, 0.013763427734375, 0.0185394287109375, 0.0233154296875, 0.0280914306640625, 0.032867431640625, 0.0376434326171875, 0.04241943359375, 0.0471954345703125, 0.051971435546875, 0.0567474365234375, 0.0615234375, 0.0662994384765625, 0.071075439453125, 0.0758514404296875, 0.08062744140625, 0.0854034423828125, 0.090179443359375, 0.0949554443359375, 0.0997314453125, 0.1045074462890625, 0.109283447265625, 0.1140594482421875, 0.11883544921875, 0.1236114501953125, 0.128387451171875, 0.1331634521484375, 0.137939453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 7.0, 16.0, 14.0, 24.0, 23.0, 40.0, 43.0, 41.0, 91.0, 134.0, 200.0, 347.0, 845.0, 3411.0, 22778.0, 418962.0, 567610.0, 27995.0, 3931.0, 973.0, 405.0, 215.0, 124.0, 79.0, 52.0, 53.0, 32.0, 17.0, 8.0, 18.0, 9.0, 5.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3359222412109375, -0.323944091796875, -0.3119659423828125, -0.29998779296875, -0.2880096435546875, -0.276031494140625, -0.2640533447265625, -0.2520751953125, -0.2400970458984375, -0.228118896484375, -0.2161407470703125, -0.20416259765625, -0.1921844482421875, -0.180206298828125, -0.1682281494140625, -0.15625, -0.1442718505859375, -0.132293701171875, -0.1203155517578125, -0.10833740234375, -0.0963592529296875, -0.084381103515625, -0.0724029541015625, -0.0604248046875, -0.0484466552734375, -0.036468505859375, -0.0244903564453125, -0.01251220703125, -0.0005340576171875, 0.011444091796875, 0.0234222412109375, 0.035400390625, 0.0473785400390625, 0.059356689453125, 0.0713348388671875, 0.08331298828125, 0.0952911376953125, 0.107269287109375, 0.1192474365234375, 0.1312255859375, 0.1432037353515625, 0.155181884765625, 0.1671600341796875, 0.17913818359375, 0.1911163330078125, 0.203094482421875, 0.2150726318359375, 0.22705078125, 0.2390289306640625, 0.251007080078125, 0.2629852294921875, 0.27496337890625, 0.2869415283203125, 0.298919677734375, 0.3108978271484375, 0.3228759765625, 0.3348541259765625, 0.346832275390625, 0.3588104248046875, 0.37078857421875, 0.3827667236328125, 0.394744873046875, 0.4067230224609375, 0.418701171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 0.0, 7.0, 5.0, 7.0, 8.0, 16.0, 16.0, 19.0, 28.0, 18.0, 24.0, 31.0, 28.0, 29.0, 31.0, 31.0, 47.0, 47.0, 52.0, 43.0, 42.0, 41.0, 40.0, 42.0, 32.0, 49.0, 28.0, 33.0, 38.0, 24.0, 21.0, 18.0, 18.0, 18.0, 13.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.457763671875, -0.4443778991699219, -0.43099212646484375, -0.4176063537597656, -0.4042205810546875, -0.3908348083496094, -0.37744903564453125, -0.3640632629394531, -0.350677490234375, -0.3372917175292969, -0.32390594482421875, -0.3105201721191406, -0.2971343994140625, -0.2837486267089844, -0.27036285400390625, -0.2569770812988281, -0.24359130859375, -0.23020553588867188, -0.21681976318359375, -0.20343399047851562, -0.1900482177734375, -0.17666244506835938, -0.16327667236328125, -0.14989089965820312, -0.136505126953125, -0.12311935424804688, -0.10973358154296875, -0.09634780883789062, -0.0829620361328125, -0.06957626342773438, -0.05619049072265625, -0.042804718017578125, -0.0294189453125, -0.016033172607421875, -0.00264739990234375, 0.010738372802734375, 0.0241241455078125, 0.037509918212890625, 0.05089569091796875, 0.06428146362304688, 0.077667236328125, 0.09105300903320312, 0.10443878173828125, 0.11782455444335938, 0.1312103271484375, 0.14459609985351562, 0.15798187255859375, 0.17136764526367188, 0.18475341796875, 0.19813919067382812, 0.21152496337890625, 0.22491073608398438, 0.2382965087890625, 0.2516822814941406, 0.26506805419921875, 0.2784538269042969, 0.291839599609375, 0.3052253723144531, 0.31861114501953125, 0.3319969177246094, 0.3453826904296875, 0.3587684631347656, 0.37215423583984375, 0.3855400085449219, 0.39892578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 9.0, 17.0, 22.0, 36.0, 75.0, 140.0, 349.0, 927.0, 5780.0, 851982.0, 184420.0, 3506.0, 747.0, 238.0, 145.0, 68.0, 30.0, 25.0, 14.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51318359375, -0.5009346008300781, -0.48868560791015625, -0.4764366149902344, -0.4641876220703125, -0.4519386291503906, -0.43968963623046875, -0.4274406433105469, -0.415191650390625, -0.4029426574707031, -0.39069366455078125, -0.3784446716308594, -0.3661956787109375, -0.3539466857910156, -0.34169769287109375, -0.3294486999511719, -0.31719970703125, -0.3049507141113281, -0.29270172119140625, -0.2804527282714844, -0.2682037353515625, -0.2559547424316406, -0.24370574951171875, -0.23145675659179688, -0.219207763671875, -0.20695877075195312, -0.19470977783203125, -0.18246078491210938, -0.1702117919921875, -0.15796279907226562, -0.14571380615234375, -0.13346481323242188, -0.1212158203125, -0.10896682739257812, -0.09671783447265625, -0.08446884155273438, -0.0722198486328125, -0.059970855712890625, -0.04772186279296875, -0.035472869873046875, -0.023223876953125, -0.010974884033203125, 0.00127410888671875, 0.013523101806640625, 0.0257720947265625, 0.038021087646484375, 0.05027008056640625, 0.06251907348632812, 0.07476806640625, 0.08701705932617188, 0.09926605224609375, 0.11151504516601562, 0.1237640380859375, 0.13601303100585938, 0.14826202392578125, 0.16051101684570312, 0.172760009765625, 0.18500900268554688, 0.19725799560546875, 0.20950698852539062, 0.2217559814453125, 0.23400497436523438, 0.24625396728515625, 0.2585029602050781, 0.270751953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 5.0, 10.0, 4.0, 8.0, 13.0, 12.0, 17.0, 22.0, 31.0, 36.0, 42.0, 61.0, 80.0, 86.0, 85.0, 85.0, 64.0, 66.0, 48.0, 43.0, 47.0, 29.0, 21.0, 24.0, 21.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.309415817260742e-05, -4.1472725570201874e-05, -3.9851292967796326e-05, -3.822986036539078e-05, -3.660842776298523e-05, -3.498699516057968e-05, -3.336556255817413e-05, -3.1744129955768585e-05, -3.0122697353363037e-05, -2.850126475095749e-05, -2.687983214855194e-05, -2.5258399546146393e-05, -2.3636966943740845e-05, -2.2015534341335297e-05, -2.039410173892975e-05, -1.87726691365242e-05, -1.7151236534118652e-05, -1.5529803931713104e-05, -1.3908371329307556e-05, -1.2286938726902008e-05, -1.066550612449646e-05, -9.044073522090912e-06, -7.422640919685364e-06, -5.801208317279816e-06, -4.179775714874268e-06, -2.5583431124687195e-06, -9.369105100631714e-07, 6.845220923423767e-07, 2.305954694747925e-06, 3.927387297153473e-06, 5.548819899559021e-06, 7.170252501964569e-06, 8.791685104370117e-06, 1.0413117706775665e-05, 1.2034550309181213e-05, 1.3655982911586761e-05, 1.527741551399231e-05, 1.6898848116397858e-05, 1.8520280718803406e-05, 2.0141713321208954e-05, 2.1763145923614502e-05, 2.338457852602005e-05, 2.5006011128425598e-05, 2.6627443730831146e-05, 2.8248876333236694e-05, 2.9870308935642242e-05, 3.149174153804779e-05, 3.311317414045334e-05, 3.473460674285889e-05, 3.6356039345264435e-05, 3.797747194766998e-05, 3.959890455007553e-05, 4.122033715248108e-05, 4.284176975488663e-05, 4.4463202357292175e-05, 4.6084634959697723e-05, 4.770606756210327e-05, 4.932750016450882e-05, 5.094893276691437e-05, 5.2570365369319916e-05, 5.4191797971725464e-05, 5.581323057413101e-05, 5.743466317653656e-05, 5.905609577894211e-05, 6.0677528381347656e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 15.0, 23.0, 57.0, 90.0, 173.0, 471.0, 2241.0, 22833.0, 957955.0, 59986.0, 3587.0, 683.0, 209.0, 89.0, 49.0, 29.0, 19.0, 10.0, 4.0, 10.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2256908416748047, -0.21688461303710938, -0.20807838439941406, -0.19927215576171875, -0.19046592712402344, -0.18165969848632812, -0.1728534698486328, -0.1640472412109375, -0.1552410125732422, -0.14643478393554688, -0.13762855529785156, -0.12882232666015625, -0.12001609802246094, -0.11120986938476562, -0.10240364074707031, -0.093597412109375, -0.08479118347167969, -0.07598495483398438, -0.06717872619628906, -0.05837249755859375, -0.04956626892089844, -0.040760040283203125, -0.03195381164550781, -0.0231475830078125, -0.014341354370117188, -0.005535125732421875, 0.0032711029052734375, 0.01207733154296875, 0.020883560180664062, 0.029689788818359375, 0.03849601745605469, 0.04730224609375, 0.05610847473144531, 0.06491470336914062, 0.07372093200683594, 0.08252716064453125, 0.09133338928222656, 0.10013961791992188, 0.10894584655761719, 0.1177520751953125, 0.1265583038330078, 0.13536453247070312, 0.14417076110839844, 0.15297698974609375, 0.16178321838378906, 0.17058944702148438, 0.1793956756591797, 0.188201904296875, 0.1970081329345703, 0.20581436157226562, 0.21462059020996094, 0.22342681884765625, 0.23223304748535156, 0.24103927612304688, 0.2498455047607422, 0.2586517333984375, 0.2674579620361328, 0.2762641906738281, 0.28507041931152344, 0.29387664794921875, 0.30268287658691406, 0.3114891052246094, 0.3202953338623047, 0.3291015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 10.0, 9.0, 9.0, 16.0, 34.0, 52.0, 98.0, 219.0, 255.0, 147.0, 64.0, 25.0, 15.0, 19.0, 14.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286376953125, -0.2774620056152344, -0.26854705810546875, -0.2596321105957031, -0.2507171630859375, -0.24180221557617188, -0.23288726806640625, -0.22397232055664062, -0.215057373046875, -0.20614242553710938, -0.19722747802734375, -0.18831253051757812, -0.1793975830078125, -0.17048263549804688, -0.16156768798828125, -0.15265274047851562, -0.14373779296875, -0.13482284545898438, -0.12590789794921875, -0.11699295043945312, -0.1080780029296875, -0.09916305541992188, -0.09024810791015625, -0.08133316040039062, -0.072418212890625, -0.06350326538085938, -0.05458831787109375, -0.045673370361328125, -0.0367584228515625, -0.027843475341796875, -0.01892852783203125, -0.010013580322265625, -0.0010986328125, 0.007816314697265625, 0.01673126220703125, 0.025646209716796875, 0.0345611572265625, 0.043476104736328125, 0.05239105224609375, 0.061305999755859375, 0.070220947265625, 0.07913589477539062, 0.08805084228515625, 0.09696578979492188, 0.1058807373046875, 0.11479568481445312, 0.12371063232421875, 0.13262557983398438, 0.14154052734375, 0.15045547485351562, 0.15937042236328125, 0.16828536987304688, 0.1772003173828125, 0.18611526489257812, 0.19503021240234375, 0.20394515991210938, 0.212860107421875, 0.22177505493164062, 0.23069000244140625, 0.23960494995117188, 0.2485198974609375, 0.2574348449707031, 0.26634979248046875, 0.2752647399902344, 0.2841796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 34.0, 149.0, 380.0, 290.0, 99.0, 36.0, 11.0, 3.0, 1.0, 2.0, 3.0], "bins": [-9.787286758422852, -9.611881256103516, -9.43647575378418, -9.261070251464844, -9.085664749145508, -8.910259246826172, -8.734853744506836, -8.5594482421875, -8.384041786193848, -8.208636283874512, -8.033230781555176, -7.85782527923584, -7.682419300079346, -7.50701379776001, -7.331608295440674, -7.156202793121338, -6.98079776763916, -6.805392265319824, -6.629986763000488, -6.454581260681152, -6.279175281524658, -6.103769779205322, -5.928364276885986, -5.75295877456665, -5.577552795410156, -5.40214729309082, -5.226741790771484, -5.051336288452148, -4.875930309295654, -4.700524806976318, -4.525119304656982, -4.3497138023376465, -4.1743083000183105, -3.9989027976989746, -3.8234970569610596, -3.6480915546417236, -3.4726860523223877, -3.2972803115844727, -3.1218748092651367, -2.946469306945801, -2.771063804626465, -2.595658302307129, -2.420252561569214, -2.244847059249878, -2.069441556930542, -1.8940359354019165, -1.718630313873291, -1.543224811553955, -1.36781907081604, -1.1924134492874146, -1.0170079469680786, -0.8416023254394531, -0.6661967635154724, -0.4907912015914917, -0.3153855800628662, -0.13998007774353027, 0.035425543785095215, 0.21083112061023712, 0.38623669743537903, 0.5616422891616821, 0.7370478510856628, 0.9124534130096436, 1.087859034538269, 1.263264536857605, 1.4386701583862305]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 9.0, 17.0, 11.0, 9.0, 9.0, 12.0, 23.0, 18.0, 23.0, 34.0, 26.0, 39.0, 39.0, 38.0, 39.0, 34.0, 43.0, 41.0, 51.0, 50.0, 41.0, 44.0, 47.0, 32.0, 44.0, 39.0, 26.0, 25.0, 24.0, 12.0, 16.0, 15.0, 10.0, 9.0, 15.0, 6.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.28642201423645, -2.220757007598877, -2.1550920009613037, -2.0894269943237305, -2.023761749267578, -1.9580968618392944, -1.8924317359924316, -1.8267667293548584, -1.7611017227172852, -1.695436716079712, -1.6297717094421387, -1.5641065835952759, -1.4984415769577026, -1.4327765703201294, -1.3671114444732666, -1.3014464378356934, -1.2357814311981201, -1.1701164245605469, -1.1044514179229736, -1.0387862920761108, -0.9731212854385376, -0.9074562788009644, -0.8417912125587463, -0.7761261463165283, -0.7104611396789551, -0.6447961330413818, -0.5791310667991638, -0.5134660005569458, -0.44780099391937256, -0.38213595747947693, -0.3164709210395813, -0.25080588459968567, -0.18514108657836914, -0.11947605013847351, -0.05381101369857788, 0.011854022741317749, 0.07751905918121338, 0.143184095621109, 0.20884913206100464, 0.27451416850090027, 0.3401792049407959, 0.40584424138069153, 0.47150927782058716, 0.5371743440628052, 0.6028393507003784, 0.6685043573379517, 0.7341694235801697, 0.7998344898223877, 0.8654994964599609, 0.9311645030975342, 0.9968295693397522, 1.0624946355819702, 1.1281596422195435, 1.1938246488571167, 1.2594897747039795, 1.3251547813415527, 1.390819787979126, 1.4564847946166992, 1.5221498012542725, 1.5878149271011353, 1.6534799337387085, 1.7191449403762817, 1.7848100662231445, 1.8504750728607178, 1.916140079498291]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 2.0, 9.0, 13.0, 19.0, 37.0, 52.0, 78.0, 137.0, 197.0, 441.0, 940.0, 2582.0, 13675.0, 4113651.0, 55149.0, 4692.0, 1327.0, 534.0, 294.0, 164.0, 85.0, 71.0, 34.0, 27.0, 17.0, 18.0, 14.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3740234375, -0.3646068572998047, -0.3551902770996094, -0.34577369689941406, -0.33635711669921875, -0.32694053649902344, -0.3175239562988281, -0.3081073760986328, -0.2986907958984375, -0.2892742156982422, -0.2798576354980469, -0.27044105529785156, -0.26102447509765625, -0.25160789489746094, -0.24219131469726562, -0.2327747344970703, -0.223358154296875, -0.2139415740966797, -0.20452499389648438, -0.19510841369628906, -0.18569183349609375, -0.17627525329589844, -0.16685867309570312, -0.1574420928955078, -0.1480255126953125, -0.1386089324951172, -0.12919235229492188, -0.11977577209472656, -0.11035919189453125, -0.10094261169433594, -0.09152603149414062, -0.08210945129394531, -0.07269287109375, -0.06327629089355469, -0.053859710693359375, -0.04444313049316406, -0.03502655029296875, -0.025609970092773438, -0.016193389892578125, -0.0067768096923828125, 0.0026397705078125, 0.012056350708007812, 0.021472930908203125, 0.030889511108398438, 0.04030609130859375, 0.04972267150878906, 0.059139251708984375, 0.06855583190917969, 0.077972412109375, 0.08738899230957031, 0.09680557250976562, 0.10622215270996094, 0.11563873291015625, 0.12505531311035156, 0.13447189331054688, 0.1438884735107422, 0.1533050537109375, 0.1627216339111328, 0.17213821411132812, 0.18155479431152344, 0.19097137451171875, 0.20038795471191406, 0.20980453491210938, 0.2192211151123047, 0.2286376953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 5.0, 18.0, 17.0, 17.0, 26.0, 30.0, 25.0, 50.0, 46.0, 50.0, 55.0, 58.0, 66.0, 59.0, 60.0, 56.0, 61.0, 41.0, 46.0, 36.0, 26.0, 25.0, 26.0, 17.0, 12.0, 20.0, 13.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-0.1773681640625, -0.17307567596435547, -0.16878318786621094, -0.1644906997680664, -0.16019821166992188, -0.15590572357177734, -0.1516132354736328, -0.14732074737548828, -0.14302825927734375, -0.13873577117919922, -0.1344432830810547, -0.13015079498291016, -0.12585830688476562, -0.1215658187866211, -0.11727333068847656, -0.11298084259033203, -0.1086883544921875, -0.10439586639404297, -0.10010337829589844, -0.0958108901977539, -0.09151840209960938, -0.08722591400146484, -0.08293342590332031, -0.07864093780517578, -0.07434844970703125, -0.07005596160888672, -0.06576347351074219, -0.061470985412597656, -0.057178497314453125, -0.052886009216308594, -0.04859352111816406, -0.04430103302001953, -0.040008544921875, -0.03571605682373047, -0.03142356872558594, -0.027131080627441406, -0.022838592529296875, -0.018546104431152344, -0.014253616333007812, -0.009961128234863281, -0.00566864013671875, -0.0013761520385742188, 0.0029163360595703125, 0.007208824157714844, 0.011501312255859375, 0.015793800354003906, 0.020086288452148438, 0.02437877655029297, 0.0286712646484375, 0.03296375274658203, 0.03725624084472656, 0.041548728942871094, 0.045841217041015625, 0.050133705139160156, 0.05442619323730469, 0.05871868133544922, 0.06301116943359375, 0.06730365753173828, 0.07159614562988281, 0.07588863372802734, 0.08018112182617188, 0.0844736099243164, 0.08876609802246094, 0.09305858612060547, 0.09735107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 20.0, 36.0, 23.0, 45.0, 83.0, 93.0, 150.0, 229.0, 347.0, 469.0, 913.0, 1555.0, 3412.0, 10159.0, 84426.0, 4053152.0, 27178.0, 6193.0, 2456.0, 1202.0, 698.0, 439.0, 296.0, 214.0, 130.0, 83.0, 56.0, 47.0, 27.0, 15.0, 14.0, 13.0, 9.0, 8.0, 6.0, 11.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1888427734375, -0.18299484252929688, -0.17714691162109375, -0.17129898071289062, -0.1654510498046875, -0.15960311889648438, -0.15375518798828125, -0.14790725708007812, -0.142059326171875, -0.13621139526367188, -0.13036346435546875, -0.12451553344726562, -0.1186676025390625, -0.11281967163085938, -0.10697174072265625, -0.10112380981445312, -0.09527587890625, -0.08942794799804688, -0.08358001708984375, -0.07773208618164062, -0.0718841552734375, -0.06603622436523438, -0.06018829345703125, -0.054340362548828125, -0.048492431640625, -0.042644500732421875, -0.03679656982421875, -0.030948638916015625, -0.0251007080078125, -0.019252777099609375, -0.01340484619140625, -0.007556915283203125, -0.001708984375, 0.004138946533203125, 0.00998687744140625, 0.015834808349609375, 0.0216827392578125, 0.027530670166015625, 0.03337860107421875, 0.039226531982421875, 0.045074462890625, 0.050922393798828125, 0.05677032470703125, 0.06261825561523438, 0.0684661865234375, 0.07431411743164062, 0.08016204833984375, 0.08600997924804688, 0.09185791015625, 0.09770584106445312, 0.10355377197265625, 0.10940170288085938, 0.1152496337890625, 0.12109756469726562, 0.12694549560546875, 0.13279342651367188, 0.138641357421875, 0.14448928833007812, 0.15033721923828125, 0.15618515014648438, 0.1620330810546875, 0.16788101196289062, 0.17372894287109375, 0.17957687377929688, 0.1854248046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 18.0, 65.0, 606.0, 3237.0, 70.0, 23.0, 15.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.067474365234375, -0.06549072265625, -0.063507080078125, -0.0615234375, -0.059539794921875, -0.05755615234375, -0.055572509765625, -0.0535888671875, -0.051605224609375, -0.04962158203125, -0.047637939453125, -0.045654296875, -0.043670654296875, -0.04168701171875, -0.039703369140625, -0.0377197265625, -0.035736083984375, -0.03375244140625, -0.031768798828125, -0.02978515625, -0.027801513671875, -0.02581787109375, -0.023834228515625, -0.0218505859375, -0.019866943359375, -0.01788330078125, -0.015899658203125, -0.013916015625, -0.011932373046875, -0.00994873046875, -0.007965087890625, -0.0059814453125, -0.003997802734375, -0.00201416015625, -3.0517578125e-05, 0.001953125, 0.003936767578125, 0.00592041015625, 0.007904052734375, 0.0098876953125, 0.011871337890625, 0.01385498046875, 0.015838623046875, 0.017822265625, 0.019805908203125, 0.02178955078125, 0.023773193359375, 0.0257568359375, 0.027740478515625, 0.02972412109375, 0.031707763671875, 0.03369140625, 0.035675048828125, 0.03765869140625, 0.039642333984375, 0.0416259765625, 0.043609619140625, 0.04559326171875, 0.047576904296875, 0.049560546875, 0.051544189453125, 0.05352783203125, 0.055511474609375, 0.0574951171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 26.0, 53.0, 121.0, 204.0, 272.0, 154.0, 89.0, 39.0, 17.0, 7.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2907010018825531, -0.28236693143844604, -0.2740328907966614, -0.2656988203525543, -0.25736477971076965, -0.2490307092666626, -0.24069665372371674, -0.23236259818077087, -0.22402852773666382, -0.21569447219371796, -0.2073604166507721, -0.19902634620666504, -0.19069229066371918, -0.18235823512077332, -0.17402417957782745, -0.1656901240348816, -0.15735606849193573, -0.14902201294898987, -0.140687957406044, -0.13235390186309814, -0.12401983141899109, -0.11568577587604523, -0.10735172033309937, -0.0990176647901535, -0.09068360179662704, -0.08234954625368118, -0.07401548326015472, -0.06568142771720886, -0.0573473684489727, -0.04901330918073654, -0.04067925363779068, -0.03234519436955452, -0.02401113510131836, -0.0156770758330822, -0.007343018427491188, 0.000991038978099823, 0.009325098246335983, 0.017659157514572144, 0.025993213057518005, 0.034327272325754166, 0.042661331593990326, 0.050995390862226486, 0.059329450130462646, 0.06766350567340851, 0.07599756121635437, 0.08433162420988083, 0.09266567975282669, 0.10099974274635315, 0.10933379828929901, 0.11766785383224487, 0.12600190937519073, 0.1343359649181366, 0.14267003536224365, 0.15100409090518951, 0.15933814644813538, 0.16767220199108124, 0.1760062575340271, 0.18434031307697296, 0.19267436861991882, 0.20100843906402588, 0.20934249460697174, 0.2176765501499176, 0.22601060569286346, 0.23434466123580933, 0.24267873167991638]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 15.0, 9.0, 10.0, 15.0, 19.0, 19.0, 21.0, 32.0, 24.0, 31.0, 37.0, 24.0, 27.0, 41.0, 44.0, 52.0, 36.0, 44.0, 43.0, 31.0, 31.0, 31.0, 36.0, 39.0, 34.0, 46.0, 27.0, 27.0, 17.0, 26.0, 14.0, 21.0, 9.0, 7.0, 11.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07930302619934082, -0.07681325823068619, -0.07432348281145096, -0.07183371484279633, -0.0693439394235611, -0.06685417145490646, -0.06436440348625183, -0.0618746317923069, -0.05938486009836197, -0.05689508840441704, -0.05440531671047211, -0.051915548741817474, -0.04942577704787254, -0.04693600535392761, -0.04444623738527298, -0.04195646569132805, -0.03946669399738312, -0.03697692230343819, -0.034487150609493256, -0.03199738264083862, -0.029507610946893692, -0.02701783925294876, -0.02452806942164898, -0.022038299590349197, -0.019548527896404266, -0.017058756202459335, -0.014568986371159554, -0.012079215608537197, -0.00958944484591484, -0.007099674083292484, -0.004609903320670128, -0.002120133489370346, 0.00036963820457458496, 0.0028594089671969414, 0.005349179729819298, 0.007838950492441654, 0.01032872125506401, 0.012818492017686367, 0.015308262780308723, 0.017798032611608505, 0.020287804305553436, 0.022777575999498367, 0.02526734583079815, 0.02775711566209793, 0.030246887356042862, 0.03273665904998779, 0.035226427018642426, 0.03771619871258736, 0.04020597040653229, 0.04269574210047722, 0.04518551379442215, 0.04767528176307678, 0.05016505345702171, 0.052654825150966644, 0.05514459311962128, 0.05763436481356621, 0.06012413650751114, 0.06261390447616577, 0.065103679895401, 0.06759344786405563, 0.07008321583271027, 0.0725729912519455, 0.07506275922060013, 0.07755252718925476, 0.08004230260848999]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 7.0, 16.0, 42.0, 35.0, 64.0, 91.0, 177.0, 271.0, 575.0, 1046.0, 2191.0, 4829.0, 12037.0, 32383.0, 96335.0, 294787.0, 380861.0, 146169.0, 47390.0, 16841.0, 6649.0, 2822.0, 1337.0, 688.0, 357.0, 215.0, 109.0, 73.0, 49.0, 28.0, 24.0, 15.0, 8.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11279296875, -0.10848426818847656, -0.10417556762695312, -0.09986686706542969, -0.09555816650390625, -0.09124946594238281, -0.08694076538085938, -0.08263206481933594, -0.0783233642578125, -0.07401466369628906, -0.06970596313476562, -0.06539726257324219, -0.06108856201171875, -0.05677986145019531, -0.052471160888671875, -0.04816246032714844, -0.043853759765625, -0.03954505920410156, -0.035236358642578125, -0.030927658081054688, -0.02661895751953125, -0.022310256958007812, -0.018001556396484375, -0.013692855834960938, -0.0093841552734375, -0.0050754547119140625, -0.000766754150390625, 0.0035419464111328125, 0.00785064697265625, 0.012159347534179688, 0.016468048095703125, 0.020776748657226562, 0.02508544921875, 0.029394149780273438, 0.033702850341796875, 0.03801155090332031, 0.04232025146484375, 0.04662895202636719, 0.050937652587890625, 0.05524635314941406, 0.0595550537109375, 0.06386375427246094, 0.06817245483398438, 0.07248115539550781, 0.07678985595703125, 0.08109855651855469, 0.08540725708007812, 0.08971595764160156, 0.094024658203125, 0.09833335876464844, 0.10264205932617188, 0.10695075988769531, 0.11125946044921875, 0.11556816101074219, 0.11987686157226562, 0.12418556213378906, 0.1284942626953125, 0.13280296325683594, 0.13711166381835938, 0.1414203643798828, 0.14572906494140625, 0.1500377655029297, 0.15434646606445312, 0.15865516662597656, 0.1629638671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 8.0, 10.0, 16.0, 14.0, 20.0, 25.0, 33.0, 32.0, 41.0, 46.0, 59.0, 64.0, 54.0, 75.0, 50.0, 62.0, 57.0, 56.0, 44.0, 38.0, 28.0, 32.0, 24.0, 23.0, 15.0, 20.0, 10.0, 14.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-0.17822265625, -0.17386817932128906, -0.16951370239257812, -0.1651592254638672, -0.16080474853515625, -0.1564502716064453, -0.15209579467773438, -0.14774131774902344, -0.1433868408203125, -0.13903236389160156, -0.13467788696289062, -0.1303234100341797, -0.12596893310546875, -0.12161445617675781, -0.11725997924804688, -0.11290550231933594, -0.108551025390625, -0.10419654846191406, -0.09984207153320312, -0.09548759460449219, -0.09113311767578125, -0.08677864074707031, -0.08242416381835938, -0.07806968688964844, -0.0737152099609375, -0.06936073303222656, -0.06500625610351562, -0.06065177917480469, -0.05629730224609375, -0.05194282531738281, -0.047588348388671875, -0.04323387145996094, -0.03887939453125, -0.03452491760253906, -0.030170440673828125, -0.025815963745117188, -0.02146148681640625, -0.017107009887695312, -0.012752532958984375, -0.008398056030273438, -0.0040435791015625, 0.0003108978271484375, 0.004665374755859375, 0.009019851684570312, 0.01337432861328125, 0.017728805541992188, 0.022083282470703125, 0.026437759399414062, 0.030792236328125, 0.03514671325683594, 0.039501190185546875, 0.04385566711425781, 0.04821014404296875, 0.05256462097167969, 0.056919097900390625, 0.06127357482910156, 0.0656280517578125, 0.06998252868652344, 0.07433700561523438, 0.07869148254394531, 0.08304595947265625, 0.08740043640136719, 0.09175491333007812, 0.09610939025878906, 0.1004638671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 9.0, 2.0, 7.0, 11.0, 14.0, 17.0, 17.0, 25.0, 25.0, 34.0, 54.0, 54.0, 67.0, 87.0, 114.0, 152.0, 286.0, 510.0, 1051.0, 2791.0, 10139.0, 53946.0, 430242.0, 474454.0, 58168.0, 10757.0, 2897.0, 1063.0, 540.0, 295.0, 187.0, 105.0, 93.0, 66.0, 54.0, 36.0, 39.0, 39.0, 22.0, 20.0, 14.0, 16.0, 5.0, 8.0, 7.0, 11.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.25048828125, -0.24333572387695312, -0.23618316650390625, -0.22903060913085938, -0.2218780517578125, -0.21472549438476562, -0.20757293701171875, -0.20042037963867188, -0.193267822265625, -0.18611526489257812, -0.17896270751953125, -0.17181015014648438, -0.1646575927734375, -0.15750503540039062, -0.15035247802734375, -0.14319992065429688, -0.13604736328125, -0.12889480590820312, -0.12174224853515625, -0.11458969116210938, -0.1074371337890625, -0.10028457641601562, -0.09313201904296875, -0.08597946166992188, -0.078826904296875, -0.07167434692382812, -0.06452178955078125, -0.057369232177734375, -0.0502166748046875, -0.043064117431640625, -0.03591156005859375, -0.028759002685546875, -0.0216064453125, -0.014453887939453125, -0.00730133056640625, -0.000148773193359375, 0.0070037841796875, 0.014156341552734375, 0.02130889892578125, 0.028461456298828125, 0.035614013671875, 0.042766571044921875, 0.04991912841796875, 0.057071685791015625, 0.0642242431640625, 0.07137680053710938, 0.07852935791015625, 0.08568191528320312, 0.09283447265625, 0.09998703002929688, 0.10713958740234375, 0.11429214477539062, 0.1214447021484375, 0.12859725952148438, 0.13574981689453125, 0.14290237426757812, 0.150054931640625, 0.15720748901367188, 0.16436004638671875, 0.17151260375976562, 0.1786651611328125, 0.18581771850585938, 0.19297027587890625, 0.20012283325195312, 0.207275390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 4.0, 14.0, 12.0, 15.0, 20.0, 22.0, 22.0, 23.0, 26.0, 45.0, 33.0, 52.0, 61.0, 51.0, 55.0, 46.0, 60.0, 57.0, 38.0, 49.0, 33.0, 37.0, 28.0, 25.0, 30.0, 27.0, 17.0, 23.0, 19.0, 11.0, 13.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5621910095214844, -0.5457687377929688, -0.5293464660644531, -0.5129241943359375, -0.4965019226074219, -0.48007965087890625, -0.4636573791503906, -0.447235107421875, -0.4308128356933594, -0.41439056396484375, -0.3979682922363281, -0.3815460205078125, -0.3651237487792969, -0.34870147705078125, -0.3322792053222656, -0.31585693359375, -0.2994346618652344, -0.28301239013671875, -0.2665901184082031, -0.2501678466796875, -0.23374557495117188, -0.21732330322265625, -0.20090103149414062, -0.184478759765625, -0.16805648803710938, -0.15163421630859375, -0.13521194458007812, -0.1187896728515625, -0.10236740112304688, -0.08594512939453125, -0.06952285766601562, -0.0531005859375, -0.036678314208984375, -0.02025604248046875, -0.003833770751953125, 0.0125885009765625, 0.029010772705078125, 0.04543304443359375, 0.061855316162109375, 0.078277587890625, 0.09469985961914062, 0.11112213134765625, 0.12754440307617188, 0.1439666748046875, 0.16038894653320312, 0.17681121826171875, 0.19323348999023438, 0.20965576171875, 0.22607803344726562, 0.24250030517578125, 0.2589225769042969, 0.2753448486328125, 0.2917671203613281, 0.30818939208984375, 0.3246116638183594, 0.341033935546875, 0.3574562072753906, 0.37387847900390625, 0.3903007507324219, 0.4067230224609375, 0.4231452941894531, 0.43956756591796875, 0.4559898376464844, 0.472412109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 6.0, 8.0, 7.0, 15.0, 24.0, 34.0, 44.0, 72.0, 126.0, 267.0, 615.0, 1608.0, 6094.0, 51659.0, 887314.0, 88952.0, 8331.0, 1966.0, 729.0, 297.0, 134.0, 72.0, 54.0, 41.0, 23.0, 14.0, 12.0, 11.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1829833984375, -0.1778411865234375, -0.172698974609375, -0.1675567626953125, -0.16241455078125, -0.1572723388671875, -0.152130126953125, -0.1469879150390625, -0.141845703125, -0.1367034912109375, -0.131561279296875, -0.1264190673828125, -0.12127685546875, -0.1161346435546875, -0.110992431640625, -0.1058502197265625, -0.1007080078125, -0.0955657958984375, -0.090423583984375, -0.0852813720703125, -0.08013916015625, -0.0749969482421875, -0.069854736328125, -0.0647125244140625, -0.0595703125, -0.0544281005859375, -0.049285888671875, -0.0441436767578125, -0.03900146484375, -0.0338592529296875, -0.028717041015625, -0.0235748291015625, -0.0184326171875, -0.0132904052734375, -0.008148193359375, -0.0030059814453125, 0.00213623046875, 0.0072784423828125, 0.012420654296875, 0.0175628662109375, 0.022705078125, 0.0278472900390625, 0.032989501953125, 0.0381317138671875, 0.04327392578125, 0.0484161376953125, 0.053558349609375, 0.0587005615234375, 0.0638427734375, 0.0689849853515625, 0.074127197265625, 0.0792694091796875, 0.08441162109375, 0.0895538330078125, 0.094696044921875, 0.0998382568359375, 0.10498046875, 0.1101226806640625, 0.115264892578125, 0.1204071044921875, 0.12554931640625, 0.1306915283203125, 0.135833740234375, 0.1409759521484375, 0.1461181640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 8.0, 14.0, 12.0, 18.0, 26.0, 34.0, 55.0, 79.0, 127.0, 149.0, 133.0, 103.0, 65.0, 41.0, 32.0, 14.0, 20.0, 11.0, 12.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.693601608276367e-05, -6.500538438558578e-05, -6.30747526884079e-05, -6.114412099123001e-05, -5.9213489294052124e-05, -5.728285759687424e-05, -5.535222589969635e-05, -5.342159420251846e-05, -5.1490962505340576e-05, -4.956033080816269e-05, -4.76296991109848e-05, -4.5699067413806915e-05, -4.376843571662903e-05, -4.183780401945114e-05, -3.9907172322273254e-05, -3.797654062509537e-05, -3.604590892791748e-05, -3.4115277230739594e-05, -3.2184645533561707e-05, -3.025401383638382e-05, -2.8323382139205933e-05, -2.6392750442028046e-05, -2.446211874485016e-05, -2.2531487047672272e-05, -2.0600855350494385e-05, -1.8670223653316498e-05, -1.673959195613861e-05, -1.4808960258960724e-05, -1.2878328561782837e-05, -1.094769686460495e-05, -9.017065167427063e-06, -7.086433470249176e-06, -5.155801773071289e-06, -3.225170075893402e-06, -1.2945383787155151e-06, 6.360933184623718e-07, 2.566725015640259e-06, 4.497356712818146e-06, 6.427988409996033e-06, 8.35862010717392e-06, 1.0289251804351807e-05, 1.2219883501529694e-05, 1.415051519870758e-05, 1.6081146895885468e-05, 1.8011778593063354e-05, 1.994241029024124e-05, 2.187304198741913e-05, 2.3803673684597015e-05, 2.5734305381774902e-05, 2.766493707895279e-05, 2.9595568776130676e-05, 3.152620047330856e-05, 3.345683217048645e-05, 3.538746386766434e-05, 3.7318095564842224e-05, 3.924872726202011e-05, 4.1179358959198e-05, 4.3109990656375885e-05, 4.504062235355377e-05, 4.697125405073166e-05, 4.8901885747909546e-05, 5.083251744508743e-05, 5.276314914226532e-05, 5.469378083944321e-05, 5.6624412536621094e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 5.0, 7.0, 7.0, 10.0, 27.0, 39.0, 50.0, 108.0, 187.0, 529.0, 1614.0, 6221.0, 46957.0, 814510.0, 162252.0, 11929.0, 2586.0, 786.0, 332.0, 146.0, 81.0, 49.0, 31.0, 29.0, 6.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14064979553222656, -0.13591384887695312, -0.1311779022216797, -0.12644195556640625, -0.12170600891113281, -0.11697006225585938, -0.11223411560058594, -0.1074981689453125, -0.10276222229003906, -0.09802627563476562, -0.09329032897949219, -0.08855438232421875, -0.08381843566894531, -0.07908248901367188, -0.07434654235839844, -0.069610595703125, -0.06487464904785156, -0.060138702392578125, -0.05540275573730469, -0.05066680908203125, -0.04593086242675781, -0.041194915771484375, -0.03645896911621094, -0.0317230224609375, -0.026987075805664062, -0.022251129150390625, -0.017515182495117188, -0.01277923583984375, -0.008043289184570312, -0.003307342529296875, 0.0014286041259765625, 0.00616455078125, 0.010900497436523438, 0.015636444091796875, 0.020372390747070312, 0.02510833740234375, 0.029844284057617188, 0.034580230712890625, 0.03931617736816406, 0.0440521240234375, 0.04878807067871094, 0.053524017333984375, 0.05825996398925781, 0.06299591064453125, 0.06773185729980469, 0.07246780395507812, 0.07720375061035156, 0.081939697265625, 0.08667564392089844, 0.09141159057617188, 0.09614753723144531, 0.10088348388671875, 0.10561943054199219, 0.11035537719726562, 0.11509132385253906, 0.1198272705078125, 0.12456321716308594, 0.12929916381835938, 0.1340351104736328, 0.13877105712890625, 0.1435070037841797, 0.14824295043945312, 0.15297889709472656, 0.15771484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 11.0, 21.0, 38.0, 88.0, 161.0, 232.0, 206.0, 103.0, 44.0, 28.0, 14.0, 11.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3432121276855469, -0.33437347412109375, -0.3255348205566406, -0.3166961669921875, -0.3078575134277344, -0.29901885986328125, -0.2901802062988281, -0.281341552734375, -0.2725028991699219, -0.26366424560546875, -0.2548255920410156, -0.2459869384765625, -0.23714828491210938, -0.22830963134765625, -0.21947097778320312, -0.21063232421875, -0.20179367065429688, -0.19295501708984375, -0.18411636352539062, -0.1752777099609375, -0.16643905639648438, -0.15760040283203125, -0.14876174926757812, -0.139923095703125, -0.13108444213867188, -0.12224578857421875, -0.11340713500976562, -0.1045684814453125, -0.09572982788085938, -0.08689117431640625, -0.07805252075195312, -0.0692138671875, -0.060375213623046875, -0.05153656005859375, -0.042697906494140625, -0.0338592529296875, -0.025020599365234375, -0.01618194580078125, -0.007343292236328125, 0.001495361328125, 0.010334014892578125, 0.01917266845703125, 0.028011322021484375, 0.0368499755859375, 0.045688629150390625, 0.05452728271484375, 0.06336593627929688, 0.07220458984375, 0.08104324340820312, 0.08988189697265625, 0.09872055053710938, 0.1075592041015625, 0.11639785766601562, 0.12523651123046875, 0.13407516479492188, 0.142913818359375, 0.15175247192382812, 0.16059112548828125, 0.16942977905273438, 0.1782684326171875, 0.18710708618164062, 0.19594573974609375, 0.20478439331054688, 0.213623046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 5.0, 11.0, 7.0, 19.0, 48.0, 55.0, 79.0, 109.0, 139.0, 141.0, 142.0, 109.0, 47.0, 34.0, 23.0, 9.0, 16.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0867371559143066, -2.0298352241516113, -1.9729334115982056, -1.9160315990447998, -1.8591296672821045, -1.8022278547286987, -1.7453259229660034, -1.6884241104125977, -1.6315221786499023, -1.5746203660964966, -1.5177184343338013, -1.4608166217803955, -1.4039146900177002, -1.3470128774642944, -1.2901109457015991, -1.2332091331481934, -1.176307201385498, -1.1194053888320923, -1.062503457069397, -1.0056016445159912, -0.9486997127532959, -0.8917979001998901, -0.8348959684371948, -0.7779941558837891, -0.7210923433303833, -0.6641904711723328, -0.6072885990142822, -0.5503867268562317, -0.49348485469818115, -0.436583012342453, -0.37968114018440247, -0.32277926802635193, -0.265877366065979, -0.20897549390792847, -0.15207362174987793, -0.09517176449298859, -0.03826989233493805, 0.018631964921951294, 0.07553383708000183, 0.13243570923805237, 0.1893375813961029, 0.24623945355415344, 0.303141325712204, 0.36004316806793213, 0.41694504022598267, 0.4738469123840332, 0.5307487845420837, 0.5876506567001343, 0.6445525288581848, 0.7014544010162354, 0.7583562731742859, 0.8152581453323364, 0.872160017490387, 0.9290618896484375, 0.9859637022018433, 1.0428656339645386, 1.0997674465179443, 1.15666925907135, 1.2135711908340454, 1.2704730033874512, 1.3273749351501465, 1.3842767477035522, 1.4411786794662476, 1.4980804920196533, 1.5549824237823486]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 7.0, 11.0, 7.0, 17.0, 13.0, 17.0, 12.0, 25.0, 27.0, 25.0, 24.0, 36.0, 30.0, 41.0, 54.0, 35.0, 55.0, 64.0, 50.0, 48.0, 47.0, 43.0, 36.0, 33.0, 46.0, 26.0, 33.0, 24.0, 18.0, 18.0, 12.0, 15.0, 10.0, 4.0, 6.0, 2.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0074591636657715, -1.9423013925552368, -1.8771436214447021, -1.811985969543457, -1.7468281984329224, -1.6816704273223877, -1.6165127754211426, -1.551355004310608, -1.4861972332000732, -1.4210394620895386, -1.355881690979004, -1.2907240390777588, -1.2255662679672241, -1.1604084968566895, -1.0952508449554443, -1.0300930738449097, -0.964935302734375, -0.8997775316238403, -0.8346198201179504, -0.7694621086120605, -0.7043043375015259, -0.6391465663909912, -0.5739888548851013, -0.5088311433792114, -0.44367337226867676, -0.3785156309604645, -0.3133578896522522, -0.24820014834403992, -0.18304240703582764, -0.11788466572761536, -0.052726924419403076, 0.012430816888809204, 0.07758855819702148, 0.14274629950523376, 0.20790404081344604, 0.2730617821216583, 0.3382195234298706, 0.4033772647380829, 0.46853500604629517, 0.5336927175521851, 0.5988504886627197, 0.6640082597732544, 0.7291659712791443, 0.7943236827850342, 0.8594814538955688, 0.9246392250061035, 0.9897969365119934, 1.0549546480178833, 1.120112419128418, 1.1852701902389526, 1.2504279613494873, 1.3155856132507324, 1.380743384361267, 1.4459011554718018, 1.5110588073730469, 1.5762165784835815, 1.6413743495941162, 1.7065321207046509, 1.7716898918151855, 1.8368475437164307, 1.9020053148269653, 1.9671630859375, 2.032320737838745, 2.0974786281585693, 2.1626362800598145]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 7.0, 11.0, 14.0, 24.0, 23.0, 35.0, 60.0, 99.0, 122.0, 170.0, 246.0, 374.0, 605.0, 963.0, 1760.0, 3468.0, 9282.0, 49489.0, 4014737.0, 91139.0, 12308.0, 4203.0, 2075.0, 1086.0, 684.0, 444.0, 265.0, 190.0, 105.0, 87.0, 55.0, 50.0, 30.0, 13.0, 14.0, 9.0, 5.0, 5.0, 10.0, 1.0, 4.0, 3.0], "bins": [-0.2254638671875, -0.2199115753173828, -0.21435928344726562, -0.20880699157714844, -0.20325469970703125, -0.19770240783691406, -0.19215011596679688, -0.1865978240966797, -0.1810455322265625, -0.1754932403564453, -0.16994094848632812, -0.16438865661621094, -0.15883636474609375, -0.15328407287597656, -0.14773178100585938, -0.1421794891357422, -0.136627197265625, -0.1310749053955078, -0.12552261352539062, -0.11997032165527344, -0.11441802978515625, -0.10886573791503906, -0.10331344604492188, -0.09776115417480469, -0.0922088623046875, -0.08665657043457031, -0.08110427856445312, -0.07555198669433594, -0.06999969482421875, -0.06444740295410156, -0.058895111083984375, -0.05334281921386719, -0.04779052734375, -0.04223823547363281, -0.036685943603515625, -0.031133651733398438, -0.02558135986328125, -0.020029067993164062, -0.014476776123046875, -0.008924484252929688, -0.0033721923828125, 0.0021800994873046875, 0.007732391357421875, 0.013284683227539062, 0.01883697509765625, 0.024389266967773438, 0.029941558837890625, 0.03549385070800781, 0.041046142578125, 0.04659843444824219, 0.052150726318359375, 0.05770301818847656, 0.06325531005859375, 0.06880760192871094, 0.07435989379882812, 0.07991218566894531, 0.0854644775390625, 0.09101676940917969, 0.09656906127929688, 0.10212135314941406, 0.10767364501953125, 0.11322593688964844, 0.11877822875976562, 0.12433052062988281, 0.1298828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 8.0, 6.0, 16.0, 9.0, 18.0, 27.0, 27.0, 28.0, 39.0, 36.0, 40.0, 49.0, 58.0, 54.0, 70.0, 44.0, 53.0, 56.0, 50.0, 48.0, 46.0, 25.0, 30.0, 30.0, 21.0, 20.0, 16.0, 14.0, 11.0, 3.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.1556396484375, -0.15176105499267578, -0.14788246154785156, -0.14400386810302734, -0.14012527465820312, -0.1362466812133789, -0.1323680877685547, -0.12848949432373047, -0.12461090087890625, -0.12073230743408203, -0.11685371398925781, -0.1129751205444336, -0.10909652709960938, -0.10521793365478516, -0.10133934020996094, -0.09746074676513672, -0.0935821533203125, -0.08970355987548828, -0.08582496643066406, -0.08194637298583984, -0.07806777954101562, -0.0741891860961914, -0.07031059265136719, -0.06643199920654297, -0.06255340576171875, -0.05867481231689453, -0.05479621887207031, -0.050917625427246094, -0.047039031982421875, -0.043160438537597656, -0.03928184509277344, -0.03540325164794922, -0.031524658203125, -0.02764606475830078, -0.023767471313476562, -0.019888877868652344, -0.016010284423828125, -0.012131690979003906, -0.008253097534179688, -0.004374504089355469, -0.00049591064453125, 0.0033826828002929688, 0.0072612762451171875, 0.011139869689941406, 0.015018463134765625, 0.018897056579589844, 0.022775650024414062, 0.02665424346923828, 0.0305328369140625, 0.03441143035888672, 0.03829002380371094, 0.042168617248535156, 0.046047210693359375, 0.049925804138183594, 0.05380439758300781, 0.05768299102783203, 0.06156158447265625, 0.06544017791748047, 0.06931877136230469, 0.0731973648071289, 0.07707595825195312, 0.08095455169677734, 0.08483314514160156, 0.08871173858642578, 0.09259033203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 13.0, 14.0, 18.0, 28.0, 45.0, 57.0, 80.0, 104.0, 136.0, 229.0, 360.0, 644.0, 1120.0, 2456.0, 7450.0, 85443.0, 4066232.0, 21460.0, 4264.0, 1746.0, 854.0, 472.0, 307.0, 195.0, 138.0, 99.0, 80.0, 54.0, 43.0, 33.0, 27.0, 12.0, 8.0, 12.0, 13.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.29093170166015625, -0.2813262939453125, -0.27172088623046875, -0.262115478515625, -0.25251007080078125, -0.2429046630859375, -0.23329925537109375, -0.22369384765625, -0.21408843994140625, -0.2044830322265625, -0.19487762451171875, -0.185272216796875, -0.17566680908203125, -0.1660614013671875, -0.15645599365234375, -0.1468505859375, -0.13724517822265625, -0.1276397705078125, -0.11803436279296875, -0.108428955078125, -0.09882354736328125, -0.0892181396484375, -0.07961273193359375, -0.07000732421875, -0.06040191650390625, -0.0507965087890625, -0.04119110107421875, -0.031585693359375, -0.02198028564453125, -0.0123748779296875, -0.00276947021484375, 0.0068359375, 0.01644134521484375, 0.0260467529296875, 0.03565216064453125, 0.045257568359375, 0.05486297607421875, 0.0644683837890625, 0.07407379150390625, 0.08367919921875, 0.09328460693359375, 0.1028900146484375, 0.11249542236328125, 0.122100830078125, 0.13170623779296875, 0.1413116455078125, 0.15091705322265625, 0.1605224609375, 0.17012786865234375, 0.1797332763671875, 0.18933868408203125, 0.198944091796875, 0.20854949951171875, 0.2181549072265625, 0.22776031494140625, 0.23736572265625, 0.24697113037109375, 0.2565765380859375, 0.26618194580078125, 0.275787353515625, 0.28539276123046875, 0.2949981689453125, 0.30460357666015625, 0.314208984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 22.0, 128.0, 3610.0, 229.0, 43.0, 18.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.2073535919189453, -0.20035171508789062, -0.19334983825683594, -0.18634796142578125, -0.17934608459472656, -0.17234420776367188, -0.1653423309326172, -0.1583404541015625, -0.1513385772705078, -0.14433670043945312, -0.13733482360839844, -0.13033294677734375, -0.12333106994628906, -0.11632919311523438, -0.10932731628417969, -0.102325439453125, -0.09532356262207031, -0.08832168579101562, -0.08131980895996094, -0.07431793212890625, -0.06731605529785156, -0.060314178466796875, -0.05331230163574219, -0.0463104248046875, -0.03930854797363281, -0.032306671142578125, -0.025304794311523438, -0.01830291748046875, -0.011301040649414062, -0.004299163818359375, 0.0027027130126953125, 0.00970458984375, 0.016706466674804688, 0.023708343505859375, 0.030710220336914062, 0.03771209716796875, 0.04471397399902344, 0.051715850830078125, 0.05871772766113281, 0.0657196044921875, 0.07272148132324219, 0.07972335815429688, 0.08672523498535156, 0.09372711181640625, 0.10072898864746094, 0.10773086547851562, 0.11473274230957031, 0.121734619140625, 0.1287364959716797, 0.13573837280273438, 0.14274024963378906, 0.14974212646484375, 0.15674400329589844, 0.16374588012695312, 0.1707477569580078, 0.1777496337890625, 0.1847515106201172, 0.19175338745117188, 0.19875526428222656, 0.20575714111328125, 0.21275901794433594, 0.21976089477539062, 0.2267627716064453, 0.2337646484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 11.0, 23.0, 40.0, 58.0, 83.0, 121.0, 147.0, 184.0, 127.0, 79.0, 46.0, 31.0, 13.0, 10.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36494317650794983, -0.3513897657394409, -0.3378363847732544, -0.3242829740047455, -0.3107295632362366, -0.29717618227005005, -0.28362277150154114, -0.2700693607330322, -0.2565159797668457, -0.24296258389949799, -0.22940917313098907, -0.21585577726364136, -0.20230236649513245, -0.18874897062778473, -0.175195574760437, -0.1616421639919281, -0.1480887532234192, -0.13453535735607147, -0.12098194658756256, -0.10742855072021484, -0.09387514740228653, -0.08032174408435822, -0.0667683482170105, -0.053214944899082184, -0.03966154158115387, -0.026108140125870705, -0.01255473867058754, 0.000998660922050476, 0.01455206423997879, 0.028105467557907104, 0.04165886342525482, 0.055212266743183136, 0.06876569986343384, 0.08231910318136215, 0.09587250649929047, 0.10942590236663818, 0.1229793056845665, 0.1365327090024948, 0.15008610486984253, 0.16363951563835144, 0.17719291150569916, 0.19074630737304688, 0.2042997181415558, 0.2178531140089035, 0.23140650987625122, 0.24495992064476013, 0.25851333141326904, 0.27206671237945557, 0.2856201231479645, 0.2991735339164734, 0.3127269148826599, 0.3262803256511688, 0.33983373641967773, 0.35338711738586426, 0.36694052815437317, 0.3804939389228821, 0.3940473198890686, 0.4076007306575775, 0.42115411162376404, 0.43470752239227295, 0.44826093316078186, 0.46181434392929077, 0.4753677248954773, 0.4889211356639862, 0.5024745464324951]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 14.0, 21.0, 22.0, 31.0, 38.0, 36.0, 38.0, 37.0, 45.0, 55.0, 54.0, 66.0, 52.0, 46.0, 52.0, 59.0, 59.0, 43.0, 33.0, 43.0, 26.0, 23.0, 20.0, 19.0, 13.0, 7.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24484783411026, -0.23513230681419373, -0.22541677951812744, -0.21570125222206116, -0.20598572492599487, -0.1962701976299286, -0.1865546703338623, -0.17683914303779602, -0.16712361574172974, -0.15740808844566345, -0.14769256114959717, -0.13797703385353088, -0.1282615065574646, -0.11854597926139832, -0.10883045941591263, -0.09911493211984634, -0.08939941227436066, -0.07968388497829437, -0.06996835768222809, -0.0602528341114521, -0.05053730681538582, -0.040821779519319534, -0.03110625594854355, -0.021390728652477264, -0.01167520135641098, -0.0019596749916672707, 0.007755851373076439, 0.017471376806497574, 0.027186904102563858, 0.03690243139863014, 0.04661795496940613, 0.05633348226547241, 0.0660490095615387, 0.07576453685760498, 0.08548006415367126, 0.09519559144973755, 0.10491111874580383, 0.11462664604187012, 0.1243421658873558, 0.13405770063400269, 0.14377322793006897, 0.15348875522613525, 0.16320428252220154, 0.17291980981826782, 0.1826353371143341, 0.1923508644104004, 0.20206639170646667, 0.21178191900253296, 0.22149743139743805, 0.23121295869350433, 0.24092848598957062, 0.2506439983844757, 0.260359525680542, 0.2700750529766083, 0.27979058027267456, 0.28950610756874084, 0.29922163486480713, 0.3089371621608734, 0.3186526894569397, 0.328368216753006, 0.33808374404907227, 0.34779927134513855, 0.35751479864120483, 0.3672303259372711, 0.3769458532333374]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 13.0, 11.0, 19.0, 32.0, 27.0, 47.0, 85.0, 126.0, 244.0, 493.0, 1018.0, 2349.0, 6507.0, 22587.0, 104919.0, 523954.0, 310731.0, 54349.0, 13553.0, 4168.0, 1690.0, 732.0, 343.0, 214.0, 119.0, 78.0, 45.0, 31.0, 16.0, 16.0, 7.0, 10.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.260986328125, -0.2538948059082031, -0.24680328369140625, -0.23971176147460938, -0.2326202392578125, -0.22552871704101562, -0.21843719482421875, -0.21134567260742188, -0.204254150390625, -0.19716262817382812, -0.19007110595703125, -0.18297958374023438, -0.1758880615234375, -0.16879653930664062, -0.16170501708984375, -0.15461349487304688, -0.14752197265625, -0.14043045043945312, -0.13333892822265625, -0.12624740600585938, -0.1191558837890625, -0.11206436157226562, -0.10497283935546875, -0.09788131713867188, -0.090789794921875, -0.08369827270507812, -0.07660675048828125, -0.06951522827148438, -0.0624237060546875, -0.055332183837890625, -0.04824066162109375, -0.041149139404296875, -0.0340576171875, -0.026966094970703125, -0.01987457275390625, -0.012783050537109375, -0.0056915283203125, 0.001399993896484375, 0.00849151611328125, 0.015583038330078125, 0.022674560546875, 0.029766082763671875, 0.03685760498046875, 0.043949127197265625, 0.0510406494140625, 0.058132171630859375, 0.06522369384765625, 0.07231521606445312, 0.07940673828125, 0.08649826049804688, 0.09358978271484375, 0.10068130493164062, 0.1077728271484375, 0.11486434936523438, 0.12195587158203125, 0.12904739379882812, 0.136138916015625, 0.14323043823242188, 0.15032196044921875, 0.15741348266601562, 0.1645050048828125, 0.17159652709960938, 0.17868804931640625, 0.18577957153320312, 0.19287109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 13.0, 15.0, 12.0, 11.0, 20.0, 16.0, 35.0, 27.0, 33.0, 37.0, 51.0, 49.0, 36.0, 59.0, 51.0, 57.0, 54.0, 41.0, 48.0, 40.0, 43.0, 34.0, 30.0, 21.0, 27.0, 24.0, 21.0, 15.0, 12.0, 12.0, 8.0, 1.0, 15.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.147216796875, -0.1434640884399414, -0.1397113800048828, -0.13595867156982422, -0.13220596313476562, -0.12845325469970703, -0.12470054626464844, -0.12094783782958984, -0.11719512939453125, -0.11344242095947266, -0.10968971252441406, -0.10593700408935547, -0.10218429565429688, -0.09843158721923828, -0.09467887878417969, -0.0909261703491211, -0.0871734619140625, -0.0834207534790039, -0.07966804504394531, -0.07591533660888672, -0.07216262817382812, -0.06840991973876953, -0.06465721130371094, -0.060904502868652344, -0.05715179443359375, -0.053399085998535156, -0.04964637756347656, -0.04589366912841797, -0.042140960693359375, -0.03838825225830078, -0.03463554382324219, -0.030882835388183594, -0.027130126953125, -0.023377418518066406, -0.019624710083007812, -0.01587200164794922, -0.012119293212890625, -0.008366584777832031, -0.0046138763427734375, -0.0008611679077148438, 0.00289154052734375, 0.006644248962402344, 0.010396957397460938, 0.014149665832519531, 0.017902374267578125, 0.02165508270263672, 0.025407791137695312, 0.029160499572753906, 0.0329132080078125, 0.036665916442871094, 0.04041862487792969, 0.04417133331298828, 0.047924041748046875, 0.05167675018310547, 0.05542945861816406, 0.059182167053222656, 0.06293487548828125, 0.06668758392333984, 0.07044029235839844, 0.07419300079345703, 0.07794570922851562, 0.08169841766357422, 0.08545112609863281, 0.0892038345336914, 0.09295654296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 11.0, 11.0, 23.0, 31.0, 32.0, 42.0, 63.0, 97.0, 156.0, 257.0, 423.0, 940.0, 2405.0, 9137.0, 56664.0, 659879.0, 283628.0, 26044.0, 5401.0, 1654.0, 649.0, 358.0, 212.0, 130.0, 78.0, 48.0, 52.0, 32.0, 30.0, 14.0, 7.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25927734375, -0.2499542236328125, -0.240631103515625, -0.2313079833984375, -0.22198486328125, -0.2126617431640625, -0.203338623046875, -0.1940155029296875, -0.1846923828125, -0.1753692626953125, -0.166046142578125, -0.1567230224609375, -0.14739990234375, -0.1380767822265625, -0.128753662109375, -0.1194305419921875, -0.110107421875, -0.1007843017578125, -0.091461181640625, -0.0821380615234375, -0.07281494140625, -0.0634918212890625, -0.054168701171875, -0.0448455810546875, -0.0355224609375, -0.0261993408203125, -0.016876220703125, -0.0075531005859375, 0.00177001953125, 0.0110931396484375, 0.020416259765625, 0.0297393798828125, 0.0390625, 0.0483856201171875, 0.057708740234375, 0.0670318603515625, 0.07635498046875, 0.0856781005859375, 0.095001220703125, 0.1043243408203125, 0.1136474609375, 0.1229705810546875, 0.132293701171875, 0.1416168212890625, 0.15093994140625, 0.1602630615234375, 0.169586181640625, 0.1789093017578125, 0.188232421875, 0.1975555419921875, 0.206878662109375, 0.2162017822265625, 0.22552490234375, 0.2348480224609375, 0.244171142578125, 0.2534942626953125, 0.2628173828125, 0.2721405029296875, 0.281463623046875, 0.2907867431640625, 0.30010986328125, 0.3094329833984375, 0.318756103515625, 0.3280792236328125, 0.33740234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 10.0, 12.0, 7.0, 10.0, 15.0, 12.0, 19.0, 23.0, 29.0, 27.0, 31.0, 39.0, 44.0, 37.0, 47.0, 38.0, 47.0, 51.0, 51.0, 47.0, 59.0, 44.0, 55.0, 35.0, 39.0, 36.0, 32.0, 16.0, 16.0, 8.0, 16.0, 8.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4536552429199219, -0.43953704833984375, -0.4254188537597656, -0.4113006591796875, -0.3971824645996094, -0.38306427001953125, -0.3689460754394531, -0.354827880859375, -0.3407096862792969, -0.32659149169921875, -0.3124732971191406, -0.2983551025390625, -0.2842369079589844, -0.27011871337890625, -0.2560005187988281, -0.24188232421875, -0.22776412963867188, -0.21364593505859375, -0.19952774047851562, -0.1854095458984375, -0.17129135131835938, -0.15717315673828125, -0.14305496215820312, -0.128936767578125, -0.11481857299804688, -0.10070037841796875, -0.08658218383789062, -0.0724639892578125, -0.058345794677734375, -0.04422760009765625, -0.030109405517578125, -0.0159912109375, -0.001873016357421875, 0.01224517822265625, 0.026363372802734375, 0.0404815673828125, 0.054599761962890625, 0.06871795654296875, 0.08283615112304688, 0.096954345703125, 0.11107254028320312, 0.12519073486328125, 0.13930892944335938, 0.1534271240234375, 0.16754531860351562, 0.18166351318359375, 0.19578170776367188, 0.20989990234375, 0.22401809692382812, 0.23813629150390625, 0.2522544860839844, 0.2663726806640625, 0.2804908752441406, 0.29460906982421875, 0.3087272644042969, 0.322845458984375, 0.3369636535644531, 0.35108184814453125, 0.3652000427246094, 0.3793182373046875, 0.3934364318847656, 0.40755462646484375, 0.4216728210449219, 0.435791015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 3.0, 8.0, 12.0, 23.0, 36.0, 62.0, 75.0, 142.0, 276.0, 594.0, 1770.0, 7683.0, 83025.0, 876793.0, 68452.0, 6881.0, 1545.0, 540.0, 255.0, 133.0, 78.0, 54.0, 41.0, 15.0, 15.0, 10.0, 7.0, 3.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1175537109375, -0.11381816864013672, -0.11008262634277344, -0.10634708404541016, -0.10261154174804688, -0.0988759994506836, -0.09514045715332031, -0.09140491485595703, -0.08766937255859375, -0.08393383026123047, -0.08019828796386719, -0.0764627456665039, -0.07272720336914062, -0.06899166107177734, -0.06525611877441406, -0.06152057647705078, -0.0577850341796875, -0.05404949188232422, -0.05031394958496094, -0.046578407287597656, -0.042842864990234375, -0.039107322692871094, -0.03537178039550781, -0.03163623809814453, -0.02790069580078125, -0.02416515350341797, -0.020429611206054688, -0.016694068908691406, -0.012958526611328125, -0.009222984313964844, -0.0054874420166015625, -0.0017518997192382812, 0.001983642578125, 0.005719184875488281, 0.009454727172851562, 0.013190269470214844, 0.016925811767578125, 0.020661354064941406, 0.024396896362304688, 0.02813243865966797, 0.03186798095703125, 0.03560352325439453, 0.03933906555175781, 0.043074607849121094, 0.046810150146484375, 0.050545692443847656, 0.05428123474121094, 0.05801677703857422, 0.0617523193359375, 0.06548786163330078, 0.06922340393066406, 0.07295894622802734, 0.07669448852539062, 0.0804300308227539, 0.08416557312011719, 0.08790111541748047, 0.09163665771484375, 0.09537220001220703, 0.09910774230957031, 0.1028432846069336, 0.10657882690429688, 0.11031436920166016, 0.11404991149902344, 0.11778545379638672, 0.12152099609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 9.0, 9.0, 7.0, 16.0, 13.0, 20.0, 14.0, 29.0, 30.0, 43.0, 58.0, 72.0, 119.0, 94.0, 123.0, 86.0, 56.0, 62.0, 26.0, 28.0, 17.0, 11.0, 11.0, 8.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.358457565307617e-05, -5.211867392063141e-05, -5.0652772188186646e-05, -4.918687045574188e-05, -4.772096872329712e-05, -4.6255066990852356e-05, -4.478916525840759e-05, -4.332326352596283e-05, -4.1857361793518066e-05, -4.03914600610733e-05, -3.892555832862854e-05, -3.745965659618378e-05, -3.5993754863739014e-05, -3.452785313129425e-05, -3.306195139884949e-05, -3.1596049666404724e-05, -3.013014793395996e-05, -2.8664246201515198e-05, -2.7198344469070435e-05, -2.573244273662567e-05, -2.4266541004180908e-05, -2.2800639271736145e-05, -2.1334737539291382e-05, -1.986883580684662e-05, -1.8402934074401855e-05, -1.6937032341957092e-05, -1.547113060951233e-05, -1.4005228877067566e-05, -1.2539327144622803e-05, -1.107342541217804e-05, -9.607523679733276e-06, -8.141621947288513e-06, -6.67572021484375e-06, -5.209818482398987e-06, -3.7439167499542236e-06, -2.2780150175094604e-06, -8.121132850646973e-07, 6.537884473800659e-07, 2.119690179824829e-06, 3.5855919122695923e-06, 5.0514936447143555e-06, 6.517395377159119e-06, 7.983297109603882e-06, 9.449198842048645e-06, 1.0915100574493408e-05, 1.2381002306938171e-05, 1.3846904039382935e-05, 1.5312805771827698e-05, 1.677870750427246e-05, 1.8244609236717224e-05, 1.9710510969161987e-05, 2.117641270160675e-05, 2.2642314434051514e-05, 2.4108216166496277e-05, 2.557411789894104e-05, 2.7040019631385803e-05, 2.8505921363830566e-05, 2.997182309627533e-05, 3.143772482872009e-05, 3.2903626561164856e-05, 3.436952829360962e-05, 3.583543002605438e-05, 3.7301331758499146e-05, 3.876723349094391e-05, 4.023313522338867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 1.0, 4.0, 9.0, 12.0, 20.0, 49.0, 92.0, 242.0, 928.0, 5940.0, 281365.0, 748002.0, 10119.0, 1195.0, 321.0, 121.0, 72.0, 28.0, 11.0, 11.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.271728515625, -0.2655668258666992, -0.25940513610839844, -0.25324344635009766, -0.24708175659179688, -0.2409200668334961, -0.2347583770751953, -0.22859668731689453, -0.22243499755859375, -0.21627330780029297, -0.2101116180419922, -0.2039499282836914, -0.19778823852539062, -0.19162654876708984, -0.18546485900878906, -0.17930316925048828, -0.1731414794921875, -0.16697978973388672, -0.16081809997558594, -0.15465641021728516, -0.14849472045898438, -0.1423330307006836, -0.1361713409423828, -0.13000965118408203, -0.12384796142578125, -0.11768627166748047, -0.11152458190917969, -0.1053628921508789, -0.09920120239257812, -0.09303951263427734, -0.08687782287597656, -0.08071613311767578, -0.074554443359375, -0.06839275360107422, -0.06223106384277344, -0.056069374084472656, -0.049907684326171875, -0.043745994567871094, -0.03758430480957031, -0.03142261505126953, -0.02526092529296875, -0.01909923553466797, -0.012937545776367188, -0.006775856018066406, -0.000614166259765625, 0.005547523498535156, 0.011709213256835938, 0.01787090301513672, 0.0240325927734375, 0.03019428253173828, 0.03635597229003906, 0.042517662048339844, 0.048679351806640625, 0.054841041564941406, 0.06100273132324219, 0.06716442108154297, 0.07332611083984375, 0.07948780059814453, 0.08564949035644531, 0.0918111801147461, 0.09797286987304688, 0.10413455963134766, 0.11029624938964844, 0.11645793914794922, 0.12261962890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 18.0, 18.0, 30.0, 54.0, 85.0, 127.0, 143.0, 144.0, 147.0, 85.0, 37.0, 23.0, 19.0, 13.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09143543243408203, -0.08661842346191406, -0.0818014144897461, -0.07698440551757812, -0.07216739654541016, -0.06735038757324219, -0.06253337860107422, -0.05771636962890625, -0.05289936065673828, -0.04808235168457031, -0.043265342712402344, -0.038448333740234375, -0.033631324768066406, -0.028814315795898438, -0.02399730682373047, -0.0191802978515625, -0.014363288879394531, -0.009546279907226562, -0.004729270935058594, 8.7738037109375e-05, 0.004904747009277344, 0.009721755981445312, 0.014538764953613281, 0.01935577392578125, 0.02417278289794922, 0.028989791870117188, 0.033806800842285156, 0.038623809814453125, 0.043440818786621094, 0.04825782775878906, 0.05307483673095703, 0.057891845703125, 0.06270885467529297, 0.06752586364746094, 0.0723428726196289, 0.07715988159179688, 0.08197689056396484, 0.08679389953613281, 0.09161090850830078, 0.09642791748046875, 0.10124492645263672, 0.10606193542480469, 0.11087894439697266, 0.11569595336914062, 0.1205129623413086, 0.12532997131347656, 0.13014698028564453, 0.1349639892578125, 0.13978099822998047, 0.14459800720214844, 0.1494150161743164, 0.15423202514648438, 0.15904903411865234, 0.1638660430908203, 0.16868305206298828, 0.17350006103515625, 0.17831707000732422, 0.1831340789794922, 0.18795108795166016, 0.19276809692382812, 0.1975851058959961, 0.20240211486816406, 0.20721912384033203, 0.2120361328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 9.0, 12.0, 72.0, 194.0, 342.0, 243.0, 92.0, 26.0, 14.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.448692321777344, -5.31413459777832, -5.179576873779297, -5.045019149780273, -4.91046142578125, -4.775903701782227, -4.641345977783203, -4.50678825378418, -4.372230529785156, -4.237672805786133, -4.103115081787109, -3.968557357788086, -3.8339996337890625, -3.699441909790039, -3.5648841857910156, -3.430326461791992, -3.295768976211548, -3.1612112522125244, -3.026653528213501, -2.8920958042144775, -2.757538080215454, -2.6229803562164307, -2.4884228706359863, -2.353865146636963, -2.2193074226379395, -2.084749698638916, -1.9501919746398926, -1.8156342506408691, -1.6810765266418457, -1.5465188026428223, -1.4119611978530884, -1.277403473854065, -1.142845630645752, -1.0082879066467285, -0.8737301826477051, -0.7391725182533264, -0.604614794254303, -0.47005707025527954, -0.3354994058609009, -0.20094168186187744, -0.066383957862854, 0.06817375123500824, 0.20273146033287048, 0.33728915452957153, 0.47184687852859497, 0.6064046025276184, 0.7409622669219971, 0.8755199909210205, 1.010077714920044, 1.1446354389190674, 1.2791931629180908, 1.4137508869171143, 1.5483086109161377, 1.6828663349151611, 1.817423939704895, 1.9519816637039185, 2.0865392684936523, 2.221096992492676, 2.355654716491699, 2.4902124404907227, 2.624770164489746, 2.7593278884887695, 2.893885612487793, 3.0284433364868164, 3.16300106048584]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 10.0, 13.0, 12.0, 22.0, 22.0, 23.0, 26.0, 28.0, 38.0, 47.0, 43.0, 50.0, 52.0, 56.0, 54.0, 72.0, 56.0, 58.0, 41.0, 39.0, 34.0, 37.0, 37.0, 23.0, 12.0, 11.0, 15.0, 9.0, 14.0, 11.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0071139335632324, -1.9408154487609863, -1.8745168447494507, -1.8082183599472046, -1.7419198751449585, -1.6756212711334229, -1.6093227863311768, -1.5430243015289307, -1.4767258167266846, -1.4104273319244385, -1.3441287279129028, -1.2778302431106567, -1.2115317583084106, -1.145233154296875, -1.078934669494629, -1.0126361846923828, -0.9463375806808472, -0.8800390362739563, -0.8137405514717102, -0.7474420070648193, -0.6811435222625732, -0.6148449778556824, -0.5485464334487915, -0.482247918844223, -0.41594940423965454, -0.34965088963508606, -0.2833523750305176, -0.2170538306236267, -0.15075531601905823, -0.08445680141448975, -0.018158257007598877, 0.048140257596969604, 0.11443877220153809, 0.18073728680610657, 0.24703581631183624, 0.3133343458175659, 0.3796328604221344, 0.4459313750267029, 0.5122299194335938, 0.5785284042358398, 0.6448269486427307, 0.7111254930496216, 0.7774239778518677, 0.8437225222587585, 0.9100210666656494, 0.9763195514678955, 1.0426180362701416, 1.1089166402816772, 1.1752151250839233, 1.2415136098861694, 1.307812213897705, 1.3741106986999512, 1.4404091835021973, 1.5067076683044434, 1.573006272315979, 1.639304757118225, 1.7056033611297607, 1.7719018459320068, 1.8382004499435425, 1.9044989347457886, 1.9707974195480347, 2.0370960235595703, 2.1033945083618164, 2.1696929931640625, 2.2359914779663086]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 16.0, 18.0, 28.0, 41.0, 42.0, 64.0, 82.0, 145.0, 239.0, 341.0, 539.0, 965.0, 1924.0, 4066.0, 9648.0, 31947.0, 394353.0, 3572750.0, 141243.0, 21139.0, 7595.0, 3271.0, 1590.0, 893.0, 458.0, 292.0, 158.0, 123.0, 62.0, 58.0, 34.0, 33.0, 23.0, 11.0, 10.0, 9.0, 17.0, 4.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17489242553710938, -0.16948699951171875, -0.16408157348632812, -0.1586761474609375, -0.15327072143554688, -0.14786529541015625, -0.14245986938476562, -0.137054443359375, -0.13164901733398438, -0.12624359130859375, -0.12083816528320312, -0.1154327392578125, -0.11002731323242188, -0.10462188720703125, -0.09921646118164062, -0.09381103515625, -0.08840560913085938, -0.08300018310546875, -0.07759475708007812, -0.0721893310546875, -0.06678390502929688, -0.06137847900390625, -0.055973052978515625, -0.050567626953125, -0.045162200927734375, -0.03975677490234375, -0.034351348876953125, -0.0289459228515625, -0.023540496826171875, -0.01813507080078125, -0.012729644775390625, -0.00732421875, -0.001918792724609375, 0.00348663330078125, 0.008892059326171875, 0.0142974853515625, 0.019702911376953125, 0.02510833740234375, 0.030513763427734375, 0.035919189453125, 0.041324615478515625, 0.04673004150390625, 0.052135467529296875, 0.0575408935546875, 0.06294631958007812, 0.06835174560546875, 0.07375717163085938, 0.07916259765625, 0.08456802368164062, 0.08997344970703125, 0.09537887573242188, 0.1007843017578125, 0.10618972778320312, 0.11159515380859375, 0.11700057983398438, 0.122406005859375, 0.12781143188476562, 0.13321685791015625, 0.13862228393554688, 0.1440277099609375, 0.14943313598632812, 0.15483856201171875, 0.16024398803710938, 0.1656494140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 12.0, 10.0, 12.0, 11.0, 17.0, 30.0, 29.0, 45.0, 42.0, 45.0, 56.0, 34.0, 58.0, 68.0, 61.0, 50.0, 42.0, 57.0, 52.0, 39.0, 40.0, 32.0, 26.0, 29.0, 19.0, 19.0, 12.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12646484375, -0.1226968765258789, -0.11892890930175781, -0.11516094207763672, -0.11139297485351562, -0.10762500762939453, -0.10385704040527344, -0.10008907318115234, -0.09632110595703125, -0.09255313873291016, -0.08878517150878906, -0.08501720428466797, -0.08124923706054688, -0.07748126983642578, -0.07371330261230469, -0.0699453353881836, -0.0661773681640625, -0.062409400939941406, -0.05864143371582031, -0.05487346649169922, -0.051105499267578125, -0.04733753204345703, -0.04356956481933594, -0.039801597595214844, -0.03603363037109375, -0.032265663146972656, -0.028497695922851562, -0.02472972869873047, -0.020961761474609375, -0.01719379425048828, -0.013425827026367188, -0.009657859802246094, -0.005889892578125, -0.0021219253540039062, 0.0016460418701171875, 0.005414009094238281, 0.009181976318359375, 0.012949943542480469, 0.016717910766601562, 0.020485877990722656, 0.02425384521484375, 0.028021812438964844, 0.03178977966308594, 0.03555774688720703, 0.039325714111328125, 0.04309368133544922, 0.04686164855957031, 0.050629615783691406, 0.0543975830078125, 0.058165550231933594, 0.06193351745605469, 0.06570148468017578, 0.06946945190429688, 0.07323741912841797, 0.07700538635253906, 0.08077335357666016, 0.08454132080078125, 0.08830928802490234, 0.09207725524902344, 0.09584522247314453, 0.09961318969726562, 0.10338115692138672, 0.10714912414550781, 0.1109170913696289, 0.11468505859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 2.0, 8.0, 13.0, 18.0, 40.0, 64.0, 121.0, 295.0, 1006.0, 6280.0, 111165.0, 4045129.0, 26463.0, 2677.0, 616.0, 199.0, 70.0, 30.0, 25.0, 17.0, 9.0, 6.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.455322265625, -0.44077301025390625, -0.4262237548828125, -0.41167449951171875, -0.397125244140625, -0.38257598876953125, -0.3680267333984375, -0.35347747802734375, -0.33892822265625, -0.32437896728515625, -0.3098297119140625, -0.29528045654296875, -0.280731201171875, -0.26618194580078125, -0.2516326904296875, -0.23708343505859375, -0.2225341796875, -0.20798492431640625, -0.1934356689453125, -0.17888641357421875, -0.164337158203125, -0.14978790283203125, -0.1352386474609375, -0.12068939208984375, -0.10614013671875, -0.09159088134765625, -0.0770416259765625, -0.06249237060546875, -0.047943115234375, -0.03339385986328125, -0.0188446044921875, -0.00429534912109375, 0.01025390625, 0.02480316162109375, 0.0393524169921875, 0.05390167236328125, 0.068450927734375, 0.08300018310546875, 0.0975494384765625, 0.11209869384765625, 0.12664794921875, 0.14119720458984375, 0.1557464599609375, 0.17029571533203125, 0.184844970703125, 0.19939422607421875, 0.2139434814453125, 0.22849273681640625, 0.2430419921875, 0.25759124755859375, 0.2721405029296875, 0.28668975830078125, 0.301239013671875, 0.31578826904296875, 0.3303375244140625, 0.34488677978515625, 0.35943603515625, 0.37398529052734375, 0.3885345458984375, 0.40308380126953125, 0.417633056640625, 0.43218231201171875, 0.4467315673828125, 0.46128082275390625, 0.475830078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 3.0, 4.0, 13.0, 12.0, 13.0, 29.0, 41.0, 101.0, 368.0, 1894.0, 1191.0, 211.0, 73.0, 42.0, 18.0, 17.0, 15.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3885650634765625, -0.377716064453125, -0.3668670654296875, -0.35601806640625, -0.3451690673828125, -0.334320068359375, -0.3234710693359375, -0.3126220703125, -0.3017730712890625, -0.290924072265625, -0.2800750732421875, -0.26922607421875, -0.2583770751953125, -0.247528076171875, -0.2366790771484375, -0.225830078125, -0.2149810791015625, -0.204132080078125, -0.1932830810546875, -0.18243408203125, -0.1715850830078125, -0.160736083984375, -0.1498870849609375, -0.1390380859375, -0.1281890869140625, -0.117340087890625, -0.1064910888671875, -0.09564208984375, -0.0847930908203125, -0.073944091796875, -0.0630950927734375, -0.05224609375, -0.0413970947265625, -0.030548095703125, -0.0196990966796875, -0.00885009765625, 0.0019989013671875, 0.012847900390625, 0.0236968994140625, 0.0345458984375, 0.0453948974609375, 0.056243896484375, 0.0670928955078125, 0.07794189453125, 0.0887908935546875, 0.099639892578125, 0.1104888916015625, 0.121337890625, 0.1321868896484375, 0.143035888671875, 0.1538848876953125, 0.16473388671875, 0.1755828857421875, 0.186431884765625, 0.1972808837890625, 0.2081298828125, 0.2189788818359375, 0.229827880859375, 0.2406768798828125, 0.25152587890625, 0.2623748779296875, 0.273223876953125, 0.2840728759765625, 0.294921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 12.0, 26.0, 83.0, 195.0, 343.0, 209.0, 83.0, 22.0, 13.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.519117832183838, -3.4436111450195312, -3.3681044578552246, -3.292597770690918, -3.2170910835266113, -3.1415841579437256, -3.066077470779419, -2.9905707836151123, -2.9150640964508057, -2.839557409286499, -2.7640507221221924, -2.6885440349578857, -2.613037109375, -2.5375304222106934, -2.4620237350463867, -2.38651704788208, -2.3110103607177734, -2.235503673553467, -2.15999698638916, -2.0844902992248535, -2.008983612060547, -1.9334768056869507, -1.8579699993133545, -1.7824633121490479, -1.7069566249847412, -1.6314499378204346, -1.555943250656128, -1.4804364442825317, -1.404929757118225, -1.3294230699539185, -1.2539162635803223, -1.1784095764160156, -1.1029026508331299, -1.0273959636688232, -0.9518892168998718, -0.8763824701309204, -0.8008757829666138, -0.7253690958023071, -0.6498623490333557, -0.5743556022644043, -0.49884891510009766, -0.42334219813346863, -0.3478354811668396, -0.27232876420021057, -0.19682204723358154, -0.12131533026695251, -0.045808613300323486, 0.02969813346862793, 0.10520482063293457, 0.1807115375995636, 0.2562182545661926, 0.33172497153282166, 0.4072316884994507, 0.4827384054660797, 0.5582451224327087, 0.6337518692016602, 0.7092585563659668, 0.7847652435302734, 0.8602719902992249, 0.9357787370681763, 1.011285424232483, 1.0867921113967896, 1.1622989177703857, 1.2378056049346924, 1.313312292098999]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 6.0, 7.0, 5.0, 10.0, 16.0, 11.0, 29.0, 32.0, 31.0, 25.0, 47.0, 57.0, 68.0, 68.0, 77.0, 73.0, 60.0, 57.0, 64.0, 51.0, 43.0, 36.0, 25.0, 28.0, 22.0, 15.0, 12.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.303004503250122, -1.2634862661361694, -1.2239681482315063, -1.1844499111175537, -1.1449317932128906, -1.105413556098938, -1.0658953189849854, -1.0263772010803223, -0.9868589639663696, -0.9473407864570618, -0.9078226089477539, -0.8683043718338013, -0.8287861943244934, -0.7892680168151855, -0.7497497797012329, -0.710231602191925, -0.6707134246826172, -0.6311952471733093, -0.5916770696640015, -0.5521588325500488, -0.512640655040741, -0.4731224775314331, -0.43360427021980286, -0.3940860629081726, -0.35456788539886475, -0.3150497078895569, -0.27553150057792664, -0.23601330816745758, -0.19649511575698853, -0.15697692334651947, -0.11745873093605042, -0.07794052362442017, -0.038422346115112305, 0.0010958462953567505, 0.040614038705825806, 0.08013223111629486, 0.11965042352676392, 0.15916861593723297, 0.19868680834770203, 0.23820501565933228, 0.27772319316864014, 0.317241370677948, 0.35675957798957825, 0.3962777853012085, 0.43579596281051636, 0.4753141403198242, 0.5148323774337769, 0.5543505549430847, 0.5938687324523926, 0.6333869099617004, 0.6729050874710083, 0.7124233245849609, 0.7519415020942688, 0.7914596796035767, 0.8309779167175293, 0.8704960942268372, 0.910014271736145, 0.9495324492454529, 0.9890506267547607, 1.0285688638687134, 1.068087100982666, 1.107605218887329, 1.1471234560012817, 1.1866416931152344, 1.2261598110198975]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 4.0, 7.0, 11.0, 16.0, 30.0, 36.0, 44.0, 96.0, 140.0, 228.0, 393.0, 665.0, 1098.0, 1944.0, 3664.0, 7096.0, 14437.0, 32246.0, 72979.0, 170191.0, 301194.0, 241664.0, 110778.0, 47277.0, 20969.0, 10000.0, 5097.0, 2618.0, 1454.0, 864.0, 462.0, 296.0, 189.0, 113.0, 70.0, 71.0, 31.0, 33.0, 18.0, 9.0, 11.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09943294525146484, -0.09657096862792969, -0.09370899200439453, -0.09084701538085938, -0.08798503875732422, -0.08512306213378906, -0.0822610855102539, -0.07939910888671875, -0.0765371322631836, -0.07367515563964844, -0.07081317901611328, -0.06795120239257812, -0.06508922576904297, -0.06222724914550781, -0.059365272521972656, -0.0565032958984375, -0.053641319274902344, -0.05077934265136719, -0.04791736602783203, -0.045055389404296875, -0.04219341278076172, -0.03933143615722656, -0.036469459533691406, -0.03360748291015625, -0.030745506286621094, -0.027883529663085938, -0.02502155303955078, -0.022159576416015625, -0.01929759979248047, -0.016435623168945312, -0.013573646545410156, -0.010711669921875, -0.007849693298339844, -0.0049877166748046875, -0.0021257400512695312, 0.000736236572265625, 0.0035982131958007812, 0.0064601898193359375, 0.009322166442871094, 0.01218414306640625, 0.015046119689941406, 0.017908096313476562, 0.02077007293701172, 0.023632049560546875, 0.02649402618408203, 0.029356002807617188, 0.032217979431152344, 0.0350799560546875, 0.037941932678222656, 0.04080390930175781, 0.04366588592529297, 0.046527862548828125, 0.04938983917236328, 0.05225181579589844, 0.055113792419433594, 0.05797576904296875, 0.060837745666503906, 0.06369972229003906, 0.06656169891357422, 0.06942367553710938, 0.07228565216064453, 0.07514762878417969, 0.07800960540771484, 0.08087158203125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 18.0, 17.0, 21.0, 15.0, 22.0, 27.0, 36.0, 49.0, 41.0, 52.0, 44.0, 52.0, 65.0, 56.0, 43.0, 66.0, 46.0, 37.0, 36.0, 51.0, 30.0, 26.0, 32.0, 22.0, 17.0, 13.0, 9.0, 4.0, 6.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12338829040527344, -0.11970138549804688, -0.11601448059082031, -0.11232757568359375, -0.10864067077636719, -0.10495376586914062, -0.10126686096191406, -0.0975799560546875, -0.09389305114746094, -0.09020614624023438, -0.08651924133300781, -0.08283233642578125, -0.07914543151855469, -0.07545852661132812, -0.07177162170410156, -0.068084716796875, -0.06439781188964844, -0.060710906982421875, -0.05702400207519531, -0.05333709716796875, -0.04965019226074219, -0.045963287353515625, -0.04227638244628906, -0.0385894775390625, -0.03490257263183594, -0.031215667724609375, -0.027528762817382812, -0.02384185791015625, -0.020154953002929688, -0.016468048095703125, -0.012781143188476562, -0.00909423828125, -0.0054073333740234375, -0.001720428466796875, 0.0019664764404296875, 0.00565338134765625, 0.009340286254882812, 0.013027191162109375, 0.016714096069335938, 0.0204010009765625, 0.024087905883789062, 0.027774810791015625, 0.03146171569824219, 0.03514862060546875, 0.03883552551269531, 0.042522430419921875, 0.04620933532714844, 0.049896240234375, 0.05358314514160156, 0.057270050048828125, 0.06095695495605469, 0.06464385986328125, 0.06833076477050781, 0.07201766967773438, 0.07570457458496094, 0.0793914794921875, 0.08307838439941406, 0.08676528930664062, 0.09045219421386719, 0.09413909912109375, 0.09782600402832031, 0.10151290893554688, 0.10519981384277344, 0.10888671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 31.0, 39.0, 73.0, 96.0, 215.0, 342.0, 706.0, 1490.0, 6621.0, 152694.0, 852601.0, 28297.0, 3040.0, 1062.0, 469.0, 285.0, 168.0, 90.0, 67.0, 34.0, 31.0, 17.0, 15.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.32210540771484375, -0.3107147216796875, -0.29932403564453125, -0.287933349609375, -0.27654266357421875, -0.2651519775390625, -0.25376129150390625, -0.24237060546875, -0.23097991943359375, -0.2195892333984375, -0.20819854736328125, -0.196807861328125, -0.18541717529296875, -0.1740264892578125, -0.16263580322265625, -0.1512451171875, -0.13985443115234375, -0.1284637451171875, -0.11707305908203125, -0.105682373046875, -0.09429168701171875, -0.0829010009765625, -0.07151031494140625, -0.06011962890625, -0.04872894287109375, -0.0373382568359375, -0.02594757080078125, -0.014556884765625, -0.00316619873046875, 0.0082244873046875, 0.01961517333984375, 0.031005859375, 0.04239654541015625, 0.0537872314453125, 0.06517791748046875, 0.076568603515625, 0.08795928955078125, 0.0993499755859375, 0.11074066162109375, 0.12213134765625, 0.13352203369140625, 0.1449127197265625, 0.15630340576171875, 0.167694091796875, 0.17908477783203125, 0.1904754638671875, 0.20186614990234375, 0.2132568359375, 0.22464752197265625, 0.2360382080078125, 0.24742889404296875, 0.258819580078125, 0.27021026611328125, 0.2816009521484375, 0.29299163818359375, 0.30438232421875, 0.31577301025390625, 0.3271636962890625, 0.33855438232421875, 0.349945068359375, 0.36133575439453125, 0.3727264404296875, 0.38411712646484375, 0.3955078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 2.0, 4.0, 14.0, 12.0, 23.0, 22.0, 19.0, 33.0, 31.0, 26.0, 31.0, 33.0, 35.0, 35.0, 34.0, 38.0, 40.0, 49.0, 45.0, 51.0, 36.0, 42.0, 46.0, 34.0, 42.0, 35.0, 30.0, 25.0, 23.0, 13.0, 22.0, 14.0, 17.0, 12.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.408447265625, -0.3973045349121094, -0.38616180419921875, -0.3750190734863281, -0.3638763427734375, -0.3527336120605469, -0.34159088134765625, -0.3304481506347656, -0.319305419921875, -0.3081626892089844, -0.29701995849609375, -0.2858772277832031, -0.2747344970703125, -0.2635917663574219, -0.25244903564453125, -0.24130630493164062, -0.23016357421875, -0.21902084350585938, -0.20787811279296875, -0.19673538208007812, -0.1855926513671875, -0.17444992065429688, -0.16330718994140625, -0.15216445922851562, -0.141021728515625, -0.12987899780273438, -0.11873626708984375, -0.10759353637695312, -0.0964508056640625, -0.08530807495117188, -0.07416534423828125, -0.06302261352539062, -0.0518798828125, -0.040737152099609375, -0.02959442138671875, -0.018451690673828125, -0.0073089599609375, 0.003833770751953125, 0.01497650146484375, 0.026119232177734375, 0.037261962890625, 0.048404693603515625, 0.05954742431640625, 0.07069015502929688, 0.0818328857421875, 0.09297561645507812, 0.10411834716796875, 0.11526107788085938, 0.12640380859375, 0.13754653930664062, 0.14868927001953125, 0.15983200073242188, 0.1709747314453125, 0.18211746215820312, 0.19326019287109375, 0.20440292358398438, 0.215545654296875, 0.22668838500976562, 0.23783111572265625, 0.24897384643554688, 0.2601165771484375, 0.2712593078613281, 0.28240203857421875, 0.2935447692871094, 0.3046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 10.0, 10.0, 20.0, 38.0, 44.0, 111.0, 182.0, 476.0, 1395.0, 6219.0, 278479.0, 750242.0, 8615.0, 1649.0, 524.0, 252.0, 106.0, 60.0, 34.0, 26.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2130126953125, -0.20615768432617188, -0.19930267333984375, -0.19244766235351562, -0.1855926513671875, -0.17873764038085938, -0.17188262939453125, -0.16502761840820312, -0.158172607421875, -0.15131759643554688, -0.14446258544921875, -0.13760757446289062, -0.1307525634765625, -0.12389755249023438, -0.11704254150390625, -0.11018753051757812, -0.10333251953125, -0.09647750854492188, -0.08962249755859375, -0.08276748657226562, -0.0759124755859375, -0.06905746459960938, -0.06220245361328125, -0.055347442626953125, -0.048492431640625, -0.041637420654296875, -0.03478240966796875, -0.027927398681640625, -0.0210723876953125, -0.014217376708984375, -0.00736236572265625, -0.000507354736328125, 0.00634765625, 0.013202667236328125, 0.02005767822265625, 0.026912689208984375, 0.0337677001953125, 0.040622711181640625, 0.04747772216796875, 0.054332733154296875, 0.061187744140625, 0.06804275512695312, 0.07489776611328125, 0.08175277709960938, 0.0886077880859375, 0.09546279907226562, 0.10231781005859375, 0.10917282104492188, 0.11602783203125, 0.12288284301757812, 0.12973785400390625, 0.13659286499023438, 0.1434478759765625, 0.15030288696289062, 0.15715789794921875, 0.16401290893554688, 0.170867919921875, 0.17772293090820312, 0.18457794189453125, 0.19143295288085938, 0.1982879638671875, 0.20514297485351562, 0.21199798583984375, 0.21885299682617188, 0.2257080078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 7.0, 9.0, 13.0, 7.0, 14.0, 13.0, 22.0, 27.0, 45.0, 58.0, 81.0, 112.0, 135.0, 100.0, 77.0, 62.0, 48.0, 34.0, 26.0, 15.0, 15.0, 15.0, 10.0, 6.0, 6.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.0024518966674805e-05, -3.838539123535156e-05, -3.674626350402832e-05, -3.510713577270508e-05, -3.3468008041381836e-05, -3.1828880310058594e-05, -3.018975257873535e-05, -2.855062484741211e-05, -2.6911497116088867e-05, -2.5272369384765625e-05, -2.3633241653442383e-05, -2.199411392211914e-05, -2.03549861907959e-05, -1.8715858459472656e-05, -1.7076730728149414e-05, -1.5437602996826172e-05, -1.379847526550293e-05, -1.2159347534179688e-05, -1.0520219802856445e-05, -8.881092071533203e-06, -7.241964340209961e-06, -5.602836608886719e-06, -3.9637088775634766e-06, -2.3245811462402344e-06, -6.854534149169922e-07, 9.5367431640625e-07, 2.592802047729492e-06, 4.231929779052734e-06, 5.8710575103759766e-06, 7.510185241699219e-06, 9.149312973022461e-06, 1.0788440704345703e-05, 1.2427568435668945e-05, 1.4066696166992188e-05, 1.570582389831543e-05, 1.7344951629638672e-05, 1.8984079360961914e-05, 2.0623207092285156e-05, 2.22623348236084e-05, 2.390146255493164e-05, 2.5540590286254883e-05, 2.7179718017578125e-05, 2.8818845748901367e-05, 3.045797348022461e-05, 3.209710121154785e-05, 3.3736228942871094e-05, 3.5375356674194336e-05, 3.701448440551758e-05, 3.865361213684082e-05, 4.029273986816406e-05, 4.1931867599487305e-05, 4.357099533081055e-05, 4.521012306213379e-05, 4.684925079345703e-05, 4.8488378524780273e-05, 5.0127506256103516e-05, 5.176663398742676e-05, 5.340576171875e-05, 5.504488945007324e-05, 5.6684017181396484e-05, 5.8323144912719727e-05, 5.996227264404297e-05, 6.160140037536621e-05, 6.324052810668945e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 10.0, 4.0, 15.0, 18.0, 21.0, 39.0, 47.0, 65.0, 104.0, 170.0, 335.0, 627.0, 1488.0, 3738.0, 12848.0, 117029.0, 819553.0, 76319.0, 10476.0, 3071.0, 1246.0, 573.0, 270.0, 156.0, 99.0, 73.0, 33.0, 35.0, 17.0, 15.0, 13.0, 7.0, 7.0, 10.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1064453125, -0.10326099395751953, -0.10007667541503906, -0.0968923568725586, -0.09370803833007812, -0.09052371978759766, -0.08733940124511719, -0.08415508270263672, -0.08097076416015625, -0.07778644561767578, -0.07460212707519531, -0.07141780853271484, -0.06823348999023438, -0.0650491714477539, -0.06186485290527344, -0.05868053436279297, -0.0554962158203125, -0.05231189727783203, -0.04912757873535156, -0.045943260192871094, -0.042758941650390625, -0.039574623107910156, -0.03639030456542969, -0.03320598602294922, -0.03002166748046875, -0.02683734893798828, -0.023653030395507812, -0.020468711853027344, -0.017284393310546875, -0.014100074768066406, -0.010915756225585938, -0.007731437683105469, -0.004547119140625, -0.0013628005981445312, 0.0018215179443359375, 0.005005836486816406, 0.008190155029296875, 0.011374473571777344, 0.014558792114257812, 0.01774311065673828, 0.02092742919921875, 0.02411174774169922, 0.027296066284179688, 0.030480384826660156, 0.033664703369140625, 0.036849021911621094, 0.04003334045410156, 0.04321765899658203, 0.0464019775390625, 0.04958629608154297, 0.05277061462402344, 0.055954933166503906, 0.059139251708984375, 0.062323570251464844, 0.06550788879394531, 0.06869220733642578, 0.07187652587890625, 0.07506084442138672, 0.07824516296386719, 0.08142948150634766, 0.08461380004882812, 0.0877981185913086, 0.09098243713378906, 0.09416675567626953, 0.09735107421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 2.0, 0.0, 6.0, 5.0, 5.0, 13.0, 16.0, 19.0, 37.0, 40.0, 51.0, 62.0, 76.0, 113.0, 92.0, 92.0, 88.0, 71.0, 63.0, 30.0, 38.0, 22.0, 14.0, 10.0, 5.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08599853515625, -0.08277416229248047, -0.07954978942871094, -0.0763254165649414, -0.07310104370117188, -0.06987667083740234, -0.06665229797363281, -0.06342792510986328, -0.06020355224609375, -0.05697917938232422, -0.05375480651855469, -0.050530433654785156, -0.047306060791015625, -0.044081687927246094, -0.04085731506347656, -0.03763294219970703, -0.0344085693359375, -0.03118419647216797, -0.027959823608398438, -0.024735450744628906, -0.021511077880859375, -0.018286705017089844, -0.015062332153320312, -0.011837959289550781, -0.00861358642578125, -0.005389213562011719, -0.0021648406982421875, 0.0010595321655273438, 0.004283905029296875, 0.007508277893066406, 0.010732650756835938, 0.013957023620605469, 0.017181396484375, 0.02040576934814453, 0.023630142211914062, 0.026854515075683594, 0.030078887939453125, 0.033303260803222656, 0.03652763366699219, 0.03975200653076172, 0.04297637939453125, 0.04620075225830078, 0.04942512512207031, 0.052649497985839844, 0.055873870849609375, 0.059098243713378906, 0.06232261657714844, 0.06554698944091797, 0.0687713623046875, 0.07199573516845703, 0.07522010803222656, 0.0784444808959961, 0.08166885375976562, 0.08489322662353516, 0.08811759948730469, 0.09134197235107422, 0.09456634521484375, 0.09779071807861328, 0.10101509094238281, 0.10423946380615234, 0.10746383666992188, 0.1106882095336914, 0.11391258239746094, 0.11713695526123047, 0.120361328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 8.0, 11.0, 33.0, 63.0, 128.0, 219.0, 200.0, 173.0, 76.0, 45.0, 13.0, 6.0, 11.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.728104829788208, -1.6668163537979126, -1.6055278778076172, -1.5442395210266113, -1.482951045036316, -1.4216625690460205, -1.360374093055725, -1.2990856170654297, -1.2377972602844238, -1.1765087842941284, -1.115220308303833, -1.0539319515228271, -0.9926434755325317, -0.9313549995422363, -0.8700665235519409, -0.8087780475616455, -0.7474895715713501, -0.6862010955810547, -0.624912679195404, -0.5636242032051086, -0.502335786819458, -0.4410473108291626, -0.3797588348388672, -0.31847038865089417, -0.25718194246292114, -0.19589349627494812, -0.1346050351858139, -0.07331657409667969, -0.012028127908706665, 0.04926031827926636, 0.11054879426956177, 0.1718372404575348, 0.2331256866455078, 0.29441413283348083, 0.35570257902145386, 0.41699105501174927, 0.4782795011997223, 0.5395679473876953, 0.6008564233779907, 0.6621448993682861, 0.7234333157539368, 0.7847217917442322, 0.8460102081298828, 0.9072986841201782, 0.9685871601104736, 1.0298755168914795, 1.0911641120910645, 1.1524524688720703, 1.2137409448623657, 1.2750294208526611, 1.3363178968429565, 1.397606372833252, 1.4588947296142578, 1.5201832056045532, 1.5814716815948486, 1.642760157585144, 1.7040486335754395, 1.7653371095657349, 1.8266255855560303, 1.8879139423370361, 1.9492024183273315, 2.010490894317627, 2.071779251098633, 2.1330678462982178, 2.1943562030792236]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 14.0, 10.0, 21.0, 15.0, 19.0, 22.0, 25.0, 28.0, 40.0, 45.0, 52.0, 53.0, 58.0, 62.0, 69.0, 51.0, 63.0, 45.0, 37.0, 30.0, 36.0, 38.0, 23.0, 24.0, 21.0, 20.0, 15.0, 17.0, 14.0, 5.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.066498041152954, -2.0110204219818115, -1.955542802810669, -1.9000651836395264, -1.8445875644683838, -1.7891099452972412, -1.733632206916809, -1.6781545877456665, -1.622676968574524, -1.5671993494033813, -1.5117217302322388, -1.4562441110610962, -1.400766372680664, -1.3452887535095215, -1.289811134338379, -1.2343335151672363, -1.1788558959960938, -1.1233782768249512, -1.0679006576538086, -1.012423038482666, -0.9569453597068787, -0.9014677405357361, -0.8459900617599487, -0.7905124425888062, -0.7350348234176636, -0.679557204246521, -0.6240795850753784, -0.5686019062995911, -0.5131242871284485, -0.4576466679573059, -0.40216901898384094, -0.346691370010376, -0.29121363162994385, -0.23573599755764008, -0.1802583634853363, -0.12478072941303253, -0.06930309534072876, -0.013825476169586182, 0.041652172803878784, 0.09712982177734375, 0.15260744094848633, 0.2080850750207901, 0.26356270909309387, 0.31904035806655884, 0.3745179772377014, 0.429995596408844, 0.48547324538230896, 0.5409508943557739, 0.5964285135269165, 0.6519061326980591, 0.7073837518692017, 0.762861430644989, 0.8183390498161316, 0.8738166689872742, 0.9292943477630615, 0.9847719669342041, 1.0402495861053467, 1.0957272052764893, 1.1512048244476318, 1.2066824436187744, 1.262160062789917, 1.3176376819610596, 1.3731154203414917, 1.4285930395126343, 1.4840706586837769]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 14.0, 13.0, 19.0, 33.0, 32.0, 54.0, 63.0, 89.0, 114.0, 154.0, 246.0, 618.0, 5236.0, 4162781.0, 22934.0, 870.0, 300.0, 176.0, 105.0, 90.0, 64.0, 54.0, 43.0, 39.0, 19.0, 20.0, 13.0, 13.0, 9.0, 7.0, 8.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8193359375, -0.7956924438476562, -0.7720489501953125, -0.7484054565429688, -0.724761962890625, -0.7011184692382812, -0.6774749755859375, -0.6538314819335938, -0.63018798828125, -0.6065444946289062, -0.5829010009765625, -0.5592575073242188, -0.535614013671875, -0.5119705200195312, -0.4883270263671875, -0.46468353271484375, -0.4410400390625, -0.41739654541015625, -0.3937530517578125, -0.37010955810546875, -0.346466064453125, -0.32282257080078125, -0.2991790771484375, -0.27553558349609375, -0.25189208984375, -0.22824859619140625, -0.2046051025390625, -0.18096160888671875, -0.157318115234375, -0.13367462158203125, -0.1100311279296875, -0.08638763427734375, -0.062744140625, -0.03910064697265625, -0.0154571533203125, 0.00818634033203125, 0.031829833984375, 0.05547332763671875, 0.0791168212890625, 0.10276031494140625, 0.12640380859375, 0.15004730224609375, 0.1736907958984375, 0.19733428955078125, 0.220977783203125, 0.24462127685546875, 0.2682647705078125, 0.29190826416015625, 0.3155517578125, 0.33919525146484375, 0.3628387451171875, 0.38648223876953125, 0.410125732421875, 0.43376922607421875, 0.4574127197265625, 0.48105621337890625, 0.50469970703125, 0.5283432006835938, 0.5519866943359375, 0.5756301879882812, 0.599273681640625, 0.6229171752929688, 0.6465606689453125, 0.6702041625976562, 0.69384765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 8.0, 9.0, 19.0, 20.0, 22.0, 30.0, 43.0, 68.0, 68.0, 76.0, 84.0, 94.0, 85.0, 78.0, 63.0, 53.0, 54.0, 40.0, 25.0, 25.0, 19.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.23758316040039062, -0.23200225830078125, -0.22642135620117188, -0.2208404541015625, -0.21525955200195312, -0.20967864990234375, -0.20409774780273438, -0.198516845703125, -0.19293594360351562, -0.18735504150390625, -0.18177413940429688, -0.1761932373046875, -0.17061233520507812, -0.16503143310546875, -0.15945053100585938, -0.15386962890625, -0.14828872680664062, -0.14270782470703125, -0.13712692260742188, -0.1315460205078125, -0.12596511840820312, -0.12038421630859375, -0.11480331420898438, -0.109222412109375, -0.10364151000976562, -0.09806060791015625, -0.09247970581054688, -0.0868988037109375, -0.08131790161132812, -0.07573699951171875, -0.07015609741210938, -0.0645751953125, -0.058994293212890625, -0.05341339111328125, -0.047832489013671875, -0.0422515869140625, -0.036670684814453125, -0.03108978271484375, -0.025508880615234375, -0.019927978515625, -0.014347076416015625, -0.00876617431640625, -0.003185272216796875, 0.0023956298828125, 0.007976531982421875, 0.01355743408203125, 0.019138336181640625, 0.02471923828125, 0.030300140380859375, 0.03588104248046875, 0.041461944580078125, 0.0470428466796875, 0.052623748779296875, 0.05820465087890625, 0.06378555297851562, 0.069366455078125, 0.07494735717773438, 0.08052825927734375, 0.08610916137695312, 0.0916900634765625, 0.09727096557617188, 0.10285186767578125, 0.10843276977539062, 0.114013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 9.0, 14.0, 16.0, 28.0, 38.0, 91.0, 144.0, 309.0, 752.0, 2727.0, 15411.0, 371750.0, 3757211.0, 37793.0, 5735.0, 1335.0, 472.0, 204.0, 113.0, 37.0, 38.0, 22.0, 10.0, 10.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.2789344787597656, -0.27027130126953125, -0.2616081237792969, -0.2529449462890625, -0.24428176879882812, -0.23561859130859375, -0.22695541381835938, -0.218292236328125, -0.20962905883789062, -0.20096588134765625, -0.19230270385742188, -0.1836395263671875, -0.17497634887695312, -0.16631317138671875, -0.15764999389648438, -0.14898681640625, -0.14032363891601562, -0.13166046142578125, -0.12299728393554688, -0.1143341064453125, -0.10567092895507812, -0.09700775146484375, -0.08834457397460938, -0.079681396484375, -0.07101821899414062, -0.06235504150390625, -0.053691864013671875, -0.0450286865234375, -0.036365509033203125, -0.02770233154296875, -0.019039154052734375, -0.0103759765625, -0.001712799072265625, 0.00695037841796875, 0.015613555908203125, 0.0242767333984375, 0.032939910888671875, 0.04160308837890625, 0.050266265869140625, 0.058929443359375, 0.06759262084960938, 0.07625579833984375, 0.08491897583007812, 0.0935821533203125, 0.10224533081054688, 0.11090850830078125, 0.11957168579101562, 0.12823486328125, 0.13689804077148438, 0.14556121826171875, 0.15422439575195312, 0.1628875732421875, 0.17155075073242188, 0.18021392822265625, 0.18887710571289062, 0.197540283203125, 0.20620346069335938, 0.21486663818359375, 0.22352981567382812, 0.2321929931640625, 0.24085617065429688, 0.24951934814453125, 0.2581825256347656, 0.266845703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 9.0, 12.0, 11.0, 25.0, 51.0, 114.0, 436.0, 1818.0, 1183.0, 245.0, 79.0, 26.0, 15.0, 20.0, 12.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.29137420654296875, -0.2822113037109375, -0.27304840087890625, -0.263885498046875, -0.25472259521484375, -0.2455596923828125, -0.23639678955078125, -0.22723388671875, -0.21807098388671875, -0.2089080810546875, -0.19974517822265625, -0.190582275390625, -0.18141937255859375, -0.1722564697265625, -0.16309356689453125, -0.1539306640625, -0.14476776123046875, -0.1356048583984375, -0.12644195556640625, -0.117279052734375, -0.10811614990234375, -0.0989532470703125, -0.08979034423828125, -0.08062744140625, -0.07146453857421875, -0.0623016357421875, -0.05313873291015625, -0.043975830078125, -0.03481292724609375, -0.0256500244140625, -0.01648712158203125, -0.00732421875, 0.00183868408203125, 0.0110015869140625, 0.02016448974609375, 0.029327392578125, 0.03849029541015625, 0.0476531982421875, 0.05681610107421875, 0.06597900390625, 0.07514190673828125, 0.0843048095703125, 0.09346771240234375, 0.102630615234375, 0.11179351806640625, 0.1209564208984375, 0.13011932373046875, 0.1392822265625, 0.14844512939453125, 0.1576080322265625, 0.16677093505859375, 0.175933837890625, 0.18509674072265625, 0.1942596435546875, 0.20342254638671875, 0.21258544921875, 0.22174835205078125, 0.2309112548828125, 0.24007415771484375, 0.249237060546875, 0.25839996337890625, 0.2675628662109375, 0.27672576904296875, 0.285888671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 27.0, 40.0, 89.0, 151.0, 216.0, 196.0, 147.0, 62.0, 28.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7672268152236938, -0.7290539741516113, -0.6908811330795288, -0.6527082920074463, -0.6145354509353638, -0.5763626098632812, -0.5381898283958435, -0.500016987323761, -0.46184414625167847, -0.42367130517959595, -0.3854984641075134, -0.3473256528377533, -0.3091528117656708, -0.27097997069358826, -0.23280714452266693, -0.1946343183517456, -0.15646147727966309, -0.11828864365816116, -0.08011581003665924, -0.04194297641515732, -0.0037701427936553955, 0.034402698278427124, 0.07257552444934845, 0.11074835062026978, 0.1489211916923523, 0.18709403276443481, 0.22526685893535614, 0.26343968510627747, 0.30161252617836, 0.3397853672504425, 0.37795817852020264, 0.41613101959228516, 0.4543037414550781, 0.49247658252716064, 0.5306494235992432, 0.5688222646713257, 0.6069951057434082, 0.6451679468154907, 0.6833407282829285, 0.721513569355011, 0.7596864104270935, 0.797859251499176, 0.8360320925712585, 0.8742049336433411, 0.9123777151107788, 0.9505505561828613, 0.9887233972549438, 1.0268962383270264, 1.0650690793991089, 1.1032419204711914, 1.141414761543274, 1.1795876026153564, 1.217760443687439, 1.2559332847595215, 1.294106125831604, 1.3322789669036865, 1.3704516887664795, 1.408624529838562, 1.4467973709106445, 1.484970211982727, 1.5231430530548096, 1.561315894126892, 1.5994887351989746, 1.6376614570617676, 1.6758344173431396]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 16.0, 13.0, 22.0, 19.0, 24.0, 19.0, 48.0, 42.0, 51.0, 55.0, 60.0, 46.0, 68.0, 64.0, 50.0, 63.0, 47.0, 50.0, 39.0, 39.0, 31.0, 22.0, 19.0, 22.0, 12.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6847864985466003, -0.6613394618034363, -0.6378924250602722, -0.6144454479217529, -0.5909984111785889, -0.5675513744354248, -0.5441043376922607, -0.5206573009490967, -0.497210294008255, -0.47376325726509094, -0.45031625032424927, -0.4268692135810852, -0.40342217683792114, -0.37997516989707947, -0.3565281331539154, -0.33308112621307373, -0.30963408946990967, -0.2861870527267456, -0.26274004578590393, -0.23929300904273987, -0.215845987200737, -0.19239896535873413, -0.16895192861557007, -0.1455049067735672, -0.12205788493156433, -0.09861086308956146, -0.075163833796978, -0.05171680450439453, -0.028269782662391663, -0.004822760820388794, 0.01862427592277527, 0.04207129776477814, 0.06551837921142578, 0.08896540105342865, 0.11241243034601212, 0.13585945963859558, 0.15930648148059845, 0.18275350332260132, 0.20620054006576538, 0.22964756190776825, 0.2530945837497711, 0.2765416204929352, 0.29998862743377686, 0.3234356641769409, 0.346882700920105, 0.37032970786094666, 0.3937767446041107, 0.4172237515449524, 0.44067078828811646, 0.4641178250312805, 0.4875648319721222, 0.5110118389129639, 0.5344588756561279, 0.557905912399292, 0.581352949142456, 0.6047999858856201, 0.6282470226287842, 0.6516940593719482, 0.6751410961151123, 0.6985881328582764, 0.7220351099967957, 0.7454821467399597, 0.7689291834831238, 0.7923762202262878, 0.8158231973648071]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 13.0, 10.0, 14.0, 14.0, 34.0, 44.0, 74.0, 104.0, 130.0, 205.0, 335.0, 443.0, 735.0, 1181.0, 2089.0, 4275.0, 8979.0, 22648.0, 64458.0, 191831.0, 382698.0, 236689.0, 81884.0, 27672.0, 11006.0, 4817.0, 2528.0, 1276.0, 821.0, 516.0, 349.0, 199.0, 143.0, 102.0, 65.0, 56.0, 50.0, 25.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.11861324310302734, -0.11460685729980469, -0.11060047149658203, -0.10659408569335938, -0.10258769989013672, -0.09858131408691406, -0.0945749282836914, -0.09056854248046875, -0.0865621566772461, -0.08255577087402344, -0.07854938507080078, -0.07454299926757812, -0.07053661346435547, -0.06653022766113281, -0.06252384185791016, -0.0585174560546875, -0.054511070251464844, -0.05050468444824219, -0.04649829864501953, -0.042491912841796875, -0.03848552703857422, -0.03447914123535156, -0.030472755432128906, -0.02646636962890625, -0.022459983825683594, -0.018453598022460938, -0.014447212219238281, -0.010440826416015625, -0.006434440612792969, -0.0024280548095703125, 0.0015783309936523438, 0.005584716796875, 0.009591102600097656, 0.013597488403320312, 0.01760387420654297, 0.021610260009765625, 0.02561664581298828, 0.029623031616210938, 0.033629417419433594, 0.03763580322265625, 0.041642189025878906, 0.04564857482910156, 0.04965496063232422, 0.053661346435546875, 0.05766773223876953, 0.06167411804199219, 0.06568050384521484, 0.0696868896484375, 0.07369327545166016, 0.07769966125488281, 0.08170604705810547, 0.08571243286132812, 0.08971881866455078, 0.09372520446777344, 0.0977315902709961, 0.10173797607421875, 0.1057443618774414, 0.10975074768066406, 0.11375713348388672, 0.11776351928710938, 0.12176990509033203, 0.1257762908935547, 0.12978267669677734, 0.1337890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 14.0, 13.0, 14.0, 13.0, 21.0, 27.0, 16.0, 35.0, 38.0, 49.0, 56.0, 53.0, 55.0, 56.0, 61.0, 64.0, 59.0, 42.0, 38.0, 42.0, 39.0, 36.0, 31.0, 27.0, 15.0, 26.0, 10.0, 14.0, 10.0, 3.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12298583984375, -0.11921977996826172, -0.11545372009277344, -0.11168766021728516, -0.10792160034179688, -0.1041555404663086, -0.10038948059082031, -0.09662342071533203, -0.09285736083984375, -0.08909130096435547, -0.08532524108886719, -0.0815591812133789, -0.07779312133789062, -0.07402706146240234, -0.07026100158691406, -0.06649494171142578, -0.0627288818359375, -0.05896282196044922, -0.05519676208496094, -0.051430702209472656, -0.047664642333984375, -0.043898582458496094, -0.04013252258300781, -0.03636646270751953, -0.03260040283203125, -0.02883434295654297, -0.025068283081054688, -0.021302223205566406, -0.017536163330078125, -0.013770103454589844, -0.010004043579101562, -0.006237983703613281, -0.002471923828125, 0.0012941360473632812, 0.0050601959228515625, 0.008826255798339844, 0.012592315673828125, 0.016358375549316406, 0.020124435424804688, 0.02389049530029297, 0.02765655517578125, 0.03142261505126953, 0.03518867492675781, 0.038954734802246094, 0.042720794677734375, 0.046486854553222656, 0.05025291442871094, 0.05401897430419922, 0.0577850341796875, 0.06155109405517578, 0.06531715393066406, 0.06908321380615234, 0.07284927368164062, 0.0766153335571289, 0.08038139343261719, 0.08414745330810547, 0.08791351318359375, 0.09167957305908203, 0.09544563293457031, 0.0992116928100586, 0.10297775268554688, 0.10674381256103516, 0.11050987243652344, 0.11427593231201172, 0.1180419921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 9.0, 12.0, 25.0, 53.0, 88.0, 189.0, 534.0, 1543.0, 12218.0, 745987.0, 279809.0, 6230.0, 1094.0, 395.0, 180.0, 79.0, 40.0, 22.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.48668670654296875, -0.4714202880859375, -0.45615386962890625, -0.440887451171875, -0.42562103271484375, -0.4103546142578125, -0.39508819580078125, -0.37982177734375, -0.36455535888671875, -0.3492889404296875, -0.33402252197265625, -0.318756103515625, -0.30348968505859375, -0.2882232666015625, -0.27295684814453125, -0.2576904296875, -0.24242401123046875, -0.2271575927734375, -0.21189117431640625, -0.196624755859375, -0.18135833740234375, -0.1660919189453125, -0.15082550048828125, -0.13555908203125, -0.12029266357421875, -0.1050262451171875, -0.08975982666015625, -0.074493408203125, -0.05922698974609375, -0.0439605712890625, -0.02869415283203125, -0.013427734375, 0.00183868408203125, 0.0171051025390625, 0.03237152099609375, 0.047637939453125, 0.06290435791015625, 0.0781707763671875, 0.09343719482421875, 0.10870361328125, 0.12397003173828125, 0.1392364501953125, 0.15450286865234375, 0.169769287109375, 0.18503570556640625, 0.2003021240234375, 0.21556854248046875, 0.2308349609375, 0.24610137939453125, 0.2613677978515625, 0.27663421630859375, 0.291900634765625, 0.30716705322265625, 0.3224334716796875, 0.33769989013671875, 0.35296630859375, 0.36823272705078125, 0.3834991455078125, 0.39876556396484375, 0.414031982421875, 0.42929840087890625, 0.4445648193359375, 0.45983123779296875, 0.47509765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 7.0, 7.0, 11.0, 14.0, 16.0, 28.0, 28.0, 34.0, 33.0, 44.0, 46.0, 52.0, 45.0, 51.0, 50.0, 57.0, 52.0, 58.0, 44.0, 49.0, 43.0, 39.0, 25.0, 27.0, 23.0, 20.0, 24.0, 14.0, 15.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3258781433105469, -0.31362152099609375, -0.3013648986816406, -0.2891082763671875, -0.2768516540527344, -0.26459503173828125, -0.2523384094238281, -0.240081787109375, -0.22782516479492188, -0.21556854248046875, -0.20331192016601562, -0.1910552978515625, -0.17879867553710938, -0.16654205322265625, -0.15428543090820312, -0.14202880859375, -0.12977218627929688, -0.11751556396484375, -0.10525894165039062, -0.0930023193359375, -0.08074569702148438, -0.06848907470703125, -0.056232452392578125, -0.043975830078125, -0.031719207763671875, -0.01946258544921875, -0.007205963134765625, 0.0050506591796875, 0.017307281494140625, 0.02956390380859375, 0.041820526123046875, 0.0540771484375, 0.06633377075195312, 0.07859039306640625, 0.09084701538085938, 0.1031036376953125, 0.11536026000976562, 0.12761688232421875, 0.13987350463867188, 0.152130126953125, 0.16438674926757812, 0.17664337158203125, 0.18889999389648438, 0.2011566162109375, 0.21341323852539062, 0.22566986083984375, 0.23792648315429688, 0.25018310546875, 0.2624397277832031, 0.27469635009765625, 0.2869529724121094, 0.2992095947265625, 0.3114662170410156, 0.32372283935546875, 0.3359794616699219, 0.348236083984375, 0.3604927062988281, 0.37274932861328125, 0.3850059509277344, 0.3972625732421875, 0.4095191955566406, 0.42177581787109375, 0.4340324401855469, 0.4462890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 9.0, 10.0, 14.0, 19.0, 15.0, 32.0, 61.0, 118.0, 209.0, 568.0, 1444.0, 5924.0, 84547.0, 919813.0, 30148.0, 3730.0, 1055.0, 393.0, 193.0, 95.0, 56.0, 21.0, 20.0, 24.0, 4.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.1871929168701172, -0.18102645874023438, -0.17486000061035156, -0.16869354248046875, -0.16252708435058594, -0.15636062622070312, -0.1501941680908203, -0.1440277099609375, -0.1378612518310547, -0.13169479370117188, -0.12552833557128906, -0.11936187744140625, -0.11319541931152344, -0.10702896118164062, -0.10086250305175781, -0.094696044921875, -0.08852958679199219, -0.08236312866210938, -0.07619667053222656, -0.07003021240234375, -0.06386375427246094, -0.057697296142578125, -0.05153083801269531, -0.0453643798828125, -0.03919792175292969, -0.033031463623046875, -0.026865005493164062, -0.02069854736328125, -0.014532089233398438, -0.008365631103515625, -0.0021991729736328125, 0.00396728515625, 0.010133743286132812, 0.016300201416015625, 0.022466659545898438, 0.02863311767578125, 0.03479957580566406, 0.040966033935546875, 0.04713249206542969, 0.0532989501953125, 0.05946540832519531, 0.06563186645507812, 0.07179832458496094, 0.07796478271484375, 0.08413124084472656, 0.09029769897460938, 0.09646415710449219, 0.102630615234375, 0.10879707336425781, 0.11496353149414062, 0.12112998962402344, 0.12729644775390625, 0.13346290588378906, 0.13962936401367188, 0.1457958221435547, 0.1519622802734375, 0.1581287384033203, 0.16429519653320312, 0.17046165466308594, 0.17662811279296875, 0.18279457092285156, 0.18896102905273438, 0.1951274871826172, 0.2012939453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 12.0, 11.0, 9.0, 12.0, 17.0, 24.0, 27.0, 48.0, 63.0, 92.0, 113.0, 128.0, 107.0, 75.0, 55.0, 54.0, 19.0, 21.0, 18.0, 10.0, 12.0, 11.0, 8.0, 10.0, 7.0, 1.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.267692565917969e-05, -4.1171908378601074e-05, -3.966689109802246e-05, -3.816187381744385e-05, -3.6656856536865234e-05, -3.515183925628662e-05, -3.364682197570801e-05, -3.2141804695129395e-05, -3.063678741455078e-05, -2.9131770133972168e-05, -2.7626752853393555e-05, -2.612173557281494e-05, -2.4616718292236328e-05, -2.3111701011657715e-05, -2.16066837310791e-05, -2.0101666450500488e-05, -1.8596649169921875e-05, -1.7091631889343262e-05, -1.558661460876465e-05, -1.4081597328186035e-05, -1.2576580047607422e-05, -1.1071562767028809e-05, -9.566545486450195e-06, -8.061528205871582e-06, -6.556510925292969e-06, -5.0514936447143555e-06, -3.546476364135742e-06, -2.041459083557129e-06, -5.364418029785156e-07, 9.685754776000977e-07, 2.473592758178711e-06, 3.978610038757324e-06, 5.4836273193359375e-06, 6.988644599914551e-06, 8.493661880493164e-06, 9.998679161071777e-06, 1.150369644165039e-05, 1.3008713722229004e-05, 1.4513731002807617e-05, 1.601874828338623e-05, 1.7523765563964844e-05, 1.9028782844543457e-05, 2.053380012512207e-05, 2.2038817405700684e-05, 2.3543834686279297e-05, 2.504885196685791e-05, 2.6553869247436523e-05, 2.8058886528015137e-05, 2.956390380859375e-05, 3.106892108917236e-05, 3.2573938369750977e-05, 3.407895565032959e-05, 3.55839729309082e-05, 3.7088990211486816e-05, 3.859400749206543e-05, 4.009902477264404e-05, 4.1604042053222656e-05, 4.310905933380127e-05, 4.461407661437988e-05, 4.6119093894958496e-05, 4.762411117553711e-05, 4.912912845611572e-05, 5.0634145736694336e-05, 5.213916301727295e-05, 5.364418029785156e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 14.0, 13.0, 17.0, 22.0, 28.0, 55.0, 92.0, 168.0, 271.0, 508.0, 1148.0, 3082.0, 11838.0, 81626.0, 695092.0, 221694.0, 24401.0, 5216.0, 1719.0, 687.0, 318.0, 197.0, 109.0, 75.0, 46.0, 32.0, 26.0, 15.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1024169921875, -0.09937858581542969, -0.09634017944335938, -0.09330177307128906, -0.09026336669921875, -0.08722496032714844, -0.08418655395507812, -0.08114814758300781, -0.0781097412109375, -0.07507133483886719, -0.07203292846679688, -0.06899452209472656, -0.06595611572265625, -0.06291770935058594, -0.059879302978515625, -0.05684089660644531, -0.053802490234375, -0.05076408386230469, -0.047725677490234375, -0.04468727111816406, -0.04164886474609375, -0.03861045837402344, -0.035572052001953125, -0.03253364562988281, -0.0294952392578125, -0.026456832885742188, -0.023418426513671875, -0.020380020141601562, -0.01734161376953125, -0.014303207397460938, -0.011264801025390625, -0.008226394653320312, -0.00518798828125, -0.0021495819091796875, 0.000888824462890625, 0.0039272308349609375, 0.00696563720703125, 0.010004043579101562, 0.013042449951171875, 0.016080856323242188, 0.0191192626953125, 0.022157669067382812, 0.025196075439453125, 0.028234481811523438, 0.03127288818359375, 0.03431129455566406, 0.037349700927734375, 0.04038810729980469, 0.043426513671875, 0.04646492004394531, 0.049503326416015625, 0.05254173278808594, 0.05558013916015625, 0.05861854553222656, 0.061656951904296875, 0.06469535827636719, 0.0677337646484375, 0.07077217102050781, 0.07381057739257812, 0.07684898376464844, 0.07988739013671875, 0.08292579650878906, 0.08596420288085938, 0.08900260925292969, 0.092041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 9.0, 6.0, 13.0, 20.0, 17.0, 28.0, 44.0, 50.0, 83.0, 83.0, 107.0, 112.0, 104.0, 91.0, 78.0, 48.0, 36.0, 20.0, 17.0, 20.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.15040969848632812, -0.14640045166015625, -0.14239120483398438, -0.1383819580078125, -0.13437271118164062, -0.13036346435546875, -0.12635421752929688, -0.122344970703125, -0.11833572387695312, -0.11432647705078125, -0.11031723022460938, -0.1063079833984375, -0.10229873657226562, -0.09828948974609375, -0.09428024291992188, -0.09027099609375, -0.08626174926757812, -0.08225250244140625, -0.07824325561523438, -0.0742340087890625, -0.07022476196289062, -0.06621551513671875, -0.062206268310546875, -0.058197021484375, -0.054187774658203125, -0.05017852783203125, -0.046169281005859375, -0.0421600341796875, -0.038150787353515625, -0.03414154052734375, -0.030132293701171875, -0.026123046875, -0.022113800048828125, -0.01810455322265625, -0.014095306396484375, -0.0100860595703125, -0.006076812744140625, -0.00206756591796875, 0.001941680908203125, 0.005950927734375, 0.009960174560546875, 0.01396942138671875, 0.017978668212890625, 0.0219879150390625, 0.025997161865234375, 0.03000640869140625, 0.034015655517578125, 0.03802490234375, 0.042034149169921875, 0.04604339599609375, 0.050052642822265625, 0.0540618896484375, 0.058071136474609375, 0.06208038330078125, 0.06608963012695312, 0.070098876953125, 0.07410812377929688, 0.07811737060546875, 0.08212661743164062, 0.0861358642578125, 0.09014511108398438, 0.09415435791015625, 0.09816360473632812, 0.1021728515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 12.0, 42.0, 133.0, 327.0, 335.0, 103.0, 28.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.97115159034729, -3.8614532947540283, -3.7517549991607666, -3.642056465148926, -3.532358169555664, -3.4226598739624023, -3.3129615783691406, -3.203263282775879, -3.093564987182617, -2.9838666915893555, -2.8741683959960938, -2.764470100402832, -2.654771566390991, -2.5450732707977295, -2.4353749752044678, -2.325676679611206, -2.2159781455993652, -2.1062798500061035, -1.9965814352035522, -1.8868831396102905, -1.7771847248077393, -1.6674864292144775, -1.5577881336212158, -1.448089838027954, -1.3383914232254028, -1.2286931276321411, -1.1189947128295898, -1.0092964172363281, -0.8995980620384216, -0.7898997068405151, -0.6802014112472534, -0.5705030560493469, -0.46080493927001953, -0.35110658407211304, -0.24140825867652893, -0.13170993328094482, -0.02201157808303833, 0.08768677711486816, 0.19738507270812988, 0.3070834279060364, 0.41678178310394287, 0.5264801383018494, 0.6361784934997559, 0.7458767890930176, 0.8555751442909241, 0.9652734994888306, 1.0749717950820923, 1.1846702098846436, 1.2943685054779053, 1.404066801071167, 1.5137652158737183, 1.62346351146698, 1.7331619262695312, 1.842860221862793, 1.9525585174560547, 2.0622568130493164, 2.171955108642578, 2.28165340423584, 2.3913516998291016, 2.5010499954223633, 2.610748529434204, 2.720446825027466, 2.8301451206207275, 2.9398434162139893, 3.04954195022583]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 13.0, 12.0, 16.0, 19.0, 17.0, 27.0, 25.0, 32.0, 43.0, 36.0, 46.0, 62.0, 61.0, 79.0, 55.0, 70.0, 61.0, 40.0, 36.0, 45.0, 31.0, 46.0, 31.0, 21.0, 14.0, 14.0, 10.0, 7.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1596269607543945, -2.102816581726074, -2.046006202697754, -1.9891958236694336, -1.9323853254318237, -1.8755749464035034, -1.818764567375183, -1.7619541883468628, -1.705143690109253, -1.6483333110809326, -1.5915229320526123, -1.534712553024292, -1.4779020547866821, -1.4210916757583618, -1.3642812967300415, -1.3074709177017212, -1.2506605386734009, -1.1938501596450806, -1.1370397806167603, -1.0802292823791504, -1.02341890335083, -0.9666085243225098, -0.9097981452941895, -0.8529877662658691, -0.796177327632904, -0.7393669486045837, -0.6825565099716187, -0.6257461309432983, -0.568935751914978, -0.5121253132820129, -0.4553149342536926, -0.3985045254230499, -0.3416941165924072, -0.2848837077617645, -0.22807331383228302, -0.1712629199028015, -0.11445251107215881, -0.05764210224151611, -0.0008317232131958008, 0.0559786856174469, 0.1127890944480896, 0.1695995032787323, 0.2264098972082138, 0.2832202911376953, 0.340030699968338, 0.3968411087989807, 0.453651487827301, 0.5104619264602661, 0.5672723054885864, 0.6240826845169067, 0.6808931231498718, 0.7377035021781921, 0.7945139408111572, 0.8513243198394775, 0.9081346988677979, 0.9649450778961182, 1.0217554569244385, 1.0785658359527588, 1.135376214981079, 1.1921865940093994, 1.2489970922470093, 1.3058074712753296, 1.36261785030365, 1.4194282293319702, 1.47623872756958]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 19.0, 11.0, 12.0, 42.0, 41.0, 44.0, 71.0, 97.0, 161.0, 248.0, 389.0, 761.0, 1925.0, 5772.0, 31786.0, 670293.0, 3325494.0, 134805.0, 15242.0, 4037.0, 1514.0, 634.0, 287.0, 172.0, 120.0, 76.0, 56.0, 40.0, 30.0, 16.0, 19.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18359375, -0.17790603637695312, -0.17221832275390625, -0.16653060913085938, -0.1608428955078125, -0.15515518188476562, -0.14946746826171875, -0.14377975463867188, -0.138092041015625, -0.13240432739257812, -0.12671661376953125, -0.12102890014648438, -0.1153411865234375, -0.10965347290039062, -0.10396575927734375, -0.09827804565429688, -0.09259033203125, -0.08690261840820312, -0.08121490478515625, -0.07552719116210938, -0.0698394775390625, -0.06415176391601562, -0.05846405029296875, -0.052776336669921875, -0.047088623046875, -0.041400909423828125, -0.03571319580078125, -0.030025482177734375, -0.0243377685546875, -0.018650054931640625, -0.01296234130859375, -0.007274627685546875, -0.0015869140625, 0.004100799560546875, 0.00978851318359375, 0.015476226806640625, 0.0211639404296875, 0.026851654052734375, 0.03253936767578125, 0.038227081298828125, 0.043914794921875, 0.049602508544921875, 0.05529022216796875, 0.060977935791015625, 0.0666656494140625, 0.07235336303710938, 0.07804107666015625, 0.08372879028320312, 0.08941650390625, 0.09510421752929688, 0.10079193115234375, 0.10647964477539062, 0.1121673583984375, 0.11785507202148438, 0.12354278564453125, 0.12923049926757812, 0.134918212890625, 0.14060592651367188, 0.14629364013671875, 0.15198135375976562, 0.1576690673828125, 0.16335678100585938, 0.16904449462890625, 0.17473220825195312, 0.180419921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 12.0, 10.0, 20.0, 23.0, 37.0, 38.0, 58.0, 79.0, 92.0, 104.0, 103.0, 108.0, 70.0, 69.0, 44.0, 38.0, 28.0, 33.0, 17.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2685546875, -0.26274871826171875, -0.2569427490234375, -0.25113677978515625, -0.245330810546875, -0.23952484130859375, -0.2337188720703125, -0.22791290283203125, -0.22210693359375, -0.21630096435546875, -0.2104949951171875, -0.20468902587890625, -0.198883056640625, -0.19307708740234375, -0.1872711181640625, -0.18146514892578125, -0.1756591796875, -0.16985321044921875, -0.1640472412109375, -0.15824127197265625, -0.152435302734375, -0.14662933349609375, -0.1408233642578125, -0.13501739501953125, -0.12921142578125, -0.12340545654296875, -0.1175994873046875, -0.11179351806640625, -0.105987548828125, -0.10018157958984375, -0.0943756103515625, -0.08856964111328125, -0.082763671875, -0.07695770263671875, -0.0711517333984375, -0.06534576416015625, -0.059539794921875, -0.05373382568359375, -0.0479278564453125, -0.04212188720703125, -0.03631591796875, -0.03050994873046875, -0.0247039794921875, -0.01889801025390625, -0.013092041015625, -0.00728607177734375, -0.0014801025390625, 0.00432586669921875, 0.0101318359375, 0.01593780517578125, 0.0217437744140625, 0.02754974365234375, 0.033355712890625, 0.03916168212890625, 0.0449676513671875, 0.05077362060546875, 0.05657958984375, 0.06238555908203125, 0.0681915283203125, 0.07399749755859375, 0.079803466796875, 0.08560943603515625, 0.0914154052734375, 0.09722137451171875, 0.10302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 13.0, 11.0, 19.0, 21.0, 27.0, 36.0, 76.0, 122.0, 189.0, 370.0, 894.0, 2475.0, 8909.0, 43807.0, 638513.0, 3361160.0, 109522.0, 19186.0, 5291.0, 1843.0, 788.0, 404.0, 219.0, 125.0, 74.0, 51.0, 33.0, 25.0, 17.0, 12.0, 7.0, 10.0, 6.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.187744140625, -0.181915283203125, -0.17608642578125, -0.170257568359375, -0.1644287109375, -0.158599853515625, -0.15277099609375, -0.146942138671875, -0.14111328125, -0.135284423828125, -0.12945556640625, -0.123626708984375, -0.1177978515625, -0.111968994140625, -0.10614013671875, -0.100311279296875, -0.094482421875, -0.088653564453125, -0.08282470703125, -0.076995849609375, -0.0711669921875, -0.065338134765625, -0.05950927734375, -0.053680419921875, -0.0478515625, -0.042022705078125, -0.03619384765625, -0.030364990234375, -0.0245361328125, -0.018707275390625, -0.01287841796875, -0.007049560546875, -0.001220703125, 0.004608154296875, 0.01043701171875, 0.016265869140625, 0.0220947265625, 0.027923583984375, 0.03375244140625, 0.039581298828125, 0.04541015625, 0.051239013671875, 0.05706787109375, 0.062896728515625, 0.0687255859375, 0.074554443359375, 0.08038330078125, 0.086212158203125, 0.092041015625, 0.097869873046875, 0.10369873046875, 0.109527587890625, 0.1153564453125, 0.121185302734375, 0.12701416015625, 0.132843017578125, 0.138671875, 0.144500732421875, 0.15032958984375, 0.156158447265625, 0.1619873046875, 0.167816162109375, 0.17364501953125, 0.179473876953125, 0.185302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 10.0, 15.0, 16.0, 13.0, 33.0, 37.0, 61.0, 105.0, 230.0, 609.0, 1042.0, 912.0, 432.0, 192.0, 102.0, 58.0, 51.0, 41.0, 20.0, 19.0, 17.0, 13.0, 5.0, 9.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16594314575195312, -0.15927886962890625, -0.15261459350585938, -0.1459503173828125, -0.13928604125976562, -0.13262176513671875, -0.12595748901367188, -0.119293212890625, -0.11262893676757812, -0.10596466064453125, -0.09930038452148438, -0.0926361083984375, -0.08597183227539062, -0.07930755615234375, -0.07264328002929688, -0.06597900390625, -0.059314727783203125, -0.05265045166015625, -0.045986175537109375, -0.0393218994140625, -0.032657623291015625, -0.02599334716796875, -0.019329071044921875, -0.012664794921875, -0.006000518798828125, 0.00066375732421875, 0.007328033447265625, 0.0139923095703125, 0.020656585693359375, 0.02732086181640625, 0.033985137939453125, 0.0406494140625, 0.047313690185546875, 0.05397796630859375, 0.060642242431640625, 0.0673065185546875, 0.07397079467773438, 0.08063507080078125, 0.08729934692382812, 0.093963623046875, 0.10062789916992188, 0.10729217529296875, 0.11395645141601562, 0.1206207275390625, 0.12728500366210938, 0.13394927978515625, 0.14061355590820312, 0.14727783203125, 0.15394210815429688, 0.16060638427734375, 0.16727066040039062, 0.1739349365234375, 0.18059921264648438, 0.18726348876953125, 0.19392776489257812, 0.200592041015625, 0.20725631713867188, 0.21392059326171875, 0.22058486938476562, 0.2272491455078125, 0.23391342163085938, 0.24057769775390625, 0.24724197387695312, 0.25390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 18.0, 41.0, 94.0, 210.0, 268.0, 197.0, 91.0, 43.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014565944671631, -1.9520026445388794, -1.8894392251968384, -1.826875925064087, -1.764312505722046, -1.7017492055892944, -1.639185905456543, -1.576622486114502, -1.514059066772461, -1.4514957666397095, -1.3889323472976685, -1.326369047164917, -1.263805627822876, -1.2012423276901245, -1.138679027557373, -1.076115608215332, -1.0135523080825806, -0.9509889483451843, -0.8884255886077881, -0.8258622884750366, -0.7632988691329956, -0.7007355690002441, -0.6381722092628479, -0.5756088495254517, -0.5130454897880554, -0.4504821300506592, -0.38791877031326294, -0.3253554403781891, -0.26279208064079285, -0.2002287209033966, -0.13766539096832275, -0.07510203123092651, -0.012538790702819824, 0.05002456158399582, 0.11258791387081146, 0.1751512587070465, 0.23771461844444275, 0.300277978181839, 0.36284130811691284, 0.4254046678543091, 0.4879680275917053, 0.5505313873291016, 0.6130947470664978, 0.675658106803894, 0.7382214069366455, 0.8007848262786865, 0.863348126411438, 0.9259114861488342, 0.9884748458862305, 1.051038146018982, 1.113601565361023, 1.1761648654937744, 1.2387282848358154, 1.301291584968567, 1.3638548851013184, 1.4264183044433594, 1.4889817237854004, 1.5515450239181519, 1.6141084432601929, 1.6766717433929443, 1.7392351627349854, 1.8017984628677368, 1.8643617630004883, 1.9269251823425293, 1.9894884824752808]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 5.0, 4.0, 9.0, 8.0, 12.0, 16.0, 23.0, 24.0, 22.0, 46.0, 46.0, 47.0, 58.0, 67.0, 61.0, 74.0, 58.0, 63.0, 56.0, 56.0, 55.0, 44.0, 38.0, 24.0, 24.0, 23.0, 8.0, 15.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7212209105491638, -0.6860234141349792, -0.6508259177207947, -0.6156283617019653, -0.5804308652877808, -0.5452333688735962, -0.5100358724594116, -0.47483837604522705, -0.4396408498287201, -0.4044433534145355, -0.36924582719802856, -0.334048330783844, -0.2988508343696594, -0.26365330815315247, -0.2284558117389679, -0.19325830042362213, -0.15806078910827637, -0.1228632777929306, -0.08766577392816544, -0.05246827006340027, -0.017270758748054504, 0.01792675256729126, 0.05312424898147583, 0.0883217602968216, 0.12351927161216736, 0.15871678292751312, 0.1939142942428589, 0.22911179065704346, 0.264309287071228, 0.299506813287735, 0.33470430970191956, 0.3699018359184265, 0.40509939193725586, 0.44029688835144043, 0.4754944145679474, 0.5106918811798096, 0.5458894371986389, 0.5810869336128235, 0.6162844300270081, 0.6514819264411926, 0.686679482460022, 0.7218769788742065, 0.7570744752883911, 0.7922719717025757, 0.827469527721405, 0.8626670241355896, 0.8978645205497742, 0.9330620169639587, 0.9682595133781433, 1.0034570693969727, 1.0386545658111572, 1.0738520622253418, 1.1090495586395264, 1.144247055053711, 1.1794445514678955, 1.21464204788208, 1.2498395442962646, 1.2850370407104492, 1.3202345371246338, 1.3554320335388184, 1.390629529953003, 1.4258270263671875, 1.461024522781372, 1.4962221384048462, 1.5314196348190308]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 13.0, 19.0, 31.0, 34.0, 43.0, 57.0, 91.0, 148.0, 269.0, 371.0, 512.0, 827.0, 1328.0, 2168.0, 3888.0, 6837.0, 12653.0, 24614.0, 49564.0, 100206.0, 182891.0, 243787.0, 194956.0, 109760.0, 55021.0, 26907.0, 13635.0, 7287.0, 4193.0, 2400.0, 1413.0, 925.0, 553.0, 388.0, 252.0, 154.0, 103.0, 64.0, 52.0, 39.0, 24.0, 14.0, 16.0, 11.0, 6.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.069091796875, -0.06690311431884766, -0.06471443176269531, -0.06252574920654297, -0.060337066650390625, -0.05814838409423828, -0.05595970153808594, -0.053771018981933594, -0.05158233642578125, -0.049393653869628906, -0.04720497131347656, -0.04501628875732422, -0.042827606201171875, -0.04063892364501953, -0.03845024108886719, -0.036261558532714844, -0.0340728759765625, -0.031884193420410156, -0.029695510864257812, -0.02750682830810547, -0.025318145751953125, -0.02312946319580078, -0.020940780639648438, -0.018752098083496094, -0.01656341552734375, -0.014374732971191406, -0.012186050415039062, -0.009997367858886719, -0.007808685302734375, -0.005620002746582031, -0.0034313201904296875, -0.0012426376342773438, 0.000946044921875, 0.0031347274780273438, 0.0053234100341796875, 0.007512092590332031, 0.009700775146484375, 0.011889457702636719, 0.014078140258789062, 0.016266822814941406, 0.01845550537109375, 0.020644187927246094, 0.022832870483398438, 0.02502155303955078, 0.027210235595703125, 0.02939891815185547, 0.03158760070800781, 0.033776283264160156, 0.0359649658203125, 0.038153648376464844, 0.04034233093261719, 0.04253101348876953, 0.044719696044921875, 0.04690837860107422, 0.04909706115722656, 0.051285743713378906, 0.05347442626953125, 0.055663108825683594, 0.05785179138183594, 0.06004047393798828, 0.062229156494140625, 0.06441783905029297, 0.06660652160644531, 0.06879520416259766, 0.07098388671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 19.0, 13.0, 13.0, 26.0, 23.0, 30.0, 35.0, 30.0, 43.0, 42.0, 50.0, 58.0, 67.0, 61.0, 48.0, 57.0, 68.0, 42.0, 48.0, 40.0, 20.0, 15.0, 27.0, 17.0, 14.0, 9.0, 25.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.115234375, -0.11187267303466797, -0.10851097106933594, -0.1051492691040039, -0.10178756713867188, -0.09842586517333984, -0.09506416320800781, -0.09170246124267578, -0.08834075927734375, -0.08497905731201172, -0.08161735534667969, -0.07825565338134766, -0.07489395141601562, -0.0715322494506836, -0.06817054748535156, -0.06480884552001953, -0.0614471435546875, -0.05808544158935547, -0.05472373962402344, -0.051362037658691406, -0.048000335693359375, -0.044638633728027344, -0.04127693176269531, -0.03791522979736328, -0.03455352783203125, -0.03119182586669922, -0.027830123901367188, -0.024468421936035156, -0.021106719970703125, -0.017745018005371094, -0.014383316040039062, -0.011021614074707031, -0.007659912109375, -0.004298210144042969, -0.0009365081787109375, 0.0024251937866210938, 0.005786895751953125, 0.009148597717285156, 0.012510299682617188, 0.01587200164794922, 0.01923370361328125, 0.02259540557861328, 0.025957107543945312, 0.029318809509277344, 0.032680511474609375, 0.036042213439941406, 0.03940391540527344, 0.04276561737060547, 0.0461273193359375, 0.04948902130126953, 0.05285072326660156, 0.056212425231933594, 0.059574127197265625, 0.06293582916259766, 0.06629753112792969, 0.06965923309326172, 0.07302093505859375, 0.07638263702392578, 0.07974433898925781, 0.08310604095458984, 0.08646774291992188, 0.0898294448852539, 0.09319114685058594, 0.09655284881591797, 0.09991455078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 4.0, 14.0, 24.0, 40.0, 31.0, 39.0, 64.0, 99.0, 107.0, 166.0, 221.0, 308.0, 507.0, 830.0, 1842.0, 7054.0, 75239.0, 860427.0, 89399.0, 7765.0, 1901.0, 843.0, 525.0, 295.0, 224.0, 162.0, 97.0, 90.0, 47.0, 51.0, 25.0, 28.0, 15.0, 15.0, 16.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.3304176330566406, -0.32025909423828125, -0.3101005554199219, -0.2999420166015625, -0.2897834777832031, -0.27962493896484375, -0.2694664001464844, -0.259307861328125, -0.24914932250976562, -0.23899078369140625, -0.22883224487304688, -0.2186737060546875, -0.20851516723632812, -0.19835662841796875, -0.18819808959960938, -0.17803955078125, -0.16788101196289062, -0.15772247314453125, -0.14756393432617188, -0.1374053955078125, -0.12724685668945312, -0.11708831787109375, -0.10692977905273438, -0.096771240234375, -0.08661270141601562, -0.07645416259765625, -0.06629562377929688, -0.0561370849609375, -0.045978546142578125, -0.03582000732421875, -0.025661468505859375, -0.0155029296875, -0.005344390869140625, 0.00481414794921875, 0.014972686767578125, 0.0251312255859375, 0.035289764404296875, 0.04544830322265625, 0.055606842041015625, 0.065765380859375, 0.07592391967773438, 0.08608245849609375, 0.09624099731445312, 0.1063995361328125, 0.11655807495117188, 0.12671661376953125, 0.13687515258789062, 0.14703369140625, 0.15719223022460938, 0.16735076904296875, 0.17750930786132812, 0.1876678466796875, 0.19782638549804688, 0.20798492431640625, 0.21814346313476562, 0.228302001953125, 0.23846054077148438, 0.24861907958984375, 0.2587776184082031, 0.2689361572265625, 0.2790946960449219, 0.28925323486328125, 0.2994117736816406, 0.3095703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 15.0, 4.0, 10.0, 15.0, 18.0, 16.0, 18.0, 28.0, 31.0, 39.0, 59.0, 50.0, 41.0, 59.0, 60.0, 51.0, 67.0, 63.0, 47.0, 59.0, 44.0, 34.0, 39.0, 31.0, 24.0, 12.0, 12.0, 10.0, 10.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5546875, -0.5394172668457031, -0.5241470336914062, -0.5088768005371094, -0.4936065673828125, -0.4783363342285156, -0.46306610107421875, -0.4477958679199219, -0.432525634765625, -0.4172554016113281, -0.40198516845703125, -0.3867149353027344, -0.3714447021484375, -0.3561744689941406, -0.34090423583984375, -0.3256340026855469, -0.31036376953125, -0.2950935363769531, -0.27982330322265625, -0.2645530700683594, -0.2492828369140625, -0.23401260375976562, -0.21874237060546875, -0.20347213745117188, -0.188201904296875, -0.17293167114257812, -0.15766143798828125, -0.14239120483398438, -0.1271209716796875, -0.11185073852539062, -0.09658050537109375, -0.08131027221679688, -0.0660400390625, -0.050769805908203125, -0.03549957275390625, -0.020229339599609375, -0.0049591064453125, 0.010311126708984375, 0.02558135986328125, 0.040851593017578125, 0.056121826171875, 0.07139205932617188, 0.08666229248046875, 0.10193252563476562, 0.1172027587890625, 0.13247299194335938, 0.14774322509765625, 0.16301345825195312, 0.17828369140625, 0.19355392456054688, 0.20882415771484375, 0.22409439086914062, 0.2393646240234375, 0.2546348571777344, 0.26990509033203125, 0.2851753234863281, 0.300445556640625, 0.3157157897949219, 0.33098602294921875, 0.3462562561035156, 0.3615264892578125, 0.3767967224121094, 0.39206695556640625, 0.4073371887207031, 0.422607421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 14.0, 7.0, 16.0, 16.0, 21.0, 36.0, 50.0, 58.0, 100.0, 120.0, 238.0, 354.0, 665.0, 1125.0, 1997.0, 4113.0, 9325.0, 26780.0, 133848.0, 689891.0, 134382.0, 26984.0, 9317.0, 4257.0, 2038.0, 1066.0, 647.0, 396.0, 220.0, 145.0, 95.0, 58.0, 52.0, 36.0, 22.0, 18.0, 8.0, 10.0, 7.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0635986328125, -0.06157970428466797, -0.05956077575683594, -0.057541847229003906, -0.055522918701171875, -0.053503990173339844, -0.05148506164550781, -0.04946613311767578, -0.04744720458984375, -0.04542827606201172, -0.04340934753417969, -0.041390419006347656, -0.039371490478515625, -0.037352561950683594, -0.03533363342285156, -0.03331470489501953, -0.0312957763671875, -0.02927684783935547, -0.027257919311523438, -0.025238990783691406, -0.023220062255859375, -0.021201133728027344, -0.019182205200195312, -0.01716327667236328, -0.01514434814453125, -0.013125419616699219, -0.011106491088867188, -0.009087562561035156, -0.007068634033203125, -0.005049705505371094, -0.0030307769775390625, -0.0010118484497070312, 0.001007080078125, 0.0030260086059570312, 0.0050449371337890625, 0.007063865661621094, 0.009082794189453125, 0.011101722717285156, 0.013120651245117188, 0.015139579772949219, 0.01715850830078125, 0.01917743682861328, 0.021196365356445312, 0.023215293884277344, 0.025234222412109375, 0.027253150939941406, 0.029272079467773438, 0.03129100799560547, 0.0333099365234375, 0.03532886505126953, 0.03734779357910156, 0.039366722106933594, 0.041385650634765625, 0.043404579162597656, 0.04542350769042969, 0.04744243621826172, 0.04946136474609375, 0.05148029327392578, 0.05349922180175781, 0.055518150329589844, 0.057537078857421875, 0.059556007385253906, 0.06157493591308594, 0.06359386444091797, 0.06561279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 3.0, 10.0, 10.0, 21.0, 27.0, 37.0, 49.0, 46.0, 76.0, 112.0, 102.0, 107.0, 108.0, 73.0, 50.0, 36.0, 21.0, 29.0, 10.0, 16.0, 6.0, 8.0, 9.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6597251892089844e-05, -3.492087125778198e-05, -3.324449062347412e-05, -3.156810998916626e-05, -2.98917293548584e-05, -2.8215348720550537e-05, -2.6538968086242676e-05, -2.4862587451934814e-05, -2.3186206817626953e-05, -2.1509826183319092e-05, -1.983344554901123e-05, -1.815706491470337e-05, -1.6480684280395508e-05, -1.4804303646087646e-05, -1.3127923011779785e-05, -1.1451542377471924e-05, -9.775161743164062e-06, -8.098781108856201e-06, -6.42240047454834e-06, -4.7460198402404785e-06, -3.069639205932617e-06, -1.3932585716247559e-06, 2.8312206268310547e-07, 1.959502696990967e-06, 3.635883331298828e-06, 5.3122639656066895e-06, 6.988644599914551e-06, 8.665025234222412e-06, 1.0341405868530273e-05, 1.2017786502838135e-05, 1.3694167137145996e-05, 1.5370547771453857e-05, 1.704692840576172e-05, 1.872330904006958e-05, 2.039968967437744e-05, 2.2076070308685303e-05, 2.3752450942993164e-05, 2.5428831577301025e-05, 2.7105212211608887e-05, 2.8781592845916748e-05, 3.045797348022461e-05, 3.213435411453247e-05, 3.381073474884033e-05, 3.548711538314819e-05, 3.7163496017456055e-05, 3.8839876651763916e-05, 4.051625728607178e-05, 4.219263792037964e-05, 4.38690185546875e-05, 4.554539918899536e-05, 4.722177982330322e-05, 4.8898160457611084e-05, 5.0574541091918945e-05, 5.225092172622681e-05, 5.392730236053467e-05, 5.560368299484253e-05, 5.728006362915039e-05, 5.895644426345825e-05, 6.063282489776611e-05, 6.230920553207397e-05, 6.398558616638184e-05, 6.56619668006897e-05, 6.733834743499756e-05, 6.901472806930542e-05, 7.069110870361328e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 14.0, 16.0, 18.0, 32.0, 34.0, 55.0, 72.0, 121.0, 189.0, 248.0, 436.0, 703.0, 1449.0, 2748.0, 6026.0, 15561.0, 61828.0, 559409.0, 329060.0, 46565.0, 13170.0, 5299.0, 2424.0, 1216.0, 668.0, 363.0, 246.0, 156.0, 104.0, 85.0, 52.0, 28.0, 23.0, 14.0, 20.0, 14.0, 19.0, 4.0, 8.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0587158203125, -0.05675315856933594, -0.054790496826171875, -0.05282783508300781, -0.05086517333984375, -0.04890251159667969, -0.046939849853515625, -0.04497718811035156, -0.0430145263671875, -0.04105186462402344, -0.039089202880859375, -0.03712654113769531, -0.03516387939453125, -0.03320121765136719, -0.031238555908203125, -0.029275894165039062, -0.027313232421875, -0.025350570678710938, -0.023387908935546875, -0.021425247192382812, -0.01946258544921875, -0.017499923706054688, -0.015537261962890625, -0.013574600219726562, -0.0116119384765625, -0.009649276733398438, -0.007686614990234375, -0.0057239532470703125, -0.00376129150390625, -0.0017986297607421875, 0.000164031982421875, 0.0021266937255859375, 0.00408935546875, 0.0060520172119140625, 0.008014678955078125, 0.009977340698242188, 0.01194000244140625, 0.013902664184570312, 0.015865325927734375, 0.017827987670898438, 0.0197906494140625, 0.021753311157226562, 0.023715972900390625, 0.025678634643554688, 0.02764129638671875, 0.029603958129882812, 0.031566619873046875, 0.03352928161621094, 0.035491943359375, 0.03745460510253906, 0.039417266845703125, 0.04137992858886719, 0.04334259033203125, 0.04530525207519531, 0.047267913818359375, 0.04923057556152344, 0.0511932373046875, 0.05315589904785156, 0.055118560791015625, 0.05708122253417969, 0.05904388427734375, 0.06100654602050781, 0.06296920776367188, 0.06493186950683594, 0.06689453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 29.0, 29.0, 25.0, 60.0, 64.0, 68.0, 75.0, 72.0, 76.0, 77.0, 66.0, 52.0, 66.0, 37.0, 41.0, 24.0, 17.0, 10.0, 10.0, 13.0, 7.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059661865234375, -0.0573582649230957, -0.055054664611816406, -0.05275106430053711, -0.05044746398925781, -0.048143863677978516, -0.04584026336669922, -0.04353666305541992, -0.041233062744140625, -0.03892946243286133, -0.03662586212158203, -0.034322261810302734, -0.03201866149902344, -0.02971506118774414, -0.027411460876464844, -0.025107860565185547, -0.02280426025390625, -0.020500659942626953, -0.018197059631347656, -0.01589345932006836, -0.013589859008789062, -0.011286258697509766, -0.008982658386230469, -0.006679058074951172, -0.004375457763671875, -0.002071857452392578, 0.00023174285888671875, 0.0025353431701660156, 0.0048389434814453125, 0.007142543792724609, 0.009446144104003906, 0.011749744415283203, 0.0140533447265625, 0.016356945037841797, 0.018660545349121094, 0.02096414566040039, 0.023267745971679688, 0.025571346282958984, 0.02787494659423828, 0.030178546905517578, 0.032482147216796875, 0.03478574752807617, 0.03708934783935547, 0.039392948150634766, 0.04169654846191406, 0.04400014877319336, 0.046303749084472656, 0.04860734939575195, 0.05091094970703125, 0.05321455001831055, 0.055518150329589844, 0.05782175064086914, 0.06012535095214844, 0.062428951263427734, 0.06473255157470703, 0.06703615188598633, 0.06933975219726562, 0.07164335250854492, 0.07394695281982422, 0.07625055313110352, 0.07855415344238281, 0.08085775375366211, 0.0831613540649414, 0.0854649543762207, 0.0877685546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 9.0, 44.0, 153.0, 492.0, 237.0, 42.0, 16.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28227424621582, -5.1458940505981445, -5.009513854980469, -4.873133659362793, -4.736753463745117, -4.600373268127441, -4.463993072509766, -4.327612400054932, -4.191232204437256, -4.05485200881958, -3.9184718132019043, -3.7820916175842285, -3.6457111835479736, -3.509330987930298, -3.372950792312622, -3.2365705966949463, -3.1001904010772705, -2.9638102054595947, -2.827430009841919, -2.691049575805664, -2.5546693801879883, -2.4182891845703125, -2.2819089889526367, -2.145528793334961, -2.009148597717285, -1.8727684020996094, -1.736388087272644, -1.6000078916549683, -1.463627576828003, -1.3272473812103271, -1.1908671855926514, -1.0544869899749756, -0.9181063175201416, -0.781726062297821, -0.6453458070755005, -0.5089656114578247, -0.37258535623550415, -0.2362051010131836, -0.09982490539550781, 0.036555349826812744, 0.1729356050491333, 0.30931586027145386, 0.445696085691452, 0.5820763111114502, 0.7184565663337708, 0.8548368215560913, 0.9912170171737671, 1.1275973320007324, 1.2639775276184082, 1.400357723236084, 1.5367380380630493, 1.673118233680725, 1.8094985485076904, 1.9458787441253662, 2.082258939743042, 2.2186391353607178, 2.3550195693969727, 2.4913997650146484, 2.627779960632324, 2.76416015625, 2.900540590286255, 3.0369207859039307, 3.1733009815216064, 3.3096811771392822, 3.446061372756958]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 6.0, 4.0, 9.0, 12.0, 10.0, 24.0, 23.0, 21.0, 31.0, 21.0, 35.0, 46.0, 32.0, 51.0, 64.0, 76.0, 66.0, 56.0, 53.0, 39.0, 42.0, 39.0, 33.0, 31.0, 28.0, 19.0, 19.0, 16.0, 14.0, 19.0, 10.0, 8.0, 7.0, 5.0, 8.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3647549152374268, -1.3149229288101196, -1.2650909423828125, -1.2152589559555054, -1.1654269695281982, -1.1155951023101807, -1.0657631158828735, -1.0159311294555664, -0.9660991430282593, -0.9162671566009521, -0.866435170173645, -0.8166032433509827, -0.7667712569236755, -0.7169392704963684, -0.667107343673706, -0.6172753572463989, -0.5674433708190918, -0.5176113843917847, -0.4677794277667999, -0.4179474711418152, -0.36811548471450806, -0.3182834982872009, -0.2684515416622162, -0.21861958503723145, -0.16878759860992432, -0.11895562708377838, -0.06912365555763245, -0.01929168403148651, 0.030540287494659424, 0.08037225902080536, 0.1302042305469513, 0.18003618717193604, 0.2298680543899536, 0.27970004081726074, 0.3295319974422455, 0.3793639540672302, 0.42919594049453735, 0.4790279269218445, 0.5288598537445068, 0.578691840171814, 0.6285238265991211, 0.6783558130264282, 0.7281877994537354, 0.7780197262763977, 0.8278517127037048, 0.877683699131012, 0.9275156259536743, 0.9773476123809814, 1.0271795988082886, 1.0770115852355957, 1.1268435716629028, 1.17667555809021, 1.2265074253082275, 1.2763394117355347, 1.3261713981628418, 1.376003384590149, 1.425835371017456, 1.4756673574447632, 1.5254993438720703, 1.5753313302993774, 1.6251633167266846, 1.6749951839447021, 1.7248271703720093, 1.7746591567993164, 1.8244911432266235]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 19.0, 24.0, 45.0, 72.0, 118.0, 180.0, 320.0, 638.0, 1331.0, 3576.0, 12619.0, 70933.0, 761820.0, 2830092.0, 449841.0, 47231.0, 10051.0, 2975.0, 1092.0, 549.0, 279.0, 176.0, 102.0, 68.0, 42.0, 26.0, 18.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.140380859375, -0.13690567016601562, -0.13343048095703125, -0.12995529174804688, -0.1264801025390625, -0.12300491333007812, -0.11952972412109375, -0.11605453491210938, -0.112579345703125, -0.10910415649414062, -0.10562896728515625, -0.10215377807617188, -0.0986785888671875, -0.09520339965820312, -0.09172821044921875, -0.08825302124023438, -0.08477783203125, -0.08130264282226562, -0.07782745361328125, -0.07435226440429688, -0.0708770751953125, -0.06740188598632812, -0.06392669677734375, -0.060451507568359375, -0.056976318359375, -0.053501129150390625, -0.05002593994140625, -0.046550750732421875, -0.0430755615234375, -0.039600372314453125, -0.03612518310546875, -0.032649993896484375, -0.0291748046875, -0.025699615478515625, -0.02222442626953125, -0.018749237060546875, -0.0152740478515625, -0.011798858642578125, -0.00832366943359375, -0.004848480224609375, -0.001373291015625, 0.002101898193359375, 0.00557708740234375, 0.009052276611328125, 0.0125274658203125, 0.016002655029296875, 0.01947784423828125, 0.022953033447265625, 0.02642822265625, 0.029903411865234375, 0.03337860107421875, 0.036853790283203125, 0.0403289794921875, 0.043804168701171875, 0.04727935791015625, 0.050754547119140625, 0.054229736328125, 0.057704925537109375, 0.06118011474609375, 0.06465530395507812, 0.0681304931640625, 0.07160568237304688, 0.07508087158203125, 0.07855606079101562, 0.08203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 8.0, 10.0, 16.0, 17.0, 19.0, 23.0, 30.0, 30.0, 48.0, 47.0, 51.0, 53.0, 49.0, 57.0, 61.0, 68.0, 53.0, 54.0, 44.0, 55.0, 37.0, 24.0, 23.0, 20.0, 24.0, 19.0, 17.0, 9.0, 5.0, 8.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1279296875, -0.12450313568115234, -0.12107658386230469, -0.11765003204345703, -0.11422348022460938, -0.11079692840576172, -0.10737037658691406, -0.1039438247680664, -0.10051727294921875, -0.0970907211303711, -0.09366416931152344, -0.09023761749267578, -0.08681106567382812, -0.08338451385498047, -0.07995796203613281, -0.07653141021728516, -0.0731048583984375, -0.06967830657958984, -0.06625175476074219, -0.06282520294189453, -0.059398651123046875, -0.05597209930419922, -0.05254554748535156, -0.049118995666503906, -0.04569244384765625, -0.042265892028808594, -0.03883934020996094, -0.03541278839111328, -0.031986236572265625, -0.02855968475341797, -0.025133132934570312, -0.021706581115722656, -0.018280029296875, -0.014853477478027344, -0.011426925659179688, -0.008000373840332031, -0.004573822021484375, -0.0011472702026367188, 0.0022792816162109375, 0.005705833435058594, 0.00913238525390625, 0.012558937072753906, 0.015985488891601562, 0.01941204071044922, 0.022838592529296875, 0.02626514434814453, 0.029691696166992188, 0.033118247985839844, 0.0365447998046875, 0.039971351623535156, 0.04339790344238281, 0.04682445526123047, 0.050251007080078125, 0.05367755889892578, 0.05710411071777344, 0.060530662536621094, 0.06395721435546875, 0.0673837661743164, 0.07081031799316406, 0.07423686981201172, 0.07766342163085938, 0.08108997344970703, 0.08451652526855469, 0.08794307708740234, 0.09136962890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 19.0, 30.0, 42.0, 62.0, 116.0, 210.0, 491.0, 1380.0, 5966.0, 46306.0, 2637082.0, 1453441.0, 39236.0, 6631.0, 1760.0, 638.0, 333.0, 193.0, 105.0, 90.0, 51.0, 24.0, 19.0, 13.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18220138549804688, -0.17543792724609375, -0.16867446899414062, -0.1619110107421875, -0.15514755249023438, -0.14838409423828125, -0.14162063598632812, -0.134857177734375, -0.12809371948242188, -0.12133026123046875, -0.11456680297851562, -0.1078033447265625, -0.10103988647460938, -0.09427642822265625, -0.08751296997070312, -0.08074951171875, -0.07398605346679688, -0.06722259521484375, -0.060459136962890625, -0.0536956787109375, -0.046932220458984375, -0.04016876220703125, -0.033405303955078125, -0.026641845703125, -0.019878387451171875, -0.01311492919921875, -0.006351470947265625, 0.0004119873046875, 0.007175445556640625, 0.01393890380859375, 0.020702362060546875, 0.0274658203125, 0.034229278564453125, 0.04099273681640625, 0.047756195068359375, 0.0545196533203125, 0.061283111572265625, 0.06804656982421875, 0.07481002807617188, 0.081573486328125, 0.08833694458007812, 0.09510040283203125, 0.10186386108398438, 0.1086273193359375, 0.11539077758789062, 0.12215423583984375, 0.12891769409179688, 0.13568115234375, 0.14244461059570312, 0.14920806884765625, 0.15597152709960938, 0.1627349853515625, 0.16949844360351562, 0.17626190185546875, 0.18302536010742188, 0.189788818359375, 0.19655227661132812, 0.20331573486328125, 0.21007919311523438, 0.2168426513671875, 0.22360610961914062, 0.23036956787109375, 0.23713302612304688, 0.243896484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 17.0, 18.0, 41.0, 49.0, 89.0, 188.0, 493.0, 987.0, 1059.0, 549.0, 245.0, 107.0, 69.0, 45.0, 28.0, 15.0, 12.0, 8.0, 10.0, 8.0, 3.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1968994140625, -0.18987464904785156, -0.18284988403320312, -0.1758251190185547, -0.16880035400390625, -0.1617755889892578, -0.15475082397460938, -0.14772605895996094, -0.1407012939453125, -0.13367652893066406, -0.12665176391601562, -0.11962699890136719, -0.11260223388671875, -0.10557746887207031, -0.09855270385742188, -0.09152793884277344, -0.084503173828125, -0.07747840881347656, -0.07045364379882812, -0.06342887878417969, -0.05640411376953125, -0.04937934875488281, -0.042354583740234375, -0.03532981872558594, -0.0283050537109375, -0.021280288696289062, -0.014255523681640625, -0.0072307586669921875, -0.00020599365234375, 0.0068187713623046875, 0.013843536376953125, 0.020868301391601562, 0.02789306640625, 0.03491783142089844, 0.041942596435546875, 0.04896736145019531, 0.05599212646484375, 0.06301689147949219, 0.07004165649414062, 0.07706642150878906, 0.0840911865234375, 0.09111595153808594, 0.09814071655273438, 0.10516548156738281, 0.11219024658203125, 0.11921501159667969, 0.12623977661132812, 0.13326454162597656, 0.140289306640625, 0.14731407165527344, 0.15433883666992188, 0.1613636016845703, 0.16838836669921875, 0.1754131317138672, 0.18243789672851562, 0.18946266174316406, 0.1964874267578125, 0.20351219177246094, 0.21053695678710938, 0.2175617218017578, 0.22458648681640625, 0.2316112518310547, 0.23863601684570312, 0.24566078186035156, 0.252685546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 18.0, 49.0, 148.0, 243.0, 263.0, 149.0, 58.0, 24.0, 10.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.006287097930908, -2.943056344985962, -2.8798258304595947, -2.8165950775146484, -2.7533645629882812, -2.690133810043335, -2.6269030570983887, -2.5636725425720215, -2.500441789627075, -2.437211036682129, -2.3739805221557617, -2.3107497692108154, -2.247519016265869, -2.184288501739502, -2.1210577487945557, -2.0578272342681885, -1.9945964813232422, -1.9313658475875854, -1.8681352138519287, -1.8049044609069824, -1.7416738271713257, -1.678443193435669, -1.6152124404907227, -1.551981806755066, -1.4887511730194092, -1.4255205392837524, -1.3622899055480957, -1.2990591526031494, -1.2358285188674927, -1.172597885131836, -1.1093671321868896, -1.046136498451233, -0.9829059839248657, -0.919675350189209, -0.8564446568489075, -0.793213963508606, -0.7299833297729492, -0.6667526960372925, -0.603522002696991, -0.5402913093566895, -0.4770606756210327, -0.4138300120830536, -0.35059934854507446, -0.28736868500709534, -0.2241380214691162, -0.16090735793113708, -0.09767669439315796, -0.03444603085517883, 0.028784632682800293, 0.09201529622077942, 0.15524595975875854, 0.21847662329673767, 0.2817072868347168, 0.3449379503726959, 0.40816861391067505, 0.4713992774486542, 0.5346299409866333, 0.59786057472229, 0.6610912680625916, 0.7243219614028931, 0.7875525951385498, 0.8507832288742065, 0.9140139222145081, 0.9772446155548096, 1.0404752492904663]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 12.0, 8.0, 14.0, 16.0, 18.0, 26.0, 22.0, 32.0, 35.0, 45.0, 52.0, 53.0, 38.0, 45.0, 55.0, 50.0, 57.0, 55.0, 38.0, 37.0, 48.0, 32.0, 29.0, 27.0, 21.0, 18.0, 26.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7946150898933411, -0.7675920724868774, -0.7405691146850586, -0.713546097278595, -0.6865230798721313, -0.6595000624656677, -0.6324770450592041, -0.6054540872573853, -0.5784310698509216, -0.551408052444458, -0.5243850946426392, -0.49736207723617554, -0.4703390598297119, -0.4433160424232483, -0.41629305481910706, -0.3892700672149658, -0.3622470498085022, -0.3352240324020386, -0.30820104479789734, -0.2811780571937561, -0.2541550397872925, -0.22713203728199005, -0.20010903477668762, -0.1730860322713852, -0.14606302976608276, -0.11904002726078033, -0.0920170247554779, -0.06499402225017548, -0.03797101974487305, -0.010948017239570618, 0.01607498526573181, 0.04309798777103424, 0.0701209306716919, 0.09714393317699432, 0.12416693568229675, 0.15118993818759918, 0.1782129406929016, 0.20523594319820404, 0.23225894570350647, 0.2592819333076477, 0.28630495071411133, 0.31332796812057495, 0.3403509557247162, 0.3673739433288574, 0.39439696073532104, 0.42141997814178467, 0.4484429657459259, 0.47546595335006714, 0.5024889707565308, 0.5295119881629944, 0.556535005569458, 0.5835579633712769, 0.6105809807777405, 0.6376039981842041, 0.664626955986023, 0.6916499733924866, 0.7186729907989502, 0.7456960082054138, 0.7727190256118774, 0.7997419834136963, 0.8267650008201599, 0.8537880182266235, 0.8808109760284424, 0.907833993434906, 0.9348570108413696]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 10.0, 7.0, 5.0, 11.0, 22.0, 27.0, 33.0, 62.0, 79.0, 115.0, 166.0, 236.0, 390.0, 629.0, 924.0, 1544.0, 2423.0, 4066.0, 6855.0, 11802.0, 20516.0, 35765.0, 61733.0, 103554.0, 163118.0, 202800.0, 168355.0, 109053.0, 64756.0, 37061.0, 21510.0, 12348.0, 7173.0, 4289.0, 2537.0, 1621.0, 1047.0, 620.0, 439.0, 297.0, 178.0, 133.0, 64.0, 63.0, 39.0, 15.0, 19.0, 16.0, 8.0, 13.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.06524658203125, -0.06330156326293945, -0.061356544494628906, -0.05941152572631836, -0.05746650695800781, -0.055521488189697266, -0.05357646942138672, -0.05163145065307617, -0.049686431884765625, -0.04774141311645508, -0.04579639434814453, -0.043851375579833984, -0.04190635681152344, -0.03996133804321289, -0.038016319274902344, -0.0360713005065918, -0.03412628173828125, -0.0321812629699707, -0.030236244201660156, -0.02829122543334961, -0.026346206665039062, -0.024401187896728516, -0.02245616912841797, -0.020511150360107422, -0.018566131591796875, -0.016621112823486328, -0.014676094055175781, -0.012731075286865234, -0.010786056518554688, -0.00884103775024414, -0.006896018981933594, -0.004951000213623047, -0.0030059814453125, -0.0010609626770019531, 0.0008840560913085938, 0.0028290748596191406, 0.0047740936279296875, 0.006719112396240234, 0.008664131164550781, 0.010609149932861328, 0.012554168701171875, 0.014499187469482422, 0.01644420623779297, 0.018389225006103516, 0.020334243774414062, 0.02227926254272461, 0.024224281311035156, 0.026169300079345703, 0.02811431884765625, 0.030059337615966797, 0.032004356384277344, 0.03394937515258789, 0.03589439392089844, 0.037839412689208984, 0.03978443145751953, 0.04172945022583008, 0.043674468994140625, 0.04561948776245117, 0.04756450653076172, 0.049509525299072266, 0.05145454406738281, 0.05339956283569336, 0.055344581604003906, 0.05728960037231445, 0.059234619140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 4.0, 13.0, 11.0, 17.0, 19.0, 28.0, 30.0, 36.0, 50.0, 34.0, 60.0, 42.0, 59.0, 68.0, 62.0, 55.0, 60.0, 64.0, 57.0, 35.0, 34.0, 25.0, 34.0, 24.0, 23.0, 10.0, 18.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1268310546875, -0.12324714660644531, -0.11966323852539062, -0.11607933044433594, -0.11249542236328125, -0.10891151428222656, -0.10532760620117188, -0.10174369812011719, -0.0981597900390625, -0.09457588195800781, -0.09099197387695312, -0.08740806579589844, -0.08382415771484375, -0.08024024963378906, -0.07665634155273438, -0.07307243347167969, -0.069488525390625, -0.06590461730957031, -0.062320709228515625, -0.05873680114746094, -0.05515289306640625, -0.05156898498535156, -0.047985076904296875, -0.04440116882324219, -0.0408172607421875, -0.03723335266113281, -0.033649444580078125, -0.030065536499023438, -0.02648162841796875, -0.022897720336914062, -0.019313812255859375, -0.015729904174804688, -0.01214599609375, -0.008562088012695312, -0.004978179931640625, -0.0013942718505859375, 0.00218963623046875, 0.0057735443115234375, 0.009357452392578125, 0.012941360473632812, 0.0165252685546875, 0.020109176635742188, 0.023693084716796875, 0.027276992797851562, 0.03086090087890625, 0.03444480895996094, 0.038028717041015625, 0.04161262512207031, 0.045196533203125, 0.04878044128417969, 0.052364349365234375, 0.05594825744628906, 0.05953216552734375, 0.06311607360839844, 0.06669998168945312, 0.07028388977050781, 0.0738677978515625, 0.07745170593261719, 0.08103561401367188, 0.08461952209472656, 0.08820343017578125, 0.09178733825683594, 0.09537124633789062, 0.09895515441894531, 0.1025390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 9.0, 16.0, 15.0, 21.0, 31.0, 54.0, 73.0, 94.0, 128.0, 175.0, 230.0, 384.0, 540.0, 1078.0, 2311.0, 9678.0, 104328.0, 812785.0, 101916.0, 9664.0, 2266.0, 1013.0, 542.0, 346.0, 216.0, 194.0, 111.0, 77.0, 60.0, 50.0, 46.0, 24.0, 21.0, 9.0, 12.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2614860534667969, -0.25197601318359375, -0.24246597290039062, -0.2329559326171875, -0.22344589233398438, -0.21393585205078125, -0.20442581176757812, -0.194915771484375, -0.18540573120117188, -0.17589569091796875, -0.16638565063476562, -0.1568756103515625, -0.14736557006835938, -0.13785552978515625, -0.12834548950195312, -0.11883544921875, -0.10932540893554688, -0.09981536865234375, -0.09030532836914062, -0.0807952880859375, -0.07128524780273438, -0.06177520751953125, -0.052265167236328125, -0.042755126953125, -0.033245086669921875, -0.02373504638671875, -0.014225006103515625, -0.0047149658203125, 0.004795074462890625, 0.01430511474609375, 0.023815155029296875, 0.0333251953125, 0.042835235595703125, 0.05234527587890625, 0.061855316162109375, 0.0713653564453125, 0.08087539672851562, 0.09038543701171875, 0.09989547729492188, 0.109405517578125, 0.11891555786132812, 0.12842559814453125, 0.13793563842773438, 0.1474456787109375, 0.15695571899414062, 0.16646575927734375, 0.17597579956054688, 0.18548583984375, 0.19499588012695312, 0.20450592041015625, 0.21401596069335938, 0.2235260009765625, 0.23303604125976562, 0.24254608154296875, 0.2520561218261719, 0.261566162109375, 0.2710762023925781, 0.28058624267578125, 0.2900962829589844, 0.2996063232421875, 0.3091163635253906, 0.31862640380859375, 0.3281364440917969, 0.337646484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 12.0, 11.0, 17.0, 21.0, 14.0, 21.0, 30.0, 29.0, 34.0, 47.0, 43.0, 43.0, 59.0, 55.0, 60.0, 57.0, 50.0, 60.0, 53.0, 35.0, 37.0, 38.0, 31.0, 21.0, 16.0, 21.0, 12.0, 12.0, 9.0, 8.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.281829833984375, -0.26947021484375, -0.257110595703125, -0.2447509765625, -0.232391357421875, -0.22003173828125, -0.207672119140625, -0.1953125, -0.182952880859375, -0.17059326171875, -0.158233642578125, -0.1458740234375, -0.133514404296875, -0.12115478515625, -0.108795166015625, -0.096435546875, -0.084075927734375, -0.07171630859375, -0.059356689453125, -0.0469970703125, -0.034637451171875, -0.02227783203125, -0.009918212890625, 0.00244140625, 0.014801025390625, 0.02716064453125, 0.039520263671875, 0.0518798828125, 0.064239501953125, 0.07659912109375, 0.088958740234375, 0.101318359375, 0.113677978515625, 0.12603759765625, 0.138397216796875, 0.1507568359375, 0.163116455078125, 0.17547607421875, 0.187835693359375, 0.2001953125, 0.212554931640625, 0.22491455078125, 0.237274169921875, 0.2496337890625, 0.261993408203125, 0.27435302734375, 0.286712646484375, 0.299072265625, 0.311431884765625, 0.32379150390625, 0.336151123046875, 0.3485107421875, 0.360870361328125, 0.37322998046875, 0.385589599609375, 0.39794921875, 0.410308837890625, 0.42266845703125, 0.435028076171875, 0.4473876953125, 0.459747314453125, 0.47210693359375, 0.484466552734375, 0.496826171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 16.0, 16.0, 23.0, 27.0, 37.0, 51.0, 97.0, 123.0, 256.0, 453.0, 888.0, 1817.0, 4407.0, 13150.0, 53313.0, 318406.0, 559332.0, 70364.0, 16373.0, 5218.0, 1991.0, 906.0, 505.0, 287.0, 171.0, 101.0, 67.0, 36.0, 38.0, 22.0, 14.0, 15.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06888961791992188, -0.06667327880859375, -0.06445693969726562, -0.0622406005859375, -0.060024261474609375, -0.05780792236328125, -0.055591583251953125, -0.053375244140625, -0.051158905029296875, -0.04894256591796875, -0.046726226806640625, -0.0445098876953125, -0.042293548583984375, -0.04007720947265625, -0.037860870361328125, -0.03564453125, -0.033428192138671875, -0.03121185302734375, -0.028995513916015625, -0.0267791748046875, -0.024562835693359375, -0.02234649658203125, -0.020130157470703125, -0.017913818359375, -0.015697479248046875, -0.01348114013671875, -0.011264801025390625, -0.0090484619140625, -0.006832122802734375, -0.00461578369140625, -0.002399444580078125, -0.00018310546875, 0.002033233642578125, 0.00424957275390625, 0.006465911865234375, 0.0086822509765625, 0.010898590087890625, 0.01311492919921875, 0.015331268310546875, 0.017547607421875, 0.019763946533203125, 0.02198028564453125, 0.024196624755859375, 0.0264129638671875, 0.028629302978515625, 0.03084564208984375, 0.033061981201171875, 0.0352783203125, 0.037494659423828125, 0.03971099853515625, 0.041927337646484375, 0.0441436767578125, 0.046360015869140625, 0.04857635498046875, 0.050792694091796875, 0.053009033203125, 0.055225372314453125, 0.05744171142578125, 0.059658050537109375, 0.0618743896484375, 0.06409072875976562, 0.06630706787109375, 0.06852340698242188, 0.07073974609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 0.0, 2.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 6.0, 10.0, 10.0, 7.0, 14.0, 20.0, 30.0, 28.0, 26.0, 53.0, 69.0, 78.0, 95.0, 101.0, 83.0, 79.0, 62.0, 45.0, 26.0, 27.0, 16.0, 17.0, 16.0, 12.0, 3.0, 6.0, 8.0, 7.0, 7.0, 3.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -5.0661154091358185e-05, -4.904903471469879e-05, -4.74369153380394e-05, -4.5824795961380005e-05, -4.421267658472061e-05, -4.260055720806122e-05, -4.0988437831401825e-05, -3.937631845474243e-05, -3.776419907808304e-05, -3.6152079701423645e-05, -3.453996032476425e-05, -3.292784094810486e-05, -3.1315721571445465e-05, -2.9703602194786072e-05, -2.809148281812668e-05, -2.6479363441467285e-05, -2.4867244064807892e-05, -2.32551246881485e-05, -2.1643005311489105e-05, -2.0030885934829712e-05, -1.841876655817032e-05, -1.6806647181510925e-05, -1.5194527804851532e-05, -1.3582408428192139e-05, -1.1970289051532745e-05, -1.0358169674873352e-05, -8.746050298213959e-06, -7.1339309215545654e-06, -5.521811544895172e-06, -3.909692168235779e-06, -2.2975727915763855e-06, -6.854534149169922e-07, 9.266659617424011e-07, 2.5387853384017944e-06, 4.150904715061188e-06, 5.763024091720581e-06, 7.375143468379974e-06, 8.987262845039368e-06, 1.0599382221698761e-05, 1.2211501598358154e-05, 1.3823620975017548e-05, 1.543574035167694e-05, 1.7047859728336334e-05, 1.8659979104995728e-05, 2.027209848165512e-05, 2.1884217858314514e-05, 2.3496337234973907e-05, 2.51084566116333e-05, 2.6720575988292694e-05, 2.8332695364952087e-05, 2.994481474161148e-05, 3.1556934118270874e-05, 3.316905349493027e-05, 3.478117287158966e-05, 3.6393292248249054e-05, 3.800541162490845e-05, 3.961753100156784e-05, 4.1229650378227234e-05, 4.284176975488663e-05, 4.445388913154602e-05, 4.6066008508205414e-05, 4.767812788486481e-05, 4.92902472615242e-05, 5.0902366638183594e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 2.0, 7.0, 9.0, 7.0, 6.0, 14.0, 27.0, 34.0, 49.0, 72.0, 143.0, 223.0, 438.0, 764.0, 1438.0, 3576.0, 11125.0, 52283.0, 510219.0, 399832.0, 50749.0, 10896.0, 3473.0, 1470.0, 668.0, 416.0, 222.0, 134.0, 75.0, 50.0, 44.0, 24.0, 17.0, 12.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.083984375, -0.0816507339477539, -0.07931709289550781, -0.07698345184326172, -0.07464981079101562, -0.07231616973876953, -0.06998252868652344, -0.06764888763427734, -0.06531524658203125, -0.06298160552978516, -0.06064796447753906, -0.05831432342529297, -0.055980682373046875, -0.05364704132080078, -0.05131340026855469, -0.048979759216308594, -0.0466461181640625, -0.044312477111816406, -0.04197883605957031, -0.03964519500732422, -0.037311553955078125, -0.03497791290283203, -0.03264427185058594, -0.030310630798339844, -0.02797698974609375, -0.025643348693847656, -0.023309707641601562, -0.02097606658935547, -0.018642425537109375, -0.01630878448486328, -0.013975143432617188, -0.011641502380371094, -0.009307861328125, -0.006974220275878906, -0.0046405792236328125, -0.0023069381713867188, 2.6702880859375e-05, 0.0023603439331054688, 0.0046939849853515625, 0.007027626037597656, 0.00936126708984375, 0.011694908142089844, 0.014028549194335938, 0.01636219024658203, 0.018695831298828125, 0.02102947235107422, 0.023363113403320312, 0.025696754455566406, 0.0280303955078125, 0.030364036560058594, 0.03269767761230469, 0.03503131866455078, 0.037364959716796875, 0.03969860076904297, 0.04203224182128906, 0.044365882873535156, 0.04669952392578125, 0.049033164978027344, 0.05136680603027344, 0.05370044708251953, 0.056034088134765625, 0.05836772918701172, 0.06070137023925781, 0.0630350112915039, 0.06536865234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 8.0, 9.0, 10.0, 18.0, 27.0, 31.0, 49.0, 59.0, 71.0, 59.0, 83.0, 91.0, 97.0, 77.0, 70.0, 57.0, 34.0, 39.0, 24.0, 16.0, 15.0, 7.0, 11.0, 10.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08868408203125, -0.0861978530883789, -0.08371162414550781, -0.08122539520263672, -0.07873916625976562, -0.07625293731689453, -0.07376670837402344, -0.07128047943115234, -0.06879425048828125, -0.06630802154541016, -0.06382179260253906, -0.06133556365966797, -0.058849334716796875, -0.05636310577392578, -0.05387687683105469, -0.051390647888183594, -0.0489044189453125, -0.046418190002441406, -0.04393196105957031, -0.04144573211669922, -0.038959503173828125, -0.03647327423095703, -0.03398704528808594, -0.031500816345214844, -0.02901458740234375, -0.026528358459472656, -0.024042129516601562, -0.02155590057373047, -0.019069671630859375, -0.01658344268798828, -0.014097213745117188, -0.011610984802246094, -0.009124755859375, -0.006638526916503906, -0.0041522979736328125, -0.0016660690307617188, 0.000820159912109375, 0.0033063888549804688, 0.0057926177978515625, 0.008278846740722656, 0.01076507568359375, 0.013251304626464844, 0.015737533569335938, 0.01822376251220703, 0.020709991455078125, 0.02319622039794922, 0.025682449340820312, 0.028168678283691406, 0.0306549072265625, 0.033141136169433594, 0.03562736511230469, 0.03811359405517578, 0.040599822998046875, 0.04308605194091797, 0.04557228088378906, 0.048058509826660156, 0.05054473876953125, 0.053030967712402344, 0.05551719665527344, 0.05800342559814453, 0.060489654541015625, 0.06297588348388672, 0.06546211242675781, 0.0679483413696289, 0.0704345703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 16.0, 37.0, 59.0, 125.0, 194.0, 309.0, 128.0, 54.0, 32.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1691173315048218, -1.1052755117416382, -1.0414338111877441, -0.9775919914245605, -0.9137502908706665, -0.8499084711074829, -0.7860667109489441, -0.7222249507904053, -0.6583831906318665, -0.5945414304733276, -0.5306996703147888, -0.4668578803539276, -0.4030161201953888, -0.33917436003685, -0.27533257007598877, -0.21149080991744995, -0.14764904975891113, -0.08380728214979172, -0.019965514540672302, 0.04387626051902771, 0.10771802067756653, 0.17155978083610535, 0.23540157079696655, 0.29924333095550537, 0.3630850911140442, 0.426926851272583, 0.4907686114311218, 0.5546103715896606, 0.6184521913528442, 0.6822938919067383, 0.7461357116699219, 0.8099774718284607, 0.87381911277771, 0.9376608729362488, 1.0015026330947876, 1.0653444528579712, 1.1291861534118652, 1.1930279731750488, 1.2568697929382324, 1.3207114934921265, 1.3845531940460205, 1.448395013809204, 1.5122367143630981, 1.5760785341262817, 1.6399202346801758, 1.7037620544433594, 1.767603874206543, 1.831445574760437, 1.8952873945236206, 1.9591292142868042, 2.0229709148406982, 2.086812734603882, 2.1506545543670654, 2.21449613571167, 2.2783379554748535, 2.342179775238037, 2.4060215950012207, 2.4698634147644043, 2.533705234527588, 2.5975468158721924, 2.661388635635376, 2.7252304553985596, 2.789072275161743, 2.8529138565063477, 2.9167556762695312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 13.0, 18.0, 10.0, 16.0, 15.0, 21.0, 17.0, 27.0, 34.0, 26.0, 35.0, 30.0, 33.0, 60.0, 77.0, 68.0, 55.0, 41.0, 37.0, 41.0, 39.0, 32.0, 18.0, 21.0, 25.0, 23.0, 19.0, 14.0, 19.0, 13.0, 12.0, 5.0, 4.0, 10.0, 2.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.3760292530059814, -1.334822416305542, -1.2936155796051025, -1.2524088621139526, -1.2112020254135132, -1.1699951887130737, -1.1287884712219238, -1.0875816345214844, -1.046374797821045, -1.0051679611206055, -0.9639611840248108, -0.9227544069290161, -0.8815475702285767, -0.8403407335281372, -0.7991339564323425, -0.7579271793365479, -0.7167203426361084, -0.675513505935669, -0.6343067288398743, -0.5930999517440796, -0.5518931150436401, -0.5106862783432007, -0.469479501247406, -0.42827269434928894, -0.3870658874511719, -0.3458590805530548, -0.30465227365493774, -0.2634454667568207, -0.2222386598587036, -0.18103185296058655, -0.13982504606246948, -0.09861823916435242, -0.05741143226623535, -0.016204625368118286, 0.02500218152999878, 0.06620898842811584, 0.10741579532623291, 0.14862260222434998, 0.18982940912246704, 0.2310362160205841, 0.27224302291870117, 0.31344982981681824, 0.3546566367149353, 0.39586344361305237, 0.43707025051116943, 0.4782770574092865, 0.5194838643074036, 0.5606906414031982, 0.6018974781036377, 0.6431043148040771, 0.6843110918998718, 0.7255178689956665, 0.766724705696106, 0.8079315423965454, 0.8491383194923401, 0.8903450965881348, 0.9315519332885742, 0.9727587699890137, 1.0139656066894531, 1.055172324180603, 1.0963791608810425, 1.137585997581482, 1.1787927150726318, 1.2199995517730713, 1.2612063884735107]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 17.0, 21.0, 31.0, 52.0, 74.0, 96.0, 165.0, 239.0, 403.0, 748.0, 1827.0, 5343.0, 23953.0, 183521.0, 2011857.0, 1784221.0, 151240.0, 21146.0, 5549.0, 1922.0, 764.0, 383.0, 234.0, 153.0, 103.0, 68.0, 38.0, 29.0, 18.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12451171875, -0.12095069885253906, -0.11738967895507812, -0.11382865905761719, -0.11026763916015625, -0.10670661926269531, -0.10314559936523438, -0.09958457946777344, -0.0960235595703125, -0.09246253967285156, -0.08890151977539062, -0.08534049987792969, -0.08177947998046875, -0.07821846008300781, -0.07465744018554688, -0.07109642028808594, -0.067535400390625, -0.06397438049316406, -0.060413360595703125, -0.05685234069824219, -0.05329132080078125, -0.04973030090332031, -0.046169281005859375, -0.04260826110839844, -0.0390472412109375, -0.03548622131347656, -0.031925201416015625, -0.028364181518554688, -0.02480316162109375, -0.021242141723632812, -0.017681121826171875, -0.014120101928710938, -0.01055908203125, -0.0069980621337890625, -0.003437042236328125, 0.0001239776611328125, 0.00368499755859375, 0.0072460174560546875, 0.010807037353515625, 0.014368057250976562, 0.0179290771484375, 0.021490097045898438, 0.025051116943359375, 0.028612136840820312, 0.03217315673828125, 0.03573417663574219, 0.039295196533203125, 0.04285621643066406, 0.046417236328125, 0.04997825622558594, 0.053539276123046875, 0.05710029602050781, 0.06066131591796875, 0.06422233581542969, 0.06778335571289062, 0.07134437561035156, 0.0749053955078125, 0.07846641540527344, 0.08202743530273438, 0.08558845520019531, 0.08914947509765625, 0.09271049499511719, 0.09627151489257812, 0.09983253479003906, 0.1033935546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 13.0, 15.0, 26.0, 29.0, 37.0, 46.0, 45.0, 65.0, 54.0, 54.0, 56.0, 68.0, 60.0, 70.0, 58.0, 48.0, 43.0, 39.0, 39.0, 24.0, 31.0, 21.0, 16.0, 13.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1368408203125, -0.13320446014404297, -0.12956809997558594, -0.1259317398071289, -0.12229537963867188, -0.11865901947021484, -0.11502265930175781, -0.11138629913330078, -0.10774993896484375, -0.10411357879638672, -0.10047721862792969, -0.09684085845947266, -0.09320449829101562, -0.0895681381225586, -0.08593177795410156, -0.08229541778564453, -0.0786590576171875, -0.07502269744873047, -0.07138633728027344, -0.0677499771118164, -0.06411361694335938, -0.060477256774902344, -0.05684089660644531, -0.05320453643798828, -0.04956817626953125, -0.04593181610107422, -0.04229545593261719, -0.038659095764160156, -0.035022735595703125, -0.031386375427246094, -0.027750015258789062, -0.02411365509033203, -0.020477294921875, -0.01684093475341797, -0.013204574584960938, -0.009568214416503906, -0.005931854248046875, -0.0022954940795898438, 0.0013408660888671875, 0.004977226257324219, 0.00861358642578125, 0.012249946594238281, 0.015886306762695312, 0.019522666931152344, 0.023159027099609375, 0.026795387268066406, 0.030431747436523438, 0.03406810760498047, 0.0377044677734375, 0.04134082794189453, 0.04497718811035156, 0.048613548278808594, 0.052249908447265625, 0.055886268615722656, 0.05952262878417969, 0.06315898895263672, 0.06679534912109375, 0.07043170928955078, 0.07406806945800781, 0.07770442962646484, 0.08134078979492188, 0.0849771499633789, 0.08861351013183594, 0.09224987030029297, 0.09588623046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 11.0, 14.0, 17.0, 33.0, 61.0, 67.0, 118.0, 201.0, 336.0, 660.0, 2262.0, 21291.0, 3799107.0, 360489.0, 6963.0, 1253.0, 468.0, 298.0, 218.0, 154.0, 97.0, 69.0, 29.0, 24.0, 21.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42431640625, -0.41246795654296875, -0.4006195068359375, -0.38877105712890625, -0.376922607421875, -0.36507415771484375, -0.3532257080078125, -0.34137725830078125, -0.32952880859375, -0.31768035888671875, -0.3058319091796875, -0.29398345947265625, -0.282135009765625, -0.27028656005859375, -0.2584381103515625, -0.24658966064453125, -0.2347412109375, -0.22289276123046875, -0.2110443115234375, -0.19919586181640625, -0.187347412109375, -0.17549896240234375, -0.1636505126953125, -0.15180206298828125, -0.13995361328125, -0.12810516357421875, -0.1162567138671875, -0.10440826416015625, -0.092559814453125, -0.08071136474609375, -0.0688629150390625, -0.05701446533203125, -0.045166015625, -0.03331756591796875, -0.0214691162109375, -0.00962066650390625, 0.002227783203125, 0.01407623291015625, 0.0259246826171875, 0.03777313232421875, 0.04962158203125, 0.06147003173828125, 0.0733184814453125, 0.08516693115234375, 0.097015380859375, 0.10886383056640625, 0.1207122802734375, 0.13256072998046875, 0.1444091796875, 0.15625762939453125, 0.1681060791015625, 0.17995452880859375, 0.191802978515625, 0.20365142822265625, 0.2154998779296875, 0.22734832763671875, 0.23919677734375, 0.25104522705078125, 0.2628936767578125, 0.27474212646484375, 0.286590576171875, 0.29843902587890625, 0.3102874755859375, 0.32213592529296875, 0.333984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 16.0, 22.0, 33.0, 53.0, 130.0, 325.0, 1118.0, 1382.0, 638.0, 186.0, 67.0, 46.0, 23.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1553955078125, -0.1451396942138672, -0.13488388061523438, -0.12462806701660156, -0.11437225341796875, -0.10411643981933594, -0.09386062622070312, -0.08360481262207031, -0.0733489990234375, -0.06309318542480469, -0.052837371826171875, -0.04258155822753906, -0.03232574462890625, -0.022069931030273438, -0.011814117431640625, -0.0015583038330078125, 0.008697509765625, 0.018953323364257812, 0.029209136962890625, 0.03946495056152344, 0.04972076416015625, 0.05997657775878906, 0.07023239135742188, 0.08048820495605469, 0.0907440185546875, 0.10099983215332031, 0.11125564575195312, 0.12151145935058594, 0.13176727294921875, 0.14202308654785156, 0.15227890014648438, 0.1625347137451172, 0.17279052734375, 0.1830463409423828, 0.19330215454101562, 0.20355796813964844, 0.21381378173828125, 0.22406959533691406, 0.23432540893554688, 0.2445812225341797, 0.2548370361328125, 0.2650928497314453, 0.2753486633300781, 0.28560447692871094, 0.29586029052734375, 0.30611610412597656, 0.3163719177246094, 0.3266277313232422, 0.336883544921875, 0.3471393585205078, 0.3573951721191406, 0.36765098571777344, 0.37790679931640625, 0.38816261291503906, 0.3984184265136719, 0.4086742401123047, 0.4189300537109375, 0.4291858673095703, 0.4394416809082031, 0.44969749450683594, 0.45995330810546875, 0.47020912170410156, 0.4804649353027344, 0.4907207489013672, 0.5009765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 21.0, 40.0, 58.0, 100.0, 192.0, 192.0, 155.0, 91.0, 50.0, 29.0, 18.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6926915645599365, -1.6430004835128784, -1.5933094024658203, -1.5436183214187622, -1.493927240371704, -1.444236159324646, -1.394545078277588, -1.3448539972305298, -1.2951629161834717, -1.2454718351364136, -1.1957807540893555, -1.1460896730422974, -1.0963985919952393, -1.0467075109481812, -0.997016429901123, -0.9473253488540649, -0.8976342678070068, -0.8479431867599487, -0.7982521057128906, -0.7485610246658325, -0.6988699436187744, -0.6491788625717163, -0.5994877815246582, -0.5497967004776001, -0.500105619430542, -0.4504145383834839, -0.4007234573364258, -0.3510323762893677, -0.30134129524230957, -0.25165021419525146, -0.20195913314819336, -0.15226805210113525, -0.1025770902633667, -0.052886009216308594, -0.0031949281692504883, 0.04649615287780762, 0.09618723392486572, 0.14587831497192383, 0.19556939601898193, 0.24526047706604004, 0.29495155811309814, 0.34464263916015625, 0.39433372020721436, 0.44402480125427246, 0.49371588230133057, 0.5434069633483887, 0.5930980443954468, 0.6427891254425049, 0.692480206489563, 0.7421712875366211, 0.7918623685836792, 0.8415534496307373, 0.8912445306777954, 0.9409356117248535, 0.9906266927719116, 1.0403177738189697, 1.0900088548660278, 1.139699935913086, 1.189391016960144, 1.2390820980072021, 1.2887731790542603, 1.3384642601013184, 1.3881553411483765, 1.4378464221954346, 1.4875375032424927]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 17.0, 22.0, 28.0, 34.0, 25.0, 27.0, 41.0, 50.0, 40.0, 51.0, 40.0, 51.0, 41.0, 46.0, 40.0, 54.0, 45.0, 40.0, 34.0, 42.0, 29.0, 28.0, 14.0, 29.0, 8.0, 15.0, 12.0, 13.0, 12.0, 5.0, 6.0, 3.0, 7.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0612034797668457, -1.0328896045684814, -1.0045758485794067, -0.9762619733810425, -0.9479480981826782, -0.9196342825889587, -0.8913204669952393, -0.863006591796875, -0.8346927165985107, -0.8063789010047913, -0.778065025806427, -0.7497512102127075, -0.7214373350143433, -0.6931235194206238, -0.6648097038269043, -0.63649582862854, -0.6081820130348206, -0.5798681974411011, -0.5515543222427368, -0.5232405066490173, -0.4949266314506531, -0.4666128158569336, -0.4382989704608917, -0.40998512506484985, -0.381671279668808, -0.3533574342727661, -0.32504358887672424, -0.2967297434806824, -0.2684159278869629, -0.24010206758975983, -0.21178823709487915, -0.18347439169883728, -0.15516048669815063, -0.12684664130210876, -0.09853280335664749, -0.07021896541118622, -0.04190512001514435, -0.013591274619102478, 0.014722555875778198, 0.04303640127182007, 0.07135024666786194, 0.09966409206390381, 0.12797793745994568, 0.15629176795482635, 0.18460561335086823, 0.2129194587469101, 0.24123328924179077, 0.26954713463783264, 0.2978609800338745, 0.3261748254299164, 0.35448867082595825, 0.38280248641967773, 0.411116361618042, 0.4394301772117615, 0.46774402260780334, 0.4960578680038452, 0.5243717432022095, 0.552685558795929, 0.5809994339942932, 0.6093132495880127, 0.637627124786377, 0.6659409403800964, 0.6942547559738159, 0.7225686311721802, 0.7508824467658997]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 11.0, 12.0, 22.0, 32.0, 51.0, 53.0, 114.0, 155.0, 238.0, 361.0, 533.0, 807.0, 1318.0, 2086.0, 3574.0, 6294.0, 11526.0, 21723.0, 42127.0, 82722.0, 150509.0, 226814.0, 214682.0, 132910.0, 71037.0, 36102.0, 18722.0, 10093.0, 5476.0, 3213.0, 1923.0, 1195.0, 669.0, 504.0, 287.0, 196.0, 148.0, 88.0, 60.0, 49.0, 27.0, 28.0, 20.0, 18.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07720947265625, -0.07478809356689453, -0.07236671447753906, -0.0699453353881836, -0.06752395629882812, -0.06510257720947266, -0.06268119812011719, -0.06025981903076172, -0.05783843994140625, -0.05541706085205078, -0.05299568176269531, -0.050574302673339844, -0.048152923583984375, -0.045731544494628906, -0.04331016540527344, -0.04088878631591797, -0.0384674072265625, -0.03604602813720703, -0.03362464904785156, -0.031203269958496094, -0.028781890869140625, -0.026360511779785156, -0.023939132690429688, -0.02151775360107422, -0.01909637451171875, -0.01667499542236328, -0.014253616333007812, -0.011832237243652344, -0.009410858154296875, -0.006989479064941406, -0.0045680999755859375, -0.0021467208862304688, 0.000274658203125, 0.0026960372924804688, 0.0051174163818359375, 0.007538795471191406, 0.009960174560546875, 0.012381553649902344, 0.014802932739257812, 0.01722431182861328, 0.01964569091796875, 0.02206707000732422, 0.024488449096679688, 0.026909828186035156, 0.029331207275390625, 0.031752586364746094, 0.03417396545410156, 0.03659534454345703, 0.0390167236328125, 0.04143810272216797, 0.04385948181152344, 0.046280860900878906, 0.048702239990234375, 0.051123619079589844, 0.05354499816894531, 0.05596637725830078, 0.05838775634765625, 0.06080913543701172, 0.06323051452636719, 0.06565189361572266, 0.06807327270507812, 0.0704946517944336, 0.07291603088378906, 0.07533740997314453, 0.0777587890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 29.0, 19.0, 24.0, 42.0, 47.0, 40.0, 44.0, 49.0, 57.0, 57.0, 67.0, 66.0, 57.0, 60.0, 53.0, 49.0, 35.0, 35.0, 32.0, 36.0, 23.0, 17.0, 16.0, 8.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1353759765625, -0.13173294067382812, -0.12808990478515625, -0.12444686889648438, -0.1208038330078125, -0.11716079711914062, -0.11351776123046875, -0.10987472534179688, -0.106231689453125, -0.10258865356445312, -0.09894561767578125, -0.09530258178710938, -0.0916595458984375, -0.08801651000976562, -0.08437347412109375, -0.08073043823242188, -0.07708740234375, -0.07344436645507812, -0.06980133056640625, -0.06615829467773438, -0.0625152587890625, -0.058872222900390625, -0.05522918701171875, -0.051586151123046875, -0.047943115234375, -0.044300079345703125, -0.04065704345703125, -0.037014007568359375, -0.0333709716796875, -0.029727935791015625, -0.02608489990234375, -0.022441864013671875, -0.018798828125, -0.015155792236328125, -0.01151275634765625, -0.007869720458984375, -0.0042266845703125, -0.000583648681640625, 0.00305938720703125, 0.006702423095703125, 0.010345458984375, 0.013988494873046875, 0.01763153076171875, 0.021274566650390625, 0.0249176025390625, 0.028560638427734375, 0.03220367431640625, 0.035846710205078125, 0.03948974609375, 0.043132781982421875, 0.04677581787109375, 0.050418853759765625, 0.0540618896484375, 0.057704925537109375, 0.06134796142578125, 0.06499099731445312, 0.068634033203125, 0.07227706909179688, 0.07592010498046875, 0.07956314086914062, 0.0832061767578125, 0.08684921264648438, 0.09049224853515625, 0.09413528442382812, 0.0977783203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 10.0, 9.0, 13.0, 12.0, 18.0, 35.0, 44.0, 69.0, 65.0, 100.0, 162.0, 237.0, 416.0, 1062.0, 2720.0, 9716.0, 45393.0, 256048.0, 610161.0, 96289.0, 18221.0, 4546.0, 1507.0, 652.0, 333.0, 198.0, 129.0, 77.0, 69.0, 49.0, 41.0, 24.0, 17.0, 17.0, 18.0, 12.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18626976013183594, -0.17966842651367188, -0.1730670928955078, -0.16646575927734375, -0.1598644256591797, -0.15326309204101562, -0.14666175842285156, -0.1400604248046875, -0.13345909118652344, -0.12685775756835938, -0.12025642395019531, -0.11365509033203125, -0.10705375671386719, -0.10045242309570312, -0.09385108947753906, -0.087249755859375, -0.08064842224121094, -0.07404708862304688, -0.06744575500488281, -0.06084442138671875, -0.05424308776855469, -0.047641754150390625, -0.04104042053222656, -0.0344390869140625, -0.027837753295898438, -0.021236419677734375, -0.014635086059570312, -0.00803375244140625, -0.0014324188232421875, 0.005168914794921875, 0.011770248413085938, 0.01837158203125, 0.024972915649414062, 0.031574249267578125, 0.03817558288574219, 0.04477691650390625, 0.05137825012207031, 0.057979583740234375, 0.06458091735839844, 0.0711822509765625, 0.07778358459472656, 0.08438491821289062, 0.09098625183105469, 0.09758758544921875, 0.10418891906738281, 0.11079025268554688, 0.11739158630371094, 0.123992919921875, 0.13059425354003906, 0.13719558715820312, 0.1437969207763672, 0.15039825439453125, 0.1569995880126953, 0.16360092163085938, 0.17020225524902344, 0.1768035888671875, 0.18340492248535156, 0.19000625610351562, 0.1966075897216797, 0.20320892333984375, 0.2098102569580078, 0.21641159057617188, 0.22301292419433594, 0.2296142578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 10.0, 8.0, 15.0, 9.0, 16.0, 13.0, 19.0, 24.0, 23.0, 41.0, 33.0, 42.0, 32.0, 42.0, 53.0, 45.0, 49.0, 58.0, 49.0, 43.0, 39.0, 47.0, 31.0, 40.0, 35.0, 24.0, 24.0, 25.0, 20.0, 12.0, 16.0, 6.0, 10.0, 10.0, 5.0, 4.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267578125, -0.2579994201660156, -0.24842071533203125, -0.23884201049804688, -0.2292633056640625, -0.21968460083007812, -0.21010589599609375, -0.20052719116210938, -0.190948486328125, -0.18136978149414062, -0.17179107666015625, -0.16221237182617188, -0.1526336669921875, -0.14305496215820312, -0.13347625732421875, -0.12389755249023438, -0.11431884765625, -0.10474014282226562, -0.09516143798828125, -0.08558273315429688, -0.0760040283203125, -0.06642532348632812, -0.05684661865234375, -0.047267913818359375, -0.037689208984375, -0.028110504150390625, -0.01853179931640625, -0.008953094482421875, 0.0006256103515625, 0.010204315185546875, 0.01978302001953125, 0.029361724853515625, 0.0389404296875, 0.048519134521484375, 0.05809783935546875, 0.06767654418945312, 0.0772552490234375, 0.08683395385742188, 0.09641265869140625, 0.10599136352539062, 0.115570068359375, 0.12514877319335938, 0.13472747802734375, 0.14430618286132812, 0.1538848876953125, 0.16346359252929688, 0.17304229736328125, 0.18262100219726562, 0.19219970703125, 0.20177841186523438, 0.21135711669921875, 0.22093582153320312, 0.2305145263671875, 0.24009323120117188, 0.24967193603515625, 0.2592506408691406, 0.268829345703125, 0.2784080505371094, 0.28798675537109375, 0.2975654602050781, 0.3071441650390625, 0.3167228698730469, 0.32630157470703125, 0.3358802795410156, 0.345458984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 3.0, 10.0, 7.0, 22.0, 21.0, 35.0, 44.0, 66.0, 74.0, 145.0, 225.0, 341.0, 585.0, 1078.0, 2042.0, 4062.0, 9630.0, 24833.0, 76381.0, 268753.0, 506857.0, 100031.0, 31355.0, 11690.0, 4920.0, 2410.0, 1103.0, 675.0, 368.0, 261.0, 160.0, 114.0, 78.0, 44.0, 30.0, 22.0, 18.0, 14.0, 13.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 6.0, 1.0], "bins": [-0.06805419921875, -0.06622028350830078, -0.06438636779785156, -0.06255245208740234, -0.060718536376953125, -0.058884620666503906, -0.05705070495605469, -0.05521678924560547, -0.05338287353515625, -0.05154895782470703, -0.04971504211425781, -0.047881126403808594, -0.046047210693359375, -0.044213294982910156, -0.04237937927246094, -0.04054546356201172, -0.0387115478515625, -0.03687763214111328, -0.03504371643066406, -0.033209800720214844, -0.031375885009765625, -0.029541969299316406, -0.027708053588867188, -0.02587413787841797, -0.02404022216796875, -0.02220630645751953, -0.020372390747070312, -0.018538475036621094, -0.016704559326171875, -0.014870643615722656, -0.013036727905273438, -0.011202812194824219, -0.009368896484375, -0.007534980773925781, -0.0057010650634765625, -0.0038671493530273438, -0.002033233642578125, -0.00019931793212890625, 0.0016345977783203125, 0.0034685134887695312, 0.00530242919921875, 0.007136344909667969, 0.008970260620117188, 0.010804176330566406, 0.012638092041015625, 0.014472007751464844, 0.016305923461914062, 0.01813983917236328, 0.0199737548828125, 0.02180767059326172, 0.023641586303710938, 0.025475502014160156, 0.027309417724609375, 0.029143333435058594, 0.030977249145507812, 0.03281116485595703, 0.03464508056640625, 0.03647899627685547, 0.03831291198730469, 0.040146827697753906, 0.041980743408203125, 0.043814659118652344, 0.04564857482910156, 0.04748249053955078, 0.04931640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 4.0, 7.0, 11.0, 11.0, 27.0, 42.0, 54.0, 74.0, 83.0, 96.0, 119.0, 98.0, 98.0, 70.0, 69.0, 41.0, 24.0, 16.0, 16.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.929304122924805e-05, -4.795379936695099e-05, -4.661455750465393e-05, -4.527531564235687e-05, -4.3936073780059814e-05, -4.2596831917762756e-05, -4.12575900554657e-05, -3.991834819316864e-05, -3.857910633087158e-05, -3.7239864468574524e-05, -3.5900622606277466e-05, -3.456138074398041e-05, -3.322213888168335e-05, -3.188289701938629e-05, -3.0543655157089233e-05, -2.9204413294792175e-05, -2.7865171432495117e-05, -2.652592957019806e-05, -2.5186687707901e-05, -2.3847445845603943e-05, -2.2508203983306885e-05, -2.1168962121009827e-05, -1.982972025871277e-05, -1.849047839641571e-05, -1.7151236534118652e-05, -1.5811994671821594e-05, -1.4472752809524536e-05, -1.3133510947227478e-05, -1.179426908493042e-05, -1.0455027222633362e-05, -9.115785360336304e-06, -7.776543498039246e-06, -6.4373016357421875e-06, -5.098059773445129e-06, -3.7588179111480713e-06, -2.419576048851013e-06, -1.080334186553955e-06, 2.5890767574310303e-07, 1.5981495380401611e-06, 2.9373914003372192e-06, 4.276633262634277e-06, 5.6158751249313354e-06, 6.9551169872283936e-06, 8.294358849525452e-06, 9.63360071182251e-06, 1.0972842574119568e-05, 1.2312084436416626e-05, 1.3651326298713684e-05, 1.4990568161010742e-05, 1.63298100233078e-05, 1.766905188560486e-05, 1.9008293747901917e-05, 2.0347535610198975e-05, 2.1686777472496033e-05, 2.302601933479309e-05, 2.436526119709015e-05, 2.5704503059387207e-05, 2.7043744921684265e-05, 2.8382986783981323e-05, 2.972222864627838e-05, 3.106147050857544e-05, 3.24007123708725e-05, 3.3739954233169556e-05, 3.5079196095466614e-05, 3.641843795776367e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 15.0, 12.0, 31.0, 44.0, 87.0, 161.0, 404.0, 1086.0, 3202.0, 12832.0, 69203.0, 606003.0, 298139.0, 44489.0, 8846.0, 2547.0, 776.0, 344.0, 139.0, 67.0, 42.0, 30.0, 13.0, 10.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07598876953125, -0.07305240631103516, -0.07011604309082031, -0.06717967987060547, -0.06424331665039062, -0.06130695343017578, -0.05837059020996094, -0.055434226989746094, -0.05249786376953125, -0.049561500549316406, -0.04662513732910156, -0.04368877410888672, -0.040752410888671875, -0.03781604766845703, -0.03487968444824219, -0.031943321228027344, -0.0290069580078125, -0.026070594787597656, -0.023134231567382812, -0.02019786834716797, -0.017261505126953125, -0.014325141906738281, -0.011388778686523438, -0.008452415466308594, -0.00551605224609375, -0.0025796890258789062, 0.0003566741943359375, 0.0032930374145507812, 0.006229400634765625, 0.009165763854980469, 0.012102127075195312, 0.015038490295410156, 0.017974853515625, 0.020911216735839844, 0.023847579956054688, 0.02678394317626953, 0.029720306396484375, 0.03265666961669922, 0.03559303283691406, 0.038529396057128906, 0.04146575927734375, 0.044402122497558594, 0.04733848571777344, 0.05027484893798828, 0.053211212158203125, 0.05614757537841797, 0.05908393859863281, 0.062020301818847656, 0.0649566650390625, 0.06789302825927734, 0.07082939147949219, 0.07376575469970703, 0.07670211791992188, 0.07963848114013672, 0.08257484436035156, 0.0855112075805664, 0.08844757080078125, 0.0913839340209961, 0.09432029724121094, 0.09725666046142578, 0.10019302368164062, 0.10312938690185547, 0.10606575012207031, 0.10900211334228516, 0.1119384765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 10.0, 14.0, 17.0, 21.0, 42.0, 46.0, 58.0, 53.0, 68.0, 74.0, 84.0, 83.0, 83.0, 89.0, 46.0, 53.0, 39.0, 35.0, 15.0, 21.0, 8.0, 14.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09307861328125, -0.09049606323242188, -0.08791351318359375, -0.08533096313476562, -0.0827484130859375, -0.08016586303710938, -0.07758331298828125, -0.07500076293945312, -0.072418212890625, -0.06983566284179688, -0.06725311279296875, -0.06467056274414062, -0.0620880126953125, -0.059505462646484375, -0.05692291259765625, -0.054340362548828125, -0.0517578125, -0.049175262451171875, -0.04659271240234375, -0.044010162353515625, -0.0414276123046875, -0.038845062255859375, -0.03626251220703125, -0.033679962158203125, -0.031097412109375, -0.028514862060546875, -0.02593231201171875, -0.023349761962890625, -0.0207672119140625, -0.018184661865234375, -0.01560211181640625, -0.013019561767578125, -0.01043701171875, -0.007854461669921875, -0.00527191162109375, -0.002689361572265625, -0.0001068115234375, 0.002475738525390625, 0.00505828857421875, 0.007640838623046875, 0.010223388671875, 0.012805938720703125, 0.01538848876953125, 0.017971038818359375, 0.0205535888671875, 0.023136138916015625, 0.02571868896484375, 0.028301239013671875, 0.0308837890625, 0.033466339111328125, 0.03604888916015625, 0.038631439208984375, 0.0412139892578125, 0.043796539306640625, 0.04637908935546875, 0.048961639404296875, 0.051544189453125, 0.054126739501953125, 0.05670928955078125, 0.059291839599609375, 0.0618743896484375, 0.06445693969726562, 0.06703948974609375, 0.06962203979492188, 0.07220458984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 15.0, 35.0, 66.0, 94.0, 185.0, 275.0, 160.0, 60.0, 51.0, 21.0, 9.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5156450271606445, -2.453484296798706, -2.3913238048553467, -2.329163074493408, -2.267002582550049, -2.2048418521881104, -2.142681360244751, -2.0805206298828125, -2.018360137939453, -1.9561995267868042, -1.8940389156341553, -1.8318783044815063, -1.7697176933288574, -1.707556962966919, -1.6453964710235596, -1.583235740661621, -1.5210750102996826, -1.4589143991470337, -1.3967537879943848, -1.3345931768417358, -1.272432565689087, -1.2102718353271484, -1.148111343383789, -1.0859506130218506, -1.0237901210784912, -0.9616295099258423, -0.8994688987731934, -0.8373082876205444, -0.7751476168632507, -0.7129870057106018, -0.6508263945579529, -0.5886657238006592, -0.5265051126480103, -0.46434450149536133, -0.40218386054039, -0.3400232493877411, -0.2778626084327698, -0.21570199728012085, -0.15354138612747192, -0.09138074517250061, -0.029220134019851685, 0.03294048830866814, 0.09510111063718796, 0.15726172924041748, 0.2194223552942276, 0.2815829813480377, 0.34374359250068665, 0.40590423345565796, 0.4680648446083069, 0.5302254557609558, 0.5923860669136047, 0.6545467376708984, 0.7167073488235474, 0.7788679599761963, 0.8410285711288452, 0.9031891822814941, 0.9653497934341431, 1.027510404586792, 1.089671015739441, 1.1518316268920898, 1.2139922380447388, 1.2761528491973877, 1.3383135795593262, 1.400474190711975, 1.462634801864624]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 10.0, 9.0, 20.0, 25.0, 24.0, 22.0, 29.0, 23.0, 32.0, 43.0, 41.0, 51.0, 65.0, 78.0, 70.0, 50.0, 48.0, 35.0, 36.0, 38.0, 26.0, 31.0, 23.0, 17.0, 18.0, 14.0, 17.0, 8.0, 9.0, 12.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0125527381896973, -0.9771116971969604, -0.9416706562042236, -0.9062296152114868, -0.87078857421875, -0.8353475332260132, -0.7999064922332764, -0.7644654512405396, -0.7290244102478027, -0.6935833692550659, -0.6581423282623291, -0.6227012872695923, -0.5872602462768555, -0.5518192052841187, -0.5163781642913818, -0.48093709349632263, -0.4454960227012634, -0.4100549817085266, -0.3746139407157898, -0.339172899723053, -0.30373185873031616, -0.26829081773757935, -0.23284974694252014, -0.19740870594978333, -0.1619676649570465, -0.1265266239643097, -0.09108557552099228, -0.055644527077674866, -0.02020348608493805, 0.015237554907798767, 0.05067861080169678, 0.0861196517944336, 0.12156069278717041, 0.15700173377990723, 0.19244277477264404, 0.22788383066654205, 0.2633248567581177, 0.2987658977508545, 0.3342069685459137, 0.3696480095386505, 0.40508905053138733, 0.44053009152412415, 0.47597113251686096, 0.5114122033119202, 0.546853244304657, 0.5822942852973938, 0.6177353262901306, 0.6531763672828674, 0.6886174082756042, 0.7240584492683411, 0.7594994902610779, 0.7949405312538147, 0.8303815722465515, 0.8658226132392883, 0.9012637138366699, 0.9367047548294067, 0.9721457958221436, 1.0075868368148804, 1.0430278778076172, 1.078468918800354, 1.1139099597930908, 1.1493510007858276, 1.1847920417785645, 1.2202330827713013, 1.255674123764038]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 8.0, 5.0, 10.0, 9.0, 19.0, 17.0, 27.0, 37.0, 45.0, 85.0, 97.0, 148.0, 215.0, 294.0, 414.0, 738.0, 1231.0, 2574.0, 6562.0, 23199.0, 124371.0, 929319.0, 2398549.0, 596089.0, 82412.0, 16962.0, 5549.0, 2237.0, 1108.0, 656.0, 383.0, 267.0, 173.0, 141.0, 69.0, 79.0, 58.0, 24.0, 28.0, 22.0, 19.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08584308624267578, -0.08281898498535156, -0.07979488372802734, -0.07677078247070312, -0.0737466812133789, -0.07072257995605469, -0.06769847869873047, -0.06467437744140625, -0.06165027618408203, -0.05862617492675781, -0.055602073669433594, -0.052577972412109375, -0.049553871154785156, -0.04652976989746094, -0.04350566864013672, -0.0404815673828125, -0.03745746612548828, -0.03443336486816406, -0.031409263610839844, -0.028385162353515625, -0.025361061096191406, -0.022336959838867188, -0.01931285858154297, -0.01628875732421875, -0.013264656066894531, -0.010240554809570312, -0.007216453552246094, -0.004192352294921875, -0.0011682510375976562, 0.0018558502197265625, 0.004879951477050781, 0.007904052734375, 0.010928153991699219, 0.013952255249023438, 0.016976356506347656, 0.020000457763671875, 0.023024559020996094, 0.026048660278320312, 0.02907276153564453, 0.03209686279296875, 0.03512096405029297, 0.03814506530761719, 0.041169166564941406, 0.044193267822265625, 0.047217369079589844, 0.05024147033691406, 0.05326557159423828, 0.0562896728515625, 0.05931377410888672, 0.06233787536621094, 0.06536197662353516, 0.06838607788085938, 0.0714101791381836, 0.07443428039550781, 0.07745838165283203, 0.08048248291015625, 0.08350658416748047, 0.08653068542480469, 0.0895547866821289, 0.09257888793945312, 0.09560298919677734, 0.09862709045410156, 0.10165119171142578, 0.10467529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 12.0, 12.0, 12.0, 13.0, 21.0, 32.0, 28.0, 37.0, 37.0, 38.0, 57.0, 45.0, 45.0, 65.0, 55.0, 46.0, 61.0, 59.0, 57.0, 48.0, 37.0, 37.0, 29.0, 22.0, 23.0, 14.0, 16.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1190185546875, -0.11565780639648438, -0.11229705810546875, -0.10893630981445312, -0.1055755615234375, -0.10221481323242188, -0.09885406494140625, -0.09549331665039062, -0.092132568359375, -0.08877182006835938, -0.08541107177734375, -0.08205032348632812, -0.0786895751953125, -0.07532882690429688, -0.07196807861328125, -0.06860733032226562, -0.06524658203125, -0.061885833740234375, -0.05852508544921875, -0.055164337158203125, -0.0518035888671875, -0.048442840576171875, -0.04508209228515625, -0.041721343994140625, -0.038360595703125, -0.034999847412109375, -0.03163909912109375, -0.028278350830078125, -0.0249176025390625, -0.021556854248046875, -0.01819610595703125, -0.014835357666015625, -0.011474609375, -0.008113861083984375, -0.00475311279296875, -0.001392364501953125, 0.0019683837890625, 0.005329132080078125, 0.00868988037109375, 0.012050628662109375, 0.015411376953125, 0.018772125244140625, 0.02213287353515625, 0.025493621826171875, 0.0288543701171875, 0.032215118408203125, 0.03557586669921875, 0.038936614990234375, 0.04229736328125, 0.045658111572265625, 0.04901885986328125, 0.052379608154296875, 0.0557403564453125, 0.059101104736328125, 0.06246185302734375, 0.06582260131835938, 0.069183349609375, 0.07254409790039062, 0.07590484619140625, 0.07926559448242188, 0.0826263427734375, 0.08598709106445312, 0.08934783935546875, 0.09270858764648438, 0.0960693359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 19.0, 55.0, 138.0, 377.0, 1928.0, 114556.0, 4070438.0, 5687.0, 723.0, 205.0, 75.0, 34.0, 8.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7591476440429688, -0.7355804443359375, -0.7120132446289062, -0.688446044921875, -0.6648788452148438, -0.6413116455078125, -0.6177444458007812, -0.59417724609375, -0.5706100463867188, -0.5470428466796875, -0.5234756469726562, -0.499908447265625, -0.47634124755859375, -0.4527740478515625, -0.42920684814453125, -0.4056396484375, -0.38207244873046875, -0.3585052490234375, -0.33493804931640625, -0.311370849609375, -0.28780364990234375, -0.2642364501953125, -0.24066925048828125, -0.21710205078125, -0.19353485107421875, -0.1699676513671875, -0.14640045166015625, -0.122833251953125, -0.09926605224609375, -0.0756988525390625, -0.05213165283203125, -0.028564453125, -0.00499725341796875, 0.0185699462890625, 0.04213714599609375, 0.065704345703125, 0.08927154541015625, 0.1128387451171875, 0.13640594482421875, 0.15997314453125, 0.18354034423828125, 0.2071075439453125, 0.23067474365234375, 0.254241943359375, 0.27780914306640625, 0.3013763427734375, 0.32494354248046875, 0.3485107421875, 0.37207794189453125, 0.3956451416015625, 0.41921234130859375, 0.442779541015625, 0.46634674072265625, 0.4899139404296875, 0.5134811401367188, 0.53704833984375, 0.5606155395507812, 0.5841827392578125, 0.6077499389648438, 0.631317138671875, 0.6548843383789062, 0.6784515380859375, 0.7020187377929688, 0.7255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 16.0, 14.0, 17.0, 36.0, 88.0, 189.0, 503.0, 1222.0, 1184.0, 430.0, 189.0, 86.0, 39.0, 31.0, 8.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.42578125, -0.4156208038330078, -0.4054603576660156, -0.39529991149902344, -0.38513946533203125, -0.37497901916503906, -0.3648185729980469, -0.3546581268310547, -0.3444976806640625, -0.3343372344970703, -0.3241767883300781, -0.31401634216308594, -0.30385589599609375, -0.29369544982910156, -0.2835350036621094, -0.2733745574951172, -0.263214111328125, -0.2530536651611328, -0.24289321899414062, -0.23273277282714844, -0.22257232666015625, -0.21241188049316406, -0.20225143432617188, -0.1920909881591797, -0.1819305419921875, -0.1717700958251953, -0.16160964965820312, -0.15144920349121094, -0.14128875732421875, -0.13112831115722656, -0.12096786499023438, -0.11080741882324219, -0.10064697265625, -0.09048652648925781, -0.08032608032226562, -0.07016563415527344, -0.06000518798828125, -0.04984474182128906, -0.039684295654296875, -0.029523849487304688, -0.0193634033203125, -0.009202957153320312, 0.000957489013671875, 0.011117935180664062, 0.02127838134765625, 0.03143882751464844, 0.041599273681640625, 0.05175971984863281, 0.061920166015625, 0.07208061218261719, 0.08224105834960938, 0.09240150451660156, 0.10256195068359375, 0.11272239685058594, 0.12288284301757812, 0.1330432891845703, 0.1432037353515625, 0.1533641815185547, 0.16352462768554688, 0.17368507385253906, 0.18384552001953125, 0.19400596618652344, 0.20416641235351562, 0.2143268585205078, 0.2244873046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 17.0, 41.0, 61.0, 141.0, 210.0, 197.0, 141.0, 94.0, 41.0, 26.0, 9.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.719484806060791, -2.6601996421813965, -2.600914239883423, -2.5416290760040283, -2.482343912124634, -2.42305850982666, -2.3637733459472656, -2.304488182067871, -2.2452027797698975, -2.185917615890503, -2.1266322135925293, -2.0673470497131348, -2.0080618858337402, -1.9487764835357666, -1.889491319656372, -1.830206036567688, -1.7709208726882935, -1.7116355895996094, -1.6523504257202148, -1.5930651426315308, -1.5337798595428467, -1.4744946956634521, -1.415209412574768, -1.355924129486084, -1.2966389656066895, -1.2373536825180054, -1.1780685186386108, -1.1187832355499268, -1.0594979524612427, -1.0002126693725586, -0.9409275054931641, -0.88164222240448, -0.8223570585250854, -0.7630718350410461, -0.7037865519523621, -0.6445013284683228, -0.5852160453796387, -0.5259308218955994, -0.46664559841156006, -0.40736034512519836, -0.34807509183883667, -0.288789838552475, -0.22950460016727448, -0.17021936178207397, -0.11093410849571228, -0.051648855209350586, 0.007636368274688721, 0.06692162156105042, 0.1262068748474121, 0.1854921281337738, 0.2447773665189743, 0.3040626049041748, 0.3633478581905365, 0.4226331114768982, 0.4819183349609375, 0.5412036180496216, 0.6004888415336609, 0.6597740650177002, 0.7190593481063843, 0.7783445715904236, 0.8376297950744629, 0.896915078163147, 0.9562003016471863, 1.0154855251312256, 1.0747708082199097]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 3.0, 8.0, 12.0, 13.0, 14.0, 11.0, 25.0, 27.0, 19.0, 22.0, 28.0, 31.0, 35.0, 41.0, 51.0, 50.0, 44.0, 40.0, 37.0, 51.0, 44.0, 48.0, 40.0, 40.0, 34.0, 32.0, 28.0, 17.0, 27.0, 21.0, 18.0, 11.0, 18.0, 12.0, 17.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8045223355293274, -0.7798269391059875, -0.7551315426826477, -0.7304361462593079, -0.7057408094406128, -0.681045413017273, -0.6563500165939331, -0.6316546201705933, -0.6069592237472534, -0.5822638273239136, -0.5575684309005737, -0.5328730344772339, -0.508177638053894, -0.4834822714328766, -0.45878690481185913, -0.4340915083885193, -0.40939611196517944, -0.3847007155418396, -0.36000531911849976, -0.3353099524974823, -0.31061455607414246, -0.2859191596508026, -0.26122379302978516, -0.2365283966064453, -0.21183300018310547, -0.18713760375976562, -0.16244222223758698, -0.13774684071540833, -0.11305144429206848, -0.08835605531930923, -0.06366066634654999, -0.03896528482437134, -0.014269888401031494, 0.010425500571727753, 0.035120889544487, 0.059816278517246246, 0.0845116674900055, 0.10920705646276474, 0.133902445435524, 0.15859782695770264, 0.18329322338104248, 0.20798861980438232, 0.23268400132656097, 0.2573793828487396, 0.28207477927207947, 0.3067701756954193, 0.33146554231643677, 0.3561609387397766, 0.38085633516311646, 0.4055517315864563, 0.43024712800979614, 0.4549424946308136, 0.47963789105415344, 0.5043332576751709, 0.5290286540985107, 0.5537240505218506, 0.5784194469451904, 0.6031148433685303, 0.6278102397918701, 0.65250563621521, 0.6772010326385498, 0.7018963694572449, 0.7265917658805847, 0.7512871623039246, 0.7759825587272644]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 12.0, 13.0, 19.0, 25.0, 38.0, 46.0, 81.0, 123.0, 199.0, 260.0, 424.0, 704.0, 1169.0, 1981.0, 3435.0, 6015.0, 11214.0, 21115.0, 41993.0, 82110.0, 161936.0, 259839.0, 216985.0, 116299.0, 58546.0, 29579.0, 15322.0, 8101.0, 4532.0, 2474.0, 1510.0, 917.0, 531.0, 320.0, 207.0, 154.0, 95.0, 71.0, 39.0, 42.0, 28.0, 10.0, 12.0, 7.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06895160675048828, -0.06655311584472656, -0.06415462493896484, -0.061756134033203125, -0.059357643127441406, -0.05695915222167969, -0.05456066131591797, -0.05216217041015625, -0.04976367950439453, -0.04736518859863281, -0.044966697692871094, -0.042568206787109375, -0.040169715881347656, -0.03777122497558594, -0.03537273406982422, -0.0329742431640625, -0.03057575225830078, -0.028177261352539062, -0.025778770446777344, -0.023380279541015625, -0.020981788635253906, -0.018583297729492188, -0.01618480682373047, -0.01378631591796875, -0.011387825012207031, -0.008989334106445312, -0.006590843200683594, -0.004192352294921875, -0.0017938613891601562, 0.0006046295166015625, 0.0030031204223632812, 0.005401611328125, 0.007800102233886719, 0.010198593139648438, 0.012597084045410156, 0.014995574951171875, 0.017394065856933594, 0.019792556762695312, 0.02219104766845703, 0.02458953857421875, 0.02698802947998047, 0.029386520385742188, 0.031785011291503906, 0.034183502197265625, 0.036581993103027344, 0.03898048400878906, 0.04137897491455078, 0.0437774658203125, 0.04617595672607422, 0.04857444763183594, 0.050972938537597656, 0.053371429443359375, 0.055769920349121094, 0.05816841125488281, 0.06056690216064453, 0.06296539306640625, 0.06536388397216797, 0.06776237487792969, 0.0701608657836914, 0.07255935668945312, 0.07495784759521484, 0.07735633850097656, 0.07975482940673828, 0.0821533203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 13.0, 8.0, 17.0, 13.0, 13.0, 29.0, 26.0, 30.0, 35.0, 32.0, 50.0, 50.0, 49.0, 33.0, 59.0, 47.0, 58.0, 65.0, 53.0, 45.0, 47.0, 41.0, 39.0, 29.0, 24.0, 12.0, 17.0, 22.0, 6.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1192626953125, -0.11587905883789062, -0.11249542236328125, -0.10911178588867188, -0.1057281494140625, -0.10234451293945312, -0.09896087646484375, -0.09557723999023438, -0.092193603515625, -0.08880996704101562, -0.08542633056640625, -0.08204269409179688, -0.0786590576171875, -0.07527542114257812, -0.07189178466796875, -0.06850814819335938, -0.06512451171875, -0.061740875244140625, -0.05835723876953125, -0.054973602294921875, -0.0515899658203125, -0.048206329345703125, -0.04482269287109375, -0.041439056396484375, -0.038055419921875, -0.034671783447265625, -0.03128814697265625, -0.027904510498046875, -0.0245208740234375, -0.021137237548828125, -0.01775360107421875, -0.014369964599609375, -0.010986328125, -0.007602691650390625, -0.00421905517578125, -0.000835418701171875, 0.0025482177734375, 0.005931854248046875, 0.00931549072265625, 0.012699127197265625, 0.016082763671875, 0.019466400146484375, 0.02285003662109375, 0.026233673095703125, 0.0296173095703125, 0.033000946044921875, 0.03638458251953125, 0.039768218994140625, 0.04315185546875, 0.046535491943359375, 0.04991912841796875, 0.053302764892578125, 0.0566864013671875, 0.060070037841796875, 0.06345367431640625, 0.06683731079101562, 0.070220947265625, 0.07360458374023438, 0.07698822021484375, 0.08037185668945312, 0.0837554931640625, 0.08713912963867188, 0.09052276611328125, 0.09390640258789062, 0.0972900390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 8.0, 3.0, 10.0, 3.0, 10.0, 14.0, 17.0, 21.0, 51.0, 41.0, 73.0, 91.0, 128.0, 193.0, 274.0, 511.0, 991.0, 2297.0, 7997.0, 44482.0, 615634.0, 329124.0, 35348.0, 6860.0, 2087.0, 823.0, 493.0, 271.0, 213.0, 147.0, 82.0, 70.0, 49.0, 34.0, 24.0, 18.0, 10.0, 13.0, 10.0, 8.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.271240234375, -0.26274871826171875, -0.2542572021484375, -0.24576568603515625, -0.237274169921875, -0.22878265380859375, -0.2202911376953125, -0.21179962158203125, -0.20330810546875, -0.19481658935546875, -0.1863250732421875, -0.17783355712890625, -0.169342041015625, -0.16085052490234375, -0.1523590087890625, -0.14386749267578125, -0.1353759765625, -0.12688446044921875, -0.1183929443359375, -0.10990142822265625, -0.101409912109375, -0.09291839599609375, -0.0844268798828125, -0.07593536376953125, -0.06744384765625, -0.05895233154296875, -0.0504608154296875, -0.04196929931640625, -0.033477783203125, -0.02498626708984375, -0.0164947509765625, -0.00800323486328125, 0.00048828125, 0.00897979736328125, 0.0174713134765625, 0.02596282958984375, 0.034454345703125, 0.04294586181640625, 0.0514373779296875, 0.05992889404296875, 0.06842041015625, 0.07691192626953125, 0.0854034423828125, 0.09389495849609375, 0.102386474609375, 0.11087799072265625, 0.1193695068359375, 0.12786102294921875, 0.1363525390625, 0.14484405517578125, 0.1533355712890625, 0.16182708740234375, 0.170318603515625, 0.17881011962890625, 0.1873016357421875, 0.19579315185546875, 0.20428466796875, 0.21277618408203125, 0.2212677001953125, 0.22975921630859375, 0.238250732421875, 0.24674224853515625, 0.2552337646484375, 0.26372528076171875, 0.272216796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 6.0, 12.0, 16.0, 25.0, 14.0, 34.0, 43.0, 52.0, 49.0, 58.0, 69.0, 72.0, 71.0, 84.0, 76.0, 59.0, 51.0, 41.0, 34.0, 30.0, 27.0, 15.0, 13.0, 14.0, 6.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5081634521484375, -0.491424560546875, -0.4746856689453125, -0.45794677734375, -0.4412078857421875, -0.424468994140625, -0.4077301025390625, -0.3909912109375, -0.3742523193359375, -0.357513427734375, -0.3407745361328125, -0.32403564453125, -0.3072967529296875, -0.290557861328125, -0.2738189697265625, -0.257080078125, -0.2403411865234375, -0.223602294921875, -0.2068634033203125, -0.19012451171875, -0.1733856201171875, -0.156646728515625, -0.1399078369140625, -0.1231689453125, -0.1064300537109375, -0.089691162109375, -0.0729522705078125, -0.05621337890625, -0.0394744873046875, -0.022735595703125, -0.0059967041015625, 0.0107421875, 0.0274810791015625, 0.044219970703125, 0.0609588623046875, 0.07769775390625, 0.0944366455078125, 0.111175537109375, 0.1279144287109375, 0.1446533203125, 0.1613922119140625, 0.178131103515625, 0.1948699951171875, 0.21160888671875, 0.2283477783203125, 0.245086669921875, 0.2618255615234375, 0.278564453125, 0.2953033447265625, 0.312042236328125, 0.3287811279296875, 0.34552001953125, 0.3622589111328125, 0.378997802734375, 0.3957366943359375, 0.4124755859375, 0.4292144775390625, 0.445953369140625, 0.4626922607421875, 0.47943115234375, 0.4961700439453125, 0.512908935546875, 0.5296478271484375, 0.54638671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 7.0, 9.0, 7.0, 16.0, 27.0, 39.0, 59.0, 92.0, 140.0, 292.0, 561.0, 1199.0, 2931.0, 7671.0, 25654.0, 124552.0, 741216.0, 108153.0, 23538.0, 7302.0, 2706.0, 1162.0, 562.0, 281.0, 163.0, 86.0, 47.0, 24.0, 18.0, 18.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08954811096191406, -0.08687210083007812, -0.08419609069824219, -0.08152008056640625, -0.07884407043457031, -0.07616806030273438, -0.07349205017089844, -0.0708160400390625, -0.06814002990722656, -0.06546401977539062, -0.06278800964355469, -0.06011199951171875, -0.05743598937988281, -0.054759979248046875, -0.05208396911621094, -0.049407958984375, -0.04673194885253906, -0.044055938720703125, -0.04137992858886719, -0.03870391845703125, -0.03602790832519531, -0.033351898193359375, -0.030675888061523438, -0.0279998779296875, -0.025323867797851562, -0.022647857666015625, -0.019971847534179688, -0.01729583740234375, -0.014619827270507812, -0.011943817138671875, -0.009267807006835938, -0.006591796875, -0.0039157867431640625, -0.001239776611328125, 0.0014362335205078125, 0.00411224365234375, 0.0067882537841796875, 0.009464263916015625, 0.012140274047851562, 0.0148162841796875, 0.017492294311523438, 0.020168304443359375, 0.022844314575195312, 0.02552032470703125, 0.028196334838867188, 0.030872344970703125, 0.03354835510253906, 0.036224365234375, 0.03890037536621094, 0.041576385498046875, 0.04425239562988281, 0.04692840576171875, 0.04960441589355469, 0.052280426025390625, 0.05495643615722656, 0.0576324462890625, 0.06030845642089844, 0.06298446655273438, 0.06566047668457031, 0.06833648681640625, 0.07101249694824219, 0.07368850708007812, 0.07636451721191406, 0.07904052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 5.0, 16.0, 7.0, 15.0, 16.0, 24.0, 29.0, 36.0, 67.0, 92.0, 118.0, 117.0, 122.0, 83.0, 58.0, 46.0, 28.0, 26.0, 24.0, 8.0, 9.0, 8.0, 9.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1961669921875e-05, -4.074070602655411e-05, -3.9519742131233215e-05, -3.829877823591232e-05, -3.707781434059143e-05, -3.585685044527054e-05, -3.4635886549949646e-05, -3.3414922654628754e-05, -3.219395875930786e-05, -3.097299486398697e-05, -2.9752030968666077e-05, -2.8531067073345184e-05, -2.7310103178024292e-05, -2.60891392827034e-05, -2.4868175387382507e-05, -2.3647211492061615e-05, -2.2426247596740723e-05, -2.120528370141983e-05, -1.9984319806098938e-05, -1.8763355910778046e-05, -1.7542392015457153e-05, -1.632142812013626e-05, -1.5100464224815369e-05, -1.3879500329494476e-05, -1.2658536434173584e-05, -1.1437572538852692e-05, -1.02166086435318e-05, -8.995644748210907e-06, -7.774680852890015e-06, -6.553716957569122e-06, -5.33275306224823e-06, -4.111789166927338e-06, -2.8908252716064453e-06, -1.669861376285553e-06, -4.4889748096466064e-07, 7.720664143562317e-07, 1.993030309677124e-06, 3.2139942049980164e-06, 4.434958100318909e-06, 5.655921995639801e-06, 6.876885890960693e-06, 8.097849786281586e-06, 9.318813681602478e-06, 1.053977757692337e-05, 1.1760741472244263e-05, 1.2981705367565155e-05, 1.4202669262886047e-05, 1.542363315820694e-05, 1.6644597053527832e-05, 1.7865560948848724e-05, 1.9086524844169617e-05, 2.030748873949051e-05, 2.15284526348114e-05, 2.2749416530132294e-05, 2.3970380425453186e-05, 2.519134432077408e-05, 2.641230821609497e-05, 2.7633272111415863e-05, 2.8854236006736755e-05, 3.0075199902057648e-05, 3.129616379737854e-05, 3.251712769269943e-05, 3.3738091588020325e-05, 3.495905548334122e-05, 3.618001937866211e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 15.0, 16.0, 23.0, 34.0, 68.0, 102.0, 202.0, 394.0, 915.0, 2607.0, 9587.0, 62196.0, 792126.0, 155123.0, 18554.0, 4177.0, 1288.0, 552.0, 234.0, 118.0, 71.0, 44.0, 39.0, 21.0, 17.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14550399780273438, -0.14183807373046875, -0.13817214965820312, -0.1345062255859375, -0.13084030151367188, -0.12717437744140625, -0.12350845336914062, -0.119842529296875, -0.11617660522460938, -0.11251068115234375, -0.10884475708007812, -0.1051788330078125, -0.10151290893554688, -0.09784698486328125, -0.09418106079101562, -0.09051513671875, -0.08684921264648438, -0.08318328857421875, -0.07951736450195312, -0.0758514404296875, -0.07218551635742188, -0.06851959228515625, -0.06485366821289062, -0.061187744140625, -0.057521820068359375, -0.05385589599609375, -0.050189971923828125, -0.0465240478515625, -0.042858123779296875, -0.03919219970703125, -0.035526275634765625, -0.0318603515625, -0.028194427490234375, -0.02452850341796875, -0.020862579345703125, -0.0171966552734375, -0.013530731201171875, -0.00986480712890625, -0.006198883056640625, -0.002532958984375, 0.001132965087890625, 0.00479888916015625, 0.008464813232421875, 0.0121307373046875, 0.015796661376953125, 0.01946258544921875, 0.023128509521484375, 0.02679443359375, 0.030460357666015625, 0.03412628173828125, 0.037792205810546875, 0.0414581298828125, 0.045124053955078125, 0.04878997802734375, 0.052455902099609375, 0.056121826171875, 0.059787750244140625, 0.06345367431640625, 0.06711959838867188, 0.0707855224609375, 0.07445144653320312, 0.07811737060546875, 0.08178329467773438, 0.08544921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 9.0, 2.0, 8.0, 6.0, 8.0, 9.0, 18.0, 20.0, 22.0, 31.0, 51.0, 57.0, 81.0, 106.0, 120.0, 103.0, 101.0, 53.0, 37.0, 40.0, 22.0, 22.0, 17.0, 22.0, 15.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.128173828125, -0.12515735626220703, -0.12214088439941406, -0.1191244125366211, -0.11610794067382812, -0.11309146881103516, -0.11007499694824219, -0.10705852508544922, -0.10404205322265625, -0.10102558135986328, -0.09800910949707031, -0.09499263763427734, -0.09197616577148438, -0.0889596939086914, -0.08594322204589844, -0.08292675018310547, -0.0799102783203125, -0.07689380645751953, -0.07387733459472656, -0.0708608627319336, -0.06784439086914062, -0.06482791900634766, -0.06181144714355469, -0.05879497528076172, -0.05577850341796875, -0.05276203155517578, -0.04974555969238281, -0.046729087829589844, -0.043712615966796875, -0.040696144104003906, -0.03767967224121094, -0.03466320037841797, -0.031646728515625, -0.02863025665283203, -0.025613784790039062, -0.022597312927246094, -0.019580841064453125, -0.016564369201660156, -0.013547897338867188, -0.010531425476074219, -0.00751495361328125, -0.004498481750488281, -0.0014820098876953125, 0.0015344619750976562, 0.004550933837890625, 0.007567405700683594, 0.010583877563476562, 0.013600349426269531, 0.0166168212890625, 0.01963329315185547, 0.022649765014648438, 0.025666236877441406, 0.028682708740234375, 0.031699180603027344, 0.03471565246582031, 0.03773212432861328, 0.04074859619140625, 0.04376506805419922, 0.04678153991699219, 0.049798011779785156, 0.052814483642578125, 0.055830955505371094, 0.05884742736816406, 0.06186389923095703, 0.06488037109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 19.0, 32.0, 52.0, 107.0, 148.0, 301.0, 117.0, 75.0, 45.0, 33.0, 17.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1613118648529053, -2.1052229404449463, -2.0491340160369873, -1.9930450916290283, -1.9369560480117798, -1.8808671236038208, -1.8247781991958618, -1.7686892747879028, -1.7126003503799438, -1.6565114259719849, -1.6004225015640259, -1.5443334579467773, -1.4882445335388184, -1.4321556091308594, -1.3760666847229004, -1.3199777603149414, -1.2638888359069824, -1.2077999114990234, -1.1517109870910645, -1.0956220626831055, -1.039533019065857, -0.983444094657898, -0.927355170249939, -0.87126624584198, -0.8151772022247314, -0.7590882778167725, -0.7029992938041687, -0.6469103693962097, -0.5908214449882507, -0.534732460975647, -0.478643536567688, -0.422554612159729, -0.36646568775177, -0.31037673354148865, -0.25428780913352966, -0.1981988549232483, -0.1421099156141281, -0.08602097630500793, -0.029932022094726562, 0.026156902313232422, 0.0822458565235138, 0.13833479583263397, 0.19442373514175415, 0.2505126893520355, 0.3066016435623169, 0.3626905679702759, 0.41877952218055725, 0.47486844658851624, 0.5309574007987976, 0.5870463252067566, 0.6431353092193604, 0.6992242336273193, 0.7553131580352783, 0.8114020824432373, 0.8674910664558411, 0.9235799908638, 0.9796689748764038, 1.0357578992843628, 1.0918468236923218, 1.1479358673095703, 1.2040247917175293, 1.2601137161254883, 1.3162026405334473, 1.3722915649414062, 1.4283804893493652]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 9.0, 14.0, 14.0, 10.0, 14.0, 17.0, 14.0, 23.0, 23.0, 29.0, 20.0, 30.0, 36.0, 43.0, 69.0, 103.0, 101.0, 72.0, 46.0, 42.0, 29.0, 29.0, 29.0, 19.0, 20.0, 14.0, 15.0, 18.0, 10.0, 10.0, 7.0, 4.0, 6.0, 7.0, 8.0, 2.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3526108264923096, -1.3089009523391724, -1.2651911973953247, -1.2214813232421875, -1.1777715682983398, -1.1340616941452026, -1.0903518199920654, -1.0466420650482178, -1.0029321908950806, -0.9592223763465881, -0.9155125617980957, -0.8718026876449585, -0.8280928730964661, -0.7843830585479736, -0.7406731843948364, -0.696963369846344, -0.6532535552978516, -0.6095437407493591, -0.5658339262008667, -0.5221240520477295, -0.47841423749923706, -0.43470442295074463, -0.3909945785999298, -0.347284734249115, -0.30357491970062256, -0.2598651051521301, -0.2161552608013153, -0.17244543135166168, -0.12873560190200806, -0.08502577245235443, -0.041315943002700806, 0.0023939013481140137, 0.046103835105895996, 0.08981366455554962, 0.13352349400520325, 0.17723332345485687, 0.2209431529045105, 0.26465296745300293, 0.30836281180381775, 0.35207265615463257, 0.395782470703125, 0.43949228525161743, 0.48320212960243225, 0.5269119739532471, 0.5706217885017395, 0.6143316030502319, 0.6580414772033691, 0.7017512917518616, 0.745461106300354, 0.7891709208488464, 0.8328807353973389, 0.8765906095504761, 0.9203004240989685, 0.9640102386474609, 1.0077201128005981, 1.0514299869537354, 1.095139741897583, 1.1388496160507202, 1.1825593709945679, 1.226269245147705, 1.2699790000915527, 1.31368887424469, 1.3573987483978271, 1.4011085033416748, 1.444818377494812]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 15.0, 14.0, 19.0, 23.0, 29.0, 43.0, 41.0, 53.0, 70.0, 109.0, 182.0, 299.0, 605.0, 1388.0, 4393.0, 25314.0, 392459.0, 3037558.0, 679716.0, 42491.0, 6054.0, 1780.0, 688.0, 286.0, 183.0, 92.0, 71.0, 54.0, 55.0, 41.0, 35.0, 33.0, 19.0, 17.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14861106872558594, -0.14341354370117188, -0.1382160186767578, -0.13301849365234375, -0.1278209686279297, -0.12262344360351562, -0.11742591857910156, -0.1122283935546875, -0.10703086853027344, -0.10183334350585938, -0.09663581848144531, -0.09143829345703125, -0.08624076843261719, -0.08104324340820312, -0.07584571838378906, -0.070648193359375, -0.06545066833496094, -0.060253143310546875, -0.05505561828613281, -0.04985809326171875, -0.04466056823730469, -0.039463043212890625, -0.03426551818847656, -0.0290679931640625, -0.023870468139648438, -0.018672943115234375, -0.013475418090820312, -0.00827789306640625, -0.0030803680419921875, 0.002117156982421875, 0.0073146820068359375, 0.01251220703125, 0.017709732055664062, 0.022907257080078125, 0.028104782104492188, 0.03330230712890625, 0.03849983215332031, 0.043697357177734375, 0.04889488220214844, 0.0540924072265625, 0.05928993225097656, 0.06448745727539062, 0.06968498229980469, 0.07488250732421875, 0.08008003234863281, 0.08527755737304688, 0.09047508239746094, 0.095672607421875, 0.10087013244628906, 0.10606765747070312, 0.11126518249511719, 0.11646270751953125, 0.12166023254394531, 0.12685775756835938, 0.13205528259277344, 0.1372528076171875, 0.14245033264160156, 0.14764785766601562, 0.1528453826904297, 0.15804290771484375, 0.1632404327392578, 0.16843795776367188, 0.17363548278808594, 0.1788330078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 8.0, 8.0, 4.0, 12.0, 14.0, 13.0, 22.0, 26.0, 24.0, 38.0, 37.0, 38.0, 47.0, 30.0, 59.0, 46.0, 42.0, 56.0, 39.0, 55.0, 60.0, 42.0, 35.0, 42.0, 40.0, 35.0, 19.0, 20.0, 20.0, 18.0, 11.0, 9.0, 6.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11773681640625, -0.11440181732177734, -0.11106681823730469, -0.10773181915283203, -0.10439682006835938, -0.10106182098388672, -0.09772682189941406, -0.0943918228149414, -0.09105682373046875, -0.0877218246459961, -0.08438682556152344, -0.08105182647705078, -0.07771682739257812, -0.07438182830810547, -0.07104682922363281, -0.06771183013916016, -0.0643768310546875, -0.061041831970214844, -0.05770683288574219, -0.05437183380126953, -0.051036834716796875, -0.04770183563232422, -0.04436683654785156, -0.041031837463378906, -0.03769683837890625, -0.034361839294433594, -0.031026840209960938, -0.02769184112548828, -0.024356842041015625, -0.02102184295654297, -0.017686843872070312, -0.014351844787597656, -0.011016845703125, -0.007681846618652344, -0.0043468475341796875, -0.0010118484497070312, 0.002323150634765625, 0.005658149719238281, 0.008993148803710938, 0.012328147888183594, 0.01566314697265625, 0.018998146057128906, 0.022333145141601562, 0.02566814422607422, 0.029003143310546875, 0.03233814239501953, 0.03567314147949219, 0.039008140563964844, 0.0423431396484375, 0.045678138732910156, 0.04901313781738281, 0.05234813690185547, 0.055683135986328125, 0.05901813507080078, 0.06235313415527344, 0.0656881332397461, 0.06902313232421875, 0.0723581314086914, 0.07569313049316406, 0.07902812957763672, 0.08236312866210938, 0.08569812774658203, 0.08903312683105469, 0.09236812591552734, 0.095703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 14.0, 24.0, 36.0, 67.0, 128.0, 255.0, 738.0, 2635.0, 32149.0, 3936723.0, 213263.0, 6369.0, 1098.0, 374.0, 188.0, 75.0, 45.0, 30.0, 15.0, 13.0, 2.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.49018096923828125, -0.4764556884765625, -0.46273040771484375, -0.449005126953125, -0.43527984619140625, -0.4215545654296875, -0.40782928466796875, -0.39410400390625, -0.38037872314453125, -0.3666534423828125, -0.35292816162109375, -0.339202880859375, -0.32547760009765625, -0.3117523193359375, -0.29802703857421875, -0.2843017578125, -0.27057647705078125, -0.2568511962890625, -0.24312591552734375, -0.229400634765625, -0.21567535400390625, -0.2019500732421875, -0.18822479248046875, -0.17449951171875, -0.16077423095703125, -0.1470489501953125, -0.13332366943359375, -0.119598388671875, -0.10587310791015625, -0.0921478271484375, -0.07842254638671875, -0.064697265625, -0.05097198486328125, -0.0372467041015625, -0.02352142333984375, -0.009796142578125, 0.00392913818359375, 0.0176544189453125, 0.03137969970703125, 0.04510498046875, 0.05883026123046875, 0.0725555419921875, 0.08628082275390625, 0.100006103515625, 0.11373138427734375, 0.1274566650390625, 0.14118194580078125, 0.1549072265625, 0.16863250732421875, 0.1823577880859375, 0.19608306884765625, 0.209808349609375, 0.22353363037109375, 0.2372589111328125, 0.25098419189453125, 0.26470947265625, 0.27843475341796875, 0.2921600341796875, 0.30588531494140625, 0.319610595703125, 0.33333587646484375, 0.3470611572265625, 0.36078643798828125, 0.37451171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 4.0, 19.0, 25.0, 30.0, 38.0, 69.0, 103.0, 178.0, 336.0, 640.0, 892.0, 728.0, 420.0, 248.0, 114.0, 79.0, 49.0, 24.0, 21.0, 14.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2020263671875, -0.19414329528808594, -0.18626022338867188, -0.1783771514892578, -0.17049407958984375, -0.1626110076904297, -0.15472793579101562, -0.14684486389160156, -0.1389617919921875, -0.13107872009277344, -0.12319564819335938, -0.11531257629394531, -0.10742950439453125, -0.09954643249511719, -0.09166336059570312, -0.08378028869628906, -0.075897216796875, -0.06801414489746094, -0.060131072998046875, -0.05224800109863281, -0.04436492919921875, -0.03648185729980469, -0.028598785400390625, -0.020715713500976562, -0.0128326416015625, -0.0049495697021484375, 0.002933502197265625, 0.010816574096679688, 0.01869964599609375, 0.026582717895507812, 0.034465789794921875, 0.04234886169433594, 0.05023193359375, 0.05811500549316406, 0.06599807739257812, 0.07388114929199219, 0.08176422119140625, 0.08964729309082031, 0.09753036499023438, 0.10541343688964844, 0.1132965087890625, 0.12117958068847656, 0.12906265258789062, 0.1369457244873047, 0.14482879638671875, 0.1527118682861328, 0.16059494018554688, 0.16847801208496094, 0.176361083984375, 0.18424415588378906, 0.19212722778320312, 0.2000102996826172, 0.20789337158203125, 0.2157764434814453, 0.22365951538085938, 0.23154258728027344, 0.2394256591796875, 0.24730873107910156, 0.2551918029785156, 0.2630748748779297, 0.27095794677734375, 0.2788410186767578, 0.2867240905761719, 0.29460716247558594, 0.302490234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 13.0, 34.0, 64.0, 223.0, 317.0, 208.0, 98.0, 18.0, 14.0, 8.0, 4.0, 2.0], "bins": [-5.664047718048096, -5.56368350982666, -5.463318824768066, -5.362954616546631, -5.262590408325195, -5.162225723266602, -5.061861515045166, -4.9614973068237305, -4.861132621765137, -4.760768413543701, -4.660403728485107, -4.560039520263672, -4.459675312042236, -4.359310626983643, -4.258946418762207, -4.158581733703613, -4.058217525482178, -3.957853078842163, -3.8574888706207275, -3.757124423980713, -3.6567599773406982, -3.5563955307006836, -3.456031322479248, -3.3556668758392334, -3.255302667617798, -3.154938220977783, -3.0545740127563477, -2.954209566116333, -2.8538451194763184, -2.753480911254883, -2.653116464614868, -2.5527520179748535, -2.4523873329162598, -2.352022886276245, -2.2516586780548096, -2.151294231414795, -2.0509297847747803, -1.9505654573440552, -1.85020112991333, -1.7498366832733154, -1.6494724750518799, -1.5491081476211548, -1.4487437009811401, -1.348379373550415, -1.2480149269104004, -1.1476505994796753, -1.0472862720489502, -0.9469218254089355, -0.8465573787689209, -0.746192991733551, -0.6458286046981812, -0.545464277267456, -0.4450998604297638, -0.3447355031967163, -0.24437111616134644, -0.14400672912597656, -0.04364234209060669, 0.05672203749418259, 0.15708641707897186, 0.25745078921318054, 0.3578151762485504, 0.4581795334815979, 0.5585439205169678, 0.6589083075523376, 0.7592726945877075]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 9.0, 5.0, 8.0, 11.0, 13.0, 20.0, 32.0, 24.0, 23.0, 27.0, 41.0, 36.0, 40.0, 41.0, 58.0, 66.0, 58.0, 52.0, 60.0, 46.0, 53.0, 30.0, 40.0, 38.0, 22.0, 29.0, 22.0, 16.0, 16.0, 13.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8728641867637634, -0.8426277041435242, -0.8123912215232849, -0.7821547985076904, -0.7519183158874512, -0.7216818332672119, -0.6914453506469727, -0.6612088680267334, -0.6309723854064941, -0.6007359027862549, -0.5704994201660156, -0.5402629375457764, -0.5100265145301819, -0.4797900319099426, -0.44955354928970337, -0.4193170666694641, -0.38908064365386963, -0.35884416103363037, -0.3286077082157135, -0.29837122559547424, -0.2681347727775574, -0.23789829015731812, -0.20766180753707886, -0.1774253398180008, -0.14718887209892273, -0.11695240437984467, -0.086715929210186, -0.056479454040527344, -0.02624298632144928, 0.003993481397628784, 0.03422996401786804, 0.0644664317369461, 0.0947028398513794, 0.12493930757045746, 0.15517577528953552, 0.18541225790977478, 0.21564872562885284, 0.2458851933479309, 0.27612167596817017, 0.3063581585884094, 0.3365946114063263, 0.36683109402656555, 0.3970675468444824, 0.4273040294647217, 0.45754051208496094, 0.4877769649028778, 0.5180134773254395, 0.5482499003410339, 0.5784863829612732, 0.6087228655815125, 0.6389593482017517, 0.6691957712173462, 0.6994322538375854, 0.7296687364578247, 0.759905219078064, 0.7901417016983032, 0.8203781843185425, 0.8506146669387817, 0.880851149559021, 0.9110876321792603, 0.9413240551948547, 0.971560537815094, 1.0017969608306885, 1.0320334434509277, 1.062269926071167]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 8.0, 12.0, 13.0, 20.0, 34.0, 42.0, 72.0, 113.0, 180.0, 295.0, 442.0, 801.0, 1307.0, 2262.0, 3975.0, 7678.0, 15827.0, 35103.0, 83079.0, 219813.0, 369613.0, 180276.0, 69035.0, 29699.0, 13546.0, 6869.0, 3565.0, 1871.0, 1169.0, 667.0, 408.0, 279.0, 155.0, 119.0, 60.0, 53.0, 25.0, 19.0, 21.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.1187143325805664, -0.11480903625488281, -0.11090373992919922, -0.10699844360351562, -0.10309314727783203, -0.09918785095214844, -0.09528255462646484, -0.09137725830078125, -0.08747196197509766, -0.08356666564941406, -0.07966136932373047, -0.07575607299804688, -0.07185077667236328, -0.06794548034667969, -0.0640401840209961, -0.0601348876953125, -0.056229591369628906, -0.05232429504394531, -0.04841899871826172, -0.044513702392578125, -0.04060840606689453, -0.03670310974121094, -0.032797813415527344, -0.02889251708984375, -0.024987220764160156, -0.021081924438476562, -0.01717662811279297, -0.013271331787109375, -0.009366035461425781, -0.0054607391357421875, -0.0015554428100585938, 0.002349853515625, 0.006255149841308594, 0.010160446166992188, 0.014065742492675781, 0.017971038818359375, 0.02187633514404297, 0.025781631469726562, 0.029686927795410156, 0.03359222412109375, 0.037497520446777344, 0.04140281677246094, 0.04530811309814453, 0.049213409423828125, 0.05311870574951172, 0.05702400207519531, 0.060929298400878906, 0.0648345947265625, 0.0687398910522461, 0.07264518737792969, 0.07655048370361328, 0.08045578002929688, 0.08436107635498047, 0.08826637268066406, 0.09217166900634766, 0.09607696533203125, 0.09998226165771484, 0.10388755798339844, 0.10779285430908203, 0.11169815063476562, 0.11560344696044922, 0.11950874328613281, 0.1234140396118164, 0.1273193359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 16.0, 12.0, 10.0, 22.0, 21.0, 18.0, 27.0, 29.0, 38.0, 40.0, 53.0, 44.0, 47.0, 62.0, 24.0, 52.0, 38.0, 56.0, 51.0, 47.0, 37.0, 27.0, 29.0, 34.0, 22.0, 24.0, 19.0, 15.0, 19.0, 11.0, 12.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.11328125, -0.11006927490234375, -0.1068572998046875, -0.10364532470703125, -0.100433349609375, -0.09722137451171875, -0.0940093994140625, -0.09079742431640625, -0.08758544921875, -0.08437347412109375, -0.0811614990234375, -0.07794952392578125, -0.074737548828125, -0.07152557373046875, -0.0683135986328125, -0.06510162353515625, -0.0618896484375, -0.05867767333984375, -0.0554656982421875, -0.05225372314453125, -0.049041748046875, -0.04582977294921875, -0.0426177978515625, -0.03940582275390625, -0.03619384765625, -0.03298187255859375, -0.0297698974609375, -0.02655792236328125, -0.023345947265625, -0.02013397216796875, -0.0169219970703125, -0.01371002197265625, -0.010498046875, -0.00728607177734375, -0.0040740966796875, -0.00086212158203125, 0.002349853515625, 0.00556182861328125, 0.0087738037109375, 0.01198577880859375, 0.01519775390625, 0.01840972900390625, 0.0216217041015625, 0.02483367919921875, 0.028045654296875, 0.03125762939453125, 0.0344696044921875, 0.03768157958984375, 0.0408935546875, 0.04410552978515625, 0.0473175048828125, 0.05052947998046875, 0.053741455078125, 0.05695343017578125, 0.0601654052734375, 0.06337738037109375, 0.06658935546875, 0.06980133056640625, 0.0730133056640625, 0.07622528076171875, 0.079437255859375, 0.08264923095703125, 0.0858612060546875, 0.08907318115234375, 0.09228515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 16.0, 17.0, 17.0, 35.0, 40.0, 80.0, 102.0, 131.0, 290.0, 475.0, 943.0, 2185.0, 10887.0, 338912.0, 677141.0, 12686.0, 2350.0, 990.0, 469.0, 277.0, 177.0, 109.0, 68.0, 44.0, 26.0, 26.0, 15.0, 12.0, 11.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448974609375, -0.4345054626464844, -0.42003631591796875, -0.4055671691894531, -0.3910980224609375, -0.3766288757324219, -0.36215972900390625, -0.3476905822753906, -0.333221435546875, -0.3187522888183594, -0.30428314208984375, -0.2898139953613281, -0.2753448486328125, -0.2608757019042969, -0.24640655517578125, -0.23193740844726562, -0.21746826171875, -0.20299911499023438, -0.18852996826171875, -0.17406082153320312, -0.1595916748046875, -0.14512252807617188, -0.13065338134765625, -0.11618423461914062, -0.101715087890625, -0.08724594116210938, -0.07277679443359375, -0.058307647705078125, -0.0438385009765625, -0.029369354248046875, -0.01490020751953125, -0.000431060791015625, 0.0140380859375, 0.028507232666015625, 0.04297637939453125, 0.057445526123046875, 0.0719146728515625, 0.08638381958007812, 0.10085296630859375, 0.11532211303710938, 0.129791259765625, 0.14426040649414062, 0.15872955322265625, 0.17319869995117188, 0.1876678466796875, 0.20213699340820312, 0.21660614013671875, 0.23107528686523438, 0.24554443359375, 0.2600135803222656, 0.27448272705078125, 0.2889518737792969, 0.3034210205078125, 0.3178901672363281, 0.33235931396484375, 0.3468284606933594, 0.361297607421875, 0.3757667541503906, 0.39023590087890625, 0.4047050476074219, 0.4191741943359375, 0.4336433410644531, 0.44811248779296875, 0.4625816345214844, 0.47705078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 4.0, 5.0, 10.0, 18.0, 20.0, 22.0, 36.0, 40.0, 55.0, 57.0, 62.0, 86.0, 64.0, 79.0, 81.0, 62.0, 60.0, 47.0, 51.0, 27.0, 24.0, 17.0, 14.0, 15.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5628204345703125, -0.547027587890625, -0.5312347412109375, -0.51544189453125, -0.4996490478515625, -0.483856201171875, -0.4680633544921875, -0.4522705078125, -0.4364776611328125, -0.420684814453125, -0.4048919677734375, -0.38909912109375, -0.3733062744140625, -0.357513427734375, -0.3417205810546875, -0.325927734375, -0.3101348876953125, -0.294342041015625, -0.2785491943359375, -0.26275634765625, -0.2469635009765625, -0.231170654296875, -0.2153778076171875, -0.1995849609375, -0.1837921142578125, -0.167999267578125, -0.1522064208984375, -0.13641357421875, -0.1206207275390625, -0.104827880859375, -0.0890350341796875, -0.0732421875, -0.0574493408203125, -0.041656494140625, -0.0258636474609375, -0.01007080078125, 0.0057220458984375, 0.021514892578125, 0.0373077392578125, 0.0531005859375, 0.0688934326171875, 0.084686279296875, 0.1004791259765625, 0.11627197265625, 0.1320648193359375, 0.147857666015625, 0.1636505126953125, 0.179443359375, 0.1952362060546875, 0.211029052734375, 0.2268218994140625, 0.24261474609375, 0.2584075927734375, 0.274200439453125, 0.2899932861328125, 0.3057861328125, 0.3215789794921875, 0.337371826171875, 0.3531646728515625, 0.36895751953125, 0.3847503662109375, 0.400543212890625, 0.4163360595703125, 0.43212890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 12.0, 20.0, 36.0, 60.0, 91.0, 147.0, 319.0, 710.0, 2046.0, 7701.0, 43152.0, 768306.0, 198129.0, 20833.0, 4462.0, 1366.0, 518.0, 227.0, 140.0, 76.0, 49.0, 24.0, 15.0, 14.0, 11.0, 14.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08660888671875, -0.08388614654541016, -0.08116340637207031, -0.07844066619873047, -0.07571792602539062, -0.07299518585205078, -0.07027244567871094, -0.0675497055053711, -0.06482696533203125, -0.062104225158691406, -0.05938148498535156, -0.05665874481201172, -0.053936004638671875, -0.05121326446533203, -0.04849052429199219, -0.045767784118652344, -0.0430450439453125, -0.040322303771972656, -0.03759956359863281, -0.03487682342529297, -0.032154083251953125, -0.02943134307861328, -0.026708602905273438, -0.023985862731933594, -0.02126312255859375, -0.018540382385253906, -0.015817642211914062, -0.013094902038574219, -0.010372161865234375, -0.007649421691894531, -0.0049266815185546875, -0.0022039413452148438, 0.000518798828125, 0.0032415390014648438, 0.0059642791748046875, 0.008687019348144531, 0.011409759521484375, 0.014132499694824219, 0.016855239868164062, 0.019577980041503906, 0.02230072021484375, 0.025023460388183594, 0.027746200561523438, 0.03046894073486328, 0.033191680908203125, 0.03591442108154297, 0.03863716125488281, 0.041359901428222656, 0.0440826416015625, 0.046805381774902344, 0.04952812194824219, 0.05225086212158203, 0.054973602294921875, 0.05769634246826172, 0.06041908264160156, 0.0631418228149414, 0.06586456298828125, 0.0685873031616211, 0.07131004333496094, 0.07403278350830078, 0.07675552368164062, 0.07947826385498047, 0.08220100402832031, 0.08492374420166016, 0.087646484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 8.0, 2.0, 3.0, 8.0, 11.0, 10.0, 16.0, 22.0, 16.0, 16.0, 30.0, 27.0, 39.0, 55.0, 71.0, 79.0, 86.0, 89.0, 80.0, 65.0, 46.0, 53.0, 33.0, 24.0, 23.0, 16.0, 21.0, 9.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9012560844421387e-05, -2.804398536682129e-05, -2.707540988922119e-05, -2.6106834411621094e-05, -2.5138258934020996e-05, -2.41696834564209e-05, -2.32011079788208e-05, -2.2232532501220703e-05, -2.1263957023620605e-05, -2.0295381546020508e-05, -1.932680606842041e-05, -1.8358230590820312e-05, -1.7389655113220215e-05, -1.6421079635620117e-05, -1.545250415802002e-05, -1.4483928680419922e-05, -1.3515353202819824e-05, -1.2546777725219727e-05, -1.1578202247619629e-05, -1.0609626770019531e-05, -9.641051292419434e-06, -8.672475814819336e-06, -7.703900337219238e-06, -6.735324859619141e-06, -5.766749382019043e-06, -4.798173904418945e-06, -3.829598426818848e-06, -2.86102294921875e-06, -1.8924474716186523e-06, -9.238719940185547e-07, 4.470348358154297e-08, 1.0132789611816406e-06, 1.9818544387817383e-06, 2.950429916381836e-06, 3.919005393981934e-06, 4.887580871582031e-06, 5.856156349182129e-06, 6.8247318267822266e-06, 7.793307304382324e-06, 8.761882781982422e-06, 9.73045825958252e-06, 1.0699033737182617e-05, 1.1667609214782715e-05, 1.2636184692382812e-05, 1.360476016998291e-05, 1.4573335647583008e-05, 1.5541911125183105e-05, 1.6510486602783203e-05, 1.74790620803833e-05, 1.84476375579834e-05, 1.9416213035583496e-05, 2.0384788513183594e-05, 2.135336399078369e-05, 2.232193946838379e-05, 2.3290514945983887e-05, 2.4259090423583984e-05, 2.5227665901184082e-05, 2.619624137878418e-05, 2.7164816856384277e-05, 2.8133392333984375e-05, 2.9101967811584473e-05, 3.007054328918457e-05, 3.103911876678467e-05, 3.2007694244384766e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 15.0, 9.0, 25.0, 38.0, 44.0, 81.0, 131.0, 173.0, 367.0, 691.0, 1622.0, 4513.0, 17840.0, 122369.0, 790389.0, 89436.0, 14170.0, 3755.0, 1369.0, 642.0, 328.0, 173.0, 111.0, 70.0, 44.0, 40.0, 29.0, 22.0, 9.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06609535217285156, -0.06377029418945312, -0.06144523620605469, -0.05912017822265625, -0.05679512023925781, -0.054470062255859375, -0.05214500427246094, -0.0498199462890625, -0.04749488830566406, -0.045169830322265625, -0.04284477233886719, -0.04051971435546875, -0.03819465637207031, -0.035869598388671875, -0.03354454040527344, -0.031219482421875, -0.028894424438476562, -0.026569366455078125, -0.024244308471679688, -0.02191925048828125, -0.019594192504882812, -0.017269134521484375, -0.014944076538085938, -0.0126190185546875, -0.010293960571289062, -0.007968902587890625, -0.0056438446044921875, -0.00331878662109375, -0.0009937286376953125, 0.001331329345703125, 0.0036563873291015625, 0.0059814453125, 0.008306503295898438, 0.010631561279296875, 0.012956619262695312, 0.01528167724609375, 0.017606735229492188, 0.019931793212890625, 0.022256851196289062, 0.0245819091796875, 0.026906967163085938, 0.029232025146484375, 0.03155708312988281, 0.03388214111328125, 0.03620719909667969, 0.038532257080078125, 0.04085731506347656, 0.043182373046875, 0.04550743103027344, 0.047832489013671875, 0.05015754699707031, 0.05248260498046875, 0.05480766296386719, 0.057132720947265625, 0.05945777893066406, 0.0617828369140625, 0.06410789489746094, 0.06643295288085938, 0.06875801086425781, 0.07108306884765625, 0.07340812683105469, 0.07573318481445312, 0.07805824279785156, 0.08038330078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 8.0, 15.0, 14.0, 15.0, 29.0, 19.0, 40.0, 57.0, 84.0, 150.0, 127.0, 115.0, 87.0, 61.0, 54.0, 27.0, 32.0, 17.0, 7.0, 14.0, 7.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.062419891357421875, -0.05977630615234375, -0.057132720947265625, -0.0544891357421875, -0.051845550537109375, -0.04920196533203125, -0.046558380126953125, -0.043914794921875, -0.041271209716796875, -0.03862762451171875, -0.035984039306640625, -0.0333404541015625, -0.030696868896484375, -0.02805328369140625, -0.025409698486328125, -0.02276611328125, -0.020122528076171875, -0.01747894287109375, -0.014835357666015625, -0.0121917724609375, -0.009548187255859375, -0.00690460205078125, -0.004261016845703125, -0.001617431640625, 0.001026153564453125, 0.00366973876953125, 0.006313323974609375, 0.0089569091796875, 0.011600494384765625, 0.01424407958984375, 0.016887664794921875, 0.01953125, 0.022174835205078125, 0.02481842041015625, 0.027462005615234375, 0.0301055908203125, 0.032749176025390625, 0.03539276123046875, 0.038036346435546875, 0.040679931640625, 0.043323516845703125, 0.04596710205078125, 0.048610687255859375, 0.0512542724609375, 0.053897857666015625, 0.05654144287109375, 0.059185028076171875, 0.06182861328125, 0.06447219848632812, 0.06711578369140625, 0.06975936889648438, 0.0724029541015625, 0.07504653930664062, 0.07769012451171875, 0.08033370971679688, 0.082977294921875, 0.08562088012695312, 0.08826446533203125, 0.09090805053710938, 0.0935516357421875, 0.09619522094726562, 0.09883880615234375, 0.10148239135742188, 0.1041259765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 10.0, 15.0, 38.0, 113.0, 307.0, 385.0, 91.0, 30.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8249331712722778, -1.7238578796386719, -1.6227824687957764, -1.5217071771621704, -1.4206318855285645, -1.319556474685669, -1.218481183052063, -1.117405891418457, -1.0163304805755615, -0.9152551293373108, -0.8141798377037048, -0.7131044864654541, -0.6120291948318481, -0.5109538435935974, -0.4098784923553467, -0.3088032007217407, -0.20772790908813477, -0.10665258020162582, -0.005577251315116882, 0.09549808502197266, 0.196573406457901, 0.29764872789382935, 0.3987240791320801, 0.49979937076568604, 0.6008747220039368, 0.7019500732421875, 0.8030253648757935, 0.9041007161140442, 1.005176067352295, 1.1062513589859009, 1.2073266506195068, 1.3084020614624023, 1.4094774723052979, 1.5105527639389038, 1.6116281747817993, 1.7127034664154053, 1.8137787580490112, 1.9148540496826172, 2.0159294605255127, 2.117004871368408, 2.2180800437927246, 2.31915545463562, 2.4202306270599365, 2.521306037902832, 2.6223814487457275, 2.723456621170044, 2.8245320320129395, 2.925607204437256, 3.0266828536987305, 3.127758264541626, 3.2288334369659424, 3.329908847808838, 3.4309842586517334, 3.53205943107605, 3.6331348419189453, 3.7342100143432617, 3.8352854251861572, 3.9363608360290527, 4.037436008453369, 4.138511657714844, 4.23958683013916, 4.340662002563477, 4.441737174987793, 4.542812824249268, 4.643887996673584]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 8.0, 3.0, 9.0, 7.0, 13.0, 12.0, 12.0, 15.0, 15.0, 24.0, 16.0, 23.0, 34.0, 34.0, 38.0, 60.0, 87.0, 176.0, 75.0, 52.0, 39.0, 38.0, 27.0, 29.0, 25.0, 20.0, 18.0, 20.0, 13.0, 12.0, 7.0, 3.0, 8.0, 4.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3344430923461914, -1.2888784408569336, -1.2433139085769653, -1.1977492570877075, -1.1521847248077393, -1.1066200733184814, -1.0610554218292236, -1.0154907703399658, -0.9699262380599976, -0.9243616461753845, -0.8787970542907715, -0.8332324028015137, -0.7876678109169006, -0.7421032190322876, -0.6965385675430298, -0.6509739756584167, -0.6054093837738037, -0.5598447918891907, -0.5142802000045776, -0.4687155485153198, -0.4231509566307068, -0.37758636474609375, -0.3320217430591583, -0.2864571213722229, -0.24089252948760986, -0.19532792270183563, -0.1497633159160614, -0.10419870913028717, -0.05863410234451294, -0.013069495558738708, 0.03249511122703552, 0.07805973291397095, 0.12362432479858398, 0.16918893158435822, 0.21475353837013245, 0.26031816005706787, 0.3058827519416809, 0.35144734382629395, 0.39701196551322937, 0.4425765872001648, 0.48814117908477783, 0.5337057709693909, 0.5792703628540039, 0.6248350143432617, 0.6703996062278748, 0.7159641981124878, 0.7615288496017456, 0.8070934414863586, 0.8526580333709717, 0.8982226252555847, 0.9437872171401978, 0.9893518686294556, 1.0349164009094238, 1.0804810523986816, 1.1260457038879395, 1.1716103553771973, 1.2171748876571655, 1.2627395391464233, 1.3083040714263916, 1.3538687229156494, 1.3994333744049072, 1.4449979066848755, 1.4905625581741333, 1.5361270904541016, 1.5816917419433594]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 15.0, 17.0, 30.0, 42.0, 48.0, 67.0, 90.0, 121.0, 174.0, 308.0, 416.0, 593.0, 965.0, 1506.0, 2660.0, 5009.0, 10397.0, 26402.0, 82610.0, 289211.0, 883815.0, 1555223.0, 903211.0, 296483.0, 83515.0, 28229.0, 10936.0, 4981.0, 2793.0, 1554.0, 901.0, 626.0, 411.0, 264.0, 170.0, 144.0, 88.0, 75.0, 34.0, 33.0, 22.0, 22.0, 19.0, 16.0, 3.0, 3.0, 5.0, 0.0, 8.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0950927734375, -0.09216785430908203, -0.08924293518066406, -0.0863180160522461, -0.08339309692382812, -0.08046817779541016, -0.07754325866699219, -0.07461833953857422, -0.07169342041015625, -0.06876850128173828, -0.06584358215332031, -0.06291866302490234, -0.059993743896484375, -0.057068824768066406, -0.05414390563964844, -0.05121898651123047, -0.0482940673828125, -0.04536914825439453, -0.04244422912597656, -0.039519309997558594, -0.036594390869140625, -0.033669471740722656, -0.030744552612304688, -0.02781963348388672, -0.02489471435546875, -0.02196979522705078, -0.019044876098632812, -0.016119956970214844, -0.013195037841796875, -0.010270118713378906, -0.0073451995849609375, -0.004420280456542969, -0.001495361328125, 0.0014295578002929688, 0.0043544769287109375, 0.007279396057128906, 0.010204315185546875, 0.013129234313964844, 0.016054153442382812, 0.01897907257080078, 0.02190399169921875, 0.02482891082763672, 0.027753829956054688, 0.030678749084472656, 0.033603668212890625, 0.036528587341308594, 0.03945350646972656, 0.04237842559814453, 0.0453033447265625, 0.04822826385498047, 0.05115318298339844, 0.054078102111816406, 0.057003021240234375, 0.059927940368652344, 0.06285285949707031, 0.06577777862548828, 0.06870269775390625, 0.07162761688232422, 0.07455253601074219, 0.07747745513916016, 0.08040237426757812, 0.0833272933959961, 0.08625221252441406, 0.08917713165283203, 0.09210205078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 10.0, 12.0, 14.0, 19.0, 18.0, 30.0, 30.0, 36.0, 41.0, 45.0, 44.0, 48.0, 51.0, 50.0, 40.0, 55.0, 48.0, 49.0, 42.0, 41.0, 36.0, 37.0, 22.0, 32.0, 29.0, 14.0, 16.0, 18.0, 12.0, 10.0, 7.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0992431640625, -0.09629535675048828, -0.09334754943847656, -0.09039974212646484, -0.08745193481445312, -0.0845041275024414, -0.08155632019042969, -0.07860851287841797, -0.07566070556640625, -0.07271289825439453, -0.06976509094238281, -0.0668172836303711, -0.06386947631835938, -0.060921669006347656, -0.05797386169433594, -0.05502605438232422, -0.0520782470703125, -0.04913043975830078, -0.04618263244628906, -0.043234825134277344, -0.040287017822265625, -0.037339210510253906, -0.03439140319824219, -0.03144359588623047, -0.02849578857421875, -0.02554798126220703, -0.022600173950195312, -0.019652366638183594, -0.016704559326171875, -0.013756752014160156, -0.010808944702148438, -0.007861137390136719, -0.004913330078125, -0.0019655227661132812, 0.0009822845458984375, 0.003930091857910156, 0.006877899169921875, 0.009825706481933594, 0.012773513793945312, 0.01572132110595703, 0.01866912841796875, 0.02161693572998047, 0.024564743041992188, 0.027512550354003906, 0.030460357666015625, 0.033408164978027344, 0.03635597229003906, 0.03930377960205078, 0.0422515869140625, 0.04519939422607422, 0.04814720153808594, 0.051095008850097656, 0.054042816162109375, 0.056990623474121094, 0.05993843078613281, 0.06288623809814453, 0.06583404541015625, 0.06878185272216797, 0.07172966003417969, 0.0746774673461914, 0.07762527465820312, 0.08057308197021484, 0.08352088928222656, 0.08646869659423828, 0.08941650390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 5.0, 10.0, 10.0, 6.0, 18.0, 19.0, 29.0, 46.0, 70.0, 89.0, 142.0, 227.0, 377.0, 520.0, 1035.0, 2095.0, 7221.0, 93610.0, 3971736.0, 104698.0, 7754.0, 2140.0, 969.0, 505.0, 318.0, 183.0, 139.0, 88.0, 54.0, 48.0, 22.0, 32.0, 16.0, 11.0, 11.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.51611328125, -0.5015792846679688, -0.4870452880859375, -0.47251129150390625, -0.457977294921875, -0.44344329833984375, -0.4289093017578125, -0.41437530517578125, -0.39984130859375, -0.38530731201171875, -0.3707733154296875, -0.35623931884765625, -0.341705322265625, -0.32717132568359375, -0.3126373291015625, -0.29810333251953125, -0.2835693359375, -0.26903533935546875, -0.2545013427734375, -0.23996734619140625, -0.225433349609375, -0.21089935302734375, -0.1963653564453125, -0.18183135986328125, -0.16729736328125, -0.15276336669921875, -0.1382293701171875, -0.12369537353515625, -0.109161376953125, -0.09462738037109375, -0.0800933837890625, -0.06555938720703125, -0.051025390625, -0.03649139404296875, -0.0219573974609375, -0.00742340087890625, 0.007110595703125, 0.02164459228515625, 0.0361785888671875, 0.05071258544921875, 0.06524658203125, 0.07978057861328125, 0.0943145751953125, 0.10884857177734375, 0.123382568359375, 0.13791656494140625, 0.1524505615234375, 0.16698455810546875, 0.1815185546875, 0.19605255126953125, 0.2105865478515625, 0.22512054443359375, 0.239654541015625, 0.25418853759765625, 0.2687225341796875, 0.28325653076171875, 0.29779052734375, 0.31232452392578125, 0.3268585205078125, 0.34139251708984375, 0.355926513671875, 0.37046051025390625, 0.3849945068359375, 0.39952850341796875, 0.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 12.0, 5.0, 8.0, 6.0, 11.0, 18.0, 20.0, 35.0, 33.0, 56.0, 93.0, 120.0, 194.0, 252.0, 357.0, 479.0, 609.0, 467.0, 367.0, 246.0, 188.0, 134.0, 87.0, 74.0, 48.0, 37.0, 30.0, 28.0, 16.0, 11.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3062782287597656, -0.29785919189453125, -0.2894401550292969, -0.2810211181640625, -0.2726020812988281, -0.26418304443359375, -0.2557640075683594, -0.247344970703125, -0.23892593383789062, -0.23050689697265625, -0.22208786010742188, -0.2136688232421875, -0.20524978637695312, -0.19683074951171875, -0.18841171264648438, -0.17999267578125, -0.17157363891601562, -0.16315460205078125, -0.15473556518554688, -0.1463165283203125, -0.13789749145507812, -0.12947845458984375, -0.12105941772460938, -0.112640380859375, -0.10422134399414062, -0.09580230712890625, -0.08738327026367188, -0.0789642333984375, -0.07054519653320312, -0.06212615966796875, -0.053707122802734375, -0.0452880859375, -0.036869049072265625, -0.02845001220703125, -0.020030975341796875, -0.0116119384765625, -0.003192901611328125, 0.00522613525390625, 0.013645172119140625, 0.022064208984375, 0.030483245849609375, 0.03890228271484375, 0.047321319580078125, 0.0557403564453125, 0.06415939331054688, 0.07257843017578125, 0.08099746704101562, 0.08941650390625, 0.09783554077148438, 0.10625457763671875, 0.11467361450195312, 0.1230926513671875, 0.13151168823242188, 0.13993072509765625, 0.14834976196289062, 0.156768798828125, 0.16518783569335938, 0.17360687255859375, 0.18202590942382812, 0.1904449462890625, 0.19886398315429688, 0.20728302001953125, 0.21570205688476562, 0.22412109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 11.0, 8.0, 24.0, 61.0, 142.0, 240.0, 260.0, 139.0, 64.0, 25.0, 15.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.275860786437988, -6.118461608886719, -5.961061954498291, -5.8036627769470215, -5.646263122558594, -5.488863945007324, -5.3314642906188965, -5.174065113067627, -5.016665458679199, -4.85926628112793, -4.701866626739502, -4.544467449188232, -4.387067794799805, -4.229668617248535, -4.072268962860107, -3.914869785308838, -3.7574706077575684, -3.6000711917877197, -3.442671775817871, -3.2852723598480225, -3.127872943878174, -2.9704737663269043, -2.8130743503570557, -2.655674934387207, -2.4982755184173584, -2.3408761024475098, -2.183476686477661, -2.0260772705078125, -1.8686779737472534, -1.7112785577774048, -1.5538792610168457, -1.396479845046997, -1.2390809059143066, -1.081681489944458, -0.9242821335792542, -0.7668827772140503, -0.6094833612442017, -0.452083945274353, -0.29468458890914917, -0.1372852325439453, 0.02011418342590332, 0.17751356959342957, 0.3349129557609558, 0.49231234192848206, 0.6497117280960083, 0.8071111440658569, 0.9645105004310608, 1.1219098567962646, 1.2793092727661133, 1.436708688735962, 1.5941081047058105, 1.7515074014663696, 1.9089068174362183, 2.0663061141967773, 2.223705530166626, 2.3811049461364746, 2.5385043621063232, 2.695903778076172, 2.8533031940460205, 3.010702610015869, 3.1681017875671387, 3.3255014419555664, 3.482900619506836, 3.6403000354766846, 3.797699451446533]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 20.0, 21.0, 46.0, 45.0, 45.0, 51.0, 84.0, 99.0, 92.0, 85.0, 54.0, 68.0, 51.0, 58.0, 32.0, 33.0, 28.0, 20.0, 13.0, 10.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.195653200149536, -3.114492893218994, -3.033332586288452, -2.95217227935791, -2.871011734008789, -2.789851427078247, -2.708691120147705, -2.627530813217163, -2.546370506286621, -2.465210199356079, -2.384049892425537, -2.302889585494995, -2.221729278564453, -2.140568733215332, -2.05940842628479, -1.978248119354248, -1.897087812423706, -1.815927505493164, -1.734767198562622, -1.6536067724227905, -1.5724464654922485, -1.4912861585617065, -1.410125732421875, -1.328965425491333, -1.247805118560791, -1.166644811630249, -1.085484504699707, -1.0043240785598755, -0.9231637716293335, -0.8420034646987915, -0.7608430981636047, -0.679682731628418, -0.598522424697876, -0.517362117767334, -0.4362017512321472, -0.35504141449928284, -0.27388107776641846, -0.19272074103355408, -0.1115604043006897, -0.03040003776550293, 0.05076026916503906, 0.13192060589790344, 0.21308094263076782, 0.2942412793636322, 0.3754016160964966, 0.45656195282936096, 0.5377222895622253, 0.6188826560974121, 0.7000429630279541, 0.7812032699584961, 0.8623636364936829, 0.9435240030288696, 1.0246843099594116, 1.1058446168899536, 1.1870050430297852, 1.2681653499603271, 1.3493256568908691, 1.4304859638214111, 1.5116462707519531, 1.5928066968917847, 1.6739670038223267, 1.7551273107528687, 1.8362877368927002, 1.9174480438232422, 1.9986083507537842]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 6.0, 10.0, 9.0, 15.0, 15.0, 26.0, 34.0, 58.0, 65.0, 122.0, 233.0, 546.0, 1515.0, 4814.0, 19845.0, 143181.0, 784774.0, 74868.0, 12923.0, 3391.0, 1120.0, 451.0, 205.0, 124.0, 53.0, 41.0, 36.0, 24.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270263671875, -0.2610588073730469, -0.25185394287109375, -0.24264907836914062, -0.2334442138671875, -0.22423934936523438, -0.21503448486328125, -0.20582962036132812, -0.196624755859375, -0.18741989135742188, -0.17821502685546875, -0.16901016235351562, -0.1598052978515625, -0.15060043334960938, -0.14139556884765625, -0.13219070434570312, -0.12298583984375, -0.11378097534179688, -0.10457611083984375, -0.09537124633789062, -0.0861663818359375, -0.07696151733398438, -0.06775665283203125, -0.058551788330078125, -0.049346923828125, -0.040142059326171875, -0.03093719482421875, -0.021732330322265625, -0.0125274658203125, -0.003322601318359375, 0.00588226318359375, 0.015087127685546875, 0.0242919921875, 0.033496856689453125, 0.04270172119140625, 0.051906585693359375, 0.0611114501953125, 0.07031631469726562, 0.07952117919921875, 0.08872604370117188, 0.097930908203125, 0.10713577270507812, 0.11634063720703125, 0.12554550170898438, 0.1347503662109375, 0.14395523071289062, 0.15316009521484375, 0.16236495971679688, 0.17156982421875, 0.18077468872070312, 0.18997955322265625, 0.19918441772460938, 0.2083892822265625, 0.21759414672851562, 0.22679901123046875, 0.23600387573242188, 0.245208740234375, 0.2544136047363281, 0.26361846923828125, 0.2728233337402344, 0.2820281982421875, 0.2912330627441406, 0.30043792724609375, 0.3096427917480469, 0.31884765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 10.0, 22.0, 40.0, 56.0, 56.0, 96.0, 119.0, 98.0, 118.0, 107.0, 87.0, 69.0, 42.0, 28.0, 18.0, 11.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.3212776184082031, -0.31320953369140625, -0.3051414489746094, -0.2970733642578125, -0.2890052795410156, -0.28093719482421875, -0.2728691101074219, -0.264801025390625, -0.2567329406738281, -0.24866485595703125, -0.24059677124023438, -0.2325286865234375, -0.22446060180664062, -0.21639251708984375, -0.20832443237304688, -0.20025634765625, -0.19218826293945312, -0.18412017822265625, -0.17605209350585938, -0.1679840087890625, -0.15991592407226562, -0.15184783935546875, -0.14377975463867188, -0.135711669921875, -0.12764358520507812, -0.11957550048828125, -0.11150741577148438, -0.1034393310546875, -0.09537124633789062, -0.08730316162109375, -0.07923507690429688, -0.0711669921875, -0.06309890747070312, -0.05503082275390625, -0.046962738037109375, -0.0388946533203125, -0.030826568603515625, -0.02275848388671875, -0.014690399169921875, -0.006622314453125, 0.001445770263671875, 0.00951385498046875, 0.017581939697265625, 0.0256500244140625, 0.033718109130859375, 0.04178619384765625, 0.049854278564453125, 0.05792236328125, 0.06599044799804688, 0.07405853271484375, 0.08212661743164062, 0.0901947021484375, 0.09826278686523438, 0.10633087158203125, 0.11439895629882812, 0.122467041015625, 0.13053512573242188, 0.13860321044921875, 0.14667129516601562, 0.1547393798828125, 0.16280746459960938, 0.17087554931640625, 0.17894363403320312, 0.18701171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 10.0, 12.0, 12.0, 24.0, 26.0, 43.0, 42.0, 72.0, 151.0, 220.0, 395.0, 872.0, 2804.0, 17982.0, 854669.0, 158202.0, 9619.0, 1848.0, 700.0, 330.0, 169.0, 115.0, 75.0, 56.0, 29.0, 21.0, 16.0, 11.0, 13.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.36200714111328125, -0.3521881103515625, -0.34236907958984375, -0.332550048828125, -0.32273101806640625, -0.3129119873046875, -0.30309295654296875, -0.29327392578125, -0.28345489501953125, -0.2736358642578125, -0.26381683349609375, -0.253997802734375, -0.24417877197265625, -0.2343597412109375, -0.22454071044921875, -0.2147216796875, -0.20490264892578125, -0.1950836181640625, -0.18526458740234375, -0.175445556640625, -0.16562652587890625, -0.1558074951171875, -0.14598846435546875, -0.13616943359375, -0.12635040283203125, -0.1165313720703125, -0.10671234130859375, -0.096893310546875, -0.08707427978515625, -0.0772552490234375, -0.06743621826171875, -0.0576171875, -0.04779815673828125, -0.0379791259765625, -0.02816009521484375, -0.018341064453125, -0.00852203369140625, 0.0012969970703125, 0.01111602783203125, 0.02093505859375, 0.03075408935546875, 0.0405731201171875, 0.05039215087890625, 0.060211181640625, 0.07003021240234375, 0.0798492431640625, 0.08966827392578125, 0.0994873046875, 0.10930633544921875, 0.1191253662109375, 0.12894439697265625, 0.138763427734375, 0.14858245849609375, 0.1584014892578125, 0.16822052001953125, 0.17803955078125, 0.18785858154296875, 0.1976776123046875, 0.20749664306640625, 0.217315673828125, 0.22713470458984375, 0.2369537353515625, 0.24677276611328125, 0.256591796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 9.0, 9.0, 12.0, 10.0, 21.0, 21.0, 19.0, 33.0, 21.0, 32.0, 28.0, 37.0, 52.0, 66.0, 65.0, 73.0, 74.0, 75.0, 71.0, 34.0, 30.0, 34.0, 25.0, 20.0, 21.0, 21.0, 13.0, 12.0, 14.0, 8.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.52294921875, -0.5094566345214844, -0.49596405029296875, -0.4824714660644531, -0.4689788818359375, -0.4554862976074219, -0.44199371337890625, -0.4285011291503906, -0.415008544921875, -0.4015159606933594, -0.38802337646484375, -0.3745307922363281, -0.3610382080078125, -0.3475456237792969, -0.33405303955078125, -0.3205604553222656, -0.30706787109375, -0.2935752868652344, -0.28008270263671875, -0.2665901184082031, -0.2530975341796875, -0.23960494995117188, -0.22611236572265625, -0.21261978149414062, -0.199127197265625, -0.18563461303710938, -0.17214202880859375, -0.15864944458007812, -0.1451568603515625, -0.13166427612304688, -0.11817169189453125, -0.10467910766601562, -0.0911865234375, -0.07769393920898438, -0.06420135498046875, -0.050708770751953125, -0.0372161865234375, -0.023723602294921875, -0.01023101806640625, 0.003261566162109375, 0.016754150390625, 0.030246734619140625, 0.04373931884765625, 0.057231903076171875, 0.0707244873046875, 0.08421707153320312, 0.09770965576171875, 0.11120223999023438, 0.12469482421875, 0.13818740844726562, 0.15167999267578125, 0.16517257690429688, 0.1786651611328125, 0.19215774536132812, 0.20565032958984375, 0.21914291381835938, 0.232635498046875, 0.24612808227539062, 0.25962066650390625, 0.2731132507324219, 0.2866058349609375, 0.3000984191894531, 0.31359100341796875, 0.3270835876464844, 0.340576171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 2.0, 15.0, 11.0, 26.0, 34.0, 48.0, 83.0, 133.0, 249.0, 535.0, 1297.0, 4425.0, 28282.0, 953441.0, 50663.0, 6317.0, 1592.0, 631.0, 329.0, 165.0, 89.0, 57.0, 41.0, 21.0, 20.0, 15.0, 7.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0799560546875, -0.07750415802001953, -0.07505226135253906, -0.0726003646850586, -0.07014846801757812, -0.06769657135009766, -0.06524467468261719, -0.06279277801513672, -0.06034088134765625, -0.05788898468017578, -0.05543708801269531, -0.052985191345214844, -0.050533294677734375, -0.048081398010253906, -0.04562950134277344, -0.04317760467529297, -0.0407257080078125, -0.03827381134033203, -0.03582191467285156, -0.033370018005371094, -0.030918121337890625, -0.028466224670410156, -0.026014328002929688, -0.02356243133544922, -0.02111053466796875, -0.01865863800048828, -0.016206741333007812, -0.013754844665527344, -0.011302947998046875, -0.008851051330566406, -0.0063991546630859375, -0.003947257995605469, -0.001495361328125, 0.0009565353393554688, 0.0034084320068359375, 0.005860328674316406, 0.008312225341796875, 0.010764122009277344, 0.013216018676757812, 0.01566791534423828, 0.01811981201171875, 0.02057170867919922, 0.023023605346679688, 0.025475502014160156, 0.027927398681640625, 0.030379295349121094, 0.03283119201660156, 0.03528308868408203, 0.0377349853515625, 0.04018688201904297, 0.04263877868652344, 0.045090675354003906, 0.047542572021484375, 0.049994468688964844, 0.05244636535644531, 0.05489826202392578, 0.05735015869140625, 0.05980205535888672, 0.06225395202636719, 0.06470584869384766, 0.06715774536132812, 0.0696096420288086, 0.07206153869628906, 0.07451343536376953, 0.07696533203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 20.0, 18.0, 26.0, 20.0, 32.0, 44.0, 50.0, 72.0, 90.0, 84.0, 78.0, 92.0, 72.0, 60.0, 43.0, 31.0, 23.0, 20.0, 17.0, 14.0, 17.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.74913215637207e-05, -3.645382821559906e-05, -3.541633486747742e-05, -3.4378841519355774e-05, -3.334134817123413e-05, -3.230385482311249e-05, -3.1266361474990845e-05, -3.02288681268692e-05, -2.919137477874756e-05, -2.8153881430625916e-05, -2.7116388082504272e-05, -2.607889473438263e-05, -2.5041401386260986e-05, -2.4003908038139343e-05, -2.29664146900177e-05, -2.1928921341896057e-05, -2.0891427993774414e-05, -1.985393464565277e-05, -1.8816441297531128e-05, -1.7778947949409485e-05, -1.6741454601287842e-05, -1.57039612531662e-05, -1.4666467905044556e-05, -1.3628974556922913e-05, -1.259148120880127e-05, -1.1553987860679626e-05, -1.0516494512557983e-05, -9.47900116443634e-06, -8.441507816314697e-06, -7.404014468193054e-06, -6.366521120071411e-06, -5.329027771949768e-06, -4.291534423828125e-06, -3.254041075706482e-06, -2.216547727584839e-06, -1.1790543794631958e-06, -1.4156103134155273e-07, 8.959323167800903e-07, 1.9334256649017334e-06, 2.9709190130233765e-06, 4.0084123611450195e-06, 5.045905709266663e-06, 6.083399057388306e-06, 7.120892405509949e-06, 8.158385753631592e-06, 9.195879101753235e-06, 1.0233372449874878e-05, 1.1270865797996521e-05, 1.2308359146118164e-05, 1.3345852494239807e-05, 1.438334584236145e-05, 1.5420839190483093e-05, 1.6458332538604736e-05, 1.749582588672638e-05, 1.8533319234848022e-05, 1.9570812582969666e-05, 2.060830593109131e-05, 2.164579927921295e-05, 2.2683292627334595e-05, 2.3720785975456238e-05, 2.475827932357788e-05, 2.5795772671699524e-05, 2.6833266019821167e-05, 2.787075936794281e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 7.0, 13.0, 23.0, 23.0, 37.0, 53.0, 93.0, 190.0, 288.0, 537.0, 1086.0, 2521.0, 6830.0, 23331.0, 249926.0, 725359.0, 25677.0, 7322.0, 2723.0, 1156.0, 564.0, 318.0, 170.0, 98.0, 62.0, 32.0, 29.0, 22.0, 15.0, 12.0, 2.0, 10.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.03831624984741211, -0.03689861297607422, -0.03548097610473633, -0.03406333923339844, -0.03264570236206055, -0.031228065490722656, -0.029810428619384766, -0.028392791748046875, -0.026975154876708984, -0.025557518005371094, -0.024139881134033203, -0.022722244262695312, -0.021304607391357422, -0.01988697052001953, -0.01846933364868164, -0.01705169677734375, -0.01563405990600586, -0.014216423034667969, -0.012798786163330078, -0.011381149291992188, -0.009963512420654297, -0.008545875549316406, -0.007128238677978516, -0.005710601806640625, -0.004292964935302734, -0.0028753280639648438, -0.0014576911926269531, -4.00543212890625e-05, 0.0013775825500488281, 0.0027952194213867188, 0.004212856292724609, 0.0056304931640625, 0.007048130035400391, 0.008465766906738281, 0.009883403778076172, 0.011301040649414062, 0.012718677520751953, 0.014136314392089844, 0.015553951263427734, 0.016971588134765625, 0.018389225006103516, 0.019806861877441406, 0.021224498748779297, 0.022642135620117188, 0.024059772491455078, 0.02547740936279297, 0.02689504623413086, 0.02831268310546875, 0.02973031997680664, 0.03114795684814453, 0.03256559371948242, 0.03398323059082031, 0.0354008674621582, 0.036818504333496094, 0.038236141204833984, 0.039653778076171875, 0.041071414947509766, 0.042489051818847656, 0.04390668869018555, 0.04532432556152344, 0.04674196243286133, 0.04815959930419922, 0.04957723617553711, 0.050994873046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 7.0, 12.0, 21.0, 20.0, 24.0, 26.0, 30.0, 34.0, 46.0, 84.0, 116.0, 141.0, 98.0, 66.0, 54.0, 37.0, 25.0, 23.0, 19.0, 11.0, 14.0, 15.0, 5.0, 7.0, 7.0, 7.0, 4.0, 2.0, 3.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0382080078125, -0.03698539733886719, -0.035762786865234375, -0.03454017639160156, -0.03331756591796875, -0.03209495544433594, -0.030872344970703125, -0.029649734497070312, -0.0284271240234375, -0.027204513549804688, -0.025981903076171875, -0.024759292602539062, -0.02353668212890625, -0.022314071655273438, -0.021091461181640625, -0.019868850708007812, -0.018646240234375, -0.017423629760742188, -0.016201019287109375, -0.014978408813476562, -0.01375579833984375, -0.012533187866210938, -0.011310577392578125, -0.010087966918945312, -0.0088653564453125, -0.0076427459716796875, -0.006420135498046875, -0.0051975250244140625, -0.00397491455078125, -0.0027523040771484375, -0.001529693603515625, -0.0003070831298828125, 0.00091552734375, 0.0021381378173828125, 0.003360748291015625, 0.0045833587646484375, 0.00580596923828125, 0.0070285797119140625, 0.008251190185546875, 0.009473800659179688, 0.0106964111328125, 0.011919021606445312, 0.013141632080078125, 0.014364242553710938, 0.01558685302734375, 0.016809463500976562, 0.018032073974609375, 0.019254684448242188, 0.020477294921875, 0.021699905395507812, 0.022922515869140625, 0.024145126342773438, 0.02536773681640625, 0.026590347290039062, 0.027812957763671875, 0.029035568237304688, 0.0302581787109375, 0.03148078918457031, 0.032703399658203125, 0.03392601013183594, 0.03514862060546875, 0.03637123107910156, 0.037593841552734375, 0.03881645202636719, 0.0400390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 40.0, 86.0, 571.0, 194.0, 54.0, 25.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.972259521484375, -3.8644375801086426, -3.75661563873291, -3.6487936973571777, -3.5409717559814453, -3.433149814605713, -3.3253278732299805, -3.217505931854248, -3.1096839904785156, -3.001862049102783, -2.894040107727051, -2.7862181663513184, -2.678396224975586, -2.5705742835998535, -2.462752342224121, -2.3549304008483887, -2.2471084594726562, -2.139286518096924, -2.0314645767211914, -1.923642635345459, -1.8158206939697266, -1.7079987525939941, -1.6001768112182617, -1.4923548698425293, -1.3845326900482178, -1.2767107486724854, -1.168888807296753, -1.0610668659210205, -0.9532449245452881, -0.8454229235649109, -0.7376009821891785, -0.629779040813446, -0.5219571590423584, -0.414135217666626, -0.30631327629089355, -0.19849130511283875, -0.09066936373710632, 0.017152607440948486, 0.12497454881668091, 0.23279649019241333, 0.34061843156814575, 0.4484403729438782, 0.5562623143196106, 0.6640843152999878, 0.7719062566757202, 0.8797281980514526, 0.9875501394271851, 1.0953720808029175, 1.20319402217865, 1.3110159635543823, 1.4188379049301147, 1.5266598463058472, 1.6344817876815796, 1.7423038482666016, 1.850125789642334, 1.9579477310180664, 2.065769672393799, 2.1735916137695312, 2.2814135551452637, 2.389235496520996, 2.4970574378967285, 2.604879379272461, 2.7127013206481934, 2.820523262023926, 2.928345203399658]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 9.0, 17.0, 13.0, 18.0, 20.0, 13.0, 27.0, 19.0, 26.0, 24.0, 34.0, 129.0, 316.0, 74.0, 26.0, 34.0, 22.0, 17.0, 16.0, 16.0, 12.0, 17.0, 9.0, 8.0, 7.0, 7.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2284584045410156, -1.1880301237106323, -1.147601842880249, -1.1071734428405762, -1.0667451620101929, -1.0263168811798096, -0.9858886003494263, -0.9454602599143982, -0.9050319194793701, -0.8646036386489868, -0.8241752982139587, -0.7837470173835754, -0.7433186769485474, -0.7028903961181641, -0.6624621152877808, -0.6220337748527527, -0.5816054940223694, -0.5411772131919861, -0.500748872756958, -0.4603205919265747, -0.41989225149154663, -0.37946397066116333, -0.33903566002845764, -0.29860734939575195, -0.25817903876304626, -0.21775072813034058, -0.1773224174976349, -0.1368941217660904, -0.0964658111333847, -0.056037500500679016, -0.015609204769134521, 0.024819105863571167, 0.06524741649627686, 0.10567572712898254, 0.14610403776168823, 0.18653233349323273, 0.22696064412593842, 0.2673889398574829, 0.3078172504901886, 0.3482455611228943, 0.3886738717556, 0.42910218238830566, 0.46953049302101135, 0.509958803653717, 0.5503870844841003, 0.5908154249191284, 0.6312437057495117, 0.671671986579895, 0.7121003270149231, 0.7525286078453064, 0.7929569482803345, 0.8333852291107178, 0.8738135695457458, 0.9142418503761292, 0.9546701908111572, 0.9950984716415405, 1.0355267524719238, 1.0759550333023071, 1.1163833141326904, 1.1568117141723633, 1.1972399950027466, 1.2376682758331299, 1.2780965566635132, 1.3185248374938965, 1.3589532375335693]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 4.0, 8.0, 12.0, 14.0, 20.0, 16.0, 22.0, 24.0, 30.0, 38.0, 38.0, 85.0, 246.0, 95.0, 48.0, 49.0, 39.0, 37.0, 13.0, 21.0, 13.0, 20.0, 11.0, 13.0, 12.0, 3.0, 8.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10479736328125, -0.10167503356933594, -0.09855270385742188, -0.09543037414550781, -0.09230804443359375, -0.08918571472167969, -0.08606338500976562, -0.08294105529785156, -0.0798187255859375, -0.07669639587402344, -0.07357406616210938, -0.07045173645019531, -0.06732940673828125, -0.06420707702636719, -0.061084747314453125, -0.05796241760253906, -0.054840087890625, -0.05171775817871094, -0.048595428466796875, -0.04547309875488281, -0.04235076904296875, -0.03922843933105469, -0.036106109619140625, -0.03298377990722656, -0.0298614501953125, -0.026739120483398438, -0.023616790771484375, -0.020494461059570312, -0.01737213134765625, -0.014249801635742188, -0.011127471923828125, -0.008005142211914062, -0.0048828125, -0.0017604827880859375, 0.001361846923828125, 0.0044841766357421875, 0.00760650634765625, 0.010728836059570312, 0.013851165771484375, 0.016973495483398438, 0.0200958251953125, 0.023218154907226562, 0.026340484619140625, 0.029462814331054688, 0.03258514404296875, 0.03570747375488281, 0.038829803466796875, 0.04195213317871094, 0.045074462890625, 0.04819679260253906, 0.051319122314453125, 0.05444145202636719, 0.05756378173828125, 0.06068611145019531, 0.06380844116210938, 0.06693077087402344, 0.0700531005859375, 0.07317543029785156, 0.07629776000976562, 0.07942008972167969, 0.08254241943359375, 0.08566474914550781, 0.08878707885742188, 0.09190940856933594, 0.09503173828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 2.0, 7.0, 7.0, 15.0, 18.0, 31.0, 52.0, 58.0, 127.0, 215.0, 585.0, 2083.0, 18128.0, 8355497.0, 9468.0, 1416.0, 363.0, 185.0, 109.0, 86.0, 47.0, 22.0, 16.0, 4.0, 6.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 7.0, 6.0], "bins": [-1.727432131767273, -1.6866792440414429, -1.6459263563156128, -1.6051735877990723, -1.5644207000732422, -1.523667812347412, -1.482914924621582, -1.442162036895752, -1.4014091491699219, -1.3606562614440918, -1.3199033737182617, -1.2791506052017212, -1.2383977174758911, -1.197644829750061, -1.156891942024231, -1.1161390542984009, -1.0753862857818604, -1.0346333980560303, -0.993880569934845, -0.9531276822090149, -0.9123748540878296, -0.8716219663619995, -0.8308690786361694, -0.7901161909103394, -0.749363362789154, -0.708610475063324, -0.6678576469421387, -0.6271047592163086, -0.5863518714904785, -0.5455990433692932, -0.5048461556434631, -0.46409329771995544, -0.423340380191803, -0.3825875222682953, -0.3418346643447876, -0.3010817766189575, -0.26032891869544983, -0.21957606077194214, -0.17882318794727325, -0.13807031512260437, -0.09731745719909668, -0.05656459182500839, -0.015811726450920105, 0.024941138923168182, 0.06569400429725647, 0.10644686222076416, 0.14719973504543304, 0.18795260787010193, 0.22870546579360962, 0.2694583237171173, 0.310211181640625, 0.3509640693664551, 0.39171692728996277, 0.43246978521347046, 0.47322267293930054, 0.5139755010604858, 0.5547283887863159, 0.595481276512146, 0.6362341046333313, 0.6769869923591614, 0.7177398204803467, 0.7584927082061768, 0.7992455959320068, 0.8399984836578369, 0.8807513117790222]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 6.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8476085662841797, -0.810314953327179, -0.7730213403701782, -0.7357277274131775, -0.6984341144561768, -0.6611405611038208, -0.6238469481468201, -0.5865533351898193, -0.5492597222328186, -0.5119661092758179, -0.47467249631881714, -0.4373789131641388, -0.40008530020713806, -0.36279168725013733, -0.325498104095459, -0.28820449113845825, -0.2509108781814575, -0.2136172652244568, -0.17632366716861725, -0.1390300691127777, -0.10173645615577698, -0.06444284319877625, -0.027149245142936707, 0.010144352912902832, 0.047437965869903564, 0.0847315713763237, 0.12202517688274384, 0.15931877493858337, 0.1966123878955841, 0.23390600085258484, 0.2711995840072632, 0.3084931969642639, 0.3457869291305542, 0.38308054208755493, 0.42037415504455566, 0.457667738199234, 0.49496135115623474, 0.5322549343109131, 0.5695485472679138, 0.6068421602249146, 0.6441357731819153, 0.681429386138916, 0.7187229990959167, 0.7560166120529175, 0.7933101654052734, 0.830603837966919, 0.8678973913192749, 0.9051910042762756, 0.9424846172332764, 0.9797782301902771, 1.0170718431472778, 1.0543653964996338, 1.0916590690612793, 1.1289526224136353, 1.1662462949752808, 1.2035398483276367, 1.2408335208892822, 1.2781270742416382, 1.3154207468032837, 1.3527143001556396, 1.3900079727172852, 1.4273015260696411, 1.4645951986312866, 1.5018887519836426, 1.5391823053359985]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 9.0, 3.0, 8.0, 6.0, 25.0, 29.0, 37.0, 71.0, 80.0, 117.0, 208.0, 352.0, 545.0, 932.0, 1781.0, 3639.0, 8081.0, 21462.0, 65313.0, 189003.0, 153837.0, 48876.0, 16877.0, 6587.0, 2838.0, 1500.0, 789.0, 445.0, 273.0, 188.0, 116.0, 83.0, 39.0, 37.0, 28.0, 19.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.9135055541992188, -0.8880462646484375, -0.8625869750976562, -0.837127685546875, -0.8116683959960938, -0.7862091064453125, -0.7607498168945312, -0.73529052734375, -0.7098312377929688, -0.6843719482421875, -0.6589126586914062, -0.633453369140625, -0.6079940795898438, -0.5825347900390625, -0.5570755004882812, -0.5316162109375, -0.5061569213867188, -0.4806976318359375, -0.45523834228515625, -0.429779052734375, -0.40431976318359375, -0.3788604736328125, -0.35340118408203125, -0.32794189453125, -0.30248260498046875, -0.2770233154296875, -0.25156402587890625, -0.226104736328125, -0.20064544677734375, -0.1751861572265625, -0.14972686767578125, -0.124267578125, -0.09880828857421875, -0.0733489990234375, -0.04788970947265625, -0.022430419921875, 0.00302886962890625, 0.0284881591796875, 0.05394744873046875, 0.07940673828125, 0.10486602783203125, 0.1303253173828125, 0.15578460693359375, 0.181243896484375, 0.20670318603515625, 0.2321624755859375, 0.25762176513671875, 0.2830810546875, 0.30854034423828125, 0.3339996337890625, 0.35945892333984375, 0.384918212890625, 0.41037750244140625, 0.4358367919921875, 0.46129608154296875, 0.48675537109375, 0.5122146606445312, 0.5376739501953125, 0.5631332397460938, 0.588592529296875, 0.6140518188476562, 0.6395111083984375, 0.6649703979492188, 0.6904296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 14.0, 26.0, 44.0, 57.0, 98.0, 148.0, 131.0, 130.0, 112.0, 63.0, 48.0, 39.0, 27.0, 26.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3142223358154297, -0.3059349060058594, -0.29764747619628906, -0.28936004638671875, -0.28107261657714844, -0.2727851867675781, -0.2644977569580078, -0.2562103271484375, -0.2479228973388672, -0.23963546752929688, -0.23134803771972656, -0.22306060791015625, -0.21477317810058594, -0.20648574829101562, -0.1981983184814453, -0.189910888671875, -0.1816234588623047, -0.17333602905273438, -0.16504859924316406, -0.15676116943359375, -0.14847373962402344, -0.14018630981445312, -0.1318988800048828, -0.1236114501953125, -0.11532402038574219, -0.10703659057617188, -0.09874916076660156, -0.09046173095703125, -0.08217430114746094, -0.07388687133789062, -0.06559944152832031, -0.05731201171875, -0.04902458190917969, -0.040737152099609375, -0.03244972229003906, -0.02416229248046875, -0.015874862670898438, -0.007587432861328125, 0.0006999969482421875, 0.0089874267578125, 0.017274856567382812, 0.025562286376953125, 0.03384971618652344, 0.04213714599609375, 0.05042457580566406, 0.058712005615234375, 0.06699943542480469, 0.075286865234375, 0.08357429504394531, 0.09186172485351562, 0.10014915466308594, 0.10843658447265625, 0.11672401428222656, 0.12501144409179688, 0.1332988739013672, 0.1415863037109375, 0.1498737335205078, 0.15816116333007812, 0.16644859313964844, 0.17473602294921875, 0.18302345275878906, 0.19131088256835938, 0.1995983123779297, 0.2078857421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 16.0, 31.0, 49.0, 117.0, 110.0, 64.0, 43.0, 11.0, 6.0, 5.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6203757524490356, -1.5752099752426147, -1.5300440788269043, -1.4848783016204834, -1.439712405204773, -1.394546627998352, -1.3493807315826416, -1.3042149543762207, -1.2590491771697998, -1.213883399963379, -1.1687175035476685, -1.1235517263412476, -1.078385829925537, -1.0332200527191162, -0.9880542159080505, -0.9428883790969849, -0.8977224826812744, -0.8525566458702087, -0.8073908090591431, -0.7622250318527222, -0.7170591354370117, -0.6718933582305908, -0.6267275214195251, -0.5815616846084595, -0.5363958477973938, -0.4912300109863281, -0.44606417417526245, -0.40089836716651917, -0.3557325303554535, -0.3105666935443878, -0.26540088653564453, -0.22023504972457886, -0.17506933212280273, -0.12990349531173706, -0.08473767340183258, -0.0395718514919281, 0.005593985319137573, 0.05075982213020325, 0.09592562913894653, 0.1410914659500122, 0.18625730276107788, 0.23142313957214355, 0.27658897638320923, 0.3217547833919525, 0.3669206202030182, 0.41208645701408386, 0.45725226402282715, 0.5024181008338928, 0.5475839376449585, 0.5927497744560242, 0.6379156112670898, 0.6830813884735107, 0.7282472848892212, 0.7734130620956421, 0.8185788989067078, 0.8637447357177734, 0.9089105725288391, 0.9540764093399048, 0.9992422461509705, 1.0444080829620361, 1.089573860168457, 1.1347397565841675, 1.1799055337905884, 1.2250714302062988, 1.2702372074127197]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 15.0, 6.0, 21.0, 58.0, 117.0, 123.0, 55.0, 17.0, 13.0, 8.0, 1.0, 3.0, 2.0, 8.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1648681163787842, -1.1329078674316406, -1.100947618484497, -1.0689873695373535, -1.03702712059021, -1.0050668716430664, -0.9731065630912781, -0.9411463141441345, -0.909186065196991, -0.8772258162498474, -0.8452655673027039, -0.8133053183555603, -0.781345009803772, -0.7493847608566284, -0.7174245119094849, -0.6854642629623413, -0.6535040140151978, -0.6215437650680542, -0.5895835161209106, -0.5576232671737671, -0.5256630182266235, -0.4937027394771576, -0.46174246072769165, -0.4297822117805481, -0.39782196283340454, -0.365861713886261, -0.33390146493911743, -0.3019411861896515, -0.26998093724250793, -0.23802068829536438, -0.20606042444705963, -0.17410016059875488, -0.14213979244232178, -0.11017953604459763, -0.07821927964687347, -0.04625902324914932, -0.014298766851425171, 0.017661482095718384, 0.04962174594402313, 0.08158200979232788, 0.11354225873947144, 0.145502507686615, 0.17746277153491974, 0.2094230353832245, 0.24138328433036804, 0.2733435332775116, 0.30530381202697754, 0.3372640609741211, 0.36922430992126465, 0.4011845588684082, 0.43314480781555176, 0.4651050865650177, 0.49706533551216125, 0.5290255546569824, 0.5609858632087708, 0.5929461121559143, 0.6249063611030579, 0.6568666100502014, 0.688826858997345, 0.7207871079444885, 0.7527474164962769, 0.7847076654434204, 0.816667914390564, 0.8486281633377075, 0.8805884122848511]}, "eval/loss": 4.194759368896484, "eval/wer": 2.4282625942086473, "eval/runtime": 1143.8371, "eval/samples_per_second": 2.31, "eval/steps_per_second": 0.289, "train/train_runtime": 6364.0567, "train/train_samples_per_second": 4.484, "train/train_steps_per_second": 0.14, "train/total_flos": 0.0, "train/train_loss": 4.297821357913081} \ No newline at end of file +{"train/loss": 4.0199, "train/learning_rate": 7.653061224489796e-08, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7825, "_timestamp": 1646059131, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 101.0, 880.0, 34.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.887240409851074, -9.418985366821289, -2.9507312774658203, 3.517523765563965, 9.985777854919434, 16.45403289794922, 22.922286987304688, 29.390541076660156, 35.858795166015625, 42.327049255371094, 48.79530334472656, 55.26355743408203, 61.7318115234375, 68.2000732421875, 74.66831970214844, 81.13658142089844, 87.6048355102539, 94.07308959960938, 100.54134368896484, 107.00959777832031, 113.47785186767578, 119.94610595703125, 126.41436767578125, 132.8826141357422, 139.3508758544922, 145.8191375732422, 152.28738403320312, 158.75564575195312, 165.22389221191406, 171.69215393066406, 178.160400390625, 184.628662109375, 191.09690856933594, 197.56517028808594, 204.03341674804688, 210.50167846679688, 216.9699249267578, 223.4381866455078, 229.90643310546875, 236.37469482421875, 242.8429412841797, 249.3112030029297, 255.77944946289062, 262.2477111816406, 268.7159729003906, 275.1842041015625, 281.6524658203125, 288.1207275390625, 294.5889892578125, 301.0572509765625, 307.5255126953125, 313.9937438964844, 320.4620056152344, 326.9302673339844, 333.3985290527344, 339.86676025390625, 346.33502197265625, 352.80328369140625, 359.27154541015625, 365.7397766113281, 372.2080383300781, 378.6763000488281, 385.1445617675781, 391.61279296875, 398.0810546875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 11.0, 5.0, 13.0, 5.0, 16.0, 23.0, 19.0, 22.0, 31.0, 42.0, 36.0, 35.0, 42.0, 39.0, 52.0, 63.0, 66.0, 56.0, 65.0, 65.0, 46.0, 40.0, 50.0, 26.0, 31.0, 19.0, 19.0, 17.0, 7.0, 11.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.502586364746094, -29.423606872558594, -28.344627380371094, -27.265649795532227, -26.186670303344727, -25.107690811157227, -24.02871322631836, -22.94973373413086, -21.87075424194336, -20.79177474975586, -19.71279525756836, -18.633817672729492, -17.554838180541992, -16.475858688354492, -15.396880149841309, -14.317901611328125, -13.238922119140625, -12.159942626953125, -11.080964088439941, -10.001985549926758, -8.923006057739258, -7.844027042388916, -6.765048027038574, -5.686069011688232, -4.607089996337891, -3.528110980987549, -2.449131965637207, -1.3701529502868652, -0.29117393493652344, 0.7878050804138184, 1.8667840957641602, 2.945763111114502, 4.024742126464844, 5.1037211418151855, 6.182700157165527, 7.261679172515869, 8.340658187866211, 9.419637680053711, 10.498616218566895, 11.577594757080078, 12.656574249267578, 13.735553741455078, 14.814532279968262, 15.893510818481445, 16.972490310668945, 18.051469802856445, 19.130447387695312, 20.209426879882812, 21.288406372070312, 22.367385864257812, 23.446365356445312, 24.52534294128418, 25.60432243347168, 26.68330192565918, 27.762279510498047, 28.841259002685547, 29.920238494873047, 30.999217987060547, 32.07819747924805, 33.15717697143555, 34.23615264892578, 35.31513214111328, 36.39411163330078, 37.47309112548828, 38.55207061767578]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 9.0, 10.0, 6.0, 13.0, 9.0, 17.0, 21.0, 26.0, 21.0, 20.0, 26.0, 45.0, 50.0, 43.0, 57.0, 31.0, 41.0, 60.0, 58.0, 55.0, 58.0, 46.0, 44.0, 38.0, 31.0, 27.0, 20.0, 15.0, 15.0, 20.0, 16.0, 11.0, 12.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9337921142578125, -1.877349853515625, -1.8209075927734375, -1.76446533203125, -1.7080230712890625, -1.651580810546875, -1.5951385498046875, -1.5386962890625, -1.4822540283203125, -1.425811767578125, -1.3693695068359375, -1.31292724609375, -1.2564849853515625, -1.200042724609375, -1.1436004638671875, -1.087158203125, -1.0307159423828125, -0.974273681640625, -0.9178314208984375, -0.86138916015625, -0.8049468994140625, -0.748504638671875, -0.6920623779296875, -0.6356201171875, -0.5791778564453125, -0.522735595703125, -0.4662933349609375, -0.40985107421875, -0.3534088134765625, -0.296966552734375, -0.2405242919921875, -0.18408203125, -0.1276397705078125, -0.071197509765625, -0.0147552490234375, 0.04168701171875, 0.0981292724609375, 0.154571533203125, 0.2110137939453125, 0.2674560546875, 0.3238983154296875, 0.380340576171875, 0.4367828369140625, 0.49322509765625, 0.5496673583984375, 0.606109619140625, 0.6625518798828125, 0.718994140625, 0.7754364013671875, 0.831878662109375, 0.8883209228515625, 0.94476318359375, 1.0012054443359375, 1.057647705078125, 1.1140899658203125, 1.1705322265625, 1.2269744873046875, 1.283416748046875, 1.3398590087890625, 1.39630126953125, 1.4527435302734375, 1.509185791015625, 1.5656280517578125, 1.6220703125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 8.0, 8.0, 7.0, 17.0, 19.0, 31.0, 43.0, 46.0, 63.0, 102.0, 147.0, 232.0, 318.0, 463.0, 754.0, 1153.0, 2061.0, 3794.0, 8242.0, 23126.0, 90145.0, 629874.0, 2531855.0, 752435.0, 105746.0, 25547.0, 8820.0, 3836.0, 2137.0, 1182.0, 658.0, 450.0, 303.0, 210.0, 143.0, 120.0, 60.0, 32.0, 27.0, 32.0, 14.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.125, -3.98046875, -3.8359375, -3.69140625, -3.546875, -3.40234375, -3.2578125, -3.11328125, -2.96875, -2.82421875, -2.6796875, -2.53515625, -2.390625, -2.24609375, -2.1015625, -1.95703125, -1.8125, -1.66796875, -1.5234375, -1.37890625, -1.234375, -1.08984375, -0.9453125, -0.80078125, -0.65625, -0.51171875, -0.3671875, -0.22265625, -0.078125, 0.06640625, 0.2109375, 0.35546875, 0.5, 0.64453125, 0.7890625, 0.93359375, 1.078125, 1.22265625, 1.3671875, 1.51171875, 1.65625, 1.80078125, 1.9453125, 2.08984375, 2.234375, 2.37890625, 2.5234375, 2.66796875, 2.8125, 2.95703125, 3.1015625, 3.24609375, 3.390625, 3.53515625, 3.6796875, 3.82421875, 3.96875, 4.11328125, 4.2578125, 4.40234375, 4.546875, 4.69140625, 4.8359375, 4.98046875, 5.125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 5.0, 19.0, 22.0, 41.0, 79.0, 139.0, 250.0, 500.0, 880.0, 859.0, 529.0, 309.0, 172.0, 104.0, 67.0, 34.0, 24.0, 10.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.1148681640625, -8.776611328125, -8.4383544921875, -8.10009765625, -7.7618408203125, -7.423583984375, -7.0853271484375, -6.7470703125, -6.4088134765625, -6.070556640625, -5.7322998046875, -5.39404296875, -5.0557861328125, -4.717529296875, -4.3792724609375, -4.041015625, -3.7027587890625, -3.364501953125, -3.0262451171875, -2.68798828125, -2.3497314453125, -2.011474609375, -1.6732177734375, -1.3349609375, -0.9967041015625, -0.658447265625, -0.3201904296875, 0.01806640625, 0.3563232421875, 0.694580078125, 1.0328369140625, 1.37109375, 1.7093505859375, 2.047607421875, 2.3858642578125, 2.72412109375, 3.0623779296875, 3.400634765625, 3.7388916015625, 4.0771484375, 4.4154052734375, 4.753662109375, 5.0919189453125, 5.43017578125, 5.7684326171875, 6.106689453125, 6.4449462890625, 6.783203125, 7.1214599609375, 7.459716796875, 7.7979736328125, 8.13623046875, 8.4744873046875, 8.812744140625, 9.1510009765625, 9.4892578125, 9.8275146484375, 10.165771484375, 10.5040283203125, 10.84228515625, 11.1805419921875, 11.518798828125, 11.8570556640625, 12.1953125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 16.0, 16.0, 20.0, 50.0, 76.0, 159.0, 269.0, 602.0, 1602.0, 8923.0, 3179612.0, 993909.0, 6244.0, 1496.0, 606.0, 279.0, 160.0, 84.0, 52.0, 28.0, 20.0, 14.0, 9.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.96875, -27.93115234375, -26.8935546875, -25.85595703125, -24.818359375, -23.78076171875, -22.7431640625, -21.70556640625, -20.66796875, -19.63037109375, -18.5927734375, -17.55517578125, -16.517578125, -15.47998046875, -14.4423828125, -13.40478515625, -12.3671875, -11.32958984375, -10.2919921875, -9.25439453125, -8.216796875, -7.17919921875, -6.1416015625, -5.10400390625, -4.06640625, -3.02880859375, -1.9912109375, -0.95361328125, 0.083984375, 1.12158203125, 2.1591796875, 3.19677734375, 4.234375, 5.27197265625, 6.3095703125, 7.34716796875, 8.384765625, 9.42236328125, 10.4599609375, 11.49755859375, 12.53515625, 13.57275390625, 14.6103515625, 15.64794921875, 16.685546875, 17.72314453125, 18.7607421875, 19.79833984375, 20.8359375, 21.87353515625, 22.9111328125, 23.94873046875, 24.986328125, 26.02392578125, 27.0615234375, 28.09912109375, 29.13671875, 30.17431640625, 31.2119140625, 32.24951171875, 33.287109375, 34.32470703125, 35.3623046875, 36.39990234375, 37.4375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 599.0, 389.0, 14.0, 1.0, 1.0, 0.0, 1.0], "bins": [-297.2367858886719, -292.0941467285156, -286.9515075683594, -281.8088684082031, -276.6662292480469, -271.5235900878906, -266.3809509277344, -261.2383117675781, -256.0956726074219, -250.95303344726562, -245.81039428710938, -240.66775512695312, -235.52511596679688, -230.38247680664062, -225.23983764648438, -220.09718322753906, -214.95452880859375, -209.8118896484375, -204.66925048828125, -199.526611328125, -194.38397216796875, -189.2413330078125, -184.09869384765625, -178.95603942871094, -173.81341552734375, -168.6707763671875, -163.52813720703125, -158.385498046875, -153.24285888671875, -148.1002197265625, -142.95758056640625, -137.81492614746094, -132.67227172851562, -127.52963256835938, -122.38699340820312, -117.24435424804688, -112.1017074584961, -106.95906829833984, -101.8164291381836, -96.67378234863281, -91.5311508178711, -86.38851165771484, -81.2458724975586, -76.10322570800781, -70.96058654785156, -65.81794738769531, -60.67530822753906, -55.53266525268555, -50.39002227783203, -45.24738311767578, -40.104740142822266, -34.962100982666016, -29.819459915161133, -24.67681884765625, -19.5341796875, -14.391536712646484, -9.248899459838867, -4.106258869171143, 1.036381721496582, 6.179021835327148, 11.321662902832031, 16.464303970336914, 21.606943130493164, 26.74958610534668, 31.89222526550293]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 9.0, 9.0, 5.0, 3.0, 6.0, 13.0, 10.0, 13.0, 13.0, 22.0, 18.0, 24.0, 26.0, 26.0, 35.0, 33.0, 24.0, 38.0, 37.0, 43.0, 42.0, 56.0, 36.0, 44.0, 43.0, 49.0, 34.0, 33.0, 37.0, 33.0, 38.0, 26.0, 24.0, 22.0, 16.0, 10.0, 13.0, 9.0, 13.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-30.77267074584961, -29.925748825073242, -29.078826904296875, -28.23190689086914, -27.384984970092773, -26.538063049316406, -25.691143035888672, -24.844221115112305, -23.997299194335938, -23.15037727355957, -22.303455352783203, -21.45653533935547, -20.6096134185791, -19.762691497802734, -18.915771484375, -18.068849563598633, -17.221927642822266, -16.3750057220459, -15.528084754943848, -14.681163787841797, -13.83424186706543, -12.987319946289062, -12.140398979187012, -11.293478012084961, -10.446556091308594, -9.599634170532227, -8.752713203430176, -7.905791759490967, -7.058870315551758, -6.211948871612549, -5.36502742767334, -4.518105983734131, -3.671182632446289, -2.82426118850708, -1.977339744567871, -1.130418300628662, -0.2834968566894531, 0.5634245872497559, 1.4103460311889648, 2.257267475128174, 3.104188919067383, 3.951110363006592, 4.798031806945801, 5.64495325088501, 6.491874694824219, 7.338796138763428, 8.185717582702637, 9.032638549804688, 9.879560470581055, 10.726482391357422, 11.573403358459473, 12.420324325561523, 13.26724624633789, 14.114168167114258, 14.961089134216309, 15.80801010131836, 16.654932022094727, 17.501853942871094, 18.348773956298828, 19.195695877075195, 20.042617797851562, 20.88953971862793, 21.736461639404297, 22.58338165283203, 23.4303035736084]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 1.0, 5.0, 6.0, 10.0, 12.0, 11.0, 15.0, 21.0, 19.0, 23.0, 24.0, 20.0, 34.0, 44.0, 35.0, 41.0, 42.0, 37.0, 47.0, 54.0, 51.0, 45.0, 46.0, 49.0, 37.0, 43.0, 34.0, 22.0, 31.0, 25.0, 18.0, 29.0, 10.0, 11.0, 8.0, 13.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.499847412109375, -1.44500732421875, -1.390167236328125, -1.3353271484375, -1.280487060546875, -1.22564697265625, -1.170806884765625, -1.115966796875, -1.061126708984375, -1.00628662109375, -0.951446533203125, -0.8966064453125, -0.841766357421875, -0.78692626953125, -0.732086181640625, -0.67724609375, -0.622406005859375, -0.56756591796875, -0.512725830078125, -0.4578857421875, -0.403045654296875, -0.34820556640625, -0.293365478515625, -0.238525390625, -0.183685302734375, -0.12884521484375, -0.074005126953125, -0.0191650390625, 0.035675048828125, 0.09051513671875, 0.145355224609375, 0.2001953125, 0.255035400390625, 0.30987548828125, 0.364715576171875, 0.4195556640625, 0.474395751953125, 0.52923583984375, 0.584075927734375, 0.638916015625, 0.693756103515625, 0.74859619140625, 0.803436279296875, 0.8582763671875, 0.913116455078125, 0.96795654296875, 1.022796630859375, 1.07763671875, 1.132476806640625, 1.18731689453125, 1.242156982421875, 1.2969970703125, 1.351837158203125, 1.40667724609375, 1.461517333984375, 1.516357421875, 1.571197509765625, 1.62603759765625, 1.680877685546875, 1.7357177734375, 1.790557861328125, 1.84539794921875, 1.900238037109375, 1.955078125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 14.0, 15.0, 17.0, 22.0, 40.0, 54.0, 88.0, 110.0, 148.0, 280.0, 350.0, 479.0, 804.0, 1204.0, 1724.0, 2618.0, 4032.0, 5900.0, 9354.0, 14738.0, 23585.0, 39743.0, 70557.0, 137214.0, 308373.0, 198468.0, 94899.0, 51644.0, 30078.0, 18486.0, 11625.0, 7476.0, 4740.0, 3281.0, 2010.0, 1463.0, 950.0, 596.0, 452.0, 325.0, 193.0, 119.0, 112.0, 67.0, 42.0, 30.0, 14.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.29345703125, -0.284210205078125, -0.27496337890625, -0.265716552734375, -0.2564697265625, -0.247222900390625, -0.23797607421875, -0.228729248046875, -0.219482421875, -0.210235595703125, -0.20098876953125, -0.191741943359375, -0.1824951171875, -0.173248291015625, -0.16400146484375, -0.154754638671875, -0.1455078125, -0.136260986328125, -0.12701416015625, -0.117767333984375, -0.1085205078125, -0.099273681640625, -0.09002685546875, -0.080780029296875, -0.071533203125, -0.062286376953125, -0.05303955078125, -0.043792724609375, -0.0345458984375, -0.025299072265625, -0.01605224609375, -0.006805419921875, 0.00244140625, 0.011688232421875, 0.02093505859375, 0.030181884765625, 0.0394287109375, 0.048675537109375, 0.05792236328125, 0.067169189453125, 0.076416015625, 0.085662841796875, 0.09490966796875, 0.104156494140625, 0.1134033203125, 0.122650146484375, 0.13189697265625, 0.141143798828125, 0.150390625, 0.159637451171875, 0.16888427734375, 0.178131103515625, 0.1873779296875, 0.196624755859375, 0.20587158203125, 0.215118408203125, 0.224365234375, 0.233612060546875, 0.24285888671875, 0.252105712890625, 0.2613525390625, 0.270599365234375, 0.27984619140625, 0.289093017578125, 0.29833984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 8.0, 4.0, 14.0, 12.0, 11.0, 21.0, 13.0, 12.0, 25.0, 24.0, 33.0, 31.0, 23.0, 32.0, 45.0, 43.0, 40.0, 40.0, 44.0, 1081.0, 27.0, 39.0, 37.0, 32.0, 34.0, 36.0, 26.0, 27.0, 24.0, 25.0, 22.0, 32.0, 20.0, 20.0, 15.0, 15.0, 3.0, 7.0, 6.0, 7.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0634765625, -1.03118896484375, -0.9989013671875, -0.96661376953125, -0.934326171875, -0.90203857421875, -0.8697509765625, -0.83746337890625, -0.80517578125, -0.77288818359375, -0.7406005859375, -0.70831298828125, -0.676025390625, -0.64373779296875, -0.6114501953125, -0.57916259765625, -0.546875, -0.51458740234375, -0.4822998046875, -0.45001220703125, -0.417724609375, -0.38543701171875, -0.3531494140625, -0.32086181640625, -0.28857421875, -0.25628662109375, -0.2239990234375, -0.19171142578125, -0.159423828125, -0.12713623046875, -0.0948486328125, -0.06256103515625, -0.0302734375, 0.00201416015625, 0.0343017578125, 0.06658935546875, 0.098876953125, 0.13116455078125, 0.1634521484375, 0.19573974609375, 0.22802734375, 0.26031494140625, 0.2926025390625, 0.32489013671875, 0.357177734375, 0.38946533203125, 0.4217529296875, 0.45404052734375, 0.486328125, 0.51861572265625, 0.5509033203125, 0.58319091796875, 0.615478515625, 0.64776611328125, 0.6800537109375, 0.71234130859375, 0.74462890625, 0.77691650390625, 0.8092041015625, 0.84149169921875, 0.873779296875, 0.90606689453125, 0.9383544921875, 0.97064208984375, 1.0029296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 16.0, 14.0, 23.0, 41.0, 55.0, 63.0, 108.0, 153.0, 223.0, 340.0, 488.0, 654.0, 957.0, 1436.0, 1972.0, 2964.0, 4471.0, 6159.0, 8963.0, 12893.0, 18837.0, 27545.0, 41787.0, 66383.0, 116669.0, 1289573.0, 209407.0, 103500.0, 60285.0, 38497.0, 25841.0, 17584.0, 11864.0, 8388.0, 5704.0, 3864.0, 2744.0, 1912.0, 1381.0, 964.0, 705.0, 447.0, 370.0, 242.0, 189.0, 142.0, 94.0, 77.0, 43.0, 34.0, 29.0, 10.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0], "bins": [-0.2288818359375, -0.22170639038085938, -0.21453094482421875, -0.20735549926757812, -0.2001800537109375, -0.19300460815429688, -0.18582916259765625, -0.17865371704101562, -0.171478271484375, -0.16430282592773438, -0.15712738037109375, -0.14995193481445312, -0.1427764892578125, -0.13560104370117188, -0.12842559814453125, -0.12125015258789062, -0.11407470703125, -0.10689926147460938, -0.09972381591796875, -0.09254837036132812, -0.0853729248046875, -0.07819747924804688, -0.07102203369140625, -0.06384658813476562, -0.056671142578125, -0.049495697021484375, -0.04232025146484375, -0.035144805908203125, -0.0279693603515625, -0.020793914794921875, -0.01361846923828125, -0.006443023681640625, 0.000732421875, 0.007907867431640625, 0.01508331298828125, 0.022258758544921875, 0.0294342041015625, 0.036609649658203125, 0.04378509521484375, 0.050960540771484375, 0.058135986328125, 0.06531143188476562, 0.07248687744140625, 0.07966232299804688, 0.0868377685546875, 0.09401321411132812, 0.10118865966796875, 0.10836410522460938, 0.11553955078125, 0.12271499633789062, 0.12989044189453125, 0.13706588745117188, 0.1442413330078125, 0.15141677856445312, 0.15859222412109375, 0.16576766967773438, 0.172943115234375, 0.18011856079101562, 0.18729400634765625, 0.19446945190429688, 0.2016448974609375, 0.20882034301757812, 0.21599578857421875, 0.22317123413085938, 0.2303466796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 4.0, 9.0, 9.0, 12.0, 14.0, 14.0, 12.0, 20.0, 26.0, 32.0, 39.0, 48.0, 50.0, 55.0, 53.0, 68.0, 71.0, 65.0, 54.0, 48.0, 52.0, 29.0, 41.0, 27.0, 33.0, 26.0, 10.0, 12.0, 10.0, 10.0, 3.0, 8.0, 9.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.937980651855469e-05, -6.724148988723755e-05, -6.510317325592041e-05, -6.296485662460327e-05, -6.082653999328613e-05, -5.8688223361968994e-05, -5.6549906730651855e-05, -5.441159009933472e-05, -5.227327346801758e-05, -5.013495683670044e-05, -4.79966402053833e-05, -4.585832357406616e-05, -4.3720006942749023e-05, -4.1581690311431885e-05, -3.9443373680114746e-05, -3.730505704879761e-05, -3.516674041748047e-05, -3.302842378616333e-05, -3.089010715484619e-05, -2.8751790523529053e-05, -2.6613473892211914e-05, -2.4475157260894775e-05, -2.2336840629577637e-05, -2.0198523998260498e-05, -1.806020736694336e-05, -1.592189073562622e-05, -1.3783574104309082e-05, -1.1645257472991943e-05, -9.506940841674805e-06, -7.368624210357666e-06, -5.230307579040527e-06, -3.0919909477233887e-06, -9.5367431640625e-07, 1.1846423149108887e-06, 3.3229589462280273e-06, 5.461275577545166e-06, 7.599592208862305e-06, 9.737908840179443e-06, 1.1876225471496582e-05, 1.401454210281372e-05, 1.615285873413086e-05, 1.8291175365447998e-05, 2.0429491996765137e-05, 2.2567808628082275e-05, 2.4706125259399414e-05, 2.6844441890716553e-05, 2.898275852203369e-05, 3.112107515335083e-05, 3.325939178466797e-05, 3.539770841598511e-05, 3.7536025047302246e-05, 3.9674341678619385e-05, 4.1812658309936523e-05, 4.395097494125366e-05, 4.60892915725708e-05, 4.822760820388794e-05, 5.036592483520508e-05, 5.250424146652222e-05, 5.4642558097839355e-05, 5.6780874729156494e-05, 5.891919136047363e-05, 6.105750799179077e-05, 6.319582462310791e-05, 6.533414125442505e-05, 6.747245788574219e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 7.0, 5.0, 11.0, 23.0, 16.0, 21.0, 22.0, 46.0, 32.0, 40.0, 47.0, 59.0, 98.0, 128.0, 149.0, 241.0, 317.0, 469.0, 865.0, 13397.0, 1028482.0, 1825.0, 682.0, 413.0, 285.0, 170.0, 147.0, 146.0, 88.0, 73.0, 44.0, 35.0, 24.0, 23.0, 21.0, 35.0, 9.0, 11.0, 10.0, 5.0, 6.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010995864868164062, -0.001063317060470581, -0.0010270476341247559, -0.0009907782077789307, -0.0009545087814331055, -0.0009182393550872803, -0.0008819699287414551, -0.0008457005023956299, -0.0008094310760498047, -0.0007731616497039795, -0.0007368922233581543, -0.0007006227970123291, -0.0006643533706665039, -0.0006280839443206787, -0.0005918145179748535, -0.0005555450916290283, -0.0005192756652832031, -0.00048300623893737793, -0.00044673681259155273, -0.00041046738624572754, -0.00037419795989990234, -0.00033792853355407715, -0.00030165910720825195, -0.00026538968086242676, -0.00022912025451660156, -0.00019285082817077637, -0.00015658140182495117, -0.00012031197547912598, -8.404254913330078e-05, -4.7773122787475586e-05, -1.150369644165039e-05, 2.4765729904174805e-05, 6.103515625e-05, 9.73045825958252e-05, 0.0001335740089416504, 0.00016984343528747559, 0.00020611286163330078, 0.00024238228797912598, 0.00027865171432495117, 0.00031492114067077637, 0.00035119056701660156, 0.00038745999336242676, 0.00042372941970825195, 0.00045999884605407715, 0.0004962682723999023, 0.0005325376987457275, 0.0005688071250915527, 0.0006050765514373779, 0.0006413459777832031, 0.0006776154041290283, 0.0007138848304748535, 0.0007501542568206787, 0.0007864236831665039, 0.0008226931095123291, 0.0008589625358581543, 0.0008952319622039795, 0.0009315013885498047, 0.0009677708148956299, 0.001004040241241455, 0.0010403096675872803, 0.0010765790939331055, 0.0011128485202789307, 0.0011491179466247559, 0.001185387372970581, 0.0012216567993164062]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 35.0, 888.0, 93.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001707318442640826, -0.00016243892605416477, -0.00015414600784424692, -0.00014585308963432908, -0.000137560156872496, -0.00012926723866257817, -0.00012097432045266032, -0.00011268140224274248, -0.00010438847675686702, -9.609555854694918e-05, -8.780263306107372e-05, -7.950971485115588e-05, -7.121679664123803e-05, -6.292387115536258e-05, -5.463095294544473e-05, -4.633803109754808e-05, -3.804510924965143e-05, -2.975218740175478e-05, -2.1459267372847535e-05, -1.3166347343940288e-05, -4.873425496043637e-06, 3.419496351853013e-06, 1.1712414561770856e-05, 2.0005336409667507e-05, 2.8298258257564157e-05, 3.659118010546081e-05, 4.488410195335746e-05, 5.31770201632753e-05, 6.146993837319314e-05, 6.97628638590686e-05, 7.805578206898645e-05, 8.63487075548619e-05, 9.464164031669497e-05, 0.00010293455852661282, 0.00011122748401248828, 0.00011952040222240612, 0.00012781332770828158, 0.00013610624591819942, 0.00014439916412811726, 0.0001526920823380351, 0.00016098501509986818, 0.00016927793330978602, 0.00017757085151970387, 0.00018586378428153694, 0.00019415670249145478, 0.00020244962070137262, 0.00021074253891129047, 0.0002190354571212083, 0.00022732837533112615, 0.000235621293541044, 0.00024391421175096184, 0.0002522071299608797, 0.00026050006272271276, 0.00026879296638071537, 0.00027708589914254844, 0.0002853788319043815, 0.00029367173556238413, 0.0003019646683242172, 0.0003102575719822198, 0.0003185505047440529, 0.0003268434084020555, 0.0003351363411638886, 0.00034342927392572165, 0.00035172217758372426, 0.00036001511034555733]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 4.0, 7.0, 10.0, 15.0, 13.0, 15.0, 11.0, 13.0, 19.0, 27.0, 22.0, 32.0, 38.0, 26.0, 32.0, 28.0, 41.0, 27.0, 37.0, 38.0, 46.0, 49.0, 46.0, 37.0, 39.0, 33.0, 21.0, 31.0, 25.0, 15.0, 27.0, 17.0, 40.0, 22.0, 21.0, 14.0, 12.0, 6.0, 9.0, 7.0, 4.0, 5.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.635883331298828e-05, -3.5315752029418945e-05, -3.427267074584961e-05, -3.3229589462280273e-05, -3.218650817871094e-05, -3.11434268951416e-05, -3.0100345611572266e-05, -2.905726432800293e-05, -2.8014183044433594e-05, -2.6971101760864258e-05, -2.5928020477294922e-05, -2.4884939193725586e-05, -2.384185791015625e-05, -2.2798776626586914e-05, -2.1755695343017578e-05, -2.0712614059448242e-05, -1.9669532775878906e-05, -1.862645149230957e-05, -1.7583370208740234e-05, -1.65402889251709e-05, -1.5497207641601562e-05, -1.4454126358032227e-05, -1.341104507446289e-05, -1.2367963790893555e-05, -1.1324882507324219e-05, -1.0281801223754883e-05, -9.238719940185547e-06, -8.195638656616211e-06, -7.152557373046875e-06, -6.109476089477539e-06, -5.066394805908203e-06, -4.023313522338867e-06, -2.9802322387695312e-06, -1.9371509552001953e-06, -8.940696716308594e-07, 1.4901161193847656e-07, 1.1920928955078125e-06, 2.2351741790771484e-06, 3.2782554626464844e-06, 4.32133674621582e-06, 5.364418029785156e-06, 6.407499313354492e-06, 7.450580596923828e-06, 8.493661880493164e-06, 9.5367431640625e-06, 1.0579824447631836e-05, 1.1622905731201172e-05, 1.2665987014770508e-05, 1.3709068298339844e-05, 1.475214958190918e-05, 1.5795230865478516e-05, 1.683831214904785e-05, 1.7881393432617188e-05, 1.8924474716186523e-05, 1.996755599975586e-05, 2.1010637283325195e-05, 2.205371856689453e-05, 2.3096799850463867e-05, 2.4139881134033203e-05, 2.518296241760254e-05, 2.6226043701171875e-05, 2.726912498474121e-05, 2.8312206268310547e-05, 2.9355287551879883e-05, 3.039836883544922e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 1.0, 5.0, 6.0, 10.0, 12.0, 11.0, 15.0, 21.0, 19.0, 23.0, 24.0, 20.0, 34.0, 44.0, 35.0, 41.0, 42.0, 37.0, 47.0, 54.0, 51.0, 45.0, 46.0, 49.0, 37.0, 43.0, 34.0, 22.0, 31.0, 25.0, 18.0, 29.0, 10.0, 11.0, 8.0, 13.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.499847412109375, -1.44500732421875, -1.390167236328125, -1.3353271484375, -1.280487060546875, -1.22564697265625, -1.170806884765625, -1.115966796875, -1.061126708984375, -1.00628662109375, -0.951446533203125, -0.8966064453125, -0.841766357421875, -0.78692626953125, -0.732086181640625, -0.67724609375, -0.622406005859375, -0.56756591796875, -0.512725830078125, -0.4578857421875, -0.403045654296875, -0.34820556640625, -0.293365478515625, -0.238525390625, -0.183685302734375, -0.12884521484375, -0.074005126953125, -0.0191650390625, 0.035675048828125, 0.09051513671875, 0.145355224609375, 0.2001953125, 0.255035400390625, 0.30987548828125, 0.364715576171875, 0.4195556640625, 0.474395751953125, 0.52923583984375, 0.584075927734375, 0.638916015625, 0.693756103515625, 0.74859619140625, 0.803436279296875, 0.8582763671875, 0.913116455078125, 0.96795654296875, 1.022796630859375, 1.07763671875, 1.132476806640625, 1.18731689453125, 1.242156982421875, 1.2969970703125, 1.351837158203125, 1.40667724609375, 1.461517333984375, 1.516357421875, 1.571197509765625, 1.62603759765625, 1.680877685546875, 1.7357177734375, 1.790557861328125, 1.84539794921875, 1.900238037109375, 1.955078125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 5.0, 5.0, 13.0, 17.0, 24.0, 24.0, 36.0, 54.0, 65.0, 93.0, 108.0, 167.0, 204.0, 284.0, 385.0, 512.0, 709.0, 1041.0, 1343.0, 1881.0, 2874.0, 4679.0, 8767.0, 20892.0, 101709.0, 672134.0, 176356.0, 27795.0, 10147.0, 5401.0, 3226.0, 2145.0, 1514.0, 1046.0, 707.0, 560.0, 471.0, 280.0, 213.0, 179.0, 129.0, 92.0, 70.0, 59.0, 44.0, 22.0, 19.0, 17.0, 15.0, 9.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.63909912109375, -6.4071044921875, -6.17510986328125, -5.943115234375, -5.71112060546875, -5.4791259765625, -5.24713134765625, -5.01513671875, -4.78314208984375, -4.5511474609375, -4.31915283203125, -4.087158203125, -3.85516357421875, -3.6231689453125, -3.39117431640625, -3.1591796875, -2.92718505859375, -2.6951904296875, -2.46319580078125, -2.231201171875, -1.99920654296875, -1.7672119140625, -1.53521728515625, -1.30322265625, -1.07122802734375, -0.8392333984375, -0.60723876953125, -0.375244140625, -0.14324951171875, 0.0887451171875, 0.32073974609375, 0.552734375, 0.78472900390625, 1.0167236328125, 1.24871826171875, 1.480712890625, 1.71270751953125, 1.9447021484375, 2.17669677734375, 2.40869140625, 2.64068603515625, 2.8726806640625, 3.10467529296875, 3.336669921875, 3.56866455078125, 3.8006591796875, 4.03265380859375, 4.2646484375, 4.49664306640625, 4.7286376953125, 4.96063232421875, 5.192626953125, 5.42462158203125, 5.6566162109375, 5.88861083984375, 6.12060546875, 6.35260009765625, 6.5845947265625, 6.81658935546875, 7.048583984375, 7.28057861328125, 7.5125732421875, 7.74456787109375, 7.9765625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 15.0, 14.0, 17.0, 11.0, 15.0, 21.0, 25.0, 22.0, 30.0, 28.0, 40.0, 37.0, 41.0, 65.0, 113.0, 190.0, 276.0, 1370.0, 167.0, 92.0, 65.0, 62.0, 34.0, 34.0, 28.0, 26.0, 36.0, 17.0, 21.0, 20.0, 18.0, 10.0, 10.0, 10.0, 6.0, 9.0, 9.0, 3.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0], "bins": [-5.6953125, -5.5328369140625, -5.370361328125, -5.2078857421875, -5.04541015625, -4.8829345703125, -4.720458984375, -4.5579833984375, -4.3955078125, -4.2330322265625, -4.070556640625, -3.9080810546875, -3.74560546875, -3.5831298828125, -3.420654296875, -3.2581787109375, -3.095703125, -2.9332275390625, -2.770751953125, -2.6082763671875, -2.44580078125, -2.2833251953125, -2.120849609375, -1.9583740234375, -1.7958984375, -1.6334228515625, -1.470947265625, -1.3084716796875, -1.14599609375, -0.9835205078125, -0.821044921875, -0.6585693359375, -0.49609375, -0.3336181640625, -0.171142578125, -0.0086669921875, 0.15380859375, 0.3162841796875, 0.478759765625, 0.6412353515625, 0.8037109375, 0.9661865234375, 1.128662109375, 1.2911376953125, 1.45361328125, 1.6160888671875, 1.778564453125, 1.9410400390625, 2.103515625, 2.2659912109375, 2.428466796875, 2.5909423828125, 2.75341796875, 2.9158935546875, 3.078369140625, 3.2408447265625, 3.4033203125, 3.5657958984375, 3.728271484375, 3.8907470703125, 4.05322265625, 4.2156982421875, 4.378173828125, 4.5406494140625, 4.703125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 10.0, 4.0, 6.0, 9.0, 8.0, 11.0, 9.0, 13.0, 16.0, 12.0, 25.0, 14.0, 27.0, 35.0, 35.0, 73.0, 102.0, 154.0, 274.0, 631.0, 2175.0, 68979.0, 3052408.0, 18001.0, 1447.0, 482.0, 242.0, 125.0, 69.0, 54.0, 35.0, 27.0, 39.0, 29.0, 21.0, 11.0, 14.0, 19.0, 11.0, 11.0, 9.0, 6.0, 4.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.640625, -17.0400390625, -16.439453125, -15.8388671875, -15.23828125, -14.6376953125, -14.037109375, -13.4365234375, -12.8359375, -12.2353515625, -11.634765625, -11.0341796875, -10.43359375, -9.8330078125, -9.232421875, -8.6318359375, -8.03125, -7.4306640625, -6.830078125, -6.2294921875, -5.62890625, -5.0283203125, -4.427734375, -3.8271484375, -3.2265625, -2.6259765625, -2.025390625, -1.4248046875, -0.82421875, -0.2236328125, 0.376953125, 0.9775390625, 1.578125, 2.1787109375, 2.779296875, 3.3798828125, 3.98046875, 4.5810546875, 5.181640625, 5.7822265625, 6.3828125, 6.9833984375, 7.583984375, 8.1845703125, 8.78515625, 9.3857421875, 9.986328125, 10.5869140625, 11.1875, 11.7880859375, 12.388671875, 12.9892578125, 13.58984375, 14.1904296875, 14.791015625, 15.3916015625, 15.9921875, 16.5927734375, 17.193359375, 17.7939453125, 18.39453125, 18.9951171875, 19.595703125, 20.1962890625, 20.796875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 169.0, 657.0, 167.0, 10.0, 0.0, 1.0], "bins": [-82.16666412353516, -80.78565216064453, -79.4046401977539, -78.02362823486328, -76.64261627197266, -75.26160430908203, -73.8805923461914, -72.49958038330078, -71.11856842041016, -69.73755645751953, -68.3565444946289, -66.97553253173828, -65.59452056884766, -64.21350860595703, -62.832496643066406, -61.45148468017578, -60.070472717285156, -58.68946075439453, -57.308448791503906, -55.92743682861328, -54.546424865722656, -53.16541290283203, -51.784400939941406, -50.40338897705078, -49.02237319946289, -47.641361236572266, -46.26034927368164, -44.879337310791016, -43.49832534790039, -42.117313385009766, -40.73630142211914, -39.355289459228516, -37.97427749633789, -36.593265533447266, -35.21225357055664, -33.831241607666016, -32.45022964477539, -31.069217681884766, -29.68820571899414, -28.307193756103516, -26.92618179321289, -25.545169830322266, -24.16415786743164, -22.783145904541016, -21.40213394165039, -20.021121978759766, -18.64011001586914, -17.259098052978516, -15.878084182739258, -14.497072219848633, -13.116060256958008, -11.735048294067383, -10.354036331176758, -8.973024368286133, -7.592011451721191, -6.210999488830566, -4.829987525939941, -3.4489755630493164, -2.0679633617401123, -0.6869511604309082, 0.6940608024597168, 2.075072765350342, 3.456085205078125, 4.83709716796875, 6.218109130859375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 6.0, 6.0, 16.0, 17.0, 16.0, 19.0, 15.0, 27.0, 13.0, 28.0, 30.0, 31.0, 27.0, 36.0, 43.0, 42.0, 28.0, 49.0, 37.0, 41.0, 37.0, 34.0, 43.0, 29.0, 33.0, 37.0, 25.0, 17.0, 39.0, 14.0, 22.0, 25.0, 12.0, 9.0, 16.0, 12.0, 7.0, 6.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.75569725036621, -16.251174926757812, -15.746650695800781, -15.242127418518066, -14.737604141235352, -14.233081817626953, -13.728558540344238, -13.224035263061523, -12.719511985778809, -12.214988708496094, -11.710465431213379, -11.205942153930664, -10.701419830322266, -10.196895599365234, -9.692373275756836, -9.187849998474121, -8.683326721191406, -8.178803443908691, -7.674280166625977, -7.16975736618042, -6.665234088897705, -6.16071081161499, -5.656188011169434, -5.151664733886719, -4.647141456604004, -4.142618179321289, -3.6380951404571533, -3.1335721015930176, -2.6290488243103027, -2.124525547027588, -1.6200025081634521, -1.1154794692993164, -0.6109542846679688, -0.10643112659454346, 0.39809203147888184, 0.9026151895523071, 1.4071383476257324, 1.9116616249084473, 2.416184663772583, 2.9207077026367188, 3.4252309799194336, 3.9297542572021484, 4.434277534484863, 4.93880033493042, 5.443323612213135, 5.94784688949585, 6.452369689941406, 6.956892967224121, 7.461416244506836, 7.965939521789551, 8.470462799072266, 8.97498607635498, 9.479509353637695, 9.984031677246094, 10.488554954528809, 10.993078231811523, 11.497601509094238, 12.002124786376953, 12.506648063659668, 13.011171340942383, 13.515693664550781, 14.020217895507812, 14.524740219116211, 15.029263496398926, 15.53378677368164]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 10.0, 7.0, 5.0, 11.0, 10.0, 13.0, 19.0, 15.0, 20.0, 27.0, 26.0, 27.0, 31.0, 43.0, 43.0, 26.0, 47.0, 43.0, 47.0, 55.0, 53.0, 44.0, 42.0, 42.0, 45.0, 35.0, 33.0, 28.0, 30.0, 23.0, 17.0, 20.0, 12.0, 18.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.685760498046875, -1.62542724609375, -1.565093994140625, -1.5047607421875, -1.444427490234375, -1.38409423828125, -1.323760986328125, -1.263427734375, -1.203094482421875, -1.14276123046875, -1.082427978515625, -1.0220947265625, -0.961761474609375, -0.90142822265625, -0.841094970703125, -0.78076171875, -0.720428466796875, -0.66009521484375, -0.599761962890625, -0.5394287109375, -0.479095458984375, -0.41876220703125, -0.358428955078125, -0.298095703125, -0.237762451171875, -0.17742919921875, -0.117095947265625, -0.0567626953125, 0.003570556640625, 0.06390380859375, 0.124237060546875, 0.1845703125, 0.244903564453125, 0.30523681640625, 0.365570068359375, 0.4259033203125, 0.486236572265625, 0.54656982421875, 0.606903076171875, 0.667236328125, 0.727569580078125, 0.78790283203125, 0.848236083984375, 0.9085693359375, 0.968902587890625, 1.02923583984375, 1.089569091796875, 1.14990234375, 1.210235595703125, 1.27056884765625, 1.330902099609375, 1.3912353515625, 1.451568603515625, 1.51190185546875, 1.572235107421875, 1.632568359375, 1.692901611328125, 1.75323486328125, 1.813568115234375, 1.8739013671875, 1.934234619140625, 1.99456787109375, 2.054901123046875, 2.115234375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 11.0, 6.0, 7.0, 15.0, 17.0, 22.0, 29.0, 47.0, 58.0, 89.0, 111.0, 138.0, 217.0, 327.0, 539.0, 925.0, 1530.0, 2854.0, 5924.0, 13750.0, 42170.0, 237811.0, 2545061.0, 1187643.0, 109444.0, 26385.0, 9608.0, 4283.0, 2172.0, 1148.0, 651.0, 391.0, 261.0, 177.0, 108.0, 92.0, 71.0, 41.0, 37.0, 29.0, 15.0, 13.0, 14.0, 6.0, 6.0, 3.0, 6.0, 1.0, 8.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.64453125, -7.41839599609375, -7.1922607421875, -6.96612548828125, -6.739990234375, -6.51385498046875, -6.2877197265625, -6.06158447265625, -5.83544921875, -5.60931396484375, -5.3831787109375, -5.15704345703125, -4.930908203125, -4.70477294921875, -4.4786376953125, -4.25250244140625, -4.0263671875, -3.80023193359375, -3.5740966796875, -3.34796142578125, -3.121826171875, -2.89569091796875, -2.6695556640625, -2.44342041015625, -2.21728515625, -1.99114990234375, -1.7650146484375, -1.53887939453125, -1.312744140625, -1.08660888671875, -0.8604736328125, -0.63433837890625, -0.408203125, -0.18206787109375, 0.0440673828125, 0.27020263671875, 0.496337890625, 0.72247314453125, 0.9486083984375, 1.17474365234375, 1.40087890625, 1.62701416015625, 1.8531494140625, 2.07928466796875, 2.305419921875, 2.53155517578125, 2.7576904296875, 2.98382568359375, 3.2099609375, 3.43609619140625, 3.6622314453125, 3.88836669921875, 4.114501953125, 4.34063720703125, 4.5667724609375, 4.79290771484375, 5.01904296875, 5.24517822265625, 5.4713134765625, 5.69744873046875, 5.923583984375, 6.14971923828125, 6.3758544921875, 6.60198974609375, 6.828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 12.0, 11.0, 19.0, 43.0, 66.0, 92.0, 180.0, 266.0, 498.0, 779.0, 794.0, 508.0, 348.0, 197.0, 102.0, 69.0, 43.0, 18.0, 15.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.5302734375, -6.169921875, -5.8095703125, -5.44921875, -5.0888671875, -4.728515625, -4.3681640625, -4.0078125, -3.6474609375, -3.287109375, -2.9267578125, -2.56640625, -2.2060546875, -1.845703125, -1.4853515625, -1.125, -0.7646484375, -0.404296875, -0.0439453125, 0.31640625, 0.6767578125, 1.037109375, 1.3974609375, 1.7578125, 2.1181640625, 2.478515625, 2.8388671875, 3.19921875, 3.5595703125, 3.919921875, 4.2802734375, 4.640625, 5.0009765625, 5.361328125, 5.7216796875, 6.08203125, 6.4423828125, 6.802734375, 7.1630859375, 7.5234375, 7.8837890625, 8.244140625, 8.6044921875, 8.96484375, 9.3251953125, 9.685546875, 10.0458984375, 10.40625, 10.7666015625, 11.126953125, 11.4873046875, 11.84765625, 12.2080078125, 12.568359375, 12.9287109375, 13.2890625, 13.6494140625, 14.009765625, 14.3701171875, 14.73046875, 15.0908203125, 15.451171875, 15.8115234375, 16.171875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 15.0, 28.0, 41.0, 72.0, 140.0, 280.0, 878.0, 13716.0, 4160214.0, 17197.0, 1008.0, 329.0, 131.0, 75.0, 54.0, 36.0, 13.0, 17.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0], "bins": [-70.9375, -69.475341796875, -68.01318359375, -66.551025390625, -65.0888671875, -63.626708984375, -62.16455078125, -60.702392578125, -59.240234375, -57.778076171875, -56.31591796875, -54.853759765625, -53.3916015625, -51.929443359375, -50.46728515625, -49.005126953125, -47.54296875, -46.080810546875, -44.61865234375, -43.156494140625, -41.6943359375, -40.232177734375, -38.77001953125, -37.307861328125, -35.845703125, -34.383544921875, -32.92138671875, -31.459228515625, -29.9970703125, -28.534912109375, -27.07275390625, -25.610595703125, -24.1484375, -22.686279296875, -21.22412109375, -19.761962890625, -18.2998046875, -16.837646484375, -15.37548828125, -13.913330078125, -12.451171875, -10.989013671875, -9.52685546875, -8.064697265625, -6.6025390625, -5.140380859375, -3.67822265625, -2.216064453125, -0.75390625, 0.708251953125, 2.17041015625, 3.632568359375, 5.0947265625, 6.556884765625, 8.01904296875, 9.481201171875, 10.943359375, 12.405517578125, 13.86767578125, 15.329833984375, 16.7919921875, 18.254150390625, 19.71630859375, 21.178466796875, 22.640625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 31.0, 631.0, 349.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.17491149902344, -168.1968994140625, -163.2188720703125, -158.24085998535156, -153.26283264160156, -148.28482055664062, -143.30679321289062, -138.3287811279297, -133.35076904296875, -128.3727569580078, -123.39472961425781, -118.41670989990234, -113.43869018554688, -108.46067810058594, -103.48265838623047, -98.504638671875, -93.526611328125, -88.54859161376953, -83.57057189941406, -78.5925521850586, -73.61453247070312, -68.63652038574219, -63.65850067138672, -58.68048095703125, -53.70246124267578, -48.72444152832031, -43.746421813964844, -38.76840591430664, -33.79038619995117, -28.812366485595703, -23.834348678588867, -18.85633087158203, -13.878326416015625, -8.900307655334473, -3.9222888946533203, 1.055729866027832, 6.033748626708984, 11.011768341064453, 15.989786148071289, 20.967803955078125, 25.945823669433594, 30.923843383789062, 35.90186309814453, 40.879878997802734, 45.8578987121582, 50.83591842651367, 55.813934326171875, 60.791954040527344, 65.76997375488281, 70.74799346923828, 75.72601318359375, 80.70403289794922, 85.68205261230469, 90.66006469726562, 95.6380844116211, 100.61610412597656, 105.59412384033203, 110.5721435546875, 115.55016326904297, 120.52818298339844, 125.50619506835938, 130.48422241210938, 135.4622344970703, 140.44024658203125, 145.41827392578125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 18.0, 6.0, 15.0, 17.0, 21.0, 25.0, 26.0, 25.0, 29.0, 31.0, 34.0, 49.0, 41.0, 52.0, 48.0, 38.0, 49.0, 35.0, 62.0, 38.0, 27.0, 33.0, 36.0, 33.0, 33.0, 26.0, 22.0, 18.0, 15.0, 11.0, 10.0, 9.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.26920509338379, -28.47728157043457, -27.68535804748535, -26.893434524536133, -26.101511001586914, -25.309587478637695, -24.517663955688477, -23.725740432739258, -22.93381690979004, -22.14189338684082, -21.3499698638916, -20.558046340942383, -19.766122817993164, -18.974199295043945, -18.182275772094727, -17.390352249145508, -16.59842872619629, -15.80650520324707, -15.014581680297852, -14.222658157348633, -13.430734634399414, -12.638811111450195, -11.846887588500977, -11.054964065551758, -10.263040542602539, -9.47111701965332, -8.679193496704102, -7.887269973754883, -7.095346450805664, -6.303422927856445, -5.511499404907227, -4.719575881958008, -3.927654266357422, -3.135730743408203, -2.3438072204589844, -1.5518836975097656, -0.7599601745605469, 0.031963348388671875, 0.8238868713378906, 1.6158103942871094, 2.407733917236328, 3.199657440185547, 3.9915809631347656, 4.783504486083984, 5.575428009033203, 6.367351531982422, 7.159275054931641, 7.951198577880859, 8.743122100830078, 9.535045623779297, 10.326969146728516, 11.118892669677734, 11.910816192626953, 12.702739715576172, 13.49466323852539, 14.28658676147461, 15.078510284423828, 15.870433807373047, 16.662357330322266, 17.454280853271484, 18.246204376220703, 19.038127899169922, 19.83005142211914, 20.62197494506836, 21.413898468017578]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 10.0, 11.0, 6.0, 7.0, 12.0, 12.0, 18.0, 21.0, 14.0, 22.0, 30.0, 26.0, 29.0, 29.0, 33.0, 28.0, 35.0, 37.0, 43.0, 40.0, 61.0, 50.0, 41.0, 46.0, 40.0, 44.0, 38.0, 29.0, 33.0, 25.0, 20.0, 21.0, 11.0, 20.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9409942626953125, -1.881988525390625, -1.8229827880859375, -1.76397705078125, -1.7049713134765625, -1.645965576171875, -1.5869598388671875, -1.5279541015625, -1.4689483642578125, -1.409942626953125, -1.3509368896484375, -1.29193115234375, -1.2329254150390625, -1.173919677734375, -1.1149139404296875, -1.055908203125, -0.9969024658203125, -0.937896728515625, -0.8788909912109375, -0.81988525390625, -0.7608795166015625, -0.701873779296875, -0.6428680419921875, -0.5838623046875, -0.5248565673828125, -0.465850830078125, -0.4068450927734375, -0.34783935546875, -0.2888336181640625, -0.229827880859375, -0.1708221435546875, -0.11181640625, -0.0528106689453125, 0.006195068359375, 0.0652008056640625, 0.12420654296875, 0.1832122802734375, 0.242218017578125, 0.3012237548828125, 0.3602294921875, 0.4192352294921875, 0.478240966796875, 0.5372467041015625, 0.59625244140625, 0.6552581787109375, 0.714263916015625, 0.7732696533203125, 0.832275390625, 0.8912811279296875, 0.950286865234375, 1.0092926025390625, 1.06829833984375, 1.1273040771484375, 1.186309814453125, 1.2453155517578125, 1.3043212890625, 1.3633270263671875, 1.422332763671875, 1.4813385009765625, 1.54034423828125, 1.5993499755859375, 1.658355712890625, 1.7173614501953125, 1.7763671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 31.0, 28.0, 43.0, 74.0, 102.0, 127.0, 212.0, 341.0, 445.0, 710.0, 988.0, 1548.0, 2371.0, 3366.0, 5271.0, 8430.0, 13109.0, 21275.0, 35288.0, 59312.0, 105862.0, 240259.0, 273999.0, 113601.0, 62751.0, 37111.0, 22422.0, 13931.0, 8684.0, 5610.0, 3744.0, 2474.0, 1596.0, 1085.0, 741.0, 505.0, 351.0, 235.0, 169.0, 103.0, 75.0, 50.0, 41.0, 27.0, 13.0, 9.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.329833984375, -0.3192138671875, -0.30859375, -0.2979736328125, -0.287353515625, -0.2767333984375, -0.26611328125, -0.2554931640625, -0.244873046875, -0.2342529296875, -0.2236328125, -0.2130126953125, -0.202392578125, -0.1917724609375, -0.18115234375, -0.1705322265625, -0.159912109375, -0.1492919921875, -0.138671875, -0.1280517578125, -0.117431640625, -0.1068115234375, -0.09619140625, -0.0855712890625, -0.074951171875, -0.0643310546875, -0.0537109375, -0.0430908203125, -0.032470703125, -0.0218505859375, -0.01123046875, -0.0006103515625, 0.010009765625, 0.0206298828125, 0.03125, 0.0418701171875, 0.052490234375, 0.0631103515625, 0.07373046875, 0.0843505859375, 0.094970703125, 0.1055908203125, 0.1162109375, 0.1268310546875, 0.137451171875, 0.1480712890625, 0.15869140625, 0.1693115234375, 0.179931640625, 0.1905517578125, 0.201171875, 0.2117919921875, 0.222412109375, 0.2330322265625, 0.24365234375, 0.2542724609375, 0.264892578125, 0.2755126953125, 0.2861328125, 0.2967529296875, 0.307373046875, 0.3179931640625, 0.32861328125, 0.3392333984375, 0.349853515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 10.0, 9.0, 16.0, 19.0, 20.0, 22.0, 12.0, 14.0, 16.0, 25.0, 29.0, 25.0, 31.0, 30.0, 32.0, 24.0, 40.0, 38.0, 34.0, 1064.0, 31.0, 37.0, 37.0, 46.0, 37.0, 29.0, 34.0, 24.0, 25.0, 28.0, 22.0, 22.0, 18.0, 21.0, 10.0, 16.0, 9.0, 8.0, 8.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0498046875, -1.0162506103515625, -0.982696533203125, -0.9491424560546875, -0.91558837890625, -0.8820343017578125, -0.848480224609375, -0.8149261474609375, -0.7813720703125, -0.7478179931640625, -0.714263916015625, -0.6807098388671875, -0.64715576171875, -0.6136016845703125, -0.580047607421875, -0.5464935302734375, -0.512939453125, -0.4793853759765625, -0.445831298828125, -0.4122772216796875, -0.37872314453125, -0.3451690673828125, -0.311614990234375, -0.2780609130859375, -0.2445068359375, -0.2109527587890625, -0.177398681640625, -0.1438446044921875, -0.11029052734375, -0.0767364501953125, -0.043182373046875, -0.0096282958984375, 0.02392578125, 0.0574798583984375, 0.091033935546875, 0.1245880126953125, 0.15814208984375, 0.1916961669921875, 0.225250244140625, 0.2588043212890625, 0.2923583984375, 0.3259124755859375, 0.359466552734375, 0.3930206298828125, 0.42657470703125, 0.4601287841796875, 0.493682861328125, 0.5272369384765625, 0.560791015625, 0.5943450927734375, 0.627899169921875, 0.6614532470703125, 0.69500732421875, 0.7285614013671875, 0.762115478515625, 0.7956695556640625, 0.8292236328125, 0.8627777099609375, 0.896331787109375, 0.9298858642578125, 0.96343994140625, 0.9969940185546875, 1.030548095703125, 1.0641021728515625, 1.09765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 8.0, 12.0, 21.0, 39.0, 57.0, 64.0, 90.0, 132.0, 174.0, 280.0, 414.0, 514.0, 696.0, 1026.0, 1412.0, 1910.0, 2671.0, 3779.0, 5171.0, 7078.0, 9874.0, 13753.0, 19038.0, 26981.0, 39583.0, 60424.0, 98990.0, 186081.0, 1275836.0, 119936.0, 69929.0, 45029.0, 30523.0, 21165.0, 15086.0, 10726.0, 7912.0, 5685.0, 4233.0, 3059.0, 2216.0, 1686.0, 1137.0, 793.0, 578.0, 401.0, 275.0, 209.0, 136.0, 111.0, 72.0, 56.0, 25.0, 25.0, 11.0, 7.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.2374267578125, -0.23004531860351562, -0.22266387939453125, -0.21528244018554688, -0.2079010009765625, -0.20051956176757812, -0.19313812255859375, -0.18575668334960938, -0.178375244140625, -0.17099380493164062, -0.16361236572265625, -0.15623092651367188, -0.1488494873046875, -0.14146804809570312, -0.13408660888671875, -0.12670516967773438, -0.11932373046875, -0.11194229125976562, -0.10456085205078125, -0.09717941284179688, -0.0897979736328125, -0.08241653442382812, -0.07503509521484375, -0.06765365600585938, -0.060272216796875, -0.052890777587890625, -0.04550933837890625, -0.038127899169921875, -0.0307464599609375, -0.023365020751953125, -0.01598358154296875, -0.008602142333984375, -0.001220703125, 0.006160736083984375, 0.01354217529296875, 0.020923614501953125, 0.0283050537109375, 0.035686492919921875, 0.04306793212890625, 0.050449371337890625, 0.057830810546875, 0.06521224975585938, 0.07259368896484375, 0.07997512817382812, 0.0873565673828125, 0.09473800659179688, 0.10211944580078125, 0.10950088500976562, 0.11688232421875, 0.12426376342773438, 0.13164520263671875, 0.13902664184570312, 0.1464080810546875, 0.15378952026367188, 0.16117095947265625, 0.16855239868164062, 0.175933837890625, 0.18331527709960938, 0.19069671630859375, 0.19807815551757812, 0.2054595947265625, 0.21284103393554688, 0.22022247314453125, 0.22760391235351562, 0.2349853515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 8.0, 9.0, 10.0, 12.0, 20.0, 21.0, 29.0, 40.0, 47.0, 52.0, 59.0, 66.0, 65.0, 81.0, 82.0, 66.0, 49.0, 49.0, 51.0, 39.0, 33.0, 24.0, 18.0, 14.0, 9.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.578466415405273e-05, -9.315088391304016e-05, -9.051710367202759e-05, -8.788332343101501e-05, -8.524954319000244e-05, -8.261576294898987e-05, -7.99819827079773e-05, -7.734820246696472e-05, -7.471442222595215e-05, -7.208064198493958e-05, -6.9446861743927e-05, -6.681308150291443e-05, -6.417930126190186e-05, -6.154552102088928e-05, -5.891174077987671e-05, -5.6277960538864136e-05, -5.364418029785156e-05, -5.101040005683899e-05, -4.8376619815826416e-05, -4.574283957481384e-05, -4.310905933380127e-05, -4.0475279092788696e-05, -3.784149885177612e-05, -3.520771861076355e-05, -3.2573938369750977e-05, -2.9940158128738403e-05, -2.730637788772583e-05, -2.4672597646713257e-05, -2.2038817405700684e-05, -1.940503716468811e-05, -1.6771256923675537e-05, -1.4137476682662964e-05, -1.150369644165039e-05, -8.869916200637817e-06, -6.236135959625244e-06, -3.602355718612671e-06, -9.685754776000977e-07, 1.6652047634124756e-06, 4.298985004425049e-06, 6.932765245437622e-06, 9.566545486450195e-06, 1.2200325727462769e-05, 1.4834105968475342e-05, 1.7467886209487915e-05, 2.0101666450500488e-05, 2.273544669151306e-05, 2.5369226932525635e-05, 2.8003007173538208e-05, 3.063678741455078e-05, 3.3270567655563354e-05, 3.590434789657593e-05, 3.85381281375885e-05, 4.1171908378601074e-05, 4.380568861961365e-05, 4.643946886062622e-05, 4.9073249101638794e-05, 5.170702934265137e-05, 5.434080958366394e-05, 5.6974589824676514e-05, 5.960837006568909e-05, 6.224215030670166e-05, 6.487593054771423e-05, 6.75097107887268e-05, 7.014349102973938e-05, 7.277727127075195e-05]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 7.0, 7.0, 16.0, 15.0, 23.0, 29.0, 45.0, 60.0, 72.0, 123.0, 158.0, 264.0, 505.0, 1214.0, 978979.0, 64951.0, 910.0, 400.0, 219.0, 147.0, 98.0, 105.0, 57.0, 45.0, 23.0, 19.0, 11.0, 12.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015001296997070312, -0.0014442652463912964, -0.0013884007930755615, -0.0013325363397598267, -0.0012766718864440918, -0.001220807433128357, -0.001164942979812622, -0.0011090785264968872, -0.0010532140731811523, -0.0009973496198654175, -0.0009414851665496826, -0.0008856207132339478, -0.0008297562599182129, -0.000773891806602478, -0.0007180273532867432, -0.0006621628999710083, -0.0006062984466552734, -0.0005504339933395386, -0.0004945695400238037, -0.00043870508670806885, -0.000382840633392334, -0.0003269761800765991, -0.00027111172676086426, -0.0002152472734451294, -0.00015938282012939453, -0.00010351836681365967, -4.7653913497924805e-05, 8.210539817810059e-06, 6.407499313354492e-05, 0.00011993944644927979, 0.00017580389976501465, 0.0002316683530807495, 0.0002875328063964844, 0.00034339725971221924, 0.0003992617130279541, 0.00045512616634368896, 0.0005109906196594238, 0.0005668550729751587, 0.0006227195262908936, 0.0006785839796066284, 0.0007344484329223633, 0.0007903128862380981, 0.000846177339553833, 0.0009020417928695679, 0.0009579062461853027, 0.0010137706995010376, 0.0010696351528167725, 0.0011254996061325073, 0.0011813640594482422, 0.001237228512763977, 0.001293092966079712, 0.0013489574193954468, 0.0014048218727111816, 0.0014606863260269165, 0.0015165507793426514, 0.0015724152326583862, 0.001628279685974121, 0.001684144139289856, 0.0017400085926055908, 0.0017958730459213257, 0.0018517374992370605, 0.0019076019525527954, 0.0019634664058685303, 0.002019330859184265, 0.0020751953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 81.0, 663.0, 255.0, 11.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003224206157028675, -0.0003155171580146998, -0.0003086137003265321, -0.00030171024263836443, -0.00029480678495019674, -0.00028790332726202905, -0.00028099986957386136, -0.00027409641188569367, -0.000267192954197526, -0.0002602894965093583, -0.0002533860388211906, -0.0002464825811330229, -0.0002395791234448552, -0.00023267566575668752, -0.00022577220806851983, -0.00021886876493226737, -0.0002119653217960149, -0.00020506186410784721, -0.00019815840641967952, -0.00019125494873151183, -0.00018435149104334414, -0.00017744803335517645, -0.00017054457566700876, -0.0001636411325307563, -0.00015673766029067338, -0.00014983420260250568, -0.000142930744914338, -0.0001360272872261703, -0.0001291238295380026, -0.00012222037184983492, -0.00011531692143762484, -0.00010841347102541476, -0.00010151002061320469, -9.4606562925037e-05, -8.77031052368693e-05, -8.079965482465923e-05, -7.389619713649154e-05, -6.699273944832385e-05, -6.0089281760156155e-05, -5.318582770996727e-05, -4.628237002179958e-05, -3.937891233363189e-05, -3.2475458283443004e-05, -2.5572000595275313e-05, -1.8668544726097025e-05, -1.1765088856918737e-05, -4.861631168751046e-06, 2.041822881437838e-06, 8.94528056960553e-06, 1.5848736438783817e-05, 2.2752192307962105e-05, 2.9655649996129796e-05, 3.655910404631868e-05, 4.346256173448637e-05, 5.036601942265406e-05, 5.726947347284295e-05, 6.417292752303183e-05, 7.107638521119952e-05, 7.797984289936721e-05, 8.48833005875349e-05, 9.178675099974498e-05, 9.869020868791267e-05, 0.00010559366637608036, 0.00011249711678829044, 0.00011940058175241575]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 8.0, 2.0, 7.0, 9.0, 16.0, 10.0, 15.0, 16.0, 11.0, 14.0, 19.0, 29.0, 34.0, 32.0, 24.0, 38.0, 35.0, 39.0, 51.0, 50.0, 46.0, 49.0, 35.0, 37.0, 32.0, 35.0, 31.0, 43.0, 30.0, 37.0, 27.0, 11.0, 28.0, 22.0, 20.0, 11.0, 8.0, 7.0, 12.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.496836870908737e-05, -3.3697113394737244e-05, -3.2425858080387115e-05, -3.115460276603699e-05, -2.988334745168686e-05, -2.861209213733673e-05, -2.7340836822986603e-05, -2.6069581508636475e-05, -2.4798326194286346e-05, -2.3527070879936218e-05, -2.225581556558609e-05, -2.0984560251235962e-05, -1.9713304936885834e-05, -1.8442049622535706e-05, -1.7170794308185577e-05, -1.589953899383545e-05, -1.4628283679485321e-05, -1.3357028365135193e-05, -1.2085773050785065e-05, -1.0814517736434937e-05, -9.543262422084808e-06, -8.27200710773468e-06, -7.000751793384552e-06, -5.729496479034424e-06, -4.458241164684296e-06, -3.1869858503341675e-06, -1.9157305359840393e-06, -6.444752216339111e-07, 6.26780092716217e-07, 1.8980354070663452e-06, 3.1692907214164734e-06, 4.4405460357666016e-06, 5.71180135011673e-06, 6.983056664466858e-06, 8.254311978816986e-06, 9.525567293167114e-06, 1.0796822607517242e-05, 1.206807792186737e-05, 1.3339333236217499e-05, 1.4610588550567627e-05, 1.5881843864917755e-05, 1.7153099179267883e-05, 1.842435449361801e-05, 1.969560980796814e-05, 2.0966865122318268e-05, 2.2238120436668396e-05, 2.3509375751018524e-05, 2.4780631065368652e-05, 2.605188637971878e-05, 2.732314169406891e-05, 2.8594397008419037e-05, 2.9865652322769165e-05, 3.113690763711929e-05, 3.240816295146942e-05, 3.367941826581955e-05, 3.495067358016968e-05, 3.6221928894519806e-05, 3.7493184208869934e-05, 3.876443952322006e-05, 4.003569483757019e-05, 4.130695015192032e-05, 4.257820546627045e-05, 4.3849460780620575e-05, 4.51207160949707e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 10.0, 11.0, 6.0, 7.0, 12.0, 12.0, 18.0, 21.0, 14.0, 22.0, 30.0, 26.0, 29.0, 29.0, 33.0, 28.0, 35.0, 37.0, 43.0, 40.0, 61.0, 50.0, 41.0, 46.0, 40.0, 44.0, 38.0, 29.0, 33.0, 25.0, 20.0, 21.0, 11.0, 20.0, 17.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9409942626953125, -1.881988525390625, -1.8229827880859375, -1.76397705078125, -1.7049713134765625, -1.645965576171875, -1.5869598388671875, -1.5279541015625, -1.4689483642578125, -1.409942626953125, -1.3509368896484375, -1.29193115234375, -1.2329254150390625, -1.173919677734375, -1.1149139404296875, -1.055908203125, -0.9969024658203125, -0.937896728515625, -0.8788909912109375, -0.81988525390625, -0.7608795166015625, -0.701873779296875, -0.6428680419921875, -0.5838623046875, -0.5248565673828125, -0.465850830078125, -0.4068450927734375, -0.34783935546875, -0.2888336181640625, -0.229827880859375, -0.1708221435546875, -0.11181640625, -0.0528106689453125, 0.006195068359375, 0.0652008056640625, 0.12420654296875, 0.1832122802734375, 0.242218017578125, 0.3012237548828125, 0.3602294921875, 0.4192352294921875, 0.478240966796875, 0.5372467041015625, 0.59625244140625, 0.6552581787109375, 0.714263916015625, 0.7732696533203125, 0.832275390625, 0.8912811279296875, 0.950286865234375, 1.0092926025390625, 1.06829833984375, 1.1273040771484375, 1.186309814453125, 1.2453155517578125, 1.3043212890625, 1.3633270263671875, 1.422332763671875, 1.4813385009765625, 1.54034423828125, 1.5993499755859375, 1.658355712890625, 1.7173614501953125, 1.7763671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 10.0, 8.0, 23.0, 24.0, 22.0, 36.0, 58.0, 81.0, 97.0, 151.0, 199.0, 298.0, 420.0, 718.0, 1287.0, 2288.0, 4678.0, 9991.0, 23459.0, 62141.0, 169298.0, 344182.0, 259544.0, 102242.0, 37395.0, 15451.0, 6761.0, 3280.0, 1712.0, 945.0, 562.0, 366.0, 226.0, 156.0, 124.0, 91.0, 62.0, 54.0, 28.0, 29.0, 13.0, 18.0, 11.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.37109375, -2.3028564453125, -2.234619140625, -2.1663818359375, -2.09814453125, -2.0299072265625, -1.961669921875, -1.8934326171875, -1.8251953125, -1.7569580078125, -1.688720703125, -1.6204833984375, -1.55224609375, -1.4840087890625, -1.415771484375, -1.3475341796875, -1.279296875, -1.2110595703125, -1.142822265625, -1.0745849609375, -1.00634765625, -0.9381103515625, -0.869873046875, -0.8016357421875, -0.7333984375, -0.6651611328125, -0.596923828125, -0.5286865234375, -0.46044921875, -0.3922119140625, -0.323974609375, -0.2557373046875, -0.1875, -0.1192626953125, -0.051025390625, 0.0172119140625, 0.08544921875, 0.1536865234375, 0.221923828125, 0.2901611328125, 0.3583984375, 0.4266357421875, 0.494873046875, 0.5631103515625, 0.63134765625, 0.6995849609375, 0.767822265625, 0.8360595703125, 0.904296875, 0.9725341796875, 1.040771484375, 1.1090087890625, 1.17724609375, 1.2454833984375, 1.313720703125, 1.3819580078125, 1.4501953125, 1.5184326171875, 1.586669921875, 1.6549072265625, 1.72314453125, 1.7913818359375, 1.859619140625, 1.9278564453125, 1.99609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 11.0, 5.0, 12.0, 12.0, 14.0, 15.0, 17.0, 21.0, 31.0, 44.0, 43.0, 36.0, 53.0, 64.0, 91.0, 164.0, 1512.0, 318.0, 136.0, 81.0, 49.0, 44.0, 34.0, 36.0, 36.0, 30.0, 26.0, 26.0, 18.0, 16.0, 6.0, 12.0, 9.0, 2.0, 1.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.390625, -7.1583251953125, -6.926025390625, -6.6937255859375, -6.46142578125, -6.2291259765625, -5.996826171875, -5.7645263671875, -5.5322265625, -5.2999267578125, -5.067626953125, -4.8353271484375, -4.60302734375, -4.3707275390625, -4.138427734375, -3.9061279296875, -3.673828125, -3.4415283203125, -3.209228515625, -2.9769287109375, -2.74462890625, -2.5123291015625, -2.280029296875, -2.0477294921875, -1.8154296875, -1.5831298828125, -1.350830078125, -1.1185302734375, -0.88623046875, -0.6539306640625, -0.421630859375, -0.1893310546875, 0.04296875, 0.2752685546875, 0.507568359375, 0.7398681640625, 0.97216796875, 1.2044677734375, 1.436767578125, 1.6690673828125, 1.9013671875, 2.1336669921875, 2.365966796875, 2.5982666015625, 2.83056640625, 3.0628662109375, 3.295166015625, 3.5274658203125, 3.759765625, 3.9920654296875, 4.224365234375, 4.4566650390625, 4.68896484375, 4.9212646484375, 5.153564453125, 5.3858642578125, 5.6181640625, 5.8504638671875, 6.082763671875, 6.3150634765625, 6.54736328125, 6.7796630859375, 7.011962890625, 7.2442626953125, 7.4765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 11.0, 11.0, 24.0, 18.0, 28.0, 39.0, 47.0, 59.0, 66.0, 119.0, 197.0, 369.0, 1019.0, 5349.0, 451560.0, 2672278.0, 11843.0, 1452.0, 450.0, 239.0, 121.0, 89.0, 68.0, 43.0, 47.0, 25.0, 17.0, 18.0, 18.0, 10.0, 8.0, 10.0, 14.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-14.46875, -14.004150390625, -13.53955078125, -13.074951171875, -12.6103515625, -12.145751953125, -11.68115234375, -11.216552734375, -10.751953125, -10.287353515625, -9.82275390625, -9.358154296875, -8.8935546875, -8.428955078125, -7.96435546875, -7.499755859375, -7.03515625, -6.570556640625, -6.10595703125, -5.641357421875, -5.1767578125, -4.712158203125, -4.24755859375, -3.782958984375, -3.318359375, -2.853759765625, -2.38916015625, -1.924560546875, -1.4599609375, -0.995361328125, -0.53076171875, -0.066162109375, 0.3984375, 0.863037109375, 1.32763671875, 1.792236328125, 2.2568359375, 2.721435546875, 3.18603515625, 3.650634765625, 4.115234375, 4.579833984375, 5.04443359375, 5.509033203125, 5.9736328125, 6.438232421875, 6.90283203125, 7.367431640625, 7.83203125, 8.296630859375, 8.76123046875, 9.225830078125, 9.6904296875, 10.155029296875, 10.61962890625, 11.084228515625, 11.548828125, 12.013427734375, 12.47802734375, 12.942626953125, 13.4072265625, 13.871826171875, 14.33642578125, 14.801025390625, 15.265625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 31.0, 299.0, 569.0, 97.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-73.2428207397461, -71.9386215209961, -70.63442993164062, -69.33023071289062, -68.02603149414062, -66.72183227539062, -65.41764068603516, -64.11344146728516, -62.80924606323242, -61.50505065917969, -60.20085144042969, -58.89665603637695, -57.59245681762695, -56.28826141357422, -54.98406219482422, -53.679866790771484, -52.37567138671875, -51.071475982666016, -49.767276763916016, -48.46308135986328, -47.15888214111328, -45.85468673706055, -44.55049133300781, -43.24629211425781, -41.94209289550781, -40.63789749145508, -39.33369827270508, -38.029502868652344, -36.725303649902344, -35.42110824584961, -34.116912841796875, -32.812713623046875, -31.508520126342773, -30.204322814941406, -28.90012550354004, -27.595928192138672, -26.291732788085938, -24.98753547668457, -23.683338165283203, -22.37914276123047, -21.07494354248047, -19.7707462310791, -18.466548919677734, -17.162353515625, -15.858156204223633, -14.553958892822266, -13.249761581420898, -11.945565223693848, -10.641368865966797, -9.33717155456543, -8.032975196838379, -6.728777885437012, -5.424581050872803, -4.120384216308594, -2.8161869049072266, -1.5119905471801758, -0.2077932357788086, 1.09640371799469, 2.4006006717681885, 3.7047977447509766, 5.0089945793151855, 6.3131914138793945, 7.617388725280762, 8.921585083007812, 10.22578239440918]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 5.0, 12.0, 8.0, 7.0, 12.0, 11.0, 12.0, 24.0, 21.0, 28.0, 23.0, 25.0, 30.0, 37.0, 43.0, 45.0, 51.0, 58.0, 47.0, 40.0, 45.0, 37.0, 44.0, 32.0, 38.0, 36.0, 28.0, 32.0, 27.0, 21.0, 25.0, 13.0, 22.0, 13.0, 7.0, 7.0, 6.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.31951141357422, -22.629880905151367, -21.940250396728516, -21.250619888305664, -20.560989379882812, -19.871360778808594, -19.18172836303711, -18.49209976196289, -17.80246925354004, -17.112838745117188, -16.423208236694336, -15.733577728271484, -15.04394817352295, -14.354317665100098, -13.664687156677246, -12.975057601928711, -12.285426139831543, -11.595795631408691, -10.90616512298584, -10.216535568237305, -9.526905059814453, -8.837274551391602, -8.14764404296875, -7.458014011383057, -6.768383502960205, -6.0787529945373535, -5.38912296295166, -4.699492454528809, -4.009861946105957, -3.3202319145202637, -2.630601406097412, -1.9409713745117188, -1.2513408660888672, -0.56171053647995, 0.12791979312896729, 0.8175501823425293, 1.5071804523468018, 2.196810722351074, 2.886441230773926, 3.576071262359619, 4.265701770782471, 4.955332279205322, 5.644962310791016, 6.334592819213867, 7.024223327636719, 7.713853359222412, 8.403484344482422, 9.093113899230957, 9.782744407653809, 10.47237491607666, 11.162005424499512, 11.851634979248047, 12.541265487670898, 13.23089599609375, 13.920526504516602, 14.610157012939453, 15.299787521362305, 15.989418029785156, 16.679048538208008, 17.36867904663086, 18.05830955505371, 18.747940063476562, 19.43756866455078, 20.127199172973633, 20.816829681396484]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 8.0, 9.0, 7.0, 12.0, 16.0, 14.0, 26.0, 23.0, 28.0, 23.0, 30.0, 30.0, 34.0, 31.0, 34.0, 42.0, 42.0, 49.0, 56.0, 55.0, 45.0, 66.0, 35.0, 29.0, 42.0, 39.0, 35.0, 24.0, 18.0, 18.0, 15.0, 9.0, 7.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.2423858642578125, -2.176177978515625, -2.1099700927734375, -2.04376220703125, -1.9775543212890625, -1.911346435546875, -1.8451385498046875, -1.7789306640625, -1.7127227783203125, -1.646514892578125, -1.5803070068359375, -1.51409912109375, -1.4478912353515625, -1.381683349609375, -1.3154754638671875, -1.249267578125, -1.1830596923828125, -1.116851806640625, -1.0506439208984375, -0.98443603515625, -0.9182281494140625, -0.852020263671875, -0.7858123779296875, -0.7196044921875, -0.6533966064453125, -0.587188720703125, -0.5209808349609375, -0.45477294921875, -0.3885650634765625, -0.322357177734375, -0.2561492919921875, -0.18994140625, -0.1237335205078125, -0.057525634765625, 0.0086822509765625, 0.07489013671875, 0.1410980224609375, 0.207305908203125, 0.2735137939453125, 0.3397216796875, 0.4059295654296875, 0.472137451171875, 0.5383453369140625, 0.60455322265625, 0.6707611083984375, 0.736968994140625, 0.8031768798828125, 0.869384765625, 0.9355926513671875, 1.001800537109375, 1.0680084228515625, 1.13421630859375, 1.2004241943359375, 1.266632080078125, 1.3328399658203125, 1.3990478515625, 1.4652557373046875, 1.531463623046875, 1.5976715087890625, 1.66387939453125, 1.7300872802734375, 1.796295166015625, 1.8625030517578125, 1.9287109375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 12.0, 16.0, 19.0, 24.0, 18.0, 20.0, 38.0, 60.0, 86.0, 107.0, 178.0, 270.0, 542.0, 1348.0, 4361.0, 21695.0, 170462.0, 1976015.0, 1832545.0, 159411.0, 20266.0, 4177.0, 1245.0, 549.0, 256.0, 157.0, 106.0, 69.0, 44.0, 33.0, 27.0, 30.0, 21.0, 15.0, 7.0, 9.0, 8.0, 5.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.62109375, -6.43182373046875, -6.2425537109375, -6.05328369140625, -5.864013671875, -5.67474365234375, -5.4854736328125, -5.29620361328125, -5.10693359375, -4.91766357421875, -4.7283935546875, -4.53912353515625, -4.349853515625, -4.16058349609375, -3.9713134765625, -3.78204345703125, -3.5927734375, -3.40350341796875, -3.2142333984375, -3.02496337890625, -2.835693359375, -2.64642333984375, -2.4571533203125, -2.26788330078125, -2.07861328125, -1.88934326171875, -1.7000732421875, -1.51080322265625, -1.321533203125, -1.13226318359375, -0.9429931640625, -0.75372314453125, -0.564453125, -0.37518310546875, -0.1859130859375, 0.00335693359375, 0.192626953125, 0.38189697265625, 0.5711669921875, 0.76043701171875, 0.94970703125, 1.13897705078125, 1.3282470703125, 1.51751708984375, 1.706787109375, 1.89605712890625, 2.0853271484375, 2.27459716796875, 2.4638671875, 2.65313720703125, 2.8424072265625, 3.03167724609375, 3.220947265625, 3.41021728515625, 3.5994873046875, 3.78875732421875, 3.97802734375, 4.16729736328125, 4.3565673828125, 4.54583740234375, 4.735107421875, 4.92437744140625, 5.1136474609375, 5.30291748046875, 5.4921875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 14.0, 6.0, 14.0, 15.0, 22.0, 41.0, 48.0, 53.0, 80.0, 92.0, 138.0, 184.0, 221.0, 318.0, 404.0, 398.0, 419.0, 337.0, 286.0, 227.0, 174.0, 137.0, 118.0, 76.0, 69.0, 42.0, 35.0, 25.0, 19.0, 18.0, 5.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.33984375, -6.1593017578125, -5.978759765625, -5.7982177734375, -5.61767578125, -5.4371337890625, -5.256591796875, -5.0760498046875, -4.8955078125, -4.7149658203125, -4.534423828125, -4.3538818359375, -4.17333984375, -3.9927978515625, -3.812255859375, -3.6317138671875, -3.451171875, -3.2706298828125, -3.090087890625, -2.9095458984375, -2.72900390625, -2.5484619140625, -2.367919921875, -2.1873779296875, -2.0068359375, -1.8262939453125, -1.645751953125, -1.4652099609375, -1.28466796875, -1.1041259765625, -0.923583984375, -0.7430419921875, -0.5625, -0.3819580078125, -0.201416015625, -0.0208740234375, 0.15966796875, 0.3402099609375, 0.520751953125, 0.7012939453125, 0.8818359375, 1.0623779296875, 1.242919921875, 1.4234619140625, 1.60400390625, 1.7845458984375, 1.965087890625, 2.1456298828125, 2.326171875, 2.5067138671875, 2.687255859375, 2.8677978515625, 3.04833984375, 3.2288818359375, 3.409423828125, 3.5899658203125, 3.7705078125, 3.9510498046875, 4.131591796875, 4.3121337890625, 4.49267578125, 4.6732177734375, 4.853759765625, 5.0343017578125, 5.21484375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 15.0, 18.0, 34.0, 44.0, 87.0, 143.0, 261.0, 557.0, 2170.0, 62725.0, 3959119.0, 164549.0, 3235.0, 659.0, 286.0, 133.0, 91.0, 52.0, 35.0, 21.0, 14.0, 10.0, 8.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -29.192138671875, -28.41552734375, -27.638916015625, -26.8623046875, -26.085693359375, -25.30908203125, -24.532470703125, -23.755859375, -22.979248046875, -22.20263671875, -21.426025390625, -20.6494140625, -19.872802734375, -19.09619140625, -18.319580078125, -17.54296875, -16.766357421875, -15.98974609375, -15.213134765625, -14.4365234375, -13.659912109375, -12.88330078125, -12.106689453125, -11.330078125, -10.553466796875, -9.77685546875, -9.000244140625, -8.2236328125, -7.447021484375, -6.67041015625, -5.893798828125, -5.1171875, -4.340576171875, -3.56396484375, -2.787353515625, -2.0107421875, -1.234130859375, -0.45751953125, 0.319091796875, 1.095703125, 1.872314453125, 2.64892578125, 3.425537109375, 4.2021484375, 4.978759765625, 5.75537109375, 6.531982421875, 7.30859375, 8.085205078125, 8.86181640625, 9.638427734375, 10.4150390625, 11.191650390625, 11.96826171875, 12.744873046875, 13.521484375, 14.298095703125, 15.07470703125, 15.851318359375, 16.6279296875, 17.404541015625, 18.18115234375, 18.957763671875, 19.734375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 90.0, 256.0, 334.0, 239.0, 68.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.97063446044922, -34.863502502441406, -32.756370544433594, -30.64923858642578, -28.54210662841797, -26.434974670410156, -24.327842712402344, -22.22071075439453, -20.11357879638672, -18.006446838378906, -15.899314880371094, -13.792182922363281, -11.685050964355469, -9.577919006347656, -7.470787048339844, -5.363655090332031, -3.2565231323242188, -1.1493911743164062, 0.9577407836914062, 3.0648727416992188, 5.172004699707031, 7.279136657714844, 9.386268615722656, 11.493400573730469, 13.600532531738281, 15.707664489746094, 17.814796447753906, 19.92192840576172, 22.02906036376953, 24.136192321777344, 26.243324279785156, 28.35045623779297, 30.45758056640625, 32.56471252441406, 34.671844482421875, 36.77897644042969, 38.8861083984375, 40.99324035644531, 43.100372314453125, 45.20750427246094, 47.31463623046875, 49.42176818847656, 51.528900146484375, 53.63603210449219, 55.7431640625, 57.85029602050781, 59.957427978515625, 62.06455993652344, 64.17169189453125, 66.27882385253906, 68.38595581054688, 70.49308776855469, 72.6002197265625, 74.70735168457031, 76.81448364257812, 78.92161560058594, 81.02874755859375, 83.13587951660156, 85.24301147460938, 87.35014343261719, 89.457275390625, 91.56440734863281, 93.67153930664062, 95.77867126464844, 97.88580322265625]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 7.0, 11.0, 19.0, 19.0, 25.0, 16.0, 22.0, 25.0, 37.0, 30.0, 48.0, 46.0, 39.0, 52.0, 45.0, 34.0, 49.0, 44.0, 41.0, 40.0, 44.0, 40.0, 29.0, 30.0, 23.0, 21.0, 13.0, 21.0, 14.0, 16.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.987842559814453, -19.301700592041016, -18.61556053161621, -17.929418563842773, -17.243276596069336, -16.5571346282959, -15.870994567871094, -15.184852600097656, -14.498710632324219, -13.812569618225098, -13.12642765045166, -12.440286636352539, -11.754144668579102, -11.06800365447998, -10.38186264038086, -9.695720672607422, -9.0095796585083, -8.32343864440918, -7.637296676635742, -6.951155662536621, -6.265013694763184, -5.5788726806640625, -4.892731189727783, -4.206589698791504, -3.5204482078552246, -2.8343067169189453, -2.148165225982666, -1.4620239734649658, -0.7758824825286865, -0.08974099159240723, 0.596400260925293, 1.2825417518615723, 1.9686832427978516, 2.654824733734131, 3.34096622467041, 4.027107238769531, 4.713249206542969, 5.39939022064209, 6.085531711578369, 6.771673202514648, 7.457814693450928, 8.143956184387207, 8.830097198486328, 9.516239166259766, 10.202380180358887, 10.888522148132324, 11.574663162231445, 12.260805130004883, 12.946946144104004, 13.633087158203125, 14.319229125976562, 15.005370140075684, 15.691512107849121, 16.377653121948242, 17.06379508972168, 17.749935150146484, 18.436077117919922, 19.12221908569336, 19.808359146118164, 20.4945011138916, 21.18064308166504, 21.866785049438477, 22.55292510986328, 23.23906707763672, 23.925209045410156]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 9.0, 13.0, 7.0, 20.0, 17.0, 7.0, 14.0, 16.0, 15.0, 25.0, 23.0, 33.0, 23.0, 30.0, 30.0, 35.0, 36.0, 50.0, 45.0, 47.0, 53.0, 53.0, 40.0, 43.0, 28.0, 39.0, 37.0, 33.0, 29.0, 31.0, 26.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.123687744140625, -2.06182861328125, -1.999969482421875, -1.9381103515625, -1.876251220703125, -1.81439208984375, -1.752532958984375, -1.690673828125, -1.628814697265625, -1.56695556640625, -1.505096435546875, -1.4432373046875, -1.381378173828125, -1.31951904296875, -1.257659912109375, -1.19580078125, -1.133941650390625, -1.07208251953125, -1.010223388671875, -0.9483642578125, -0.886505126953125, -0.82464599609375, -0.762786865234375, -0.700927734375, -0.639068603515625, -0.57720947265625, -0.515350341796875, -0.4534912109375, -0.391632080078125, -0.32977294921875, -0.267913818359375, -0.2060546875, -0.144195556640625, -0.08233642578125, -0.020477294921875, 0.0413818359375, 0.103240966796875, 0.16510009765625, 0.226959228515625, 0.288818359375, 0.350677490234375, 0.41253662109375, 0.474395751953125, 0.5362548828125, 0.598114013671875, 0.65997314453125, 0.721832275390625, 0.78369140625, 0.845550537109375, 0.90740966796875, 0.969268798828125, 1.0311279296875, 1.092987060546875, 1.15484619140625, 1.216705322265625, 1.278564453125, 1.340423583984375, 1.40228271484375, 1.464141845703125, 1.5260009765625, 1.587860107421875, 1.64971923828125, 1.711578369140625, 1.7734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 8.0, 4.0, 5.0, 13.0, 16.0, 20.0, 25.0, 57.0, 76.0, 104.0, 197.0, 303.0, 494.0, 809.0, 1291.0, 2260.0, 3831.0, 6446.0, 11170.0, 19550.0, 35809.0, 68235.0, 146490.0, 357552.0, 205752.0, 86932.0, 44285.0, 23964.0, 13536.0, 7808.0, 4631.0, 2632.0, 1650.0, 982.0, 592.0, 352.0, 238.0, 135.0, 95.0, 74.0, 47.0, 29.0, 25.0, 14.0, 9.0, 2.0, 7.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3659210205078125, -0.352203369140625, -0.3384857177734375, -0.32476806640625, -0.3110504150390625, -0.297332763671875, -0.2836151123046875, -0.2698974609375, -0.2561798095703125, -0.242462158203125, -0.2287445068359375, -0.21502685546875, -0.2013092041015625, -0.187591552734375, -0.1738739013671875, -0.16015625, -0.1464385986328125, -0.132720947265625, -0.1190032958984375, -0.10528564453125, -0.0915679931640625, -0.077850341796875, -0.0641326904296875, -0.0504150390625, -0.0366973876953125, -0.022979736328125, -0.0092620849609375, 0.00445556640625, 0.0181732177734375, 0.031890869140625, 0.0456085205078125, 0.059326171875, 0.0730438232421875, 0.086761474609375, 0.1004791259765625, 0.11419677734375, 0.1279144287109375, 0.141632080078125, 0.1553497314453125, 0.1690673828125, 0.1827850341796875, 0.196502685546875, 0.2102203369140625, 0.22393798828125, 0.2376556396484375, 0.251373291015625, 0.2650909423828125, 0.27880859375, 0.2925262451171875, 0.306243896484375, 0.3199615478515625, 0.33367919921875, 0.3473968505859375, 0.361114501953125, 0.3748321533203125, 0.3885498046875, 0.4022674560546875, 0.415985107421875, 0.4297027587890625, 0.44342041015625, 0.4571380615234375, 0.470855712890625, 0.4845733642578125, 0.498291015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 11.0, 14.0, 8.0, 13.0, 21.0, 17.0, 22.0, 27.0, 27.0, 32.0, 19.0, 43.0, 43.0, 41.0, 27.0, 38.0, 40.0, 1065.0, 46.0, 40.0, 45.0, 46.0, 23.0, 48.0, 42.0, 32.0, 30.0, 28.0, 29.0, 18.0, 15.0, 13.0, 6.0, 11.0, 6.0, 8.0, 6.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.37890625, -1.3394775390625, -1.300048828125, -1.2606201171875, -1.22119140625, -1.1817626953125, -1.142333984375, -1.1029052734375, -1.0634765625, -1.0240478515625, -0.984619140625, -0.9451904296875, -0.90576171875, -0.8663330078125, -0.826904296875, -0.7874755859375, -0.748046875, -0.7086181640625, -0.669189453125, -0.6297607421875, -0.59033203125, -0.5509033203125, -0.511474609375, -0.4720458984375, -0.4326171875, -0.3931884765625, -0.353759765625, -0.3143310546875, -0.27490234375, -0.2354736328125, -0.196044921875, -0.1566162109375, -0.1171875, -0.0777587890625, -0.038330078125, 0.0010986328125, 0.04052734375, 0.0799560546875, 0.119384765625, 0.1588134765625, 0.1982421875, 0.2376708984375, 0.277099609375, 0.3165283203125, 0.35595703125, 0.3953857421875, 0.434814453125, 0.4742431640625, 0.513671875, 0.5531005859375, 0.592529296875, 0.6319580078125, 0.67138671875, 0.7108154296875, 0.750244140625, 0.7896728515625, 0.8291015625, 0.8685302734375, 0.907958984375, 0.9473876953125, 0.98681640625, 1.0262451171875, 1.065673828125, 1.1051025390625, 1.14453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 11.0, 11.0, 22.0, 37.0, 47.0, 47.0, 92.0, 141.0, 178.0, 276.0, 424.0, 608.0, 858.0, 1186.0, 1766.0, 2576.0, 3894.0, 5707.0, 8644.0, 13402.0, 20189.0, 31498.0, 49860.0, 83676.0, 158735.0, 1333063.0, 156420.0, 82359.0, 50357.0, 31328.0, 19893.0, 12890.0, 8660.0, 5788.0, 3969.0, 2713.0, 1864.0, 1203.0, 892.0, 557.0, 389.0, 281.0, 201.0, 119.0, 100.0, 72.0, 31.0, 33.0, 18.0, 18.0, 16.0, 7.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.278228759765625, -0.26910400390625, -0.259979248046875, -0.2508544921875, -0.241729736328125, -0.23260498046875, -0.223480224609375, -0.21435546875, -0.205230712890625, -0.19610595703125, -0.186981201171875, -0.1778564453125, -0.168731689453125, -0.15960693359375, -0.150482177734375, -0.141357421875, -0.132232666015625, -0.12310791015625, -0.113983154296875, -0.1048583984375, -0.095733642578125, -0.08660888671875, -0.077484130859375, -0.068359375, -0.059234619140625, -0.05010986328125, -0.040985107421875, -0.0318603515625, -0.022735595703125, -0.01361083984375, -0.004486083984375, 0.004638671875, 0.013763427734375, 0.02288818359375, 0.032012939453125, 0.0411376953125, 0.050262451171875, 0.05938720703125, 0.068511962890625, 0.07763671875, 0.086761474609375, 0.09588623046875, 0.105010986328125, 0.1141357421875, 0.123260498046875, 0.13238525390625, 0.141510009765625, 0.150634765625, 0.159759521484375, 0.16888427734375, 0.178009033203125, 0.1871337890625, 0.196258544921875, 0.20538330078125, 0.214508056640625, 0.2236328125, 0.232757568359375, 0.24188232421875, 0.251007080078125, 0.2601318359375, 0.269256591796875, 0.27838134765625, 0.287506103515625, 0.296630859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 3.0, 8.0, 8.0, 6.0, 8.0, 15.0, 22.0, 23.0, 27.0, 42.0, 37.0, 39.0, 43.0, 77.0, 70.0, 69.0, 62.0, 61.0, 59.0, 56.0, 47.0, 36.0, 34.0, 32.0, 24.0, 19.0, 16.0, 9.0, 7.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.128715515136719e-05, -6.90976157784462e-05, -6.690807640552521e-05, -6.471853703260422e-05, -6.252899765968323e-05, -6.033945828676224e-05, -5.814991891384125e-05, -5.596037954092026e-05, -5.377084016799927e-05, -5.158130079507828e-05, -4.939176142215729e-05, -4.72022220492363e-05, -4.501268267631531e-05, -4.282314330339432e-05, -4.063360393047333e-05, -3.844406455755234e-05, -3.625452518463135e-05, -3.406498581171036e-05, -3.187544643878937e-05, -2.9685907065868378e-05, -2.7496367692947388e-05, -2.5306828320026398e-05, -2.3117288947105408e-05, -2.0927749574184418e-05, -1.8738210201263428e-05, -1.6548670828342438e-05, -1.4359131455421448e-05, -1.2169592082500458e-05, -9.980052709579468e-06, -7.790513336658478e-06, -5.600973963737488e-06, -3.411434590816498e-06, -1.2218952178955078e-06, 9.676441550254822e-07, 3.157183527946472e-06, 5.346722900867462e-06, 7.536262273788452e-06, 9.725801646709442e-06, 1.1915341019630432e-05, 1.4104880392551422e-05, 1.6294419765472412e-05, 1.8483959138393402e-05, 2.0673498511314392e-05, 2.2863037884235382e-05, 2.5052577257156372e-05, 2.7242116630077362e-05, 2.9431656002998352e-05, 3.162119537591934e-05, 3.381073474884033e-05, 3.600027412176132e-05, 3.818981349468231e-05, 4.03793528676033e-05, 4.256889224052429e-05, 4.475843161344528e-05, 4.694797098636627e-05, 4.913751035928726e-05, 5.132704973220825e-05, 5.351658910512924e-05, 5.570612847805023e-05, 5.789566785097122e-05, 6.008520722389221e-05, 6.22747465968132e-05, 6.446428596973419e-05, 6.665382534265518e-05, 6.884336471557617e-05]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 13.0, 23.0, 30.0, 32.0, 36.0, 59.0, 66.0, 100.0, 149.0, 168.0, 299.0, 497.0, 1532.0, 669083.0, 373763.0, 1201.0, 456.0, 248.0, 194.0, 156.0, 104.0, 83.0, 63.0, 44.0, 26.0, 18.0, 18.0, 12.0, 14.0, 6.0, 6.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0014019012451171875, -0.0013606101274490356, -0.0013193190097808838, -0.001278027892112732, -0.00123673677444458, -0.0011954456567764282, -0.0011541545391082764, -0.0011128634214401245, -0.0010715723037719727, -0.0010302811861038208, -0.000988990068435669, -0.0009476989507675171, -0.0009064078330993652, -0.0008651167154312134, -0.0008238255977630615, -0.0007825344800949097, -0.0007412433624267578, -0.000699952244758606, -0.0006586611270904541, -0.0006173700094223022, -0.0005760788917541504, -0.0005347877740859985, -0.0004934966564178467, -0.0004522055387496948, -0.00041091442108154297, -0.0003696233034133911, -0.00032833218574523926, -0.0002870410680770874, -0.00024574995040893555, -0.0002044588327407837, -0.00016316771507263184, -0.00012187659740447998, -8.058547973632812e-05, -3.929436206817627e-05, 1.996755599975586e-06, 4.328787326812744e-05, 8.45789909362793e-05, 0.00012587010860443115, 0.000167161226272583, 0.00020845234394073486, 0.0002497434616088867, 0.0002910345792770386, 0.00033232569694519043, 0.0003736168146133423, 0.00041490793228149414, 0.000456199049949646, 0.0004974901676177979, 0.0005387812852859497, 0.0005800724029541016, 0.0006213635206222534, 0.0006626546382904053, 0.0007039457559585571, 0.000745236873626709, 0.0007865279912948608, 0.0008278191089630127, 0.0008691102266311646, 0.0009104013442993164, 0.0009516924619674683, 0.0009929835796356201, 0.001034274697303772, 0.0010755658149719238, 0.0011168569326400757, 0.0011581480503082275, 0.0011994391679763794, 0.0012407302856445312]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 33.0, 100.0, 184.0, 265.0, 209.0, 117.0, 56.0, 13.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44899157830514e-05, -5.185039117350243e-05, -4.921086292597465e-05, -4.657133831642568e-05, -4.39318100688979e-05, -4.129228545934893e-05, -3.865276084979996e-05, -3.601323260227218e-05, -3.337370799272321e-05, -3.073418338317424e-05, -2.8094655135646462e-05, -2.545513052609749e-05, -2.2815604097559117e-05, -2.0176077669020742e-05, -1.753655305947177e-05, -1.4897026630933397e-05, -1.2257500202395022e-05, -9.617973773856647e-06, -6.9784482548129745e-06, -4.338922735769302e-06, -1.699396307230927e-06, 9.401301213074476e-07, 3.5796547308564186e-06, 6.219181159394793e-06, 8.858707587933168e-06, 1.1498234016471542e-05, 1.4137759535515215e-05, 1.6777285054558888e-05, 1.9416811483097263e-05, 2.2056337911635637e-05, 2.469586252118461e-05, 2.7335388949722983e-05, 2.9974922654218972e-05, 3.261444726376794e-05, 3.525397551129572e-05, 3.789350012084469e-05, 4.053302836837247e-05, 4.317255297792144e-05, 4.581207758747041e-05, 4.845160583499819e-05, 5.109113044454716e-05, 5.373065505409613e-05, 5.637018330162391e-05, 5.900970791117288e-05, 6.164923252072185e-05, 6.428876076824963e-05, 6.692828901577741e-05, 6.956780998734757e-05, 7.220733823487535e-05, 7.484686648240313e-05, 7.74863874539733e-05, 8.012591570150107e-05, 8.276544394902885e-05, 8.540497219655663e-05, 8.804449316812679e-05, 9.068402141565457e-05, 9.332354238722473e-05, 9.596307063475251e-05, 9.860259160632268e-05, 0.00010124211985385045, 0.00010388164810137823, 0.0001065211690729484, 0.00010916069732047617, 0.00011180022556800395, 0.00011443975381553173]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 4.0, 11.0, 9.0, 9.0, 23.0, 17.0, 22.0, 21.0, 31.0, 30.0, 44.0, 36.0, 34.0, 48.0, 60.0, 43.0, 49.0, 54.0, 36.0, 52.0, 41.0, 35.0, 41.0, 29.0, 29.0, 28.0, 27.0, 22.0, 19.0, 22.0, 18.0, 15.0, 10.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.13060188293457e-05, -4.010181874036789e-05, -3.8897618651390076e-05, -3.769341856241226e-05, -3.648921847343445e-05, -3.5285018384456635e-05, -3.408081829547882e-05, -3.287661820650101e-05, -3.167241811752319e-05, -3.046821802854538e-05, -2.9264017939567566e-05, -2.8059817850589752e-05, -2.685561776161194e-05, -2.5651417672634125e-05, -2.444721758365631e-05, -2.3243017494678497e-05, -2.2038817405700684e-05, -2.083461731672287e-05, -1.9630417227745056e-05, -1.8426217138767242e-05, -1.722201704978943e-05, -1.6017816960811615e-05, -1.4813616871833801e-05, -1.3609416782855988e-05, -1.2405216693878174e-05, -1.120101660490036e-05, -9.996816515922546e-06, -8.792616426944733e-06, -7.588416337966919e-06, -6.384216248989105e-06, -5.1800161600112915e-06, -3.975816071033478e-06, -2.771615982055664e-06, -1.5674158930778503e-06, -3.632158041000366e-07, 8.409842848777771e-07, 2.045184373855591e-06, 3.2493844628334045e-06, 4.453584551811218e-06, 5.657784640789032e-06, 6.861984729766846e-06, 8.06618481874466e-06, 9.270384907722473e-06, 1.0474584996700287e-05, 1.16787850856781e-05, 1.2882985174655914e-05, 1.4087185263633728e-05, 1.5291385352611542e-05, 1.6495585441589355e-05, 1.769978553056717e-05, 1.8903985619544983e-05, 2.0108185708522797e-05, 2.131238579750061e-05, 2.2516585886478424e-05, 2.3720785975456238e-05, 2.492498606443405e-05, 2.6129186153411865e-05, 2.733338624238968e-05, 2.8537586331367493e-05, 2.9741786420345306e-05, 3.094598650932312e-05, 3.2150186598300934e-05, 3.335438668727875e-05, 3.455858677625656e-05, 3.5762786865234375e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 9.0, 13.0, 7.0, 20.0, 17.0, 7.0, 14.0, 15.0, 16.0, 25.0, 23.0, 33.0, 23.0, 30.0, 30.0, 35.0, 36.0, 50.0, 45.0, 47.0, 53.0, 53.0, 40.0, 43.0, 28.0, 39.0, 37.0, 33.0, 29.0, 31.0, 26.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 3.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.123687744140625, -2.06182861328125, -1.999969482421875, -1.9381103515625, -1.876251220703125, -1.81439208984375, -1.752532958984375, -1.690673828125, -1.628814697265625, -1.56695556640625, -1.505096435546875, -1.4432373046875, -1.381378173828125, -1.31951904296875, -1.257659912109375, -1.19580078125, -1.133941650390625, -1.07208251953125, -1.010223388671875, -0.9483642578125, -0.886505126953125, -0.82464599609375, -0.762786865234375, -0.700927734375, -0.639068603515625, -0.57720947265625, -0.515350341796875, -0.4534912109375, -0.391632080078125, -0.32977294921875, -0.267913818359375, -0.2060546875, -0.144195556640625, -0.08233642578125, -0.020477294921875, 0.0413818359375, 0.103240966796875, 0.16510009765625, 0.226959228515625, 0.288818359375, 0.350677490234375, 0.41253662109375, 0.474395751953125, 0.5362548828125, 0.598114013671875, 0.65997314453125, 0.721832275390625, 0.78369140625, 0.845550537109375, 0.90740966796875, 0.969268798828125, 1.0311279296875, 1.092987060546875, 1.15484619140625, 1.216705322265625, 1.278564453125, 1.340423583984375, 1.40228271484375, 1.464141845703125, 1.5260009765625, 1.587860107421875, 1.64971923828125, 1.711578369140625, 1.7734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 12.0, 10.0, 14.0, 18.0, 41.0, 54.0, 56.0, 96.0, 136.0, 196.0, 274.0, 474.0, 716.0, 1276.0, 2094.0, 3836.0, 7437.0, 15460.0, 34927.0, 98178.0, 328634.0, 368591.0, 112101.0, 39093.0, 16698.0, 8121.0, 4238.0, 2287.0, 1267.0, 817.0, 446.0, 304.0, 196.0, 138.0, 102.0, 73.0, 58.0, 32.0, 17.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9072265625, -1.8392486572265625, -1.771270751953125, -1.7032928466796875, -1.63531494140625, -1.5673370361328125, -1.499359130859375, -1.4313812255859375, -1.3634033203125, -1.2954254150390625, -1.227447509765625, -1.1594696044921875, -1.09149169921875, -1.0235137939453125, -0.955535888671875, -0.8875579833984375, -0.819580078125, -0.7516021728515625, -0.683624267578125, -0.6156463623046875, -0.54766845703125, -0.4796905517578125, -0.411712646484375, -0.3437347412109375, -0.2757568359375, -0.2077789306640625, -0.139801025390625, -0.0718231201171875, -0.00384521484375, 0.0641326904296875, 0.132110595703125, 0.2000885009765625, 0.26806640625, 0.3360443115234375, 0.404022216796875, 0.4720001220703125, 0.53997802734375, 0.6079559326171875, 0.675933837890625, 0.7439117431640625, 0.8118896484375, 0.8798675537109375, 0.947845458984375, 1.0158233642578125, 1.08380126953125, 1.1517791748046875, 1.219757080078125, 1.2877349853515625, 1.355712890625, 1.4236907958984375, 1.491668701171875, 1.5596466064453125, 1.62762451171875, 1.6956024169921875, 1.763580322265625, 1.8315582275390625, 1.8995361328125, 1.9675140380859375, 2.035491943359375, 2.1034698486328125, 2.17144775390625, 2.2394256591796875, 2.307403564453125, 2.3753814697265625, 2.443359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 7.0, 14.0, 13.0, 13.0, 14.0, 16.0, 21.0, 25.0, 26.0, 32.0, 34.0, 40.0, 53.0, 51.0, 48.0, 76.0, 129.0, 1543.0, 382.0, 99.0, 63.0, 44.0, 36.0, 37.0, 33.0, 34.0, 22.0, 25.0, 18.0, 18.0, 18.0, 19.0, 11.0, 4.0, 10.0, 2.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.515625, -7.27984619140625, -7.0440673828125, -6.80828857421875, -6.572509765625, -6.33673095703125, -6.1009521484375, -5.86517333984375, -5.62939453125, -5.39361572265625, -5.1578369140625, -4.92205810546875, -4.686279296875, -4.45050048828125, -4.2147216796875, -3.97894287109375, -3.7431640625, -3.50738525390625, -3.2716064453125, -3.03582763671875, -2.800048828125, -2.56427001953125, -2.3284912109375, -2.09271240234375, -1.85693359375, -1.62115478515625, -1.3853759765625, -1.14959716796875, -0.913818359375, -0.67803955078125, -0.4422607421875, -0.20648193359375, 0.029296875, 0.26507568359375, 0.5008544921875, 0.73663330078125, 0.972412109375, 1.20819091796875, 1.4439697265625, 1.67974853515625, 1.91552734375, 2.15130615234375, 2.3870849609375, 2.62286376953125, 2.858642578125, 3.09442138671875, 3.3302001953125, 3.56597900390625, 3.8017578125, 4.03753662109375, 4.2733154296875, 4.50909423828125, 4.744873046875, 4.98065185546875, 5.2164306640625, 5.45220947265625, 5.68798828125, 5.92376708984375, 6.1595458984375, 6.39532470703125, 6.631103515625, 6.86688232421875, 7.1026611328125, 7.33843994140625, 7.57421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 12.0, 17.0, 21.0, 24.0, 22.0, 39.0, 43.0, 48.0, 66.0, 116.0, 181.0, 342.0, 843.0, 5185.0, 157199.0, 2945351.0, 32345.0, 2371.0, 563.0, 283.0, 147.0, 120.0, 62.0, 53.0, 35.0, 34.0, 37.0, 29.0, 20.0, 11.0, 17.0, 12.0, 2.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4609375, -12.06298828125, -11.6650390625, -11.26708984375, -10.869140625, -10.47119140625, -10.0732421875, -9.67529296875, -9.27734375, -8.87939453125, -8.4814453125, -8.08349609375, -7.685546875, -7.28759765625, -6.8896484375, -6.49169921875, -6.09375, -5.69580078125, -5.2978515625, -4.89990234375, -4.501953125, -4.10400390625, -3.7060546875, -3.30810546875, -2.91015625, -2.51220703125, -2.1142578125, -1.71630859375, -1.318359375, -0.92041015625, -0.5224609375, -0.12451171875, 0.2734375, 0.67138671875, 1.0693359375, 1.46728515625, 1.865234375, 2.26318359375, 2.6611328125, 3.05908203125, 3.45703125, 3.85498046875, 4.2529296875, 4.65087890625, 5.048828125, 5.44677734375, 5.8447265625, 6.24267578125, 6.640625, 7.03857421875, 7.4365234375, 7.83447265625, 8.232421875, 8.63037109375, 9.0283203125, 9.42626953125, 9.82421875, 10.22216796875, 10.6201171875, 11.01806640625, 11.416015625, 11.81396484375, 12.2119140625, 12.60986328125, 13.0078125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 9.0, 19.0, 62.0, 130.0, 184.0, 228.0, 187.0, 93.0, 62.0, 19.0, 9.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.176681518554688, -19.700082778930664, -19.22348403930664, -18.746885299682617, -18.270286560058594, -17.793685913085938, -17.317087173461914, -16.84048843383789, -16.363889694213867, -15.887290954589844, -15.41069221496582, -14.93409252166748, -14.457493782043457, -13.980895042419434, -13.504295349121094, -13.02769660949707, -12.551097869873047, -12.074499130249023, -11.597900390625, -11.12130069732666, -10.644701957702637, -10.168103218078613, -9.691503524780273, -9.21490478515625, -8.738306045532227, -8.261707305908203, -7.7851080894470215, -7.30850887298584, -6.831910133361816, -6.355311393737793, -5.878712177276611, -5.40211296081543, -4.925515174865723, -4.448916435241699, -3.9723172187805176, -3.495718240737915, -3.0191192626953125, -2.54252028465271, -2.0659213066101074, -1.5893223285675049, -1.1127233505249023, -0.6361243724822998, -0.15952539443969727, 0.3170735836029053, 0.7936725616455078, 1.2702715396881104, 1.746870517730713, 2.2234694957733154, 2.700068473815918, 3.1766674518585205, 3.653266429901123, 4.129865646362305, 4.606464385986328, 5.083063125610352, 5.559662342071533, 6.036261558532715, 6.512860298156738, 6.989459037780762, 7.466058254241943, 7.942657470703125, 8.419256210327148, 8.895854949951172, 9.372453689575195, 9.849053382873535, 10.325652122497559]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 8.0, 14.0, 15.0, 15.0, 22.0, 17.0, 33.0, 31.0, 20.0, 26.0, 33.0, 36.0, 39.0, 40.0, 34.0, 44.0, 43.0, 46.0, 53.0, 51.0, 42.0, 46.0, 32.0, 29.0, 27.0, 24.0, 32.0, 29.0, 14.0, 20.0, 10.0, 12.0, 7.0, 8.0, 3.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.622669219970703, -21.874195098876953, -21.125720977783203, -20.377248764038086, -19.628774642944336, -18.880300521850586, -18.13182830810547, -17.38335418701172, -16.63488006591797, -15.886405944824219, -15.137932777404785, -14.389459609985352, -13.640985488891602, -12.892511367797852, -12.144038200378418, -11.395565032958984, -10.647090911865234, -9.898616790771484, -9.15014362335205, -8.401670455932617, -7.653196334838867, -6.904722690582275, -6.156249046325684, -5.407775402069092, -4.6593017578125, -3.910828113555908, -3.1623544692993164, -2.4138808250427246, -1.6654071807861328, -0.916933536529541, -0.16845989227294922, 0.5800137519836426, 1.3284893035888672, 2.076962947845459, 2.825436592102051, 3.5739102363586426, 4.322383880615234, 5.070857524871826, 5.819331169128418, 6.56780481338501, 7.316278457641602, 8.064752578735352, 8.813225746154785, 9.561698913574219, 10.310173034667969, 11.058647155761719, 11.807120323181152, 12.555593490600586, 13.304067611694336, 14.052541732788086, 14.80101490020752, 15.549488067626953, 16.297962188720703, 17.046436309814453, 17.794910430908203, 18.54338264465332, 19.29185676574707, 20.04033088684082, 20.788803100585938, 21.537277221679688, 22.285751342773438, 23.034225463867188, 23.782699584960938, 24.531171798706055, 25.279645919799805]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 12.0, 11.0, 9.0, 13.0, 17.0, 12.0, 14.0, 15.0, 13.0, 29.0, 24.0, 35.0, 33.0, 27.0, 40.0, 39.0, 37.0, 53.0, 39.0, 49.0, 36.0, 49.0, 45.0, 40.0, 51.0, 43.0, 27.0, 32.0, 32.0, 26.0, 18.0, 15.0, 9.0, 11.0, 5.0, 5.0, 9.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.3675994873046875, -2.299652099609375, -2.2317047119140625, -2.16375732421875, -2.0958099365234375, -2.027862548828125, -1.9599151611328125, -1.8919677734375, -1.8240203857421875, -1.756072998046875, -1.6881256103515625, -1.62017822265625, -1.5522308349609375, -1.484283447265625, -1.4163360595703125, -1.348388671875, -1.2804412841796875, -1.212493896484375, -1.1445465087890625, -1.07659912109375, -1.0086517333984375, -0.940704345703125, -0.8727569580078125, -0.8048095703125, -0.7368621826171875, -0.668914794921875, -0.6009674072265625, -0.53302001953125, -0.4650726318359375, -0.397125244140625, -0.3291778564453125, -0.26123046875, -0.1932830810546875, -0.125335693359375, -0.0573883056640625, 0.01055908203125, 0.0785064697265625, 0.146453857421875, 0.2144012451171875, 0.2823486328125, 0.3502960205078125, 0.418243408203125, 0.4861907958984375, 0.55413818359375, 0.6220855712890625, 0.690032958984375, 0.7579803466796875, 0.825927734375, 0.8938751220703125, 0.961822509765625, 1.0297698974609375, 1.09771728515625, 1.1656646728515625, 1.233612060546875, 1.3015594482421875, 1.3695068359375, 1.4374542236328125, 1.505401611328125, 1.5733489990234375, 1.64129638671875, 1.7092437744140625, 1.777191162109375, 1.8451385498046875, 1.9130859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 2.0, 11.0, 7.0, 5.0, 10.0, 10.0, 10.0, 20.0, 14.0, 19.0, 25.0, 21.0, 26.0, 33.0, 50.0, 65.0, 104.0, 330.0, 1407.0, 11399.0, 273402.0, 3590325.0, 302869.0, 11961.0, 1402.0, 272.0, 125.0, 68.0, 48.0, 26.0, 29.0, 29.0, 23.0, 24.0, 20.0, 12.0, 18.0, 10.0, 4.0, 11.0, 5.0, 4.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5859375, -10.27001953125, -9.9541015625, -9.63818359375, -9.322265625, -9.00634765625, -8.6904296875, -8.37451171875, -8.05859375, -7.74267578125, -7.4267578125, -7.11083984375, -6.794921875, -6.47900390625, -6.1630859375, -5.84716796875, -5.53125, -5.21533203125, -4.8994140625, -4.58349609375, -4.267578125, -3.95166015625, -3.6357421875, -3.31982421875, -3.00390625, -2.68798828125, -2.3720703125, -2.05615234375, -1.740234375, -1.42431640625, -1.1083984375, -0.79248046875, -0.4765625, -0.16064453125, 0.1552734375, 0.47119140625, 0.787109375, 1.10302734375, 1.4189453125, 1.73486328125, 2.05078125, 2.36669921875, 2.6826171875, 2.99853515625, 3.314453125, 3.63037109375, 3.9462890625, 4.26220703125, 4.578125, 4.89404296875, 5.2099609375, 5.52587890625, 5.841796875, 6.15771484375, 6.4736328125, 6.78955078125, 7.10546875, 7.42138671875, 7.7373046875, 8.05322265625, 8.369140625, 8.68505859375, 9.0009765625, 9.31689453125, 9.6328125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 11.0, 20.0, 43.0, 59.0, 100.0, 185.0, 286.0, 506.0, 699.0, 767.0, 560.0, 353.0, 184.0, 137.0, 67.0, 48.0, 19.0, 17.0, 8.0, 6.0, 4.0], "bins": [-16.46875, -16.152923583984375, -15.83709716796875, -15.521270751953125, -15.2054443359375, -14.889617919921875, -14.57379150390625, -14.257965087890625, -13.942138671875, -13.626312255859375, -13.31048583984375, -12.994659423828125, -12.6788330078125, -12.363006591796875, -12.04718017578125, -11.731353759765625, -11.41552734375, -11.099700927734375, -10.78387451171875, -10.468048095703125, -10.1522216796875, -9.836395263671875, -9.52056884765625, -9.204742431640625, -8.888916015625, -8.573089599609375, -8.25726318359375, -7.941436767578125, -7.6256103515625, -7.309783935546875, -6.99395751953125, -6.678131103515625, -6.3623046875, -6.046478271484375, -5.73065185546875, -5.414825439453125, -5.0989990234375, -4.783172607421875, -4.46734619140625, -4.151519775390625, -3.835693359375, -3.519866943359375, -3.20404052734375, -2.888214111328125, -2.5723876953125, -2.256561279296875, -1.94073486328125, -1.624908447265625, -1.30908203125, -0.993255615234375, -0.67742919921875, -0.361602783203125, -0.0457763671875, 0.270050048828125, 0.58587646484375, 0.901702880859375, 1.217529296875, 1.533355712890625, 1.84918212890625, 2.165008544921875, 2.4808349609375, 2.796661376953125, 3.11248779296875, 3.428314208984375, 3.744140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 18.0, 31.0, 46.0, 96.0, 148.0, 220.0, 400.0, 984.0, 10297.0, 2416651.0, 1755167.0, 8335.0, 930.0, 382.0, 227.0, 135.0, 86.0, 36.0, 34.0, 13.0, 15.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -13.8038330078125, -12.990478515625, -12.1771240234375, -11.36376953125, -10.5504150390625, -9.737060546875, -8.9237060546875, -8.1103515625, -7.2969970703125, -6.483642578125, -5.6702880859375, -4.85693359375, -4.0435791015625, -3.230224609375, -2.4168701171875, -1.603515625, -0.7901611328125, 0.023193359375, 0.8365478515625, 1.64990234375, 2.4632568359375, 3.276611328125, 4.0899658203125, 4.9033203125, 5.7166748046875, 6.530029296875, 7.3433837890625, 8.15673828125, 8.9700927734375, 9.783447265625, 10.5968017578125, 11.41015625, 12.2235107421875, 13.036865234375, 13.8502197265625, 14.66357421875, 15.4769287109375, 16.290283203125, 17.1036376953125, 17.9169921875, 18.7303466796875, 19.543701171875, 20.3570556640625, 21.17041015625, 21.9837646484375, 22.797119140625, 23.6104736328125, 24.423828125, 25.2371826171875, 26.050537109375, 26.8638916015625, 27.67724609375, 28.4906005859375, 29.303955078125, 30.1173095703125, 30.9306640625, 31.7440185546875, 32.557373046875, 33.3707275390625, 34.18408203125, 34.9974365234375, 35.810791015625, 36.6241455078125, 37.4375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 44.0, 100.0, 231.0, 245.0, 220.0, 109.0, 38.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.50689697265625, -67.70074462890625, -65.89459228515625, -64.08843994140625, -62.28228759765625, -60.47613525390625, -58.66998291015625, -56.863834381103516, -55.057682037353516, -53.251529693603516, -51.445377349853516, -49.639225006103516, -47.833072662353516, -46.02692413330078, -44.22077178955078, -42.41461944580078, -40.60846710205078, -38.80231475830078, -36.99616241455078, -35.19001007080078, -33.38385772705078, -31.577707290649414, -29.771554946899414, -27.965404510498047, -26.15924835205078, -24.35309600830078, -22.54694366455078, -20.74079132080078, -18.934640884399414, -17.128488540649414, -15.322336196899414, -13.51618480682373, -11.710033416748047, -9.903881072998047, -8.097729682922363, -6.291577339172363, -4.4854254722595215, -2.6792736053466797, -0.8731212615966797, 0.9330301284790039, 2.739182472229004, 4.545334339141846, 6.3514862060546875, 8.157638549804688, 9.963790893554688, 11.769942283630371, 13.576094627380371, 15.382246017456055, 17.188398361206055, 18.994550704956055, 20.800703048706055, 22.606853485107422, 24.413005828857422, 26.219158172607422, 28.025310516357422, 29.831462860107422, 31.637615203857422, 33.44376754760742, 35.24991989135742, 37.05607223510742, 38.86222457885742, 40.668373107910156, 42.474525451660156, 44.280677795410156, 46.086830139160156]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 6.0, 8.0, 9.0, 14.0, 11.0, 11.0, 18.0, 21.0, 23.0, 31.0, 21.0, 31.0, 26.0, 27.0, 36.0, 34.0, 30.0, 43.0, 44.0, 37.0, 38.0, 52.0, 35.0, 28.0, 22.0, 30.0, 29.0, 38.0, 28.0, 26.0, 18.0, 27.0, 16.0, 17.0, 13.0, 12.0, 12.0, 10.0, 7.0, 4.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.114425659179688, -16.55829620361328, -16.002166748046875, -15.446037292480469, -14.889907836914062, -14.333778381347656, -13.77764892578125, -13.221519470214844, -12.665390014648438, -12.109260559082031, -11.553131103515625, -10.997001647949219, -10.440872192382812, -9.884742736816406, -9.32861328125, -8.772483825683594, -8.216355323791504, -7.660225868225098, -7.104096412658691, -6.547966957092285, -5.991837501525879, -5.435708045959473, -4.879579067230225, -4.323449611663818, -3.767320156097412, -3.211190700531006, -2.6550612449645996, -2.0989320278167725, -1.5428025722503662, -0.98667311668396, -0.4305438995361328, 0.12558555603027344, 0.6817150115966797, 1.237844467163086, 1.7939738035202026, 2.3501031398773193, 2.9062325954437256, 3.462362051010132, 4.018491268157959, 4.574620723724365, 5.1307501792907715, 5.686879634857178, 6.243009090423584, 6.799138069152832, 7.355267524719238, 7.9113969802856445, 8.46752643585205, 9.023655891418457, 9.579785346984863, 10.13591480255127, 10.692044258117676, 11.248173713684082, 11.804303169250488, 12.360432624816895, 12.916561126708984, 13.47269058227539, 14.028820037841797, 14.584949493408203, 15.14107894897461, 15.697208404541016, 16.253337860107422, 16.809467315673828, 17.365596771240234, 17.92172622680664, 18.477855682373047]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 10.0, 16.0, 14.0, 18.0, 19.0, 17.0, 29.0, 23.0, 38.0, 50.0, 39.0, 50.0, 43.0, 44.0, 49.0, 35.0, 41.0, 55.0, 39.0, 36.0, 33.0, 46.0, 38.0, 27.0, 29.0, 18.0, 21.0, 7.0, 14.0, 10.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.662109375, -2.590667724609375, -2.51922607421875, -2.447784423828125, -2.3763427734375, -2.304901123046875, -2.23345947265625, -2.162017822265625, -2.090576171875, -2.019134521484375, -1.94769287109375, -1.876251220703125, -1.8048095703125, -1.733367919921875, -1.66192626953125, -1.590484619140625, -1.51904296875, -1.447601318359375, -1.37615966796875, -1.304718017578125, -1.2332763671875, -1.161834716796875, -1.09039306640625, -1.018951416015625, -0.947509765625, -0.876068115234375, -0.80462646484375, -0.733184814453125, -0.6617431640625, -0.590301513671875, -0.51885986328125, -0.447418212890625, -0.3759765625, -0.304534912109375, -0.23309326171875, -0.161651611328125, -0.0902099609375, -0.018768310546875, 0.05267333984375, 0.124114990234375, 0.195556640625, 0.266998291015625, 0.33843994140625, 0.409881591796875, 0.4813232421875, 0.552764892578125, 0.62420654296875, 0.695648193359375, 0.76708984375, 0.838531494140625, 0.90997314453125, 0.981414794921875, 1.0528564453125, 1.124298095703125, 1.19573974609375, 1.267181396484375, 1.338623046875, 1.410064697265625, 1.48150634765625, 1.552947998046875, 1.6243896484375, 1.695831298828125, 1.76727294921875, 1.838714599609375, 1.91015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 12.0, 20.0, 33.0, 41.0, 56.0, 114.0, 171.0, 288.0, 485.0, 770.0, 1301.0, 2218.0, 3646.0, 6347.0, 10521.0, 17924.0, 31885.0, 60797.0, 127073.0, 320745.0, 245575.0, 102906.0, 50152.0, 27372.0, 15777.0, 9015.0, 5336.0, 3225.0, 1850.0, 1138.0, 693.0, 437.0, 244.0, 139.0, 88.0, 43.0, 46.0, 21.0, 16.0, 10.0, 11.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.4909400939941406, -0.47553253173828125, -0.4601249694824219, -0.4447174072265625, -0.4293098449707031, -0.41390228271484375, -0.3984947204589844, -0.383087158203125, -0.3676795959472656, -0.35227203369140625, -0.3368644714355469, -0.3214569091796875, -0.3060493469238281, -0.29064178466796875, -0.2752342224121094, -0.25982666015625, -0.24441909790039062, -0.22901153564453125, -0.21360397338867188, -0.1981964111328125, -0.18278884887695312, -0.16738128662109375, -0.15197372436523438, -0.136566162109375, -0.12115859985351562, -0.10575103759765625, -0.09034347534179688, -0.0749359130859375, -0.059528350830078125, -0.04412078857421875, -0.028713226318359375, -0.0133056640625, 0.002101898193359375, 0.01750946044921875, 0.032917022705078125, 0.0483245849609375, 0.06373214721679688, 0.07913970947265625, 0.09454727172851562, 0.109954833984375, 0.12536239624023438, 0.14076995849609375, 0.15617752075195312, 0.1715850830078125, 0.18699264526367188, 0.20240020751953125, 0.21780776977539062, 0.23321533203125, 0.24862289428710938, 0.26403045654296875, 0.2794380187988281, 0.2948455810546875, 0.3102531433105469, 0.32566070556640625, 0.3410682678222656, 0.356475830078125, 0.3718833923339844, 0.38729095458984375, 0.4026985168457031, 0.4181060791015625, 0.4335136413574219, 0.44892120361328125, 0.4643287658691406, 0.479736328125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 10.0, 7.0, 10.0, 13.0, 22.0, 12.0, 14.0, 23.0, 25.0, 26.0, 30.0, 35.0, 37.0, 37.0, 31.0, 43.0, 35.0, 32.0, 37.0, 1064.0, 27.0, 32.0, 44.0, 37.0, 33.0, 29.0, 36.0, 24.0, 28.0, 25.0, 25.0, 23.0, 17.0, 16.0, 16.0, 6.0, 6.0, 9.0, 11.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3583984375, -1.3172760009765625, -1.276153564453125, -1.2350311279296875, -1.19390869140625, -1.1527862548828125, -1.111663818359375, -1.0705413818359375, -1.0294189453125, -0.9882965087890625, -0.947174072265625, -0.9060516357421875, -0.86492919921875, -0.8238067626953125, -0.782684326171875, -0.7415618896484375, -0.700439453125, -0.6593170166015625, -0.618194580078125, -0.5770721435546875, -0.53594970703125, -0.4948272705078125, -0.453704833984375, -0.4125823974609375, -0.3714599609375, -0.3303375244140625, -0.289215087890625, -0.2480926513671875, -0.20697021484375, -0.1658477783203125, -0.124725341796875, -0.0836029052734375, -0.04248046875, -0.0013580322265625, 0.039764404296875, 0.0808868408203125, 0.12200927734375, 0.1631317138671875, 0.204254150390625, 0.2453765869140625, 0.2864990234375, 0.3276214599609375, 0.368743896484375, 0.4098663330078125, 0.45098876953125, 0.4921112060546875, 0.533233642578125, 0.5743560791015625, 0.615478515625, 0.6566009521484375, 0.697723388671875, 0.7388458251953125, 0.77996826171875, 0.8210906982421875, 0.862213134765625, 0.9033355712890625, 0.9444580078125, 0.9855804443359375, 1.026702880859375, 1.0678253173828125, 1.10894775390625, 1.1500701904296875, 1.191192626953125, 1.2323150634765625, 1.2734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 5.0, 9.0, 15.0, 22.0, 35.0, 40.0, 63.0, 110.0, 152.0, 190.0, 331.0, 440.0, 642.0, 885.0, 1219.0, 1738.0, 2416.0, 3516.0, 4800.0, 6669.0, 9396.0, 13324.0, 18943.0, 27182.0, 40491.0, 61636.0, 100250.0, 189570.0, 1277059.0, 118268.0, 69913.0, 45503.0, 30412.0, 20984.0, 14722.0, 10340.0, 7371.0, 5184.0, 3813.0, 2759.0, 1913.0, 1351.0, 1088.0, 655.0, 506.0, 395.0, 252.0, 173.0, 116.0, 83.0, 57.0, 39.0, 30.0, 22.0, 14.0, 9.0, 13.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.2744140625, -0.26560211181640625, -0.2567901611328125, -0.24797821044921875, -0.239166259765625, -0.23035430908203125, -0.2215423583984375, -0.21273040771484375, -0.20391845703125, -0.19510650634765625, -0.1862945556640625, -0.17748260498046875, -0.168670654296875, -0.15985870361328125, -0.1510467529296875, -0.14223480224609375, -0.1334228515625, -0.12461090087890625, -0.1157989501953125, -0.10698699951171875, -0.098175048828125, -0.08936309814453125, -0.0805511474609375, -0.07173919677734375, -0.06292724609375, -0.05411529541015625, -0.0453033447265625, -0.03649139404296875, -0.027679443359375, -0.01886749267578125, -0.0100555419921875, -0.00124359130859375, 0.007568359375, 0.01638031005859375, 0.0251922607421875, 0.03400421142578125, 0.042816162109375, 0.05162811279296875, 0.0604400634765625, 0.06925201416015625, 0.07806396484375, 0.08687591552734375, 0.0956878662109375, 0.10449981689453125, 0.113311767578125, 0.12212371826171875, 0.1309356689453125, 0.13974761962890625, 0.1485595703125, 0.15737152099609375, 0.1661834716796875, 0.17499542236328125, 0.183807373046875, 0.19261932373046875, 0.2014312744140625, 0.21024322509765625, 0.21905517578125, 0.22786712646484375, 0.2366790771484375, 0.24549102783203125, 0.254302978515625, 0.26311492919921875, 0.2719268798828125, 0.28073883056640625, 0.28955078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 10.0, 10.0, 8.0, 16.0, 18.0, 21.0, 39.0, 27.0, 33.0, 42.0, 68.0, 55.0, 53.0, 64.0, 69.0, 54.0, 63.0, 48.0, 50.0, 37.0, 27.0, 43.0, 19.0, 21.0, 16.0, 14.0, 16.0, 12.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.920099258422852e-05, -6.668083369731903e-05, -6.416067481040955e-05, -6.164051592350006e-05, -5.9120357036590576e-05, -5.660019814968109e-05, -5.4080039262771606e-05, -5.155988037586212e-05, -4.903972148895264e-05, -4.651956260204315e-05, -4.399940371513367e-05, -4.147924482822418e-05, -3.89590859413147e-05, -3.643892705440521e-05, -3.391876816749573e-05, -3.139860928058624e-05, -2.8878450393676758e-05, -2.6358291506767273e-05, -2.3838132619857788e-05, -2.1317973732948303e-05, -1.879781484603882e-05, -1.6277655959129333e-05, -1.3757497072219849e-05, -1.1237338185310364e-05, -8.717179298400879e-06, -6.197020411491394e-06, -3.676861524581909e-06, -1.1567026376724243e-06, 1.3634562492370605e-06, 3.883615136146545e-06, 6.40377402305603e-06, 8.923932909965515e-06, 1.1444091796875e-05, 1.3964250683784485e-05, 1.648440957069397e-05, 1.9004568457603455e-05, 2.152472734451294e-05, 2.4044886231422424e-05, 2.656504511833191e-05, 2.9085204005241394e-05, 3.160536289215088e-05, 3.4125521779060364e-05, 3.664568066596985e-05, 3.9165839552879333e-05, 4.168599843978882e-05, 4.42061573266983e-05, 4.672631621360779e-05, 4.924647510051727e-05, 5.176663398742676e-05, 5.428679287433624e-05, 5.680695176124573e-05, 5.932711064815521e-05, 6.18472695350647e-05, 6.436742842197418e-05, 6.688758730888367e-05, 6.940774619579315e-05, 7.192790508270264e-05, 7.444806396961212e-05, 7.69682228565216e-05, 7.948838174343109e-05, 8.200854063034058e-05, 8.452869951725006e-05, 8.704885840415955e-05, 8.956901729106903e-05, 9.208917617797852e-05]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 8.0, 9.0, 8.0, 10.0, 20.0, 33.0, 35.0, 57.0, 65.0, 75.0, 111.0, 171.0, 286.0, 469.0, 899.0, 135450.0, 907729.0, 1677.0, 511.0, 252.0, 213.0, 92.0, 111.0, 64.0, 47.0, 42.0, 22.0, 17.0, 12.0, 16.0, 11.0, 8.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0017881393432617188, -0.001735791563987732, -0.0016834437847137451, -0.0016310960054397583, -0.0015787482261657715, -0.0015264004468917847, -0.0014740526676177979, -0.001421704888343811, -0.0013693571090698242, -0.0013170093297958374, -0.0012646615505218506, -0.0012123137712478638, -0.001159965991973877, -0.0011076182126998901, -0.0010552704334259033, -0.0010029226541519165, -0.0009505748748779297, -0.0008982270956039429, -0.0008458793163299561, -0.0007935315370559692, -0.0007411837577819824, -0.0006888359785079956, -0.0006364881992340088, -0.000584140419960022, -0.0005317926406860352, -0.00047944486141204834, -0.0004270970821380615, -0.0003747493028640747, -0.0003224015235900879, -0.0002700537443161011, -0.00021770596504211426, -0.00016535818576812744, -0.00011301040649414062, -6.066262722015381e-05, -8.314847946166992e-06, 4.4032931327819824e-05, 9.638071060180664e-05, 0.00014872848987579346, 0.00020107626914978027, 0.0002534240484237671, 0.0003057718276977539, 0.0003581196069717407, 0.00041046738624572754, 0.00046281516551971436, 0.0005151629447937012, 0.000567510724067688, 0.0006198585033416748, 0.0006722062826156616, 0.0007245540618896484, 0.0007769018411636353, 0.0008292496204376221, 0.0008815973997116089, 0.0009339451789855957, 0.0009862929582595825, 0.0010386407375335693, 0.0010909885168075562, 0.001143336296081543, 0.0011956840753555298, 0.0012480318546295166, 0.0013003796339035034, 0.0013527274131774902, 0.001405075192451477, 0.0014574229717254639, 0.0015097707509994507, 0.0015621185302734375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 18.0, 74.0, 200.0, 315.0, 251.0, 106.0, 32.0, 9.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014139461563900113, -0.00013720209244638681, -0.0001330095692537725, -0.00012881704606115818, -0.00012462452286854386, -0.00012043199967592955, -0.00011623947648331523, -0.00011204695329070091, -0.0001078544300980866, -0.00010366190690547228, -9.946938371285796e-05, -9.527686052024364e-05, -9.108433732762933e-05, -8.689181413501501e-05, -8.26992909424007e-05, -7.850676774978638e-05, -7.431424455717206e-05, -7.012172136455774e-05, -6.592919817194343e-05, -6.173667497932911e-05, -5.754415178671479e-05, -5.3351628594100475e-05, -4.915910540148616e-05, -4.496658220887184e-05, -4.0774059016257524e-05, -3.658153582364321e-05, -3.238901263102889e-05, -2.8196489438414574e-05, -2.4003966245800257e-05, -1.981144305318594e-05, -1.5618919860571623e-05, -1.1426396667957306e-05, -7.233888027258217e-06, -3.0413648346439004e-06, 1.1511583579704165e-06, 5.3436815505847335e-06, 9.53620474319905e-06, 1.3728727935813367e-05, 1.7921251128427684e-05, 2.2113774321042e-05, 2.6306297513656318e-05, 3.0498820706270635e-05, 3.469134389888495e-05, 3.888386709149927e-05, 4.3076390284113586e-05, 4.72689134767279e-05, 5.146143666934222e-05, 5.565395986195654e-05, 5.9846483054570854e-05, 6.403900624718517e-05, 6.823152943979949e-05, 7.24240526324138e-05, 7.661657582502812e-05, 8.080909901764244e-05, 8.500162221025676e-05, 8.919414540287107e-05, 9.338666859548539e-05, 9.75791917880997e-05, 0.00010177171498071402, 0.00010596423817332834, 0.00011015676136594266, 0.00011434928455855697, 0.00011854180775117129, 0.0001227343309437856, 0.00012692685413639992]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 7.0, 11.0, 12.0, 15.0, 12.0, 16.0, 13.0, 24.0, 24.0, 40.0, 29.0, 30.0, 36.0, 43.0, 35.0, 39.0, 40.0, 44.0, 20.0, 42.0, 46.0, 39.0, 36.0, 38.0, 39.0, 37.0, 27.0, 33.0, 29.0, 19.0, 19.0, 16.0, 14.0, 14.0, 8.0, 8.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.993511199951172e-05, -3.862474113702774e-05, -3.731437027454376e-05, -3.6003999412059784e-05, -3.4693628549575806e-05, -3.338325768709183e-05, -3.207288682460785e-05, -3.076251596212387e-05, -2.9452145099639893e-05, -2.8141774237155914e-05, -2.6831403374671936e-05, -2.5521032512187958e-05, -2.421066164970398e-05, -2.290029078722e-05, -2.1589919924736023e-05, -2.0279549062252045e-05, -1.8969178199768066e-05, -1.7658807337284088e-05, -1.634843647480011e-05, -1.5038065612316132e-05, -1.3727694749832153e-05, -1.2417323887348175e-05, -1.1106953024864197e-05, -9.796582162380219e-06, -8.48621129989624e-06, -7.175840437412262e-06, -5.865469574928284e-06, -4.555098712444305e-06, -3.244727849960327e-06, -1.934356987476349e-06, -6.239861249923706e-07, 6.863847374916077e-07, 1.996755599975586e-06, 3.307126462459564e-06, 4.6174973249435425e-06, 5.927868187427521e-06, 7.238239049911499e-06, 8.548609912395477e-06, 9.858980774879456e-06, 1.1169351637363434e-05, 1.2479722499847412e-05, 1.379009336233139e-05, 1.5100464224815369e-05, 1.6410835087299347e-05, 1.7721205949783325e-05, 1.9031576812267303e-05, 2.0341947674751282e-05, 2.165231853723526e-05, 2.2962689399719238e-05, 2.4273060262203217e-05, 2.5583431124687195e-05, 2.6893801987171173e-05, 2.820417284965515e-05, 2.951454371213913e-05, 3.082491457462311e-05, 3.2135285437107086e-05, 3.3445656299591064e-05, 3.475602716207504e-05, 3.606639802455902e-05, 3.7376768887043e-05, 3.868713974952698e-05, 3.9997510612010956e-05, 4.1307881474494934e-05, 4.261825233697891e-05, 4.392862319946289e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 8.0, 3.0, 12.0, 16.0, 17.0, 10.0, 16.0, 14.0, 18.0, 19.0, 17.0, 29.0, 23.0, 38.0, 50.0, 39.0, 50.0, 43.0, 44.0, 49.0, 35.0, 41.0, 55.0, 39.0, 36.0, 33.0, 46.0, 38.0, 27.0, 29.0, 18.0, 21.0, 7.0, 14.0, 10.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.662109375, -2.590667724609375, -2.51922607421875, -2.447784423828125, -2.3763427734375, -2.304901123046875, -2.23345947265625, -2.162017822265625, -2.090576171875, -2.019134521484375, -1.94769287109375, -1.876251220703125, -1.8048095703125, -1.733367919921875, -1.66192626953125, -1.590484619140625, -1.51904296875, -1.447601318359375, -1.37615966796875, -1.304718017578125, -1.2332763671875, -1.161834716796875, -1.09039306640625, -1.018951416015625, -0.947509765625, -0.876068115234375, -0.80462646484375, -0.733184814453125, -0.6617431640625, -0.590301513671875, -0.51885986328125, -0.447418212890625, -0.3759765625, -0.304534912109375, -0.23309326171875, -0.161651611328125, -0.0902099609375, -0.018768310546875, 0.05267333984375, 0.124114990234375, 0.195556640625, 0.266998291015625, 0.33843994140625, 0.409881591796875, 0.4813232421875, 0.552764892578125, 0.62420654296875, 0.695648193359375, 0.76708984375, 0.838531494140625, 0.90997314453125, 0.981414794921875, 1.0528564453125, 1.124298095703125, 1.19573974609375, 1.267181396484375, 1.338623046875, 1.410064697265625, 1.48150634765625, 1.552947998046875, 1.6243896484375, 1.695831298828125, 1.76727294921875, 1.838714599609375, 1.91015625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 7.0, 20.0, 24.0, 28.0, 44.0, 46.0, 83.0, 89.0, 124.0, 160.0, 265.0, 432.0, 600.0, 1161.0, 2082.0, 4168.0, 9598.0, 27434.0, 103100.0, 415593.0, 357992.0, 84778.0, 23181.0, 8720.0, 3802.0, 1931.0, 1132.0, 624.0, 429.0, 267.0, 180.0, 126.0, 94.0, 60.0, 42.0, 32.0, 20.0, 17.0, 17.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.6883544921875, -2.609130859375, -2.5299072265625, -2.45068359375, -2.3714599609375, -2.292236328125, -2.2130126953125, -2.1337890625, -2.0545654296875, -1.975341796875, -1.8961181640625, -1.81689453125, -1.7376708984375, -1.658447265625, -1.5792236328125, -1.5, -1.4207763671875, -1.341552734375, -1.2623291015625, -1.18310546875, -1.1038818359375, -1.024658203125, -0.9454345703125, -0.8662109375, -0.7869873046875, -0.707763671875, -0.6285400390625, -0.54931640625, -0.4700927734375, -0.390869140625, -0.3116455078125, -0.232421875, -0.1531982421875, -0.073974609375, 0.0052490234375, 0.08447265625, 0.1636962890625, 0.242919921875, 0.3221435546875, 0.4013671875, 0.4805908203125, 0.559814453125, 0.6390380859375, 0.71826171875, 0.7974853515625, 0.876708984375, 0.9559326171875, 1.03515625, 1.1143798828125, 1.193603515625, 1.2728271484375, 1.35205078125, 1.4312744140625, 1.510498046875, 1.5897216796875, 1.6689453125, 1.7481689453125, 1.827392578125, 1.9066162109375, 1.98583984375, 2.0650634765625, 2.144287109375, 2.2235107421875, 2.302734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 3.0, 9.0, 10.0, 11.0, 7.0, 9.0, 16.0, 17.0, 18.0, 29.0, 26.0, 37.0, 26.0, 32.0, 37.0, 47.0, 54.0, 54.0, 197.0, 1701.0, 210.0, 70.0, 46.0, 58.0, 37.0, 47.0, 38.0, 31.0, 22.0, 26.0, 27.0, 19.0, 12.0, 16.0, 12.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.376708984375, -6.13623046875, -5.895751953125, -5.6552734375, -5.414794921875, -5.17431640625, -4.933837890625, -4.693359375, -4.452880859375, -4.21240234375, -3.971923828125, -3.7314453125, -3.490966796875, -3.25048828125, -3.010009765625, -2.76953125, -2.529052734375, -2.28857421875, -2.048095703125, -1.8076171875, -1.567138671875, -1.32666015625, -1.086181640625, -0.845703125, -0.605224609375, -0.36474609375, -0.124267578125, 0.1162109375, 0.356689453125, 0.59716796875, 0.837646484375, 1.078125, 1.318603515625, 1.55908203125, 1.799560546875, 2.0400390625, 2.280517578125, 2.52099609375, 2.761474609375, 3.001953125, 3.242431640625, 3.48291015625, 3.723388671875, 3.9638671875, 4.204345703125, 4.44482421875, 4.685302734375, 4.92578125, 5.166259765625, 5.40673828125, 5.647216796875, 5.8876953125, 6.128173828125, 6.36865234375, 6.609130859375, 6.849609375, 7.090087890625, 7.33056640625, 7.571044921875, 7.8115234375, 8.052001953125, 8.29248046875, 8.532958984375, 8.7734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 11.0, 24.0, 24.0, 31.0, 36.0, 61.0, 71.0, 105.0, 182.0, 345.0, 934.0, 4902.0, 431975.0, 2695044.0, 9714.0, 1206.0, 398.0, 220.0, 111.0, 77.0, 40.0, 38.0, 30.0, 23.0, 15.0, 16.0, 14.0, 11.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0703125, -14.60107421875, -14.1318359375, -13.66259765625, -13.193359375, -12.72412109375, -12.2548828125, -11.78564453125, -11.31640625, -10.84716796875, -10.3779296875, -9.90869140625, -9.439453125, -8.97021484375, -8.5009765625, -8.03173828125, -7.5625, -7.09326171875, -6.6240234375, -6.15478515625, -5.685546875, -5.21630859375, -4.7470703125, -4.27783203125, -3.80859375, -3.33935546875, -2.8701171875, -2.40087890625, -1.931640625, -1.46240234375, -0.9931640625, -0.52392578125, -0.0546875, 0.41455078125, 0.8837890625, 1.35302734375, 1.822265625, 2.29150390625, 2.7607421875, 3.22998046875, 3.69921875, 4.16845703125, 4.6376953125, 5.10693359375, 5.576171875, 6.04541015625, 6.5146484375, 6.98388671875, 7.453125, 7.92236328125, 8.3916015625, 8.86083984375, 9.330078125, 9.79931640625, 10.2685546875, 10.73779296875, 11.20703125, 11.67626953125, 12.1455078125, 12.61474609375, 13.083984375, 13.55322265625, 14.0224609375, 14.49169921875, 14.9609375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 61.0, 830.0, 123.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6708807945251465, -4.1117095947265625, -1.5525383949279785, 1.0066328048706055, 3.5658040046691895, 6.124975681304932, 8.684146881103516, 11.243316650390625, 13.802488327026367, 16.36166000366211, 18.92082977294922, 21.48000144958496, 24.039173126220703, 26.598344802856445, 29.157516479492188, 31.716686248779297, 34.27585983276367, 36.83502960205078, 39.394203186035156, 41.953372955322266, 44.512542724609375, 47.07171630859375, 49.63088607788086, 52.19005584716797, 54.749229431152344, 57.30839920043945, 59.86757278442383, 62.42674255371094, 64.98591613769531, 67.54508972167969, 70.10425567626953, 72.6634292602539, 75.22259521484375, 77.78176879882812, 80.34093475341797, 82.90010833740234, 85.45928192138672, 88.01844787597656, 90.57762145996094, 93.13679504394531, 95.69596862792969, 98.25514221191406, 100.8143081665039, 103.37348175048828, 105.93265533447266, 108.4918212890625, 111.05099487304688, 113.61016845703125, 116.1693344116211, 118.72850799560547, 121.28767395019531, 123.84684753417969, 126.40602111816406, 128.96519470214844, 131.5243682861328, 134.08352661132812, 136.6427001953125, 139.20187377929688, 141.76104736328125, 144.32022094726562, 146.87937927246094, 149.4385528564453, 151.9977264404297, 154.55690002441406, 157.11607360839844]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 8.0, 11.0, 12.0, 10.0, 19.0, 15.0, 28.0, 33.0, 26.0, 35.0, 39.0, 43.0, 42.0, 41.0, 40.0, 41.0, 50.0, 38.0, 44.0, 41.0, 39.0, 46.0, 32.0, 37.0, 45.0, 37.0, 22.0, 20.0, 16.0, 19.0, 12.0, 6.0, 10.0, 4.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.410625457763672, -24.621408462524414, -23.832191467285156, -23.0429744720459, -22.25375747680664, -21.464542388916016, -20.675325393676758, -19.8861083984375, -19.096891403198242, -18.307674407958984, -17.518457412719727, -16.72924041748047, -15.940024375915527, -15.15080738067627, -14.361591339111328, -13.57237434387207, -12.783157348632812, -11.993940353393555, -11.204723358154297, -10.415507316589355, -9.626290321350098, -8.83707332611084, -8.047857284545898, -7.258640289306641, -6.469423294067383, -5.680206298828125, -4.890989780426025, -4.101773262023926, -3.312556266784668, -2.5233395099639893, -1.7341227531433105, -0.9449062347412109, -0.15568923950195312, 0.6335275173187256, 1.4227442741394043, 2.211961030960083, 3.0011777877807617, 3.7903945446014404, 4.579611301422119, 5.368827819824219, 6.158044815063477, 6.947261810302734, 7.736478328704834, 8.525694847106934, 9.314911842346191, 10.10412883758545, 10.89334487915039, 11.682561874389648, 12.471778869628906, 13.260995864868164, 14.050212860107422, 14.839428901672363, 15.628645896911621, 16.417861938476562, 17.20707893371582, 17.996295928955078, 18.785512924194336, 19.574729919433594, 20.36394691467285, 21.15316390991211, 21.942378997802734, 22.731595993041992, 23.52081298828125, 24.310029983520508, 25.099246978759766]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 4.0, 6.0, 10.0, 12.0, 14.0, 19.0, 20.0, 12.0, 14.0, 18.0, 23.0, 26.0, 27.0, 34.0, 33.0, 53.0, 34.0, 52.0, 47.0, 45.0, 43.0, 44.0, 47.0, 45.0, 35.0, 34.0, 56.0, 32.0, 24.0, 26.0, 17.0, 25.0, 13.0, 10.0, 5.0, 7.0, 7.0, 6.0, 11.0, 1.0, 0.0, 4.0, 2.0, 3.0], "bins": [-2.92578125, -2.8514556884765625, -2.777130126953125, -2.7028045654296875, -2.62847900390625, -2.5541534423828125, -2.479827880859375, -2.4055023193359375, -2.3311767578125, -2.2568511962890625, -2.182525634765625, -2.1082000732421875, -2.03387451171875, -1.9595489501953125, -1.885223388671875, -1.8108978271484375, -1.736572265625, -1.6622467041015625, -1.587921142578125, -1.5135955810546875, -1.43927001953125, -1.3649444580078125, -1.290618896484375, -1.2162933349609375, -1.1419677734375, -1.0676422119140625, -0.993316650390625, -0.9189910888671875, -0.84466552734375, -0.7703399658203125, -0.696014404296875, -0.6216888427734375, -0.54736328125, -0.4730377197265625, -0.398712158203125, -0.3243865966796875, -0.25006103515625, -0.1757354736328125, -0.101409912109375, -0.0270843505859375, 0.0472412109375, 0.1215667724609375, 0.195892333984375, 0.2702178955078125, 0.34454345703125, 0.4188690185546875, 0.493194580078125, 0.5675201416015625, 0.641845703125, 0.7161712646484375, 0.790496826171875, 0.8648223876953125, 0.93914794921875, 1.0134735107421875, 1.087799072265625, 1.1621246337890625, 1.2364501953125, 1.3107757568359375, 1.385101318359375, 1.4594268798828125, 1.53375244140625, 1.6080780029296875, 1.682403564453125, 1.7567291259765625, 1.8310546875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 14.0, 21.0, 17.0, 36.0, 34.0, 33.0, 54.0, 83.0, 115.0, 227.0, 441.0, 951.0, 2538.0, 8113.0, 30121.0, 147084.0, 992768.0, 2233312.0, 645707.0, 100963.0, 21946.0, 6151.0, 1940.0, 753.0, 305.0, 142.0, 116.0, 74.0, 48.0, 37.0, 23.0, 20.0, 20.0, 13.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-5.25390625, -5.1094970703125, -4.965087890625, -4.8206787109375, -4.67626953125, -4.5318603515625, -4.387451171875, -4.2430419921875, -4.0986328125, -3.9542236328125, -3.809814453125, -3.6654052734375, -3.52099609375, -3.3765869140625, -3.232177734375, -3.0877685546875, -2.943359375, -2.7989501953125, -2.654541015625, -2.5101318359375, -2.36572265625, -2.2213134765625, -2.076904296875, -1.9324951171875, -1.7880859375, -1.6436767578125, -1.499267578125, -1.3548583984375, -1.21044921875, -1.0660400390625, -0.921630859375, -0.7772216796875, -0.6328125, -0.4884033203125, -0.343994140625, -0.1995849609375, -0.05517578125, 0.0892333984375, 0.233642578125, 0.3780517578125, 0.5224609375, 0.6668701171875, 0.811279296875, 0.9556884765625, 1.10009765625, 1.2445068359375, 1.388916015625, 1.5333251953125, 1.677734375, 1.8221435546875, 1.966552734375, 2.1109619140625, 2.25537109375, 2.3997802734375, 2.544189453125, 2.6885986328125, 2.8330078125, 2.9774169921875, 3.121826171875, 3.2662353515625, 3.41064453125, 3.5550537109375, 3.699462890625, 3.8438720703125, 3.98828125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 31.0, 39.0, 94.0, 181.0, 323.0, 627.0, 974.0, 806.0, 464.0, 273.0, 117.0, 58.0, 32.0, 17.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -16.04931640625, -15.6455078125, -15.24169921875, -14.837890625, -14.43408203125, -14.0302734375, -13.62646484375, -13.22265625, -12.81884765625, -12.4150390625, -12.01123046875, -11.607421875, -11.20361328125, -10.7998046875, -10.39599609375, -9.9921875, -9.58837890625, -9.1845703125, -8.78076171875, -8.376953125, -7.97314453125, -7.5693359375, -7.16552734375, -6.76171875, -6.35791015625, -5.9541015625, -5.55029296875, -5.146484375, -4.74267578125, -4.3388671875, -3.93505859375, -3.53125, -3.12744140625, -2.7236328125, -2.31982421875, -1.916015625, -1.51220703125, -1.1083984375, -0.70458984375, -0.30078125, 0.10302734375, 0.5068359375, 0.91064453125, 1.314453125, 1.71826171875, 2.1220703125, 2.52587890625, 2.9296875, 3.33349609375, 3.7373046875, 4.14111328125, 4.544921875, 4.94873046875, 5.3525390625, 5.75634765625, 6.16015625, 6.56396484375, 6.9677734375, 7.37158203125, 7.775390625, 8.17919921875, 8.5830078125, 8.98681640625, 9.390625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 10.0, 11.0, 26.0, 30.0, 70.0, 155.0, 293.0, 947.0, 24119.0, 4097448.0, 69170.0, 1297.0, 334.0, 154.0, 88.0, 57.0, 19.0, 19.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.50048828125, -21.4072265625, -20.31396484375, -19.220703125, -18.12744140625, -17.0341796875, -15.94091796875, -14.84765625, -13.75439453125, -12.6611328125, -11.56787109375, -10.474609375, -9.38134765625, -8.2880859375, -7.19482421875, -6.1015625, -5.00830078125, -3.9150390625, -2.82177734375, -1.728515625, -0.63525390625, 0.4580078125, 1.55126953125, 2.64453125, 3.73779296875, 4.8310546875, 5.92431640625, 7.017578125, 8.11083984375, 9.2041015625, 10.29736328125, 11.390625, 12.48388671875, 13.5771484375, 14.67041015625, 15.763671875, 16.85693359375, 17.9501953125, 19.04345703125, 20.13671875, 21.22998046875, 22.3232421875, 23.41650390625, 24.509765625, 25.60302734375, 26.6962890625, 27.78955078125, 28.8828125, 29.97607421875, 31.0693359375, 32.16259765625, 33.255859375, 34.34912109375, 35.4423828125, 36.53564453125, 37.62890625, 38.72216796875, 39.8154296875, 40.90869140625, 42.001953125, 43.09521484375, 44.1884765625, 45.28173828125, 46.375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 22.0, 62.0, 128.0, 199.0, 208.0, 201.0, 108.0, 46.0, 23.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.61354446411133, -51.95621871948242, -50.29888916015625, -48.641563415527344, -46.98423767089844, -45.326908111572266, -43.66958236694336, -42.01225280761719, -40.35492706298828, -38.697601318359375, -37.0402717590332, -35.3829460144043, -33.725616455078125, -32.06829071044922, -30.410964965820312, -28.753637313842773, -27.096309661865234, -25.438982009887695, -23.781654357910156, -22.12432861328125, -20.46700096130371, -18.809673309326172, -17.152347564697266, -15.495019912719727, -13.837692260742188, -12.180364608764648, -10.523037910461426, -8.865711212158203, -7.208383560180664, -5.551055908203125, -3.8937292098999023, -2.2364025115966797, -0.5790748596191406, 1.0782523155212402, 2.735579490661621, 4.392906665802002, 6.050233840942383, 7.707561492919922, 9.364888191223145, 11.022214889526367, 12.679542541503906, 14.336870193481445, 15.994196891784668, 17.65152359008789, 19.30885124206543, 20.96617889404297, 22.623504638671875, 24.280832290649414, 25.938159942626953, 27.595487594604492, 29.25281524658203, 30.910140991210938, 32.567466735839844, 34.224796295166016, 35.88212203979492, 37.539451599121094, 39.19677734375, 40.854103088378906, 42.51143264770508, 44.168758392333984, 45.826087951660156, 47.48341369628906, 49.14073944091797, 50.798065185546875, 52.45539474487305]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 11.0, 7.0, 10.0, 12.0, 13.0, 15.0, 15.0, 17.0, 25.0, 38.0, 34.0, 29.0, 40.0, 35.0, 45.0, 46.0, 35.0, 41.0, 39.0, 38.0, 46.0, 43.0, 39.0, 45.0, 30.0, 25.0, 29.0, 29.0, 41.0, 17.0, 21.0, 23.0, 13.0, 12.0, 14.0, 4.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.47956657409668, -21.828731536865234, -21.177898406982422, -20.527063369750977, -19.87622833251953, -19.22539520263672, -18.574560165405273, -17.923725128173828, -17.272891998291016, -16.62205696105957, -15.971222877502441, -15.320388793945312, -14.669554710388184, -14.018720626831055, -13.36788558959961, -12.71705150604248, -12.066216468811035, -11.415382385253906, -10.764547348022461, -10.113713264465332, -9.462879180908203, -8.812044143676758, -8.161210060119629, -7.5103759765625, -6.859541416168213, -6.208706855773926, -5.557872772216797, -4.90703821182251, -4.256203651428223, -3.6053695678710938, -2.9545350074768066, -2.3037009239196777, -1.6528663635253906, -1.0020320415496826, -0.35119760036468506, 0.2996368408203125, 0.9504711627960205, 1.6013054847717285, 2.2521400451660156, 2.9029741287231445, 3.5538086891174316, 4.204643249511719, 4.855477333068848, 5.506311893463135, 6.157146453857422, 6.807980537414551, 7.458815097808838, 8.109649658203125, 8.760483741760254, 9.411317825317383, 10.062152862548828, 10.712986946105957, 11.363821029663086, 12.014656066894531, 12.66549015045166, 13.316324234008789, 13.967159271240234, 14.617993354797363, 15.268828392028809, 15.919662475585938, 16.570497512817383, 17.221330642700195, 17.87216567993164, 18.522998809814453, 19.1738338470459]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 16.0, 14.0, 12.0, 21.0, 16.0, 25.0, 30.0, 37.0, 36.0, 42.0, 54.0, 44.0, 45.0, 50.0, 50.0, 52.0, 43.0, 41.0, 47.0, 42.0, 42.0, 39.0, 23.0, 29.0, 24.0, 10.0, 18.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.232421875, -3.1514434814453125, -3.070465087890625, -2.9894866943359375, -2.90850830078125, -2.8275299072265625, -2.746551513671875, -2.6655731201171875, -2.5845947265625, -2.5036163330078125, -2.422637939453125, -2.3416595458984375, -2.26068115234375, -2.1797027587890625, -2.098724365234375, -2.0177459716796875, -1.936767578125, -1.8557891845703125, -1.774810791015625, -1.6938323974609375, -1.61285400390625, -1.5318756103515625, -1.450897216796875, -1.3699188232421875, -1.2889404296875, -1.2079620361328125, -1.126983642578125, -1.0460052490234375, -0.96502685546875, -0.8840484619140625, -0.803070068359375, -0.7220916748046875, -0.64111328125, -0.5601348876953125, -0.479156494140625, -0.3981781005859375, -0.31719970703125, -0.2362213134765625, -0.155242919921875, -0.0742645263671875, 0.0067138671875, 0.0876922607421875, 0.168670654296875, 0.2496490478515625, 0.33062744140625, 0.4116058349609375, 0.492584228515625, 0.5735626220703125, 0.654541015625, 0.7355194091796875, 0.816497802734375, 0.8974761962890625, 0.97845458984375, 1.0594329833984375, 1.140411376953125, 1.2213897705078125, 1.3023681640625, 1.3833465576171875, 1.464324951171875, 1.5453033447265625, 1.62628173828125, 1.7072601318359375, 1.788238525390625, 1.8692169189453125, 1.9501953125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 10.0, 12.0, 14.0, 37.0, 56.0, 84.0, 147.0, 250.0, 483.0, 805.0, 1347.0, 2331.0, 3829.0, 6424.0, 10481.0, 17596.0, 30680.0, 56806.0, 118067.0, 316779.0, 261425.0, 102532.0, 49978.0, 27564.0, 16236.0, 9706.0, 5966.0, 3579.0, 2140.0, 1318.0, 761.0, 426.0, 265.0, 151.0, 85.0, 62.0, 30.0, 18.0, 22.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.43085479736328125, -0.4154205322265625, -0.39998626708984375, -0.384552001953125, -0.36911773681640625, -0.3536834716796875, -0.33824920654296875, -0.32281494140625, -0.30738067626953125, -0.2919464111328125, -0.27651214599609375, -0.261077880859375, -0.24564361572265625, -0.2302093505859375, -0.21477508544921875, -0.1993408203125, -0.18390655517578125, -0.1684722900390625, -0.15303802490234375, -0.137603759765625, -0.12216949462890625, -0.1067352294921875, -0.09130096435546875, -0.07586669921875, -0.06043243408203125, -0.0449981689453125, -0.02956390380859375, -0.014129638671875, 0.00130462646484375, 0.0167388916015625, 0.03217315673828125, 0.047607421875, 0.06304168701171875, 0.0784759521484375, 0.09391021728515625, 0.109344482421875, 0.12477874755859375, 0.1402130126953125, 0.15564727783203125, 0.17108154296875, 0.18651580810546875, 0.2019500732421875, 0.21738433837890625, 0.232818603515625, 0.24825286865234375, 0.2636871337890625, 0.27912139892578125, 0.2945556640625, 0.30998992919921875, 0.3254241943359375, 0.34085845947265625, 0.356292724609375, 0.37172698974609375, 0.3871612548828125, 0.40259552001953125, 0.41802978515625, 0.43346405029296875, 0.4488983154296875, 0.46433258056640625, 0.479766845703125, 0.49520111083984375, 0.5106353759765625, 0.5260696411132812, 0.54150390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 4.0, 14.0, 17.0, 15.0, 12.0, 10.0, 17.0, 17.0, 18.0, 18.0, 29.0, 25.0, 26.0, 34.0, 37.0, 35.0, 35.0, 38.0, 47.0, 1067.0, 38.0, 46.0, 37.0, 43.0, 33.0, 43.0, 33.0, 37.0, 26.0, 29.0, 16.0, 24.0, 16.0, 14.0, 10.0, 10.0, 12.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.4453125, -1.4029998779296875, -1.360687255859375, -1.3183746337890625, -1.27606201171875, -1.2337493896484375, -1.191436767578125, -1.1491241455078125, -1.1068115234375, -1.0644989013671875, -1.022186279296875, -0.9798736572265625, -0.93756103515625, -0.8952484130859375, -0.852935791015625, -0.8106231689453125, -0.768310546875, -0.7259979248046875, -0.683685302734375, -0.6413726806640625, -0.59906005859375, -0.5567474365234375, -0.514434814453125, -0.4721221923828125, -0.4298095703125, -0.3874969482421875, -0.345184326171875, -0.3028717041015625, -0.26055908203125, -0.2182464599609375, -0.175933837890625, -0.1336212158203125, -0.09130859375, -0.0489959716796875, -0.006683349609375, 0.0356292724609375, 0.07794189453125, 0.1202545166015625, 0.162567138671875, 0.2048797607421875, 0.2471923828125, 0.2895050048828125, 0.331817626953125, 0.3741302490234375, 0.41644287109375, 0.4587554931640625, 0.501068115234375, 0.5433807373046875, 0.585693359375, 0.6280059814453125, 0.670318603515625, 0.7126312255859375, 0.75494384765625, 0.7972564697265625, 0.839569091796875, 0.8818817138671875, 0.9241943359375, 0.9665069580078125, 1.008819580078125, 1.0511322021484375, 1.09344482421875, 1.1357574462890625, 1.178070068359375, 1.2203826904296875, 1.2626953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 20.0, 23.0, 35.0, 60.0, 70.0, 105.0, 140.0, 213.0, 272.0, 441.0, 660.0, 862.0, 1267.0, 1818.0, 2627.0, 3591.0, 5277.0, 7562.0, 10803.0, 15374.0, 22404.0, 34066.0, 53037.0, 87605.0, 167943.0, 1317842.0, 141310.0, 76666.0, 47566.0, 30733.0, 20426.0, 13736.0, 9531.0, 6697.0, 4802.0, 3395.0, 2456.0, 1754.0, 1214.0, 898.0, 591.0, 397.0, 284.0, 185.0, 123.0, 94.0, 44.0, 36.0, 24.0, 19.0, 7.0, 14.0, 7.0, 9.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2978515625, -0.288360595703125, -0.27886962890625, -0.269378662109375, -0.2598876953125, -0.250396728515625, -0.24090576171875, -0.231414794921875, -0.221923828125, -0.212432861328125, -0.20294189453125, -0.193450927734375, -0.1839599609375, -0.174468994140625, -0.16497802734375, -0.155487060546875, -0.14599609375, -0.136505126953125, -0.12701416015625, -0.117523193359375, -0.1080322265625, -0.098541259765625, -0.08905029296875, -0.079559326171875, -0.070068359375, -0.060577392578125, -0.05108642578125, -0.041595458984375, -0.0321044921875, -0.022613525390625, -0.01312255859375, -0.003631591796875, 0.005859375, 0.015350341796875, 0.02484130859375, 0.034332275390625, 0.0438232421875, 0.053314208984375, 0.06280517578125, 0.072296142578125, 0.081787109375, 0.091278076171875, 0.10076904296875, 0.110260009765625, 0.1197509765625, 0.129241943359375, 0.13873291015625, 0.148223876953125, 0.15771484375, 0.167205810546875, 0.17669677734375, 0.186187744140625, 0.1956787109375, 0.205169677734375, 0.21466064453125, 0.224151611328125, 0.233642578125, 0.243133544921875, 0.25262451171875, 0.262115478515625, 0.2716064453125, 0.281097412109375, 0.29058837890625, 0.300079345703125, 0.3095703125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 12.0, 9.0, 14.0, 15.0, 24.0, 23.0, 29.0, 27.0, 40.0, 47.0, 60.0, 71.0, 85.0, 72.0, 69.0, 66.0, 65.0, 44.0, 41.0, 34.0, 33.0, 24.0, 16.0, 15.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.855892181396484e-05, -7.606390863656998e-05, -7.356889545917511e-05, -7.107388228178024e-05, -6.857886910438538e-05, -6.608385592699051e-05, -6.358884274959564e-05, -6.109382957220078e-05, -5.859881639480591e-05, -5.610380321741104e-05, -5.3608790040016174e-05, -5.111377686262131e-05, -4.861876368522644e-05, -4.6123750507831573e-05, -4.3628737330436707e-05, -4.113372415304184e-05, -3.863871097564697e-05, -3.6143697798252106e-05, -3.364868462085724e-05, -3.115367144346237e-05, -2.8658658266067505e-05, -2.6163645088672638e-05, -2.366863191127777e-05, -2.1173618733882904e-05, -1.8678605556488037e-05, -1.618359237909317e-05, -1.3688579201698303e-05, -1.1193566024303436e-05, -8.69855284690857e-06, -6.203539669513702e-06, -3.7085264921188354e-06, -1.2135133147239685e-06, 1.2814998626708984e-06, 3.7765130400657654e-06, 6.271526217460632e-06, 8.7665393948555e-06, 1.1261552572250366e-05, 1.3756565749645233e-05, 1.62515789270401e-05, 1.8746592104434967e-05, 2.1241605281829834e-05, 2.37366184592247e-05, 2.6231631636619568e-05, 2.8726644814014435e-05, 3.12216579914093e-05, 3.371667116880417e-05, 3.6211684346199036e-05, 3.87066975235939e-05, 4.120171070098877e-05, 4.3696723878383636e-05, 4.6191737055778503e-05, 4.868675023317337e-05, 5.118176341056824e-05, 5.3676776587963104e-05, 5.617178976535797e-05, 5.866680294275284e-05, 6.11618161201477e-05, 6.365682929754257e-05, 6.615184247493744e-05, 6.86468556523323e-05, 7.114186882972717e-05, 7.363688200712204e-05, 7.61318951845169e-05, 7.862690836191177e-05, 8.112192153930664e-05]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 13.0, 13.0, 24.0, 25.0, 54.0, 64.0, 89.0, 119.0, 194.0, 315.0, 491.0, 1439.0, 476897.0, 565577.0, 1664.0, 505.0, 316.0, 218.0, 138.0, 93.0, 63.0, 40.0, 32.0, 23.0, 26.0, 21.0, 15.0, 15.0, 15.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00157928466796875, -0.001531451940536499, -0.001483619213104248, -0.001435786485671997, -0.001387953758239746, -0.0013401210308074951, -0.0012922883033752441, -0.0012444555759429932, -0.0011966228485107422, -0.0011487901210784912, -0.0011009573936462402, -0.0010531246662139893, -0.0010052919387817383, -0.0009574592113494873, -0.0009096264839172363, -0.0008617937564849854, -0.0008139610290527344, -0.0007661283016204834, -0.0007182955741882324, -0.0006704628467559814, -0.0006226301193237305, -0.0005747973918914795, -0.0005269646644592285, -0.00047913193702697754, -0.00043129920959472656, -0.0003834664821624756, -0.0003356337547302246, -0.00028780102729797363, -0.00023996829986572266, -0.00019213557243347168, -0.0001443028450012207, -9.647011756896973e-05, -4.863739013671875e-05, -8.046627044677734e-07, 4.70280647277832e-05, 9.486079216003418e-05, 0.00014269351959228516, 0.00019052624702453613, 0.0002383589744567871, 0.0002861917018890381, 0.00033402442932128906, 0.00038185715675354004, 0.000429689884185791, 0.000477522611618042, 0.000525355339050293, 0.0005731880664825439, 0.0006210207939147949, 0.0006688535213470459, 0.0007166862487792969, 0.0007645189762115479, 0.0008123517036437988, 0.0008601844310760498, 0.0009080171585083008, 0.0009558498859405518, 0.0010036826133728027, 0.0010515153408050537, 0.0010993480682373047, 0.0011471807956695557, 0.0011950135231018066, 0.0012428462505340576, 0.0012906789779663086, 0.0013385117053985596, 0.0013863444328308105, 0.0014341771602630615, 0.0014820098876953125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 35.0, 89.0, 200.0, 292.0, 227.0, 113.0, 41.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019078976765740663, -0.00018678136984817684, -0.00018277298659086227, -0.00017876458878163248, -0.0001747561909724027, -0.0001707477931631729, -0.0001667393953539431, -0.00016273101209662855, -0.00015872261428739876, -0.00015471421647816896, -0.0001507058332208544, -0.0001466974354116246, -0.00014268903760239482, -0.00013868063979316503, -0.00013467224198393524, -0.00013066385872662067, -0.00012665546091739088, -0.0001226470631081611, -0.00011863867257488891, -0.00011463028204161674, -0.00011062188423238695, -0.00010661348642315716, -0.00010260509588988498, -9.85967053566128e-05, -9.458830754738301e-05, -9.057990973815322e-05, -8.657151920488104e-05, -8.256312867160887e-05, -7.855473086237907e-05, -7.454633305314928e-05, -7.05379425198771e-05, -6.652955198660493e-05, -6.252114690141752e-05, -5.851275273016654e-05, -5.4504358558915555e-05, -5.049596438766457e-05, -4.648757021641359e-05, -4.24791760451626e-05, -3.847078187391162e-05, -3.4462387702660635e-05, -3.045399353140965e-05, -2.6445599360158667e-05, -2.2437205188907683e-05, -1.84288110176567e-05, -1.4420416846405715e-05, -1.041202267515473e-05, -6.403628503903747e-06, -2.3952343326527625e-06, 1.6131598385982215e-06, 5.621554009849206e-06, 9.62994818110019e-06, 1.3638342352351174e-05, 1.7646736523602158e-05, 2.1655130694853142e-05, 2.5663524866104126e-05, 2.967191903735511e-05, 3.3680313208606094e-05, 3.768870737985708e-05, 4.169710155110806e-05, 4.5705495722359046e-05, 4.971388989361003e-05, 5.3722284064861014e-05, 5.7730678236112e-05, 6.173907604534179e-05, 6.574746657861397e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 5.0, 8.0, 6.0, 7.0, 3.0, 23.0, 14.0, 19.0, 17.0, 21.0, 27.0, 42.0, 37.0, 32.0, 46.0, 41.0, 51.0, 52.0, 43.0, 42.0, 58.0, 47.0, 42.0, 50.0, 42.0, 39.0, 29.0, 31.0, 24.0, 13.0, 11.0, 14.0, 14.0, 11.0, 8.0, 6.0, 3.0, 6.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.8691796362400055e-05, -3.7388876080513e-05, -3.6085955798625946e-05, -3.478303551673889e-05, -3.348011523485184e-05, -3.217719495296478e-05, -3.087427467107773e-05, -2.9571354389190674e-05, -2.826843410730362e-05, -2.6965513825416565e-05, -2.566259354352951e-05, -2.4359673261642456e-05, -2.30567529797554e-05, -2.1753832697868347e-05, -2.0450912415981293e-05, -1.9147992134094238e-05, -1.7845071852207184e-05, -1.654215157032013e-05, -1.5239231288433075e-05, -1.393631100654602e-05, -1.2633390724658966e-05, -1.1330470442771912e-05, -1.0027550160884857e-05, -8.724629878997803e-06, -7.421709597110748e-06, -6.118789315223694e-06, -4.815869033336639e-06, -3.512948751449585e-06, -2.2100284695625305e-06, -9.071081876754761e-07, 3.9581209421157837e-07, 1.6987323760986328e-06, 3.0016526579856873e-06, 4.304572939872742e-06, 5.607493221759796e-06, 6.910413503646851e-06, 8.213333785533905e-06, 9.51625406742096e-06, 1.0819174349308014e-05, 1.2122094631195068e-05, 1.3425014913082123e-05, 1.4727935194969177e-05, 1.603085547685623e-05, 1.7333775758743286e-05, 1.863669604063034e-05, 1.9939616322517395e-05, 2.124253660440445e-05, 2.2545456886291504e-05, 2.384837716817856e-05, 2.5151297450065613e-05, 2.6454217731952667e-05, 2.775713801383972e-05, 2.9060058295726776e-05, 3.036297857761383e-05, 3.1665898859500885e-05, 3.296881914138794e-05, 3.4271739423274994e-05, 3.557465970516205e-05, 3.68775799870491e-05, 3.818050026893616e-05, 3.948342055082321e-05, 4.0786340832710266e-05, 4.208926111459732e-05, 4.3392181396484375e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 16.0, 14.0, 12.0, 21.0, 16.0, 25.0, 30.0, 37.0, 36.0, 42.0, 54.0, 44.0, 45.0, 50.0, 50.0, 52.0, 43.0, 41.0, 47.0, 42.0, 42.0, 39.0, 23.0, 29.0, 24.0, 10.0, 18.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.232421875, -3.1514434814453125, -3.070465087890625, -2.9894866943359375, -2.90850830078125, -2.8275299072265625, -2.746551513671875, -2.6655731201171875, -2.5845947265625, -2.5036163330078125, -2.422637939453125, -2.3416595458984375, -2.26068115234375, -2.1797027587890625, -2.098724365234375, -2.0177459716796875, -1.936767578125, -1.8557891845703125, -1.774810791015625, -1.6938323974609375, -1.61285400390625, -1.5318756103515625, -1.450897216796875, -1.3699188232421875, -1.2889404296875, -1.2079620361328125, -1.126983642578125, -1.0460052490234375, -0.96502685546875, -0.8840484619140625, -0.803070068359375, -0.7220916748046875, -0.64111328125, -0.5601348876953125, -0.479156494140625, -0.3981781005859375, -0.31719970703125, -0.2362213134765625, -0.155242919921875, -0.0742645263671875, 0.0067138671875, 0.0876922607421875, 0.168670654296875, 0.2496490478515625, 0.33062744140625, 0.4116058349609375, 0.492584228515625, 0.5735626220703125, 0.654541015625, 0.7355194091796875, 0.816497802734375, 0.8974761962890625, 0.97845458984375, 1.0594329833984375, 1.140411376953125, 1.2213897705078125, 1.3023681640625, 1.3833465576171875, 1.464324951171875, 1.5453033447265625, 1.62628173828125, 1.7072601318359375, 1.788238525390625, 1.8692169189453125, 1.9501953125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 14.0, 30.0, 33.0, 48.0, 80.0, 112.0, 169.0, 323.0, 552.0, 1048.0, 1983.0, 3668.0, 7344.0, 15553.0, 37299.0, 94567.0, 231560.0, 338505.0, 186482.0, 73900.0, 29711.0, 12659.0, 6001.0, 3053.0, 1611.0, 915.0, 484.0, 320.0, 187.0, 128.0, 70.0, 55.0, 34.0, 17.0, 15.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.1859893798828125, -2.125885009765625, -2.0657806396484375, -2.00567626953125, -1.9455718994140625, -1.885467529296875, -1.8253631591796875, -1.7652587890625, -1.7051544189453125, -1.645050048828125, -1.5849456787109375, -1.52484130859375, -1.4647369384765625, -1.404632568359375, -1.3445281982421875, -1.284423828125, -1.2243194580078125, -1.164215087890625, -1.1041107177734375, -1.04400634765625, -0.9839019775390625, -0.923797607421875, -0.8636932373046875, -0.8035888671875, -0.7434844970703125, -0.683380126953125, -0.6232757568359375, -0.56317138671875, -0.5030670166015625, -0.442962646484375, -0.3828582763671875, -0.32275390625, -0.2626495361328125, -0.202545166015625, -0.1424407958984375, -0.08233642578125, -0.0222320556640625, 0.037872314453125, 0.0979766845703125, 0.1580810546875, 0.2181854248046875, 0.278289794921875, 0.3383941650390625, 0.39849853515625, 0.4586029052734375, 0.518707275390625, 0.5788116455078125, 0.638916015625, 0.6990203857421875, 0.759124755859375, 0.8192291259765625, 0.87933349609375, 0.9394378662109375, 0.999542236328125, 1.0596466064453125, 1.1197509765625, 1.1798553466796875, 1.239959716796875, 1.3000640869140625, 1.36016845703125, 1.4202728271484375, 1.480377197265625, 1.5404815673828125, 1.6005859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 9.0, 13.0, 14.0, 12.0, 16.0, 20.0, 22.0, 37.0, 38.0, 50.0, 60.0, 48.0, 76.0, 154.0, 439.0, 1467.0, 126.0, 84.0, 74.0, 49.0, 33.0, 33.0, 30.0, 23.0, 26.0, 22.0, 17.0, 13.0, 13.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.07373046875, -9.7490234375, -9.42431640625, -9.099609375, -8.77490234375, -8.4501953125, -8.12548828125, -7.80078125, -7.47607421875, -7.1513671875, -6.82666015625, -6.501953125, -6.17724609375, -5.8525390625, -5.52783203125, -5.203125, -4.87841796875, -4.5537109375, -4.22900390625, -3.904296875, -3.57958984375, -3.2548828125, -2.93017578125, -2.60546875, -2.28076171875, -1.9560546875, -1.63134765625, -1.306640625, -0.98193359375, -0.6572265625, -0.33251953125, -0.0078125, 0.31689453125, 0.6416015625, 0.96630859375, 1.291015625, 1.61572265625, 1.9404296875, 2.26513671875, 2.58984375, 2.91455078125, 3.2392578125, 3.56396484375, 3.888671875, 4.21337890625, 4.5380859375, 4.86279296875, 5.1875, 5.51220703125, 5.8369140625, 6.16162109375, 6.486328125, 6.81103515625, 7.1357421875, 7.46044921875, 7.78515625, 8.10986328125, 8.4345703125, 8.75927734375, 9.083984375, 9.40869140625, 9.7333984375, 10.05810546875, 10.3828125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 14.0, 13.0, 20.0, 21.0, 21.0, 44.0, 45.0, 41.0, 73.0, 104.0, 187.0, 314.0, 759.0, 3352.0, 96768.0, 2997886.0, 42071.0, 2407.0, 666.0, 277.0, 195.0, 103.0, 68.0, 61.0, 33.0, 30.0, 26.0, 20.0, 13.0, 14.0, 14.0, 9.0, 6.0, 5.0, 6.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4296875, -13.9552001953125, -13.480712890625, -13.0062255859375, -12.53173828125, -12.0572509765625, -11.582763671875, -11.1082763671875, -10.6337890625, -10.1593017578125, -9.684814453125, -9.2103271484375, -8.73583984375, -8.2613525390625, -7.786865234375, -7.3123779296875, -6.837890625, -6.3634033203125, -5.888916015625, -5.4144287109375, -4.93994140625, -4.4654541015625, -3.990966796875, -3.5164794921875, -3.0419921875, -2.5675048828125, -2.093017578125, -1.6185302734375, -1.14404296875, -0.6695556640625, -0.195068359375, 0.2794189453125, 0.75390625, 1.2283935546875, 1.702880859375, 2.1773681640625, 2.65185546875, 3.1263427734375, 3.600830078125, 4.0753173828125, 4.5498046875, 5.0242919921875, 5.498779296875, 5.9732666015625, 6.44775390625, 6.9222412109375, 7.396728515625, 7.8712158203125, 8.345703125, 8.8201904296875, 9.294677734375, 9.7691650390625, 10.24365234375, 10.7181396484375, 11.192626953125, 11.6671142578125, 12.1416015625, 12.6160888671875, 13.090576171875, 13.5650634765625, 14.03955078125, 14.5140380859375, 14.988525390625, 15.4630126953125, 15.9375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 15.0, 40.0, 71.0, 137.0, 185.0, 200.0, 168.0, 109.0, 51.0, 19.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6231865882873535, -5.011821269989014, -4.400455474853516, -3.789090156555176, -3.177724599838257, -2.566359043121338, -1.954993724822998, -1.3436279296875, -0.7322626113891602, -0.12089711427688599, 0.4904683828353882, 1.1018338203430176, 1.7131993770599365, 2.3245649337768555, 2.9359302520751953, 3.5472960472106934, 4.158661365509033, 4.770026683807373, 5.381392478942871, 5.992757797241211, 6.604123115539551, 7.215488910675049, 7.826854228973389, 8.438220024108887, 9.049585342407227, 9.660950660705566, 10.272315979003906, 10.883682250976562, 11.495047569274902, 12.106412887573242, 12.717778205871582, 13.329143524169922, 13.940507888793945, 14.551873207092285, 15.163238525390625, 15.774604797363281, 16.385969161987305, 16.99733543395996, 17.608699798583984, 18.22006607055664, 18.831432342529297, 19.442798614501953, 20.054162979125977, 20.665529251098633, 21.276893615722656, 21.888259887695312, 22.49962615966797, 23.110990524291992, 23.722354888916016, 24.333721160888672, 24.945085525512695, 25.55645179748535, 26.167816162109375, 26.77918243408203, 27.390548706054688, 28.00191307067871, 28.613279342651367, 29.224645614624023, 29.836009979248047, 30.447376251220703, 31.058740615844727, 31.670106887817383, 32.281471252441406, 32.89283752441406, 33.50420379638672]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 9.0, 7.0, 4.0, 4.0, 8.0, 12.0, 8.0, 14.0, 18.0, 31.0, 25.0, 21.0, 34.0, 25.0, 26.0, 30.0, 58.0, 47.0, 41.0, 38.0, 44.0, 49.0, 38.0, 37.0, 43.0, 49.0, 35.0, 33.0, 28.0, 24.0, 31.0, 14.0, 11.0, 18.0, 10.0, 16.0, 19.0, 10.0, 10.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.636640548706055, -28.737361907958984, -27.838083267211914, -26.938804626464844, -26.039527893066406, -25.140247344970703, -24.240970611572266, -23.341691970825195, -22.442413330078125, -21.543134689331055, -20.643856048583984, -19.744577407836914, -18.845298767089844, -17.946022033691406, -17.046743392944336, -16.147464752197266, -15.248186111450195, -14.348907470703125, -13.449628829956055, -12.5503511428833, -11.65107250213623, -10.75179386138916, -9.852516174316406, -8.953237533569336, -8.053958892822266, -7.154680252075195, -6.255402088165283, -5.356123924255371, -4.456845283508301, -3.5575666427612305, -2.6582884788513184, -1.7590103149414062, -0.8597335815429688, 0.03954482078552246, 0.9388232231140137, 1.8381016254425049, 2.737380027770996, 3.6366586685180664, 4.5359368324279785, 5.435214996337891, 6.334493637084961, 7.233772277832031, 8.133050918579102, 9.032328605651855, 9.931607246398926, 10.830885887145996, 11.73016357421875, 12.62944221496582, 13.52872085571289, 14.427999496459961, 15.327278137207031, 16.2265567779541, 17.125835418701172, 18.02511215209961, 18.92439079284668, 19.82366943359375, 20.72294807434082, 21.62222671508789, 22.52150535583496, 23.42078399658203, 24.32006072998047, 25.219341278076172, 26.11861801147461, 27.01789665222168, 27.91717529296875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 10.0, 10.0, 16.0, 9.0, 20.0, 15.0, 12.0, 20.0, 20.0, 23.0, 32.0, 33.0, 43.0, 35.0, 56.0, 47.0, 51.0, 50.0, 44.0, 58.0, 45.0, 44.0, 45.0, 42.0, 39.0, 35.0, 30.0, 20.0, 25.0, 16.0, 9.0, 9.0, 10.0, 12.0, 6.0, 4.0, 6.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.52734375, -3.440399169921875, -3.35345458984375, -3.266510009765625, -3.1795654296875, -3.092620849609375, -3.00567626953125, -2.918731689453125, -2.831787109375, -2.744842529296875, -2.65789794921875, -2.570953369140625, -2.4840087890625, -2.397064208984375, -2.31011962890625, -2.223175048828125, -2.13623046875, -2.049285888671875, -1.96234130859375, -1.875396728515625, -1.7884521484375, -1.701507568359375, -1.61456298828125, -1.527618408203125, -1.440673828125, -1.353729248046875, -1.26678466796875, -1.179840087890625, -1.0928955078125, -1.005950927734375, -0.91900634765625, -0.832061767578125, -0.7451171875, -0.658172607421875, -0.57122802734375, -0.484283447265625, -0.3973388671875, -0.310394287109375, -0.22344970703125, -0.136505126953125, -0.049560546875, 0.037384033203125, 0.12432861328125, 0.211273193359375, 0.2982177734375, 0.385162353515625, 0.47210693359375, 0.559051513671875, 0.64599609375, 0.732940673828125, 0.81988525390625, 0.906829833984375, 0.9937744140625, 1.080718994140625, 1.16766357421875, 1.254608154296875, 1.341552734375, 1.428497314453125, 1.51544189453125, 1.602386474609375, 1.6893310546875, 1.776275634765625, 1.86322021484375, 1.950164794921875, 2.037109375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 8.0, 9.0, 10.0, 14.0, 10.0, 10.0, 21.0, 12.0, 27.0, 36.0, 56.0, 86.0, 115.0, 314.0, 794.0, 3004.0, 18718.0, 189584.0, 2281401.0, 1569903.0, 114078.0, 12595.0, 2273.0, 566.0, 239.0, 121.0, 73.0, 50.0, 39.0, 32.0, 13.0, 15.0, 10.0, 12.0, 8.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.1387939453125, -7.918212890625, -7.6976318359375, -7.47705078125, -7.2564697265625, -7.035888671875, -6.8153076171875, -6.5947265625, -6.3741455078125, -6.153564453125, -5.9329833984375, -5.71240234375, -5.4918212890625, -5.271240234375, -5.0506591796875, -4.830078125, -4.6094970703125, -4.388916015625, -4.1683349609375, -3.94775390625, -3.7271728515625, -3.506591796875, -3.2860107421875, -3.0654296875, -2.8448486328125, -2.624267578125, -2.4036865234375, -2.18310546875, -1.9625244140625, -1.741943359375, -1.5213623046875, -1.30078125, -1.0802001953125, -0.859619140625, -0.6390380859375, -0.41845703125, -0.1978759765625, 0.022705078125, 0.2432861328125, 0.4638671875, 0.6844482421875, 0.905029296875, 1.1256103515625, 1.34619140625, 1.5667724609375, 1.787353515625, 2.0079345703125, 2.228515625, 2.4490966796875, 2.669677734375, 2.8902587890625, 3.11083984375, 3.3314208984375, 3.552001953125, 3.7725830078125, 3.9931640625, 4.2137451171875, 4.434326171875, 4.6549072265625, 4.87548828125, 5.0960693359375, 5.316650390625, 5.5372314453125, 5.7578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 4.0, 13.0, 25.0, 28.0, 45.0, 81.0, 134.0, 216.0, 317.0, 462.0, 636.0, 633.0, 502.0, 347.0, 237.0, 149.0, 87.0, 60.0, 41.0, 17.0, 12.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.6044921875, -6.318359375, -6.0322265625, -5.74609375, -5.4599609375, -5.173828125, -4.8876953125, -4.6015625, -4.3154296875, -4.029296875, -3.7431640625, -3.45703125, -3.1708984375, -2.884765625, -2.5986328125, -2.3125, -2.0263671875, -1.740234375, -1.4541015625, -1.16796875, -0.8818359375, -0.595703125, -0.3095703125, -0.0234375, 0.2626953125, 0.548828125, 0.8349609375, 1.12109375, 1.4072265625, 1.693359375, 1.9794921875, 2.265625, 2.5517578125, 2.837890625, 3.1240234375, 3.41015625, 3.6962890625, 3.982421875, 4.2685546875, 4.5546875, 4.8408203125, 5.126953125, 5.4130859375, 5.69921875, 5.9853515625, 6.271484375, 6.5576171875, 6.84375, 7.1298828125, 7.416015625, 7.7021484375, 7.98828125, 8.2744140625, 8.560546875, 8.8466796875, 9.1328125, 9.4189453125, 9.705078125, 9.9912109375, 10.27734375, 10.5634765625, 10.849609375, 11.1357421875, 11.421875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 9.0, 19.0, 21.0, 28.0, 53.0, 71.0, 131.0, 205.0, 349.0, 800.0, 3643.0, 119067.0, 3885003.0, 178717.0, 4426.0, 821.0, 371.0, 178.0, 121.0, 72.0, 51.0, 43.0, 26.0, 17.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.23583984375, -23.5341796875, -22.83251953125, -22.130859375, -21.42919921875, -20.7275390625, -20.02587890625, -19.32421875, -18.62255859375, -17.9208984375, -17.21923828125, -16.517578125, -15.81591796875, -15.1142578125, -14.41259765625, -13.7109375, -13.00927734375, -12.3076171875, -11.60595703125, -10.904296875, -10.20263671875, -9.5009765625, -8.79931640625, -8.09765625, -7.39599609375, -6.6943359375, -5.99267578125, -5.291015625, -4.58935546875, -3.8876953125, -3.18603515625, -2.484375, -1.78271484375, -1.0810546875, -0.37939453125, 0.322265625, 1.02392578125, 1.7255859375, 2.42724609375, 3.12890625, 3.83056640625, 4.5322265625, 5.23388671875, 5.935546875, 6.63720703125, 7.3388671875, 8.04052734375, 8.7421875, 9.44384765625, 10.1455078125, 10.84716796875, 11.548828125, 12.25048828125, 12.9521484375, 13.65380859375, 14.35546875, 15.05712890625, 15.7587890625, 16.46044921875, 17.162109375, 17.86376953125, 18.5654296875, 19.26708984375, 19.96875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 50.0, 143.0, 312.0, 282.0, 162.0, 44.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.97673034667969, -57.36958312988281, -54.76243591308594, -52.15528869628906, -49.54814529418945, -46.94099807739258, -44.3338508605957, -41.726707458496094, -39.11956024169922, -36.512413024902344, -33.90526580810547, -31.298120498657227, -28.690975189208984, -26.08382797241211, -23.476680755615234, -20.869535446166992, -18.262386322021484, -15.655240058898926, -13.048093795776367, -10.440946578979492, -7.833800315856934, -5.226654052734375, -2.6195068359375, -0.012361526489257812, 2.594785690307617, 5.201931953430176, 7.809078693389893, 10.41622543334961, 13.023371696472168, 15.630517959594727, 18.2376651763916, 20.844810485839844, 23.45195770263672, 26.059104919433594, 28.666250228881836, 31.27339744567871, 33.88054275512695, 36.48768997192383, 39.0948371887207, 41.70198059082031, 44.30912780761719, 46.91627502441406, 49.52342224121094, 52.13056945800781, 54.73771286010742, 57.3448600769043, 59.95200729370117, 62.55915069580078, 65.16630554199219, 67.77345275878906, 70.38059997558594, 72.98774719238281, 75.59489440917969, 78.20204162597656, 80.80918884277344, 83.41632843017578, 86.02347564697266, 88.63062286376953, 91.2377700805664, 93.84491729736328, 96.45206451416016, 99.0592041015625, 101.66635131835938, 104.27349853515625, 106.88064575195312]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 0.0, 4.0, 10.0, 11.0, 12.0, 19.0, 16.0, 11.0, 22.0, 17.0, 21.0, 19.0, 20.0, 39.0, 41.0, 43.0, 36.0, 36.0, 31.0, 39.0, 42.0, 36.0, 29.0, 33.0, 41.0, 30.0, 47.0, 34.0, 29.0, 23.0, 28.0, 29.0, 26.0, 21.0, 16.0, 15.0, 13.0, 10.0, 4.0, 10.0, 12.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-20.96520233154297, -20.3347225189209, -19.704240798950195, -19.073760986328125, -18.443281173706055, -17.812801361083984, -17.18231964111328, -16.55183982849121, -15.921359062194824, -15.290878295898438, -14.660398483276367, -14.02991771697998, -13.399436950683594, -12.768957138061523, -12.138476371765137, -11.50799560546875, -10.87751579284668, -10.247035026550293, -9.616555213928223, -8.986074447631836, -8.355594635009766, -7.725113868713379, -7.094633102416992, -6.464152812957764, -5.833672523498535, -5.203192234039307, -4.572711944580078, -3.9422311782836914, -3.311750888824463, -2.6812705993652344, -2.0507900714874268, -1.4203095436096191, -0.7898292541503906, -0.15934884548187256, 0.4711315631866455, 1.1016119718551636, 1.7320923805236816, 2.36257266998291, 2.9930531978607178, 3.6235337257385254, 4.254014015197754, 4.884494304656982, 5.514974594116211, 6.145455360412598, 6.775935649871826, 7.406415939331055, 8.036896705627441, 8.667377471923828, 9.297857284545898, 9.928338050842285, 10.558817863464355, 11.189298629760742, 11.819778442382812, 12.4502592086792, 13.080739974975586, 13.711219787597656, 14.341700553894043, 14.97218132019043, 15.6026611328125, 16.23314094543457, 16.863622665405273, 17.494102478027344, 18.124582290649414, 18.755064010620117, 19.385543823242188]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 13.0, 20.0, 26.0, 24.0, 32.0, 37.0, 37.0, 33.0, 53.0, 50.0, 55.0, 55.0, 51.0, 45.0, 55.0, 55.0, 41.0, 36.0, 33.0, 36.0, 18.0, 29.0, 24.0, 14.0, 15.0, 11.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.4552001953125, -3.363525390625, -3.2718505859375, -3.18017578125, -3.0885009765625, -2.996826171875, -2.9051513671875, -2.8134765625, -2.7218017578125, -2.630126953125, -2.5384521484375, -2.44677734375, -2.3551025390625, -2.263427734375, -2.1717529296875, -2.080078125, -1.9884033203125, -1.896728515625, -1.8050537109375, -1.71337890625, -1.6217041015625, -1.530029296875, -1.4383544921875, -1.3466796875, -1.2550048828125, -1.163330078125, -1.0716552734375, -0.97998046875, -0.8883056640625, -0.796630859375, -0.7049560546875, -0.61328125, -0.5216064453125, -0.429931640625, -0.3382568359375, -0.24658203125, -0.1549072265625, -0.063232421875, 0.0284423828125, 0.1201171875, 0.2117919921875, 0.303466796875, 0.3951416015625, 0.48681640625, 0.5784912109375, 0.670166015625, 0.7618408203125, 0.853515625, 0.9451904296875, 1.036865234375, 1.1285400390625, 1.22021484375, 1.3118896484375, 1.403564453125, 1.4952392578125, 1.5869140625, 1.6785888671875, 1.770263671875, 1.8619384765625, 1.95361328125, 2.0452880859375, 2.136962890625, 2.2286376953125, 2.3203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 14.0, 17.0, 26.0, 41.0, 74.0, 101.0, 165.0, 290.0, 421.0, 763.0, 1257.0, 2105.0, 3448.0, 5817.0, 9934.0, 16766.0, 29955.0, 56664.0, 117734.0, 313142.0, 265863.0, 106161.0, 51585.0, 27820.0, 15837.0, 8979.0, 5376.0, 3265.0, 2004.0, 1127.0, 707.0, 436.0, 238.0, 148.0, 88.0, 58.0, 36.0, 24.0, 17.0, 14.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5673828125, -0.5496139526367188, -0.5318450927734375, -0.5140762329101562, -0.496307373046875, -0.47853851318359375, -0.4607696533203125, -0.44300079345703125, -0.42523193359375, -0.40746307373046875, -0.3896942138671875, -0.37192535400390625, -0.354156494140625, -0.33638763427734375, -0.3186187744140625, -0.30084991455078125, -0.2830810546875, -0.26531219482421875, -0.2475433349609375, -0.22977447509765625, -0.212005615234375, -0.19423675537109375, -0.1764678955078125, -0.15869903564453125, -0.14093017578125, -0.12316131591796875, -0.1053924560546875, -0.08762359619140625, -0.069854736328125, -0.05208587646484375, -0.0343170166015625, -0.01654815673828125, 0.001220703125, 0.01898956298828125, 0.0367584228515625, 0.05452728271484375, 0.072296142578125, 0.09006500244140625, 0.1078338623046875, 0.12560272216796875, 0.14337158203125, 0.16114044189453125, 0.1789093017578125, 0.19667816162109375, 0.214447021484375, 0.23221588134765625, 0.2499847412109375, 0.26775360107421875, 0.2855224609375, 0.30329132080078125, 0.3210601806640625, 0.33882904052734375, 0.356597900390625, 0.37436676025390625, 0.3921356201171875, 0.40990447998046875, 0.42767333984375, 0.44544219970703125, 0.4632110595703125, 0.48097991943359375, 0.498748779296875, 0.5165176391601562, 0.5342864990234375, 0.5520553588867188, 0.56982421875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 8.0, 2.0, 2.0, 3.0, 10.0, 15.0, 9.0, 9.0, 15.0, 14.0, 24.0, 23.0, 26.0, 28.0, 19.0, 26.0, 31.0, 47.0, 37.0, 48.0, 43.0, 43.0, 1055.0, 44.0, 37.0, 32.0, 35.0, 43.0, 29.0, 38.0, 29.0, 30.0, 31.0, 20.0, 19.0, 18.0, 26.0, 15.0, 5.0, 9.0, 4.0, 6.0, 2.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4229278564453125, -1.375152587890625, -1.3273773193359375, -1.27960205078125, -1.2318267822265625, -1.184051513671875, -1.1362762451171875, -1.0885009765625, -1.0407257080078125, -0.992950439453125, -0.9451751708984375, -0.89739990234375, -0.8496246337890625, -0.801849365234375, -0.7540740966796875, -0.706298828125, -0.6585235595703125, -0.610748291015625, -0.5629730224609375, -0.51519775390625, -0.4674224853515625, -0.419647216796875, -0.3718719482421875, -0.3240966796875, -0.2763214111328125, -0.228546142578125, -0.1807708740234375, -0.13299560546875, -0.0852203369140625, -0.037445068359375, 0.0103302001953125, 0.05810546875, 0.1058807373046875, 0.153656005859375, 0.2014312744140625, 0.24920654296875, 0.2969818115234375, 0.344757080078125, 0.3925323486328125, 0.4403076171875, 0.4880828857421875, 0.535858154296875, 0.5836334228515625, 0.63140869140625, 0.6791839599609375, 0.726959228515625, 0.7747344970703125, 0.822509765625, 0.8702850341796875, 0.918060302734375, 0.9658355712890625, 1.01361083984375, 1.0613861083984375, 1.109161376953125, 1.1569366455078125, 1.2047119140625, 1.2524871826171875, 1.300262451171875, 1.3480377197265625, 1.39581298828125, 1.4435882568359375, 1.491363525390625, 1.5391387939453125, 1.5869140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 19.0, 16.0, 20.0, 42.0, 61.0, 98.0, 119.0, 168.0, 271.0, 347.0, 498.0, 667.0, 980.0, 1314.0, 1971.0, 2782.0, 3946.0, 5708.0, 8182.0, 12009.0, 17587.0, 25895.0, 39375.0, 62290.0, 107691.0, 217972.0, 1280980.0, 114065.0, 65832.0, 41027.0, 26663.0, 17942.0, 12212.0, 8565.0, 5910.0, 4172.0, 2856.0, 2048.0, 1398.0, 1055.0, 743.0, 488.0, 331.0, 236.0, 192.0, 113.0, 90.0, 70.0, 40.0, 34.0, 18.0, 15.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.34423828125, -0.33349609375, -0.32275390625, -0.31201171875, -0.30126953125, -0.29052734375, -0.27978515625, -0.26904296875, -0.25830078125, -0.24755859375, -0.23681640625, -0.22607421875, -0.21533203125, -0.20458984375, -0.19384765625, -0.18310546875, -0.17236328125, -0.16162109375, -0.15087890625, -0.14013671875, -0.12939453125, -0.11865234375, -0.10791015625, -0.09716796875, -0.08642578125, -0.07568359375, -0.06494140625, -0.05419921875, -0.04345703125, -0.03271484375, -0.02197265625, -0.01123046875, -0.00048828125, 0.01025390625, 0.02099609375, 0.03173828125, 0.04248046875, 0.05322265625, 0.06396484375, 0.07470703125, 0.08544921875, 0.09619140625, 0.10693359375, 0.11767578125, 0.12841796875, 0.13916015625, 0.14990234375, 0.16064453125, 0.17138671875, 0.18212890625, 0.19287109375, 0.20361328125, 0.21435546875, 0.22509765625, 0.23583984375, 0.24658203125, 0.25732421875, 0.26806640625, 0.27880859375, 0.28955078125, 0.30029296875, 0.31103515625, 0.32177734375, 0.33251953125, 0.34326171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 7.0, 5.0, 7.0, 4.0, 17.0, 14.0, 35.0, 37.0, 44.0, 53.0, 40.0, 56.0, 86.0, 93.0, 82.0, 69.0, 59.0, 58.0, 55.0, 32.0, 28.0, 23.0, 20.0, 10.0, 12.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.0001193443313241005, -0.00011566467583179474, -0.00011198502033948898, -0.00010830536484718323, -0.00010462570935487747, -0.00010094605386257172, -9.726639837026596e-05, -9.35867428779602e-05, -8.990708738565445e-05, -8.62274318933487e-05, -8.254777640104294e-05, -7.886812090873718e-05, -7.518846541643143e-05, -7.150880992412567e-05, -6.782915443181992e-05, -6.414949893951416e-05, -6.0469843447208405e-05, -5.679018795490265e-05, -5.311053246259689e-05, -4.943087697029114e-05, -4.575122147798538e-05, -4.2071565985679626e-05, -3.839191049337387e-05, -3.4712255001068115e-05, -3.103259950876236e-05, -2.7352944016456604e-05, -2.367328852415085e-05, -1.9993633031845093e-05, -1.6313977539539337e-05, -1.2634322047233582e-05, -8.954666554927826e-06, -5.27501106262207e-06, -1.5953555703163147e-06, 2.084299921989441e-06, 5.7639554142951965e-06, 9.443610906600952e-06, 1.3123266398906708e-05, 1.6802921891212463e-05, 2.048257738351822e-05, 2.4162232875823975e-05, 2.784188836812973e-05, 3.1521543860435486e-05, 3.520119935274124e-05, 3.8880854845047e-05, 4.256051033735275e-05, 4.624016582965851e-05, 4.9919821321964264e-05, 5.359947681427002e-05, 5.7279132306575775e-05, 6.095878779888153e-05, 6.463844329118729e-05, 6.831809878349304e-05, 7.19977542757988e-05, 7.567740976810455e-05, 7.935706526041031e-05, 8.303672075271606e-05, 8.671637624502182e-05, 9.039603173732758e-05, 9.407568722963333e-05, 9.775534272193909e-05, 0.00010143499821424484, 0.0001051146537065506, 0.00010879430919885635, 0.00011247396469116211]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 8.0, 16.0, 14.0, 25.0, 34.0, 51.0, 77.0, 98.0, 170.0, 268.0, 490.0, 1442.0, 883484.0, 160292.0, 955.0, 426.0, 237.0, 151.0, 112.0, 54.0, 35.0, 32.0, 20.0, 13.0, 9.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0021686553955078125, -0.0020935535430908203, -0.002018451690673828, -0.001943349838256836, -0.0018682479858398438, -0.0017931461334228516, -0.0017180442810058594, -0.0016429424285888672, -0.001567840576171875, -0.0014927387237548828, -0.0014176368713378906, -0.0013425350189208984, -0.0012674331665039062, -0.001192331314086914, -0.0011172294616699219, -0.0010421276092529297, -0.0009670257568359375, -0.0008919239044189453, -0.0008168220520019531, -0.0007417201995849609, -0.0006666183471679688, -0.0005915164947509766, -0.0005164146423339844, -0.0004413127899169922, -0.0003662109375, -0.0002911090850830078, -0.00021600723266601562, -0.00014090538024902344, -6.580352783203125e-05, 9.298324584960938e-06, 8.440017700195312e-05, 0.0001595020294189453, 0.0002346038818359375, 0.0003097057342529297, 0.0003848075866699219, 0.00045990943908691406, 0.0005350112915039062, 0.0006101131439208984, 0.0006852149963378906, 0.0007603168487548828, 0.000835418701171875, 0.0009105205535888672, 0.0009856224060058594, 0.0010607242584228516, 0.0011358261108398438, 0.001210927963256836, 0.0012860298156738281, 0.0013611316680908203, 0.0014362335205078125, 0.0015113353729248047, 0.0015864372253417969, 0.001661539077758789, 0.0017366409301757812, 0.0018117427825927734, 0.0018868446350097656, 0.001961946487426758, 0.00203704833984375, 0.002112150192260742, 0.0021872520446777344, 0.0022623538970947266, 0.0023374557495117188, 0.002412557601928711, 0.002487659454345703, 0.0025627613067626953, 0.0026378631591796875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 10.0, 74.0, 178.0, 319.0, 252.0, 126.0, 42.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002227829972980544, -0.00021745401318185031, -0.00021212502906564623, -0.00020679604494944215, -0.00020146706083323807, -0.00019613807671703398, -0.00019080910715274513, -0.00018548010848462582, -0.00018015113892033696, -0.00017482215480413288, -0.0001694931706879288, -0.0001641641865717247, -0.00015883520245552063, -0.00015350621833931655, -0.00014817723422311246, -0.0001428482646588236, -0.0001375192659907043, -0.00013219028187450022, -0.00012686129775829613, -0.00012153231364209205, -0.00011620332952588797, -0.00011087434540968388, -0.00010554536856943741, -0.00010021638445323333, -9.488740033702925e-05, -8.955841622082517e-05, -8.422943210462108e-05, -7.890045526437461e-05, -7.357147114817053e-05, -6.824248703196645e-05, -6.291350291576236e-05, -5.758451879955828e-05, -5.22555346833542e-05, -4.6926550567150116e-05, -4.159756645094603e-05, -3.626858597272076e-05, -3.0939601856516674e-05, -2.561061774031259e-05, -2.0281637262087315e-05, -1.4952653145883232e-05, -9.62366902967915e-06, -4.294685822969768e-06, 1.034297383739613e-06, 6.363279680954292e-06, 1.1692263797158375e-05, 1.702124791336246e-05, 2.2350228391587734e-05, 2.7679212507791817e-05, 3.30081966239959e-05, 3.833718074019998e-05, 4.3666164856404066e-05, 4.899514533462934e-05, 5.4324129450833425e-05, 5.965311356703751e-05, 6.498209404526278e-05, 7.031107816146687e-05, 7.564006227767095e-05, 8.096904639387503e-05, 8.629803051007912e-05, 9.162700735032558e-05, 9.695599146652967e-05, 0.00010228497558273375, 0.00010761395969893783, 0.00011294294381514192, 0.000118271927931346]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 8.0, 13.0, 9.0, 11.0, 13.0, 25.0, 17.0, 17.0, 24.0, 22.0, 30.0, 31.0, 42.0, 39.0, 50.0, 33.0, 39.0, 55.0, 39.0, 44.0, 49.0, 37.0, 29.0, 38.0, 34.0, 32.0, 26.0, 38.0, 31.0, 19.0, 11.0, 19.0, 15.0, 10.0, 12.0, 2.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.710124969482422e-05, -5.5429525673389435e-05, -5.375780165195465e-05, -5.208607763051987e-05, -5.041435360908508e-05, -4.87426295876503e-05, -4.7070905566215515e-05, -4.539918154478073e-05, -4.372745752334595e-05, -4.205573350191116e-05, -4.038400948047638e-05, -3.8712285459041595e-05, -3.704056143760681e-05, -3.536883741617203e-05, -3.3697113394737244e-05, -3.202538937330246e-05, -3.0353665351867676e-05, -2.8681941330432892e-05, -2.7010217308998108e-05, -2.5338493287563324e-05, -2.366676926612854e-05, -2.1995045244693756e-05, -2.0323321223258972e-05, -1.8651597201824188e-05, -1.6979873180389404e-05, -1.530814915895462e-05, -1.3636425137519836e-05, -1.1964701116085052e-05, -1.0292977094650269e-05, -8.621253073215485e-06, -6.949529051780701e-06, -5.277805030345917e-06, -3.606081008911133e-06, -1.934356987476349e-06, -2.6263296604156494e-07, 1.409091055393219e-06, 3.080815076828003e-06, 4.752539098262787e-06, 6.424263119697571e-06, 8.095987141132355e-06, 9.767711162567139e-06, 1.1439435184001923e-05, 1.3111159205436707e-05, 1.478288322687149e-05, 1.6454607248306274e-05, 1.812633126974106e-05, 1.9798055291175842e-05, 2.1469779312610626e-05, 2.314150333404541e-05, 2.4813227355480194e-05, 2.6484951376914978e-05, 2.8156675398349762e-05, 2.9828399419784546e-05, 3.150012344121933e-05, 3.3171847462654114e-05, 3.48435714840889e-05, 3.651529550552368e-05, 3.8187019526958466e-05, 3.985874354839325e-05, 4.1530467569828033e-05, 4.320219159126282e-05, 4.48739156126976e-05, 4.6545639634132385e-05, 4.821736365556717e-05, 4.988908767700195e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 5.0, 10.0, 10.0, 17.0, 18.0, 13.0, 20.0, 26.0, 24.0, 32.0, 37.0, 37.0, 33.0, 53.0, 50.0, 55.0, 55.0, 51.0, 45.0, 55.0, 55.0, 41.0, 36.0, 33.0, 36.0, 18.0, 29.0, 24.0, 14.0, 15.0, 11.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.4552001953125, -3.363525390625, -3.2718505859375, -3.18017578125, -3.0885009765625, -2.996826171875, -2.9051513671875, -2.8134765625, -2.7218017578125, -2.630126953125, -2.5384521484375, -2.44677734375, -2.3551025390625, -2.263427734375, -2.1717529296875, -2.080078125, -1.9884033203125, -1.896728515625, -1.8050537109375, -1.71337890625, -1.6217041015625, -1.530029296875, -1.4383544921875, -1.3466796875, -1.2550048828125, -1.163330078125, -1.0716552734375, -0.97998046875, -0.8883056640625, -0.796630859375, -0.7049560546875, -0.61328125, -0.5216064453125, -0.429931640625, -0.3382568359375, -0.24658203125, -0.1549072265625, -0.063232421875, 0.0284423828125, 0.1201171875, 0.2117919921875, 0.303466796875, 0.3951416015625, 0.48681640625, 0.5784912109375, 0.670166015625, 0.7618408203125, 0.853515625, 0.9451904296875, 1.036865234375, 1.1285400390625, 1.22021484375, 1.3118896484375, 1.403564453125, 1.4952392578125, 1.5869140625, 1.6785888671875, 1.770263671875, 1.8619384765625, 1.95361328125, 2.0452880859375, 2.136962890625, 2.2286376953125, 2.3203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 14.0, 14.0, 16.0, 23.0, 26.0, 50.0, 64.0, 71.0, 168.0, 256.0, 415.0, 793.0, 1380.0, 2698.0, 5352.0, 11418.0, 29065.0, 97757.0, 481515.0, 308960.0, 68181.0, 21553.0, 9296.0, 4360.0, 2244.0, 1162.0, 629.0, 383.0, 210.0, 162.0, 99.0, 67.0, 44.0, 29.0, 32.0, 14.0, 9.0, 8.0, 6.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.13653564453125, -3.0152587890625, -2.89398193359375, -2.772705078125, -2.65142822265625, -2.5301513671875, -2.40887451171875, -2.28759765625, -2.16632080078125, -2.0450439453125, -1.92376708984375, -1.802490234375, -1.68121337890625, -1.5599365234375, -1.43865966796875, -1.3173828125, -1.19610595703125, -1.0748291015625, -0.95355224609375, -0.832275390625, -0.71099853515625, -0.5897216796875, -0.46844482421875, -0.34716796875, -0.22589111328125, -0.1046142578125, 0.01666259765625, 0.137939453125, 0.25921630859375, 0.3804931640625, 0.50177001953125, 0.623046875, 0.74432373046875, 0.8656005859375, 0.98687744140625, 1.108154296875, 1.22943115234375, 1.3507080078125, 1.47198486328125, 1.59326171875, 1.71453857421875, 1.8358154296875, 1.95709228515625, 2.078369140625, 2.19964599609375, 2.3209228515625, 2.44219970703125, 2.5634765625, 2.68475341796875, 2.8060302734375, 2.92730712890625, 3.048583984375, 3.16986083984375, 3.2911376953125, 3.41241455078125, 3.53369140625, 3.65496826171875, 3.7762451171875, 3.89752197265625, 4.018798828125, 4.14007568359375, 4.2613525390625, 4.38262939453125, 4.50390625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 1.0, 5.0, 8.0, 10.0, 7.0, 11.0, 15.0, 24.0, 18.0, 35.0, 28.0, 38.0, 44.0, 47.0, 61.0, 63.0, 94.0, 201.0, 1590.0, 201.0, 91.0, 64.0, 64.0, 47.0, 50.0, 38.0, 35.0, 25.0, 20.0, 27.0, 13.0, 21.0, 7.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.9923095703125, -8.687744140625, -8.3831787109375, -8.07861328125, -7.7740478515625, -7.469482421875, -7.1649169921875, -6.8603515625, -6.5557861328125, -6.251220703125, -5.9466552734375, -5.64208984375, -5.3375244140625, -5.032958984375, -4.7283935546875, -4.423828125, -4.1192626953125, -3.814697265625, -3.5101318359375, -3.20556640625, -2.9010009765625, -2.596435546875, -2.2918701171875, -1.9873046875, -1.6827392578125, -1.378173828125, -1.0736083984375, -0.76904296875, -0.4644775390625, -0.159912109375, 0.1446533203125, 0.44921875, 0.7537841796875, 1.058349609375, 1.3629150390625, 1.66748046875, 1.9720458984375, 2.276611328125, 2.5811767578125, 2.8857421875, 3.1903076171875, 3.494873046875, 3.7994384765625, 4.10400390625, 4.4085693359375, 4.713134765625, 5.0177001953125, 5.322265625, 5.6268310546875, 5.931396484375, 6.2359619140625, 6.54052734375, 6.8450927734375, 7.149658203125, 7.4542236328125, 7.7587890625, 8.0633544921875, 8.367919921875, 8.6724853515625, 8.97705078125, 9.2816162109375, 9.586181640625, 9.8907470703125, 10.1953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 13.0, 9.0, 6.0, 12.0, 27.0, 33.0, 41.0, 66.0, 90.0, 146.0, 268.0, 537.0, 2887.0, 386636.0, 2748022.0, 5382.0, 697.0, 288.0, 188.0, 111.0, 59.0, 46.0, 42.0, 17.0, 19.0, 12.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.890625, -29.01416015625, -28.1376953125, -27.26123046875, -26.384765625, -25.50830078125, -24.6318359375, -23.75537109375, -22.87890625, -22.00244140625, -21.1259765625, -20.24951171875, -19.373046875, -18.49658203125, -17.6201171875, -16.74365234375, -15.8671875, -14.99072265625, -14.1142578125, -13.23779296875, -12.361328125, -11.48486328125, -10.6083984375, -9.73193359375, -8.85546875, -7.97900390625, -7.1025390625, -6.22607421875, -5.349609375, -4.47314453125, -3.5966796875, -2.72021484375, -1.84375, -0.96728515625, -0.0908203125, 0.78564453125, 1.662109375, 2.53857421875, 3.4150390625, 4.29150390625, 5.16796875, 6.04443359375, 6.9208984375, 7.79736328125, 8.673828125, 9.55029296875, 10.4267578125, 11.30322265625, 12.1796875, 13.05615234375, 13.9326171875, 14.80908203125, 15.685546875, 16.56201171875, 17.4384765625, 18.31494140625, 19.19140625, 20.06787109375, 20.9443359375, 21.82080078125, 22.697265625, 23.57373046875, 24.4501953125, 25.32666015625, 26.203125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 6.0, 15.0, 23.0, 33.0, 50.0, 79.0, 98.0, 114.0, 141.0, 112.0, 92.0, 91.0, 53.0, 43.0, 25.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.73713207244873, -9.322479248046875, -8.907827377319336, -8.49317455291748, -8.078522682189941, -7.663869857788086, -7.249217510223389, -6.834565162658691, -6.419912815093994, -6.005260467529297, -5.5906081199646, -5.175955772399902, -4.761302947998047, -4.346651077270508, -3.9319982528686523, -3.517345905303955, -3.102693557739258, -2.6880412101745605, -2.2733888626098633, -1.858736276626587, -1.4440839290618896, -1.0294315814971924, -0.614778995513916, -0.20012664794921875, 0.21452569961547852, 0.6291781067848206, 1.0438305139541626, 1.4584829807281494, 1.8731353282928467, 2.287787675857544, 2.7024402618408203, 3.1170926094055176, 3.5317459106445312, 3.9463982582092285, 4.361050605773926, 4.775703430175781, 5.19035530090332, 5.605008125305176, 6.019660472869873, 6.43431282043457, 6.848965167999268, 7.263617515563965, 7.678269863128662, 8.09292221069336, 8.507575035095215, 8.922226905822754, 9.33687973022461, 9.751531600952148, 10.166184425354004, 10.58083724975586, 10.995489120483398, 11.410141944885254, 11.824793815612793, 12.239446640014648, 12.654098510742188, 13.068751335144043, 13.483404159545898, 13.898056983947754, 14.312708854675293, 14.727361679077148, 15.142013549804688, 15.556666374206543, 15.971319198608398, 16.385971069335938, 16.800622940063477]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 0.0, 3.0, 5.0, 3.0, 3.0, 9.0, 13.0, 10.0, 9.0, 16.0, 20.0, 16.0, 18.0, 25.0, 41.0, 31.0, 23.0, 27.0, 46.0, 34.0, 45.0, 56.0, 49.0, 42.0, 46.0, 42.0, 47.0, 36.0, 34.0, 36.0, 28.0, 28.0, 20.0, 23.0, 15.0, 20.0, 15.0, 14.0, 13.0, 11.0, 11.0, 8.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.16049575805664, -27.354175567626953, -26.5478572845459, -25.74153709411621, -24.935216903686523, -24.12889862060547, -23.32257843017578, -22.516258239746094, -21.709938049316406, -20.90361785888672, -20.097299575805664, -19.290979385375977, -18.48465919494629, -17.678340911865234, -16.872020721435547, -16.06570053100586, -15.259382247924805, -14.453063011169434, -13.646742820739746, -12.840423583984375, -12.034103393554688, -11.227784156799316, -10.421464920043945, -9.615144729614258, -8.808825492858887, -8.002506256103516, -7.196186065673828, -6.389866828918457, -5.583547115325928, -4.777227401733398, -3.9709081649780273, -3.164588451385498, -2.358266830444336, -1.5519472360610962, -0.7456276416778564, 0.06069183349609375, 0.867011547088623, 1.6733312606811523, 2.4796504974365234, 3.2859702110290527, 4.092289924621582, 4.898609638214111, 5.704929351806641, 6.511248588562012, 7.317568302154541, 8.12388801574707, 8.930207252502441, 9.736526489257812, 10.5428466796875, 11.349165916442871, 12.155486106872559, 12.96180534362793, 13.768125534057617, 14.574444770812988, 15.38076400756836, 16.187084197998047, 16.993404388427734, 17.799724578857422, 18.606042861938477, 19.412363052368164, 20.21868324279785, 21.025001525878906, 21.831321716308594, 22.63764190673828, 23.443960189819336]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 8.0, 14.0, 14.0, 17.0, 19.0, 19.0, 19.0, 32.0, 28.0, 24.0, 37.0, 52.0, 44.0, 47.0, 49.0, 53.0, 42.0, 51.0, 40.0, 52.0, 47.0, 41.0, 34.0, 24.0, 35.0, 29.0, 18.0, 19.0, 18.0, 15.0, 9.0, 11.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.52734375, -3.4345703125, -3.341796875, -3.2490234375, -3.15625, -3.0634765625, -2.970703125, -2.8779296875, -2.78515625, -2.6923828125, -2.599609375, -2.5068359375, -2.4140625, -2.3212890625, -2.228515625, -2.1357421875, -2.04296875, -1.9501953125, -1.857421875, -1.7646484375, -1.671875, -1.5791015625, -1.486328125, -1.3935546875, -1.30078125, -1.2080078125, -1.115234375, -1.0224609375, -0.9296875, -0.8369140625, -0.744140625, -0.6513671875, -0.55859375, -0.4658203125, -0.373046875, -0.2802734375, -0.1875, -0.0947265625, -0.001953125, 0.0908203125, 0.18359375, 0.2763671875, 0.369140625, 0.4619140625, 0.5546875, 0.6474609375, 0.740234375, 0.8330078125, 0.92578125, 1.0185546875, 1.111328125, 1.2041015625, 1.296875, 1.3896484375, 1.482421875, 1.5751953125, 1.66796875, 1.7607421875, 1.853515625, 1.9462890625, 2.0390625, 2.1318359375, 2.224609375, 2.3173828125, 2.41015625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 4.0, 10.0, 13.0, 15.0, 22.0, 36.0, 39.0, 49.0, 75.0, 105.0, 138.0, 245.0, 378.0, 608.0, 1175.0, 2280.0, 5060.0, 11889.0, 31186.0, 91513.0, 300274.0, 880384.0, 1434242.0, 934082.0, 337108.0, 104542.0, 34983.0, 13094.0, 5404.0, 2450.0, 1202.0, 596.0, 332.0, 211.0, 143.0, 97.0, 89.0, 58.0, 43.0, 26.0, 16.0, 18.0, 10.0, 9.0, 10.0, 2.0, 6.0, 5.0, 1.0, 2.0], "bins": [-3.470703125, -3.375732421875, -3.28076171875, -3.185791015625, -3.0908203125, -2.995849609375, -2.90087890625, -2.805908203125, -2.7109375, -2.615966796875, -2.52099609375, -2.426025390625, -2.3310546875, -2.236083984375, -2.14111328125, -2.046142578125, -1.951171875, -1.856201171875, -1.76123046875, -1.666259765625, -1.5712890625, -1.476318359375, -1.38134765625, -1.286376953125, -1.19140625, -1.096435546875, -1.00146484375, -0.906494140625, -0.8115234375, -0.716552734375, -0.62158203125, -0.526611328125, -0.431640625, -0.336669921875, -0.24169921875, -0.146728515625, -0.0517578125, 0.043212890625, 0.13818359375, 0.233154296875, 0.328125, 0.423095703125, 0.51806640625, 0.613037109375, 0.7080078125, 0.802978515625, 0.89794921875, 0.992919921875, 1.087890625, 1.182861328125, 1.27783203125, 1.372802734375, 1.4677734375, 1.562744140625, 1.65771484375, 1.752685546875, 1.84765625, 1.942626953125, 2.03759765625, 2.132568359375, 2.2275390625, 2.322509765625, 2.41748046875, 2.512451171875, 2.607421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 23.0, 32.0, 57.0, 72.0, 115.0, 186.0, 282.0, 388.0, 511.0, 633.0, 591.0, 381.0, 259.0, 179.0, 139.0, 81.0, 43.0, 33.0, 25.0, 8.0, 10.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.53961181640625, -10.2589111328125, -9.97821044921875, -9.697509765625, -9.41680908203125, -9.1361083984375, -8.85540771484375, -8.57470703125, -8.29400634765625, -8.0133056640625, -7.73260498046875, -7.451904296875, -7.17120361328125, -6.8905029296875, -6.60980224609375, -6.3291015625, -6.04840087890625, -5.7677001953125, -5.48699951171875, -5.206298828125, -4.92559814453125, -4.6448974609375, -4.36419677734375, -4.08349609375, -3.80279541015625, -3.5220947265625, -3.24139404296875, -2.960693359375, -2.67999267578125, -2.3992919921875, -2.11859130859375, -1.837890625, -1.55718994140625, -1.2764892578125, -0.99578857421875, -0.715087890625, -0.43438720703125, -0.1536865234375, 0.12701416015625, 0.40771484375, 0.68841552734375, 0.9691162109375, 1.24981689453125, 1.530517578125, 1.81121826171875, 2.0919189453125, 2.37261962890625, 2.6533203125, 2.93402099609375, 3.2147216796875, 3.49542236328125, 3.776123046875, 4.05682373046875, 4.3375244140625, 4.61822509765625, 4.89892578125, 5.17962646484375, 5.4603271484375, 5.74102783203125, 6.021728515625, 6.30242919921875, 6.5831298828125, 6.86383056640625, 7.14453125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 21.0, 16.0, 15.0, 36.0, 58.0, 86.0, 114.0, 191.0, 372.0, 827.0, 4837.0, 196554.0, 3784228.0, 200357.0, 4862.0, 803.0, 324.0, 187.0, 105.0, 79.0, 56.0, 40.0, 24.0, 20.0, 16.0, 16.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-22.015625, -21.3955078125, -20.775390625, -20.1552734375, -19.53515625, -18.9150390625, -18.294921875, -17.6748046875, -17.0546875, -16.4345703125, -15.814453125, -15.1943359375, -14.57421875, -13.9541015625, -13.333984375, -12.7138671875, -12.09375, -11.4736328125, -10.853515625, -10.2333984375, -9.61328125, -8.9931640625, -8.373046875, -7.7529296875, -7.1328125, -6.5126953125, -5.892578125, -5.2724609375, -4.65234375, -4.0322265625, -3.412109375, -2.7919921875, -2.171875, -1.5517578125, -0.931640625, -0.3115234375, 0.30859375, 0.9287109375, 1.548828125, 2.1689453125, 2.7890625, 3.4091796875, 4.029296875, 4.6494140625, 5.26953125, 5.8896484375, 6.509765625, 7.1298828125, 7.75, 8.3701171875, 8.990234375, 9.6103515625, 10.23046875, 10.8505859375, 11.470703125, 12.0908203125, 12.7109375, 13.3310546875, 13.951171875, 14.5712890625, 15.19140625, 15.8115234375, 16.431640625, 17.0517578125, 17.671875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 18.0, 39.0, 90.0, 189.0, 238.0, 209.0, 130.0, 61.0, 22.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.017578125, -71.08941650390625, -69.16124725341797, -67.23308563232422, -65.30491638183594, -63.37675476074219, -61.44858932495117, -59.520423889160156, -57.59225845336914, -55.664093017578125, -53.73592758178711, -51.807762145996094, -49.879600524902344, -47.95143127441406, -46.02326965332031, -44.0951042175293, -42.16693878173828, -40.238773345947266, -38.31060791015625, -36.382442474365234, -34.45427703857422, -32.52611541748047, -30.597949981689453, -28.669784545898438, -26.741619110107422, -24.813453674316406, -22.88528823852539, -20.957124710083008, -19.028959274291992, -17.100793838500977, -15.172629356384277, -13.244464874267578, -11.316303253173828, -9.388137817382812, -7.459973335266113, -5.531808376312256, -3.6036434173583984, -1.6754779815673828, 0.2526865005493164, 2.1808509826660156, 4.109016418457031, 6.037181377410889, 7.965346336364746, 9.893510818481445, 11.821676254272461, 13.749841690063477, 15.678006172180176, 17.606170654296875, 19.53433609008789, 21.462501525878906, 23.390666961669922, 25.318830490112305, 27.24699592590332, 29.175161361694336, 31.10332489013672, 33.031490325927734, 34.95965576171875, 36.887821197509766, 38.81598663330078, 40.7441520690918, 42.67231750488281, 44.60047912597656, 46.52864456176758, 48.456809997558594, 50.38497543334961]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 11.0, 9.0, 14.0, 16.0, 21.0, 20.0, 18.0, 30.0, 26.0, 34.0, 40.0, 42.0, 51.0, 47.0, 38.0, 47.0, 47.0, 48.0, 61.0, 47.0, 25.0, 41.0, 35.0, 31.0, 27.0, 22.0, 21.0, 14.0, 17.0, 22.0, 12.0, 12.0, 8.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.206607818603516, -25.440139770507812, -24.67367172241211, -23.907203674316406, -23.140737533569336, -22.374269485473633, -21.60780143737793, -20.841333389282227, -20.074867248535156, -19.308399200439453, -18.54193115234375, -17.775463104248047, -17.008996963500977, -16.242528915405273, -15.47606086730957, -14.709592819213867, -13.943124771118164, -13.176656723022461, -12.410189628601074, -11.643721580505371, -10.877254486083984, -10.110786437988281, -9.344318389892578, -8.577850341796875, -7.811383247375488, -7.044915676116943, -6.278448104858398, -5.511980056762695, -4.74551248550415, -3.9790449142456055, -3.2125768661499023, -2.4461092948913574, -1.6796398162841797, -0.9131721258163452, -0.14670443534851074, 0.6197633743286133, 1.3862309455871582, 2.152698516845703, 2.9191665649414062, 3.685634136199951, 4.452101707458496, 5.218569278717041, 5.985036849975586, 6.751504898071289, 7.517972469329834, 8.284440040588379, 9.050908088684082, 9.817375183105469, 10.583843231201172, 11.350311279296875, 12.116778373718262, 12.883246421813965, 13.649713516235352, 14.416181564331055, 15.182649612426758, 15.949117660522461, 16.71558380126953, 17.482051849365234, 18.248519897460938, 19.01498794555664, 19.78145408630371, 20.547922134399414, 21.314390182495117, 22.08085823059082, 22.847326278686523]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 10.0, 13.0, 11.0, 23.0, 24.0, 24.0, 22.0, 28.0, 29.0, 33.0, 32.0, 41.0, 41.0, 49.0, 52.0, 51.0, 46.0, 47.0, 38.0, 47.0, 47.0, 36.0, 28.0, 27.0, 32.0, 20.0, 23.0, 18.0, 23.0, 15.0, 8.0, 7.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.48828125, -3.39752197265625, -3.3067626953125, -3.21600341796875, -3.125244140625, -3.03448486328125, -2.9437255859375, -2.85296630859375, -2.76220703125, -2.67144775390625, -2.5806884765625, -2.48992919921875, -2.399169921875, -2.30841064453125, -2.2176513671875, -2.12689208984375, -2.0361328125, -1.94537353515625, -1.8546142578125, -1.76385498046875, -1.673095703125, -1.58233642578125, -1.4915771484375, -1.40081787109375, -1.31005859375, -1.21929931640625, -1.1285400390625, -1.03778076171875, -0.947021484375, -0.85626220703125, -0.7655029296875, -0.67474365234375, -0.583984375, -0.49322509765625, -0.4024658203125, -0.31170654296875, -0.220947265625, -0.13018798828125, -0.0394287109375, 0.05133056640625, 0.14208984375, 0.23284912109375, 0.3236083984375, 0.41436767578125, 0.505126953125, 0.59588623046875, 0.6866455078125, 0.77740478515625, 0.8681640625, 0.95892333984375, 1.0496826171875, 1.14044189453125, 1.231201171875, 1.32196044921875, 1.4127197265625, 1.50347900390625, 1.59423828125, 1.68499755859375, 1.7757568359375, 1.86651611328125, 1.957275390625, 2.04803466796875, 2.1387939453125, 2.22955322265625, 2.3203125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 16.0, 35.0, 48.0, 85.0, 143.0, 185.0, 298.0, 511.0, 780.0, 1269.0, 2028.0, 3165.0, 5121.0, 8338.0, 13489.0, 22218.0, 37510.0, 67126.0, 134326.0, 323971.0, 209656.0, 93429.0, 50254.0, 29272.0, 17349.0, 10639.0, 6545.0, 4044.0, 2484.0, 1471.0, 984.0, 608.0, 420.0, 234.0, 171.0, 99.0, 63.0, 45.0, 34.0, 23.0, 14.0, 8.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.464111328125, -0.4479713439941406, -0.43183135986328125, -0.4156913757324219, -0.3995513916015625, -0.3834114074707031, -0.36727142333984375, -0.3511314392089844, -0.334991455078125, -0.3188514709472656, -0.30271148681640625, -0.2865715026855469, -0.2704315185546875, -0.2542915344238281, -0.23815155029296875, -0.22201156616210938, -0.20587158203125, -0.18973159790039062, -0.17359161376953125, -0.15745162963867188, -0.1413116455078125, -0.12517166137695312, -0.10903167724609375, -0.09289169311523438, -0.076751708984375, -0.060611724853515625, -0.04447174072265625, -0.028331756591796875, -0.0121917724609375, 0.003948211669921875, 0.02008819580078125, 0.036228179931640625, 0.0523681640625, 0.06850814819335938, 0.08464813232421875, 0.10078811645507812, 0.1169281005859375, 0.13306808471679688, 0.14920806884765625, 0.16534805297851562, 0.181488037109375, 0.19762802124023438, 0.21376800537109375, 0.22990798950195312, 0.2460479736328125, 0.2621879577636719, 0.27832794189453125, 0.2944679260253906, 0.31060791015625, 0.3267478942871094, 0.34288787841796875, 0.3590278625488281, 0.3751678466796875, 0.3913078308105469, 0.40744781494140625, 0.4235877990722656, 0.439727783203125, 0.4558677673339844, 0.47200775146484375, 0.4881477355957031, 0.5042877197265625, 0.5204277038574219, 0.5365676879882812, 0.5527076721191406, 0.56884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 7.0, 6.0, 7.0, 8.0, 11.0, 9.0, 14.0, 15.0, 25.0, 18.0, 26.0, 21.0, 26.0, 24.0, 33.0, 39.0, 40.0, 48.0, 30.0, 49.0, 1073.0, 40.0, 30.0, 58.0, 41.0, 33.0, 38.0, 33.0, 34.0, 30.0, 29.0, 20.0, 15.0, 20.0, 12.0, 13.0, 11.0, 5.0, 11.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7998046875, -1.7458953857421875, -1.691986083984375, -1.6380767822265625, -1.58416748046875, -1.5302581787109375, -1.476348876953125, -1.4224395751953125, -1.3685302734375, -1.3146209716796875, -1.260711669921875, -1.2068023681640625, -1.15289306640625, -1.0989837646484375, -1.045074462890625, -0.9911651611328125, -0.937255859375, -0.8833465576171875, -0.829437255859375, -0.7755279541015625, -0.72161865234375, -0.6677093505859375, -0.613800048828125, -0.5598907470703125, -0.5059814453125, -0.4520721435546875, -0.398162841796875, -0.3442535400390625, -0.29034423828125, -0.2364349365234375, -0.182525634765625, -0.1286163330078125, -0.07470703125, -0.0207977294921875, 0.033111572265625, 0.0870208740234375, 0.14093017578125, 0.1948394775390625, 0.248748779296875, 0.3026580810546875, 0.3565673828125, 0.4104766845703125, 0.464385986328125, 0.5182952880859375, 0.57220458984375, 0.6261138916015625, 0.680023193359375, 0.7339324951171875, 0.787841796875, 0.8417510986328125, 0.895660400390625, 0.9495697021484375, 1.00347900390625, 1.0573883056640625, 1.111297607421875, 1.1652069091796875, 1.2191162109375, 1.2730255126953125, 1.326934814453125, 1.3808441162109375, 1.43475341796875, 1.4886627197265625, 1.542572021484375, 1.5964813232421875, 1.650390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 13.0, 10.0, 18.0, 31.0, 44.0, 70.0, 92.0, 160.0, 214.0, 348.0, 488.0, 672.0, 1003.0, 1431.0, 1984.0, 2911.0, 4098.0, 5830.0, 8440.0, 12601.0, 18339.0, 27434.0, 42086.0, 69565.0, 128134.0, 1307992.0, 200803.0, 97701.0, 56548.0, 35408.0, 22665.0, 15471.0, 10498.0, 7310.0, 5170.0, 3462.0, 2530.0, 1663.0, 1157.0, 816.0, 571.0, 402.0, 282.0, 217.0, 128.0, 99.0, 69.0, 45.0, 37.0, 24.0, 21.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.385009765625, -0.37290191650390625, -0.3607940673828125, -0.34868621826171875, -0.336578369140625, -0.32447052001953125, -0.3123626708984375, -0.30025482177734375, -0.28814697265625, -0.27603912353515625, -0.2639312744140625, -0.25182342529296875, -0.239715576171875, -0.22760772705078125, -0.2154998779296875, -0.20339202880859375, -0.1912841796875, -0.17917633056640625, -0.1670684814453125, -0.15496063232421875, -0.142852783203125, -0.13074493408203125, -0.1186370849609375, -0.10652923583984375, -0.09442138671875, -0.08231353759765625, -0.0702056884765625, -0.05809783935546875, -0.045989990234375, -0.03388214111328125, -0.0217742919921875, -0.00966644287109375, 0.00244140625, 0.01454925537109375, 0.0266571044921875, 0.03876495361328125, 0.050872802734375, 0.06298065185546875, 0.0750885009765625, 0.08719635009765625, 0.09930419921875, 0.11141204833984375, 0.1235198974609375, 0.13562774658203125, 0.147735595703125, 0.15984344482421875, 0.1719512939453125, 0.18405914306640625, 0.1961669921875, 0.20827484130859375, 0.2203826904296875, 0.23249053955078125, 0.244598388671875, 0.25670623779296875, 0.2688140869140625, 0.28092193603515625, 0.29302978515625, 0.30513763427734375, 0.3172454833984375, 0.32935333251953125, 0.341461181640625, 0.35356903076171875, 0.3656768798828125, 0.37778472900390625, 0.389892578125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 7.0, 9.0, 9.0, 18.0, 13.0, 20.0, 13.0, 26.0, 24.0, 43.0, 35.0, 47.0, 52.0, 61.0, 65.0, 62.0, 67.0, 59.0, 51.0, 50.0, 45.0, 35.0, 24.0, 36.0, 21.0, 13.0, 18.0, 22.0, 9.0, 5.0, 7.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.00011789798736572266, -0.00011467467993497849, -0.00011145137250423431, -0.00010822806507349014, -0.00010500475764274597, -0.0001017814502120018, -9.855814278125763e-05, -9.533483535051346e-05, -9.211152791976929e-05, -8.888822048902512e-05, -8.566491305828094e-05, -8.244160562753677e-05, -7.92182981967926e-05, -7.599499076604843e-05, -7.277168333530426e-05, -6.954837590456009e-05, -6.632506847381592e-05, -6.310176104307175e-05, -5.9878453612327576e-05, -5.6655146181583405e-05, -5.3431838750839233e-05, -5.020853132009506e-05, -4.698522388935089e-05, -4.376191645860672e-05, -4.053860902786255e-05, -3.731530159711838e-05, -3.4091994166374207e-05, -3.0868686735630035e-05, -2.7645379304885864e-05, -2.4422071874141693e-05, -2.1198764443397522e-05, -1.797545701265335e-05, -1.475214958190918e-05, -1.1528842151165009e-05, -8.305534720420837e-06, -5.082227289676666e-06, -1.8589198589324951e-06, 1.364387571811676e-06, 4.587695002555847e-06, 7.811002433300018e-06, 1.103430986404419e-05, 1.425761729478836e-05, 1.7480924725532532e-05, 2.0704232156276703e-05, 2.3927539587020874e-05, 2.7150847017765045e-05, 3.0374154448509216e-05, 3.359746187925339e-05, 3.682076930999756e-05, 4.004407674074173e-05, 4.32673841714859e-05, 4.649069160223007e-05, 4.971399903297424e-05, 5.2937306463718414e-05, 5.6160613894462585e-05, 5.9383921325206757e-05, 6.260722875595093e-05, 6.58305361866951e-05, 6.905384361743927e-05, 7.227715104818344e-05, 7.550045847892761e-05, 7.872376590967178e-05, 8.194707334041595e-05, 8.517038077116013e-05, 8.83936882019043e-05]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 20.0, 37.0, 34.0, 60.0, 105.0, 113.0, 189.0, 292.0, 561.0, 1497.0, 598272.0, 444482.0, 1393.0, 553.0, 304.0, 168.0, 129.0, 82.0, 55.0, 38.0, 25.0, 25.0, 12.0, 16.0, 5.0, 8.0, 4.0, 2.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019092559814453125, -0.0018410086631774902, -0.001772761344909668, -0.0017045140266418457, -0.0016362667083740234, -0.0015680193901062012, -0.001499772071838379, -0.0014315247535705566, -0.0013632774353027344, -0.0012950301170349121, -0.0012267827987670898, -0.0011585354804992676, -0.0010902881622314453, -0.001022040843963623, -0.0009537935256958008, -0.0008855462074279785, -0.0008172988891601562, -0.000749051570892334, -0.0006808042526245117, -0.0006125569343566895, -0.0005443096160888672, -0.0004760622978210449, -0.00040781497955322266, -0.0003395676612854004, -0.0002713203430175781, -0.00020307302474975586, -0.0001348257064819336, -6.657838821411133e-05, 1.6689300537109375e-06, 6.99162483215332e-05, 0.00013816356658935547, 0.00020641088485717773, 0.000274658203125, 0.00034290552139282227, 0.00041115283966064453, 0.0004794001579284668, 0.0005476474761962891, 0.0006158947944641113, 0.0006841421127319336, 0.0007523894309997559, 0.0008206367492675781, 0.0008888840675354004, 0.0009571313858032227, 0.001025378704071045, 0.0010936260223388672, 0.0011618733406066895, 0.0012301206588745117, 0.001298367977142334, 0.0013666152954101562, 0.0014348626136779785, 0.0015031099319458008, 0.001571357250213623, 0.0016396045684814453, 0.0017078518867492676, 0.0017760992050170898, 0.0018443465232849121, 0.0019125938415527344, 0.0019808411598205566, 0.002049088478088379, 0.002117335796356201, 0.0021855831146240234, 0.0022538304328918457, 0.002322077751159668, 0.0023903250694274902, 0.0024585723876953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 57.0, 291.0, 433.0, 206.0, 21.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021717695926781744, -0.00020923932606820017, -0.0002013016928685829, -0.00019336407422088087, -0.0001854264410212636, -0.00017748880782164633, -0.00016955117462202907, -0.0001616135414224118, -0.00015367590822279453, -0.00014573827502317727, -0.00013780064182356, -0.00012986300862394273, -0.0001219253899762407, -0.00011398775677662343, -0.00010605012357700616, -9.81124903773889e-05, -9.017487172968686e-05, -8.223723853006959e-05, -7.429961260640994e-05, -6.636197940679267e-05, -5.842434984515421e-05, -5.048672028351575e-05, -4.2549087083898485e-05, -3.4611457522260025e-05, -2.6673827960621566e-05, -1.8736198398983106e-05, -1.0798567018355243e-05, -2.86093563772738e-06, 5.07669392391108e-06, 1.301432348554954e-05, 2.0951956685166806e-05, 2.8889586246805266e-05, 3.6827230360358953e-05, 4.476485992199741e-05, 5.270248948363587e-05, 6.064012268325314e-05, 6.857774860691279e-05, 7.651538180653006e-05, 8.445301500614733e-05, 9.239064820576459e-05, 0.00010032827412942424, 0.00010826590732904151, 0.00011620353325270116, 0.00012414116645231843, 0.0001320787996519357, 0.00014001643285155296, 0.00014795406605117023, 0.00015589168469887227, 0.00016382931789848953, 0.0001717669510981068, 0.00017970458429772407, 0.0001876422029454261, 0.00019557983614504337, 0.00020351746934466064, 0.0002114551025442779, 0.00021939273574389517, 0.00022733036894351244, 0.0002352680021431297, 0.00024320563534274697, 0.00025114326854236424, 0.0002590809017419815, 0.0002670185058377683, 0.00027495616814121604, 0.00028289377223700285, 0.0002908314054366201]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 5.0, 10.0, 11.0, 9.0, 14.0, 14.0, 16.0, 16.0, 27.0, 29.0, 24.0, 40.0, 33.0, 39.0, 43.0, 40.0, 40.0, 36.0, 28.0, 41.0, 40.0, 38.0, 34.0, 39.0, 37.0, 36.0, 43.0, 22.0, 21.0, 22.0, 18.0, 20.0, 17.0, 14.0, 18.0, 10.0, 9.0, 8.0, 4.0, 11.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.881620407104492e-05, -4.726182669401169e-05, -4.5707449316978455e-05, -4.415307193994522e-05, -4.259869456291199e-05, -4.1044317185878754e-05, -3.948993980884552e-05, -3.7935562431812286e-05, -3.638118505477905e-05, -3.482680767774582e-05, -3.3272430300712585e-05, -3.171805292367935e-05, -3.0163675546646118e-05, -2.8609298169612885e-05, -2.705492079257965e-05, -2.5500543415546417e-05, -2.3946166038513184e-05, -2.239178866147995e-05, -2.0837411284446716e-05, -1.9283033907413483e-05, -1.772865653038025e-05, -1.6174279153347015e-05, -1.4619901776313782e-05, -1.3065524399280548e-05, -1.1511147022247314e-05, -9.95676964521408e-06, -8.402392268180847e-06, -6.8480148911476135e-06, -5.29363751411438e-06, -3.7392601370811462e-06, -2.1848827600479126e-06, -6.30505383014679e-07, 9.238719940185547e-07, 2.4782493710517883e-06, 4.032626748085022e-06, 5.587004125118256e-06, 7.141381502151489e-06, 8.695758879184723e-06, 1.0250136256217957e-05, 1.180451363325119e-05, 1.3358891010284424e-05, 1.4913268387317657e-05, 1.646764576435089e-05, 1.8022023141384125e-05, 1.957640051841736e-05, 2.1130777895450592e-05, 2.2685155272483826e-05, 2.423953264951706e-05, 2.5793910026550293e-05, 2.7348287403583527e-05, 2.890266478061676e-05, 3.0457042157649994e-05, 3.201141953468323e-05, 3.356579691171646e-05, 3.5120174288749695e-05, 3.667455166578293e-05, 3.822892904281616e-05, 3.9783306419849396e-05, 4.133768379688263e-05, 4.289206117391586e-05, 4.44464385509491e-05, 4.600081592798233e-05, 4.7555193305015564e-05, 4.91095706820488e-05, 5.066394805908203e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 10.0, 12.0, 10.0, 13.0, 11.0, 23.0, 24.0, 24.0, 22.0, 28.0, 29.0, 33.0, 32.0, 41.0, 41.0, 49.0, 52.0, 51.0, 46.0, 47.0, 38.0, 47.0, 47.0, 36.0, 28.0, 27.0, 32.0, 20.0, 23.0, 18.0, 23.0, 15.0, 8.0, 7.0, 14.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.48828125, -3.39752197265625, -3.3067626953125, -3.21600341796875, -3.125244140625, -3.03448486328125, -2.9437255859375, -2.85296630859375, -2.76220703125, -2.67144775390625, -2.5806884765625, -2.48992919921875, -2.399169921875, -2.30841064453125, -2.2176513671875, -2.12689208984375, -2.0361328125, -1.94537353515625, -1.8546142578125, -1.76385498046875, -1.673095703125, -1.58233642578125, -1.4915771484375, -1.40081787109375, -1.31005859375, -1.21929931640625, -1.1285400390625, -1.03778076171875, -0.947021484375, -0.85626220703125, -0.7655029296875, -0.67474365234375, -0.583984375, -0.49322509765625, -0.4024658203125, -0.31170654296875, -0.220947265625, -0.13018798828125, -0.0394287109375, 0.05133056640625, 0.14208984375, 0.23284912109375, 0.3236083984375, 0.41436767578125, 0.505126953125, 0.59588623046875, 0.6866455078125, 0.77740478515625, 0.8681640625, 0.95892333984375, 1.0496826171875, 1.14044189453125, 1.231201171875, 1.32196044921875, 1.4127197265625, 1.50347900390625, 1.59423828125, 1.68499755859375, 1.7757568359375, 1.86651611328125, 1.957275390625, 2.04803466796875, 2.1387939453125, 2.22955322265625, 2.3203125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 5.0, 2.0, 7.0, 9.0, 17.0, 16.0, 32.0, 44.0, 78.0, 118.0, 175.0, 283.0, 464.0, 795.0, 1479.0, 2761.0, 5428.0, 11499.0, 26069.0, 68385.0, 210360.0, 418787.0, 192132.0, 62959.0, 24601.0, 10866.0, 5210.0, 2657.0, 1359.0, 772.0, 486.0, 234.0, 154.0, 99.0, 76.0, 46.0, 25.0, 18.0, 9.0, 11.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.697265625, -3.60113525390625, -3.5050048828125, -3.40887451171875, -3.312744140625, -3.21661376953125, -3.1204833984375, -3.02435302734375, -2.92822265625, -2.83209228515625, -2.7359619140625, -2.63983154296875, -2.543701171875, -2.44757080078125, -2.3514404296875, -2.25531005859375, -2.1591796875, -2.06304931640625, -1.9669189453125, -1.87078857421875, -1.774658203125, -1.67852783203125, -1.5823974609375, -1.48626708984375, -1.39013671875, -1.29400634765625, -1.1978759765625, -1.10174560546875, -1.005615234375, -0.90948486328125, -0.8133544921875, -0.71722412109375, -0.62109375, -0.52496337890625, -0.4288330078125, -0.33270263671875, -0.236572265625, -0.14044189453125, -0.0443115234375, 0.05181884765625, 0.14794921875, 0.24407958984375, 0.3402099609375, 0.43634033203125, 0.532470703125, 0.62860107421875, 0.7247314453125, 0.82086181640625, 0.9169921875, 1.01312255859375, 1.1092529296875, 1.20538330078125, 1.301513671875, 1.39764404296875, 1.4937744140625, 1.58990478515625, 1.68603515625, 1.78216552734375, 1.8782958984375, 1.97442626953125, 2.070556640625, 2.16668701171875, 2.2628173828125, 2.35894775390625, 2.455078125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 5.0, 3.0, 8.0, 6.0, 7.0, 7.0, 16.0, 17.0, 8.0, 23.0, 23.0, 20.0, 25.0, 37.0, 41.0, 43.0, 43.0, 53.0, 96.0, 205.0, 1506.0, 291.0, 115.0, 70.0, 50.0, 47.0, 45.0, 26.0, 31.0, 28.0, 23.0, 17.0, 23.0, 22.0, 19.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-12.53125, -12.198974609375, -11.86669921875, -11.534423828125, -11.2021484375, -10.869873046875, -10.53759765625, -10.205322265625, -9.873046875, -9.540771484375, -9.20849609375, -8.876220703125, -8.5439453125, -8.211669921875, -7.87939453125, -7.547119140625, -7.21484375, -6.882568359375, -6.55029296875, -6.218017578125, -5.8857421875, -5.553466796875, -5.22119140625, -4.888916015625, -4.556640625, -4.224365234375, -3.89208984375, -3.559814453125, -3.2275390625, -2.895263671875, -2.56298828125, -2.230712890625, -1.8984375, -1.566162109375, -1.23388671875, -0.901611328125, -0.5693359375, -0.237060546875, 0.09521484375, 0.427490234375, 0.759765625, 1.092041015625, 1.42431640625, 1.756591796875, 2.0888671875, 2.421142578125, 2.75341796875, 3.085693359375, 3.41796875, 3.750244140625, 4.08251953125, 4.414794921875, 4.7470703125, 5.079345703125, 5.41162109375, 5.743896484375, 6.076171875, 6.408447265625, 6.74072265625, 7.072998046875, 7.4052734375, 7.737548828125, 8.06982421875, 8.402099609375, 8.734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 4.0, 9.0, 6.0, 28.0, 20.0, 41.0, 40.0, 59.0, 85.0, 104.0, 173.0, 301.0, 630.0, 3625.0, 2420970.0, 715503.0, 2713.0, 543.0, 281.0, 184.0, 97.0, 67.0, 48.0, 42.0, 36.0, 26.0, 11.0, 8.0, 11.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -32.0859375, -31.140625, -30.1953125, -29.25, -28.3046875, -27.359375, -26.4140625, -25.46875, -24.5234375, -23.578125, -22.6328125, -21.6875, -20.7421875, -19.796875, -18.8515625, -17.90625, -16.9609375, -16.015625, -15.0703125, -14.125, -13.1796875, -12.234375, -11.2890625, -10.34375, -9.3984375, -8.453125, -7.5078125, -6.5625, -5.6171875, -4.671875, -3.7265625, -2.78125, -1.8359375, -0.890625, 0.0546875, 1.0, 1.9453125, 2.890625, 3.8359375, 4.78125, 5.7265625, 6.671875, 7.6171875, 8.5625, 9.5078125, 10.453125, 11.3984375, 12.34375, 13.2890625, 14.234375, 15.1796875, 16.125, 17.0703125, 18.015625, 18.9609375, 19.90625, 20.8515625, 21.796875, 22.7421875, 23.6875, 24.6328125, 25.578125, 26.5234375, 27.46875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 178.0, 732.0, 100.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.644240379333496, -12.759722709655762, -9.875204086303711, -6.990686416625977, -4.106168746948242, -1.2216510772705078, 1.662867546081543, 4.547385215759277, 7.431902885437012, 10.316420555114746, 13.200939178466797, 16.08545684814453, 18.969974517822266, 21.8544921875, 24.739009857177734, 27.62352752685547, 30.508045196533203, 33.39256286621094, 36.27708053588867, 39.161598205566406, 42.04611587524414, 44.930633544921875, 47.815155029296875, 50.699668884277344, 53.584190368652344, 56.46870803833008, 59.35322570800781, 62.23774337768555, 65.12226104736328, 68.00678253173828, 70.89129638671875, 73.77581787109375, 76.66033172607422, 79.54485321044922, 82.42936706542969, 85.31388854980469, 88.19840240478516, 91.08292388916016, 93.96743774414062, 96.85195922851562, 99.7364730834961, 102.6209945678711, 105.50550842285156, 108.39002990722656, 111.27454376220703, 114.15906524658203, 117.0435791015625, 119.9281005859375, 122.8126220703125, 125.6971435546875, 128.5816650390625, 131.46617126464844, 134.35069274902344, 137.23521423339844, 140.11973571777344, 143.00424194335938, 145.88876342773438, 148.77328491210938, 151.65780639648438, 154.5423126220703, 157.4268341064453, 160.3113555908203, 163.1958770751953, 166.08038330078125, 168.96490478515625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 9.0, 10.0, 6.0, 9.0, 13.0, 10.0, 24.0, 24.0, 27.0, 22.0, 36.0, 29.0, 34.0, 38.0, 40.0, 37.0, 38.0, 39.0, 41.0, 44.0, 42.0, 50.0, 38.0, 45.0, 37.0, 27.0, 32.0, 34.0, 19.0, 14.0, 26.0, 25.0, 15.0, 12.0, 16.0, 9.0, 7.0, 4.0, 4.0, 6.0, 5.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.087427139282227, -26.29973602294922, -25.51204490661621, -24.724353790283203, -23.936662673950195, -23.148971557617188, -22.36128044128418, -21.573589324951172, -20.785898208618164, -19.998207092285156, -19.21051597595215, -18.42282485961914, -17.635133743286133, -16.847442626953125, -16.059751510620117, -15.27206039428711, -14.484368324279785, -13.696677207946777, -12.90898609161377, -12.121294975280762, -11.333603858947754, -10.545912742614746, -9.758220672607422, -8.970529556274414, -8.182838439941406, -7.395147323608398, -6.607456207275391, -5.819765090942383, -5.032073974609375, -4.244382858276367, -3.456691265106201, -2.6690001487731934, -1.8813095092773438, -1.093618392944336, -0.3059271574020386, 0.4817640781402588, 1.2694551944732666, 2.0571463108062744, 2.8448376655578613, 3.632528781890869, 4.420219898223877, 5.207911014556885, 5.995602130889893, 6.783293724060059, 7.570984840393066, 8.358675956726074, 9.146367073059082, 9.93405818939209, 10.721749305725098, 11.509440422058105, 12.297131538391113, 13.084822654724121, 13.872513771057129, 14.660204887390137, 15.447896957397461, 16.23558807373047, 17.023279190063477, 17.810970306396484, 18.598661422729492, 19.3863525390625, 20.174043655395508, 20.961734771728516, 21.749425888061523, 22.53711700439453, 23.32480812072754]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 2.0, 9.0, 9.0, 13.0, 10.0, 18.0, 18.0, 20.0, 26.0, 29.0, 32.0, 37.0, 33.0, 38.0, 37.0, 52.0, 49.0, 39.0, 50.0, 48.0, 49.0, 43.0, 47.0, 30.0, 36.0, 28.0, 31.0, 22.0, 26.0, 22.0, 20.0, 14.0, 14.0, 11.0, 8.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.72265625, -3.62689208984375, -3.5311279296875, -3.43536376953125, -3.339599609375, -3.24383544921875, -3.1480712890625, -3.05230712890625, -2.95654296875, -2.86077880859375, -2.7650146484375, -2.66925048828125, -2.573486328125, -2.47772216796875, -2.3819580078125, -2.28619384765625, -2.1904296875, -2.09466552734375, -1.9989013671875, -1.90313720703125, -1.807373046875, -1.71160888671875, -1.6158447265625, -1.52008056640625, -1.42431640625, -1.32855224609375, -1.2327880859375, -1.13702392578125, -1.041259765625, -0.94549560546875, -0.8497314453125, -0.75396728515625, -0.658203125, -0.56243896484375, -0.4666748046875, -0.37091064453125, -0.275146484375, -0.17938232421875, -0.0836181640625, 0.01214599609375, 0.10791015625, 0.20367431640625, 0.2994384765625, 0.39520263671875, 0.490966796875, 0.58673095703125, 0.6824951171875, 0.77825927734375, 0.8740234375, 0.96978759765625, 1.0655517578125, 1.16131591796875, 1.257080078125, 1.35284423828125, 1.4486083984375, 1.54437255859375, 1.64013671875, 1.73590087890625, 1.8316650390625, 1.92742919921875, 2.023193359375, 2.11895751953125, 2.2147216796875, 2.31048583984375, 2.40625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 4.0, 7.0, 11.0, 10.0, 10.0, 24.0, 19.0, 21.0, 34.0, 43.0, 49.0, 48.0, 65.0, 78.0, 132.0, 214.0, 558.0, 3366.0, 114100.0, 3649984.0, 417365.0, 6543.0, 741.0, 221.0, 151.0, 85.0, 71.0, 60.0, 41.0, 42.0, 25.0, 32.0, 28.0, 28.0, 12.0, 17.0, 4.0, 11.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-16.578125, -16.14892578125, -15.7197265625, -15.29052734375, -14.861328125, -14.43212890625, -14.0029296875, -13.57373046875, -13.14453125, -12.71533203125, -12.2861328125, -11.85693359375, -11.427734375, -10.99853515625, -10.5693359375, -10.14013671875, -9.7109375, -9.28173828125, -8.8525390625, -8.42333984375, -7.994140625, -7.56494140625, -7.1357421875, -6.70654296875, -6.27734375, -5.84814453125, -5.4189453125, -4.98974609375, -4.560546875, -4.13134765625, -3.7021484375, -3.27294921875, -2.84375, -2.41455078125, -1.9853515625, -1.55615234375, -1.126953125, -0.69775390625, -0.2685546875, 0.16064453125, 0.58984375, 1.01904296875, 1.4482421875, 1.87744140625, 2.306640625, 2.73583984375, 3.1650390625, 3.59423828125, 4.0234375, 4.45263671875, 4.8818359375, 5.31103515625, 5.740234375, 6.16943359375, 6.5986328125, 7.02783203125, 7.45703125, 7.88623046875, 8.3154296875, 8.74462890625, 9.173828125, 9.60302734375, 10.0322265625, 10.46142578125, 10.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 21.0, 23.0, 50.0, 84.0, 111.0, 198.0, 324.0, 463.0, 681.0, 668.0, 518.0, 347.0, 208.0, 134.0, 90.0, 63.0, 22.0, 30.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.3507080078125, -10.037353515625, -9.7239990234375, -9.41064453125, -9.0972900390625, -8.783935546875, -8.4705810546875, -8.1572265625, -7.8438720703125, -7.530517578125, -7.2171630859375, -6.90380859375, -6.5904541015625, -6.277099609375, -5.9637451171875, -5.650390625, -5.3370361328125, -5.023681640625, -4.7103271484375, -4.39697265625, -4.0836181640625, -3.770263671875, -3.4569091796875, -3.1435546875, -2.8302001953125, -2.516845703125, -2.2034912109375, -1.89013671875, -1.5767822265625, -1.263427734375, -0.9500732421875, -0.63671875, -0.3233642578125, -0.010009765625, 0.3033447265625, 0.61669921875, 0.9300537109375, 1.243408203125, 1.5567626953125, 1.8701171875, 2.1834716796875, 2.496826171875, 2.8101806640625, 3.12353515625, 3.4368896484375, 3.750244140625, 4.0635986328125, 4.376953125, 4.6903076171875, 5.003662109375, 5.3170166015625, 5.63037109375, 5.9437255859375, 6.257080078125, 6.5704345703125, 6.8837890625, 7.1971435546875, 7.510498046875, 7.8238525390625, 8.13720703125, 8.4505615234375, 8.763916015625, 9.0772705078125, 9.390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 15.0, 14.0, 33.0, 54.0, 83.0, 149.0, 210.0, 329.0, 901.0, 6439.0, 2433339.0, 1746017.0, 4995.0, 822.0, 324.0, 222.0, 131.0, 75.0, 42.0, 36.0, 15.0, 12.0, 8.0, 4.0, 1.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.28369140625, -23.3486328125, -22.41357421875, -21.478515625, -20.54345703125, -19.6083984375, -18.67333984375, -17.73828125, -16.80322265625, -15.8681640625, -14.93310546875, -13.998046875, -13.06298828125, -12.1279296875, -11.19287109375, -10.2578125, -9.32275390625, -8.3876953125, -7.45263671875, -6.517578125, -5.58251953125, -4.6474609375, -3.71240234375, -2.77734375, -1.84228515625, -0.9072265625, 0.02783203125, 0.962890625, 1.89794921875, 2.8330078125, 3.76806640625, 4.703125, 5.63818359375, 6.5732421875, 7.50830078125, 8.443359375, 9.37841796875, 10.3134765625, 11.24853515625, 12.18359375, 13.11865234375, 14.0537109375, 14.98876953125, 15.923828125, 16.85888671875, 17.7939453125, 18.72900390625, 19.6640625, 20.59912109375, 21.5341796875, 22.46923828125, 23.404296875, 24.33935546875, 25.2744140625, 26.20947265625, 27.14453125, 28.07958984375, 29.0146484375, 29.94970703125, 30.884765625, 31.81982421875, 32.7548828125, 33.68994140625, 34.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 19.0, 81.0, 217.0, 317.0, 255.0, 92.0, 25.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.065269470214844, -15.283468246459961, -12.501667976379395, -9.719867706298828, -6.938066482543945, -4.1562652587890625, -1.3744659423828125, 1.4073352813720703, 4.189136505126953, 6.970937252044678, 9.752737998962402, 12.534538269042969, 15.316339492797852, 18.098140716552734, 20.879940032958984, 23.661741256713867, 26.44354248046875, 29.225343704223633, 32.007144927978516, 34.788944244384766, 37.57074737548828, 40.35254669189453, 43.13434600830078, 45.91614532470703, 48.69794845581055, 51.4797477722168, 54.26155090332031, 57.04335021972656, 59.82514953613281, 62.60695266723633, 65.38874816894531, 68.1705551147461, 70.95234680175781, 73.73414611816406, 76.51594543457031, 79.29774475097656, 82.07955169677734, 84.8613510131836, 87.64315032958984, 90.4249496459961, 93.20675659179688, 95.98855590820312, 98.77035522460938, 101.55215454101562, 104.3339614868164, 107.11576080322266, 109.8975601196289, 112.67935943603516, 115.4611587524414, 118.24295806884766, 121.0247573852539, 123.80656433105469, 126.58836364746094, 129.3701629638672, 132.15196228027344, 134.9337615966797, 137.71556091308594, 140.4973602294922, 143.27915954589844, 146.0609588623047, 148.84275817871094, 151.62457275390625, 154.4063720703125, 157.18817138671875, 159.969970703125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 2.0, 7.0, 10.0, 10.0, 7.0, 12.0, 20.0, 16.0, 15.0, 18.0, 18.0, 15.0, 27.0, 25.0, 37.0, 22.0, 31.0, 38.0, 30.0, 36.0, 40.0, 26.0, 43.0, 50.0, 47.0, 31.0, 43.0, 33.0, 33.0, 29.0, 21.0, 34.0, 18.0, 19.0, 16.0, 16.0, 19.0, 11.0, 12.0, 8.0, 8.0, 10.0, 10.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.316221237182617, -17.724740982055664, -17.13326072692871, -16.541780471801758, -15.950300216674805, -15.358819961547852, -14.767340660095215, -14.175860404968262, -13.584380149841309, -12.992899894714355, -12.401419639587402, -11.80993938446045, -11.218460083007812, -10.62697982788086, -10.035499572753906, -9.444019317626953, -8.8525390625, -8.261058807373047, -7.669578552246094, -7.078098773956299, -6.486618518829346, -5.895138263702393, -5.303658485412598, -4.7121782302856445, -4.120697975158691, -3.5292177200317383, -2.9377377033233643, -2.3462576866149902, -1.754777431488037, -1.163297176361084, -0.57181715965271, 0.019662857055664062, 0.61114501953125, 1.2026251554489136, 1.7941052913665771, 2.385585308074951, 2.9770655632019043, 3.5685458183288574, 4.160025596618652, 4.7515058517456055, 5.342986106872559, 5.934466361999512, 6.525946617126465, 7.11742639541626, 7.708906650543213, 8.300386428833008, 8.891866683959961, 9.483346939086914, 10.074827194213867, 10.66630744934082, 11.257787704467773, 11.849267959594727, 12.44074821472168, 13.032228469848633, 13.62370777130127, 14.215188026428223, 14.806668281555176, 15.398148536682129, 15.989628791809082, 16.58110809326172, 17.172588348388672, 17.764068603515625, 18.355548858642578, 18.94702911376953, 19.538509368896484]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 5.0, 15.0, 10.0, 14.0, 10.0, 14.0, 19.0, 22.0, 22.0, 28.0, 33.0, 48.0, 43.0, 47.0, 46.0, 34.0, 47.0, 47.0, 50.0, 45.0, 53.0, 45.0, 33.0, 31.0, 26.0, 30.0, 25.0, 34.0, 18.0, 17.0, 22.0, 21.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.9296875, -3.831787109375, -3.73388671875, -3.635986328125, -3.5380859375, -3.440185546875, -3.34228515625, -3.244384765625, -3.146484375, -3.048583984375, -2.95068359375, -2.852783203125, -2.7548828125, -2.656982421875, -2.55908203125, -2.461181640625, -2.36328125, -2.265380859375, -2.16748046875, -2.069580078125, -1.9716796875, -1.873779296875, -1.77587890625, -1.677978515625, -1.580078125, -1.482177734375, -1.38427734375, -1.286376953125, -1.1884765625, -1.090576171875, -0.99267578125, -0.894775390625, -0.796875, -0.698974609375, -0.60107421875, -0.503173828125, -0.4052734375, -0.307373046875, -0.20947265625, -0.111572265625, -0.013671875, 0.084228515625, 0.18212890625, 0.280029296875, 0.3779296875, 0.475830078125, 0.57373046875, 0.671630859375, 0.76953125, 0.867431640625, 0.96533203125, 1.063232421875, 1.1611328125, 1.259033203125, 1.35693359375, 1.454833984375, 1.552734375, 1.650634765625, 1.74853515625, 1.846435546875, 1.9443359375, 2.042236328125, 2.14013671875, 2.238037109375, 2.3359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 17.0, 22.0, 33.0, 40.0, 66.0, 113.0, 196.0, 349.0, 598.0, 1173.0, 2159.0, 3912.0, 7220.0, 13312.0, 25795.0, 52789.0, 120005.0, 330069.0, 286200.0, 106489.0, 47495.0, 23536.0, 12517.0, 6712.0, 3496.0, 1859.0, 1000.0, 587.0, 316.0, 184.0, 114.0, 61.0, 36.0, 30.0, 10.0, 14.0, 11.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75927734375, -0.7369003295898438, -0.7145233154296875, -0.6921463012695312, -0.669769287109375, -0.6473922729492188, -0.6250152587890625, -0.6026382446289062, -0.58026123046875, -0.5578842163085938, -0.5355072021484375, -0.5131301879882812, -0.490753173828125, -0.46837615966796875, -0.4459991455078125, -0.42362213134765625, -0.4012451171875, -0.37886810302734375, -0.3564910888671875, -0.33411407470703125, -0.311737060546875, -0.28936004638671875, -0.2669830322265625, -0.24460601806640625, -0.22222900390625, -0.19985198974609375, -0.1774749755859375, -0.15509796142578125, -0.132720947265625, -0.11034393310546875, -0.0879669189453125, -0.06558990478515625, -0.043212890625, -0.02083587646484375, 0.0015411376953125, 0.02391815185546875, 0.046295166015625, 0.06867218017578125, 0.0910491943359375, 0.11342620849609375, 0.13580322265625, 0.15818023681640625, 0.1805572509765625, 0.20293426513671875, 0.225311279296875, 0.24768829345703125, 0.2700653076171875, 0.29244232177734375, 0.3148193359375, 0.33719635009765625, 0.3595733642578125, 0.38195037841796875, 0.404327392578125, 0.42670440673828125, 0.4490814208984375, 0.47145843505859375, 0.49383544921875, 0.5162124633789062, 0.5385894775390625, 0.5609664916992188, 0.583343505859375, 0.6057205200195312, 0.6280975341796875, 0.6504745483398438, 0.6728515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 6.0, 10.0, 14.0, 11.0, 12.0, 14.0, 15.0, 30.0, 30.0, 27.0, 31.0, 34.0, 31.0, 40.0, 35.0, 31.0, 40.0, 41.0, 44.0, 1060.0, 38.0, 34.0, 29.0, 45.0, 49.0, 34.0, 13.0, 31.0, 22.0, 16.0, 29.0, 17.0, 23.0, 14.0, 10.0, 9.0, 7.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8388671875, -1.7852935791015625, -1.731719970703125, -1.6781463623046875, -1.62457275390625, -1.5709991455078125, -1.517425537109375, -1.4638519287109375, -1.4102783203125, -1.3567047119140625, -1.303131103515625, -1.2495574951171875, -1.19598388671875, -1.1424102783203125, -1.088836669921875, -1.0352630615234375, -0.981689453125, -0.9281158447265625, -0.874542236328125, -0.8209686279296875, -0.76739501953125, -0.7138214111328125, -0.660247802734375, -0.6066741943359375, -0.5531005859375, -0.4995269775390625, -0.445953369140625, -0.3923797607421875, -0.33880615234375, -0.2852325439453125, -0.231658935546875, -0.1780853271484375, -0.12451171875, -0.0709381103515625, -0.017364501953125, 0.0362091064453125, 0.08978271484375, 0.1433563232421875, 0.196929931640625, 0.2505035400390625, 0.3040771484375, 0.3576507568359375, 0.411224365234375, 0.4647979736328125, 0.51837158203125, 0.5719451904296875, 0.625518798828125, 0.6790924072265625, 0.732666015625, 0.7862396240234375, 0.839813232421875, 0.8933868408203125, 0.94696044921875, 1.0005340576171875, 1.054107666015625, 1.1076812744140625, 1.1612548828125, 1.2148284912109375, 1.268402099609375, 1.3219757080078125, 1.37554931640625, 1.4291229248046875, 1.482696533203125, 1.5362701416015625, 1.58984375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 8.0, 13.0, 21.0, 27.0, 51.0, 87.0, 126.0, 160.0, 243.0, 343.0, 512.0, 741.0, 1018.0, 1533.0, 2162.0, 3028.0, 4493.0, 6457.0, 9237.0, 13545.0, 19938.0, 29827.0, 46058.0, 73770.0, 132589.0, 1305608.0, 181939.0, 94788.0, 56250.0, 35796.0, 24133.0, 16305.0, 11381.0, 7612.0, 5325.0, 3647.0, 2476.0, 1807.0, 1238.0, 819.0, 614.0, 415.0, 308.0, 195.0, 141.0, 100.0, 67.0, 55.0, 43.0, 37.0, 18.0, 12.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3773651123046875, -0.365081787109375, -0.3527984619140625, -0.34051513671875, -0.3282318115234375, -0.315948486328125, -0.3036651611328125, -0.2913818359375, -0.2790985107421875, -0.266815185546875, -0.2545318603515625, -0.24224853515625, -0.2299652099609375, -0.217681884765625, -0.2053985595703125, -0.193115234375, -0.1808319091796875, -0.168548583984375, -0.1562652587890625, -0.14398193359375, -0.1316986083984375, -0.119415283203125, -0.1071319580078125, -0.0948486328125, -0.0825653076171875, -0.070281982421875, -0.0579986572265625, -0.04571533203125, -0.0334320068359375, -0.021148681640625, -0.0088653564453125, 0.00341796875, 0.0157012939453125, 0.027984619140625, 0.0402679443359375, 0.05255126953125, 0.0648345947265625, 0.077117919921875, 0.0894012451171875, 0.1016845703125, 0.1139678955078125, 0.126251220703125, 0.1385345458984375, 0.15081787109375, 0.1631011962890625, 0.175384521484375, 0.1876678466796875, 0.199951171875, 0.2122344970703125, 0.224517822265625, 0.2368011474609375, 0.24908447265625, 0.2613677978515625, 0.273651123046875, 0.2859344482421875, 0.2982177734375, 0.3105010986328125, 0.322784423828125, 0.3350677490234375, 0.34735107421875, 0.3596343994140625, 0.371917724609375, 0.3842010498046875, 0.396484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 11.0, 7.0, 12.0, 9.0, 13.0, 7.0, 24.0, 36.0, 41.0, 53.0, 77.0, 66.0, 84.0, 96.0, 79.0, 73.0, 71.0, 49.0, 44.0, 36.0, 23.0, 14.0, 13.0, 11.0, 8.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010526180267333984, -0.00010079145431518555, -9.632110595703125e-05, -9.185075759887695e-05, -8.738040924072266e-05, -8.291006088256836e-05, -7.843971252441406e-05, -7.396936416625977e-05, -6.949901580810547e-05, -6.502866744995117e-05, -6.0558319091796875e-05, -5.608797073364258e-05, -5.161762237548828e-05, -4.7147274017333984e-05, -4.267692565917969e-05, -3.820657730102539e-05, -3.3736228942871094e-05, -2.9265880584716797e-05, -2.47955322265625e-05, -2.0325183868408203e-05, -1.5854835510253906e-05, -1.138448715209961e-05, -6.9141387939453125e-06, -2.4437904357910156e-06, 2.0265579223632812e-06, 6.496906280517578e-06, 1.0967254638671875e-05, 1.5437602996826172e-05, 1.990795135498047e-05, 2.4378299713134766e-05, 2.8848648071289062e-05, 3.331899642944336e-05, 3.7789344787597656e-05, 4.225969314575195e-05, 4.673004150390625e-05, 5.120038986206055e-05, 5.5670738220214844e-05, 6.014108657836914e-05, 6.461143493652344e-05, 6.908178329467773e-05, 7.355213165283203e-05, 7.802248001098633e-05, 8.249282836914062e-05, 8.696317672729492e-05, 9.143352508544922e-05, 9.590387344360352e-05, 0.00010037422180175781, 0.00010484457015991211, 0.0001093149185180664, 0.0001137852668762207, 0.000118255615234375, 0.0001227259635925293, 0.0001271963119506836, 0.0001316666603088379, 0.0001361370086669922, 0.00014060735702514648, 0.00014507770538330078, 0.00014954805374145508, 0.00015401840209960938, 0.00015848875045776367, 0.00016295909881591797, 0.00016742944717407227, 0.00017189979553222656, 0.00017637014389038086, 0.00018084049224853516]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 4.0, 6.0, 6.0, 3.0, 11.0, 8.0, 10.0, 24.0, 30.0, 34.0, 48.0, 65.0, 103.0, 176.0, 338.0, 573.0, 2753.0, 996935.0, 45371.0, 971.0, 397.0, 234.0, 144.0, 99.0, 55.0, 36.0, 27.0, 17.0, 12.0, 13.0, 7.0, 14.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.003032684326171875, -0.0029523074626922607, -0.0028719305992126465, -0.0027915537357330322, -0.002711176872253418, -0.0026308000087738037, -0.0025504231452941895, -0.002470046281814575, -0.002389669418334961, -0.0023092925548553467, -0.0022289156913757324, -0.002148538827896118, -0.002068161964416504, -0.0019877851009368896, -0.0019074082374572754, -0.0018270313739776611, -0.0017466545104980469, -0.0016662776470184326, -0.0015859007835388184, -0.001505523920059204, -0.0014251470565795898, -0.0013447701930999756, -0.0012643933296203613, -0.001184016466140747, -0.0011036396026611328, -0.0010232627391815186, -0.0009428858757019043, -0.00086250901222229, -0.0007821321487426758, -0.0007017552852630615, -0.0006213784217834473, -0.000541001558303833, -0.00046062469482421875, -0.0003802478313446045, -0.00029987096786499023, -0.00021949410438537598, -0.00013911724090576172, -5.874037742614746e-05, 2.1636486053466797e-05, 0.00010201334953308105, 0.0001823902130126953, 0.00026276707649230957, 0.00034314393997192383, 0.0004235208034515381, 0.0005038976669311523, 0.0005842745304107666, 0.0006646513938903809, 0.0007450282573699951, 0.0008254051208496094, 0.0009057819843292236, 0.0009861588478088379, 0.0010665357112884521, 0.0011469125747680664, 0.0012272894382476807, 0.001307666301727295, 0.0013880431652069092, 0.0014684200286865234, 0.0015487968921661377, 0.001629173755645752, 0.0017095506191253662, 0.0017899274826049805, 0.0018703043460845947, 0.001950681209564209, 0.0020310580730438232, 0.0021114349365234375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 48.0, 143.0, 282.0, 263.0, 176.0, 68.0, 12.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.282000246457756e-05, -8.704788342583925e-05, -8.127576438710093e-05, -7.550364534836262e-05, -6.973153358558193e-05, -6.395941454684362e-05, -5.818729550810531e-05, -5.2415180107345805e-05, -4.6643061068607494e-05, -4.0870942029869184e-05, -3.509882662910968e-05, -2.932670759037137e-05, -2.3554590370622464e-05, -1.7782473150873557e-05, -1.2010354112135246e-05, -6.238238711375743e-06, -4.661196726374328e-07, 5.305998001858825e-06, 1.1078115676355083e-05, 1.685023380559869e-05, 2.2622351025347598e-05, 2.8394468245096505e-05, 3.4166587283834815e-05, 3.993870268459432e-05, 4.571082172333263e-05, 5.148294076207094e-05, 5.725505616283044e-05, 6.302717520156875e-05, 6.879929424030706e-05, 7.457140600308776e-05, 8.034352504182607e-05, 8.611564408056438e-05, 9.188776311930269e-05, 9.7659882158041e-05, 0.00010343200119677931, 0.00010920412023551762, 0.00011497623199829832, 0.00012074835103703663, 0.00012652046279981732, 0.00013229258183855563, 0.00013806470087729394, 0.00014383681991603225, 0.00014960893895477057, 0.00015538105799350888, 0.00016115317703224719, 0.00016692528151907027, 0.0001726974151097238, 0.0001784695195965469, 0.00018424165318720043, 0.00019001377222593874, 0.00019578589126467705, 0.00020155801030341536, 0.00020733012934215367, 0.00021310223382897675, 0.0002188743674196303, 0.00022464647190645337, 0.00023041859094519168, 0.00023619070998393, 0.0002419628290226683, 0.0002477349480614066, 0.0002535070525482297, 0.00025927918613888323, 0.0002650512906257063, 0.00027082342421635985, 0.00027659552870318294]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 10.0, 13.0, 11.0, 16.0, 16.0, 15.0, 15.0, 26.0, 24.0, 32.0, 27.0, 33.0, 38.0, 35.0, 37.0, 42.0, 53.0, 42.0, 38.0, 44.0, 34.0, 43.0, 34.0, 41.0, 35.0, 34.0, 38.0, 25.0, 28.0, 18.0, 19.0, 13.0, 9.0, 11.0, 9.0, 8.0, 6.0, 6.0, 7.0, 0.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.252527236938477e-05, -6.053224205970764e-05, -5.853921175003052e-05, -5.6546181440353394e-05, -5.455315113067627e-05, -5.2560120820999146e-05, -5.056709051132202e-05, -4.85740602016449e-05, -4.6581029891967773e-05, -4.458799958229065e-05, -4.2594969272613525e-05, -4.06019389629364e-05, -3.860890865325928e-05, -3.661587834358215e-05, -3.462284803390503e-05, -3.2629817724227905e-05, -3.063678741455078e-05, -2.8643757104873657e-05, -2.6650726795196533e-05, -2.465769648551941e-05, -2.2664666175842285e-05, -2.067163586616516e-05, -1.8678605556488037e-05, -1.6685575246810913e-05, -1.4692544937133789e-05, -1.2699514627456665e-05, -1.0706484317779541e-05, -8.713454008102417e-06, -6.720423698425293e-06, -4.727393388748169e-06, -2.734363079071045e-06, -7.413327693939209e-07, 1.2516975402832031e-06, 3.244727849960327e-06, 5.237758159637451e-06, 7.230788469314575e-06, 9.2238187789917e-06, 1.1216849088668823e-05, 1.3209879398345947e-05, 1.5202909708023071e-05, 1.7195940017700195e-05, 1.918897032737732e-05, 2.1182000637054443e-05, 2.3175030946731567e-05, 2.516806125640869e-05, 2.7161091566085815e-05, 2.915412187576294e-05, 3.1147152185440063e-05, 3.314018249511719e-05, 3.513321280479431e-05, 3.7126243114471436e-05, 3.911927342414856e-05, 4.1112303733825684e-05, 4.310533404350281e-05, 4.509836435317993e-05, 4.7091394662857056e-05, 4.908442497253418e-05, 5.1077455282211304e-05, 5.307048559188843e-05, 5.506351590156555e-05, 5.7056546211242676e-05, 5.90495765209198e-05, 6.104260683059692e-05, 6.303563714027405e-05, 6.502866744995117e-05]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 5.0, 15.0, 10.0, 14.0, 10.0, 14.0, 19.0, 22.0, 22.0, 28.0, 33.0, 48.0, 43.0, 47.0, 46.0, 34.0, 47.0, 47.0, 50.0, 45.0, 53.0, 45.0, 33.0, 31.0, 26.0, 30.0, 25.0, 34.0, 18.0, 17.0, 22.0, 21.0, 12.0, 6.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.9296875, -3.831787109375, -3.73388671875, -3.635986328125, -3.5380859375, -3.440185546875, -3.34228515625, -3.244384765625, -3.146484375, -3.048583984375, -2.95068359375, -2.852783203125, -2.7548828125, -2.656982421875, -2.55908203125, -2.461181640625, -2.36328125, -2.265380859375, -2.16748046875, -2.069580078125, -1.9716796875, -1.873779296875, -1.77587890625, -1.677978515625, -1.580078125, -1.482177734375, -1.38427734375, -1.286376953125, -1.1884765625, -1.090576171875, -0.99267578125, -0.894775390625, -0.796875, -0.698974609375, -0.60107421875, -0.503173828125, -0.4052734375, -0.307373046875, -0.20947265625, -0.111572265625, -0.013671875, 0.084228515625, 0.18212890625, 0.280029296875, 0.3779296875, 0.475830078125, 0.57373046875, 0.671630859375, 0.76953125, 0.867431640625, 0.96533203125, 1.063232421875, 1.1611328125, 1.259033203125, 1.35693359375, 1.454833984375, 1.552734375, 1.650634765625, 1.74853515625, 1.846435546875, 1.9443359375, 2.042236328125, 2.14013671875, 2.238037109375, 2.3359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 12.0, 15.0, 19.0, 19.0, 36.0, 57.0, 77.0, 157.0, 247.0, 469.0, 861.0, 1831.0, 3604.0, 7369.0, 14911.0, 31104.0, 67229.0, 163699.0, 383447.0, 215767.0, 83685.0, 37819.0, 18380.0, 8952.0, 4323.0, 2157.0, 1074.0, 504.0, 279.0, 168.0, 86.0, 55.0, 39.0, 33.0, 24.0, 11.0, 6.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.150482177734375, -2.06658935546875, -1.982696533203125, -1.8988037109375, -1.814910888671875, -1.73101806640625, -1.647125244140625, -1.563232421875, -1.479339599609375, -1.39544677734375, -1.311553955078125, -1.2276611328125, -1.143768310546875, -1.05987548828125, -0.975982666015625, -0.89208984375, -0.808197021484375, -0.72430419921875, -0.640411376953125, -0.5565185546875, -0.472625732421875, -0.38873291015625, -0.304840087890625, -0.220947265625, -0.137054443359375, -0.05316162109375, 0.030731201171875, 0.1146240234375, 0.198516845703125, 0.28240966796875, 0.366302490234375, 0.4501953125, 0.534088134765625, 0.61798095703125, 0.701873779296875, 0.7857666015625, 0.869659423828125, 0.95355224609375, 1.037445068359375, 1.121337890625, 1.205230712890625, 1.28912353515625, 1.373016357421875, 1.4569091796875, 1.540802001953125, 1.62469482421875, 1.708587646484375, 1.79248046875, 1.876373291015625, 1.96026611328125, 2.044158935546875, 2.1280517578125, 2.211944580078125, 2.29583740234375, 2.379730224609375, 2.463623046875, 2.547515869140625, 2.63140869140625, 2.715301513671875, 2.7991943359375, 2.883087158203125, 2.96697998046875, 3.050872802734375, 3.134765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 5.0, 12.0, 4.0, 7.0, 19.0, 17.0, 28.0, 31.0, 45.0, 39.0, 52.0, 52.0, 56.0, 74.0, 184.0, 1578.0, 280.0, 105.0, 56.0, 52.0, 47.0, 45.0, 29.0, 48.0, 30.0, 22.0, 19.0, 16.0, 21.0, 11.0, 6.0, 16.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.9296875, -12.5455322265625, -12.161376953125, -11.7772216796875, -11.39306640625, -11.0089111328125, -10.624755859375, -10.2406005859375, -9.8564453125, -9.4722900390625, -9.088134765625, -8.7039794921875, -8.31982421875, -7.9356689453125, -7.551513671875, -7.1673583984375, -6.783203125, -6.3990478515625, -6.014892578125, -5.6307373046875, -5.24658203125, -4.8624267578125, -4.478271484375, -4.0941162109375, -3.7099609375, -3.3258056640625, -2.941650390625, -2.5574951171875, -2.17333984375, -1.7891845703125, -1.405029296875, -1.0208740234375, -0.63671875, -0.2525634765625, 0.131591796875, 0.5157470703125, 0.89990234375, 1.2840576171875, 1.668212890625, 2.0523681640625, 2.4365234375, 2.8206787109375, 3.204833984375, 3.5889892578125, 3.97314453125, 4.3572998046875, 4.741455078125, 5.1256103515625, 5.509765625, 5.8939208984375, 6.278076171875, 6.6622314453125, 7.04638671875, 7.4305419921875, 7.814697265625, 8.1988525390625, 8.5830078125, 8.9671630859375, 9.351318359375, 9.7354736328125, 10.11962890625, 10.5037841796875, 10.887939453125, 11.2720947265625, 11.65625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 14.0, 18.0, 27.0, 52.0, 64.0, 93.0, 156.0, 327.0, 758.0, 19809.0, 3120747.0, 2531.0, 491.0, 230.0, 117.0, 71.0, 55.0, 37.0, 28.0, 17.0, 12.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.03125, -61.34228515625, -59.6533203125, -57.96435546875, -56.275390625, -54.58642578125, -52.8974609375, -51.20849609375, -49.51953125, -47.83056640625, -46.1416015625, -44.45263671875, -42.763671875, -41.07470703125, -39.3857421875, -37.69677734375, -36.0078125, -34.31884765625, -32.6298828125, -30.94091796875, -29.251953125, -27.56298828125, -25.8740234375, -24.18505859375, -22.49609375, -20.80712890625, -19.1181640625, -17.42919921875, -15.740234375, -14.05126953125, -12.3623046875, -10.67333984375, -8.984375, -7.29541015625, -5.6064453125, -3.91748046875, -2.228515625, -0.53955078125, 1.1494140625, 2.83837890625, 4.52734375, 6.21630859375, 7.9052734375, 9.59423828125, 11.283203125, 12.97216796875, 14.6611328125, 16.35009765625, 18.0390625, 19.72802734375, 21.4169921875, 23.10595703125, 24.794921875, 26.48388671875, 28.1728515625, 29.86181640625, 31.55078125, 33.23974609375, 34.9287109375, 36.61767578125, 38.306640625, 39.99560546875, 41.6845703125, 43.37353515625, 45.0625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [725.0, 293.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.27552604675293, 0.7519025802612305, 10.77933120727539, 20.806760787963867, 30.83418846130371, 40.86161804199219, 50.88904571533203, 60.916473388671875, 70.94390106201172, 80.97132873535156, 90.9987564086914, 101.02618408203125, 111.05361938476562, 121.08103942871094, 131.1084747314453, 141.13589477539062, 151.163330078125, 161.19076538085938, 171.2181854248047, 181.24562072753906, 191.27304077148438, 201.30047607421875, 211.32791137695312, 221.35533142089844, 231.3827667236328, 241.4102020263672, 251.4376220703125, 261.4650573730469, 271.49249267578125, 281.5198974609375, 291.5473327636719, 301.57476806640625, 311.6022033691406, 321.629638671875, 331.6570739746094, 341.6844787597656, 351.7119140625, 361.7393493652344, 371.76678466796875, 381.794189453125, 391.8216247558594, 401.84906005859375, 411.8764953613281, 421.9039001464844, 431.93133544921875, 441.9587707519531, 451.9862060546875, 462.01361083984375, 472.04107666015625, 482.0685119628906, 492.095947265625, 502.12335205078125, 512.1508178710938, 522.17822265625, 532.2056274414062, 542.2330932617188, 552.260498046875, 562.2879028320312, 572.3153686523438, 582.3427734375, 592.3702392578125, 602.3976440429688, 612.425048828125, 622.4525146484375, 632.4799194335938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 6.0, 15.0, 9.0, 16.0, 15.0, 23.0, 23.0, 32.0, 26.0, 33.0, 37.0, 39.0, 42.0, 49.0, 42.0, 33.0, 30.0, 53.0, 32.0, 39.0, 39.0, 39.0, 43.0, 27.0, 30.0, 23.0, 33.0, 26.0, 17.0, 14.0, 16.0, 12.0, 9.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-38.100563049316406, -37.094482421875, -36.088401794433594, -35.08232116699219, -34.07624053955078, -33.070159912109375, -32.06407928466797, -31.05799674987793, -30.05191421508789, -29.045833587646484, -28.039752960205078, -27.033672332763672, -26.027589797973633, -25.021509170532227, -24.01542854309082, -23.009347915649414, -22.003267288208008, -20.9971866607666, -19.991106033325195, -18.985023498535156, -17.97894287109375, -16.972862243652344, -15.966781616210938, -14.960700988769531, -13.954619407653809, -12.948538780212402, -11.94245719909668, -10.936376571655273, -9.930295944213867, -8.924214363098145, -7.918133735656738, -6.912052631378174, -5.905971527099609, -4.899890422821045, -3.8938095569610596, -2.887728691101074, -1.8816475868225098, -0.8755664825439453, 0.13051414489746094, 1.1365952491760254, 2.14267635345459, 3.1487574577331543, 4.154838562011719, 5.160919189453125, 6.1670002937316895, 7.173081398010254, 8.17916202545166, 9.185243606567383, 10.191324234008789, 11.197404861450195, 12.203486442565918, 13.209567070007324, 14.215648651123047, 15.221729278564453, 16.22780990600586, 17.233890533447266, 18.239971160888672, 19.246051788330078, 20.252132415771484, 21.25821304321289, 22.26429557800293, 23.270376205444336, 24.276456832885742, 25.28253746032715, 26.288619995117188]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 3.0, 18.0, 10.0, 13.0, 11.0, 14.0, 19.0, 23.0, 24.0, 28.0, 35.0, 43.0, 48.0, 50.0, 46.0, 46.0, 36.0, 47.0, 41.0, 44.0, 44.0, 41.0, 37.0, 39.0, 29.0, 27.0, 25.0, 29.0, 26.0, 23.0, 16.0, 15.0, 13.0, 12.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0, -3.892120361328125, -3.78424072265625, -3.676361083984375, -3.5684814453125, -3.460601806640625, -3.35272216796875, -3.244842529296875, -3.136962890625, -3.029083251953125, -2.92120361328125, -2.813323974609375, -2.7054443359375, -2.597564697265625, -2.48968505859375, -2.381805419921875, -2.27392578125, -2.166046142578125, -2.05816650390625, -1.950286865234375, -1.8424072265625, -1.734527587890625, -1.62664794921875, -1.518768310546875, -1.410888671875, -1.303009033203125, -1.19512939453125, -1.087249755859375, -0.9793701171875, -0.871490478515625, -0.76361083984375, -0.655731201171875, -0.5478515625, -0.439971923828125, -0.33209228515625, -0.224212646484375, -0.1163330078125, -0.008453369140625, 0.09942626953125, 0.207305908203125, 0.315185546875, 0.423065185546875, 0.53094482421875, 0.638824462890625, 0.7467041015625, 0.854583740234375, 0.96246337890625, 1.070343017578125, 1.17822265625, 1.286102294921875, 1.39398193359375, 1.501861572265625, 1.6097412109375, 1.717620849609375, 1.82550048828125, 1.933380126953125, 2.041259765625, 2.149139404296875, 2.25701904296875, 2.364898681640625, 2.4727783203125, 2.580657958984375, 2.68853759765625, 2.796417236328125, 2.904296875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 10.0, 12.0, 9.0, 9.0, 15.0, 12.0, 18.0, 28.0, 26.0, 48.0, 56.0, 93.0, 164.0, 271.0, 424.0, 868.0, 2014.0, 6708.0, 29587.0, 165876.0, 919522.0, 1908192.0, 932550.0, 185288.0, 31737.0, 6888.0, 1962.0, 771.0, 402.0, 242.0, 128.0, 98.0, 61.0, 33.0, 31.0, 28.0, 19.0, 16.0, 13.0, 18.0, 4.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0], "bins": [-5.8203125, -5.6651611328125, -5.510009765625, -5.3548583984375, -5.19970703125, -5.0445556640625, -4.889404296875, -4.7342529296875, -4.5791015625, -4.4239501953125, -4.268798828125, -4.1136474609375, -3.95849609375, -3.8033447265625, -3.648193359375, -3.4930419921875, -3.337890625, -3.1827392578125, -3.027587890625, -2.8724365234375, -2.71728515625, -2.5621337890625, -2.406982421875, -2.2518310546875, -2.0966796875, -1.9415283203125, -1.786376953125, -1.6312255859375, -1.47607421875, -1.3209228515625, -1.165771484375, -1.0106201171875, -0.85546875, -0.7003173828125, -0.545166015625, -0.3900146484375, -0.23486328125, -0.0797119140625, 0.075439453125, 0.2305908203125, 0.3857421875, 0.5408935546875, 0.696044921875, 0.8511962890625, 1.00634765625, 1.1614990234375, 1.316650390625, 1.4718017578125, 1.626953125, 1.7821044921875, 1.937255859375, 2.0924072265625, 2.24755859375, 2.4027099609375, 2.557861328125, 2.7130126953125, 2.8681640625, 3.0233154296875, 3.178466796875, 3.3336181640625, 3.48876953125, 3.6439208984375, 3.799072265625, 3.9542236328125, 4.109375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 9.0, 19.0, 40.0, 56.0, 91.0, 124.0, 218.0, 313.0, 504.0, 637.0, 647.0, 485.0, 337.0, 228.0, 127.0, 97.0, 64.0, 34.0, 24.0, 10.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.002197265625, -7.66845703125, -7.334716796875, -7.0009765625, -6.667236328125, -6.33349609375, -5.999755859375, -5.666015625, -5.332275390625, -4.99853515625, -4.664794921875, -4.3310546875, -3.997314453125, -3.66357421875, -3.329833984375, -2.99609375, -2.662353515625, -2.32861328125, -1.994873046875, -1.6611328125, -1.327392578125, -0.99365234375, -0.659912109375, -0.326171875, 0.007568359375, 0.34130859375, 0.675048828125, 1.0087890625, 1.342529296875, 1.67626953125, 2.010009765625, 2.34375, 2.677490234375, 3.01123046875, 3.344970703125, 3.6787109375, 4.012451171875, 4.34619140625, 4.679931640625, 5.013671875, 5.347412109375, 5.68115234375, 6.014892578125, 6.3486328125, 6.682373046875, 7.01611328125, 7.349853515625, 7.68359375, 8.017333984375, 8.35107421875, 8.684814453125, 9.0185546875, 9.352294921875, 9.68603515625, 10.019775390625, 10.353515625, 10.687255859375, 11.02099609375, 11.354736328125, 11.6884765625, 12.022216796875, 12.35595703125, 12.689697265625, 13.0234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 10.0, 13.0, 28.0, 25.0, 45.0, 50.0, 70.0, 115.0, 166.0, 245.0, 350.0, 689.0, 2849.0, 89844.0, 3610989.0, 478946.0, 7464.0, 1033.0, 481.0, 287.0, 165.0, 123.0, 88.0, 59.0, 49.0, 28.0, 21.0, 9.0, 9.0, 7.0, 8.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-25.046875, -24.4156494140625, -23.784423828125, -23.1531982421875, -22.52197265625, -21.8907470703125, -21.259521484375, -20.6282958984375, -19.9970703125, -19.3658447265625, -18.734619140625, -18.1033935546875, -17.47216796875, -16.8409423828125, -16.209716796875, -15.5784912109375, -14.947265625, -14.3160400390625, -13.684814453125, -13.0535888671875, -12.42236328125, -11.7911376953125, -11.159912109375, -10.5286865234375, -9.8974609375, -9.2662353515625, -8.635009765625, -8.0037841796875, -7.37255859375, -6.7413330078125, -6.110107421875, -5.4788818359375, -4.84765625, -4.2164306640625, -3.585205078125, -2.9539794921875, -2.32275390625, -1.6915283203125, -1.060302734375, -0.4290771484375, 0.2021484375, 0.8333740234375, 1.464599609375, 2.0958251953125, 2.72705078125, 3.3582763671875, 3.989501953125, 4.6207275390625, 5.251953125, 5.8831787109375, 6.514404296875, 7.1456298828125, 7.77685546875, 8.4080810546875, 9.039306640625, 9.6705322265625, 10.3017578125, 10.9329833984375, 11.564208984375, 12.1954345703125, 12.82666015625, 13.4578857421875, 14.089111328125, 14.7203369140625, 15.3515625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 66.0, 197.0, 318.0, 278.0, 108.0, 33.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.41168975830078, -69.58451080322266, -66.75733184814453, -63.93014907836914, -61.102970123291016, -58.275787353515625, -55.4486083984375, -52.621429443359375, -49.79425048828125, -46.967071533203125, -44.139888763427734, -41.31270980834961, -38.485530853271484, -35.658348083496094, -32.83116912841797, -30.003990173339844, -27.176807403564453, -24.349626541137695, -21.52244758605957, -18.695266723632812, -15.868086814880371, -13.04090690612793, -10.213726043701172, -7.386547088623047, -4.559366226196289, -1.7321860790252686, 1.094994068145752, 3.9221744537353516, 6.749354362487793, 9.576534271240234, 12.403715133666992, 15.230894088745117, 18.058074951171875, 20.885255813598633, 23.712434768676758, 26.539615631103516, 29.36679458618164, 32.19397735595703, 35.021156311035156, 37.84833526611328, 40.675514221191406, 43.50269317626953, 46.32987594604492, 49.15705490112305, 51.98423385620117, 54.81141662597656, 57.63859558105469, 60.46577453613281, 63.2929573059082, 66.1201400756836, 68.94731903076172, 71.77449798583984, 74.60167694091797, 77.4288558959961, 80.25604248046875, 83.08322143554688, 85.910400390625, 88.73757934570312, 91.56475830078125, 94.39193725585938, 97.21912384033203, 100.04630279541016, 102.87348175048828, 105.7006607055664, 108.52783966064453]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 4.0, 8.0, 17.0, 21.0, 11.0, 18.0, 19.0, 30.0, 26.0, 23.0, 21.0, 34.0, 27.0, 32.0, 36.0, 42.0, 31.0, 34.0, 36.0, 39.0, 38.0, 50.0, 48.0, 30.0, 24.0, 24.0, 33.0, 16.0, 26.0, 21.0, 28.0, 26.0, 16.0, 10.0, 14.0, 12.0, 5.0, 9.0, 13.0, 7.0, 1.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0], "bins": [-22.092737197875977, -21.41645622253418, -20.74017333984375, -20.063892364501953, -19.387609481811523, -18.711328506469727, -18.035045623779297, -17.3587646484375, -16.682483673095703, -16.006202697753906, -15.329919815063477, -14.65363883972168, -13.97735595703125, -13.301074981689453, -12.62479305267334, -11.948511123657227, -11.272228240966797, -10.595946311950684, -9.91966438293457, -9.243383407592773, -8.567100524902344, -7.890819072723389, -7.214537620544434, -6.53825569152832, -5.861973762512207, -5.185691833496094, -4.5094099044799805, -3.8331284523010254, -3.156846523284912, -2.480564594268799, -1.8042831420898438, -1.1280012130737305, -0.4517173767089844, 0.22456443309783936, 0.9008462429046631, 1.5771279335021973, 2.2534098625183105, 2.929691791534424, 3.605973243713379, 4.282255172729492, 4.9585371017456055, 5.634819030761719, 6.311100959777832, 6.987382411956787, 7.6636643409729, 8.339946746826172, 9.016227722167969, 9.692509651184082, 10.368791580200195, 11.045073509216309, 11.721355438232422, 12.397636413574219, 13.073919296264648, 13.750200271606445, 14.426482200622559, 15.102764129638672, 15.779046058654785, 16.4553279876709, 17.131608963012695, 17.807891845703125, 18.484172821044922, 19.16045570373535, 19.83673667907715, 20.513019561767578, 21.189300537109375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 14.0, 21.0, 15.0, 27.0, 24.0, 34.0, 22.0, 33.0, 39.0, 45.0, 39.0, 47.0, 50.0, 48.0, 50.0, 41.0, 31.0, 61.0, 37.0, 36.0, 35.0, 28.0, 24.0, 35.0, 26.0, 20.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.00390625, -3.896942138671875, -3.78997802734375, -3.683013916015625, -3.5760498046875, -3.469085693359375, -3.36212158203125, -3.255157470703125, -3.148193359375, -3.041229248046875, -2.93426513671875, -2.827301025390625, -2.7203369140625, -2.613372802734375, -2.50640869140625, -2.399444580078125, -2.29248046875, -2.185516357421875, -2.07855224609375, -1.971588134765625, -1.8646240234375, -1.757659912109375, -1.65069580078125, -1.543731689453125, -1.436767578125, -1.329803466796875, -1.22283935546875, -1.115875244140625, -1.0089111328125, -0.901947021484375, -0.79498291015625, -0.688018798828125, -0.5810546875, -0.474090576171875, -0.36712646484375, -0.260162353515625, -0.1531982421875, -0.046234130859375, 0.06072998046875, 0.167694091796875, 0.274658203125, 0.381622314453125, 0.48858642578125, 0.595550537109375, 0.7025146484375, 0.809478759765625, 0.91644287109375, 1.023406982421875, 1.13037109375, 1.237335205078125, 1.34429931640625, 1.451263427734375, 1.5582275390625, 1.665191650390625, 1.77215576171875, 1.879119873046875, 1.986083984375, 2.093048095703125, 2.20001220703125, 2.306976318359375, 2.4139404296875, 2.520904541015625, 2.62786865234375, 2.734832763671875, 2.841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 23.0, 32.0, 30.0, 42.0, 91.0, 123.0, 165.0, 240.0, 348.0, 542.0, 793.0, 1244.0, 1866.0, 2963.0, 4587.0, 7052.0, 10931.0, 17860.0, 28486.0, 47724.0, 86013.0, 174728.0, 314658.0, 153931.0, 77851.0, 44371.0, 26491.0, 16290.0, 10296.0, 6503.0, 4280.0, 2723.0, 1759.0, 1137.0, 810.0, 538.0, 332.0, 238.0, 154.0, 95.0, 64.0, 49.0, 31.0, 21.0, 8.0, 5.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5859375, -0.5684051513671875, -0.550872802734375, -0.5333404541015625, -0.51580810546875, -0.4982757568359375, -0.480743408203125, -0.4632110595703125, -0.4456787109375, -0.4281463623046875, -0.410614013671875, -0.3930816650390625, -0.37554931640625, -0.3580169677734375, -0.340484619140625, -0.3229522705078125, -0.305419921875, -0.2878875732421875, -0.270355224609375, -0.2528228759765625, -0.23529052734375, -0.2177581787109375, -0.200225830078125, -0.1826934814453125, -0.1651611328125, -0.1476287841796875, -0.130096435546875, -0.1125640869140625, -0.09503173828125, -0.0774993896484375, -0.059967041015625, -0.0424346923828125, -0.02490234375, -0.0073699951171875, 0.010162353515625, 0.0276947021484375, 0.04522705078125, 0.0627593994140625, 0.080291748046875, 0.0978240966796875, 0.1153564453125, 0.1328887939453125, 0.150421142578125, 0.1679534912109375, 0.18548583984375, 0.2030181884765625, 0.220550537109375, 0.2380828857421875, 0.255615234375, 0.2731475830078125, 0.290679931640625, 0.3082122802734375, 0.32574462890625, 0.3432769775390625, 0.360809326171875, 0.3783416748046875, 0.3958740234375, 0.4134063720703125, 0.430938720703125, 0.4484710693359375, 0.46600341796875, 0.4835357666015625, 0.501068115234375, 0.5186004638671875, 0.5361328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 12.0, 6.0, 9.0, 10.0, 9.0, 13.0, 9.0, 14.0, 26.0, 26.0, 15.0, 29.0, 25.0, 36.0, 24.0, 37.0, 42.0, 42.0, 40.0, 1057.0, 46.0, 42.0, 40.0, 34.0, 34.0, 41.0, 46.0, 38.0, 21.0, 34.0, 25.0, 22.0, 26.0, 14.0, 12.0, 12.0, 10.0, 6.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0078125, -1.946502685546875, -1.88519287109375, -1.823883056640625, -1.7625732421875, -1.701263427734375, -1.63995361328125, -1.578643798828125, -1.517333984375, -1.456024169921875, -1.39471435546875, -1.333404541015625, -1.2720947265625, -1.210784912109375, -1.14947509765625, -1.088165283203125, -1.02685546875, -0.965545654296875, -0.90423583984375, -0.842926025390625, -0.7816162109375, -0.720306396484375, -0.65899658203125, -0.597686767578125, -0.536376953125, -0.475067138671875, -0.41375732421875, -0.352447509765625, -0.2911376953125, -0.229827880859375, -0.16851806640625, -0.107208251953125, -0.0458984375, 0.015411376953125, 0.07672119140625, 0.138031005859375, 0.1993408203125, 0.260650634765625, 0.32196044921875, 0.383270263671875, 0.444580078125, 0.505889892578125, 0.56719970703125, 0.628509521484375, 0.6898193359375, 0.751129150390625, 0.81243896484375, 0.873748779296875, 0.93505859375, 0.996368408203125, 1.05767822265625, 1.118988037109375, 1.1802978515625, 1.241607666015625, 1.30291748046875, 1.364227294921875, 1.425537109375, 1.486846923828125, 1.54815673828125, 1.609466552734375, 1.6707763671875, 1.732086181640625, 1.79339599609375, 1.854705810546875, 1.916015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 7.0, 14.0, 12.0, 20.0, 23.0, 43.0, 60.0, 91.0, 136.0, 186.0, 264.0, 366.0, 512.0, 684.0, 991.0, 1339.0, 1912.0, 2622.0, 3713.0, 5144.0, 7206.0, 10272.0, 14764.0, 21578.0, 31931.0, 48479.0, 78792.0, 141772.0, 1304729.0, 165472.0, 88323.0, 53985.0, 34884.0, 23131.0, 15901.0, 10951.0, 7489.0, 5463.0, 3944.0, 2739.0, 1970.0, 1441.0, 1039.0, 788.0, 541.0, 418.0, 283.0, 204.0, 152.0, 98.0, 83.0, 51.0, 54.0, 31.0, 23.0, 7.0, 7.0, 9.0, 2.0, 0.0, 1.0], "bins": [-0.42041015625, -0.40711212158203125, -0.3938140869140625, -0.38051605224609375, -0.367218017578125, -0.35391998291015625, -0.3406219482421875, -0.32732391357421875, -0.31402587890625, -0.30072784423828125, -0.2874298095703125, -0.27413177490234375, -0.260833740234375, -0.24753570556640625, -0.2342376708984375, -0.22093963623046875, -0.2076416015625, -0.19434356689453125, -0.1810455322265625, -0.16774749755859375, -0.154449462890625, -0.14115142822265625, -0.1278533935546875, -0.11455535888671875, -0.10125732421875, -0.08795928955078125, -0.0746612548828125, -0.06136322021484375, -0.048065185546875, -0.03476715087890625, -0.0214691162109375, -0.00817108154296875, 0.005126953125, 0.01842498779296875, 0.0317230224609375, 0.04502105712890625, 0.058319091796875, 0.07161712646484375, 0.0849151611328125, 0.09821319580078125, 0.11151123046875, 0.12480926513671875, 0.1381072998046875, 0.15140533447265625, 0.164703369140625, 0.17800140380859375, 0.1912994384765625, 0.20459747314453125, 0.2178955078125, 0.23119354248046875, 0.2444915771484375, 0.25778961181640625, 0.271087646484375, 0.28438568115234375, 0.2976837158203125, 0.31098175048828125, 0.32427978515625, 0.33757781982421875, 0.3508758544921875, 0.36417388916015625, 0.377471923828125, 0.39076995849609375, 0.4040679931640625, 0.41736602783203125, 0.4306640625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 8.0, 3.0, 9.0, 4.0, 10.0, 11.0, 10.0, 20.0, 14.0, 23.0, 29.0, 37.0, 44.0, 45.0, 40.0, 53.0, 59.0, 54.0, 66.0, 59.0, 60.0, 48.0, 49.0, 40.0, 30.0, 31.0, 15.0, 19.0, 18.0, 27.0, 5.0, 11.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620189666748047e-05, -9.30512323975563e-05, -8.990056812763214e-05, -8.674990385770798e-05, -8.359923958778381e-05, -8.044857531785965e-05, -7.729791104793549e-05, -7.414724677801132e-05, -7.099658250808716e-05, -6.7845918238163e-05, -6.469525396823883e-05, -6.154458969831467e-05, -5.83939254283905e-05, -5.524326115846634e-05, -5.2092596888542175e-05, -4.894193261861801e-05, -4.579126834869385e-05, -4.2640604078769684e-05, -3.948993980884552e-05, -3.6339275538921356e-05, -3.318861126899719e-05, -3.003794699907303e-05, -2.6887282729148865e-05, -2.37366184592247e-05, -2.0585954189300537e-05, -1.7435289919376373e-05, -1.428462564945221e-05, -1.1133961379528046e-05, -7.983297109603882e-06, -4.832632839679718e-06, -1.6819685697555542e-06, 1.4686957001686096e-06, 4.6193599700927734e-06, 7.770024240016937e-06, 1.0920688509941101e-05, 1.4071352779865265e-05, 1.722201704978943e-05, 2.0372681319713593e-05, 2.3523345589637756e-05, 2.667400985956192e-05, 2.9824674129486084e-05, 3.297533839941025e-05, 3.612600266933441e-05, 3.9276666939258575e-05, 4.242733120918274e-05, 4.55779954791069e-05, 4.872865974903107e-05, 5.187932401895523e-05, 5.5029988288879395e-05, 5.818065255880356e-05, 6.133131682872772e-05, 6.448198109865189e-05, 6.763264536857605e-05, 7.078330963850021e-05, 7.393397390842438e-05, 7.708463817834854e-05, 8.02353024482727e-05, 8.338596671819687e-05, 8.653663098812103e-05, 8.96872952580452e-05, 9.283795952796936e-05, 9.598862379789352e-05, 9.913928806781769e-05, 0.00010228995233774185, 0.00010544061660766602]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 11.0, 3.0, 10.0, 16.0, 19.0, 14.0, 25.0, 49.0, 41.0, 64.0, 107.0, 148.0, 267.0, 469.0, 1124.0, 61887.0, 977988.0, 4480.0, 708.0, 382.0, 230.0, 134.0, 106.0, 56.0, 43.0, 33.0, 29.0, 19.0, 10.0, 17.0, 14.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002185821533203125, -0.0021201670169830322, -0.0020545125007629395, -0.0019888579845428467, -0.001923203468322754, -0.0018575489521026611, -0.0017918944358825684, -0.0017262399196624756, -0.0016605854034423828, -0.00159493088722229, -0.0015292763710021973, -0.0014636218547821045, -0.0013979673385620117, -0.001332312822341919, -0.0012666583061218262, -0.0012010037899017334, -0.0011353492736816406, -0.0010696947574615479, -0.001004040241241455, -0.0009383857250213623, -0.0008727312088012695, -0.0008070766925811768, -0.000741422176361084, -0.0006757676601409912, -0.0006101131439208984, -0.0005444586277008057, -0.0004788041114807129, -0.0004131495952606201, -0.00034749507904052734, -0.00028184056282043457, -0.0002161860466003418, -0.00015053153038024902, -8.487701416015625e-05, -1.9222497940063477e-05, 4.64320182800293e-05, 0.00011208653450012207, 0.00017774105072021484, 0.00024339556694030762, 0.0003090500831604004, 0.00037470459938049316, 0.00044035911560058594, 0.0005060136318206787, 0.0005716681480407715, 0.0006373226642608643, 0.000702977180480957, 0.0007686316967010498, 0.0008342862129211426, 0.0008999407291412354, 0.0009655952453613281, 0.001031249761581421, 0.0010969042778015137, 0.0011625587940216064, 0.0012282133102416992, 0.001293867826461792, 0.0013595223426818848, 0.0014251768589019775, 0.0014908313751220703, 0.001556485891342163, 0.0016221404075622559, 0.0016877949237823486, 0.0017534494400024414, 0.0018191039562225342, 0.001884758472442627, 0.0019504129886627197, 0.0020160675048828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 39.0, 96.0, 225.0, 269.0, 214.0, 111.0, 30.0, 10.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001448805705877021, -0.00013960935757495463, -0.00013433814456220716, -0.0001290669315494597, -0.00012379571853671223, -0.00011852450552396476, -0.00011325328523525968, -0.00010798207222251222, -0.00010271085920976475, -9.743964619701728e-05, -9.216843318426982e-05, -8.689721289556473e-05, -8.162599988281727e-05, -7.63547868700698e-05, -7.108357385732234e-05, -6.581236084457487e-05, -6.05411478318274e-05, -5.5269934819079936e-05, -4.999872180633247e-05, -4.4727505155606195e-05, -3.945629214285873e-05, -3.418507913011126e-05, -2.891386247938499e-05, -2.3642649466637522e-05, -1.8371436453890055e-05, -1.3100222531647887e-05, -7.829008609405719e-06, -2.5577937776688486e-06, 2.713419235078618e-06, 7.984632247826084e-06, 1.3255848898552358e-05, 1.8527061911299825e-05, 2.379828947596252e-05, 2.9069502488709986e-05, 3.434071550145745e-05, 3.9611932152183726e-05, 4.488314516493119e-05, 5.015435817767866e-05, 5.542557482840493e-05, 6.06967878411524e-05, 6.596800085389987e-05, 7.123921386664733e-05, 7.65104268793948e-05, 8.178164716809988e-05, 8.705286018084735e-05, 9.232407319359481e-05, 9.759528620634228e-05, 0.00010286649921908975, 0.00010813771223183721, 0.00011340892524458468, 0.00011868013825733215, 0.0001239513512700796, 0.00012922256428282708, 0.00013449377729557455, 0.00013976500486023724, 0.00014503620332106948, 0.00015030743088573217, 0.00015557864389847964, 0.0001608498569112271, 0.00016612106992397457, 0.00017139228293672204, 0.0001766634959494695, 0.00018193470896221697, 0.00018720593652687967, 0.0001924771349877119]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 30.0, 23.0, 26.0, 22.0, 28.0, 33.0, 38.0, 46.0, 39.0, 45.0, 48.0, 59.0, 40.0, 53.0, 44.0, 42.0, 50.0, 34.0, 29.0, 25.0, 30.0, 27.0, 20.0, 16.0, 14.0, 13.0, 8.0, 12.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9664249420166016e-05, -5.783233791589737e-05, -5.600042641162872e-05, -5.416851490736008e-05, -5.233660340309143e-05, -5.0504691898822784e-05, -4.867278039455414e-05, -4.684086889028549e-05, -4.5008957386016846e-05, -4.31770458817482e-05, -4.134513437747955e-05, -3.951322287321091e-05, -3.768131136894226e-05, -3.5849399864673615e-05, -3.401748836040497e-05, -3.218557685613632e-05, -3.0353665351867676e-05, -2.852175384759903e-05, -2.6689842343330383e-05, -2.4857930839061737e-05, -2.302601933479309e-05, -2.1194107830524445e-05, -1.93621963262558e-05, -1.7530284821987152e-05, -1.5698373317718506e-05, -1.386646181344986e-05, -1.2034550309181213e-05, -1.0202638804912567e-05, -8.370727300643921e-06, -6.538815796375275e-06, -4.706904292106628e-06, -2.874992787837982e-06, -1.043081283569336e-06, 7.888302206993103e-07, 2.6207417249679565e-06, 4.452653229236603e-06, 6.284564733505249e-06, 8.116476237773895e-06, 9.948387742042542e-06, 1.1780299246311188e-05, 1.3612210750579834e-05, 1.544412225484848e-05, 1.7276033759117126e-05, 1.9107945263385773e-05, 2.093985676765442e-05, 2.2771768271923065e-05, 2.460367977619171e-05, 2.6435591280460358e-05, 2.8267502784729004e-05, 3.009941428899765e-05, 3.1931325793266296e-05, 3.376323729753494e-05, 3.559514880180359e-05, 3.7427060306072235e-05, 3.925897181034088e-05, 4.109088331460953e-05, 4.2922794818878174e-05, 4.475470632314682e-05, 4.6586617827415466e-05, 4.841852933168411e-05, 5.025044083595276e-05, 5.2082352340221405e-05, 5.391426384449005e-05, 5.57461753487587e-05, 5.7578086853027344e-05]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 14.0, 21.0, 15.0, 27.0, 24.0, 34.0, 22.0, 32.0, 40.0, 45.0, 39.0, 47.0, 50.0, 48.0, 50.0, 41.0, 31.0, 61.0, 37.0, 36.0, 35.0, 28.0, 24.0, 35.0, 26.0, 20.0, 12.0, 15.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.00390625, -3.896942138671875, -3.78997802734375, -3.683013916015625, -3.5760498046875, -3.469085693359375, -3.36212158203125, -3.255157470703125, -3.148193359375, -3.041229248046875, -2.93426513671875, -2.827301025390625, -2.7203369140625, -2.613372802734375, -2.50640869140625, -2.399444580078125, -2.29248046875, -2.185516357421875, -2.07855224609375, -1.971588134765625, -1.8646240234375, -1.757659912109375, -1.65069580078125, -1.543731689453125, -1.436767578125, -1.329803466796875, -1.22283935546875, -1.115875244140625, -1.0089111328125, -0.901947021484375, -0.79498291015625, -0.688018798828125, -0.5810546875, -0.474090576171875, -0.36712646484375, -0.260162353515625, -0.1531982421875, -0.046234130859375, 0.06072998046875, 0.167694091796875, 0.274658203125, 0.381622314453125, 0.48858642578125, 0.595550537109375, 0.7025146484375, 0.809478759765625, 0.91644287109375, 1.023406982421875, 1.13037109375, 1.237335205078125, 1.34429931640625, 1.451263427734375, 1.5582275390625, 1.665191650390625, 1.77215576171875, 1.879119873046875, 1.986083984375, 2.093048095703125, 2.20001220703125, 2.306976318359375, 2.4139404296875, 2.520904541015625, 2.62786865234375, 2.734832763671875, 2.841796875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 6.0, 16.0, 18.0, 30.0, 45.0, 66.0, 89.0, 114.0, 157.0, 235.0, 346.0, 605.0, 949.0, 1706.0, 3073.0, 5700.0, 11007.0, 20918.0, 40590.0, 76829.0, 147774.0, 255466.0, 225896.0, 122654.0, 63646.0, 33139.0, 17450.0, 8958.0, 4799.0, 2557.0, 1406.0, 809.0, 511.0, 315.0, 214.0, 142.0, 104.0, 58.0, 50.0, 41.0, 13.0, 14.0, 16.0, 4.0, 9.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.520477294921875, -2.44134521484375, -2.362213134765625, -2.2830810546875, -2.203948974609375, -2.12481689453125, -2.045684814453125, -1.966552734375, -1.887420654296875, -1.80828857421875, -1.729156494140625, -1.6500244140625, -1.570892333984375, -1.49176025390625, -1.412628173828125, -1.33349609375, -1.254364013671875, -1.17523193359375, -1.096099853515625, -1.0169677734375, -0.937835693359375, -0.85870361328125, -0.779571533203125, -0.700439453125, -0.621307373046875, -0.54217529296875, -0.463043212890625, -0.3839111328125, -0.304779052734375, -0.22564697265625, -0.146514892578125, -0.0673828125, 0.011749267578125, 0.09088134765625, 0.170013427734375, 0.2491455078125, 0.328277587890625, 0.40740966796875, 0.486541748046875, 0.565673828125, 0.644805908203125, 0.72393798828125, 0.803070068359375, 0.8822021484375, 0.961334228515625, 1.04046630859375, 1.119598388671875, 1.19873046875, 1.277862548828125, 1.35699462890625, 1.436126708984375, 1.5152587890625, 1.594390869140625, 1.67352294921875, 1.752655029296875, 1.831787109375, 1.910919189453125, 1.99005126953125, 2.069183349609375, 2.1483154296875, 2.227447509765625, 2.30657958984375, 2.385711669921875, 2.46484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 13.0, 13.0, 21.0, 23.0, 33.0, 23.0, 51.0, 43.0, 53.0, 67.0, 104.0, 170.0, 1520.0, 345.0, 132.0, 71.0, 59.0, 57.0, 37.0, 36.0, 30.0, 35.0, 20.0, 16.0, 15.0, 11.0, 7.0, 9.0, 3.0, 10.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-19.484375, -18.9698486328125, -18.455322265625, -17.9407958984375, -17.42626953125, -16.9117431640625, -16.397216796875, -15.8826904296875, -15.3681640625, -14.8536376953125, -14.339111328125, -13.8245849609375, -13.31005859375, -12.7955322265625, -12.281005859375, -11.7664794921875, -11.251953125, -10.7374267578125, -10.222900390625, -9.7083740234375, -9.19384765625, -8.6793212890625, -8.164794921875, -7.6502685546875, -7.1357421875, -6.6212158203125, -6.106689453125, -5.5921630859375, -5.07763671875, -4.5631103515625, -4.048583984375, -3.5340576171875, -3.01953125, -2.5050048828125, -1.990478515625, -1.4759521484375, -0.96142578125, -0.4468994140625, 0.067626953125, 0.5821533203125, 1.0966796875, 1.6112060546875, 2.125732421875, 2.6402587890625, 3.15478515625, 3.6693115234375, 4.183837890625, 4.6983642578125, 5.212890625, 5.7274169921875, 6.241943359375, 6.7564697265625, 7.27099609375, 7.7855224609375, 8.300048828125, 8.8145751953125, 9.3291015625, 9.8436279296875, 10.358154296875, 10.8726806640625, 11.38720703125, 11.9017333984375, 12.416259765625, 12.9307861328125, 13.4453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 12.0, 16.0, 17.0, 19.0, 19.0, 39.0, 51.0, 74.0, 101.0, 135.0, 192.0, 303.0, 579.0, 2800.0, 2409730.0, 728039.0, 2071.0, 541.0, 316.0, 179.0, 101.0, 93.0, 72.0, 50.0, 39.0, 29.0, 15.0, 8.0, 11.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.78125, -38.49560546875, -37.2099609375, -35.92431640625, -34.638671875, -33.35302734375, -32.0673828125, -30.78173828125, -29.49609375, -28.21044921875, -26.9248046875, -25.63916015625, -24.353515625, -23.06787109375, -21.7822265625, -20.49658203125, -19.2109375, -17.92529296875, -16.6396484375, -15.35400390625, -14.068359375, -12.78271484375, -11.4970703125, -10.21142578125, -8.92578125, -7.64013671875, -6.3544921875, -5.06884765625, -3.783203125, -2.49755859375, -1.2119140625, 0.07373046875, 1.359375, 2.64501953125, 3.9306640625, 5.21630859375, 6.501953125, 7.78759765625, 9.0732421875, 10.35888671875, 11.64453125, 12.93017578125, 14.2158203125, 15.50146484375, 16.787109375, 18.07275390625, 19.3583984375, 20.64404296875, 21.9296875, 23.21533203125, 24.5009765625, 25.78662109375, 27.072265625, 28.35791015625, 29.6435546875, 30.92919921875, 32.21484375, 33.50048828125, 34.7861328125, 36.07177734375, 37.357421875, 38.64306640625, 39.9287109375, 41.21435546875, 42.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 12.0, 660.0, 344.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.052346229553223, -9.838336944580078, -4.62432861328125, 0.5896806716918945, 5.803689002990723, 11.01769733428955, 16.231708526611328, 21.445716857910156, 26.659725189208984, 31.873733520507812, 37.08774185180664, 42.30175018310547, 47.51576232910156, 52.729766845703125, 57.94377899169922, 63.15778732299805, 68.37179565429688, 73.58580780029297, 78.79981231689453, 84.01382446289062, 89.22782897949219, 94.44184112548828, 99.65585327148438, 104.86985778808594, 110.0838623046875, 115.2978744506836, 120.51187896728516, 125.72589111328125, 130.9398956298828, 136.15390014648438, 141.367919921875, 146.58192443847656, 151.7959442138672, 157.00994873046875, 162.22396850585938, 167.43797302246094, 172.6519775390625, 177.86598205566406, 183.0800018310547, 188.29400634765625, 193.5080108642578, 198.72201538085938, 203.93603515625, 209.15003967285156, 214.36404418945312, 219.5780487060547, 224.7920684814453, 230.00607299804688, 235.2200927734375, 240.43409729003906, 245.6481170654297, 250.86212158203125, 256.0761413574219, 261.2901306152344, 266.504150390625, 271.7181396484375, 276.9321594238281, 282.14617919921875, 287.36016845703125, 292.5741882324219, 297.7882080078125, 303.002197265625, 308.2162170410156, 313.43023681640625, 318.64422607421875]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 1.0, 9.0, 8.0, 4.0, 14.0, 12.0, 11.0, 22.0, 12.0, 20.0, 13.0, 20.0, 23.0, 33.0, 34.0, 33.0, 30.0, 31.0, 28.0, 38.0, 43.0, 28.0, 31.0, 42.0, 50.0, 33.0, 31.0, 39.0, 28.0, 34.0, 29.0, 23.0, 27.0, 19.0, 18.0, 17.0, 13.0, 10.0, 11.0, 21.0, 10.0, 6.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-26.892616271972656, -26.06068229675293, -25.228750228881836, -24.39681625366211, -23.564882278442383, -22.732948303222656, -21.901016235351562, -21.069082260131836, -20.23714828491211, -19.405214309692383, -18.57328224182129, -17.741348266601562, -16.909414291381836, -16.07748031616211, -15.245548248291016, -14.413614273071289, -13.581681251525879, -12.749748229980469, -11.917814254760742, -11.085881233215332, -10.253947257995605, -9.422014236450195, -8.590080261230469, -7.758147239685059, -6.92621374130249, -6.094280242919922, -5.2623467445373535, -4.430413246154785, -3.598479986190796, -2.7665467262268066, -1.9346132278442383, -1.10267972946167, -0.27074623107910156, 0.561187207698822, 1.3931206464767456, 2.2250540256500244, 3.0569875240325928, 3.888920783996582, 4.72085428237915, 5.552787780761719, 6.384721279144287, 7.2166547775268555, 8.048587799072266, 8.880521774291992, 9.712454795837402, 10.544387817382812, 11.376321792602539, 12.208255767822266, 13.040188789367676, 13.872121810913086, 14.704055786132812, 15.535988807678223, 16.367921829223633, 17.19985580444336, 18.031789779663086, 18.863723754882812, 19.695655822753906, 20.527589797973633, 21.359521865844727, 22.191455841064453, 23.02338981628418, 23.855323791503906, 24.687255859375, 25.519189834594727, 26.351123809814453]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 7.0, 11.0, 14.0, 16.0, 13.0, 20.0, 12.0, 30.0, 28.0, 35.0, 37.0, 39.0, 34.0, 46.0, 42.0, 41.0, 55.0, 50.0, 50.0, 39.0, 31.0, 37.0, 37.0, 38.0, 31.0, 24.0, 19.0, 28.0, 23.0, 11.0, 22.0, 18.0, 9.0, 11.0, 6.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.955078125, -3.84149169921875, -3.7279052734375, -3.61431884765625, -3.500732421875, -3.38714599609375, -3.2735595703125, -3.15997314453125, -3.04638671875, -2.93280029296875, -2.8192138671875, -2.70562744140625, -2.592041015625, -2.47845458984375, -2.3648681640625, -2.25128173828125, -2.1376953125, -2.02410888671875, -1.9105224609375, -1.79693603515625, -1.683349609375, -1.56976318359375, -1.4561767578125, -1.34259033203125, -1.22900390625, -1.11541748046875, -1.0018310546875, -0.88824462890625, -0.774658203125, -0.66107177734375, -0.5474853515625, -0.43389892578125, -0.3203125, -0.20672607421875, -0.0931396484375, 0.02044677734375, 0.134033203125, 0.24761962890625, 0.3612060546875, 0.47479248046875, 0.58837890625, 0.70196533203125, 0.8155517578125, 0.92913818359375, 1.042724609375, 1.15631103515625, 1.2698974609375, 1.38348388671875, 1.4970703125, 1.61065673828125, 1.7242431640625, 1.83782958984375, 1.951416015625, 2.06500244140625, 2.1785888671875, 2.29217529296875, 2.40576171875, 2.51934814453125, 2.6329345703125, 2.74652099609375, 2.860107421875, 2.97369384765625, 3.0872802734375, 3.20086669921875, 3.314453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 2.0, 5.0, 8.0, 11.0, 8.0, 17.0, 17.0, 14.0, 19.0, 16.0, 25.0, 30.0, 39.0, 53.0, 79.0, 167.0, 342.0, 1341.0, 11334.0, 493605.0, 3344308.0, 332975.0, 8046.0, 1031.0, 307.0, 123.0, 78.0, 38.0, 33.0, 27.0, 17.0, 27.0, 26.0, 20.0, 21.0, 14.0, 13.0, 14.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.255126953125, -11.87744140625, -11.499755859375, -11.1220703125, -10.744384765625, -10.36669921875, -9.989013671875, -9.611328125, -9.233642578125, -8.85595703125, -8.478271484375, -8.1005859375, -7.722900390625, -7.34521484375, -6.967529296875, -6.58984375, -6.212158203125, -5.83447265625, -5.456787109375, -5.0791015625, -4.701416015625, -4.32373046875, -3.946044921875, -3.568359375, -3.190673828125, -2.81298828125, -2.435302734375, -2.0576171875, -1.679931640625, -1.30224609375, -0.924560546875, -0.546875, -0.169189453125, 0.20849609375, 0.586181640625, 0.9638671875, 1.341552734375, 1.71923828125, 2.096923828125, 2.474609375, 2.852294921875, 3.22998046875, 3.607666015625, 3.9853515625, 4.363037109375, 4.74072265625, 5.118408203125, 5.49609375, 5.873779296875, 6.25146484375, 6.629150390625, 7.0068359375, 7.384521484375, 7.76220703125, 8.139892578125, 8.517578125, 8.895263671875, 9.27294921875, 9.650634765625, 10.0283203125, 10.406005859375, 10.78369140625, 11.161376953125, 11.5390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 18.0, 26.0, 25.0, 47.0, 57.0, 68.0, 116.0, 173.0, 236.0, 315.0, 384.0, 476.0, 467.0, 398.0, 356.0, 239.0, 189.0, 112.0, 92.0, 75.0, 50.0, 42.0, 31.0, 18.0, 10.0, 6.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84765625, -6.60382080078125, -6.3599853515625, -6.11614990234375, -5.872314453125, -5.62847900390625, -5.3846435546875, -5.14080810546875, -4.89697265625, -4.65313720703125, -4.4093017578125, -4.16546630859375, -3.921630859375, -3.67779541015625, -3.4339599609375, -3.19012451171875, -2.9462890625, -2.70245361328125, -2.4586181640625, -2.21478271484375, -1.970947265625, -1.72711181640625, -1.4832763671875, -1.23944091796875, -0.99560546875, -0.75177001953125, -0.5079345703125, -0.26409912109375, -0.020263671875, 0.22357177734375, 0.4674072265625, 0.71124267578125, 0.955078125, 1.19891357421875, 1.4427490234375, 1.68658447265625, 1.930419921875, 2.17425537109375, 2.4180908203125, 2.66192626953125, 2.90576171875, 3.14959716796875, 3.3934326171875, 3.63726806640625, 3.881103515625, 4.12493896484375, 4.3687744140625, 4.61260986328125, 4.8564453125, 5.10028076171875, 5.3441162109375, 5.58795166015625, 5.831787109375, 6.07562255859375, 6.3194580078125, 6.56329345703125, 6.80712890625, 7.05096435546875, 7.2947998046875, 7.53863525390625, 7.782470703125, 8.02630615234375, 8.2701416015625, 8.51397705078125, 8.7578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 10.0, 7.0, 11.0, 15.0, 21.0, 20.0, 33.0, 44.0, 63.0, 90.0, 97.0, 131.0, 155.0, 271.0, 441.0, 926.0, 6117.0, 230831.0, 3673553.0, 272325.0, 6704.0, 1010.0, 456.0, 253.0, 168.0, 136.0, 94.0, 67.0, 46.0, 43.0, 27.0, 31.0, 21.0, 16.0, 11.0, 7.0, 7.0, 9.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.484375, -18.903076171875, -18.32177734375, -17.740478515625, -17.1591796875, -16.577880859375, -15.99658203125, -15.415283203125, -14.833984375, -14.252685546875, -13.67138671875, -13.090087890625, -12.5087890625, -11.927490234375, -11.34619140625, -10.764892578125, -10.18359375, -9.602294921875, -9.02099609375, -8.439697265625, -7.8583984375, -7.277099609375, -6.69580078125, -6.114501953125, -5.533203125, -4.951904296875, -4.37060546875, -3.789306640625, -3.2080078125, -2.626708984375, -2.04541015625, -1.464111328125, -0.8828125, -0.301513671875, 0.27978515625, 0.861083984375, 1.4423828125, 2.023681640625, 2.60498046875, 3.186279296875, 3.767578125, 4.348876953125, 4.93017578125, 5.511474609375, 6.0927734375, 6.674072265625, 7.25537109375, 7.836669921875, 8.41796875, 8.999267578125, 9.58056640625, 10.161865234375, 10.7431640625, 11.324462890625, 11.90576171875, 12.487060546875, 13.068359375, 13.649658203125, 14.23095703125, 14.812255859375, 15.3935546875, 15.974853515625, 16.55615234375, 17.137451171875, 17.71875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 16.0, 66.0, 167.0, 278.0, 277.0, 141.0, 49.0, 12.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.045875549316406, -29.544979095458984, -27.04408073425293, -24.543182373046875, -22.042285919189453, -19.54138946533203, -17.040491104125977, -14.539592742919922, -12.0386962890625, -9.537798881530762, -7.036901473999023, -4.536004066467285, -2.035106658935547, 0.4657907485961914, 2.9666881561279297, 5.467586517333984, 7.968482971191406, 10.469380378723145, 12.970277786254883, 15.471175193786621, 17.97207260131836, 20.47296905517578, 22.973867416381836, 25.47476577758789, 27.975662231445312, 30.476558685302734, 32.977455139160156, 35.478355407714844, 37.979251861572266, 40.48014831542969, 42.981048583984375, 45.4819450378418, 47.98283386230469, 50.48373031616211, 52.98462677001953, 55.48552703857422, 57.98642349243164, 60.48731994628906, 62.98822021484375, 65.48912048339844, 67.9900131225586, 70.49091339111328, 72.99180603027344, 75.49270629882812, 77.99360656738281, 80.49449920654297, 82.99539947509766, 85.49629211425781, 87.9971923828125, 90.49809265136719, 92.99898529052734, 95.49988555908203, 98.00077819824219, 100.50167846679688, 103.00257873535156, 105.50347900390625, 108.0043716430664, 110.5052719116211, 113.00616455078125, 115.50706481933594, 118.00796508789062, 120.50885772705078, 123.00975799560547, 125.51065063476562, 128.0115509033203]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 2.0, 9.0, 14.0, 11.0, 11.0, 19.0, 13.0, 24.0, 20.0, 22.0, 30.0, 24.0, 35.0, 29.0, 41.0, 30.0, 30.0, 32.0, 45.0, 49.0, 43.0, 42.0, 40.0, 35.0, 31.0, 35.0, 18.0, 24.0, 33.0, 27.0, 31.0, 19.0, 23.0, 15.0, 17.0, 8.0, 19.0, 9.0, 12.0, 7.0, 3.0, 2.0, 9.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.791484832763672, -20.0788631439209, -19.366241455078125, -18.65361976623535, -17.940998077392578, -17.228376388549805, -16.51575469970703, -15.803133964538574, -15.0905122756958, -14.377890586853027, -13.665268898010254, -12.952648162841797, -12.240026473999023, -11.52740478515625, -10.814783096313477, -10.102161407470703, -9.38953971862793, -8.676918029785156, -7.964296340942383, -7.251675128936768, -6.539053440093994, -5.826431751251221, -5.1138105392456055, -4.401188850402832, -3.6885671615600586, -2.975945472717285, -2.263324022293091, -1.5507025718688965, -0.838080883026123, -0.1254591941833496, 0.5871620178222656, 1.299783706665039, 2.0124073028564453, 2.7250289916992188, 3.437650442123413, 4.150271892547607, 4.862893581390381, 5.575515270233154, 6.2881364822387695, 7.000758171081543, 7.713379859924316, 8.42600154876709, 9.138623237609863, 9.85124397277832, 10.563865661621094, 11.276487350463867, 11.98910903930664, 12.701730728149414, 13.414352416992188, 14.126974105834961, 14.839595794677734, 15.552217483520508, 16.26483917236328, 16.977460861206055, 17.690082550048828, 18.40270233154297, 19.115325927734375, 19.82794761657715, 20.540569305419922, 21.253190994262695, 21.96581268310547, 22.678434371948242, 23.391056060791016, 24.103675842285156, 24.81629753112793]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 12.0, 8.0, 19.0, 18.0, 23.0, 27.0, 22.0, 30.0, 34.0, 29.0, 38.0, 44.0, 49.0, 49.0, 33.0, 42.0, 53.0, 44.0, 50.0, 37.0, 44.0, 26.0, 37.0, 27.0, 24.0, 34.0, 20.0, 25.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.47906494140625, -3.3663330078125, -3.25360107421875, -3.140869140625, -3.02813720703125, -2.9154052734375, -2.80267333984375, -2.68994140625, -2.57720947265625, -2.4644775390625, -2.35174560546875, -2.239013671875, -2.12628173828125, -2.0135498046875, -1.90081787109375, -1.7880859375, -1.67535400390625, -1.5626220703125, -1.44989013671875, -1.337158203125, -1.22442626953125, -1.1116943359375, -0.99896240234375, -0.88623046875, -0.77349853515625, -0.6607666015625, -0.54803466796875, -0.435302734375, -0.32257080078125, -0.2098388671875, -0.09710693359375, 0.015625, 0.12835693359375, 0.2410888671875, 0.35382080078125, 0.466552734375, 0.57928466796875, 0.6920166015625, 0.80474853515625, 0.91748046875, 1.03021240234375, 1.1429443359375, 1.25567626953125, 1.368408203125, 1.48114013671875, 1.5938720703125, 1.70660400390625, 1.8193359375, 1.93206787109375, 2.0447998046875, 2.15753173828125, 2.270263671875, 2.38299560546875, 2.4957275390625, 2.60845947265625, 2.72119140625, 2.83392333984375, 2.9466552734375, 3.05938720703125, 3.172119140625, 3.28485107421875, 3.3975830078125, 3.51031494140625, 3.623046875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 2.0, 13.0, 18.0, 21.0, 37.0, 41.0, 68.0, 99.0, 155.0, 228.0, 328.0, 484.0, 685.0, 1046.0, 1520.0, 2301.0, 3405.0, 5078.0, 7474.0, 11643.0, 17644.0, 27880.0, 44875.0, 77510.0, 151498.0, 291996.0, 177524.0, 87259.0, 50113.0, 30731.0, 19319.0, 12444.0, 8348.0, 5438.0, 3704.0, 2450.0, 1670.0, 1156.0, 739.0, 512.0, 340.0, 240.0, 184.0, 112.0, 81.0, 41.0, 31.0, 20.0, 20.0, 15.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56103515625, -0.5427017211914062, -0.5243682861328125, -0.5060348510742188, -0.487701416015625, -0.46936798095703125, -0.4510345458984375, -0.43270111083984375, -0.41436767578125, -0.39603424072265625, -0.3777008056640625, -0.35936737060546875, -0.341033935546875, -0.32270050048828125, -0.3043670654296875, -0.28603363037109375, -0.2677001953125, -0.24936676025390625, -0.2310333251953125, -0.21269989013671875, -0.194366455078125, -0.17603302001953125, -0.1576995849609375, -0.13936614990234375, -0.12103271484375, -0.10269927978515625, -0.0843658447265625, -0.06603240966796875, -0.047698974609375, -0.02936553955078125, -0.0110321044921875, 0.00730133056640625, 0.025634765625, 0.04396820068359375, 0.0623016357421875, 0.08063507080078125, 0.098968505859375, 0.11730194091796875, 0.1356353759765625, 0.15396881103515625, 0.17230224609375, 0.19063568115234375, 0.2089691162109375, 0.22730255126953125, 0.245635986328125, 0.26396942138671875, 0.2823028564453125, 0.30063629150390625, 0.3189697265625, 0.33730316162109375, 0.3556365966796875, 0.37397003173828125, 0.392303466796875, 0.41063690185546875, 0.4289703369140625, 0.44730377197265625, 0.46563720703125, 0.48397064208984375, 0.5023040771484375, 0.5206375122070312, 0.538970947265625, 0.5573043823242188, 0.5756378173828125, 0.5939712524414062, 0.6123046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 10.0, 7.0, 10.0, 14.0, 19.0, 16.0, 24.0, 22.0, 27.0, 33.0, 28.0, 31.0, 27.0, 34.0, 45.0, 37.0, 38.0, 35.0, 1071.0, 53.0, 35.0, 35.0, 32.0, 37.0, 40.0, 22.0, 44.0, 25.0, 27.0, 19.0, 22.0, 16.0, 24.0, 12.0, 8.0, 7.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.8905792236328125, -1.823150634765625, -1.7557220458984375, -1.68829345703125, -1.6208648681640625, -1.553436279296875, -1.4860076904296875, -1.4185791015625, -1.3511505126953125, -1.283721923828125, -1.2162933349609375, -1.14886474609375, -1.0814361572265625, -1.014007568359375, -0.9465789794921875, -0.879150390625, -0.8117218017578125, -0.744293212890625, -0.6768646240234375, -0.60943603515625, -0.5420074462890625, -0.474578857421875, -0.4071502685546875, -0.3397216796875, -0.2722930908203125, -0.204864501953125, -0.1374359130859375, -0.07000732421875, -0.0025787353515625, 0.064849853515625, 0.1322784423828125, 0.19970703125, 0.2671356201171875, 0.334564208984375, 0.4019927978515625, 0.46942138671875, 0.5368499755859375, 0.604278564453125, 0.6717071533203125, 0.7391357421875, 0.8065643310546875, 0.873992919921875, 0.9414215087890625, 1.00885009765625, 1.0762786865234375, 1.143707275390625, 1.2111358642578125, 1.278564453125, 1.3459930419921875, 1.413421630859375, 1.4808502197265625, 1.54827880859375, 1.6157073974609375, 1.683135986328125, 1.7505645751953125, 1.8179931640625, 1.8854217529296875, 1.952850341796875, 2.0202789306640625, 2.08770751953125, 2.1551361083984375, 2.222564697265625, 2.2899932861328125, 2.357421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 10.0, 8.0, 18.0, 19.0, 32.0, 36.0, 60.0, 88.0, 153.0, 208.0, 296.0, 439.0, 598.0, 921.0, 1348.0, 2080.0, 3006.0, 4395.0, 6460.0, 9573.0, 14339.0, 21239.0, 32352.0, 49679.0, 81903.0, 156438.0, 1326280.0, 156362.0, 81740.0, 49621.0, 32315.0, 21433.0, 14119.0, 9565.0, 6470.0, 4300.0, 2940.0, 1967.0, 1348.0, 966.0, 674.0, 418.0, 299.0, 206.0, 135.0, 95.0, 65.0, 47.0, 25.0, 22.0, 12.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.50537109375, -0.4898223876953125, -0.474273681640625, -0.4587249755859375, -0.44317626953125, -0.4276275634765625, -0.412078857421875, -0.3965301513671875, -0.3809814453125, -0.3654327392578125, -0.349884033203125, -0.3343353271484375, -0.31878662109375, -0.3032379150390625, -0.287689208984375, -0.2721405029296875, -0.256591796875, -0.2410430908203125, -0.225494384765625, -0.2099456787109375, -0.19439697265625, -0.1788482666015625, -0.163299560546875, -0.1477508544921875, -0.1322021484375, -0.1166534423828125, -0.101104736328125, -0.0855560302734375, -0.07000732421875, -0.0544586181640625, -0.038909912109375, -0.0233612060546875, -0.0078125, 0.0077362060546875, 0.023284912109375, 0.0388336181640625, 0.05438232421875, 0.0699310302734375, 0.085479736328125, 0.1010284423828125, 0.1165771484375, 0.1321258544921875, 0.147674560546875, 0.1632232666015625, 0.17877197265625, 0.1943206787109375, 0.209869384765625, 0.2254180908203125, 0.240966796875, 0.2565155029296875, 0.272064208984375, 0.2876129150390625, 0.30316162109375, 0.3187103271484375, 0.334259033203125, 0.3498077392578125, 0.3653564453125, 0.3809051513671875, 0.396453857421875, 0.4120025634765625, 0.42755126953125, 0.4430999755859375, 0.458648681640625, 0.4741973876953125, 0.48974609375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 10.0, 10.0, 11.0, 15.0, 21.0, 24.0, 31.0, 39.0, 60.0, 69.0, 75.0, 70.0, 88.0, 74.0, 86.0, 60.0, 55.0, 42.0, 29.0, 39.0, 17.0, 19.0, 14.0, 8.0, 6.0, 11.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001627206802368164, -0.0001574549823999405, -0.00015218928456306458, -0.00014692358672618866, -0.00014165788888931274, -0.00013639219105243683, -0.0001311264932155609, -0.000125860795378685, -0.00012059509754180908, -0.00011532939970493317, -0.00011006370186805725, -0.00010479800403118134, -9.953230619430542e-05, -9.42666083574295e-05, -8.900091052055359e-05, -8.373521268367767e-05, -7.846951484680176e-05, -7.320381700992584e-05, -6.793811917304993e-05, -6.267242133617401e-05, -5.7406723499298096e-05, -5.214102566242218e-05, -4.6875327825546265e-05, -4.160962998867035e-05, -3.6343932151794434e-05, -3.107823431491852e-05, -2.5812536478042603e-05, -2.0546838641166687e-05, -1.528114080429077e-05, -1.0015442967414856e-05, -4.7497451305389404e-06, 5.159527063369751e-07, 5.781650543212891e-06, 1.1047348380088806e-05, 1.631304621696472e-05, 2.1578744053840637e-05, 2.6844441890716553e-05, 3.211013972759247e-05, 3.7375837564468384e-05, 4.26415354013443e-05, 4.7907233238220215e-05, 5.317293107509613e-05, 5.8438628911972046e-05, 6.370432674884796e-05, 6.897002458572388e-05, 7.423572242259979e-05, 7.950142025947571e-05, 8.476711809635162e-05, 9.003281593322754e-05, 9.529851377010345e-05, 0.00010056421160697937, 0.00010582990944385529, 0.0001110956072807312, 0.00011636130511760712, 0.00012162700295448303, 0.00012689270079135895, 0.00013215839862823486, 0.00013742409646511078, 0.0001426897943019867, 0.0001479554921388626, 0.00015322118997573853, 0.00015848688781261444, 0.00016375258564949036, 0.00016901828348636627, 0.0001742839813232422]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 16.0, 22.0, 35.0, 50.0, 54.0, 89.0, 153.0, 262.0, 713.0, 7543.0, 1035717.0, 2586.0, 586.0, 268.0, 130.0, 88.0, 61.0, 43.0, 28.0, 34.0, 15.0, 8.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0037899017333984375, -0.0036764442920684814, -0.0035629868507385254, -0.0034495294094085693, -0.0033360719680786133, -0.0032226145267486572, -0.003109157085418701, -0.002995699644088745, -0.002882242202758789, -0.002768784761428833, -0.002655327320098877, -0.002541869878768921, -0.002428412437438965, -0.002314954996109009, -0.0022014975547790527, -0.0020880401134490967, -0.0019745826721191406, -0.0018611252307891846, -0.0017476677894592285, -0.0016342103481292725, -0.0015207529067993164, -0.0014072954654693604, -0.0012938380241394043, -0.0011803805828094482, -0.0010669231414794922, -0.0009534657001495361, -0.0008400082588195801, -0.000726550817489624, -0.000613093376159668, -0.0004996359348297119, -0.00038617849349975586, -0.0002727210521697998, -0.00015926361083984375, -4.5806169509887695e-05, 6.765127182006836e-05, 0.00018110871315002441, 0.00029456615447998047, 0.0004080235958099365, 0.0005214810371398926, 0.0006349384784698486, 0.0007483959197998047, 0.0008618533611297607, 0.0009753108024597168, 0.0010887682437896729, 0.001202225685119629, 0.001315683126449585, 0.001429140567779541, 0.001542598009109497, 0.0016560554504394531, 0.0017695128917694092, 0.0018829703330993652, 0.0019964277744293213, 0.0021098852157592773, 0.0022233426570892334, 0.0023368000984191895, 0.0024502575397491455, 0.0025637149810791016, 0.0026771724224090576, 0.0027906298637390137, 0.0029040873050689697, 0.0030175447463989258, 0.003131002187728882, 0.003244459629058838, 0.003357917070388794, 0.00347137451171875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 22.0, 99.0, 228.0, 302.0, 239.0, 99.0, 15.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.797560202656314e-05, -3.105178984696977e-05, -2.41279776673764e-05, -1.7204167306772433e-05, -1.0280355127179064e-05, -3.356544766575098e-06, 3.5672674130182713e-06, 1.049107959261164e-05, 1.741489177220501e-05, 2.433870395179838e-05, 3.126251613139175e-05, 3.818632831098512e-05, 4.511013685259968e-05, 5.203394903219305e-05, 5.895776121178642e-05, 6.588156975340098e-05, 7.280538557097316e-05, 7.972919411258772e-05, 8.66530099301599e-05, 9.357681847177446e-05, 0.00010050063428934664, 0.0001074244428309612, 0.00011434825137257576, 0.00012127206719014794, 0.0001281958830077201, 0.0001351196988252923, 0.00014204350009094924, 0.00014896731590852141, 0.0001558911317260936, 0.00016281494754366577, 0.00016973874880932271, 0.0001766625646268949, 0.00018358636589255184, 0.00019051018171012402, 0.00019743398297578096, 0.00020435779879335314, 0.00021128161461092532, 0.00021820541587658226, 0.00022512923169415444, 0.00023205304751172662, 0.0002389768633292988, 0.00024590067914687097, 0.0002528244804125279, 0.0002597483107820153, 0.00026667211204767227, 0.0002735959133133292, 0.0002805197436828166, 0.00028744354494847357, 0.0002943673462141305, 0.00030129114747978747, 0.0003082149778492749, 0.0003151387791149318, 0.00032206258038058877, 0.0003289864107500762, 0.0003359102120157331, 0.00034283404238522053, 0.0003497578436508775, 0.0003566816449165344, 0.00036360547528602183, 0.0003705292765516788, 0.0003774530778173357, 0.00038437690818682313, 0.0003913007094524801, 0.000398224510718137, 0.00040514834108762443]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 8.0, 7.0, 7.0, 12.0, 7.0, 16.0, 10.0, 6.0, 13.0, 15.0, 17.0, 26.0, 21.0, 27.0, 45.0, 43.0, 34.0, 40.0, 42.0, 42.0, 33.0, 51.0, 32.0, 41.0, 22.0, 44.0, 39.0, 39.0, 35.0, 35.0, 32.0, 28.0, 20.0, 23.0, 20.0, 12.0, 10.0, 14.0, 10.0, 6.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.047023296356201e-05, -4.836916923522949e-05, -4.626810550689697e-05, -4.416704177856445e-05, -4.2065978050231934e-05, -3.9964914321899414e-05, -3.7863850593566895e-05, -3.5762786865234375e-05, -3.3661723136901855e-05, -3.1560659408569336e-05, -2.9459595680236816e-05, -2.7358531951904297e-05, -2.5257468223571777e-05, -2.3156404495239258e-05, -2.1055340766906738e-05, -1.895427703857422e-05, -1.68532133102417e-05, -1.475214958190918e-05, -1.265108585357666e-05, -1.055002212524414e-05, -8.448958396911621e-06, -6.3478946685791016e-06, -4.246830940246582e-06, -2.1457672119140625e-06, -4.470348358154297e-08, 2.0563602447509766e-06, 4.157423973083496e-06, 6.258487701416016e-06, 8.359551429748535e-06, 1.0460615158081055e-05, 1.2561678886413574e-05, 1.4662742614746094e-05, 1.6763806343078613e-05, 1.8864870071411133e-05, 2.0965933799743652e-05, 2.3066997528076172e-05, 2.516806125640869e-05, 2.726912498474121e-05, 2.937018871307373e-05, 3.147125244140625e-05, 3.357231616973877e-05, 3.567337989807129e-05, 3.777444362640381e-05, 3.987550735473633e-05, 4.197657108306885e-05, 4.407763481140137e-05, 4.617869853973389e-05, 4.8279762268066406e-05, 5.0380825996398926e-05, 5.2481889724731445e-05, 5.4582953453063965e-05, 5.6684017181396484e-05, 5.8785080909729004e-05, 6.0886144638061523e-05, 6.298720836639404e-05, 6.508827209472656e-05, 6.718933582305908e-05, 6.92903995513916e-05, 7.139146327972412e-05, 7.349252700805664e-05, 7.559359073638916e-05, 7.769465446472168e-05, 7.97957181930542e-05, 8.189678192138672e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 12.0, 8.0, 19.0, 18.0, 23.0, 27.0, 22.0, 30.0, 34.0, 29.0, 38.0, 44.0, 49.0, 49.0, 33.0, 42.0, 53.0, 44.0, 50.0, 37.0, 44.0, 26.0, 37.0, 27.0, 24.0, 34.0, 20.0, 25.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.47906494140625, -3.3663330078125, -3.25360107421875, -3.140869140625, -3.02813720703125, -2.9154052734375, -2.80267333984375, -2.68994140625, -2.57720947265625, -2.4644775390625, -2.35174560546875, -2.239013671875, -2.12628173828125, -2.0135498046875, -1.90081787109375, -1.7880859375, -1.67535400390625, -1.5626220703125, -1.44989013671875, -1.337158203125, -1.22442626953125, -1.1116943359375, -0.99896240234375, -0.88623046875, -0.77349853515625, -0.6607666015625, -0.54803466796875, -0.435302734375, -0.32257080078125, -0.2098388671875, -0.09710693359375, 0.015625, 0.12835693359375, 0.2410888671875, 0.35382080078125, 0.466552734375, 0.57928466796875, 0.6920166015625, 0.80474853515625, 0.91748046875, 1.03021240234375, 1.1429443359375, 1.25567626953125, 1.368408203125, 1.48114013671875, 1.5938720703125, 1.70660400390625, 1.8193359375, 1.93206787109375, 2.0447998046875, 2.15753173828125, 2.270263671875, 2.38299560546875, 2.4957275390625, 2.60845947265625, 2.72119140625, 2.83392333984375, 2.9466552734375, 3.05938720703125, 3.172119140625, 3.28485107421875, 3.3975830078125, 3.51031494140625, 3.623046875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 13.0, 16.0, 32.0, 41.0, 56.0, 89.0, 136.0, 217.0, 379.0, 672.0, 1432.0, 3494.0, 9328.0, 25098.0, 66703.0, 179319.0, 394431.0, 230284.0, 84595.0, 32163.0, 11969.0, 4402.0, 1778.0, 822.0, 409.0, 239.0, 149.0, 93.0, 59.0, 44.0, 33.0, 14.0, 13.0, 7.0, 7.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5, -3.373291015625, -3.24658203125, -3.119873046875, -2.9931640625, -2.866455078125, -2.73974609375, -2.613037109375, -2.486328125, -2.359619140625, -2.23291015625, -2.106201171875, -1.9794921875, -1.852783203125, -1.72607421875, -1.599365234375, -1.47265625, -1.345947265625, -1.21923828125, -1.092529296875, -0.9658203125, -0.839111328125, -0.71240234375, -0.585693359375, -0.458984375, -0.332275390625, -0.20556640625, -0.078857421875, 0.0478515625, 0.174560546875, 0.30126953125, 0.427978515625, 0.5546875, 0.681396484375, 0.80810546875, 0.934814453125, 1.0615234375, 1.188232421875, 1.31494140625, 1.441650390625, 1.568359375, 1.695068359375, 1.82177734375, 1.948486328125, 2.0751953125, 2.201904296875, 2.32861328125, 2.455322265625, 2.58203125, 2.708740234375, 2.83544921875, 2.962158203125, 3.0888671875, 3.215576171875, 3.34228515625, 3.468994140625, 3.595703125, 3.722412109375, 3.84912109375, 3.975830078125, 4.1025390625, 4.229248046875, 4.35595703125, 4.482666015625, 4.609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 13.0, 12.0, 21.0, 20.0, 28.0, 39.0, 32.0, 45.0, 47.0, 57.0, 103.0, 273.0, 1613.0, 222.0, 88.0, 70.0, 49.0, 44.0, 47.0, 39.0, 38.0, 26.0, 20.0, 15.0, 11.0, 10.0, 10.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.0, -13.5408935546875, -13.081787109375, -12.6226806640625, -12.16357421875, -11.7044677734375, -11.245361328125, -10.7862548828125, -10.3271484375, -9.8680419921875, -9.408935546875, -8.9498291015625, -8.49072265625, -8.0316162109375, -7.572509765625, -7.1134033203125, -6.654296875, -6.1951904296875, -5.736083984375, -5.2769775390625, -4.81787109375, -4.3587646484375, -3.899658203125, -3.4405517578125, -2.9814453125, -2.5223388671875, -2.063232421875, -1.6041259765625, -1.14501953125, -0.6859130859375, -0.226806640625, 0.2322998046875, 0.69140625, 1.1505126953125, 1.609619140625, 2.0687255859375, 2.52783203125, 2.9869384765625, 3.446044921875, 3.9051513671875, 4.3642578125, 4.8233642578125, 5.282470703125, 5.7415771484375, 6.20068359375, 6.6597900390625, 7.118896484375, 7.5780029296875, 8.037109375, 8.4962158203125, 8.955322265625, 9.4144287109375, 9.87353515625, 10.3326416015625, 10.791748046875, 11.2508544921875, 11.7099609375, 12.1690673828125, 12.628173828125, 13.0872802734375, 13.54638671875, 14.0054931640625, 14.464599609375, 14.9237060546875, 15.3828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 8.0, 10.0, 14.0, 23.0, 22.0, 39.0, 41.0, 70.0, 94.0, 138.0, 210.0, 462.0, 1612.0, 2845950.0, 294976.0, 1109.0, 362.0, 173.0, 111.0, 71.0, 59.0, 42.0, 31.0, 17.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.6875, -51.0859375, -49.484375, -47.8828125, -46.28125, -44.6796875, -43.078125, -41.4765625, -39.875, -38.2734375, -36.671875, -35.0703125, -33.46875, -31.8671875, -30.265625, -28.6640625, -27.0625, -25.4609375, -23.859375, -22.2578125, -20.65625, -19.0546875, -17.453125, -15.8515625, -14.25, -12.6484375, -11.046875, -9.4453125, -7.84375, -6.2421875, -4.640625, -3.0390625, -1.4375, 0.1640625, 1.765625, 3.3671875, 4.96875, 6.5703125, 8.171875, 9.7734375, 11.375, 12.9765625, 14.578125, 16.1796875, 17.78125, 19.3828125, 20.984375, 22.5859375, 24.1875, 25.7890625, 27.390625, 28.9921875, 30.59375, 32.1953125, 33.796875, 35.3984375, 37.0, 38.6015625, 40.203125, 41.8046875, 43.40625, 45.0078125, 46.609375, 48.2109375, 49.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [242.0, 773.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.701264381408691, -1.5497503280639648, 5.601763725280762, 12.753277778625488, 19.90479278564453, 27.056304931640625, 34.207820892333984, 41.359336853027344, 48.51084899902344, 55.66236114501953, 62.81387710571289, 69.96539306640625, 77.11690521240234, 84.26841735839844, 91.41993713378906, 98.57144927978516, 105.72296142578125, 112.87447357177734, 120.02598571777344, 127.17750549316406, 134.32901000976562, 141.48052978515625, 148.63204956054688, 155.7835693359375, 162.93507385253906, 170.0865936279297, 177.23809814453125, 184.38961791992188, 191.5411376953125, 198.69264221191406, 205.8441619873047, 212.99566650390625, 220.14718627929688, 227.2987060546875, 234.45021057128906, 241.6017303466797, 248.75323486328125, 255.90475463867188, 263.0562744140625, 270.2077941894531, 277.35931396484375, 284.5108337402344, 291.662353515625, 298.8138427734375, 305.9653625488281, 313.11688232421875, 320.2684020996094, 327.419921875, 334.5714111328125, 341.7229309082031, 348.87445068359375, 356.02593994140625, 363.1774597167969, 370.3289794921875, 377.4804992675781, 384.63201904296875, 391.78350830078125, 398.9350280761719, 406.0865478515625, 413.238037109375, 420.3895568847656, 427.54107666015625, 434.6925964355469, 441.8441162109375, 448.9956359863281]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 11.0, 5.0, 14.0, 14.0, 15.0, 21.0, 27.0, 21.0, 28.0, 22.0, 32.0, 37.0, 26.0, 41.0, 50.0, 41.0, 53.0, 33.0, 43.0, 37.0, 34.0, 26.0, 34.0, 43.0, 40.0, 41.0, 30.0, 28.0, 19.0, 19.0, 14.0, 11.0, 16.0, 17.0, 12.0, 10.0, 12.0, 5.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.32056427001953, -38.190773010253906, -37.06098175048828, -35.93118667602539, -34.801395416259766, -33.67160415649414, -32.541812896728516, -31.41202163696289, -30.282228469848633, -29.152437210083008, -28.02264404296875, -26.892852783203125, -25.7630615234375, -24.633268356323242, -23.503477096557617, -22.37368392944336, -21.243892669677734, -20.11410140991211, -18.98430824279785, -17.854516983032227, -16.72472381591797, -15.594932556152344, -14.465141296386719, -13.335349082946777, -12.205556869506836, -11.075764656066895, -9.945972442626953, -8.816181182861328, -7.686388969421387, -6.556596755981445, -5.426805019378662, -4.297013282775879, -3.167217254638672, -2.0374252796173096, -0.9076333045959473, 0.22215867042541504, 1.3519506454467773, 2.4817428588867188, 3.611534595489502, 4.741326332092285, 5.871118545532227, 7.000910758972168, 8.13070297241211, 9.260494232177734, 10.390286445617676, 11.520078659057617, 12.649869918823242, 13.779662132263184, 14.909454345703125, 16.03924560546875, 17.169038772583008, 18.298830032348633, 19.42862319946289, 20.558414459228516, 21.68820571899414, 22.817996978759766, 23.947790145874023, 25.07758140563965, 26.207374572753906, 27.33716583251953, 28.466957092285156, 29.596750259399414, 30.72654151916504, 31.856334686279297, 32.98612594604492]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 7.0, 4.0, 9.0, 15.0, 13.0, 21.0, 16.0, 21.0, 21.0, 21.0, 32.0, 41.0, 44.0, 43.0, 43.0, 35.0, 35.0, 43.0, 48.0, 39.0, 47.0, 30.0, 49.0, 39.0, 36.0, 35.0, 31.0, 33.0, 28.0, 16.0, 14.0, 12.0, 17.0, 14.0, 7.0, 6.0, 11.0, 6.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.998046875, -3.87109375, -3.744140625, -3.6171875, -3.490234375, -3.36328125, -3.236328125, -3.109375, -2.982421875, -2.85546875, -2.728515625, -2.6015625, -2.474609375, -2.34765625, -2.220703125, -2.09375, -1.966796875, -1.83984375, -1.712890625, -1.5859375, -1.458984375, -1.33203125, -1.205078125, -1.078125, -0.951171875, -0.82421875, -0.697265625, -0.5703125, -0.443359375, -0.31640625, -0.189453125, -0.0625, 0.064453125, 0.19140625, 0.318359375, 0.4453125, 0.572265625, 0.69921875, 0.826171875, 0.953125, 1.080078125, 1.20703125, 1.333984375, 1.4609375, 1.587890625, 1.71484375, 1.841796875, 1.96875, 2.095703125, 2.22265625, 2.349609375, 2.4765625, 2.603515625, 2.73046875, 2.857421875, 2.984375, 3.111328125, 3.23828125, 3.365234375, 3.4921875, 3.619140625, 3.74609375, 3.873046875, 4.0]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 10.0, 15.0, 18.0, 15.0, 22.0, 25.0, 18.0, 33.0, 48.0, 48.0, 76.0, 131.0, 381.0, 1410.0, 11417.0, 523601.0, 3307037.0, 340126.0, 7977.0, 1084.0, 301.0, 131.0, 58.0, 51.0, 31.0, 26.0, 20.0, 26.0, 23.0, 13.0, 13.0, 17.0, 8.0, 3.0, 10.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.125, -12.720458984375, -12.31591796875, -11.911376953125, -11.5068359375, -11.102294921875, -10.69775390625, -10.293212890625, -9.888671875, -9.484130859375, -9.07958984375, -8.675048828125, -8.2705078125, -7.865966796875, -7.46142578125, -7.056884765625, -6.65234375, -6.247802734375, -5.84326171875, -5.438720703125, -5.0341796875, -4.629638671875, -4.22509765625, -3.820556640625, -3.416015625, -3.011474609375, -2.60693359375, -2.202392578125, -1.7978515625, -1.393310546875, -0.98876953125, -0.584228515625, -0.1796875, 0.224853515625, 0.62939453125, 1.033935546875, 1.4384765625, 1.843017578125, 2.24755859375, 2.652099609375, 3.056640625, 3.461181640625, 3.86572265625, 4.270263671875, 4.6748046875, 5.079345703125, 5.48388671875, 5.888427734375, 6.29296875, 6.697509765625, 7.10205078125, 7.506591796875, 7.9111328125, 8.315673828125, 8.72021484375, 9.124755859375, 9.529296875, 9.933837890625, 10.33837890625, 10.742919921875, 11.1474609375, 11.552001953125, 11.95654296875, 12.361083984375, 12.765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 7.0, 6.0, 12.0, 22.0, 42.0, 62.0, 83.0, 130.0, 198.0, 286.0, 365.0, 538.0, 559.0, 515.0, 372.0, 266.0, 202.0, 123.0, 78.0, 70.0, 36.0, 35.0, 16.0, 11.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4124755859375, -8.106201171875, -7.7999267578125, -7.49365234375, -7.1873779296875, -6.881103515625, -6.5748291015625, -6.2685546875, -5.9622802734375, -5.656005859375, -5.3497314453125, -5.04345703125, -4.7371826171875, -4.430908203125, -4.1246337890625, -3.818359375, -3.5120849609375, -3.205810546875, -2.8995361328125, -2.59326171875, -2.2869873046875, -1.980712890625, -1.6744384765625, -1.3681640625, -1.0618896484375, -0.755615234375, -0.4493408203125, -0.14306640625, 0.1632080078125, 0.469482421875, 0.7757568359375, 1.08203125, 1.3883056640625, 1.694580078125, 2.0008544921875, 2.30712890625, 2.6134033203125, 2.919677734375, 3.2259521484375, 3.5322265625, 3.8385009765625, 4.144775390625, 4.4510498046875, 4.75732421875, 5.0635986328125, 5.369873046875, 5.6761474609375, 5.982421875, 6.2886962890625, 6.594970703125, 6.9012451171875, 7.20751953125, 7.5137939453125, 7.820068359375, 8.1263427734375, 8.4326171875, 8.7388916015625, 9.045166015625, 9.3514404296875, 9.65771484375, 9.9639892578125, 10.270263671875, 10.5765380859375, 10.8828125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 6.0, 14.0, 21.0, 16.0, 37.0, 58.0, 90.0, 114.0, 162.0, 273.0, 385.0, 777.0, 9814.0, 3827696.0, 351404.0, 1916.0, 515.0, 302.0, 200.0, 169.0, 104.0, 67.0, 46.0, 27.0, 17.0, 15.0, 9.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.5146484375, -36.435546875, -35.3564453125, -34.27734375, -33.1982421875, -32.119140625, -31.0400390625, -29.9609375, -28.8818359375, -27.802734375, -26.7236328125, -25.64453125, -24.5654296875, -23.486328125, -22.4072265625, -21.328125, -20.2490234375, -19.169921875, -18.0908203125, -17.01171875, -15.9326171875, -14.853515625, -13.7744140625, -12.6953125, -11.6162109375, -10.537109375, -9.4580078125, -8.37890625, -7.2998046875, -6.220703125, -5.1416015625, -4.0625, -2.9833984375, -1.904296875, -0.8251953125, 0.25390625, 1.3330078125, 2.412109375, 3.4912109375, 4.5703125, 5.6494140625, 6.728515625, 7.8076171875, 8.88671875, 9.9658203125, 11.044921875, 12.1240234375, 13.203125, 14.2822265625, 15.361328125, 16.4404296875, 17.51953125, 18.5986328125, 19.677734375, 20.7568359375, 21.8359375, 22.9150390625, 23.994140625, 25.0732421875, 26.15234375, 27.2314453125, 28.310546875, 29.3896484375, 30.46875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 232.0, 594.0, 172.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.4194793701172, -152.83926391601562, -147.25904846191406, -141.6788330078125, -136.09861755371094, -130.51840209960938, -124.93819427490234, -119.35797882080078, -113.77776336669922, -108.19754791259766, -102.6173324584961, -97.03712463378906, -91.4569091796875, -85.87669372558594, -80.29647827148438, -74.71626281738281, -69.13604736328125, -63.55583190917969, -57.975616455078125, -52.39540481567383, -46.815189361572266, -41.2349739074707, -35.654762268066406, -30.074546813964844, -24.49433135986328, -18.91411590576172, -13.333902359008789, -7.753688812255859, -2.173473358154297, 3.4067420959472656, 8.986953735351562, 14.567169189453125, 20.147369384765625, 25.727584838867188, 31.307798385620117, 36.88801193237305, 42.46822738647461, 48.04844284057617, 53.62865447998047, 59.20886993408203, 64.7890853881836, 70.36930084228516, 75.94951629638672, 81.52972412109375, 87.10993957519531, 92.69015502929688, 98.27037048339844, 103.8505859375, 109.43080139160156, 115.01101684570312, 120.59123229980469, 126.17144775390625, 131.7516632080078, 137.33187866210938, 142.91207885742188, 148.4923095703125, 154.072509765625, 159.65272521972656, 165.23294067382812, 170.8131561279297, 176.39337158203125, 181.9735870361328, 187.55380249023438, 193.13400268554688, 198.7142333984375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 7.0, 12.0, 8.0, 9.0, 16.0, 13.0, 17.0, 18.0, 26.0, 24.0, 26.0, 30.0, 27.0, 41.0, 40.0, 36.0, 39.0, 37.0, 45.0, 50.0, 47.0, 38.0, 37.0, 42.0, 40.0, 34.0, 27.0, 28.0, 25.0, 23.0, 23.0, 23.0, 10.0, 11.0, 15.0, 10.0, 14.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.617599487304688, -24.805749893188477, -23.993900299072266, -23.182048797607422, -22.37019920349121, -21.558349609375, -20.74650001525879, -19.934650421142578, -19.122798919677734, -18.310949325561523, -17.499099731445312, -16.68724822998047, -15.875398635864258, -15.063549041748047, -14.251699447631836, -13.439849853515625, -12.628000259399414, -11.816150665283203, -11.004300117492676, -10.192450523376465, -9.380599975585938, -8.568750381469727, -7.756900787353516, -6.9450507164001465, -6.133200645446777, -5.321350574493408, -4.509500503540039, -3.697650909423828, -2.885800838470459, -2.07395076751709, -1.262101173400879, -0.45025110244750977, 0.3616008758544922, 1.1734508275985718, 1.9853007793426514, 2.7971506118774414, 3.6090006828308105, 4.42085075378418, 5.232700347900391, 6.04455041885376, 6.856400489807129, 7.668250560760498, 8.480100631713867, 9.291950225830078, 10.103799819946289, 10.915650367736816, 11.727499961853027, 12.539350509643555, 13.351200103759766, 14.163049697875977, 14.974900245666504, 15.786749839782715, 16.598600387573242, 17.410449981689453, 18.222299575805664, 19.034149169921875, 19.84600067138672, 20.65785026550293, 21.46969985961914, 22.281551361083984, 23.093400955200195, 23.905250549316406, 24.717100143432617, 25.528949737548828, 26.34079933166504]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 18.0, 10.0, 15.0, 23.0, 23.0, 23.0, 24.0, 30.0, 29.0, 33.0, 38.0, 46.0, 40.0, 30.0, 54.0, 46.0, 43.0, 38.0, 45.0, 43.0, 33.0, 37.0, 39.0, 38.0, 26.0, 19.0, 9.0, 16.0, 21.0, 15.0, 11.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.78204345703125, -3.6656494140625, -3.54925537109375, -3.432861328125, -3.31646728515625, -3.2000732421875, -3.08367919921875, -2.96728515625, -2.85089111328125, -2.7344970703125, -2.61810302734375, -2.501708984375, -2.38531494140625, -2.2689208984375, -2.15252685546875, -2.0361328125, -1.91973876953125, -1.8033447265625, -1.68695068359375, -1.570556640625, -1.45416259765625, -1.3377685546875, -1.22137451171875, -1.10498046875, -0.98858642578125, -0.8721923828125, -0.75579833984375, -0.639404296875, -0.52301025390625, -0.4066162109375, -0.29022216796875, -0.173828125, -0.05743408203125, 0.0589599609375, 0.17535400390625, 0.291748046875, 0.40814208984375, 0.5245361328125, 0.64093017578125, 0.75732421875, 0.87371826171875, 0.9901123046875, 1.10650634765625, 1.222900390625, 1.33929443359375, 1.4556884765625, 1.57208251953125, 1.6884765625, 1.80487060546875, 1.9212646484375, 2.03765869140625, 2.154052734375, 2.27044677734375, 2.3868408203125, 2.50323486328125, 2.61962890625, 2.73602294921875, 2.8524169921875, 2.96881103515625, 3.085205078125, 3.20159912109375, 3.3179931640625, 3.43438720703125, 3.55078125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 11.0, 22.0, 31.0, 36.0, 54.0, 74.0, 113.0, 163.0, 230.0, 352.0, 511.0, 711.0, 992.0, 1471.0, 2058.0, 3092.0, 4357.0, 6194.0, 9273.0, 13450.0, 20537.0, 31857.0, 51407.0, 89186.0, 176059.0, 283937.0, 144756.0, 76359.0, 45400.0, 28111.0, 18476.0, 12333.0, 8357.0, 5685.0, 3894.0, 2703.0, 1873.0, 1284.0, 922.0, 686.0, 468.0, 345.0, 220.0, 149.0, 114.0, 78.0, 46.0, 42.0, 31.0, 7.0, 14.0, 8.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.6064453125, -0.5882720947265625, -0.570098876953125, -0.5519256591796875, -0.53375244140625, -0.5155792236328125, -0.497406005859375, -0.4792327880859375, -0.4610595703125, -0.4428863525390625, -0.424713134765625, -0.4065399169921875, -0.38836669921875, -0.3701934814453125, -0.352020263671875, -0.3338470458984375, -0.315673828125, -0.2975006103515625, -0.279327392578125, -0.2611541748046875, -0.24298095703125, -0.2248077392578125, -0.206634521484375, -0.1884613037109375, -0.1702880859375, -0.1521148681640625, -0.133941650390625, -0.1157684326171875, -0.09759521484375, -0.0794219970703125, -0.061248779296875, -0.0430755615234375, -0.02490234375, -0.0067291259765625, 0.011444091796875, 0.0296173095703125, 0.04779052734375, 0.0659637451171875, 0.084136962890625, 0.1023101806640625, 0.1204833984375, 0.1386566162109375, 0.156829833984375, 0.1750030517578125, 0.19317626953125, 0.2113494873046875, 0.229522705078125, 0.2476959228515625, 0.265869140625, 0.2840423583984375, 0.302215576171875, 0.3203887939453125, 0.33856201171875, 0.3567352294921875, 0.374908447265625, 0.3930816650390625, 0.4112548828125, 0.4294281005859375, 0.447601318359375, 0.4657745361328125, 0.48394775390625, 0.5021209716796875, 0.520294189453125, 0.5384674072265625, 0.556640625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 13.0, 6.0, 15.0, 12.0, 24.0, 16.0, 19.0, 17.0, 28.0, 22.0, 39.0, 25.0, 28.0, 34.0, 43.0, 41.0, 38.0, 1061.0, 36.0, 40.0, 46.0, 31.0, 44.0, 35.0, 26.0, 42.0, 38.0, 22.0, 21.0, 18.0, 21.0, 15.0, 21.0, 9.0, 10.0, 13.0, 11.0, 2.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.158203125, -2.088470458984375, -2.01873779296875, -1.949005126953125, -1.8792724609375, -1.809539794921875, -1.73980712890625, -1.670074462890625, -1.600341796875, -1.530609130859375, -1.46087646484375, -1.391143798828125, -1.3214111328125, -1.251678466796875, -1.18194580078125, -1.112213134765625, -1.04248046875, -0.972747802734375, -0.90301513671875, -0.833282470703125, -0.7635498046875, -0.693817138671875, -0.62408447265625, -0.554351806640625, -0.484619140625, -0.414886474609375, -0.34515380859375, -0.275421142578125, -0.2056884765625, -0.135955810546875, -0.06622314453125, 0.003509521484375, 0.0732421875, 0.142974853515625, 0.21270751953125, 0.282440185546875, 0.3521728515625, 0.421905517578125, 0.49163818359375, 0.561370849609375, 0.631103515625, 0.700836181640625, 0.77056884765625, 0.840301513671875, 0.9100341796875, 0.979766845703125, 1.04949951171875, 1.119232177734375, 1.18896484375, 1.258697509765625, 1.32843017578125, 1.398162841796875, 1.4678955078125, 1.537628173828125, 1.60736083984375, 1.677093505859375, 1.746826171875, 1.816558837890625, 1.88629150390625, 1.956024169921875, 2.0257568359375, 2.095489501953125, 2.16522216796875, 2.234954833984375, 2.3046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 14.0, 11.0, 10.0, 22.0, 28.0, 49.0, 57.0, 99.0, 122.0, 168.0, 248.0, 354.0, 539.0, 728.0, 1063.0, 1507.0, 2031.0, 2870.0, 4194.0, 5664.0, 8085.0, 11297.0, 16352.0, 23637.0, 34971.0, 53150.0, 87596.0, 163476.0, 1304221.0, 142133.0, 77933.0, 48841.0, 32228.0, 21839.0, 14966.0, 10609.0, 7468.0, 5277.0, 3740.0, 2751.0, 1903.0, 1414.0, 997.0, 704.0, 522.0, 362.0, 264.0, 184.0, 139.0, 89.0, 72.0, 41.0, 32.0, 33.0, 13.0, 10.0, 6.0, 2.0, 5.0, 3.0], "bins": [-0.494384765625, -0.4791259765625, -0.4638671875, -0.4486083984375, -0.433349609375, -0.4180908203125, -0.40283203125, -0.3875732421875, -0.372314453125, -0.3570556640625, -0.341796875, -0.3265380859375, -0.311279296875, -0.2960205078125, -0.28076171875, -0.2655029296875, -0.250244140625, -0.2349853515625, -0.2197265625, -0.2044677734375, -0.189208984375, -0.1739501953125, -0.15869140625, -0.1434326171875, -0.128173828125, -0.1129150390625, -0.09765625, -0.0823974609375, -0.067138671875, -0.0518798828125, -0.03662109375, -0.0213623046875, -0.006103515625, 0.0091552734375, 0.0244140625, 0.0396728515625, 0.054931640625, 0.0701904296875, 0.08544921875, 0.1007080078125, 0.115966796875, 0.1312255859375, 0.146484375, 0.1617431640625, 0.177001953125, 0.1922607421875, 0.20751953125, 0.2227783203125, 0.238037109375, 0.2532958984375, 0.2685546875, 0.2838134765625, 0.299072265625, 0.3143310546875, 0.32958984375, 0.3448486328125, 0.360107421875, 0.3753662109375, 0.390625, 0.4058837890625, 0.421142578125, 0.4364013671875, 0.45166015625, 0.4669189453125, 0.482177734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 5.0, 5.0, 7.0, 8.0, 16.0, 17.0, 23.0, 46.0, 32.0, 43.0, 49.0, 51.0, 63.0, 60.0, 80.0, 62.0, 59.0, 63.0, 53.0, 50.0, 38.0, 28.0, 29.0, 23.0, 20.0, 12.0, 8.0, 10.0, 5.0, 4.0, 1.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012958049774169922, -0.00012500397861003876, -0.0001204274594783783, -0.00011585094034671783, -0.00011127442121505737, -0.00010669790208339691, -0.00010212138295173645, -9.754486382007599e-05, -9.296834468841553e-05, -8.839182555675507e-05, -8.38153064250946e-05, -7.923878729343414e-05, -7.466226816177368e-05, -7.008574903011322e-05, -6.550922989845276e-05, -6.09327107667923e-05, -5.6356191635131836e-05, -5.1779672503471375e-05, -4.720315337181091e-05, -4.262663424015045e-05, -3.805011510848999e-05, -3.347359597682953e-05, -2.8897076845169067e-05, -2.4320557713508606e-05, -1.9744038581848145e-05, -1.5167519450187683e-05, -1.0591000318527222e-05, -6.01448118686676e-06, -1.4379620552062988e-06, 3.1385570764541626e-06, 7.715076208114624e-06, 1.2291595339775085e-05, 1.6868114471435547e-05, 2.1444633603096008e-05, 2.602115273475647e-05, 3.059767186641693e-05, 3.517419099807739e-05, 3.9750710129737854e-05, 4.4327229261398315e-05, 4.890374839305878e-05, 5.348026752471924e-05, 5.80567866563797e-05, 6.263330578804016e-05, 6.720982491970062e-05, 7.178634405136108e-05, 7.636286318302155e-05, 8.093938231468201e-05, 8.551590144634247e-05, 9.009242057800293e-05, 9.466893970966339e-05, 9.924545884132385e-05, 0.00010382197797298431, 0.00010839849710464478, 0.00011297501623630524, 0.0001175515353679657, 0.00012212805449962616, 0.00012670457363128662, 0.00013128109276294708, 0.00013585761189460754, 0.000140434131026268, 0.00014501065015792847, 0.00014958716928958893, 0.0001541636884212494, 0.00015874020755290985, 0.0001633167266845703]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 8.0, 16.0, 16.0, 27.0, 26.0, 32.0, 41.0, 70.0, 99.0, 131.0, 217.0, 368.0, 1119.0, 209194.0, 834384.0, 1637.0, 467.0, 229.0, 120.0, 86.0, 56.0, 58.0, 32.0, 24.0, 18.0, 16.0, 12.0, 4.0, 8.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0035247802734375, -0.00342714786529541, -0.0033295154571533203, -0.0032318830490112305, -0.0031342506408691406, -0.0030366182327270508, -0.002938985824584961, -0.002841353416442871, -0.0027437210083007812, -0.0026460886001586914, -0.0025484561920166016, -0.0024508237838745117, -0.002353191375732422, -0.002255558967590332, -0.002157926559448242, -0.0020602941513061523, -0.0019626617431640625, -0.0018650293350219727, -0.0017673969268798828, -0.001669764518737793, -0.0015721321105957031, -0.0014744997024536133, -0.0013768672943115234, -0.0012792348861694336, -0.0011816024780273438, -0.001083970069885254, -0.000986337661743164, -0.0008887052536010742, -0.0007910728454589844, -0.0006934404373168945, -0.0005958080291748047, -0.0004981756210327148, -0.000400543212890625, -0.00030291080474853516, -0.0002052783966064453, -0.00010764598846435547, -1.0013580322265625e-05, 8.761882781982422e-05, 0.00018525123596191406, 0.0002828836441040039, 0.00038051605224609375, 0.0004781484603881836, 0.0005757808685302734, 0.0006734132766723633, 0.0007710456848144531, 0.000868678092956543, 0.0009663105010986328, 0.0010639429092407227, 0.0011615753173828125, 0.0012592077255249023, 0.0013568401336669922, 0.001454472541809082, 0.0015521049499511719, 0.0016497373580932617, 0.0017473697662353516, 0.0018450021743774414, 0.0019426345825195312, 0.002040266990661621, 0.002137899398803711, 0.0022355318069458008, 0.0023331642150878906, 0.0024307966232299805, 0.0025284290313720703, 0.00262606143951416, 0.00272369384765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 38.0, 159.0, 275.0, 277.0, 157.0, 70.0, 16.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016755824617575854, -0.00016060580674093217, -0.0001536533673061058, -0.00014670092787127942, -0.00013974847388453782, -0.00013279603444971144, -0.00012584359501488507, -0.0001188911555800587, -0.00011193871614523232, -0.00010498627671040595, -9.803383727557957e-05, -9.108139056479558e-05, -8.412895112996921e-05, -7.717651169514284e-05, -7.022406498435885e-05, -6.327162554953247e-05, -5.63191861147061e-05, -4.9366746679879725e-05, -4.2414303607074544e-05, -3.546186053426936e-05, -2.850942109944299e-05, -2.1556981664616615e-05, -1.4604538591811433e-05, -7.652095519006252e-06, -6.996560841798782e-07, 6.252785169635899e-06, 1.3205226423451677e-05, 2.0157667677267455e-05, 2.7110108931083232e-05, 3.4062548365909606e-05, 4.101499143871479e-05, 4.796743451151997e-05, 5.491988849826157e-05, 6.187232793308794e-05, 6.882476736791432e-05, 7.577721407869831e-05, 8.272965351352468e-05, 8.968209294835106e-05, 9.663453965913504e-05, 0.00010358697909396142, 0.00011053941852878779, 0.00011749185796361417, 0.00012444429739844054, 0.00013139673683326691, 0.00013834919082000852, 0.0001453016302548349, 0.00015225406968966126, 0.00015920650912448764, 0.000166158948559314, 0.0001731113879941404, 0.00018006382742896676, 0.00018701626686379313, 0.0001939687062986195, 0.00020092114573344588, 0.00020787359972018749, 0.00021482603915501386, 0.00022177847858984023, 0.0002287309180246666, 0.00023568335745949298, 0.00024263579689431936, 0.00024958825088106096, 0.00025654069031588733, 0.0002634931297507137, 0.0002704455691855401, 0.00027739800862036645]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 3.0, 6.0, 4.0, 6.0, 3.0, 10.0, 7.0, 18.0, 14.0, 12.0, 19.0, 38.0, 17.0, 25.0, 24.0, 33.0, 39.0, 48.0, 32.0, 38.0, 31.0, 37.0, 50.0, 47.0, 40.0, 36.0, 32.0, 29.0, 31.0, 33.0, 25.0, 28.0, 26.0, 19.0, 17.0, 22.0, 12.0, 9.0, 18.0, 13.0, 7.0, 8.0, 3.0, 8.0, 5.0, 11.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.538629531860352e-05, -6.334111094474792e-05, -6.129592657089233e-05, -5.925074219703674e-05, -5.720555782318115e-05, -5.516037344932556e-05, -5.311518907546997e-05, -5.107000470161438e-05, -4.902482032775879e-05, -4.69796359539032e-05, -4.493445158004761e-05, -4.2889267206192017e-05, -4.0844082832336426e-05, -3.8798898458480835e-05, -3.6753714084625244e-05, -3.470852971076965e-05, -3.266334533691406e-05, -3.061816096305847e-05, -2.857297658920288e-05, -2.652779221534729e-05, -2.44826078414917e-05, -2.243742346763611e-05, -2.0392239093780518e-05, -1.8347054719924927e-05, -1.6301870346069336e-05, -1.4256685972213745e-05, -1.2211501598358154e-05, -1.0166317224502563e-05, -8.121132850646973e-06, -6.075948476791382e-06, -4.030764102935791e-06, -1.9855797290802e-06, 5.960464477539063e-08, 2.1047890186309814e-06, 4.149973392486572e-06, 6.195157766342163e-06, 8.240342140197754e-06, 1.0285526514053345e-05, 1.2330710887908936e-05, 1.4375895261764526e-05, 1.6421079635620117e-05, 1.8466264009475708e-05, 2.05114483833313e-05, 2.255663275718689e-05, 2.460181713104248e-05, 2.664700150489807e-05, 2.8692185878753662e-05, 3.073737025260925e-05, 3.2782554626464844e-05, 3.4827739000320435e-05, 3.6872923374176025e-05, 3.8918107748031616e-05, 4.096329212188721e-05, 4.30084764957428e-05, 4.505366086959839e-05, 4.709884524345398e-05, 4.914402961730957e-05, 5.118921399116516e-05, 5.323439836502075e-05, 5.527958273887634e-05, 5.7324767112731934e-05, 5.9369951486587524e-05, 6.141513586044312e-05, 6.34603202342987e-05, 6.55055046081543e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 5.0, 18.0, 10.0, 15.0, 23.0, 23.0, 23.0, 24.0, 30.0, 29.0, 33.0, 38.0, 46.0, 40.0, 30.0, 54.0, 46.0, 43.0, 38.0, 45.0, 43.0, 33.0, 37.0, 39.0, 38.0, 26.0, 19.0, 9.0, 16.0, 21.0, 15.0, 11.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8984375, -3.78204345703125, -3.6656494140625, -3.54925537109375, -3.432861328125, -3.31646728515625, -3.2000732421875, -3.08367919921875, -2.96728515625, -2.85089111328125, -2.7344970703125, -2.61810302734375, -2.501708984375, -2.38531494140625, -2.2689208984375, -2.15252685546875, -2.0361328125, -1.91973876953125, -1.8033447265625, -1.68695068359375, -1.570556640625, -1.45416259765625, -1.3377685546875, -1.22137451171875, -1.10498046875, -0.98858642578125, -0.8721923828125, -0.75579833984375, -0.639404296875, -0.52301025390625, -0.4066162109375, -0.29022216796875, -0.173828125, -0.05743408203125, 0.0589599609375, 0.17535400390625, 0.291748046875, 0.40814208984375, 0.5245361328125, 0.64093017578125, 0.75732421875, 0.87371826171875, 0.9901123046875, 1.10650634765625, 1.222900390625, 1.33929443359375, 1.4556884765625, 1.57208251953125, 1.6884765625, 1.80487060546875, 1.9212646484375, 2.03765869140625, 2.154052734375, 2.27044677734375, 2.3868408203125, 2.50323486328125, 2.61962890625, 2.73602294921875, 2.8524169921875, 2.96881103515625, 3.085205078125, 3.20159912109375, 3.3179931640625, 3.43438720703125, 3.55078125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 17.0, 10.0, 20.0, 25.0, 37.0, 55.0, 57.0, 89.0, 121.0, 197.0, 308.0, 460.0, 873.0, 1687.0, 3702.0, 8564.0, 20025.0, 48135.0, 115888.0, 271075.0, 327819.0, 144160.0, 60278.0, 25085.0, 10444.0, 4628.0, 2077.0, 1074.0, 581.0, 334.0, 213.0, 130.0, 119.0, 70.0, 55.0, 43.0, 33.0, 25.0, 7.0, 13.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.68359375, -3.568939208984375, -3.45428466796875, -3.339630126953125, -3.2249755859375, -3.110321044921875, -2.99566650390625, -2.881011962890625, -2.766357421875, -2.651702880859375, -2.53704833984375, -2.422393798828125, -2.3077392578125, -2.193084716796875, -2.07843017578125, -1.963775634765625, -1.84912109375, -1.734466552734375, -1.61981201171875, -1.505157470703125, -1.3905029296875, -1.275848388671875, -1.16119384765625, -1.046539306640625, -0.931884765625, -0.817230224609375, -0.70257568359375, -0.587921142578125, -0.4732666015625, -0.358612060546875, -0.24395751953125, -0.129302978515625, -0.0146484375, 0.100006103515625, 0.21466064453125, 0.329315185546875, 0.4439697265625, 0.558624267578125, 0.67327880859375, 0.787933349609375, 0.902587890625, 1.017242431640625, 1.13189697265625, 1.246551513671875, 1.3612060546875, 1.475860595703125, 1.59051513671875, 1.705169677734375, 1.81982421875, 1.934478759765625, 2.04913330078125, 2.163787841796875, 2.2784423828125, 2.393096923828125, 2.50775146484375, 2.622406005859375, 2.737060546875, 2.851715087890625, 2.96636962890625, 3.081024169921875, 3.1956787109375, 3.310333251953125, 3.42498779296875, 3.539642333984375, 3.654296875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 6.0, 2.0, 7.0, 14.0, 12.0, 13.0, 13.0, 24.0, 27.0, 28.0, 36.0, 41.0, 39.0, 56.0, 58.0, 60.0, 121.0, 279.0, 1507.0, 210.0, 83.0, 64.0, 50.0, 45.0, 38.0, 30.0, 24.0, 28.0, 21.0, 23.0, 18.0, 17.0, 7.0, 6.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.3604736328125, -11.924072265625, -11.4876708984375, -11.05126953125, -10.6148681640625, -10.178466796875, -9.7420654296875, -9.3056640625, -8.8692626953125, -8.432861328125, -7.9964599609375, -7.56005859375, -7.1236572265625, -6.687255859375, -6.2508544921875, -5.814453125, -5.3780517578125, -4.941650390625, -4.5052490234375, -4.06884765625, -3.6324462890625, -3.196044921875, -2.7596435546875, -2.3232421875, -1.8868408203125, -1.450439453125, -1.0140380859375, -0.57763671875, -0.1412353515625, 0.295166015625, 0.7315673828125, 1.16796875, 1.6043701171875, 2.040771484375, 2.4771728515625, 2.91357421875, 3.3499755859375, 3.786376953125, 4.2227783203125, 4.6591796875, 5.0955810546875, 5.531982421875, 5.9683837890625, 6.40478515625, 6.8411865234375, 7.277587890625, 7.7139892578125, 8.150390625, 8.5867919921875, 9.023193359375, 9.4595947265625, 9.89599609375, 10.3323974609375, 10.768798828125, 11.2052001953125, 11.6416015625, 12.0780029296875, 12.514404296875, 12.9508056640625, 13.38720703125, 13.8236083984375, 14.260009765625, 14.6964111328125, 15.1328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 8.0, 11.0, 11.0, 10.0, 11.0, 11.0, 15.0, 20.0, 25.0, 58.0, 64.0, 107.0, 188.0, 311.0, 653.0, 6130.0, 3131795.0, 4728.0, 625.0, 341.0, 178.0, 109.0, 74.0, 57.0, 38.0, 39.0, 15.0, 21.0, 6.0, 12.0, 5.0, 7.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.1875, -64.1494140625, -62.111328125, -60.0732421875, -58.03515625, -55.9970703125, -53.958984375, -51.9208984375, -49.8828125, -47.8447265625, -45.806640625, -43.7685546875, -41.73046875, -39.6923828125, -37.654296875, -35.6162109375, -33.578125, -31.5400390625, -29.501953125, -27.4638671875, -25.42578125, -23.3876953125, -21.349609375, -19.3115234375, -17.2734375, -15.2353515625, -13.197265625, -11.1591796875, -9.12109375, -7.0830078125, -5.044921875, -3.0068359375, -0.96875, 1.0693359375, 3.107421875, 5.1455078125, 7.18359375, 9.2216796875, 11.259765625, 13.2978515625, 15.3359375, 17.3740234375, 19.412109375, 21.4501953125, 23.48828125, 25.5263671875, 27.564453125, 29.6025390625, 31.640625, 33.6787109375, 35.716796875, 37.7548828125, 39.79296875, 41.8310546875, 43.869140625, 45.9072265625, 47.9453125, 49.9833984375, 52.021484375, 54.0595703125, 56.09765625, 58.1357421875, 60.173828125, 62.2119140625, 64.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 16.0, 110.0, 511.0, 338.0, 38.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.560304641723633, -17.05166244506836, -14.543020248413086, -12.034379005432129, -9.525736808776855, -7.017094612121582, -4.508453369140625, -1.9998111724853516, 0.5088310241699219, 3.017472982406616, 5.5261149406433105, 8.034756660461426, 10.5433988571167, 13.052041053771973, 15.56068229675293, 18.069324493408203, 20.577966690063477, 23.08660888671875, 25.595251083374023, 28.103893280029297, 30.612533569335938, 33.121177673339844, 35.629817962646484, 38.138458251953125, 40.64710235595703, 43.15574264526367, 45.66438674926758, 48.17302703857422, 50.681671142578125, 53.190311431884766, 55.698951721191406, 58.20759582519531, 60.71623992919922, 63.22488021850586, 65.7335205078125, 68.2421646118164, 70.75080871582031, 73.25945281982422, 75.7680892944336, 78.2767333984375, 80.7853775024414, 83.29402160644531, 85.80265808105469, 88.3113021850586, 90.8199462890625, 93.3285903930664, 95.83722686767578, 98.34587097167969, 100.85450744628906, 103.36315155029297, 105.87178802490234, 108.38043212890625, 110.88907623291016, 113.39772033691406, 115.90635681152344, 118.41500091552734, 120.92364501953125, 123.43228912353516, 125.94092559814453, 128.44956970214844, 130.9582061767578, 133.46685791015625, 135.97549438476562, 138.484130859375, 140.99278259277344]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 12.0, 8.0, 8.0, 16.0, 15.0, 14.0, 10.0, 14.0, 23.0, 20.0, 18.0, 25.0, 18.0, 28.0, 37.0, 41.0, 38.0, 38.0, 35.0, 40.0, 29.0, 32.0, 33.0, 37.0, 28.0, 32.0, 29.0, 26.0, 40.0, 25.0, 28.0, 27.0, 30.0, 25.0, 23.0, 11.0, 13.0, 8.0, 13.0, 12.0, 7.0, 4.0, 4.0, 5.0, 8.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0], "bins": [-32.69915771484375, -31.740915298461914, -30.782670974731445, -29.82442855834961, -28.86618423461914, -27.907941818237305, -26.94969940185547, -25.991455078125, -25.033212661743164, -24.074970245361328, -23.11672592163086, -22.158483505249023, -21.200241088867188, -20.24199676513672, -19.283754348754883, -18.325511932373047, -17.367267608642578, -16.409025192260742, -15.450780868530273, -14.492538452148438, -13.534295082092285, -12.576051712036133, -11.617809295654297, -10.659565925598145, -9.701322555541992, -8.74307918548584, -7.784836292266846, -6.826593399047852, -5.868350028991699, -4.910106658935547, -3.9518637657165527, -2.9936208724975586, -2.0353755950927734, -1.0771324634552002, -0.11888933181762695, 0.8393537998199463, 1.7975969314575195, 2.755840301513672, 3.714083194732666, 4.67232608795166, 5.6305694580078125, 6.588812828063965, 7.547055721282959, 8.505298614501953, 9.463541984558105, 10.421785354614258, 11.380027770996094, 12.338271141052246, 13.296514511108398, 14.25475788116455, 15.213001251220703, 16.17124366760254, 17.129486083984375, 18.087730407714844, 19.04597282409668, 20.004215240478516, 20.962459564208984, 21.92070198059082, 22.87894630432129, 23.837188720703125, 24.795433044433594, 25.75367546081543, 26.711917877197266, 27.670162200927734, 28.62840461730957]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 16.0, 7.0, 8.0, 11.0, 17.0, 16.0, 18.0, 25.0, 22.0, 28.0, 29.0, 41.0, 37.0, 35.0, 52.0, 41.0, 34.0, 44.0, 40.0, 42.0, 51.0, 40.0, 30.0, 38.0, 34.0, 29.0, 36.0, 21.0, 16.0, 18.0, 16.0, 15.0, 13.0, 15.0, 6.0, 8.0, 4.0, 11.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-4.75390625, -4.62432861328125, -4.4947509765625, -4.36517333984375, -4.235595703125, -4.10601806640625, -3.9764404296875, -3.84686279296875, -3.71728515625, -3.58770751953125, -3.4581298828125, -3.32855224609375, -3.198974609375, -3.06939697265625, -2.9398193359375, -2.81024169921875, -2.6806640625, -2.55108642578125, -2.4215087890625, -2.29193115234375, -2.162353515625, -2.03277587890625, -1.9031982421875, -1.77362060546875, -1.64404296875, -1.51446533203125, -1.3848876953125, -1.25531005859375, -1.125732421875, -0.99615478515625, -0.8665771484375, -0.73699951171875, -0.607421875, -0.47784423828125, -0.3482666015625, -0.21868896484375, -0.089111328125, 0.04046630859375, 0.1700439453125, 0.29962158203125, 0.42919921875, 0.55877685546875, 0.6883544921875, 0.81793212890625, 0.947509765625, 1.07708740234375, 1.2066650390625, 1.33624267578125, 1.4658203125, 1.59539794921875, 1.7249755859375, 1.85455322265625, 1.984130859375, 2.11370849609375, 2.2432861328125, 2.37286376953125, 2.50244140625, 2.63201904296875, 2.7615966796875, 2.89117431640625, 3.020751953125, 3.15032958984375, 3.2799072265625, 3.40948486328125, 3.5390625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 8.0, 11.0, 7.0, 15.0, 12.0, 11.0, 20.0, 21.0, 24.0, 37.0, 59.0, 77.0, 106.0, 167.0, 285.0, 676.0, 2834.0, 33418.0, 785883.0, 2789221.0, 553822.0, 23917.0, 2219.0, 581.0, 283.0, 162.0, 99.0, 64.0, 58.0, 34.0, 33.0, 21.0, 15.0, 12.0, 9.0, 10.0, 10.0, 5.0, 9.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0, -10.6895751953125, -10.379150390625, -10.0687255859375, -9.75830078125, -9.4478759765625, -9.137451171875, -8.8270263671875, -8.5166015625, -8.2061767578125, -7.895751953125, -7.5853271484375, -7.27490234375, -6.9644775390625, -6.654052734375, -6.3436279296875, -6.033203125, -5.7227783203125, -5.412353515625, -5.1019287109375, -4.79150390625, -4.4810791015625, -4.170654296875, -3.8602294921875, -3.5498046875, -3.2393798828125, -2.928955078125, -2.6185302734375, -2.30810546875, -1.9976806640625, -1.687255859375, -1.3768310546875, -1.06640625, -0.7559814453125, -0.445556640625, -0.1351318359375, 0.17529296875, 0.4857177734375, 0.796142578125, 1.1065673828125, 1.4169921875, 1.7274169921875, 2.037841796875, 2.3482666015625, 2.65869140625, 2.9691162109375, 3.279541015625, 3.5899658203125, 3.900390625, 4.2108154296875, 4.521240234375, 4.8316650390625, 5.14208984375, 5.4525146484375, 5.762939453125, 6.0733642578125, 6.3837890625, 6.6942138671875, 7.004638671875, 7.3150634765625, 7.62548828125, 7.9359130859375, 8.246337890625, 8.5567626953125, 8.8671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 17.0, 26.0, 20.0, 43.0, 50.0, 74.0, 98.0, 125.0, 148.0, 230.0, 317.0, 371.0, 411.0, 443.0, 401.0, 326.0, 245.0, 185.0, 135.0, 93.0, 60.0, 53.0, 36.0, 37.0, 29.0, 15.0, 8.0, 14.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.41644287109375, -7.1766357421875, -6.93682861328125, -6.697021484375, -6.45721435546875, -6.2174072265625, -5.97760009765625, -5.73779296875, -5.49798583984375, -5.2581787109375, -5.01837158203125, -4.778564453125, -4.53875732421875, -4.2989501953125, -4.05914306640625, -3.8193359375, -3.57952880859375, -3.3397216796875, -3.09991455078125, -2.860107421875, -2.62030029296875, -2.3804931640625, -2.14068603515625, -1.90087890625, -1.66107177734375, -1.4212646484375, -1.18145751953125, -0.941650390625, -0.70184326171875, -0.4620361328125, -0.22222900390625, 0.017578125, 0.25738525390625, 0.4971923828125, 0.73699951171875, 0.976806640625, 1.21661376953125, 1.4564208984375, 1.69622802734375, 1.93603515625, 2.17584228515625, 2.4156494140625, 2.65545654296875, 2.895263671875, 3.13507080078125, 3.3748779296875, 3.61468505859375, 3.8544921875, 4.09429931640625, 4.3341064453125, 4.57391357421875, 4.813720703125, 5.05352783203125, 5.2933349609375, 5.53314208984375, 5.77294921875, 6.01275634765625, 6.2525634765625, 6.49237060546875, 6.732177734375, 6.97198486328125, 7.2117919921875, 7.45159912109375, 7.69140625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 10.0, 14.0, 18.0, 17.0, 27.0, 39.0, 52.0, 66.0, 78.0, 92.0, 146.0, 190.0, 259.0, 388.0, 556.0, 2700.0, 316918.0, 3824235.0, 45760.0, 1124.0, 464.0, 277.0, 175.0, 154.0, 118.0, 114.0, 73.0, 53.0, 41.0, 24.0, 27.0, 20.0, 14.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.21875, -25.40771484375, -24.5966796875, -23.78564453125, -22.974609375, -22.16357421875, -21.3525390625, -20.54150390625, -19.73046875, -18.91943359375, -18.1083984375, -17.29736328125, -16.486328125, -15.67529296875, -14.8642578125, -14.05322265625, -13.2421875, -12.43115234375, -11.6201171875, -10.80908203125, -9.998046875, -9.18701171875, -8.3759765625, -7.56494140625, -6.75390625, -5.94287109375, -5.1318359375, -4.32080078125, -3.509765625, -2.69873046875, -1.8876953125, -1.07666015625, -0.265625, 0.54541015625, 1.3564453125, 2.16748046875, 2.978515625, 3.78955078125, 4.6005859375, 5.41162109375, 6.22265625, 7.03369140625, 7.8447265625, 8.65576171875, 9.466796875, 10.27783203125, 11.0888671875, 11.89990234375, 12.7109375, 13.52197265625, 14.3330078125, 15.14404296875, 15.955078125, 16.76611328125, 17.5771484375, 18.38818359375, 19.19921875, 20.01025390625, 20.8212890625, 21.63232421875, 22.443359375, 23.25439453125, 24.0654296875, 24.87646484375, 25.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 52.0, 185.0, 376.0, 286.0, 93.0, 12.0, 2.0, 1.0, 0.0, 1.0], "bins": [-181.3253936767578, -178.1287078857422, -174.93203735351562, -171.7353515625, -168.53868103027344, -165.3419952392578, -162.14532470703125, -158.94863891601562, -155.751953125, -152.55526733398438, -149.3585968017578, -146.1619110107422, -142.96524047851562, -139.7685546875, -136.57186889648438, -133.3751983642578, -130.17852783203125, -126.98184967041016, -123.78517150878906, -120.58848571777344, -117.39180755615234, -114.19512939453125, -110.99845123291016, -107.80177307128906, -104.60508728027344, -101.40840911865234, -98.21173095703125, -95.01504516601562, -91.81836700439453, -88.62168884277344, -85.42501068115234, -82.22833251953125, -79.03164672851562, -75.83496856689453, -72.63829040527344, -69.44160461425781, -66.24492645263672, -63.048248291015625, -59.85157012939453, -56.65489196777344, -53.458213806152344, -50.26153564453125, -47.06485366821289, -43.8681755065918, -40.6714973449707, -37.474815368652344, -34.27813720703125, -31.081459045410156, -27.88477897644043, -24.688098907470703, -21.49142074584961, -18.294740676879883, -15.098061561584473, -11.901382446289062, -8.704702377319336, -5.508024215698242, -2.3113441467285156, 0.8853352069854736, 4.082014560699463, 7.278694152832031, 10.475373268127441, 13.672052383422852, 16.868732452392578, 20.065410614013672, 23.2620906829834]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 12.0, 6.0, 13.0, 13.0, 20.0, 18.0, 24.0, 26.0, 30.0, 37.0, 27.0, 47.0, 36.0, 36.0, 37.0, 41.0, 40.0, 42.0, 44.0, 42.0, 42.0, 42.0, 31.0, 39.0, 38.0, 29.0, 27.0, 25.0, 18.0, 22.0, 14.0, 18.0, 16.0, 8.0, 7.0, 8.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.400285720825195, -26.552488327026367, -25.704692840576172, -24.856895446777344, -24.009098052978516, -23.161300659179688, -22.313505172729492, -21.465707778930664, -20.61791229248047, -19.77011489868164, -18.922319412231445, -18.074522018432617, -17.22672462463379, -16.378929138183594, -15.531131744384766, -14.683334350585938, -13.83553695678711, -12.987740516662598, -12.13994312286377, -11.292146682739258, -10.44434928894043, -9.596552848815918, -8.748756408691406, -7.900959491729736, -7.053162574768066, -6.2053656578063965, -5.357568740844727, -4.509772300720215, -3.661975383758545, -2.814178466796875, -1.9663820266723633, -1.1185851097106934, -0.2707862854003906, 0.5770105123519897, 1.4248073101043701, 2.272603988647461, 3.120400905609131, 3.968197822570801, 4.8159942626953125, 5.663791179656982, 6.511588096618652, 7.359385013580322, 8.207181930541992, 9.054978370666504, 9.902774810791016, 10.750572204589844, 11.598368644714355, 12.446165084838867, 13.293962478637695, 14.141758918762207, 14.989556312561035, 15.837352752685547, 16.685150146484375, 17.532947540283203, 18.3807430267334, 19.228540420532227, 20.076335906982422, 20.92413330078125, 21.771928787231445, 22.619726181030273, 23.4675235748291, 24.315319061279297, 25.163116455078125, 26.010913848876953, 26.85871124267578]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 13.0, 16.0, 21.0, 17.0, 26.0, 20.0, 30.0, 26.0, 29.0, 30.0, 34.0, 41.0, 32.0, 30.0, 55.0, 39.0, 45.0, 36.0, 38.0, 32.0, 41.0, 35.0, 41.0, 32.0, 25.0, 23.0, 19.0, 23.0, 18.0, 15.0, 8.0, 8.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.507965087890625, -3.39288330078125, -3.277801513671875, -3.1627197265625, -3.047637939453125, -2.93255615234375, -2.817474365234375, -2.702392578125, -2.587310791015625, -2.47222900390625, -2.357147216796875, -2.2420654296875, -2.126983642578125, -2.01190185546875, -1.896820068359375, -1.78173828125, -1.666656494140625, -1.55157470703125, -1.436492919921875, -1.3214111328125, -1.206329345703125, -1.09124755859375, -0.976165771484375, -0.861083984375, -0.746002197265625, -0.63092041015625, -0.515838623046875, -0.4007568359375, -0.285675048828125, -0.17059326171875, -0.055511474609375, 0.0595703125, 0.174652099609375, 0.28973388671875, 0.404815673828125, 0.5198974609375, 0.634979248046875, 0.75006103515625, 0.865142822265625, 0.980224609375, 1.095306396484375, 1.21038818359375, 1.325469970703125, 1.4405517578125, 1.555633544921875, 1.67071533203125, 1.785797119140625, 1.90087890625, 2.015960693359375, 2.13104248046875, 2.246124267578125, 2.3612060546875, 2.476287841796875, 2.59136962890625, 2.706451416015625, 2.821533203125, 2.936614990234375, 3.05169677734375, 3.166778564453125, 3.2818603515625, 3.396942138671875, 3.51202392578125, 3.627105712890625, 3.7421875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 13.0, 22.0, 25.0, 43.0, 67.0, 98.0, 129.0, 188.0, 274.0, 402.0, 578.0, 834.0, 1165.0, 1766.0, 2577.0, 3796.0, 5471.0, 8384.0, 12478.0, 19027.0, 29713.0, 47320.0, 78849.0, 146605.0, 282241.0, 170482.0, 89136.0, 52020.0, 32468.0, 20932.0, 13398.0, 9145.0, 5962.0, 3992.0, 2753.0, 1932.0, 1370.0, 925.0, 577.0, 424.0, 326.0, 185.0, 132.0, 125.0, 68.0, 54.0, 23.0, 18.0, 20.0, 11.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.62060546875, -0.6015701293945312, -0.5825347900390625, -0.5634994506835938, -0.544464111328125, -0.5254287719726562, -0.5063934326171875, -0.48735809326171875, -0.46832275390625, -0.44928741455078125, -0.4302520751953125, -0.41121673583984375, -0.392181396484375, -0.37314605712890625, -0.3541107177734375, -0.33507537841796875, -0.3160400390625, -0.29700469970703125, -0.2779693603515625, -0.25893402099609375, -0.239898681640625, -0.22086334228515625, -0.2018280029296875, -0.18279266357421875, -0.16375732421875, -0.14472198486328125, -0.1256866455078125, -0.10665130615234375, -0.087615966796875, -0.06858062744140625, -0.0495452880859375, -0.03050994873046875, -0.011474609375, 0.00756072998046875, 0.0265960693359375, 0.04563140869140625, 0.064666748046875, 0.08370208740234375, 0.1027374267578125, 0.12177276611328125, 0.14080810546875, 0.15984344482421875, 0.1788787841796875, 0.19791412353515625, 0.216949462890625, 0.23598480224609375, 0.2550201416015625, 0.27405548095703125, 0.2930908203125, 0.31212615966796875, 0.3311614990234375, 0.35019683837890625, 0.369232177734375, 0.38826751708984375, 0.4073028564453125, 0.42633819580078125, 0.44537353515625, 0.46440887451171875, 0.4834442138671875, 0.5024795532226562, 0.521514892578125, 0.5405502319335938, 0.5595855712890625, 0.5786209106445312, 0.59765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 6.0, 11.0, 6.0, 16.0, 12.0, 19.0, 21.0, 23.0, 25.0, 24.0, 29.0, 22.0, 28.0, 33.0, 22.0, 42.0, 39.0, 43.0, 1069.0, 45.0, 28.0, 40.0, 36.0, 48.0, 37.0, 37.0, 34.0, 36.0, 32.0, 18.0, 22.0, 23.0, 19.0, 17.0, 8.0, 14.0, 6.0, 5.0, 6.0, 3.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.3487548828125, -2.271728515625, -2.1947021484375, -2.11767578125, -2.0406494140625, -1.963623046875, -1.8865966796875, -1.8095703125, -1.7325439453125, -1.655517578125, -1.5784912109375, -1.50146484375, -1.4244384765625, -1.347412109375, -1.2703857421875, -1.193359375, -1.1163330078125, -1.039306640625, -0.9622802734375, -0.88525390625, -0.8082275390625, -0.731201171875, -0.6541748046875, -0.5771484375, -0.5001220703125, -0.423095703125, -0.3460693359375, -0.26904296875, -0.1920166015625, -0.114990234375, -0.0379638671875, 0.0390625, 0.1160888671875, 0.193115234375, 0.2701416015625, 0.34716796875, 0.4241943359375, 0.501220703125, 0.5782470703125, 0.6552734375, 0.7322998046875, 0.809326171875, 0.8863525390625, 0.96337890625, 1.0404052734375, 1.117431640625, 1.1944580078125, 1.271484375, 1.3485107421875, 1.425537109375, 1.5025634765625, 1.57958984375, 1.6566162109375, 1.733642578125, 1.8106689453125, 1.8876953125, 1.9647216796875, 2.041748046875, 2.1187744140625, 2.19580078125, 2.2728271484375, 2.349853515625, 2.4268798828125, 2.50390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 13.0, 26.0, 47.0, 60.0, 81.0, 124.0, 189.0, 232.0, 306.0, 477.0, 653.0, 944.0, 1371.0, 2014.0, 2689.0, 3915.0, 5623.0, 8057.0, 11734.0, 16563.0, 24304.0, 35424.0, 53516.0, 86596.0, 163923.0, 1307802.0, 140440.0, 77334.0, 48535.0, 32141.0, 21961.0, 15181.0, 10528.0, 7489.0, 5188.0, 3615.0, 2512.0, 1774.0, 1189.0, 783.0, 591.0, 390.0, 268.0, 176.0, 128.0, 61.0, 58.0, 36.0, 15.0, 14.0, 13.0, 11.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.5380859375, -0.5214767456054688, -0.5048675537109375, -0.48825836181640625, -0.471649169921875, -0.45503997802734375, -0.4384307861328125, -0.42182159423828125, -0.40521240234375, -0.38860321044921875, -0.3719940185546875, -0.35538482666015625, -0.338775634765625, -0.32216644287109375, -0.3055572509765625, -0.28894805908203125, -0.2723388671875, -0.25572967529296875, -0.2391204833984375, -0.22251129150390625, -0.205902099609375, -0.18929290771484375, -0.1726837158203125, -0.15607452392578125, -0.13946533203125, -0.12285614013671875, -0.1062469482421875, -0.08963775634765625, -0.073028564453125, -0.05641937255859375, -0.0398101806640625, -0.02320098876953125, -0.006591796875, 0.01001739501953125, 0.0266265869140625, 0.04323577880859375, 0.059844970703125, 0.07645416259765625, 0.0930633544921875, 0.10967254638671875, 0.12628173828125, 0.14289093017578125, 0.1595001220703125, 0.17610931396484375, 0.192718505859375, 0.20932769775390625, 0.2259368896484375, 0.24254608154296875, 0.2591552734375, 0.27576446533203125, 0.2923736572265625, 0.30898284912109375, 0.325592041015625, 0.34220123291015625, 0.3588104248046875, 0.37541961669921875, 0.39202880859375, 0.40863800048828125, 0.4252471923828125, 0.44185638427734375, 0.458465576171875, 0.47507476806640625, 0.4916839599609375, 0.5082931518554688, 0.52490234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 9.0, 5.0, 7.0, 12.0, 18.0, 17.0, 18.0, 24.0, 28.0, 28.0, 39.0, 35.0, 63.0, 68.0, 68.0, 71.0, 70.0, 65.0, 68.0, 55.0, 38.0, 34.0, 42.0, 27.0, 28.0, 11.0, 5.0, 9.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.00014094635844230652, -0.00013621896505355835, -0.00013149157166481018, -0.000126764178276062, -0.00012203678488731384, -0.00011730939149856567, -0.0001125819981098175, -0.00010785460472106934, -0.00010312721133232117, -9.8399817943573e-05, -9.367242455482483e-05, -8.894503116607666e-05, -8.421763777732849e-05, -7.949024438858032e-05, -7.476285099983215e-05, -7.003545761108398e-05, -6.530806422233582e-05, -6.0580670833587646e-05, -5.585327744483948e-05, -5.112588405609131e-05, -4.639849066734314e-05, -4.167109727859497e-05, -3.69437038898468e-05, -3.221631050109863e-05, -2.7488917112350464e-05, -2.2761523723602295e-05, -1.8034130334854126e-05, -1.3306736946105957e-05, -8.579343557357788e-06, -3.851950168609619e-06, 8.754432201385498e-07, 5.602836608886719e-06, 1.0330229997634888e-05, 1.5057623386383057e-05, 1.9785016775131226e-05, 2.4512410163879395e-05, 2.9239803552627563e-05, 3.396719694137573e-05, 3.86945903301239e-05, 4.342198371887207e-05, 4.814937710762024e-05, 5.287677049636841e-05, 5.760416388511658e-05, 6.233155727386475e-05, 6.705895066261292e-05, 7.178634405136108e-05, 7.651373744010925e-05, 8.124113082885742e-05, 8.596852421760559e-05, 9.069591760635376e-05, 9.542331099510193e-05, 0.0001001507043838501, 0.00010487809777259827, 0.00010960549116134644, 0.0001143328845500946, 0.00011906027793884277, 0.00012378767132759094, 0.0001285150647163391, 0.00013324245810508728, 0.00013796985149383545, 0.00014269724488258362, 0.0001474246382713318, 0.00015215203166007996, 0.00015687942504882812]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 5.0, 16.0, 11.0, 16.0, 24.0, 36.0, 50.0, 70.0, 80.0, 119.0, 237.0, 511.0, 2830.0, 1034999.0, 8152.0, 605.0, 266.0, 155.0, 75.0, 58.0, 53.0, 38.0, 27.0, 24.0, 18.0, 13.0, 18.0, 9.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003475189208984375, -0.003368556499481201, -0.0032619237899780273, -0.0031552910804748535, -0.0030486583709716797, -0.002942025661468506, -0.002835392951965332, -0.002728760242462158, -0.0026221275329589844, -0.0025154948234558105, -0.0024088621139526367, -0.002302229404449463, -0.002195596694946289, -0.0020889639854431152, -0.0019823312759399414, -0.0018756985664367676, -0.0017690658569335938, -0.00166243314743042, -0.001555800437927246, -0.0014491677284240723, -0.0013425350189208984, -0.0012359023094177246, -0.0011292695999145508, -0.001022636890411377, -0.0009160041809082031, -0.0008093714714050293, -0.0007027387619018555, -0.0005961060523986816, -0.0004894733428955078, -0.000382840633392334, -0.00027620792388916016, -0.00016957521438598633, -6.29425048828125e-05, 4.369020462036133e-05, 0.00015032291412353516, 0.000256955623626709, 0.0003635883331298828, 0.00047022104263305664, 0.0005768537521362305, 0.0006834864616394043, 0.0007901191711425781, 0.000896751880645752, 0.0010033845901489258, 0.0011100172996520996, 0.0012166500091552734, 0.0013232827186584473, 0.001429915428161621, 0.001536548137664795, 0.0016431808471679688, 0.0017498135566711426, 0.0018564462661743164, 0.0019630789756774902, 0.002069711685180664, 0.002176344394683838, 0.0022829771041870117, 0.0023896098136901855, 0.0024962425231933594, 0.002602875232696533, 0.002709507942199707, 0.002816140651702881, 0.0029227733612060547, 0.0030294060707092285, 0.0031360387802124023, 0.003242671489715576, 0.00334930419921875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 64.0, 330.0, 447.0, 145.0, 23.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005411451566033065, -0.0005305749364197254, -0.0005200047162361443, -0.0005094344960525632, -0.0004988642176613212, -0.00048829399747774, -0.00047772377729415894, -0.0004671535571105778, -0.0004565833369269967, -0.0004460131167434156, -0.000435442867456004, -0.0004248726472724229, -0.0004143024270888418, -0.0004037321778014302, -0.0003931619576178491, -0.000382591737434268, -0.00037202148814685643, -0.0003614512679632753, -0.00035088101867586374, -0.00034031079849228263, -0.0003297405783087015, -0.0003191703581251204, -0.00030860010883770883, -0.0002980298886541277, -0.00028745963936671615, -0.00027688941918313503, -0.00026631916989572346, -0.00025574894971214235, -0.00024517872952856123, -0.0002346084947930649, -0.00022403826005756855, -0.00021346803987398744, -0.00020289779058657587, -0.00019232755585107952, -0.0001817573356674984, -0.00017118710093200207, -0.00016061688074842095, -0.0001500466460129246, -0.00013947641127742827, -0.00012890619109384716, -0.00011833595635835081, -0.00010776572889881209, -9.719550143927336e-05, -8.662526670377702e-05, -7.605503924423829e-05, -6.548481178469956e-05, -5.491457704920322e-05, -4.434434958966449e-05, -3.377412213012576e-05, -2.320389285159763e-05, -1.2633663573069498e-05, -2.063432475551963e-06, 8.506794983986765e-06, 1.9077022443525493e-05, 2.9647257179021835e-05, 4.021748463856056e-05, 5.078771209809929e-05, 6.135793955763802e-05, 7.192816701717675e-05, 8.249840175267309e-05, 9.306862921221182e-05, 0.00010363885667175055, 0.00011420909140724689, 0.00012477932614274323, 0.00013534954632632434]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 12.0, 9.0, 8.0, 13.0, 25.0, 20.0, 16.0, 30.0, 45.0, 33.0, 27.0, 31.0, 47.0, 42.0, 47.0, 48.0, 43.0, 43.0, 51.0, 53.0, 48.0, 39.0, 32.0, 37.0, 27.0, 35.0, 32.0, 17.0, 15.0, 14.0, 10.0, 16.0, 14.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.338689804077148e-05, -8.092913776636124e-05, -7.847137749195099e-05, -7.601361721754074e-05, -7.355585694313049e-05, -7.109809666872025e-05, -6.864033639431e-05, -6.618257611989975e-05, -6.37248158454895e-05, -6.126705557107925e-05, -5.8809295296669006e-05, -5.635153502225876e-05, -5.389377474784851e-05, -5.143601447343826e-05, -4.8978254199028015e-05, -4.652049392461777e-05, -4.406273365020752e-05, -4.160497337579727e-05, -3.9147213101387024e-05, -3.6689452826976776e-05, -3.423169255256653e-05, -3.177393227815628e-05, -2.9316172003746033e-05, -2.6858411729335785e-05, -2.4400651454925537e-05, -2.194289118051529e-05, -1.948513090610504e-05, -1.7027370631694794e-05, -1.4569610357284546e-05, -1.2111850082874298e-05, -9.65408980846405e-06, -7.1963295340538025e-06, -4.738569259643555e-06, -2.280808985233307e-06, 1.7695128917694092e-07, 2.6347115635871887e-06, 5.0924718379974365e-06, 7.550232112407684e-06, 1.0007992386817932e-05, 1.246575266122818e-05, 1.4923512935638428e-05, 1.7381273210048676e-05, 1.9839033484458923e-05, 2.229679375886917e-05, 2.475455403327942e-05, 2.7212314307689667e-05, 2.9670074582099915e-05, 3.212783485651016e-05, 3.458559513092041e-05, 3.704335540533066e-05, 3.9501115679740906e-05, 4.1958875954151154e-05, 4.44166362285614e-05, 4.687439650297165e-05, 4.93321567773819e-05, 5.1789917051792145e-05, 5.424767732620239e-05, 5.670543760061264e-05, 5.916319787502289e-05, 6.162095814943314e-05, 6.407871842384338e-05, 6.653647869825363e-05, 6.899423897266388e-05, 7.145199924707413e-05, 7.390975952148438e-05]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 13.0, 16.0, 21.0, 17.0, 26.0, 20.0, 30.0, 26.0, 29.0, 30.0, 34.0, 41.0, 32.0, 30.0, 55.0, 39.0, 45.0, 36.0, 38.0, 32.0, 41.0, 35.0, 41.0, 32.0, 25.0, 23.0, 19.0, 23.0, 18.0, 15.0, 8.0, 8.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.507965087890625, -3.39288330078125, -3.277801513671875, -3.1627197265625, -3.047637939453125, -2.93255615234375, -2.817474365234375, -2.702392578125, -2.587310791015625, -2.47222900390625, -2.357147216796875, -2.2420654296875, -2.126983642578125, -2.01190185546875, -1.896820068359375, -1.78173828125, -1.666656494140625, -1.55157470703125, -1.436492919921875, -1.3214111328125, -1.206329345703125, -1.09124755859375, -0.976165771484375, -0.861083984375, -0.746002197265625, -0.63092041015625, -0.515838623046875, -0.4007568359375, -0.285675048828125, -0.17059326171875, -0.055511474609375, 0.0595703125, 0.174652099609375, 0.28973388671875, 0.404815673828125, 0.5198974609375, 0.634979248046875, 0.75006103515625, 0.865142822265625, 0.980224609375, 1.095306396484375, 1.21038818359375, 1.325469970703125, 1.4405517578125, 1.555633544921875, 1.67071533203125, 1.785797119140625, 1.90087890625, 2.015960693359375, 2.13104248046875, 2.246124267578125, 2.3612060546875, 2.476287841796875, 2.59136962890625, 2.706451416015625, 2.821533203125, 2.936614990234375, 3.05169677734375, 3.166778564453125, 3.2818603515625, 3.396942138671875, 3.51202392578125, 3.627105712890625, 3.7421875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 10.0, 11.0, 16.0, 24.0, 21.0, 34.0, 40.0, 44.0, 90.0, 117.0, 176.0, 231.0, 372.0, 676.0, 1407.0, 2775.0, 6289.0, 14848.0, 34883.0, 84010.0, 196458.0, 371859.0, 191496.0, 81830.0, 34303.0, 14367.0, 6225.0, 2749.0, 1333.0, 702.0, 374.0, 220.0, 145.0, 102.0, 77.0, 57.0, 42.0, 25.0, 23.0, 22.0, 11.0, 13.0, 12.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.411529541015625, -3.29962158203125, -3.187713623046875, -3.0758056640625, -2.963897705078125, -2.85198974609375, -2.740081787109375, -2.628173828125, -2.516265869140625, -2.40435791015625, -2.292449951171875, -2.1805419921875, -2.068634033203125, -1.95672607421875, -1.844818115234375, -1.73291015625, -1.621002197265625, -1.50909423828125, -1.397186279296875, -1.2852783203125, -1.173370361328125, -1.06146240234375, -0.949554443359375, -0.837646484375, -0.725738525390625, -0.61383056640625, -0.501922607421875, -0.3900146484375, -0.278106689453125, -0.16619873046875, -0.054290771484375, 0.0576171875, 0.169525146484375, 0.28143310546875, 0.393341064453125, 0.5052490234375, 0.617156982421875, 0.72906494140625, 0.840972900390625, 0.952880859375, 1.064788818359375, 1.17669677734375, 1.288604736328125, 1.4005126953125, 1.512420654296875, 1.62432861328125, 1.736236572265625, 1.84814453125, 1.960052490234375, 2.07196044921875, 2.183868408203125, 2.2957763671875, 2.407684326171875, 2.51959228515625, 2.631500244140625, 2.743408203125, 2.855316162109375, 2.96722412109375, 3.079132080078125, 3.1910400390625, 3.302947998046875, 3.41485595703125, 3.526763916015625, 3.638671875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 14.0, 15.0, 15.0, 16.0, 15.0, 13.0, 22.0, 26.0, 18.0, 27.0, 35.0, 33.0, 40.0, 35.0, 54.0, 90.0, 174.0, 1505.0, 344.0, 124.0, 73.0, 48.0, 45.0, 34.0, 34.0, 17.0, 27.0, 23.0, 21.0, 18.0, 15.0, 14.0, 15.0, 13.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8359375, -11.3946533203125, -10.953369140625, -10.5120849609375, -10.07080078125, -9.6295166015625, -9.188232421875, -8.7469482421875, -8.3056640625, -7.8643798828125, -7.423095703125, -6.9818115234375, -6.54052734375, -6.0992431640625, -5.657958984375, -5.2166748046875, -4.775390625, -4.3341064453125, -3.892822265625, -3.4515380859375, -3.01025390625, -2.5689697265625, -2.127685546875, -1.6864013671875, -1.2451171875, -0.8038330078125, -0.362548828125, 0.0787353515625, 0.52001953125, 0.9613037109375, 1.402587890625, 1.8438720703125, 2.28515625, 2.7264404296875, 3.167724609375, 3.6090087890625, 4.05029296875, 4.4915771484375, 4.932861328125, 5.3741455078125, 5.8154296875, 6.2567138671875, 6.697998046875, 7.1392822265625, 7.58056640625, 8.0218505859375, 8.463134765625, 8.9044189453125, 9.345703125, 9.7869873046875, 10.228271484375, 10.6695556640625, 11.11083984375, 11.5521240234375, 11.993408203125, 12.4346923828125, 12.8759765625, 13.3172607421875, 13.758544921875, 14.1998291015625, 14.64111328125, 15.0823974609375, 15.523681640625, 15.9649658203125, 16.40625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 7.0, 9.0, 9.0, 23.0, 32.0, 25.0, 71.0, 102.0, 161.0, 331.0, 790.0, 15921.0, 3124723.0, 2358.0, 476.0, 226.0, 141.0, 95.0, 69.0, 39.0, 29.0, 15.0, 8.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.375, -68.9365234375, -66.498046875, -64.0595703125, -61.62109375, -59.1826171875, -56.744140625, -54.3056640625, -51.8671875, -49.4287109375, -46.990234375, -44.5517578125, -42.11328125, -39.6748046875, -37.236328125, -34.7978515625, -32.359375, -29.9208984375, -27.482421875, -25.0439453125, -22.60546875, -20.1669921875, -17.728515625, -15.2900390625, -12.8515625, -10.4130859375, -7.974609375, -5.5361328125, -3.09765625, -0.6591796875, 1.779296875, 4.2177734375, 6.65625, 9.0947265625, 11.533203125, 13.9716796875, 16.41015625, 18.8486328125, 21.287109375, 23.7255859375, 26.1640625, 28.6025390625, 31.041015625, 33.4794921875, 35.91796875, 38.3564453125, 40.794921875, 43.2333984375, 45.671875, 48.1103515625, 50.548828125, 52.9873046875, 55.42578125, 57.8642578125, 60.302734375, 62.7412109375, 65.1796875, 67.6181640625, 70.056640625, 72.4951171875, 74.93359375, 77.3720703125, 79.810546875, 82.2490234375, 84.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 713.0, 301.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.10687255859375, -18.36716079711914, -13.627450942993164, -8.887740135192871, -4.148029327392578, 0.5916824340820312, 5.331392288208008, 10.071102142333984, 14.810813903808594, 19.550525665283203, 24.29023551940918, 29.029945373535156, 33.769657135009766, 38.509368896484375, 43.24907684326172, 47.98878860473633, 52.72850036621094, 57.46821212768555, 62.207923889160156, 66.9476318359375, 71.68734741210938, 76.42705535888672, 81.16676330566406, 85.90647888183594, 90.64618682861328, 95.38589477539062, 100.1256103515625, 104.86531829833984, 109.60502624511719, 114.34474182128906, 119.0844497680664, 123.82415771484375, 128.56387329101562, 133.3035888671875, 138.0432891845703, 142.7830047607422, 147.52272033691406, 152.26242065429688, 157.00213623046875, 161.74185180664062, 166.4815673828125, 171.22128295898438, 175.9609832763672, 180.70069885253906, 185.44041442871094, 190.18011474609375, 194.91983032226562, 199.6595458984375, 204.3992462158203, 209.1389617919922, 213.878662109375, 218.61837768554688, 223.35809326171875, 228.09780883789062, 232.83750915527344, 237.5772247314453, 242.31692504882812, 247.056640625, 251.7963409423828, 256.53607177734375, 261.2757568359375, 266.0154724121094, 270.75518798828125, 275.4949035644531, 280.234619140625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 2.0, 5.0, 10.0, 13.0, 12.0, 14.0, 16.0, 15.0, 19.0, 14.0, 21.0, 24.0, 26.0, 42.0, 43.0, 30.0, 36.0, 43.0, 38.0, 35.0, 44.0, 56.0, 50.0, 37.0, 30.0, 41.0, 31.0, 28.0, 29.0, 30.0, 31.0, 20.0, 22.0, 22.0, 18.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.92547607421875, -33.87828063964844, -32.831085205078125, -31.78388786315918, -30.736690521240234, -29.689495086669922, -28.64229965209961, -27.595104217529297, -26.54790687561035, -25.50071144104004, -24.453514099121094, -23.40631866455078, -22.35912322998047, -21.311925888061523, -20.26473045349121, -19.217533111572266, -18.170337677001953, -17.12314224243164, -16.075944900512695, -15.028749465942383, -13.981553077697754, -12.934356689453125, -11.887161254882812, -10.839964866638184, -9.792768478393555, -8.745572090148926, -7.698376178741455, -6.651180267333984, -5.6039838790893555, -4.556787490844727, -3.509591579437256, -2.462395668029785, -1.4151992797851562, -0.36800312995910645, 0.6791930198669434, 1.7263891696929932, 2.773585319519043, 3.820781707763672, 4.867977619171143, 5.915173530578613, 6.962369918823242, 8.009566307067871, 9.0567626953125, 10.103958129882812, 11.151154518127441, 12.19835090637207, 13.245546340942383, 14.292742729187012, 15.33993911743164, 16.387134552001953, 17.4343318939209, 18.48152732849121, 19.528724670410156, 20.57592010498047, 21.62311553955078, 22.670310974121094, 23.71750831604004, 24.76470375061035, 25.811901092529297, 26.85909652709961, 27.906291961669922, 28.953489303588867, 30.00068473815918, 31.047882080078125, 32.09507751464844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 12.0, 10.0, 9.0, 20.0, 17.0, 20.0, 17.0, 18.0, 31.0, 38.0, 23.0, 28.0, 38.0, 48.0, 41.0, 37.0, 37.0, 34.0, 43.0, 46.0, 51.0, 45.0, 43.0, 23.0, 46.0, 39.0, 27.0, 16.0, 20.0, 24.0, 9.0, 15.0, 8.0, 11.0, 12.0, 5.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.1005859375, -3.966796875, -3.8330078125, -3.69921875, -3.5654296875, -3.431640625, -3.2978515625, -3.1640625, -3.0302734375, -2.896484375, -2.7626953125, -2.62890625, -2.4951171875, -2.361328125, -2.2275390625, -2.09375, -1.9599609375, -1.826171875, -1.6923828125, -1.55859375, -1.4248046875, -1.291015625, -1.1572265625, -1.0234375, -0.8896484375, -0.755859375, -0.6220703125, -0.48828125, -0.3544921875, -0.220703125, -0.0869140625, 0.046875, 0.1806640625, 0.314453125, 0.4482421875, 0.58203125, 0.7158203125, 0.849609375, 0.9833984375, 1.1171875, 1.2509765625, 1.384765625, 1.5185546875, 1.65234375, 1.7861328125, 1.919921875, 2.0537109375, 2.1875, 2.3212890625, 2.455078125, 2.5888671875, 2.72265625, 2.8564453125, 2.990234375, 3.1240234375, 3.2578125, 3.3916015625, 3.525390625, 3.6591796875, 3.79296875, 3.9267578125, 4.060546875, 4.1943359375, 4.328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 2.0, 8.0, 9.0, 12.0, 20.0, 16.0, 18.0, 35.0, 25.0, 39.0, 43.0, 37.0, 57.0, 59.0, 90.0, 127.0, 147.0, 336.0, 791.0, 3354.0, 37166.0, 707376.0, 2696852.0, 704982.0, 37445.0, 3324.0, 850.0, 318.0, 155.0, 109.0, 88.0, 68.0, 53.0, 35.0, 44.0, 27.0, 31.0, 25.0, 24.0, 19.0, 9.0, 16.0, 12.0, 2.0, 8.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.453369140625, -8.15673828125, -7.860107421875, -7.5634765625, -7.266845703125, -6.97021484375, -6.673583984375, -6.376953125, -6.080322265625, -5.78369140625, -5.487060546875, -5.1904296875, -4.893798828125, -4.59716796875, -4.300537109375, -4.00390625, -3.707275390625, -3.41064453125, -3.114013671875, -2.8173828125, -2.520751953125, -2.22412109375, -1.927490234375, -1.630859375, -1.334228515625, -1.03759765625, -0.740966796875, -0.4443359375, -0.147705078125, 0.14892578125, 0.445556640625, 0.7421875, 1.038818359375, 1.33544921875, 1.632080078125, 1.9287109375, 2.225341796875, 2.52197265625, 2.818603515625, 3.115234375, 3.411865234375, 3.70849609375, 4.005126953125, 4.3017578125, 4.598388671875, 4.89501953125, 5.191650390625, 5.48828125, 5.784912109375, 6.08154296875, 6.378173828125, 6.6748046875, 6.971435546875, 7.26806640625, 7.564697265625, 7.861328125, 8.157958984375, 8.45458984375, 8.751220703125, 9.0478515625, 9.344482421875, 9.64111328125, 9.937744140625, 10.234375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 19.0, 28.0, 41.0, 45.0, 64.0, 133.0, 221.0, 258.0, 389.0, 493.0, 552.0, 527.0, 410.0, 238.0, 177.0, 121.0, 93.0, 66.0, 49.0, 23.0, 33.0, 17.0, 13.0, 10.0, 6.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.86016845703125, -6.5679931640625, -6.27581787109375, -5.983642578125, -5.69146728515625, -5.3992919921875, -5.10711669921875, -4.81494140625, -4.52276611328125, -4.2305908203125, -3.93841552734375, -3.646240234375, -3.35406494140625, -3.0618896484375, -2.76971435546875, -2.4775390625, -2.18536376953125, -1.8931884765625, -1.60101318359375, -1.308837890625, -1.01666259765625, -0.7244873046875, -0.43231201171875, -0.14013671875, 0.15203857421875, 0.4442138671875, 0.73638916015625, 1.028564453125, 1.32073974609375, 1.6129150390625, 1.90509033203125, 2.197265625, 2.48944091796875, 2.7816162109375, 3.07379150390625, 3.365966796875, 3.65814208984375, 3.9503173828125, 4.24249267578125, 4.53466796875, 4.82684326171875, 5.1190185546875, 5.41119384765625, 5.703369140625, 5.99554443359375, 6.2877197265625, 6.57989501953125, 6.8720703125, 7.16424560546875, 7.4564208984375, 7.74859619140625, 8.040771484375, 8.33294677734375, 8.6251220703125, 8.91729736328125, 9.20947265625, 9.50164794921875, 9.7938232421875, 10.08599853515625, 10.378173828125, 10.67034912109375, 10.9625244140625, 11.25469970703125, 11.546875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 10.0, 11.0, 15.0, 22.0, 20.0, 32.0, 51.0, 89.0, 120.0, 160.0, 263.0, 347.0, 628.0, 8948.0, 4134414.0, 47178.0, 758.0, 363.0, 308.0, 187.0, 122.0, 58.0, 57.0, 32.0, 23.0, 17.0, 14.0, 9.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.6669921875, -51.302734375, -49.9384765625, -48.57421875, -47.2099609375, -45.845703125, -44.4814453125, -43.1171875, -41.7529296875, -40.388671875, -39.0244140625, -37.66015625, -36.2958984375, -34.931640625, -33.5673828125, -32.203125, -30.8388671875, -29.474609375, -28.1103515625, -26.74609375, -25.3818359375, -24.017578125, -22.6533203125, -21.2890625, -19.9248046875, -18.560546875, -17.1962890625, -15.83203125, -14.4677734375, -13.103515625, -11.7392578125, -10.375, -9.0107421875, -7.646484375, -6.2822265625, -4.91796875, -3.5537109375, -2.189453125, -0.8251953125, 0.5390625, 1.9033203125, 3.267578125, 4.6318359375, 5.99609375, 7.3603515625, 8.724609375, 10.0888671875, 11.453125, 12.8173828125, 14.181640625, 15.5458984375, 16.91015625, 18.2744140625, 19.638671875, 21.0029296875, 22.3671875, 23.7314453125, 25.095703125, 26.4599609375, 27.82421875, 29.1884765625, 30.552734375, 31.9169921875, 33.28125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 20.0, 575.0, 409.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.62611389160156, -94.29499816894531, -86.96387481689453, -79.63275909423828, -72.3016357421875, -64.97052001953125, -57.639404296875, -50.308284759521484, -42.97716522216797, -35.64604568481445, -28.31492805480957, -20.983810424804688, -13.652690887451172, -6.321571350097656, 1.0095443725585938, 8.34066390991211, 15.671783447265625, 23.00290298461914, 30.334020614624023, 37.665138244628906, 44.99625778198242, 52.32737731933594, 59.65849304199219, 66.98960876464844, 74.32073211669922, 81.65184783935547, 88.98297119140625, 96.3140869140625, 103.64520263671875, 110.97632598876953, 118.30744171142578, 125.63856506347656, 132.96969604492188, 140.30081176757812, 147.63192749023438, 154.96304321289062, 162.29417419433594, 169.6252899169922, 176.95640563964844, 184.2875213623047, 191.61865234375, 198.94976806640625, 206.2808837890625, 213.61199951171875, 220.94313049316406, 228.2742462158203, 235.60536193847656, 242.9364776611328, 250.26759338378906, 257.5987243652344, 264.9298400878906, 272.2609558105469, 279.5920715332031, 286.9231872558594, 294.2543029785156, 301.5854187011719, 308.9165344238281, 316.2476501464844, 323.5787658691406, 330.9098815917969, 338.2409973144531, 345.5721435546875, 352.90325927734375, 360.234375, 367.56549072265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 19.0, 11.0, 26.0, 20.0, 34.0, 32.0, 46.0, 41.0, 46.0, 46.0, 67.0, 58.0, 49.0, 43.0, 55.0, 43.0, 49.0, 35.0, 43.0, 41.0, 26.0, 31.0, 24.0, 23.0, 14.0, 17.0, 9.0, 10.0, 10.0, 4.0, 6.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.49530792236328, -35.49312210083008, -34.49094009399414, -33.48875427246094, -32.486568450927734, -31.484384536743164, -30.482200622558594, -29.48001480102539, -28.477828979492188, -27.475645065307617, -26.473459243774414, -25.471275329589844, -24.46908950805664, -23.46690559387207, -22.4647216796875, -21.462535858154297, -20.460351943969727, -19.458168029785156, -18.455982208251953, -17.453798294067383, -16.45161247253418, -15.44942855834961, -14.447243690490723, -13.445058822631836, -12.44287395477295, -11.440689086914062, -10.438504219055176, -9.436319351196289, -8.434135437011719, -7.431950092315674, -6.429765701293945, -5.427580833435059, -4.425397872924805, -3.423213005065918, -2.4210283756256104, -1.4188437461853027, -0.416658878326416, 0.5855259895324707, 1.5877103805541992, 2.589895248413086, 3.5920801162719727, 4.594264984130859, 5.596449851989746, 6.598634243011475, 7.600819110870361, 8.603004455566406, 9.605188369750977, 10.607373237609863, 11.60955810546875, 12.611742973327637, 13.613927841186523, 14.616111755371094, 15.618297576904297, 16.620481491088867, 17.622665405273438, 18.62485122680664, 19.627037048339844, 20.629220962524414, 21.631406784057617, 22.633590698242188, 23.63577651977539, 24.63796043395996, 25.64014434814453, 26.642330169677734, 27.644514083862305]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 19.0, 18.0, 24.0, 26.0, 21.0, 30.0, 28.0, 29.0, 36.0, 27.0, 46.0, 27.0, 39.0, 47.0, 26.0, 49.0, 49.0, 29.0, 37.0, 29.0, 38.0, 32.0, 33.0, 32.0, 17.0, 18.0, 21.0, 15.0, 18.0, 14.0, 14.0, 16.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.37890625, -3.265045166015625, -3.15118408203125, -3.037322998046875, -2.9234619140625, -2.809600830078125, -2.69573974609375, -2.581878662109375, -2.468017578125, -2.354156494140625, -2.24029541015625, -2.126434326171875, -2.0125732421875, -1.898712158203125, -1.78485107421875, -1.670989990234375, -1.55712890625, -1.443267822265625, -1.32940673828125, -1.215545654296875, -1.1016845703125, -0.987823486328125, -0.87396240234375, -0.760101318359375, -0.646240234375, -0.532379150390625, -0.41851806640625, -0.304656982421875, -0.1907958984375, -0.076934814453125, 0.03692626953125, 0.150787353515625, 0.2646484375, 0.378509521484375, 0.49237060546875, 0.606231689453125, 0.7200927734375, 0.833953857421875, 0.94781494140625, 1.061676025390625, 1.175537109375, 1.289398193359375, 1.40325927734375, 1.517120361328125, 1.6309814453125, 1.744842529296875, 1.85870361328125, 1.972564697265625, 2.08642578125, 2.200286865234375, 2.31414794921875, 2.428009033203125, 2.5418701171875, 2.655731201171875, 2.76959228515625, 2.883453369140625, 2.997314453125, 3.111175537109375, 3.22503662109375, 3.338897705078125, 3.4527587890625, 3.566619873046875, 3.68048095703125, 3.794342041015625, 3.908203125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 5.0, 11.0, 17.0, 31.0, 31.0, 48.0, 83.0, 109.0, 162.0, 276.0, 369.0, 533.0, 753.0, 1158.0, 1675.0, 2504.0, 3786.0, 5457.0, 8135.0, 12154.0, 18980.0, 29231.0, 47959.0, 81060.0, 155117.0, 296223.0, 161728.0, 84145.0, 49041.0, 29948.0, 19412.0, 12772.0, 8241.0, 5558.0, 3798.0, 2645.0, 1752.0, 1146.0, 810.0, 550.0, 372.0, 243.0, 195.0, 110.0, 66.0, 44.0, 39.0, 32.0, 17.0, 12.0, 6.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5665664672851562, -0.5467071533203125, -0.5268478393554688, -0.506988525390625, -0.48712921142578125, -0.4672698974609375, -0.44741058349609375, -0.42755126953125, -0.40769195556640625, -0.3878326416015625, -0.36797332763671875, -0.348114013671875, -0.32825469970703125, -0.3083953857421875, -0.28853607177734375, -0.2686767578125, -0.24881744384765625, -0.2289581298828125, -0.20909881591796875, -0.189239501953125, -0.16938018798828125, -0.1495208740234375, -0.12966156005859375, -0.10980224609375, -0.08994293212890625, -0.0700836181640625, -0.05022430419921875, -0.030364990234375, -0.01050567626953125, 0.0093536376953125, 0.02921295166015625, 0.049072265625, 0.06893157958984375, 0.0887908935546875, 0.10865020751953125, 0.128509521484375, 0.14836883544921875, 0.1682281494140625, 0.18808746337890625, 0.20794677734375, 0.22780609130859375, 0.2476654052734375, 0.26752471923828125, 0.287384033203125, 0.30724334716796875, 0.3271026611328125, 0.34696197509765625, 0.3668212890625, 0.38668060302734375, 0.4065399169921875, 0.42639923095703125, 0.446258544921875, 0.46611785888671875, 0.4859771728515625, 0.5058364868164062, 0.52569580078125, 0.5455551147460938, 0.5654144287109375, 0.5852737426757812, 0.605133056640625, 0.6249923706054688, 0.6448516845703125, 0.6647109985351562, 0.6845703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 9.0, 7.0, 6.0, 12.0, 20.0, 15.0, 6.0, 16.0, 21.0, 16.0, 23.0, 24.0, 37.0, 22.0, 23.0, 32.0, 31.0, 41.0, 33.0, 41.0, 43.0, 1066.0, 38.0, 34.0, 37.0, 32.0, 36.0, 29.0, 21.0, 24.0, 26.0, 24.0, 16.0, 23.0, 21.0, 20.0, 18.0, 15.0, 9.0, 11.0, 8.0, 7.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.1015625, -2.034393310546875, -1.96722412109375, -1.900054931640625, -1.8328857421875, -1.765716552734375, -1.69854736328125, -1.631378173828125, -1.564208984375, -1.497039794921875, -1.42987060546875, -1.362701416015625, -1.2955322265625, -1.228363037109375, -1.16119384765625, -1.094024658203125, -1.02685546875, -0.959686279296875, -0.89251708984375, -0.825347900390625, -0.7581787109375, -0.691009521484375, -0.62384033203125, -0.556671142578125, -0.489501953125, -0.422332763671875, -0.35516357421875, -0.287994384765625, -0.2208251953125, -0.153656005859375, -0.08648681640625, -0.019317626953125, 0.0478515625, 0.115020751953125, 0.18218994140625, 0.249359130859375, 0.3165283203125, 0.383697509765625, 0.45086669921875, 0.518035888671875, 0.585205078125, 0.652374267578125, 0.71954345703125, 0.786712646484375, 0.8538818359375, 0.921051025390625, 0.98822021484375, 1.055389404296875, 1.12255859375, 1.189727783203125, 1.25689697265625, 1.324066162109375, 1.3912353515625, 1.458404541015625, 1.52557373046875, 1.592742919921875, 1.659912109375, 1.727081298828125, 1.79425048828125, 1.861419677734375, 1.9285888671875, 1.995758056640625, 2.06292724609375, 2.130096435546875, 2.197265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 6.0, 5.0, 15.0, 28.0, 28.0, 48.0, 72.0, 96.0, 136.0, 164.0, 274.0, 380.0, 523.0, 765.0, 1030.0, 1468.0, 1982.0, 2885.0, 3905.0, 5385.0, 7296.0, 9876.0, 13859.0, 19375.0, 27337.0, 39882.0, 60306.0, 101560.0, 193780.0, 1272268.0, 116650.0, 67647.0, 43591.0, 29465.0, 20959.0, 15085.0, 10752.0, 7885.0, 5673.0, 4097.0, 3000.0, 2170.0, 1589.0, 1124.0, 805.0, 582.0, 425.0, 284.0, 205.0, 158.0, 90.0, 57.0, 33.0, 31.0, 21.0, 10.0, 7.0, 3.0, 7.0, 1.0, 3.0], "bins": [-0.47607421875, -0.46125030517578125, -0.4464263916015625, -0.43160247802734375, -0.416778564453125, -0.40195465087890625, -0.3871307373046875, -0.37230682373046875, -0.35748291015625, -0.34265899658203125, -0.3278350830078125, -0.31301116943359375, -0.298187255859375, -0.28336334228515625, -0.2685394287109375, -0.25371551513671875, -0.2388916015625, -0.22406768798828125, -0.2092437744140625, -0.19441986083984375, -0.179595947265625, -0.16477203369140625, -0.1499481201171875, -0.13512420654296875, -0.12030029296875, -0.10547637939453125, -0.0906524658203125, -0.07582855224609375, -0.061004638671875, -0.04618072509765625, -0.0313568115234375, -0.01653289794921875, -0.001708984375, 0.01311492919921875, 0.0279388427734375, 0.04276275634765625, 0.057586669921875, 0.07241058349609375, 0.0872344970703125, 0.10205841064453125, 0.11688232421875, 0.13170623779296875, 0.1465301513671875, 0.16135406494140625, 0.176177978515625, 0.19100189208984375, 0.2058258056640625, 0.22064971923828125, 0.2354736328125, 0.25029754638671875, 0.2651214599609375, 0.27994537353515625, 0.294769287109375, 0.30959320068359375, 0.3244171142578125, 0.33924102783203125, 0.35406494140625, 0.36888885498046875, 0.3837127685546875, 0.39853668212890625, 0.413360595703125, 0.42818450927734375, 0.4430084228515625, 0.45783233642578125, 0.47265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 8.0, 16.0, 13.0, 26.0, 27.0, 26.0, 29.0, 41.0, 43.0, 42.0, 39.0, 47.0, 51.0, 51.0, 55.0, 53.0, 42.0, 57.0, 46.0, 28.0, 32.0, 30.0, 22.0, 26.0, 22.0, 21.0, 17.0, 9.0, 12.0, 7.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011676549911499023, -0.0001131836324930191, -0.00010960176587104797, -0.00010601989924907684, -0.00010243803262710571, -9.885616600513458e-05, -9.527429938316345e-05, -9.169243276119232e-05, -8.811056613922119e-05, -8.452869951725006e-05, -8.094683289527893e-05, -7.73649662733078e-05, -7.378309965133667e-05, -7.020123302936554e-05, -6.661936640739441e-05, -6.303749978542328e-05, -5.945563316345215e-05, -5.587376654148102e-05, -5.229189991950989e-05, -4.871003329753876e-05, -4.512816667556763e-05, -4.1546300053596497e-05, -3.7964433431625366e-05, -3.4382566809654236e-05, -3.0800700187683105e-05, -2.7218833565711975e-05, -2.3636966943740845e-05, -2.0055100321769714e-05, -1.6473233699798584e-05, -1.2891367077827454e-05, -9.309500455856323e-06, -5.727633833885193e-06, -2.1457672119140625e-06, 1.4360994100570679e-06, 5.017966032028198e-06, 8.599832653999329e-06, 1.2181699275970459e-05, 1.576356589794159e-05, 1.934543251991272e-05, 2.292729914188385e-05, 2.650916576385498e-05, 3.009103238582611e-05, 3.367289900779724e-05, 3.725476562976837e-05, 4.08366322517395e-05, 4.441849887371063e-05, 4.800036549568176e-05, 5.158223211765289e-05, 5.5164098739624023e-05, 5.8745965361595154e-05, 6.232783198356628e-05, 6.590969860553741e-05, 6.949156522750854e-05, 7.307343184947968e-05, 7.66552984714508e-05, 8.023716509342194e-05, 8.381903171539307e-05, 8.74008983373642e-05, 9.098276495933533e-05, 9.456463158130646e-05, 9.814649820327759e-05, 0.00010172836482524872, 0.00010531023144721985, 0.00010889209806919098, 0.00011247396469116211]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 7.0, 14.0, 17.0, 13.0, 26.0, 29.0, 31.0, 45.0, 71.0, 77.0, 103.0, 150.0, 325.0, 742.0, 12242.0, 1026697.0, 6245.0, 711.0, 318.0, 150.0, 120.0, 89.0, 71.0, 57.0, 47.0, 33.0, 30.0, 12.0, 16.0, 10.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0026607513427734375, -0.0025761425495147705, -0.0024915337562561035, -0.0024069249629974365, -0.0023223161697387695, -0.0022377073764801025, -0.0021530985832214355, -0.0020684897899627686, -0.0019838809967041016, -0.0018992722034454346, -0.0018146634101867676, -0.0017300546169281006, -0.0016454458236694336, -0.0015608370304107666, -0.0014762282371520996, -0.0013916194438934326, -0.0013070106506347656, -0.0012224018573760986, -0.0011377930641174316, -0.0010531842708587646, -0.0009685754776000977, -0.0008839666843414307, -0.0007993578910827637, -0.0007147490978240967, -0.0006301403045654297, -0.0005455315113067627, -0.0004609227180480957, -0.0003763139247894287, -0.0002917051315307617, -0.00020709633827209473, -0.00012248754501342773, -3.787875175476074e-05, 4.673004150390625e-05, 0.00013133883476257324, 0.00021594762802124023, 0.0003005564212799072, 0.0003851652145385742, 0.0004697740077972412, 0.0005543828010559082, 0.0006389915943145752, 0.0007236003875732422, 0.0008082091808319092, 0.0008928179740905762, 0.0009774267673492432, 0.0010620355606079102, 0.0011466443538665771, 0.0012312531471252441, 0.0013158619403839111, 0.0014004707336425781, 0.0014850795269012451, 0.0015696883201599121, 0.001654297113418579, 0.001738905906677246, 0.001823514699935913, 0.00190812349319458, 0.001992732286453247, 0.002077341079711914, 0.002161949872970581, 0.002246558666229248, 0.002331167459487915, 0.002415776252746582, 0.002500385046005249, 0.002584993839263916, 0.002669602632522583, 0.00275421142578125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 30.0, 144.0, 372.0, 365.0, 93.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016670180775690824, -0.00015681717195548117, -0.00014693252160213888, -0.0001370478858007118, -0.00012716324999928474, -0.00011727860692190006, -0.00010739396384451538, -9.750932804308832e-05, -8.762468496570364e-05, -7.774004188831896e-05, -6.785540608689189e-05, -5.797076300950721e-05, -4.8086123570101336e-05, -3.820148413069546e-05, -2.8316841053310782e-05, -1.8432205251883715e-05, -8.547562174499035e-06, 1.3370781744015403e-06, 1.1221718523302115e-05, 2.1106359781697392e-05, 3.0990999221103266e-05, 4.087563866050914e-05, 5.076028173789382e-05, 6.0644917539320886e-05, 7.052956061670557e-05, 8.041420369409025e-05, 9.029883949551731e-05, 0.000100183482572902, 0.00011006812565028667, 0.00011995276145171374, 0.0001298373972531408, 0.0001397220476064831, 0.00014960666885599494, 0.000159491304657422, 0.0001693759550107643, 0.00017926059081219137, 0.00018914522661361843, 0.0001990298624150455, 0.0002089145127683878, 0.00021879914856981486, 0.00022868378437124193, 0.000238568420172669, 0.00024845305597409606, 0.00025833770632743835, 0.00026822235668078065, 0.0002781069779302925, 0.0002879916282836348, 0.0002978762495331466, 0.0003077608998864889, 0.0003176455502398312, 0.00032753017148934305, 0.00033741482184268534, 0.00034729947219602764, 0.0003571840934455395, 0.00036706874379888177, 0.00037695339415222406, 0.00038683804450556636, 0.00039672269485890865, 0.0004066073161084205, 0.0004164919664617628, 0.0004263766168151051, 0.0004362612380646169, 0.0004461458884179592, 0.0004560305387713015, 0.00046591516002081335]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 9.0, 6.0, 10.0, 9.0, 18.0, 17.0, 19.0, 20.0, 20.0, 30.0, 24.0, 31.0, 26.0, 22.0, 34.0, 40.0, 36.0, 48.0, 30.0, 48.0, 30.0, 33.0, 37.0, 36.0, 34.0, 37.0, 40.0, 31.0, 31.0, 22.0, 24.0, 26.0, 18.0, 12.0, 15.0, 15.0, 6.0, 5.0, 12.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-6.645917892456055e-05, -6.452761590480804e-05, -6.259605288505554e-05, -6.066448986530304e-05, -5.873292684555054e-05, -5.6801363825798035e-05, -5.486980080604553e-05, -5.293823778629303e-05, -5.100667476654053e-05, -4.9075111746788025e-05, -4.714354872703552e-05, -4.521198570728302e-05, -4.328042268753052e-05, -4.1348859667778015e-05, -3.941729664802551e-05, -3.748573362827301e-05, -3.555417060852051e-05, -3.3622607588768005e-05, -3.16910445690155e-05, -2.9759481549263e-05, -2.7827918529510498e-05, -2.5896355509757996e-05, -2.3964792490005493e-05, -2.203322947025299e-05, -2.0101666450500488e-05, -1.8170103430747986e-05, -1.6238540410995483e-05, -1.4306977391242981e-05, -1.2375414371490479e-05, -1.0443851351737976e-05, -8.512288331985474e-06, -6.580725312232971e-06, -4.649162292480469e-06, -2.7175992727279663e-06, -7.860362529754639e-07, 1.1455267667770386e-06, 3.077089786529541e-06, 5.0086528062820435e-06, 6.940215826034546e-06, 8.871778845787048e-06, 1.080334186553955e-05, 1.2734904885292053e-05, 1.4666467905044556e-05, 1.6598030924797058e-05, 1.852959394454956e-05, 2.0461156964302063e-05, 2.2392719984054565e-05, 2.4324283003807068e-05, 2.625584602355957e-05, 2.8187409043312073e-05, 3.0118972063064575e-05, 3.205053508281708e-05, 3.398209810256958e-05, 3.591366112232208e-05, 3.7845224142074585e-05, 3.977678716182709e-05, 4.170835018157959e-05, 4.363991320133209e-05, 4.5571476221084595e-05, 4.75030392408371e-05, 4.94346022605896e-05, 5.13661652803421e-05, 5.3297728300094604e-05, 5.522929131984711e-05, 5.716085433959961e-05]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 7.0, 8.0, 10.0, 11.0, 19.0, 18.0, 24.0, 26.0, 21.0, 30.0, 28.0, 29.0, 36.0, 27.0, 46.0, 27.0, 39.0, 47.0, 26.0, 49.0, 49.0, 29.0, 37.0, 29.0, 38.0, 32.0, 33.0, 32.0, 17.0, 18.0, 21.0, 15.0, 18.0, 14.0, 14.0, 16.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.37890625, -3.265045166015625, -3.15118408203125, -3.037322998046875, -2.9234619140625, -2.809600830078125, -2.69573974609375, -2.581878662109375, -2.468017578125, -2.354156494140625, -2.24029541015625, -2.126434326171875, -2.0125732421875, -1.898712158203125, -1.78485107421875, -1.670989990234375, -1.55712890625, -1.443267822265625, -1.32940673828125, -1.215545654296875, -1.1016845703125, -0.987823486328125, -0.87396240234375, -0.760101318359375, -0.646240234375, -0.532379150390625, -0.41851806640625, -0.304656982421875, -0.1907958984375, -0.076934814453125, 0.03692626953125, 0.150787353515625, 0.2646484375, 0.378509521484375, 0.49237060546875, 0.606231689453125, 0.7200927734375, 0.833953857421875, 0.94781494140625, 1.061676025390625, 1.175537109375, 1.289398193359375, 1.40325927734375, 1.517120361328125, 1.6309814453125, 1.744842529296875, 1.85870361328125, 1.972564697265625, 2.08642578125, 2.200286865234375, 2.31414794921875, 2.428009033203125, 2.5418701171875, 2.655731201171875, 2.76959228515625, 2.883453369140625, 2.997314453125, 3.111175537109375, 3.22503662109375, 3.338897705078125, 3.4527587890625, 3.566619873046875, 3.68048095703125, 3.794342041015625, 3.908203125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 6.0, 5.0, 8.0, 12.0, 8.0, 20.0, 12.0, 19.0, 39.0, 52.0, 100.0, 133.0, 274.0, 571.0, 1250.0, 2726.0, 5896.0, 13356.0, 29905.0, 75337.0, 222431.0, 411629.0, 177090.0, 61705.0, 25081.0, 11375.0, 5113.0, 2294.0, 1043.0, 496.0, 231.0, 123.0, 54.0, 39.0, 34.0, 12.0, 24.0, 9.0, 8.0, 9.0, 4.0, 8.0, 5.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.61907958984375, -3.4959716796875, -3.37286376953125, -3.249755859375, -3.12664794921875, -3.0035400390625, -2.88043212890625, -2.75732421875, -2.63421630859375, -2.5111083984375, -2.38800048828125, -2.264892578125, -2.14178466796875, -2.0186767578125, -1.89556884765625, -1.7724609375, -1.64935302734375, -1.5262451171875, -1.40313720703125, -1.280029296875, -1.15692138671875, -1.0338134765625, -0.91070556640625, -0.78759765625, -0.66448974609375, -0.5413818359375, -0.41827392578125, -0.295166015625, -0.17205810546875, -0.0489501953125, 0.07415771484375, 0.197265625, 0.32037353515625, 0.4434814453125, 0.56658935546875, 0.689697265625, 0.81280517578125, 0.9359130859375, 1.05902099609375, 1.18212890625, 1.30523681640625, 1.4283447265625, 1.55145263671875, 1.674560546875, 1.79766845703125, 1.9207763671875, 2.04388427734375, 2.1669921875, 2.29010009765625, 2.4132080078125, 2.53631591796875, 2.659423828125, 2.78253173828125, 2.9056396484375, 3.02874755859375, 3.15185546875, 3.27496337890625, 3.3980712890625, 3.52117919921875, 3.644287109375, 3.76739501953125, 3.8905029296875, 4.01361083984375, 4.13671875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 3.0, 8.0, 11.0, 9.0, 10.0, 16.0, 15.0, 16.0, 22.0, 23.0, 32.0, 40.0, 31.0, 37.0, 37.0, 63.0, 101.0, 251.0, 1590.0, 243.0, 95.0, 51.0, 51.0, 42.0, 36.0, 36.0, 33.0, 29.0, 24.0, 22.0, 18.0, 15.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.015625, -17.521728515625, -17.02783203125, -16.533935546875, -16.0400390625, -15.546142578125, -15.05224609375, -14.558349609375, -14.064453125, -13.570556640625, -13.07666015625, -12.582763671875, -12.0888671875, -11.594970703125, -11.10107421875, -10.607177734375, -10.11328125, -9.619384765625, -9.12548828125, -8.631591796875, -8.1376953125, -7.643798828125, -7.14990234375, -6.656005859375, -6.162109375, -5.668212890625, -5.17431640625, -4.680419921875, -4.1865234375, -3.692626953125, -3.19873046875, -2.704833984375, -2.2109375, -1.717041015625, -1.22314453125, -0.729248046875, -0.2353515625, 0.258544921875, 0.75244140625, 1.246337890625, 1.740234375, 2.234130859375, 2.72802734375, 3.221923828125, 3.7158203125, 4.209716796875, 4.70361328125, 5.197509765625, 5.69140625, 6.185302734375, 6.67919921875, 7.173095703125, 7.6669921875, 8.160888671875, 8.65478515625, 9.148681640625, 9.642578125, 10.136474609375, 10.63037109375, 11.124267578125, 11.6181640625, 12.112060546875, 12.60595703125, 13.099853515625, 13.59375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 12.0, 6.0, 7.0, 17.0, 26.0, 22.0, 33.0, 49.0, 58.0, 73.0, 94.0, 141.0, 170.0, 259.0, 468.0, 1238.0, 119226.0, 3017997.0, 4016.0, 618.0, 327.0, 242.0, 146.0, 99.0, 69.0, 54.0, 48.0, 30.0, 26.0, 28.0, 19.0, 19.0, 9.0, 13.0, 8.0, 2.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.65625, -37.41796875, -36.1796875, -34.94140625, -33.703125, -32.46484375, -31.2265625, -29.98828125, -28.75, -27.51171875, -26.2734375, -25.03515625, -23.796875, -22.55859375, -21.3203125, -20.08203125, -18.84375, -17.60546875, -16.3671875, -15.12890625, -13.890625, -12.65234375, -11.4140625, -10.17578125, -8.9375, -7.69921875, -6.4609375, -5.22265625, -3.984375, -2.74609375, -1.5078125, -0.26953125, 0.96875, 2.20703125, 3.4453125, 4.68359375, 5.921875, 7.16015625, 8.3984375, 9.63671875, 10.875, 12.11328125, 13.3515625, 14.58984375, 15.828125, 17.06640625, 18.3046875, 19.54296875, 20.78125, 22.01953125, 23.2578125, 24.49609375, 25.734375, 26.97265625, 28.2109375, 29.44921875, 30.6875, 31.92578125, 33.1640625, 34.40234375, 35.640625, 36.87890625, 38.1171875, 39.35546875, 40.59375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 207.0, 796.0, 14.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.495949745178223, -5.851185321807861, -1.2064208984375, 3.4383440017700195, 8.083107948303223, 12.727871894836426, 17.372638702392578, 22.01740264892578, 26.662166595458984, 31.306930541992188, 35.95169448852539, 40.596458435058594, 45.24122619628906, 49.885986328125, 54.53075408935547, 59.17551803588867, 63.820281982421875, 68.46504974365234, 73.10980987548828, 77.75457763671875, 82.39933776855469, 87.04410552978516, 91.68887329101562, 96.33363342285156, 100.9783935546875, 105.62316131591797, 110.2679214477539, 114.91268920898438, 119.55744934082031, 124.20221710205078, 128.84698486328125, 133.4917449951172, 138.1365203857422, 142.78128051757812, 147.42605590820312, 152.07081604003906, 156.715576171875, 161.36033630371094, 166.00511169433594, 170.64987182617188, 175.2946319580078, 179.93939208984375, 184.58416748046875, 189.2289276123047, 193.87368774414062, 198.51844787597656, 203.16322326660156, 207.8079833984375, 212.4527587890625, 217.09751892089844, 221.74229431152344, 226.38705444335938, 231.0318145751953, 235.67657470703125, 240.32135009765625, 244.9661102294922, 249.61087036132812, 254.25563049316406, 258.900390625, 263.545166015625, 268.18994140625, 272.8346862792969, 277.4794616699219, 282.12420654296875, 286.76898193359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 4.0, 19.0, 14.0, 11.0, 16.0, 20.0, 22.0, 29.0, 26.0, 34.0, 30.0, 29.0, 34.0, 38.0, 44.0, 55.0, 37.0, 36.0, 43.0, 50.0, 35.0, 45.0, 40.0, 38.0, 36.0, 31.0, 19.0, 26.0, 31.0, 12.0, 16.0, 13.0, 16.0, 12.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09455490112305, -34.94756317138672, -33.800575256347656, -32.65358352661133, -31.506591796875, -30.359601974487305, -29.21261215209961, -28.06562042236328, -26.918630599975586, -25.77164077758789, -24.624649047851562, -23.477659225463867, -22.330669403076172, -21.183677673339844, -20.03668785095215, -18.889698028564453, -17.742706298828125, -16.59571647644043, -15.448724746704102, -14.301734924316406, -13.154744148254395, -12.007753372192383, -10.860763549804688, -9.713772773742676, -8.566781997680664, -7.419791221618652, -6.272800922393799, -5.125810623168945, -3.9788198471069336, -2.831829071044922, -1.6848387718200684, -0.5378484725952148, 0.6091384887695312, 1.7561290264129639, 2.9031195640563965, 4.05010986328125, 5.197100639343262, 6.344091415405273, 7.491081714630127, 8.63807201385498, 9.785062789916992, 10.932053565979004, 12.079044342041016, 13.226034164428711, 14.373024940490723, 15.520015716552734, 16.66700553894043, 17.813995361328125, 18.960987091064453, 20.10797691345215, 21.254968643188477, 22.401958465576172, 23.5489501953125, 24.695940017700195, 25.84292984008789, 26.98992156982422, 28.136911392211914, 29.28390121459961, 30.430892944335938, 31.577882766723633, 32.72487258911133, 33.871864318847656, 35.018856048583984, 36.16584396362305, 37.312835693359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 11.0, 7.0, 8.0, 12.0, 11.0, 20.0, 26.0, 29.0, 30.0, 18.0, 25.0, 37.0, 40.0, 26.0, 36.0, 33.0, 41.0, 29.0, 49.0, 42.0, 45.0, 53.0, 28.0, 36.0, 36.0, 30.0, 27.0, 20.0, 31.0, 25.0, 19.0, 22.0, 19.0, 9.0, 6.0, 12.0, 19.0, 7.0, 2.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.0078125, -3.8782958984375, -3.748779296875, -3.6192626953125, -3.48974609375, -3.3602294921875, -3.230712890625, -3.1011962890625, -2.9716796875, -2.8421630859375, -2.712646484375, -2.5831298828125, -2.45361328125, -2.3240966796875, -2.194580078125, -2.0650634765625, -1.935546875, -1.8060302734375, -1.676513671875, -1.5469970703125, -1.41748046875, -1.2879638671875, -1.158447265625, -1.0289306640625, -0.8994140625, -0.7698974609375, -0.640380859375, -0.5108642578125, -0.38134765625, -0.2518310546875, -0.122314453125, 0.0072021484375, 0.13671875, 0.2662353515625, 0.395751953125, 0.5252685546875, 0.65478515625, 0.7843017578125, 0.913818359375, 1.0433349609375, 1.1728515625, 1.3023681640625, 1.431884765625, 1.5614013671875, 1.69091796875, 1.8204345703125, 1.949951171875, 2.0794677734375, 2.208984375, 2.3385009765625, 2.468017578125, 2.5975341796875, 2.72705078125, 2.8565673828125, 2.986083984375, 3.1156005859375, 3.2451171875, 3.3746337890625, 3.504150390625, 3.6336669921875, 3.76318359375, 3.8927001953125, 4.022216796875, 4.1517333984375, 4.28125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 1.0, 3.0, 6.0, 7.0, 7.0, 12.0, 13.0, 15.0, 17.0, 24.0, 35.0, 39.0, 50.0, 67.0, 68.0, 105.0, 136.0, 288.0, 701.0, 2876.0, 53232.0, 1794337.0, 2254488.0, 82113.0, 3835.0, 835.0, 321.0, 163.0, 103.0, 74.0, 61.0, 56.0, 39.0, 28.0, 23.0, 19.0, 13.0, 16.0, 12.0, 19.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-13.078125, -12.6824951171875, -12.286865234375, -11.8912353515625, -11.49560546875, -11.0999755859375, -10.704345703125, -10.3087158203125, -9.9130859375, -9.5174560546875, -9.121826171875, -8.7261962890625, -8.33056640625, -7.9349365234375, -7.539306640625, -7.1436767578125, -6.748046875, -6.3524169921875, -5.956787109375, -5.5611572265625, -5.16552734375, -4.7698974609375, -4.374267578125, -3.9786376953125, -3.5830078125, -3.1873779296875, -2.791748046875, -2.3961181640625, -2.00048828125, -1.6048583984375, -1.209228515625, -0.8135986328125, -0.41796875, -0.0223388671875, 0.373291015625, 0.7689208984375, 1.16455078125, 1.5601806640625, 1.955810546875, 2.3514404296875, 2.7470703125, 3.1427001953125, 3.538330078125, 3.9339599609375, 4.32958984375, 4.7252197265625, 5.120849609375, 5.5164794921875, 5.912109375, 6.3077392578125, 6.703369140625, 7.0989990234375, 7.49462890625, 7.8902587890625, 8.285888671875, 8.6815185546875, 9.0771484375, 9.4727783203125, 9.868408203125, 10.2640380859375, 10.65966796875, 11.0552978515625, 11.450927734375, 11.8465576171875, 12.2421875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 14.0, 6.0, 29.0, 30.0, 65.0, 86.0, 117.0, 224.0, 364.0, 488.0, 636.0, 648.0, 467.0, 320.0, 200.0, 118.0, 87.0, 49.0, 40.0, 25.0, 16.0, 11.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.59375, -14.2535400390625, -13.913330078125, -13.5731201171875, -13.23291015625, -12.8927001953125, -12.552490234375, -12.2122802734375, -11.8720703125, -11.5318603515625, -11.191650390625, -10.8514404296875, -10.51123046875, -10.1710205078125, -9.830810546875, -9.4906005859375, -9.150390625, -8.8101806640625, -8.469970703125, -8.1297607421875, -7.78955078125, -7.4493408203125, -7.109130859375, -6.7689208984375, -6.4287109375, -6.0885009765625, -5.748291015625, -5.4080810546875, -5.06787109375, -4.7276611328125, -4.387451171875, -4.0472412109375, -3.70703125, -3.3668212890625, -3.026611328125, -2.6864013671875, -2.34619140625, -2.0059814453125, -1.665771484375, -1.3255615234375, -0.9853515625, -0.6451416015625, -0.304931640625, 0.0352783203125, 0.37548828125, 0.7156982421875, 1.055908203125, 1.3961181640625, 1.736328125, 2.0765380859375, 2.416748046875, 2.7569580078125, 3.09716796875, 3.4373779296875, 3.777587890625, 4.1177978515625, 4.4580078125, 4.7982177734375, 5.138427734375, 5.4786376953125, 5.81884765625, 6.1590576171875, 6.499267578125, 6.8394775390625, 7.1796875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 4.0, 8.0, 13.0, 20.0, 42.0, 54.0, 76.0, 115.0, 152.0, 311.0, 433.0, 965.0, 170339.0, 4017374.0, 2785.0, 613.0, 384.0, 197.0, 132.0, 100.0, 61.0, 32.0, 16.0, 14.0, 16.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.25, -28.7548828125, -27.259765625, -25.7646484375, -24.26953125, -22.7744140625, -21.279296875, -19.7841796875, -18.2890625, -16.7939453125, -15.298828125, -13.8037109375, -12.30859375, -10.8134765625, -9.318359375, -7.8232421875, -6.328125, -4.8330078125, -3.337890625, -1.8427734375, -0.34765625, 1.1474609375, 2.642578125, 4.1376953125, 5.6328125, 7.1279296875, 8.623046875, 10.1181640625, 11.61328125, 13.1083984375, 14.603515625, 16.0986328125, 17.59375, 19.0888671875, 20.583984375, 22.0791015625, 23.57421875, 25.0693359375, 26.564453125, 28.0595703125, 29.5546875, 31.0498046875, 32.544921875, 34.0400390625, 35.53515625, 37.0302734375, 38.525390625, 40.0205078125, 41.515625, 43.0107421875, 44.505859375, 46.0009765625, 47.49609375, 48.9912109375, 50.486328125, 51.9814453125, 53.4765625, 54.9716796875, 56.466796875, 57.9619140625, 59.45703125, 60.9521484375, 62.447265625, 63.9423828125, 65.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 32.0, 303.0, 481.0, 182.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.25506591796875, -140.28289794921875, -136.31072998046875, -132.33856201171875, -128.36639404296875, -124.39422607421875, -120.42206573486328, -116.44989776611328, -112.47772979736328, -108.50556182861328, -104.53339385986328, -100.56122589111328, -96.58906555175781, -92.61689758300781, -88.64472961425781, -84.67256164550781, -80.70039367675781, -76.72822570800781, -72.75605773925781, -68.78388977050781, -64.81172180175781, -60.83955764770508, -56.867393493652344, -52.895225524902344, -48.923057556152344, -44.950889587402344, -40.978721618652344, -37.00655746459961, -33.03438949584961, -29.06222152709961, -25.090055465698242, -21.117889404296875, -17.145729064941406, -13.173562049865723, -9.201395034790039, -5.2292280197143555, -1.2570610046386719, 2.715106964111328, 6.687273025512695, 10.659439086914062, 14.631607055664062, 18.603775024414062, 22.57594108581543, 26.548107147216797, 30.520275115966797, 34.4924430847168, 38.46460723876953, 42.43677520751953, 46.40894317626953, 50.38111114501953, 54.35327911376953, 58.325443267822266, 62.297611236572266, 66.269775390625, 70.241943359375, 74.214111328125, 78.186279296875, 82.158447265625, 86.130615234375, 90.102783203125, 94.074951171875, 98.047119140625, 102.01927947998047, 105.99144744873047, 109.96361541748047]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 15.0, 12.0, 18.0, 26.0, 25.0, 28.0, 34.0, 31.0, 37.0, 44.0, 48.0, 53.0, 53.0, 44.0, 53.0, 52.0, 45.0, 46.0, 46.0, 29.0, 33.0, 34.0, 31.0, 23.0, 26.0, 20.0, 14.0, 14.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.145313262939453, -24.26028060913086, -23.375246047973633, -22.49021339416504, -21.605178833007812, -20.72014617919922, -19.835113525390625, -18.95008087158203, -18.065046310424805, -17.18001365661621, -16.294979095458984, -15.40994644165039, -14.52491283416748, -13.63987922668457, -12.754846572875977, -11.869812965393066, -10.984779357910156, -10.099745750427246, -9.214712142944336, -8.329679489135742, -7.444645881652832, -6.559612274169922, -5.67457914352417, -4.789546012878418, -3.904512405395508, -3.0194790363311768, -2.1344456672668457, -1.2494122982025146, -0.3643789291381836, 0.5206546783447266, 1.4056878089904785, 2.2907209396362305, 3.1757545471191406, 4.060788154602051, 4.945821285247803, 5.830854415893555, 6.715888023376465, 7.600921630859375, 8.485954284667969, 9.370987892150879, 10.256021499633789, 11.1410551071167, 12.02608871459961, 12.911121368408203, 13.796154975891113, 14.681188583374023, 15.566221237182617, 16.451255798339844, 17.336288452148438, 18.22132110595703, 19.106355667114258, 19.99138832092285, 20.876422882080078, 21.761455535888672, 22.646488189697266, 23.53152084350586, 24.416555404663086, 25.30158805847168, 26.186622619628906, 27.0716552734375, 27.956687927246094, 28.84172248840332, 29.726755142211914, 30.61178970336914, 31.496822357177734]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 8.0, 14.0, 19.0, 27.0, 24.0, 27.0, 33.0, 17.0, 34.0, 34.0, 30.0, 37.0, 28.0, 43.0, 54.0, 27.0, 39.0, 39.0, 39.0, 37.0, 40.0, 26.0, 31.0, 21.0, 30.0, 23.0, 21.0, 21.0, 25.0, 12.0, 16.0, 21.0, 8.0, 15.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.609375, -3.4932861328125, -3.377197265625, -3.2611083984375, -3.14501953125, -3.0289306640625, -2.912841796875, -2.7967529296875, -2.6806640625, -2.5645751953125, -2.448486328125, -2.3323974609375, -2.21630859375, -2.1002197265625, -1.984130859375, -1.8680419921875, -1.751953125, -1.6358642578125, -1.519775390625, -1.4036865234375, -1.28759765625, -1.1715087890625, -1.055419921875, -0.9393310546875, -0.8232421875, -0.7071533203125, -0.591064453125, -0.4749755859375, -0.35888671875, -0.2427978515625, -0.126708984375, -0.0106201171875, 0.10546875, 0.2215576171875, 0.337646484375, 0.4537353515625, 0.56982421875, 0.6859130859375, 0.802001953125, 0.9180908203125, 1.0341796875, 1.1502685546875, 1.266357421875, 1.3824462890625, 1.49853515625, 1.6146240234375, 1.730712890625, 1.8468017578125, 1.962890625, 2.0789794921875, 2.195068359375, 2.3111572265625, 2.42724609375, 2.5433349609375, 2.659423828125, 2.7755126953125, 2.8916015625, 3.0076904296875, 3.123779296875, 3.2398681640625, 3.35595703125, 3.4720458984375, 3.588134765625, 3.7042236328125, 3.8203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 13.0, 11.0, 8.0, 22.0, 42.0, 56.0, 96.0, 115.0, 200.0, 287.0, 440.0, 656.0, 1028.0, 1582.0, 2501.0, 3961.0, 6218.0, 9851.0, 15990.0, 25709.0, 42736.0, 75367.0, 145311.0, 302290.0, 189327.0, 92738.0, 51379.0, 30403.0, 18373.0, 11559.0, 7348.0, 4567.0, 2996.0, 1805.0, 1195.0, 778.0, 527.0, 370.0, 211.0, 148.0, 110.0, 64.0, 51.0, 30.0, 13.0, 16.0, 15.0, 10.0, 12.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.70166015625, -0.67950439453125, -0.6573486328125, -0.63519287109375, -0.613037109375, -0.59088134765625, -0.5687255859375, -0.54656982421875, -0.5244140625, -0.50225830078125, -0.4801025390625, -0.45794677734375, -0.435791015625, -0.41363525390625, -0.3914794921875, -0.36932373046875, -0.34716796875, -0.32501220703125, -0.3028564453125, -0.28070068359375, -0.258544921875, -0.23638916015625, -0.2142333984375, -0.19207763671875, -0.169921875, -0.14776611328125, -0.1256103515625, -0.10345458984375, -0.081298828125, -0.05914306640625, -0.0369873046875, -0.01483154296875, 0.00732421875, 0.02947998046875, 0.0516357421875, 0.07379150390625, 0.095947265625, 0.11810302734375, 0.1402587890625, 0.16241455078125, 0.1845703125, 0.20672607421875, 0.2288818359375, 0.25103759765625, 0.273193359375, 0.29534912109375, 0.3175048828125, 0.33966064453125, 0.36181640625, 0.38397216796875, 0.4061279296875, 0.42828369140625, 0.450439453125, 0.47259521484375, 0.4947509765625, 0.51690673828125, 0.5390625, 0.56121826171875, 0.5833740234375, 0.60552978515625, 0.627685546875, 0.64984130859375, 0.6719970703125, 0.69415283203125, 0.71630859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 10.0, 11.0, 11.0, 7.0, 14.0, 17.0, 16.0, 20.0, 24.0, 32.0, 27.0, 41.0, 34.0, 29.0, 31.0, 40.0, 45.0, 52.0, 1063.0, 42.0, 33.0, 54.0, 33.0, 24.0, 36.0, 40.0, 31.0, 32.0, 30.0, 29.0, 16.0, 13.0, 16.0, 12.0, 20.0, 12.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.658203125, -2.574371337890625, -2.49053955078125, -2.406707763671875, -2.3228759765625, -2.239044189453125, -2.15521240234375, -2.071380615234375, -1.987548828125, -1.903717041015625, -1.81988525390625, -1.736053466796875, -1.6522216796875, -1.568389892578125, -1.48455810546875, -1.400726318359375, -1.31689453125, -1.233062744140625, -1.14923095703125, -1.065399169921875, -0.9815673828125, -0.897735595703125, -0.81390380859375, -0.730072021484375, -0.646240234375, -0.562408447265625, -0.47857666015625, -0.394744873046875, -0.3109130859375, -0.227081298828125, -0.14324951171875, -0.059417724609375, 0.0244140625, 0.108245849609375, 0.19207763671875, 0.275909423828125, 0.3597412109375, 0.443572998046875, 0.52740478515625, 0.611236572265625, 0.695068359375, 0.778900146484375, 0.86273193359375, 0.946563720703125, 1.0303955078125, 1.114227294921875, 1.19805908203125, 1.281890869140625, 1.36572265625, 1.449554443359375, 1.53338623046875, 1.617218017578125, 1.7010498046875, 1.784881591796875, 1.86871337890625, 1.952545166015625, 2.036376953125, 2.120208740234375, 2.20404052734375, 2.287872314453125, 2.3717041015625, 2.455535888671875, 2.53936767578125, 2.623199462890625, 2.70703125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 7.0, 8.0, 15.0, 19.0, 33.0, 38.0, 75.0, 81.0, 93.0, 125.0, 174.0, 228.0, 298.0, 480.0, 674.0, 931.0, 1338.0, 1886.0, 2751.0, 3921.0, 5811.0, 8560.0, 12294.0, 18036.0, 26877.0, 40322.0, 63808.0, 110094.0, 1283007.0, 224052.0, 107180.0, 61217.0, 39751.0, 26644.0, 17700.0, 12065.0, 8044.0, 5598.0, 3882.0, 2649.0, 1814.0, 1304.0, 939.0, 686.0, 502.0, 324.0, 241.0, 183.0, 100.0, 68.0, 61.0, 32.0, 33.0, 27.0, 23.0, 13.0, 14.0, 4.0, 5.0, 0.0, 4.0], "bins": [-0.587890625, -0.5695037841796875, -0.551116943359375, -0.5327301025390625, -0.51434326171875, -0.4959564208984375, -0.477569580078125, -0.4591827392578125, -0.4407958984375, -0.4224090576171875, -0.404022216796875, -0.3856353759765625, -0.36724853515625, -0.3488616943359375, -0.330474853515625, -0.3120880126953125, -0.293701171875, -0.2753143310546875, -0.256927490234375, -0.2385406494140625, -0.22015380859375, -0.2017669677734375, -0.183380126953125, -0.1649932861328125, -0.1466064453125, -0.1282196044921875, -0.109832763671875, -0.0914459228515625, -0.07305908203125, -0.0546722412109375, -0.036285400390625, -0.0178985595703125, 0.00048828125, 0.0188751220703125, 0.037261962890625, 0.0556488037109375, 0.07403564453125, 0.0924224853515625, 0.110809326171875, 0.1291961669921875, 0.1475830078125, 0.1659698486328125, 0.184356689453125, 0.2027435302734375, 0.22113037109375, 0.2395172119140625, 0.257904052734375, 0.2762908935546875, 0.294677734375, 0.3130645751953125, 0.331451416015625, 0.3498382568359375, 0.36822509765625, 0.3866119384765625, 0.404998779296875, 0.4233856201171875, 0.4417724609375, 0.4601593017578125, 0.478546142578125, 0.4969329833984375, 0.51531982421875, 0.5337066650390625, 0.552093505859375, 0.5704803466796875, 0.5888671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 10.0, 7.0, 10.0, 12.0, 27.0, 24.0, 28.0, 35.0, 36.0, 44.0, 50.0, 56.0, 60.0, 68.0, 67.0, 65.0, 62.0, 61.0, 48.0, 33.0, 39.0, 20.0, 28.0, 24.0, 13.0, 7.0, 6.0, 8.0, 8.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0001659393310546875, -0.00016099214553833008, -0.00015604496002197266, -0.00015109777450561523, -0.0001461505889892578, -0.0001412034034729004, -0.00013625621795654297, -0.00013130903244018555, -0.00012636184692382812, -0.0001214146614074707, -0.00011646747589111328, -0.00011152029037475586, -0.00010657310485839844, -0.00010162591934204102, -9.66787338256836e-05, -9.173154830932617e-05, -8.678436279296875e-05, -8.183717727661133e-05, -7.68899917602539e-05, -7.194280624389648e-05, -6.699562072753906e-05, -6.204843521118164e-05, -5.710124969482422e-05, -5.21540641784668e-05, -4.7206878662109375e-05, -4.225969314575195e-05, -3.731250762939453e-05, -3.236532211303711e-05, -2.7418136596679688e-05, -2.2470951080322266e-05, -1.7523765563964844e-05, -1.2576580047607422e-05, -7.62939453125e-06, -2.682209014892578e-06, 2.2649765014648438e-06, 7.212162017822266e-06, 1.2159347534179688e-05, 1.710653305053711e-05, 2.205371856689453e-05, 2.7000904083251953e-05, 3.1948089599609375e-05, 3.68952751159668e-05, 4.184246063232422e-05, 4.678964614868164e-05, 5.173683166503906e-05, 5.6684017181396484e-05, 6.16312026977539e-05, 6.657838821411133e-05, 7.152557373046875e-05, 7.647275924682617e-05, 8.14199447631836e-05, 8.636713027954102e-05, 9.131431579589844e-05, 9.626150131225586e-05, 0.00010120868682861328, 0.0001061558723449707, 0.00011110305786132812, 0.00011605024337768555, 0.00012099742889404297, 0.0001259446144104004, 0.0001308917999267578, 0.00013583898544311523, 0.00014078617095947266, 0.00014573335647583008, 0.0001506805419921875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 3.0, 12.0, 12.0, 8.0, 10.0, 17.0, 33.0, 38.0, 43.0, 64.0, 75.0, 122.0, 215.0, 535.0, 2852.0, 1038074.0, 5030.0, 594.0, 269.0, 126.0, 100.0, 83.0, 47.0, 36.0, 29.0, 29.0, 22.0, 9.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00345611572265625, -0.0033429861068725586, -0.003229856491088867, -0.0031167268753051758, -0.0030035972595214844, -0.002890467643737793, -0.0027773380279541016, -0.00266420841217041, -0.0025510787963867188, -0.0024379491806030273, -0.002324819564819336, -0.0022116899490356445, -0.002098560333251953, -0.0019854307174682617, -0.0018723011016845703, -0.001759171485900879, -0.0016460418701171875, -0.001532912254333496, -0.0014197826385498047, -0.0013066530227661133, -0.0011935234069824219, -0.0010803937911987305, -0.0009672641754150391, -0.0008541345596313477, -0.0007410049438476562, -0.0006278753280639648, -0.0005147457122802734, -0.00040161609649658203, -0.0002884864807128906, -0.00017535686492919922, -6.222724914550781e-05, 5.0902366638183594e-05, 0.000164031982421875, 0.0002771615982055664, 0.0003902912139892578, 0.0005034208297729492, 0.0006165504455566406, 0.000729680061340332, 0.0008428096771240234, 0.0009559392929077148, 0.0010690689086914062, 0.0011821985244750977, 0.001295328140258789, 0.0014084577560424805, 0.0015215873718261719, 0.0016347169876098633, 0.0017478466033935547, 0.001860976219177246, 0.0019741058349609375, 0.002087235450744629, 0.0022003650665283203, 0.0023134946823120117, 0.002426624298095703, 0.0025397539138793945, 0.002652883529663086, 0.0027660131454467773, 0.0028791427612304688, 0.00299227237701416, 0.0031054019927978516, 0.003218531608581543, 0.0033316612243652344, 0.0034447908401489258, 0.003557920455932617, 0.0036710500717163086, 0.0037841796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 19.0, 47.0, 45.0, 97.0, 148.0, 178.0, 164.0, 124.0, 87.0, 44.0, 29.0, 7.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00017212591774296016, -0.00016852229600772262, -0.0001649186888244003, -0.00016131506708916277, -0.00015771145990584046, -0.00015410783817060292, -0.0001505042309872806, -0.00014690060925204307, -0.00014329700206872076, -0.00013969338033348322, -0.0001360897731501609, -0.00013248615141492337, -0.00012888254423160106, -0.00012527892249636352, -0.00012167531531304121, -0.00011807169357780367, -0.00011446807911852375, -0.00011086446465924382, -0.0001072608501999639, -0.00010365723574068397, -0.00010005362128140405, -9.645000682212412e-05, -9.284638508688658e-05, -8.924277790356427e-05, -8.563915616832674e-05, -8.203554170904681e-05, -7.843192724976689e-05, -7.482831279048696e-05, -7.122469833120704e-05, -6.762108387192711e-05, -6.401746941264719e-05, -6.0413851315388456e-05, -5.6810244132066146e-05, -5.320662967278622e-05, -4.9603015213506296e-05, -4.5999397116247565e-05, -4.239578265696764e-05, -3.8792168197687715e-05, -3.518855373840779e-05, -3.1584939279127866e-05, -2.798132481984794e-05, -2.4377710360568017e-05, -2.0774095901288092e-05, -1.7170479623018764e-05, -1.356686516373884e-05, -9.963250704458915e-06, -6.3596344261895865e-06, -2.756019966909662e-06, 8.475944923702627e-07, 4.451209406397538e-06, 8.054824320424814e-06, 1.165843968919944e-05, 1.5262054148479365e-05, 1.886566860775929e-05, 2.2469284886028618e-05, 2.6072899345308542e-05, 2.9676513804588467e-05, 3.328012826386839e-05, 3.6883742723148316e-05, 4.048735718242824e-05, 4.4090971641708165e-05, 4.769458610098809e-05, 5.129820419824682e-05, 5.4901818657526746e-05, 5.850543311680667e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 10.0, 11.0, 16.0, 15.0, 19.0, 17.0, 21.0, 12.0, 27.0, 38.0, 24.0, 36.0, 31.0, 39.0, 46.0, 40.0, 38.0, 38.0, 45.0, 38.0, 37.0, 39.0, 41.0, 26.0, 32.0, 46.0, 26.0, 36.0, 18.0, 16.0, 22.0, 19.0, 12.0, 11.0, 11.0, 5.0, 8.0, 4.0, 6.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.396936416625977e-05, -7.145106792449951e-05, -6.893277168273926e-05, -6.6414475440979e-05, -6.389617919921875e-05, -6.13778829574585e-05, -5.885958671569824e-05, -5.634129047393799e-05, -5.3822994232177734e-05, -5.130469799041748e-05, -4.8786401748657227e-05, -4.626810550689697e-05, -4.374980926513672e-05, -4.1231513023376465e-05, -3.871321678161621e-05, -3.619492053985596e-05, -3.36766242980957e-05, -3.115832805633545e-05, -2.8640031814575195e-05, -2.612173557281494e-05, -2.3603439331054688e-05, -2.1085143089294434e-05, -1.856684684753418e-05, -1.6048550605773926e-05, -1.3530254364013672e-05, -1.1011958122253418e-05, -8.493661880493164e-06, -5.97536563873291e-06, -3.4570693969726562e-06, -9.387731552124023e-07, 1.5795230865478516e-06, 4.0978193283081055e-06, 6.616115570068359e-06, 9.134411811828613e-06, 1.1652708053588867e-05, 1.4171004295349121e-05, 1.6689300537109375e-05, 1.920759677886963e-05, 2.1725893020629883e-05, 2.4244189262390137e-05, 2.676248550415039e-05, 2.9280781745910645e-05, 3.17990779876709e-05, 3.431737422943115e-05, 3.6835670471191406e-05, 3.935396671295166e-05, 4.1872262954711914e-05, 4.439055919647217e-05, 4.690885543823242e-05, 4.9427151679992676e-05, 5.194544792175293e-05, 5.4463744163513184e-05, 5.698204040527344e-05, 5.950033664703369e-05, 6.201863288879395e-05, 6.45369291305542e-05, 6.705522537231445e-05, 6.957352161407471e-05, 7.209181785583496e-05, 7.461011409759521e-05, 7.712841033935547e-05, 7.964670658111572e-05, 8.216500282287598e-05, 8.468329906463623e-05, 8.720159530639648e-05]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 9.0, 5.0, 13.0, 9.0, 8.0, 14.0, 19.0, 27.0, 24.0, 27.0, 33.0, 17.0, 34.0, 34.0, 30.0, 37.0, 28.0, 43.0, 54.0, 27.0, 39.0, 39.0, 39.0, 37.0, 40.0, 26.0, 31.0, 21.0, 30.0, 23.0, 21.0, 21.0, 25.0, 12.0, 16.0, 21.0, 8.0, 15.0, 12.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.609375, -3.4932861328125, -3.377197265625, -3.2611083984375, -3.14501953125, -3.0289306640625, -2.912841796875, -2.7967529296875, -2.6806640625, -2.5645751953125, -2.448486328125, -2.3323974609375, -2.21630859375, -2.1002197265625, -1.984130859375, -1.8680419921875, -1.751953125, -1.6358642578125, -1.519775390625, -1.4036865234375, -1.28759765625, -1.1715087890625, -1.055419921875, -0.9393310546875, -0.8232421875, -0.7071533203125, -0.591064453125, -0.4749755859375, -0.35888671875, -0.2427978515625, -0.126708984375, -0.0106201171875, 0.10546875, 0.2215576171875, 0.337646484375, 0.4537353515625, 0.56982421875, 0.6859130859375, 0.802001953125, 0.9180908203125, 1.0341796875, 1.1502685546875, 1.266357421875, 1.3824462890625, 1.49853515625, 1.6146240234375, 1.730712890625, 1.8468017578125, 1.962890625, 2.0789794921875, 2.195068359375, 2.3111572265625, 2.42724609375, 2.5433349609375, 2.659423828125, 2.7755126953125, 2.8916015625, 3.0076904296875, 3.123779296875, 3.2398681640625, 3.35595703125, 3.4720458984375, 3.588134765625, 3.7042236328125, 3.8203125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 4.0, 7.0, 16.0, 10.0, 11.0, 22.0, 31.0, 50.0, 54.0, 68.0, 93.0, 106.0, 156.0, 250.0, 439.0, 923.0, 2376.0, 6225.0, 16749.0, 45198.0, 115421.0, 278323.0, 347228.0, 143335.0, 56751.0, 21298.0, 7899.0, 2887.0, 1156.0, 494.0, 277.0, 167.0, 117.0, 93.0, 75.0, 47.0, 38.0, 39.0, 23.0, 22.0, 15.0, 12.0, 9.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.84765625, -3.71990966796875, -3.5921630859375, -3.46441650390625, -3.336669921875, -3.20892333984375, -3.0811767578125, -2.95343017578125, -2.82568359375, -2.69793701171875, -2.5701904296875, -2.44244384765625, -2.314697265625, -2.18695068359375, -2.0592041015625, -1.93145751953125, -1.8037109375, -1.67596435546875, -1.5482177734375, -1.42047119140625, -1.292724609375, -1.16497802734375, -1.0372314453125, -0.90948486328125, -0.78173828125, -0.65399169921875, -0.5262451171875, -0.39849853515625, -0.270751953125, -0.14300537109375, -0.0152587890625, 0.11248779296875, 0.240234375, 0.36798095703125, 0.4957275390625, 0.62347412109375, 0.751220703125, 0.87896728515625, 1.0067138671875, 1.13446044921875, 1.26220703125, 1.38995361328125, 1.5177001953125, 1.64544677734375, 1.773193359375, 1.90093994140625, 2.0286865234375, 2.15643310546875, 2.2841796875, 2.41192626953125, 2.5396728515625, 2.66741943359375, 2.795166015625, 2.92291259765625, 3.0506591796875, 3.17840576171875, 3.30615234375, 3.43389892578125, 3.5616455078125, 3.68939208984375, 3.817138671875, 3.94488525390625, 4.0726318359375, 4.20037841796875, 4.328125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 3.0, 0.0, 4.0, 5.0, 12.0, 11.0, 11.0, 8.0, 16.0, 21.0, 21.0, 20.0, 27.0, 22.0, 37.0, 41.0, 41.0, 57.0, 65.0, 166.0, 1440.0, 415.0, 128.0, 75.0, 50.0, 58.0, 41.0, 42.0, 29.0, 33.0, 35.0, 15.0, 16.0, 9.0, 14.0, 9.0, 10.0, 9.0, 7.0, 9.0, 1.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.421875, -11.0272216796875, -10.632568359375, -10.2379150390625, -9.84326171875, -9.4486083984375, -9.053955078125, -8.6593017578125, -8.2646484375, -7.8699951171875, -7.475341796875, -7.0806884765625, -6.68603515625, -6.2913818359375, -5.896728515625, -5.5020751953125, -5.107421875, -4.7127685546875, -4.318115234375, -3.9234619140625, -3.52880859375, -3.1341552734375, -2.739501953125, -2.3448486328125, -1.9501953125, -1.5555419921875, -1.160888671875, -0.7662353515625, -0.37158203125, 0.0230712890625, 0.417724609375, 0.8123779296875, 1.20703125, 1.6016845703125, 1.996337890625, 2.3909912109375, 2.78564453125, 3.1802978515625, 3.574951171875, 3.9696044921875, 4.3642578125, 4.7589111328125, 5.153564453125, 5.5482177734375, 5.94287109375, 6.3375244140625, 6.732177734375, 7.1268310546875, 7.521484375, 7.9161376953125, 8.310791015625, 8.7054443359375, 9.10009765625, 9.4947509765625, 9.889404296875, 10.2840576171875, 10.6787109375, 11.0733642578125, 11.468017578125, 11.8626708984375, 12.25732421875, 12.6519775390625, 13.046630859375, 13.4412841796875, 13.8359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 7.0, 3.0, 4.0, 13.0, 20.0, 32.0, 25.0, 35.0, 32.0, 59.0, 96.0, 110.0, 187.0, 347.0, 779.0, 3974.0, 3117233.0, 20501.0, 1138.0, 451.0, 198.0, 137.0, 94.0, 67.0, 45.0, 29.0, 16.0, 20.0, 9.0, 13.0, 7.0, 10.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.4375, -48.7373046875, -47.037109375, -45.3369140625, -43.63671875, -41.9365234375, -40.236328125, -38.5361328125, -36.8359375, -35.1357421875, -33.435546875, -31.7353515625, -30.03515625, -28.3349609375, -26.634765625, -24.9345703125, -23.234375, -21.5341796875, -19.833984375, -18.1337890625, -16.43359375, -14.7333984375, -13.033203125, -11.3330078125, -9.6328125, -7.9326171875, -6.232421875, -4.5322265625, -2.83203125, -1.1318359375, 0.568359375, 2.2685546875, 3.96875, 5.6689453125, 7.369140625, 9.0693359375, 10.76953125, 12.4697265625, 14.169921875, 15.8701171875, 17.5703125, 19.2705078125, 20.970703125, 22.6708984375, 24.37109375, 26.0712890625, 27.771484375, 29.4716796875, 31.171875, 32.8720703125, 34.572265625, 36.2724609375, 37.97265625, 39.6728515625, 41.373046875, 43.0732421875, 44.7734375, 46.4736328125, 48.173828125, 49.8740234375, 51.57421875, 53.2744140625, 54.974609375, 56.6748046875, 58.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 21.0, 55.0, 128.0, 214.0, 257.0, 196.0, 90.0, 35.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.67979621887207, -16.764461517333984, -15.849126815795898, -14.933792114257812, -14.018457412719727, -13.10312271118164, -12.187788009643555, -11.272453308105469, -10.357118606567383, -9.441783905029297, -8.526449203491211, -7.611114501953125, -6.695779800415039, -5.780445098876953, -4.865110397338867, -3.9497756958007812, -3.0344409942626953, -2.1191062927246094, -1.2037715911865234, -0.2884368896484375, 0.6268978118896484, 1.5422325134277344, 2.4575672149658203, 3.3729019165039062, 4.288236618041992, 5.203571319580078, 6.118906021118164, 7.03424072265625, 7.949575424194336, 8.864910125732422, 9.780244827270508, 10.695579528808594, 11.610912322998047, 12.526247024536133, 13.441581726074219, 14.356916427612305, 15.27225112915039, 16.187585830688477, 17.102920532226562, 18.01825523376465, 18.933589935302734, 19.84892463684082, 20.764259338378906, 21.679594039916992, 22.594928741455078, 23.510263442993164, 24.42559814453125, 25.340932846069336, 26.256267547607422, 27.171602249145508, 28.086936950683594, 29.00227165222168, 29.917606353759766, 30.83294105529785, 31.748275756835938, 32.663612365722656, 33.57894515991211, 34.49427795410156, 35.40961456298828, 36.324951171875, 37.24028396606445, 38.155616760253906, 39.070953369140625, 39.986289978027344, 40.9016227722168]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 9.0, 10.0, 12.0, 11.0, 13.0, 14.0, 27.0, 32.0, 27.0, 36.0, 34.0, 46.0, 37.0, 31.0, 28.0, 39.0, 55.0, 42.0, 37.0, 48.0, 44.0, 38.0, 44.0, 37.0, 31.0, 27.0, 24.0, 25.0, 22.0, 26.0, 18.0, 9.0, 13.0, 7.0, 4.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.4241828918457, -31.450801849365234, -30.477420806884766, -29.504039764404297, -28.530658721923828, -27.55727767944336, -26.583898544311523, -25.610517501831055, -24.637136459350586, -23.663755416870117, -22.69037437438965, -21.71699333190918, -20.743614196777344, -19.770233154296875, -18.796852111816406, -17.823471069335938, -16.85009002685547, -15.876708984375, -14.903327941894531, -13.929947853088379, -12.95656681060791, -11.983185768127441, -11.009805679321289, -10.03642463684082, -9.063043594360352, -8.089662551879883, -7.116281986236572, -6.142901420593262, -5.169520378112793, -4.196139335632324, -3.2227587699890137, -2.249378204345703, -1.2759971618652344, -0.3026163578033447, 0.6707644462585449, 1.6441452503204346, 2.617526054382324, 3.590907096862793, 4.5642876625061035, 5.537668228149414, 6.511049270629883, 7.484430313110352, 8.45781135559082, 9.431191444396973, 10.404572486877441, 11.37795352935791, 12.351333618164062, 13.324714660644531, 14.298095703125, 15.271476745605469, 16.244857788085938, 17.218238830566406, 18.191619873046875, 19.165000915527344, 20.13838005065918, 21.11176109313965, 22.085142135620117, 23.058523178100586, 24.031904220581055, 25.005285263061523, 25.97866439819336, 26.952045440673828, 27.925426483154297, 28.898807525634766, 29.872188568115234]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 7.0, 8.0, 8.0, 6.0, 7.0, 10.0, 14.0, 12.0, 24.0, 25.0, 20.0, 26.0, 26.0, 40.0, 22.0, 27.0, 41.0, 33.0, 27.0, 47.0, 39.0, 36.0, 38.0, 26.0, 38.0, 45.0, 40.0, 31.0, 22.0, 33.0, 22.0, 26.0, 26.0, 17.0, 17.0, 12.0, 13.0, 19.0, 13.0, 12.0, 13.0, 8.0, 3.0, 5.0, 6.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.70703125, -3.5831298828125, -3.459228515625, -3.3353271484375, -3.21142578125, -3.0875244140625, -2.963623046875, -2.8397216796875, -2.7158203125, -2.5919189453125, -2.468017578125, -2.3441162109375, -2.22021484375, -2.0963134765625, -1.972412109375, -1.8485107421875, -1.724609375, -1.6007080078125, -1.476806640625, -1.3529052734375, -1.22900390625, -1.1051025390625, -0.981201171875, -0.8572998046875, -0.7333984375, -0.6094970703125, -0.485595703125, -0.3616943359375, -0.23779296875, -0.1138916015625, 0.010009765625, 0.1339111328125, 0.2578125, 0.3817138671875, 0.505615234375, 0.6295166015625, 0.75341796875, 0.8773193359375, 1.001220703125, 1.1251220703125, 1.2490234375, 1.3729248046875, 1.496826171875, 1.6207275390625, 1.74462890625, 1.8685302734375, 1.992431640625, 2.1163330078125, 2.240234375, 2.3641357421875, 2.488037109375, 2.6119384765625, 2.73583984375, 2.8597412109375, 2.983642578125, 3.1075439453125, 3.2314453125, 3.3553466796875, 3.479248046875, 3.6031494140625, 3.72705078125, 3.8509521484375, 3.974853515625, 4.0987548828125, 4.22265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 9.0, 18.0, 19.0, 25.0, 31.0, 29.0, 41.0, 62.0, 66.0, 67.0, 95.0, 118.0, 152.0, 259.0, 923.0, 9554.0, 457803.0, 3304912.0, 409136.0, 8970.0, 924.0, 272.0, 155.0, 121.0, 71.0, 77.0, 56.0, 45.0, 48.0, 35.0, 35.0, 22.0, 15.0, 21.0, 10.0, 18.0, 4.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.359375, -11.9539794921875, -11.548583984375, -11.1431884765625, -10.73779296875, -10.3323974609375, -9.927001953125, -9.5216064453125, -9.1162109375, -8.7108154296875, -8.305419921875, -7.9000244140625, -7.49462890625, -7.0892333984375, -6.683837890625, -6.2784423828125, -5.873046875, -5.4676513671875, -5.062255859375, -4.6568603515625, -4.25146484375, -3.8460693359375, -3.440673828125, -3.0352783203125, -2.6298828125, -2.2244873046875, -1.819091796875, -1.4136962890625, -1.00830078125, -0.6029052734375, -0.197509765625, 0.2078857421875, 0.61328125, 1.0186767578125, 1.424072265625, 1.8294677734375, 2.23486328125, 2.6402587890625, 3.045654296875, 3.4510498046875, 3.8564453125, 4.2618408203125, 4.667236328125, 5.0726318359375, 5.47802734375, 5.8834228515625, 6.288818359375, 6.6942138671875, 7.099609375, 7.5050048828125, 7.910400390625, 8.3157958984375, 8.72119140625, 9.1265869140625, 9.531982421875, 9.9373779296875, 10.3427734375, 10.7481689453125, 11.153564453125, 11.5589599609375, 11.96435546875, 12.3697509765625, 12.775146484375, 13.1805419921875, 13.5859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 9.0, 6.0, 8.0, 6.0, 8.0, 12.0, 13.0, 23.0, 23.0, 41.0, 56.0, 76.0, 78.0, 139.0, 163.0, 214.0, 248.0, 319.0, 370.0, 382.0, 387.0, 350.0, 257.0, 210.0, 143.0, 115.0, 101.0, 63.0, 54.0, 47.0, 39.0, 29.0, 22.0, 18.0, 11.0, 3.0, 6.0, 10.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.7862548828125, -4.592041015625, -4.3978271484375, -4.20361328125, -4.0093994140625, -3.815185546875, -3.6209716796875, -3.4267578125, -3.2325439453125, -3.038330078125, -2.8441162109375, -2.64990234375, -2.4556884765625, -2.261474609375, -2.0672607421875, -1.873046875, -1.6788330078125, -1.484619140625, -1.2904052734375, -1.09619140625, -0.9019775390625, -0.707763671875, -0.5135498046875, -0.3193359375, -0.1251220703125, 0.069091796875, 0.2633056640625, 0.45751953125, 0.6517333984375, 0.845947265625, 1.0401611328125, 1.234375, 1.4285888671875, 1.622802734375, 1.8170166015625, 2.01123046875, 2.2054443359375, 2.399658203125, 2.5938720703125, 2.7880859375, 2.9822998046875, 3.176513671875, 3.3707275390625, 3.56494140625, 3.7591552734375, 3.953369140625, 4.1475830078125, 4.341796875, 4.5360107421875, 4.730224609375, 4.9244384765625, 5.11865234375, 5.3128662109375, 5.507080078125, 5.7012939453125, 5.8955078125, 6.0897216796875, 6.283935546875, 6.4781494140625, 6.67236328125, 6.8665771484375, 7.060791015625, 7.2550048828125, 7.44921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 3.0, 11.0, 13.0, 24.0, 18.0, 39.0, 43.0, 63.0, 65.0, 110.0, 127.0, 162.0, 198.0, 271.0, 409.0, 836.0, 42163.0, 4076390.0, 70640.0, 975.0, 405.0, 313.0, 243.0, 185.0, 149.0, 110.0, 70.0, 56.0, 40.0, 40.0, 22.0, 13.0, 12.0, 9.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0], "bins": [-39.28125, -38.261962890625, -37.24267578125, -36.223388671875, -35.2041015625, -34.184814453125, -33.16552734375, -32.146240234375, -31.126953125, -30.107666015625, -29.08837890625, -28.069091796875, -27.0498046875, -26.030517578125, -25.01123046875, -23.991943359375, -22.97265625, -21.953369140625, -20.93408203125, -19.914794921875, -18.8955078125, -17.876220703125, -16.85693359375, -15.837646484375, -14.818359375, -13.799072265625, -12.77978515625, -11.760498046875, -10.7412109375, -9.721923828125, -8.70263671875, -7.683349609375, -6.6640625, -5.644775390625, -4.62548828125, -3.606201171875, -2.5869140625, -1.567626953125, -0.54833984375, 0.470947265625, 1.490234375, 2.509521484375, 3.52880859375, 4.548095703125, 5.5673828125, 6.586669921875, 7.60595703125, 8.625244140625, 9.64453125, 10.663818359375, 11.68310546875, 12.702392578125, 13.7216796875, 14.740966796875, 15.76025390625, 16.779541015625, 17.798828125, 18.818115234375, 19.83740234375, 20.856689453125, 21.8759765625, 22.895263671875, 23.91455078125, 24.933837890625, 25.953125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 25.0, 177.0, 391.0, 309.0, 98.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.38491439819336, -19.52646827697754, -16.66802215576172, -13.809574127197266, -10.951128005981445, -8.092681884765625, -5.234233856201172, -2.3757877349853516, 0.48265838623046875, 3.3411049842834473, 6.199551582336426, 9.057998657226562, 11.916444778442383, 14.774890899658203, 17.633338928222656, 20.491785049438477, 23.350231170654297, 26.208677291870117, 29.067123413085938, 31.92557144165039, 34.784019470214844, 37.64246368408203, 40.500911712646484, 43.35935974121094, 46.217803955078125, 49.07625198364258, 51.934696197509766, 54.79314422607422, 57.651588439941406, 60.51003646850586, 63.36848449707031, 66.2269287109375, 69.08537292480469, 71.94381713867188, 74.8022689819336, 77.66071319580078, 80.51915740966797, 83.37760925292969, 86.23605346679688, 89.09449768066406, 91.95294189453125, 94.81138610839844, 97.66983795166016, 100.52828216552734, 103.38672637939453, 106.24517822265625, 109.10362243652344, 111.96206665039062, 114.82051849365234, 117.67896270751953, 120.53741455078125, 123.39585876464844, 126.25430297851562, 129.1127471923828, 131.97119140625, 134.82965087890625, 137.68809509277344, 140.54653930664062, 143.4049835205078, 146.263427734375, 149.12188720703125, 151.98033142089844, 154.83877563476562, 157.6972198486328, 160.5556640625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 4.0, 12.0, 18.0, 19.0, 21.0, 23.0, 19.0, 17.0, 30.0, 24.0, 37.0, 34.0, 39.0, 36.0, 50.0, 43.0, 41.0, 42.0, 53.0, 38.0, 42.0, 38.0, 37.0, 25.0, 30.0, 24.0, 30.0, 24.0, 24.0, 16.0, 9.0, 20.0, 15.0, 10.0, 7.0, 11.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.612600326538086, -23.874149322509766, -23.135698318481445, -22.397247314453125, -21.658796310424805, -20.920345306396484, -20.181894302368164, -19.443443298339844, -18.704992294311523, -17.966541290283203, -17.228090286254883, -16.489639282226562, -15.751188278198242, -15.012737274169922, -14.274286270141602, -13.535835266113281, -12.797384262084961, -12.05893325805664, -11.32048225402832, -10.58203125, -9.84358024597168, -9.10512924194336, -8.366678237915039, -7.628227233886719, -6.889776229858398, -6.151325225830078, -5.412874221801758, -4.6744232177734375, -3.935972213745117, -3.197521209716797, -2.4590702056884766, -1.7206192016601562, -0.9821662902832031, -0.2437152862548828, 0.4947357177734375, 1.2331867218017578, 1.9716377258300781, 2.7100887298583984, 3.4485397338867188, 4.186990737915039, 4.925441741943359, 5.66389274597168, 6.40234375, 7.14079475402832, 7.879245758056641, 8.617696762084961, 9.356147766113281, 10.094598770141602, 10.833049774169922, 11.571500778198242, 12.309951782226562, 13.048402786254883, 13.786853790283203, 14.525304794311523, 15.263755798339844, 16.002206802368164, 16.740657806396484, 17.479108810424805, 18.217559814453125, 18.956010818481445, 19.694461822509766, 20.432912826538086, 21.171363830566406, 21.909814834594727, 22.648265838623047]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 7.0, 18.0, 24.0, 23.0, 19.0, 26.0, 22.0, 24.0, 23.0, 29.0, 32.0, 28.0, 37.0, 42.0, 36.0, 41.0, 39.0, 33.0, 29.0, 33.0, 28.0, 30.0, 33.0, 26.0, 34.0, 21.0, 27.0, 25.0, 25.0, 18.0, 23.0, 15.0, 20.0, 11.0, 11.0, 7.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.7734375, -3.6602783203125, -3.547119140625, -3.4339599609375, -3.32080078125, -3.2076416015625, -3.094482421875, -2.9813232421875, -2.8681640625, -2.7550048828125, -2.641845703125, -2.5286865234375, -2.41552734375, -2.3023681640625, -2.189208984375, -2.0760498046875, -1.962890625, -1.8497314453125, -1.736572265625, -1.6234130859375, -1.51025390625, -1.3970947265625, -1.283935546875, -1.1707763671875, -1.0576171875, -0.9444580078125, -0.831298828125, -0.7181396484375, -0.60498046875, -0.4918212890625, -0.378662109375, -0.2655029296875, -0.15234375, -0.0391845703125, 0.073974609375, 0.1871337890625, 0.30029296875, 0.4134521484375, 0.526611328125, 0.6397705078125, 0.7529296875, 0.8660888671875, 0.979248046875, 1.0924072265625, 1.20556640625, 1.3187255859375, 1.431884765625, 1.5450439453125, 1.658203125, 1.7713623046875, 1.884521484375, 1.9976806640625, 2.11083984375, 2.2239990234375, 2.337158203125, 2.4503173828125, 2.5634765625, 2.6766357421875, 2.789794921875, 2.9029541015625, 3.01611328125, 3.1292724609375, 3.242431640625, 3.3555908203125, 3.46875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 19.0, 25.0, 42.0, 62.0, 84.0, 120.0, 151.0, 260.0, 352.0, 507.0, 688.0, 1011.0, 1506.0, 2230.0, 3264.0, 4652.0, 7097.0, 10605.0, 15781.0, 23820.0, 35868.0, 54690.0, 88325.0, 152243.0, 249742.0, 148529.0, 85824.0, 54057.0, 35536.0, 23500.0, 15678.0, 10435.0, 7023.0, 4729.0, 3144.0, 2149.0, 1497.0, 1033.0, 669.0, 448.0, 375.0, 242.0, 174.0, 117.0, 79.0, 53.0, 32.0, 33.0, 12.0, 7.0, 13.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.573944091796875, -0.55511474609375, -0.536285400390625, -0.5174560546875, -0.498626708984375, -0.47979736328125, -0.460968017578125, -0.442138671875, -0.423309326171875, -0.40447998046875, -0.385650634765625, -0.3668212890625, -0.347991943359375, -0.32916259765625, -0.310333251953125, -0.29150390625, -0.272674560546875, -0.25384521484375, -0.235015869140625, -0.2161865234375, -0.197357177734375, -0.17852783203125, -0.159698486328125, -0.140869140625, -0.122039794921875, -0.10321044921875, -0.084381103515625, -0.0655517578125, -0.046722412109375, -0.02789306640625, -0.009063720703125, 0.009765625, 0.028594970703125, 0.04742431640625, 0.066253662109375, 0.0850830078125, 0.103912353515625, 0.12274169921875, 0.141571044921875, 0.160400390625, 0.179229736328125, 0.19805908203125, 0.216888427734375, 0.2357177734375, 0.254547119140625, 0.27337646484375, 0.292205810546875, 0.31103515625, 0.329864501953125, 0.34869384765625, 0.367523193359375, 0.3863525390625, 0.405181884765625, 0.42401123046875, 0.442840576171875, 0.461669921875, 0.480499267578125, 0.49932861328125, 0.518157958984375, 0.5369873046875, 0.555816650390625, 0.57464599609375, 0.593475341796875, 0.6123046875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 4.0, 14.0, 15.0, 9.0, 8.0, 23.0, 19.0, 20.0, 34.0, 26.0, 41.0, 44.0, 38.0, 31.0, 52.0, 40.0, 51.0, 1069.0, 46.0, 37.0, 50.0, 39.0, 47.0, 40.0, 40.0, 25.0, 32.0, 17.0, 17.0, 22.0, 12.0, 7.0, 12.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.76025390625, -2.6689453125, -2.57763671875, -2.486328125, -2.39501953125, -2.3037109375, -2.21240234375, -2.12109375, -2.02978515625, -1.9384765625, -1.84716796875, -1.755859375, -1.66455078125, -1.5732421875, -1.48193359375, -1.390625, -1.29931640625, -1.2080078125, -1.11669921875, -1.025390625, -0.93408203125, -0.8427734375, -0.75146484375, -0.66015625, -0.56884765625, -0.4775390625, -0.38623046875, -0.294921875, -0.20361328125, -0.1123046875, -0.02099609375, 0.0703125, 0.16162109375, 0.2529296875, 0.34423828125, 0.435546875, 0.52685546875, 0.6181640625, 0.70947265625, 0.80078125, 0.89208984375, 0.9833984375, 1.07470703125, 1.166015625, 1.25732421875, 1.3486328125, 1.43994140625, 1.53125, 1.62255859375, 1.7138671875, 1.80517578125, 1.896484375, 1.98779296875, 2.0791015625, 2.17041015625, 2.26171875, 2.35302734375, 2.4443359375, 2.53564453125, 2.626953125, 2.71826171875, 2.8095703125, 2.90087890625, 2.9921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 8.0, 2.0, 8.0, 5.0, 12.0, 6.0, 30.0, 27.0, 48.0, 76.0, 134.0, 156.0, 272.0, 411.0, 576.0, 837.0, 1210.0, 1838.0, 2604.0, 3868.0, 5675.0, 8281.0, 12679.0, 18822.0, 29571.0, 46929.0, 79271.0, 149763.0, 1339434.0, 166250.0, 85518.0, 50654.0, 31304.0, 20156.0, 13057.0, 8719.0, 6085.0, 4072.0, 2782.0, 1880.0, 1359.0, 888.0, 610.0, 390.0, 281.0, 199.0, 118.0, 98.0, 62.0, 39.0, 21.0, 18.0, 12.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.64208984375, -0.62237548828125, -0.6026611328125, -0.58294677734375, -0.563232421875, -0.54351806640625, -0.5238037109375, -0.50408935546875, -0.484375, -0.46466064453125, -0.4449462890625, -0.42523193359375, -0.405517578125, -0.38580322265625, -0.3660888671875, -0.34637451171875, -0.32666015625, -0.30694580078125, -0.2872314453125, -0.26751708984375, -0.247802734375, -0.22808837890625, -0.2083740234375, -0.18865966796875, -0.1689453125, -0.14923095703125, -0.1295166015625, -0.10980224609375, -0.090087890625, -0.07037353515625, -0.0506591796875, -0.03094482421875, -0.01123046875, 0.00848388671875, 0.0281982421875, 0.04791259765625, 0.067626953125, 0.08734130859375, 0.1070556640625, 0.12677001953125, 0.146484375, 0.16619873046875, 0.1859130859375, 0.20562744140625, 0.225341796875, 0.24505615234375, 0.2647705078125, 0.28448486328125, 0.30419921875, 0.32391357421875, 0.3436279296875, 0.36334228515625, 0.383056640625, 0.40277099609375, 0.4224853515625, 0.44219970703125, 0.4619140625, 0.48162841796875, 0.5013427734375, 0.52105712890625, 0.540771484375, 0.56048583984375, 0.5802001953125, 0.59991455078125, 0.61962890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 5.0, 10.0, 17.0, 22.0, 32.0, 30.0, 44.0, 55.0, 68.0, 63.0, 59.0, 62.0, 63.0, 55.0, 71.0, 63.0, 47.0, 40.0, 32.0, 24.0, 25.0, 23.0, 14.0, 11.0, 6.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011867284774780273, -0.0001133875921368599, -0.00010810233652591705, -0.00010281708091497421, -9.753182530403137e-05, -9.224656969308853e-05, -8.696131408214569e-05, -8.167605847120285e-05, -7.639080286026001e-05, -7.110554724931717e-05, -6.582029163837433e-05, -6.053503602743149e-05, -5.524978041648865e-05, -4.996452480554581e-05, -4.4679269194602966e-05, -3.9394013583660126e-05, -3.4108757972717285e-05, -2.8823502361774445e-05, -2.3538246750831604e-05, -1.8252991139888763e-05, -1.2967735528945923e-05, -7.682479918003082e-06, -2.3972243070602417e-06, 2.888031303882599e-06, 8.17328691482544e-06, 1.345854252576828e-05, 1.874379813671112e-05, 2.402905374765396e-05, 2.9314309358596802e-05, 3.459956496953964e-05, 3.988482058048248e-05, 4.5170076191425323e-05, 5.0455331802368164e-05, 5.5740587413311005e-05, 6.1025843024253845e-05, 6.631109863519669e-05, 7.159635424613953e-05, 7.688160985708237e-05, 8.216686546802521e-05, 8.745212107896805e-05, 9.273737668991089e-05, 9.802263230085373e-05, 0.00010330788791179657, 0.00010859314352273941, 0.00011387839913368225, 0.00011916365474462509, 0.00012444891035556793, 0.00012973416596651077, 0.0001350194215774536, 0.00014030467718839645, 0.0001455899327993393, 0.00015087518841028214, 0.00015616044402122498, 0.00016144569963216782, 0.00016673095524311066, 0.0001720162108540535, 0.00017730146646499634, 0.00018258672207593918, 0.00018787197768688202, 0.00019315723329782486, 0.0001984424889087677, 0.00020372774451971054, 0.00020901300013065338, 0.00021429825574159622, 0.00021958351135253906]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 2.0, 9.0, 10.0, 19.0, 17.0, 35.0, 38.0, 50.0, 60.0, 87.0, 123.0, 196.0, 332.0, 818.0, 12382.0, 1030579.0, 2435.0, 602.0, 251.0, 137.0, 90.0, 59.0, 54.0, 40.0, 27.0, 16.0, 14.0, 15.0, 15.0, 13.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.004535675048828125, -0.004423230886459351, -0.004310786724090576, -0.004198342561721802, -0.004085898399353027, -0.003973454236984253, -0.0038610100746154785, -0.003748565912246704, -0.0036361217498779297, -0.0035236775875091553, -0.003411233425140381, -0.0032987892627716064, -0.003186345100402832, -0.0030739009380340576, -0.002961456775665283, -0.002849012613296509, -0.0027365684509277344, -0.00262412428855896, -0.0025116801261901855, -0.002399235963821411, -0.0022867918014526367, -0.0021743476390838623, -0.002061903476715088, -0.0019494593143463135, -0.001837015151977539, -0.0017245709896087646, -0.0016121268272399902, -0.0014996826648712158, -0.0013872385025024414, -0.001274794340133667, -0.0011623501777648926, -0.0010499060153961182, -0.0009374618530273438, -0.0008250176906585693, -0.0007125735282897949, -0.0006001293659210205, -0.0004876852035522461, -0.0003752410411834717, -0.00026279687881469727, -0.00015035271644592285, -3.790855407714844e-05, 7.453560829162598e-05, 0.0001869797706604004, 0.0002994239330291748, 0.0004118680953979492, 0.0005243122577667236, 0.000636756420135498, 0.0007492005825042725, 0.0008616447448730469, 0.0009740889072418213, 0.0010865330696105957, 0.0011989772319793701, 0.0013114213943481445, 0.001423865556716919, 0.0015363097190856934, 0.0016487538814544678, 0.0017611980438232422, 0.0018736422061920166, 0.001986086368560791, 0.0020985305309295654, 0.00221097469329834, 0.0023234188556671143, 0.0024358630180358887, 0.002548307180404663, 0.0026607513427734375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 219.0, 568.0, 200.0, 15.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022592559980694205, -0.00021223867952357978, -0.00019855177379213274, -0.00018486485350877047, -0.0001711779332254082, -0.00015749101294204593, -0.00014380409265868366, -0.00013011718692723662, -0.00011643026664387435, -0.00010274334636051208, -8.905643335310742e-05, -7.536952034570277e-05, -6.16826000623405e-05, -4.799567977897823e-05, -3.430876677157357e-05, -2.0621853764168918e-05, -6.934933480806649e-06, 6.751983164576814e-06, 2.0438899809960276e-05, 3.412581645534374e-05, 4.78127331007272e-05, 6.149965338408947e-05, 7.518656639149413e-05, 8.887347939889878e-05, 0.00010256039968226105, 0.00011624731996562332, 0.00012993422569707036, 0.00014362114598043263, 0.0001573080662637949, 0.00017099498654715717, 0.00018468190683051944, 0.00019836881256196648, 0.00021205574739724398, 0.00022574266768060625, 0.00023942958796396852, 0.0002531165082473308, 0.00026680342853069305, 0.00028049031971022487, 0.00029417723999358714, 0.0003078641602769494, 0.0003215510805603117, 0.00033523800084367394, 0.0003489249211270362, 0.0003626118414103985, 0.0003762987325899303, 0.000389985681977123, 0.00040367257315665483, 0.0004173594934400171, 0.0004310464137233794, 0.00044473333400674164, 0.0004584202542901039, 0.0004721071745734662, 0.00048579409485682845, 0.0004994809860363603, 0.000513167935423553, 0.0005268548266030848, 0.0005405417177826166, 0.0005542286089621484, 0.0005679155583493412, 0.000581602449528873, 0.0005952893989160657, 0.0006089762900955975, 0.0006226632394827902, 0.000636350130662322, 0.0006500370800495148]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 8.0, 9.0, 11.0, 15.0, 12.0, 13.0, 18.0, 15.0, 18.0, 35.0, 33.0, 18.0, 27.0, 36.0, 41.0, 35.0, 39.0, 41.0, 26.0, 37.0, 38.0, 45.0, 29.0, 38.0, 31.0, 45.0, 23.0, 24.0, 20.0, 37.0, 20.0, 29.0, 24.0, 15.0, 15.0, 11.0, 15.0, 9.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-7.963180541992188e-05, -7.73230567574501e-05, -7.501430809497833e-05, -7.270555943250656e-05, -7.039681077003479e-05, -6.808806210756302e-05, -6.577931344509125e-05, -6.347056478261948e-05, -6.11618161201477e-05, -5.8853067457675934e-05, -5.654431879520416e-05, -5.423557013273239e-05, -5.192682147026062e-05, -4.961807280778885e-05, -4.730932414531708e-05, -4.5000575482845306e-05, -4.2691826820373535e-05, -4.0383078157901764e-05, -3.807432949542999e-05, -3.576558083295822e-05, -3.345683217048645e-05, -3.114808350801468e-05, -2.8839334845542908e-05, -2.6530586183071136e-05, -2.4221837520599365e-05, -2.1913088858127594e-05, -1.9604340195655823e-05, -1.729559153318405e-05, -1.498684287071228e-05, -1.2678094208240509e-05, -1.0369345545768738e-05, -8.060596883296967e-06, -5.751848220825195e-06, -3.443099558353424e-06, -1.1343508958816528e-06, 1.1743977665901184e-06, 3.4831464290618896e-06, 5.791895091533661e-06, 8.100643754005432e-06, 1.0409392416477203e-05, 1.2718141078948975e-05, 1.5026889741420746e-05, 1.7335638403892517e-05, 1.964438706636429e-05, 2.195313572883606e-05, 2.426188439130783e-05, 2.6570633053779602e-05, 2.8879381716251373e-05, 3.1188130378723145e-05, 3.3496879041194916e-05, 3.580562770366669e-05, 3.811437636613846e-05, 4.042312502861023e-05, 4.2731873691082e-05, 4.504062235355377e-05, 4.734937101602554e-05, 4.9658119678497314e-05, 5.1966868340969086e-05, 5.427561700344086e-05, 5.658436566591263e-05, 5.88931143283844e-05, 6.120186299085617e-05, 6.351061165332794e-05, 6.581936031579971e-05, 6.812810897827148e-05]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 5.0, 9.0, 7.0, 18.0, 24.0, 23.0, 19.0, 26.0, 22.0, 24.0, 23.0, 29.0, 32.0, 28.0, 37.0, 42.0, 36.0, 41.0, 39.0, 33.0, 29.0, 33.0, 28.0, 30.0, 33.0, 26.0, 34.0, 21.0, 27.0, 25.0, 25.0, 18.0, 23.0, 15.0, 20.0, 11.0, 11.0, 7.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.7734375, -3.6602783203125, -3.547119140625, -3.4339599609375, -3.32080078125, -3.2076416015625, -3.094482421875, -2.9813232421875, -2.8681640625, -2.7550048828125, -2.641845703125, -2.5286865234375, -2.41552734375, -2.3023681640625, -2.189208984375, -2.0760498046875, -1.962890625, -1.8497314453125, -1.736572265625, -1.6234130859375, -1.51025390625, -1.3970947265625, -1.283935546875, -1.1707763671875, -1.0576171875, -0.9444580078125, -0.831298828125, -0.7181396484375, -0.60498046875, -0.4918212890625, -0.378662109375, -0.2655029296875, -0.15234375, -0.0391845703125, 0.073974609375, 0.1871337890625, 0.30029296875, 0.4134521484375, 0.526611328125, 0.6397705078125, 0.7529296875, 0.8660888671875, 0.979248046875, 1.0924072265625, 1.20556640625, 1.3187255859375, 1.431884765625, 1.5450439453125, 1.658203125, 1.7713623046875, 1.884521484375, 1.9976806640625, 2.11083984375, 2.2239990234375, 2.337158203125, 2.4503173828125, 2.5634765625, 2.6766357421875, 2.789794921875, 2.9029541015625, 3.01611328125, 3.1292724609375, 3.242431640625, 3.3555908203125, 3.46875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 5.0, 7.0, 18.0, 20.0, 22.0, 18.0, 45.0, 46.0, 54.0, 62.0, 87.0, 156.0, 184.0, 292.0, 449.0, 900.0, 3007.0, 20259.0, 154733.0, 692278.0, 150685.0, 19966.0, 2872.0, 871.0, 501.0, 264.0, 186.0, 125.0, 93.0, 65.0, 54.0, 53.0, 23.0, 31.0, 24.0, 13.0, 16.0, 11.0, 5.0, 13.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.3203125, -8.0718994140625, -7.823486328125, -7.5750732421875, -7.32666015625, -7.0782470703125, -6.829833984375, -6.5814208984375, -6.3330078125, -6.0845947265625, -5.836181640625, -5.5877685546875, -5.33935546875, -5.0909423828125, -4.842529296875, -4.5941162109375, -4.345703125, -4.0972900390625, -3.848876953125, -3.6004638671875, -3.35205078125, -3.1036376953125, -2.855224609375, -2.6068115234375, -2.3583984375, -2.1099853515625, -1.861572265625, -1.6131591796875, -1.36474609375, -1.1163330078125, -0.867919921875, -0.6195068359375, -0.37109375, -0.1226806640625, 0.125732421875, 0.3741455078125, 0.62255859375, 0.8709716796875, 1.119384765625, 1.3677978515625, 1.6162109375, 1.8646240234375, 2.113037109375, 2.3614501953125, 2.60986328125, 2.8582763671875, 3.106689453125, 3.3551025390625, 3.603515625, 3.8519287109375, 4.100341796875, 4.3487548828125, 4.59716796875, 4.8455810546875, 5.093994140625, 5.3424072265625, 5.5908203125, 5.8392333984375, 6.087646484375, 6.3360595703125, 6.58447265625, 6.8328857421875, 7.081298828125, 7.3297119140625, 7.578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 9.0, 5.0, 13.0, 6.0, 9.0, 8.0, 9.0, 14.0, 18.0, 12.0, 36.0, 32.0, 32.0, 28.0, 45.0, 29.0, 39.0, 48.0, 86.0, 200.0, 1520.0, 252.0, 116.0, 61.0, 50.0, 45.0, 40.0, 38.0, 43.0, 33.0, 30.0, 26.0, 15.0, 16.0, 14.0, 20.0, 13.0, 3.0, 9.0, 6.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.8436279296875, -9.460693359375, -9.0777587890625, -8.69482421875, -8.3118896484375, -7.928955078125, -7.5460205078125, -7.1630859375, -6.7801513671875, -6.397216796875, -6.0142822265625, -5.63134765625, -5.2484130859375, -4.865478515625, -4.4825439453125, -4.099609375, -3.7166748046875, -3.333740234375, -2.9508056640625, -2.56787109375, -2.1849365234375, -1.802001953125, -1.4190673828125, -1.0361328125, -0.6531982421875, -0.270263671875, 0.1126708984375, 0.49560546875, 0.8785400390625, 1.261474609375, 1.6444091796875, 2.02734375, 2.4102783203125, 2.793212890625, 3.1761474609375, 3.55908203125, 3.9420166015625, 4.324951171875, 4.7078857421875, 5.0908203125, 5.4737548828125, 5.856689453125, 6.2396240234375, 6.62255859375, 7.0054931640625, 7.388427734375, 7.7713623046875, 8.154296875, 8.5372314453125, 8.920166015625, 9.3031005859375, 9.68603515625, 10.0689697265625, 10.451904296875, 10.8348388671875, 11.2177734375, 11.6007080078125, 11.983642578125, 12.3665771484375, 12.74951171875, 13.1324462890625, 13.515380859375, 13.8983154296875, 14.28125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 10.0, 11.0, 9.0, 17.0, 24.0, 34.0, 28.0, 32.0, 56.0, 52.0, 83.0, 102.0, 124.0, 187.0, 391.0, 914.0, 5363.0, 3092426.0, 43141.0, 1323.0, 525.0, 232.0, 147.0, 101.0, 65.0, 62.0, 50.0, 48.0, 22.0, 25.0, 19.0, 11.0, 16.0, 12.0, 9.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.96533203125, -39.7119140625, -38.45849609375, -37.205078125, -35.95166015625, -34.6982421875, -33.44482421875, -32.19140625, -30.93798828125, -29.6845703125, -28.43115234375, -27.177734375, -25.92431640625, -24.6708984375, -23.41748046875, -22.1640625, -20.91064453125, -19.6572265625, -18.40380859375, -17.150390625, -15.89697265625, -14.6435546875, -13.39013671875, -12.13671875, -10.88330078125, -9.6298828125, -8.37646484375, -7.123046875, -5.86962890625, -4.6162109375, -3.36279296875, -2.109375, -0.85595703125, 0.3974609375, 1.65087890625, 2.904296875, 4.15771484375, 5.4111328125, 6.66455078125, 7.91796875, 9.17138671875, 10.4248046875, 11.67822265625, 12.931640625, 14.18505859375, 15.4384765625, 16.69189453125, 17.9453125, 19.19873046875, 20.4521484375, 21.70556640625, 22.958984375, 24.21240234375, 25.4658203125, 26.71923828125, 27.97265625, 29.22607421875, 30.4794921875, 31.73291015625, 32.986328125, 34.23974609375, 35.4931640625, 36.74658203125, 38.0]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [38.0, 489.0, 461.0, 28.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.029485702514648, -2.5264501571655273, -0.02341461181640625, 2.479620933532715, 4.982656478881836, 7.485692024230957, 9.988727569580078, 12.491762161254883, 14.99479866027832, 17.497833251953125, 20.000869750976562, 22.50390625, 25.006940841674805, 27.50997543334961, 30.013011932373047, 32.51604461669922, 35.019081115722656, 37.522117614746094, 40.02515411376953, 42.5281867980957, 45.03122329711914, 47.53425979614258, 50.03729248046875, 52.54032897949219, 55.043365478515625, 57.54640197753906, 60.0494384765625, 62.55247116088867, 65.05551147460938, 67.55854034423828, 70.06157684326172, 72.56461334228516, 75.06765747070312, 77.57069396972656, 80.07373046875, 82.57676696777344, 85.07980346679688, 87.58283233642578, 90.08586883544922, 92.58890533447266, 95.0919418334961, 97.59497833251953, 100.09801483154297, 102.6010513305664, 105.10408020019531, 107.60711669921875, 110.11015319824219, 112.61318969726562, 115.11622619628906, 117.6192626953125, 120.12229919433594, 122.62533569335938, 125.12837219238281, 127.63140106201172, 130.1344451904297, 132.63748168945312, 135.1405029296875, 137.64353942871094, 140.14657592773438, 142.6496124267578, 145.15264892578125, 147.6556854248047, 150.15872192382812, 152.6617431640625, 155.164794921875]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 8.0, 7.0, 9.0, 18.0, 19.0, 22.0, 13.0, 23.0, 20.0, 36.0, 25.0, 35.0, 32.0, 32.0, 30.0, 46.0, 51.0, 38.0, 49.0, 46.0, 39.0, 39.0, 44.0, 41.0, 34.0, 34.0, 24.0, 20.0, 17.0, 12.0, 19.0, 15.0, 16.0, 8.0, 13.0, 9.0, 11.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.94292449951172, -32.890628814697266, -31.838335037231445, -30.786041259765625, -29.733745574951172, -28.68145179748535, -27.62915802001953, -26.576862335205078, -25.524568557739258, -24.472274780273438, -23.419979095458984, -22.367685317993164, -21.315391540527344, -20.26309585571289, -19.21080207824707, -18.15850830078125, -17.106212615966797, -16.053918838500977, -15.001623153686523, -13.949329376220703, -12.897034645080566, -11.84473991394043, -10.79244613647461, -9.740151405334473, -8.687856674194336, -7.635561943054199, -6.583267688751221, -5.530973434448242, -4.4786787033081055, -3.4263839721679688, -2.3740897178649902, -1.3217954635620117, -0.2695045471191406, 0.782789945602417, 1.8350844383239746, 2.8873789310455322, 3.93967342376709, 4.991968154907227, 6.044262409210205, 7.096556663513184, 8.14885139465332, 9.201146125793457, 10.253440856933594, 11.305734634399414, 12.35802936553955, 13.410324096679688, 14.462617874145508, 15.514912605285645, 16.56720733642578, 17.6195011138916, 18.671796798706055, 19.724090576171875, 20.776386260986328, 21.82868003845215, 22.88097381591797, 23.933269500732422, 24.985563278198242, 26.037857055664062, 27.090152740478516, 28.142446517944336, 29.194740295410156, 30.24703598022461, 31.29932975769043, 32.35162353515625, 33.4039192199707]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 6.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 11.0, 7.0, 13.0, 15.0, 17.0, 23.0, 19.0, 26.0, 23.0, 15.0, 29.0, 34.0, 29.0, 39.0, 33.0, 33.0, 32.0, 30.0, 41.0, 27.0, 43.0, 38.0, 34.0, 27.0, 34.0, 37.0, 33.0, 26.0, 20.0, 27.0, 20.0, 36.0, 17.0, 12.0, 14.0, 16.0, 10.0, 5.0, 5.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.0625, -3.9361572265625, -3.809814453125, -3.6834716796875, -3.55712890625, -3.4307861328125, -3.304443359375, -3.1781005859375, -3.0517578125, -2.9254150390625, -2.799072265625, -2.6727294921875, -2.54638671875, -2.4200439453125, -2.293701171875, -2.1673583984375, -2.041015625, -1.9146728515625, -1.788330078125, -1.6619873046875, -1.53564453125, -1.4093017578125, -1.282958984375, -1.1566162109375, -1.0302734375, -0.9039306640625, -0.777587890625, -0.6512451171875, -0.52490234375, -0.3985595703125, -0.272216796875, -0.1458740234375, -0.01953125, 0.1068115234375, 0.233154296875, 0.3594970703125, 0.48583984375, 0.6121826171875, 0.738525390625, 0.8648681640625, 0.9912109375, 1.1175537109375, 1.243896484375, 1.3702392578125, 1.49658203125, 1.6229248046875, 1.749267578125, 1.8756103515625, 2.001953125, 2.1282958984375, 2.254638671875, 2.3809814453125, 2.50732421875, 2.6336669921875, 2.760009765625, 2.8863525390625, 3.0126953125, 3.1390380859375, 3.265380859375, 3.3917236328125, 3.51806640625, 3.6444091796875, 3.770751953125, 3.8970947265625, 4.0234375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 6.0, 7.0, 11.0, 8.0, 10.0, 22.0, 24.0, 24.0, 42.0, 53.0, 72.0, 102.0, 155.0, 254.0, 443.0, 745.0, 2124.0, 7306.0, 36950.0, 213098.0, 896093.0, 1688518.0, 1022831.0, 263615.0, 47616.0, 9314.0, 2558.0, 963.0, 465.0, 253.0, 177.0, 117.0, 88.0, 49.0, 32.0, 32.0, 29.0, 20.0, 12.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0], "bins": [-6.16015625, -5.98193359375, -5.8037109375, -5.62548828125, -5.447265625, -5.26904296875, -5.0908203125, -4.91259765625, -4.734375, -4.55615234375, -4.3779296875, -4.19970703125, -4.021484375, -3.84326171875, -3.6650390625, -3.48681640625, -3.30859375, -3.13037109375, -2.9521484375, -2.77392578125, -2.595703125, -2.41748046875, -2.2392578125, -2.06103515625, -1.8828125, -1.70458984375, -1.5263671875, -1.34814453125, -1.169921875, -0.99169921875, -0.8134765625, -0.63525390625, -0.45703125, -0.27880859375, -0.1005859375, 0.07763671875, 0.255859375, 0.43408203125, 0.6123046875, 0.79052734375, 0.96875, 1.14697265625, 1.3251953125, 1.50341796875, 1.681640625, 1.85986328125, 2.0380859375, 2.21630859375, 2.39453125, 2.57275390625, 2.7509765625, 2.92919921875, 3.107421875, 3.28564453125, 3.4638671875, 3.64208984375, 3.8203125, 3.99853515625, 4.1767578125, 4.35498046875, 4.533203125, 4.71142578125, 4.8896484375, 5.06787109375, 5.24609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 20.0, 12.0, 14.0, 23.0, 39.0, 62.0, 74.0, 104.0, 128.0, 182.0, 209.0, 351.0, 443.0, 426.0, 446.0, 325.0, 315.0, 224.0, 144.0, 144.0, 85.0, 67.0, 69.0, 28.0, 39.0, 20.0, 13.0, 10.0, 12.0, 5.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.359375, -7.111572265625, -6.86376953125, -6.615966796875, -6.3681640625, -6.120361328125, -5.87255859375, -5.624755859375, -5.376953125, -5.129150390625, -4.88134765625, -4.633544921875, -4.3857421875, -4.137939453125, -3.89013671875, -3.642333984375, -3.39453125, -3.146728515625, -2.89892578125, -2.651123046875, -2.4033203125, -2.155517578125, -1.90771484375, -1.659912109375, -1.412109375, -1.164306640625, -0.91650390625, -0.668701171875, -0.4208984375, -0.173095703125, 0.07470703125, 0.322509765625, 0.5703125, 0.818115234375, 1.06591796875, 1.313720703125, 1.5615234375, 1.809326171875, 2.05712890625, 2.304931640625, 2.552734375, 2.800537109375, 3.04833984375, 3.296142578125, 3.5439453125, 3.791748046875, 4.03955078125, 4.287353515625, 4.53515625, 4.782958984375, 5.03076171875, 5.278564453125, 5.5263671875, 5.774169921875, 6.02197265625, 6.269775390625, 6.517578125, 6.765380859375, 7.01318359375, 7.260986328125, 7.5087890625, 7.756591796875, 8.00439453125, 8.252197265625, 8.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 9.0, 11.0, 15.0, 21.0, 27.0, 47.0, 60.0, 89.0, 129.0, 163.0, 193.0, 281.0, 388.0, 668.0, 1518.0, 7074.0, 1264850.0, 2902863.0, 11882.0, 1730.0, 711.0, 472.0, 304.0, 204.0, 161.0, 107.0, 77.0, 59.0, 50.0, 26.0, 21.0, 16.0, 6.0, 10.0, 8.0, 5.0, 0.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.625, -27.78515625, -26.9453125, -26.10546875, -25.265625, -24.42578125, -23.5859375, -22.74609375, -21.90625, -21.06640625, -20.2265625, -19.38671875, -18.546875, -17.70703125, -16.8671875, -16.02734375, -15.1875, -14.34765625, -13.5078125, -12.66796875, -11.828125, -10.98828125, -10.1484375, -9.30859375, -8.46875, -7.62890625, -6.7890625, -5.94921875, -5.109375, -4.26953125, -3.4296875, -2.58984375, -1.75, -0.91015625, -0.0703125, 0.76953125, 1.609375, 2.44921875, 3.2890625, 4.12890625, 4.96875, 5.80859375, 6.6484375, 7.48828125, 8.328125, 9.16796875, 10.0078125, 10.84765625, 11.6875, 12.52734375, 13.3671875, 14.20703125, 15.046875, 15.88671875, 16.7265625, 17.56640625, 18.40625, 19.24609375, 20.0859375, 20.92578125, 21.765625, 22.60546875, 23.4453125, 24.28515625, 25.125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 56.0, 759.0, 194.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.14484405517578, -55.700927734375, -49.25700759887695, -42.813087463378906, -36.369171142578125, -29.925254821777344, -23.481334686279297, -17.03741455078125, -10.593498229980469, -4.149580001831055, 2.2943382263183594, 8.738256454467773, 15.182174682617188, 21.62609100341797, 28.070011138916016, 34.51393127441406, 40.957847595214844, 47.401763916015625, 53.84568405151367, 60.28960418701172, 66.7335205078125, 73.17743682861328, 79.62135314941406, 86.06527709960938, 92.50919342041016, 98.95310974121094, 105.39703369140625, 111.84095001220703, 118.28486633300781, 124.7287826538086, 131.17269897460938, 137.6166229248047, 144.060546875, 150.5044708251953, 156.94837951660156, 163.39230346679688, 169.83621215820312, 176.28013610839844, 182.72406005859375, 189.16796875, 195.6118927001953, 202.05581665039062, 208.49972534179688, 214.9436492919922, 221.3875732421875, 227.83148193359375, 234.27540588378906, 240.71932983398438, 247.16323852539062, 253.60716247558594, 260.05108642578125, 266.4949951171875, 272.93890380859375, 279.3828125, 285.8267517089844, 292.2706604003906, 298.714599609375, 305.15850830078125, 311.6024475097656, 318.0463562011719, 324.4902648925781, 330.9342041015625, 337.37811279296875, 343.822021484375, 350.26593017578125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 8.0, 7.0, 12.0, 17.0, 26.0, 21.0, 17.0, 24.0, 20.0, 28.0, 31.0, 32.0, 36.0, 36.0, 39.0, 43.0, 52.0, 36.0, 34.0, 34.0, 42.0, 45.0, 45.0, 33.0, 30.0, 24.0, 27.0, 31.0, 15.0, 26.0, 24.0, 18.0, 16.0, 20.0, 7.0, 10.0, 7.0, 11.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.00054931640625, -26.189193725585938, -25.377838134765625, -24.566482543945312, -23.755126953125, -22.943771362304688, -22.132417678833008, -21.321062088012695, -20.509706497192383, -19.69835090637207, -18.886995315551758, -18.075639724731445, -17.264286041259766, -16.452930450439453, -15.64157485961914, -14.830219268798828, -14.018863677978516, -13.207508087158203, -12.39615249633789, -11.584797859191895, -10.773442268371582, -9.96208667755127, -9.150732040405273, -8.339376449584961, -7.528020858764648, -6.716665267944336, -5.905310153961182, -5.093955039978027, -4.282599449157715, -3.4712438583374023, -2.659888744354248, -1.8485336303710938, -1.0371780395507812, -0.22582268714904785, 0.5855326652526855, 1.396888017654419, 2.2082433700561523, 3.019598960876465, 3.830954074859619, 4.642309188842773, 5.453664779663086, 6.265020370483398, 7.076375484466553, 7.887730598449707, 8.69908618927002, 9.510441780090332, 10.321796417236328, 11.13315200805664, 11.944507598876953, 12.755863189697266, 13.567218780517578, 14.378573417663574, 15.189929008483887, 16.001285552978516, 16.812639236450195, 17.623994827270508, 18.43535041809082, 19.246706008911133, 20.058061599731445, 20.869417190551758, 21.680770874023438, 22.49212646484375, 23.303482055664062, 24.114837646484375, 24.926193237304688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 12.0, 13.0, 16.0, 28.0, 22.0, 27.0, 31.0, 36.0, 38.0, 29.0, 33.0, 43.0, 39.0, 43.0, 43.0, 48.0, 42.0, 41.0, 44.0, 34.0, 40.0, 26.0, 35.0, 36.0, 23.0, 22.0, 23.0, 14.0, 17.0, 19.0, 11.0, 6.0, 7.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.23126220703125, -4.0992431640625, -3.96722412109375, -3.835205078125, -3.70318603515625, -3.5711669921875, -3.43914794921875, -3.30712890625, -3.17510986328125, -3.0430908203125, -2.91107177734375, -2.779052734375, -2.64703369140625, -2.5150146484375, -2.38299560546875, -2.2509765625, -2.11895751953125, -1.9869384765625, -1.85491943359375, -1.722900390625, -1.59088134765625, -1.4588623046875, -1.32684326171875, -1.19482421875, -1.06280517578125, -0.9307861328125, -0.79876708984375, -0.666748046875, -0.53472900390625, -0.4027099609375, -0.27069091796875, -0.138671875, -0.00665283203125, 0.1253662109375, 0.25738525390625, 0.389404296875, 0.52142333984375, 0.6534423828125, 0.78546142578125, 0.91748046875, 1.04949951171875, 1.1815185546875, 1.31353759765625, 1.445556640625, 1.57757568359375, 1.7095947265625, 1.84161376953125, 1.9736328125, 2.10565185546875, 2.2376708984375, 2.36968994140625, 2.501708984375, 2.63372802734375, 2.7657470703125, 2.89776611328125, 3.02978515625, 3.16180419921875, 3.2938232421875, 3.42584228515625, 3.557861328125, 3.68988037109375, 3.8218994140625, 3.95391845703125, 4.0859375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 12.0, 12.0, 26.0, 47.0, 55.0, 99.0, 136.0, 177.0, 248.0, 399.0, 606.0, 890.0, 1254.0, 1811.0, 2903.0, 4249.0, 6536.0, 10035.0, 15318.0, 24244.0, 39754.0, 67255.0, 127335.0, 266843.0, 218477.0, 105644.0, 58215.0, 34381.0, 21679.0, 13657.0, 8706.0, 5826.0, 3851.0, 2616.0, 1762.0, 1104.0, 735.0, 514.0, 372.0, 235.0, 170.0, 110.0, 77.0, 64.0, 30.0, 23.0, 22.0, 12.0, 10.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6630859375, -0.6416015625, -0.6201171875, -0.5986328125, -0.5771484375, -0.5556640625, -0.5341796875, -0.5126953125, -0.4912109375, -0.4697265625, -0.4482421875, -0.4267578125, -0.4052734375, -0.3837890625, -0.3623046875, -0.3408203125, -0.3193359375, -0.2978515625, -0.2763671875, -0.2548828125, -0.2333984375, -0.2119140625, -0.1904296875, -0.1689453125, -0.1474609375, -0.1259765625, -0.1044921875, -0.0830078125, -0.0615234375, -0.0400390625, -0.0185546875, 0.0029296875, 0.0244140625, 0.0458984375, 0.0673828125, 0.0888671875, 0.1103515625, 0.1318359375, 0.1533203125, 0.1748046875, 0.1962890625, 0.2177734375, 0.2392578125, 0.2607421875, 0.2822265625, 0.3037109375, 0.3251953125, 0.3466796875, 0.3681640625, 0.3896484375, 0.4111328125, 0.4326171875, 0.4541015625, 0.4755859375, 0.4970703125, 0.5185546875, 0.5400390625, 0.5615234375, 0.5830078125, 0.6044921875, 0.6259765625, 0.6474609375, 0.6689453125, 0.6904296875, 0.7119140625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 12.0, 10.0, 12.0, 11.0, 10.0, 10.0, 11.0, 22.0, 26.0, 24.0, 24.0, 29.0, 29.0, 38.0, 28.0, 38.0, 30.0, 35.0, 36.0, 44.0, 1062.0, 34.0, 38.0, 36.0, 29.0, 29.0, 35.0, 32.0, 31.0, 27.0, 24.0, 18.0, 18.0, 24.0, 13.0, 17.0, 12.0, 7.0, 8.0, 8.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.181640625, -2.107940673828125, -2.03424072265625, -1.960540771484375, -1.8868408203125, -1.813140869140625, -1.73944091796875, -1.665740966796875, -1.592041015625, -1.518341064453125, -1.44464111328125, -1.370941162109375, -1.2972412109375, -1.223541259765625, -1.14984130859375, -1.076141357421875, -1.00244140625, -0.928741455078125, -0.85504150390625, -0.781341552734375, -0.7076416015625, -0.633941650390625, -0.56024169921875, -0.486541748046875, -0.412841796875, -0.339141845703125, -0.26544189453125, -0.191741943359375, -0.1180419921875, -0.044342041015625, 0.02935791015625, 0.103057861328125, 0.1767578125, 0.250457763671875, 0.32415771484375, 0.397857666015625, 0.4715576171875, 0.545257568359375, 0.61895751953125, 0.692657470703125, 0.766357421875, 0.840057373046875, 0.91375732421875, 0.987457275390625, 1.0611572265625, 1.134857177734375, 1.20855712890625, 1.282257080078125, 1.35595703125, 1.429656982421875, 1.50335693359375, 1.577056884765625, 1.6507568359375, 1.724456787109375, 1.79815673828125, 1.871856689453125, 1.945556640625, 2.019256591796875, 2.09295654296875, 2.166656494140625, 2.2403564453125, 2.314056396484375, 2.38775634765625, 2.461456298828125, 2.53515625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 6.0, 14.0, 20.0, 26.0, 41.0, 70.0, 87.0, 108.0, 172.0, 242.0, 351.0, 448.0, 652.0, 857.0, 1235.0, 1754.0, 2458.0, 3445.0, 4893.0, 6828.0, 9757.0, 14197.0, 20310.0, 30465.0, 46073.0, 72057.0, 126517.0, 1296555.0, 184485.0, 94911.0, 57443.0, 37951.0, 25332.0, 17099.0, 11805.0, 8160.0, 5905.0, 4155.0, 2987.0, 2072.0, 1581.0, 1107.0, 841.0, 530.0, 353.0, 266.0, 157.0, 111.0, 94.0, 65.0, 35.0, 19.0, 16.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.5537109375, -0.5362777709960938, -0.5188446044921875, -0.5014114379882812, -0.483978271484375, -0.46654510498046875, -0.4491119384765625, -0.43167877197265625, -0.41424560546875, -0.39681243896484375, -0.3793792724609375, -0.36194610595703125, -0.344512939453125, -0.32707977294921875, -0.3096466064453125, -0.29221343994140625, -0.2747802734375, -0.25734710693359375, -0.2399139404296875, -0.22248077392578125, -0.205047607421875, -0.18761444091796875, -0.1701812744140625, -0.15274810791015625, -0.13531494140625, -0.11788177490234375, -0.1004486083984375, -0.08301544189453125, -0.065582275390625, -0.04814910888671875, -0.0307159423828125, -0.01328277587890625, 0.004150390625, 0.02158355712890625, 0.0390167236328125, 0.05644989013671875, 0.073883056640625, 0.09131622314453125, 0.1087493896484375, 0.12618255615234375, 0.14361572265625, 0.16104888916015625, 0.1784820556640625, 0.19591522216796875, 0.213348388671875, 0.23078155517578125, 0.2482147216796875, 0.26564788818359375, 0.2830810546875, 0.30051422119140625, 0.3179473876953125, 0.33538055419921875, 0.352813720703125, 0.37024688720703125, 0.3876800537109375, 0.40511322021484375, 0.42254638671875, 0.43997955322265625, 0.4574127197265625, 0.47484588623046875, 0.492279052734375, 0.5097122192382812, 0.5271453857421875, 0.5445785522460938, 0.56201171875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 7.0, 5.0, 10.0, 10.0, 15.0, 19.0, 29.0, 22.0, 23.0, 26.0, 21.0, 35.0, 45.0, 40.0, 53.0, 58.0, 57.0, 54.0, 42.0, 46.0, 44.0, 40.0, 39.0, 50.0, 32.0, 29.0, 20.0, 24.0, 19.0, 12.0, 9.0, 7.0, 11.0, 8.0, 10.0, 2.0, 1.0, 1.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00011557340621948242, -0.00011192634701728821, -0.000108279287815094, -0.00010463222861289978, -0.00010098516941070557, -9.733811020851135e-05, -9.369105100631714e-05, -9.004399180412292e-05, -8.639693260192871e-05, -8.27498733997345e-05, -7.910281419754028e-05, -7.545575499534607e-05, -7.180869579315186e-05, -6.816163659095764e-05, -6.451457738876343e-05, -6.0867518186569214e-05, -5.7220458984375e-05, -5.3573399782180786e-05, -4.992634057998657e-05, -4.627928137779236e-05, -4.2632222175598145e-05, -3.898516297340393e-05, -3.533810377120972e-05, -3.16910445690155e-05, -2.804398536682129e-05, -2.4396926164627075e-05, -2.074986696243286e-05, -1.7102807760238647e-05, -1.3455748558044434e-05, -9.80868935585022e-06, -6.161630153656006e-06, -2.514570951461792e-06, 1.1324882507324219e-06, 4.779547452926636e-06, 8.42660665512085e-06, 1.2073665857315063e-05, 1.5720725059509277e-05, 1.936778426170349e-05, 2.3014843463897705e-05, 2.666190266609192e-05, 3.0308961868286133e-05, 3.395602107048035e-05, 3.760308027267456e-05, 4.1250139474868774e-05, 4.489719867706299e-05, 4.85442578792572e-05, 5.2191317081451416e-05, 5.583837628364563e-05, 5.9485435485839844e-05, 6.313249468803406e-05, 6.677955389022827e-05, 7.042661309242249e-05, 7.40736722946167e-05, 7.772073149681091e-05, 8.136779069900513e-05, 8.501484990119934e-05, 8.866190910339355e-05, 9.230896830558777e-05, 9.595602750778198e-05, 9.96030867099762e-05, 0.00010325014591217041, 0.00010689720511436462, 0.00011054426431655884, 0.00011419132351875305, 0.00011783838272094727]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 4.0, 11.0, 8.0, 13.0, 11.0, 19.0, 23.0, 42.0, 22.0, 45.0, 47.0, 73.0, 122.0, 151.0, 247.0, 462.0, 1118.0, 73407.0, 968189.0, 2732.0, 716.0, 320.0, 191.0, 130.0, 110.0, 52.0, 57.0, 29.0, 38.0, 32.0, 32.0, 22.0, 13.0, 17.0, 6.0, 9.0, 3.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024871826171875, -0.002407550811767578, -0.0023279190063476562, -0.0022482872009277344, -0.0021686553955078125, -0.0020890235900878906, -0.0020093917846679688, -0.0019297599792480469, -0.001850128173828125, -0.0017704963684082031, -0.0016908645629882812, -0.0016112327575683594, -0.0015316009521484375, -0.0014519691467285156, -0.0013723373413085938, -0.0012927055358886719, -0.00121307373046875, -0.0011334419250488281, -0.0010538101196289062, -0.0009741783142089844, -0.0008945465087890625, -0.0008149147033691406, -0.0007352828979492188, -0.0006556510925292969, -0.000576019287109375, -0.0004963874816894531, -0.00041675567626953125, -0.0003371238708496094, -0.0002574920654296875, -0.00017786026000976562, -9.822845458984375e-05, -1.8596649169921875e-05, 6.103515625e-05, 0.00014066696166992188, 0.00022029876708984375, 0.0002999305725097656, 0.0003795623779296875, 0.0004591941833496094, 0.0005388259887695312, 0.0006184577941894531, 0.000698089599609375, 0.0007777214050292969, 0.0008573532104492188, 0.0009369850158691406, 0.0010166168212890625, 0.0010962486267089844, 0.0011758804321289062, 0.0012555122375488281, 0.00133514404296875, 0.0014147758483886719, 0.0014944076538085938, 0.0015740394592285156, 0.0016536712646484375, 0.0017333030700683594, 0.0018129348754882812, 0.0018925666809082031, 0.001972198486328125, 0.002051830291748047, 0.0021314620971679688, 0.0022110939025878906, 0.0022907257080078125, 0.0023703575134277344, 0.0024499893188476562, 0.002529621124267578, 0.0026092529296875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 102.0, 530.0, 331.0, 44.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026377395261079073, -0.0002510901540517807, -0.00023840635549277067, -0.00022572255693376064, -0.00021303874382283539, -0.00020035494526382536, -0.00018767114670481533, -0.00017498733359389007, -0.00016230353503488004, -0.00014961973647587, -0.00013693593791685998, -0.00012425213935784996, -0.0001115683262469247, -9.888452768791467e-05, -8.620072912890464e-05, -7.3516923293937e-05, -6.083313201088458e-05, -4.814932981389575e-05, -3.546552761690691e-05, -2.2781729057896882e-05, -1.0097926860908046e-05, 2.5858753360807896e-06, 1.526967389509082e-05, 2.795347973005846e-05, 4.063727828906849e-05, 5.3321080486057326e-05, 6.600488268304616e-05, 7.868868124205619e-05, 9.137247980106622e-05, 0.00010405628563603386, 0.00011674008419504389, 0.00012942389003001153, 0.00014210768858902156, 0.0001547914871480316, 0.00016747528570704162, 0.00018015908426605165, 0.0001928428973769769, 0.00020552669593598694, 0.00021821049449499696, 0.00023089430760592222, 0.00024357810616493225, 0.0002562619047239423, 0.0002689457032829523, 0.00028162950184196234, 0.00029431330040097237, 0.0003069970989599824, 0.0003196808975189924, 0.0003323647251818329, 0.0003450484946370125, 0.0003577322931960225, 0.00037041609175503254, 0.00038309989031404257, 0.0003957836888730526, 0.0004084674874320626, 0.00042115128599107265, 0.00043383511365391314, 0.00044651891221292317, 0.0004592027107719332, 0.0004718865093309432, 0.00048457030788995326, 0.0004972541355527937, 0.0005099379341118038, 0.0005226217326708138, 0.0005353055312298238, 0.0005479893297888339]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 9.0, 23.0, 23.0, 23.0, 30.0, 24.0, 26.0, 35.0, 32.0, 31.0, 35.0, 32.0, 40.0, 57.0, 50.0, 38.0, 39.0, 31.0, 42.0, 34.0, 36.0, 46.0, 32.0, 27.0, 27.0, 22.0, 31.0, 17.0, 14.0, 13.0, 10.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.580352783203125e-05, -6.354041397571564e-05, -6.127730011940002e-05, -5.901418626308441e-05, -5.67510724067688e-05, -5.4487958550453186e-05, -5.222484469413757e-05, -4.996173083782196e-05, -4.769861698150635e-05, -4.5435503125190735e-05, -4.317238926887512e-05, -4.090927541255951e-05, -3.8646161556243896e-05, -3.6383047699928284e-05, -3.411993384361267e-05, -3.185681998729706e-05, -2.9593706130981445e-05, -2.7330592274665833e-05, -2.506747841835022e-05, -2.2804364562034607e-05, -2.0541250705718994e-05, -1.827813684940338e-05, -1.601502299308777e-05, -1.3751909136772156e-05, -1.1488795280456543e-05, -9.22568142414093e-06, -6.962567567825317e-06, -4.699453711509705e-06, -2.436339855194092e-06, -1.73225998878479e-07, 2.089887857437134e-06, 4.353001713752747e-06, 6.616115570068359e-06, 8.879229426383972e-06, 1.1142343282699585e-05, 1.3405457139015198e-05, 1.566857099533081e-05, 1.7931684851646423e-05, 2.0194798707962036e-05, 2.245791256427765e-05, 2.4721026420593262e-05, 2.6984140276908875e-05, 2.9247254133224487e-05, 3.15103679895401e-05, 3.377348184585571e-05, 3.6036595702171326e-05, 3.829970955848694e-05, 4.056282341480255e-05, 4.2825937271118164e-05, 4.508905112743378e-05, 4.735216498374939e-05, 4.9615278840065e-05, 5.1878392696380615e-05, 5.414150655269623e-05, 5.640462040901184e-05, 5.8667734265327454e-05, 6.0930848121643066e-05, 6.319396197795868e-05, 6.545707583427429e-05, 6.77201896905899e-05, 6.998330354690552e-05, 7.224641740322113e-05, 7.450953125953674e-05, 7.677264511585236e-05, 7.903575897216797e-05]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 12.0, 12.0, 13.0, 16.0, 28.0, 22.0, 27.0, 31.0, 36.0, 38.0, 29.0, 33.0, 43.0, 39.0, 43.0, 43.0, 48.0, 42.0, 41.0, 44.0, 34.0, 40.0, 26.0, 35.0, 36.0, 23.0, 22.0, 23.0, 14.0, 17.0, 19.0, 11.0, 6.0, 7.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.36328125, -4.23126220703125, -4.0992431640625, -3.96722412109375, -3.835205078125, -3.70318603515625, -3.5711669921875, -3.43914794921875, -3.30712890625, -3.17510986328125, -3.0430908203125, -2.91107177734375, -2.779052734375, -2.64703369140625, -2.5150146484375, -2.38299560546875, -2.2509765625, -2.11895751953125, -1.9869384765625, -1.85491943359375, -1.722900390625, -1.59088134765625, -1.4588623046875, -1.32684326171875, -1.19482421875, -1.06280517578125, -0.9307861328125, -0.79876708984375, -0.666748046875, -0.53472900390625, -0.4027099609375, -0.27069091796875, -0.138671875, -0.00665283203125, 0.1253662109375, 0.25738525390625, 0.389404296875, 0.52142333984375, 0.6534423828125, 0.78546142578125, 0.91748046875, 1.04949951171875, 1.1815185546875, 1.31353759765625, 1.445556640625, 1.57757568359375, 1.7095947265625, 1.84161376953125, 1.9736328125, 2.10565185546875, 2.2376708984375, 2.36968994140625, 2.501708984375, 2.63372802734375, 2.7657470703125, 2.89776611328125, 3.02978515625, 3.16180419921875, 3.2938232421875, 3.42584228515625, 3.557861328125, 3.68988037109375, 3.8218994140625, 3.95391845703125, 4.0859375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 7.0, 14.0, 11.0, 12.0, 25.0, 37.0, 47.0, 68.0, 112.0, 226.0, 531.0, 1334.0, 3906.0, 10967.0, 30497.0, 86200.0, 253510.0, 393450.0, 174426.0, 59552.0, 21470.0, 7690.0, 2683.0, 951.0, 356.0, 166.0, 97.0, 52.0, 25.0, 26.0, 22.0, 15.0, 14.0, 11.0, 6.0, 9.0, 2.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.22265625, -5.07049560546875, -4.9183349609375, -4.76617431640625, -4.614013671875, -4.46185302734375, -4.3096923828125, -4.15753173828125, -4.00537109375, -3.85321044921875, -3.7010498046875, -3.54888916015625, -3.396728515625, -3.24456787109375, -3.0924072265625, -2.94024658203125, -2.7880859375, -2.63592529296875, -2.4837646484375, -2.33160400390625, -2.179443359375, -2.02728271484375, -1.8751220703125, -1.72296142578125, -1.57080078125, -1.41864013671875, -1.2664794921875, -1.11431884765625, -0.962158203125, -0.80999755859375, -0.6578369140625, -0.50567626953125, -0.353515625, -0.20135498046875, -0.0491943359375, 0.10296630859375, 0.255126953125, 0.40728759765625, 0.5594482421875, 0.71160888671875, 0.86376953125, 1.01593017578125, 1.1680908203125, 1.32025146484375, 1.472412109375, 1.62457275390625, 1.7767333984375, 1.92889404296875, 2.0810546875, 2.23321533203125, 2.3853759765625, 2.53753662109375, 2.689697265625, 2.84185791015625, 2.9940185546875, 3.14617919921875, 3.29833984375, 3.45050048828125, 3.6026611328125, 3.75482177734375, 3.906982421875, 4.05914306640625, 4.2113037109375, 4.36346435546875, 4.515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 10.0, 15.0, 26.0, 22.0, 23.0, 25.0, 23.0, 43.0, 40.0, 50.0, 43.0, 71.0, 141.0, 244.0, 1458.0, 245.0, 108.0, 64.0, 57.0, 30.0, 43.0, 27.0, 36.0, 36.0, 37.0, 19.0, 18.0, 12.0, 16.0, 9.0, 8.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 5.0], "bins": [-17.34375, -16.9039306640625, -16.464111328125, -16.0242919921875, -15.58447265625, -15.1446533203125, -14.704833984375, -14.2650146484375, -13.8251953125, -13.3853759765625, -12.945556640625, -12.5057373046875, -12.06591796875, -11.6260986328125, -11.186279296875, -10.7464599609375, -10.306640625, -9.8668212890625, -9.427001953125, -8.9871826171875, -8.54736328125, -8.1075439453125, -7.667724609375, -7.2279052734375, -6.7880859375, -6.3482666015625, -5.908447265625, -5.4686279296875, -5.02880859375, -4.5889892578125, -4.149169921875, -3.7093505859375, -3.26953125, -2.8297119140625, -2.389892578125, -1.9500732421875, -1.51025390625, -1.0704345703125, -0.630615234375, -0.1907958984375, 0.2490234375, 0.6888427734375, 1.128662109375, 1.5684814453125, 2.00830078125, 2.4481201171875, 2.887939453125, 3.3277587890625, 3.767578125, 4.2073974609375, 4.647216796875, 5.0870361328125, 5.52685546875, 5.9666748046875, 6.406494140625, 6.8463134765625, 7.2861328125, 7.7259521484375, 8.165771484375, 8.6055908203125, 9.04541015625, 9.4852294921875, 9.925048828125, 10.3648681640625, 10.8046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 5.0, 9.0, 16.0, 15.0, 17.0, 25.0, 24.0, 45.0, 59.0, 84.0, 107.0, 163.0, 224.0, 371.0, 683.0, 1848.0, 46398.0, 3058544.0, 33674.0, 1589.0, 678.0, 353.0, 228.0, 135.0, 114.0, 70.0, 57.0, 35.0, 29.0, 19.0, 15.0, 11.0, 15.0, 5.0, 10.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0], "bins": [-32.75, -31.82666015625, -30.9033203125, -29.97998046875, -29.056640625, -28.13330078125, -27.2099609375, -26.28662109375, -25.36328125, -24.43994140625, -23.5166015625, -22.59326171875, -21.669921875, -20.74658203125, -19.8232421875, -18.89990234375, -17.9765625, -17.05322265625, -16.1298828125, -15.20654296875, -14.283203125, -13.35986328125, -12.4365234375, -11.51318359375, -10.58984375, -9.66650390625, -8.7431640625, -7.81982421875, -6.896484375, -5.97314453125, -5.0498046875, -4.12646484375, -3.203125, -2.27978515625, -1.3564453125, -0.43310546875, 0.490234375, 1.41357421875, 2.3369140625, 3.26025390625, 4.18359375, 5.10693359375, 6.0302734375, 6.95361328125, 7.876953125, 8.80029296875, 9.7236328125, 10.64697265625, 11.5703125, 12.49365234375, 13.4169921875, 14.34033203125, 15.263671875, 16.18701171875, 17.1103515625, 18.03369140625, 18.95703125, 19.88037109375, 20.8037109375, 21.72705078125, 22.650390625, 23.57373046875, 24.4970703125, 25.42041015625, 26.34375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 94.0, 547.0, 347.0, 22.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.10516357421875, -51.50600814819336, -48.9068489074707, -46.30769348144531, -43.708534240722656, -41.109378814697266, -38.510223388671875, -35.91106414794922, -33.31190872192383, -30.712751388549805, -28.11359405517578, -25.51443862915039, -22.915281295776367, -20.316123962402344, -17.716968536376953, -15.11781120300293, -12.518653869628906, -9.919496536254883, -7.320340156555176, -4.7211833000183105, -2.1220264434814453, 0.4771308898925781, 3.076287269592285, 5.675443649291992, 8.274600982666016, 10.873758316040039, 13.472914695739746, 16.072071075439453, 18.671228408813477, 21.2703857421875, 23.86954116821289, 26.468698501586914, 29.067855834960938, 31.66701316833496, 34.266170501708984, 36.865325927734375, 39.46448516845703, 42.06364059448242, 44.66279602050781, 47.26195526123047, 49.86111068725586, 52.46026611328125, 55.059425354003906, 57.6585807800293, 60.25773620605469, 62.856895446777344, 65.4560546875, 68.05520629882812, 70.65436553955078, 73.25352478027344, 75.85267639160156, 78.45183563232422, 81.05099487304688, 83.650146484375, 86.24930572509766, 88.84846496582031, 91.44761657714844, 94.0467758178711, 96.64592742919922, 99.24508666992188, 101.84424591064453, 104.44340515136719, 107.04255676269531, 109.64171600341797, 112.24087524414062]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 18.0, 7.0, 5.0, 12.0, 15.0, 23.0, 15.0, 18.0, 27.0, 36.0, 31.0, 44.0, 37.0, 37.0, 31.0, 37.0, 42.0, 37.0, 40.0, 39.0, 34.0, 48.0, 22.0, 40.0, 23.0, 23.0, 28.0, 17.0, 26.0, 21.0, 22.0, 16.0, 14.0, 13.0, 11.0, 5.0, 8.0, 8.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-29.64960479736328, -28.7479305267334, -27.84625816345215, -26.944583892822266, -26.042911529541016, -25.141237258911133, -24.23956298828125, -23.337890625, -22.43621826171875, -21.534543991088867, -20.632871627807617, -19.731197357177734, -18.829524993896484, -17.9278507232666, -17.02617645263672, -16.12450408935547, -15.222829818725586, -14.32115650177002, -13.419483184814453, -12.51780891418457, -11.61613655090332, -10.714462280273438, -9.812788963317871, -8.911115646362305, -8.009442329406738, -7.107769012451172, -6.2060956954956055, -5.304421901702881, -4.4027485847473145, -3.501075267791748, -2.5994014739990234, -1.697728157043457, -0.7960567474365234, 0.10561668872833252, 1.0072901248931885, 1.908963680267334, 2.8106369972229004, 3.712310314178467, 4.613984107971191, 5.515657424926758, 6.417330741882324, 7.319004058837891, 8.220677375793457, 9.122350692749023, 10.024024963378906, 10.925697326660156, 11.827371597290039, 12.729044914245605, 13.630718231201172, 14.532391548156738, 15.434064865112305, 16.335739135742188, 17.237411499023438, 18.13908576965332, 19.040760040283203, 19.942432403564453, 20.844104766845703, 21.745779037475586, 22.647451400756836, 23.54912567138672, 24.45079803466797, 25.35247230529785, 26.254146575927734, 27.155818939208984, 28.057493209838867]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 16.0, 13.0, 14.0, 21.0, 27.0, 25.0, 25.0, 24.0, 35.0, 25.0, 42.0, 40.0, 37.0, 35.0, 48.0, 47.0, 45.0, 43.0, 46.0, 48.0, 40.0, 31.0, 42.0, 31.0, 32.0, 28.0, 15.0, 14.0, 17.0, 10.0, 13.0, 5.0, 12.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.65625, -4.51470947265625, -4.3731689453125, -4.23162841796875, -4.090087890625, -3.94854736328125, -3.8070068359375, -3.66546630859375, -3.52392578125, -3.38238525390625, -3.2408447265625, -3.09930419921875, -2.957763671875, -2.81622314453125, -2.6746826171875, -2.53314208984375, -2.3916015625, -2.25006103515625, -2.1085205078125, -1.96697998046875, -1.825439453125, -1.68389892578125, -1.5423583984375, -1.40081787109375, -1.25927734375, -1.11773681640625, -0.9761962890625, -0.83465576171875, -0.693115234375, -0.55157470703125, -0.4100341796875, -0.26849365234375, -0.126953125, 0.01458740234375, 0.1561279296875, 0.29766845703125, 0.439208984375, 0.58074951171875, 0.7222900390625, 0.86383056640625, 1.00537109375, 1.14691162109375, 1.2884521484375, 1.42999267578125, 1.571533203125, 1.71307373046875, 1.8546142578125, 1.99615478515625, 2.1376953125, 2.27923583984375, 2.4207763671875, 2.56231689453125, 2.703857421875, 2.84539794921875, 2.9869384765625, 3.12847900390625, 3.27001953125, 3.41156005859375, 3.5531005859375, 3.69464111328125, 3.836181640625, 3.97772216796875, 4.1192626953125, 4.26080322265625, 4.40234375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 5.0, 7.0, 15.0, 13.0, 25.0, 11.0, 26.0, 28.0, 35.0, 37.0, 50.0, 58.0, 64.0, 127.0, 225.0, 736.0, 7214.0, 514826.0, 3455447.0, 210064.0, 4025.0, 523.0, 201.0, 132.0, 65.0, 69.0, 48.0, 38.0, 30.0, 23.0, 16.0, 15.0, 12.0, 11.0, 5.0, 4.0, 13.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.6070556640625, -13.159423828125, -12.7117919921875, -12.26416015625, -11.8165283203125, -11.368896484375, -10.9212646484375, -10.4736328125, -10.0260009765625, -9.578369140625, -9.1307373046875, -8.68310546875, -8.2354736328125, -7.787841796875, -7.3402099609375, -6.892578125, -6.4449462890625, -5.997314453125, -5.5496826171875, -5.10205078125, -4.6544189453125, -4.206787109375, -3.7591552734375, -3.3115234375, -2.8638916015625, -2.416259765625, -1.9686279296875, -1.52099609375, -1.0733642578125, -0.625732421875, -0.1781005859375, 0.26953125, 0.7171630859375, 1.164794921875, 1.6124267578125, 2.06005859375, 2.5076904296875, 2.955322265625, 3.4029541015625, 3.8505859375, 4.2982177734375, 4.745849609375, 5.1934814453125, 5.64111328125, 6.0887451171875, 6.536376953125, 6.9840087890625, 7.431640625, 7.8792724609375, 8.326904296875, 8.7745361328125, 9.22216796875, 9.6697998046875, 10.117431640625, 10.5650634765625, 11.0126953125, 11.4603271484375, 11.907958984375, 12.3555908203125, 12.80322265625, 13.2508544921875, 13.698486328125, 14.1461181640625, 14.59375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 13.0, 23.0, 19.0, 36.0, 64.0, 74.0, 113.0, 166.0, 236.0, 354.0, 460.0, 503.0, 512.0, 418.0, 295.0, 236.0, 174.0, 96.0, 83.0, 49.0, 40.0, 25.0, 16.0, 16.0, 7.0, 11.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0859375, -7.8328857421875, -7.579833984375, -7.3267822265625, -7.07373046875, -6.8206787109375, -6.567626953125, -6.3145751953125, -6.0615234375, -5.8084716796875, -5.555419921875, -5.3023681640625, -5.04931640625, -4.7962646484375, -4.543212890625, -4.2901611328125, -4.037109375, -3.7840576171875, -3.531005859375, -3.2779541015625, -3.02490234375, -2.7718505859375, -2.518798828125, -2.2657470703125, -2.0126953125, -1.7596435546875, -1.506591796875, -1.2535400390625, -1.00048828125, -0.7474365234375, -0.494384765625, -0.2413330078125, 0.01171875, 0.2647705078125, 0.517822265625, 0.7708740234375, 1.02392578125, 1.2769775390625, 1.530029296875, 1.7830810546875, 2.0361328125, 2.2891845703125, 2.542236328125, 2.7952880859375, 3.04833984375, 3.3013916015625, 3.554443359375, 3.8074951171875, 4.060546875, 4.3135986328125, 4.566650390625, 4.8197021484375, 5.07275390625, 5.3258056640625, 5.578857421875, 5.8319091796875, 6.0849609375, 6.3380126953125, 6.591064453125, 6.8441162109375, 7.09716796875, 7.3502197265625, 7.603271484375, 7.8563232421875, 8.109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 13.0, 8.0, 7.0, 18.0, 30.0, 37.0, 47.0, 30.0, 63.0, 130.0, 138.0, 166.0, 223.0, 359.0, 629.0, 1496.0, 30957.0, 3783034.0, 370671.0, 3899.0, 878.0, 415.0, 266.0, 171.0, 143.0, 114.0, 83.0, 70.0, 43.0, 40.0, 24.0, 19.0, 19.0, 9.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.03125, -25.210693359375, -24.39013671875, -23.569580078125, -22.7490234375, -21.928466796875, -21.10791015625, -20.287353515625, -19.466796875, -18.646240234375, -17.82568359375, -17.005126953125, -16.1845703125, -15.364013671875, -14.54345703125, -13.722900390625, -12.90234375, -12.081787109375, -11.26123046875, -10.440673828125, -9.6201171875, -8.799560546875, -7.97900390625, -7.158447265625, -6.337890625, -5.517333984375, -4.69677734375, -3.876220703125, -3.0556640625, -2.235107421875, -1.41455078125, -0.593994140625, 0.2265625, 1.047119140625, 1.86767578125, 2.688232421875, 3.5087890625, 4.329345703125, 5.14990234375, 5.970458984375, 6.791015625, 7.611572265625, 8.43212890625, 9.252685546875, 10.0732421875, 10.893798828125, 11.71435546875, 12.534912109375, 13.35546875, 14.176025390625, 14.99658203125, 15.817138671875, 16.6376953125, 17.458251953125, 18.27880859375, 19.099365234375, 19.919921875, 20.740478515625, 21.56103515625, 22.381591796875, 23.2021484375, 24.022705078125, 24.84326171875, 25.663818359375, 26.484375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 36.0, 342.0, 479.0, 141.0, 12.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.917238235473633, -18.39624786376953, -14.87525749206543, -11.354267120361328, -7.833276748657227, -4.312286376953125, -0.7912960052490234, 2.729694366455078, 6.25068473815918, 9.771675109863281, 13.292665481567383, 16.813655853271484, 20.334646224975586, 23.855636596679688, 27.37662696838379, 30.89761734008789, 34.418609619140625, 37.939598083496094, 41.46059036254883, 44.98158264160156, 48.50257110595703, 52.0235595703125, 55.544551849365234, 59.06554412841797, 62.58653259277344, 66.1075210571289, 69.62850952148438, 73.14950561523438, 76.67049407958984, 80.19148254394531, 83.71247863769531, 87.23346710205078, 90.75445556640625, 94.27544403076172, 97.79643249511719, 101.31742858886719, 104.83841705322266, 108.35940551757812, 111.88040161132812, 115.4013900756836, 118.92237854003906, 122.44336700439453, 125.96435546875, 129.4853515625, 133.00634765625, 136.52732849121094, 140.04832458496094, 143.56930541992188, 147.09030151367188, 150.61129760742188, 154.1322784423828, 157.6532745361328, 161.17425537109375, 164.69525146484375, 168.21624755859375, 171.7372283935547, 175.2582244873047, 178.7792205810547, 182.30020141601562, 185.82119750976562, 189.34219360351562, 192.86317443847656, 196.38417053222656, 199.9051513671875, 203.4261474609375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 8.0, 15.0, 9.0, 16.0, 5.0, 18.0, 14.0, 28.0, 15.0, 25.0, 30.0, 32.0, 20.0, 27.0, 35.0, 38.0, 44.0, 43.0, 36.0, 36.0, 39.0, 27.0, 30.0, 40.0, 36.0, 32.0, 34.0, 35.0, 35.0, 21.0, 21.0, 18.0, 14.0, 15.0, 17.0, 15.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.458660125732422, -19.81545066833496, -19.1722412109375, -18.529033660888672, -17.88582420349121, -17.24261474609375, -16.59940528869629, -15.956195831298828, -15.312986373901367, -14.669776916503906, -14.026568412780762, -13.3833589553833, -12.74014949798584, -12.096940994262695, -11.453731536865234, -10.810522079467773, -10.167313575744629, -9.524104118347168, -8.880895614624023, -8.237686157226562, -7.594476699829102, -6.951267719268799, -6.308058738708496, -5.664849281311035, -5.021640300750732, -4.37843132019043, -3.7352218627929688, -3.092012882232666, -2.448803663253784, -1.8055944442749023, -1.1623854637145996, -0.5191760063171387, 0.12403297424316406, 0.7672421336174011, 1.4104512929916382, 2.0536603927612305, 2.6968696117401123, 3.340078830718994, 3.983287811279297, 4.626497268676758, 5.2697062492370605, 5.912915229797363, 6.556124687194824, 7.199333667755127, 7.84254264831543, 8.48575210571289, 9.128961563110352, 9.772171020507812, 10.415379524230957, 11.058588981628418, 11.701797485351562, 12.345006942749023, 12.988216400146484, 13.631425857543945, 14.27463436126709, 14.91784381866455, 15.561052322387695, 16.204261779785156, 16.847471237182617, 17.490680694580078, 18.133888244628906, 18.777097702026367, 19.420307159423828, 20.06351661682129, 20.70672607421875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 14.0, 13.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 28.0, 43.0, 37.0, 39.0, 51.0, 44.0, 35.0, 38.0, 42.0, 30.0, 47.0, 36.0, 30.0, 43.0, 33.0, 34.0, 28.0, 27.0, 17.0, 22.0, 13.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.45703125, -4.32073974609375, -4.1844482421875, -4.04815673828125, -3.911865234375, -3.77557373046875, -3.6392822265625, -3.50299072265625, -3.36669921875, -3.23040771484375, -3.0941162109375, -2.95782470703125, -2.821533203125, -2.68524169921875, -2.5489501953125, -2.41265869140625, -2.2763671875, -2.14007568359375, -2.0037841796875, -1.86749267578125, -1.731201171875, -1.59490966796875, -1.4586181640625, -1.32232666015625, -1.18603515625, -1.04974365234375, -0.9134521484375, -0.77716064453125, -0.640869140625, -0.50457763671875, -0.3682861328125, -0.23199462890625, -0.095703125, 0.04058837890625, 0.1768798828125, 0.31317138671875, 0.449462890625, 0.58575439453125, 0.7220458984375, 0.85833740234375, 0.99462890625, 1.13092041015625, 1.2672119140625, 1.40350341796875, 1.539794921875, 1.67608642578125, 1.8123779296875, 1.94866943359375, 2.0849609375, 2.22125244140625, 2.3575439453125, 2.49383544921875, 2.630126953125, 2.76641845703125, 2.9027099609375, 3.03900146484375, 3.17529296875, 3.31158447265625, 3.4478759765625, 3.58416748046875, 3.720458984375, 3.85675048828125, 3.9930419921875, 4.12933349609375, 4.265625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 11.0, 9.0, 11.0, 19.0, 38.0, 61.0, 79.0, 114.0, 146.0, 288.0, 398.0, 623.0, 918.0, 1522.0, 2353.0, 3876.0, 6192.0, 10061.0, 16516.0, 27754.0, 49080.0, 89129.0, 176299.0, 307770.0, 160572.0, 82205.0, 45618.0, 26117.0, 15547.0, 9432.0, 5853.0, 3637.0, 2205.0, 1457.0, 932.0, 572.0, 414.0, 259.0, 155.0, 108.0, 78.0, 45.0, 27.0, 17.0, 14.0, 7.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.83154296875, -0.805908203125, -0.7802734375, -0.754638671875, -0.72900390625, -0.703369140625, -0.677734375, -0.652099609375, -0.62646484375, -0.600830078125, -0.5751953125, -0.549560546875, -0.52392578125, -0.498291015625, -0.47265625, -0.447021484375, -0.42138671875, -0.395751953125, -0.3701171875, -0.344482421875, -0.31884765625, -0.293212890625, -0.267578125, -0.241943359375, -0.21630859375, -0.190673828125, -0.1650390625, -0.139404296875, -0.11376953125, -0.088134765625, -0.0625, -0.036865234375, -0.01123046875, 0.014404296875, 0.0400390625, 0.065673828125, 0.09130859375, 0.116943359375, 0.142578125, 0.168212890625, 0.19384765625, 0.219482421875, 0.2451171875, 0.270751953125, 0.29638671875, 0.322021484375, 0.34765625, 0.373291015625, 0.39892578125, 0.424560546875, 0.4501953125, 0.475830078125, 0.50146484375, 0.527099609375, 0.552734375, 0.578369140625, 0.60400390625, 0.629638671875, 0.6552734375, 0.680908203125, 0.70654296875, 0.732177734375, 0.7578125, 0.783447265625, 0.80908203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 0.0, 4.0, 9.0, 10.0, 7.0, 10.0, 6.0, 18.0, 30.0, 22.0, 22.0, 29.0, 38.0, 37.0, 37.0, 30.0, 34.0, 35.0, 43.0, 37.0, 1083.0, 49.0, 44.0, 45.0, 47.0, 39.0, 25.0, 29.0, 33.0, 28.0, 21.0, 15.0, 17.0, 15.0, 13.0, 8.0, 12.0, 16.0, 7.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.92327880859375, -2.8367919921875, -2.75030517578125, -2.663818359375, -2.57733154296875, -2.4908447265625, -2.40435791015625, -2.31787109375, -2.23138427734375, -2.1448974609375, -2.05841064453125, -1.971923828125, -1.88543701171875, -1.7989501953125, -1.71246337890625, -1.6259765625, -1.53948974609375, -1.4530029296875, -1.36651611328125, -1.280029296875, -1.19354248046875, -1.1070556640625, -1.02056884765625, -0.93408203125, -0.84759521484375, -0.7611083984375, -0.67462158203125, -0.588134765625, -0.50164794921875, -0.4151611328125, -0.32867431640625, -0.2421875, -0.15570068359375, -0.0692138671875, 0.01727294921875, 0.103759765625, 0.19024658203125, 0.2767333984375, 0.36322021484375, 0.44970703125, 0.53619384765625, 0.6226806640625, 0.70916748046875, 0.795654296875, 0.88214111328125, 0.9686279296875, 1.05511474609375, 1.1416015625, 1.22808837890625, 1.3145751953125, 1.40106201171875, 1.487548828125, 1.57403564453125, 1.6605224609375, 1.74700927734375, 1.83349609375, 1.91998291015625, 2.0064697265625, 2.09295654296875, 2.179443359375, 2.26593017578125, 2.3524169921875, 2.43890380859375, 2.525390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 13.0, 13.0, 25.0, 30.0, 66.0, 82.0, 118.0, 185.0, 303.0, 466.0, 630.0, 1001.0, 1454.0, 2077.0, 3025.0, 4581.0, 6555.0, 9994.0, 15320.0, 23663.0, 37109.0, 60167.0, 106324.0, 237747.0, 1300611.0, 112307.0, 62186.0, 38409.0, 24360.0, 16066.0, 10575.0, 7176.0, 4752.0, 3138.0, 2116.0, 1446.0, 955.0, 642.0, 452.0, 291.0, 230.0, 159.0, 91.0, 66.0, 44.0, 48.0, 28.0, 9.0, 8.0, 9.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6352920532226562, -0.6148223876953125, -0.5943527221679688, -0.573883056640625, -0.5534133911132812, -0.5329437255859375, -0.5124740600585938, -0.49200439453125, -0.47153472900390625, -0.4510650634765625, -0.43059539794921875, -0.410125732421875, -0.38965606689453125, -0.3691864013671875, -0.34871673583984375, -0.3282470703125, -0.30777740478515625, -0.2873077392578125, -0.26683807373046875, -0.246368408203125, -0.22589874267578125, -0.2054290771484375, -0.18495941162109375, -0.16448974609375, -0.14402008056640625, -0.1235504150390625, -0.10308074951171875, -0.082611083984375, -0.06214141845703125, -0.0416717529296875, -0.02120208740234375, -0.000732421875, 0.01973724365234375, 0.0402069091796875, 0.06067657470703125, 0.081146240234375, 0.10161590576171875, 0.1220855712890625, 0.14255523681640625, 0.16302490234375, 0.18349456787109375, 0.2039642333984375, 0.22443389892578125, 0.244903564453125, 0.26537322998046875, 0.2858428955078125, 0.30631256103515625, 0.3267822265625, 0.34725189208984375, 0.3677215576171875, 0.38819122314453125, 0.408660888671875, 0.42913055419921875, 0.4496002197265625, 0.47006988525390625, 0.49053955078125, 0.5110092163085938, 0.5314788818359375, 0.5519485473632812, 0.572418212890625, 0.5928878784179688, 0.6133575439453125, 0.6338272094726562, 0.654296875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 16.0, 2.0, 7.0, 7.0, 13.0, 21.0, 24.0, 26.0, 26.0, 50.0, 51.0, 70.0, 67.0, 71.0, 81.0, 68.0, 69.0, 71.0, 63.0, 44.0, 31.0, 18.0, 24.0, 12.0, 15.0, 12.0, 8.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.0001860298216342926, -0.0001801326870918274, -0.00017423555254936218, -0.00016833841800689697, -0.00016244128346443176, -0.00015654414892196655, -0.00015064701437950134, -0.00014474987983703613, -0.00013885274529457092, -0.0001329556107521057, -0.0001270584762096405, -0.00012116134166717529, -0.00011526420712471008, -0.00010936707258224487, -0.00010346993803977966, -9.757280349731445e-05, -9.167566895484924e-05, -8.577853441238403e-05, -7.988139986991882e-05, -7.398426532745361e-05, -6.80871307849884e-05, -6.21899962425232e-05, -5.6292861700057983e-05, -5.0395727157592773e-05, -4.4498592615127563e-05, -3.8601458072662354e-05, -3.2704323530197144e-05, -2.6807188987731934e-05, -2.0910054445266724e-05, -1.5012919902801514e-05, -9.115785360336304e-06, -3.2186508178710938e-06, 2.678483724594116e-06, 8.575618267059326e-06, 1.4472752809524536e-05, 2.0369887351989746e-05, 2.6267021894454956e-05, 3.2164156436920166e-05, 3.8061290979385376e-05, 4.3958425521850586e-05, 4.9855560064315796e-05, 5.5752694606781006e-05, 6.164982914924622e-05, 6.754696369171143e-05, 7.344409823417664e-05, 7.934123277664185e-05, 8.523836731910706e-05, 9.113550186157227e-05, 9.703263640403748e-05, 0.00010292977094650269, 0.0001088269054889679, 0.0001147240400314331, 0.00012062117457389832, 0.00012651830911636353, 0.00013241544365882874, 0.00013831257820129395, 0.00014420971274375916, 0.00015010684728622437, 0.00015600398182868958, 0.00016190111637115479, 0.00016779825091362, 0.0001736953854560852, 0.00017959251999855042, 0.00018548965454101562]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 8.0, 13.0, 23.0, 9.0, 18.0, 29.0, 36.0, 53.0, 82.0, 134.0, 225.0, 459.0, 1338.0, 1010530.0, 33897.0, 818.0, 340.0, 154.0, 124.0, 59.0, 45.0, 35.0, 32.0, 24.0, 13.0, 10.0, 11.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.0040267109870910645, -0.003891587257385254, -0.0037564635276794434, -0.003621339797973633, -0.0034862160682678223, -0.0033510923385620117, -0.003215968608856201, -0.0030808448791503906, -0.00294572114944458, -0.0028105974197387695, -0.002675473690032959, -0.0025403499603271484, -0.002405226230621338, -0.0022701025009155273, -0.002134978771209717, -0.0019998550415039062, -0.0018647313117980957, -0.0017296075820922852, -0.0015944838523864746, -0.001459360122680664, -0.0013242363929748535, -0.001189112663269043, -0.0010539889335632324, -0.0009188652038574219, -0.0007837414741516113, -0.0006486177444458008, -0.0005134940147399902, -0.0003783702850341797, -0.00024324655532836914, -0.0001081228256225586, 2.7000904083251953e-05, 0.0001621246337890625, 0.00029724836349487305, 0.0004323720932006836, 0.0005674958229064941, 0.0007026195526123047, 0.0008377432823181152, 0.0009728670120239258, 0.0011079907417297363, 0.0012431144714355469, 0.0013782382011413574, 0.001513361930847168, 0.0016484856605529785, 0.001783609390258789, 0.0019187331199645996, 0.00205385684967041, 0.0021889805793762207, 0.0023241043090820312, 0.002459228038787842, 0.0025943517684936523, 0.002729475498199463, 0.0028645992279052734, 0.002999722957611084, 0.0031348466873168945, 0.003269970417022705, 0.0034050941467285156, 0.003540217876434326, 0.0036753416061401367, 0.0038104653358459473, 0.003945589065551758, 0.004080712795257568, 0.004215836524963379, 0.0043509602546691895, 0.004486083984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 15.0, 29.0, 64.0, 106.0, 143.0, 172.0, 154.0, 144.0, 94.0, 41.0, 25.0, 14.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010209299944108352, -9.857855911832303e-05, -9.506411879556254e-05, -9.154967847280204e-05, -8.803523815004155e-05, -8.452079782728106e-05, -8.100636478047818e-05, -7.749191718176007e-05, -7.39774841349572e-05, -7.04630438121967e-05, -6.694860348943621e-05, -6.343416316667572e-05, -5.9919722843915224e-05, -5.640528252115473e-05, -5.2890845836373046e-05, -4.9376405513612553e-05, -4.5861961552873254e-05, -4.234752123011276e-05, -3.883308090735227e-05, -3.5318640584591776e-05, -3.1804200261831284e-05, -2.8289761758060195e-05, -2.4775323254289106e-05, -2.1260882931528613e-05, -1.774644260876812e-05, -1.4232002286007628e-05, -1.0717562872741837e-05, -7.203123459476046e-06, -3.6886831367155537e-06, -1.7424281395506114e-07, 3.340195689816028e-06, 6.8546360125765204e-06, 1.0369083611294627e-05, 1.388352393405512e-05, 1.7397964256815612e-05, 2.09124027605867e-05, 2.4426843083347194e-05, 2.7941283406107686e-05, 3.1455721909878775e-05, 3.497016223263927e-05, 3.848460255539976e-05, 4.199904287816025e-05, 4.5513483200920746e-05, 4.902791988570243e-05, 5.2542360208462924e-05, 5.6056800531223416e-05, 5.957124085398391e-05, 6.30856811767444e-05, 6.66001214995049e-05, 7.011456182226539e-05, 7.362900214502588e-05, 7.714344246778637e-05, 8.065788279054686e-05, 8.417232311330736e-05, 8.768675616011024e-05, 9.120120375882834e-05, 9.471563680563122e-05, 9.823007712839171e-05, 0.0001017445174511522, 0.0001052589577739127, 0.00010877339809667319, 0.00011228783841943368, 0.00011580227874219418, 0.00011931671178899705, 0.00012283115938771516]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 6.0, 13.0, 10.0, 18.0, 11.0, 25.0, 13.0, 23.0, 21.0, 31.0, 34.0, 26.0, 32.0, 42.0, 35.0, 33.0, 41.0, 29.0, 44.0, 35.0, 36.0, 31.0, 40.0, 34.0, 38.0, 23.0, 28.0, 33.0, 28.0, 28.0, 17.0, 10.0, 19.0, 15.0, 14.0, 8.0, 8.0, 10.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.575750350952148e-05, -7.341057062149048e-05, -7.106363773345947e-05, -6.871670484542847e-05, -6.636977195739746e-05, -6.402283906936646e-05, -6.167590618133545e-05, -5.932897329330444e-05, -5.698204040527344e-05, -5.463510751724243e-05, -5.2288174629211426e-05, -4.994124174118042e-05, -4.7594308853149414e-05, -4.524737596511841e-05, -4.29004430770874e-05, -4.0553510189056396e-05, -3.820657730102539e-05, -3.5859644412994385e-05, -3.351271152496338e-05, -3.116577863693237e-05, -2.8818845748901367e-05, -2.647191286087036e-05, -2.4124979972839355e-05, -2.177804708480835e-05, -1.9431114196777344e-05, -1.7084181308746338e-05, -1.4737248420715332e-05, -1.2390315532684326e-05, -1.004338264465332e-05, -7.696449756622314e-06, -5.349516868591309e-06, -3.0025839805603027e-06, -6.556510925292969e-07, 1.691281795501709e-06, 4.038214683532715e-06, 6.385147571563721e-06, 8.732080459594727e-06, 1.1079013347625732e-05, 1.3425946235656738e-05, 1.5772879123687744e-05, 1.811981201171875e-05, 2.0466744899749756e-05, 2.2813677787780762e-05, 2.5160610675811768e-05, 2.7507543563842773e-05, 2.985447645187378e-05, 3.2201409339904785e-05, 3.454834222793579e-05, 3.68952751159668e-05, 3.92422080039978e-05, 4.158914089202881e-05, 4.3936073780059814e-05, 4.628300666809082e-05, 4.8629939556121826e-05, 5.097687244415283e-05, 5.332380533218384e-05, 5.5670738220214844e-05, 5.801767110824585e-05, 6.0364603996276855e-05, 6.271153688430786e-05, 6.505846977233887e-05, 6.740540266036987e-05, 6.975233554840088e-05, 7.209926843643188e-05, 7.444620132446289e-05]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 14.0, 13.0, 22.0, 27.0, 27.0, 27.0, 21.0, 36.0, 28.0, 43.0, 37.0, 39.0, 51.0, 44.0, 35.0, 38.0, 42.0, 30.0, 47.0, 36.0, 30.0, 43.0, 33.0, 34.0, 28.0, 27.0, 17.0, 22.0, 13.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.45703125, -4.32073974609375, -4.1844482421875, -4.04815673828125, -3.911865234375, -3.77557373046875, -3.6392822265625, -3.50299072265625, -3.36669921875, -3.23040771484375, -3.0941162109375, -2.95782470703125, -2.821533203125, -2.68524169921875, -2.5489501953125, -2.41265869140625, -2.2763671875, -2.14007568359375, -2.0037841796875, -1.86749267578125, -1.731201171875, -1.59490966796875, -1.4586181640625, -1.32232666015625, -1.18603515625, -1.04974365234375, -0.9134521484375, -0.77716064453125, -0.640869140625, -0.50457763671875, -0.3682861328125, -0.23199462890625, -0.095703125, 0.04058837890625, 0.1768798828125, 0.31317138671875, 0.449462890625, 0.58575439453125, 0.7220458984375, 0.85833740234375, 0.99462890625, 1.13092041015625, 1.2672119140625, 1.40350341796875, 1.539794921875, 1.67608642578125, 1.8123779296875, 1.94866943359375, 2.0849609375, 2.22125244140625, 2.3575439453125, 2.49383544921875, 2.630126953125, 2.76641845703125, 2.9027099609375, 3.03900146484375, 3.17529296875, 3.31158447265625, 3.4478759765625, 3.58416748046875, 3.720458984375, 3.85675048828125, 3.9930419921875, 4.12933349609375, 4.265625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 2.0, 8.0, 9.0, 9.0, 19.0, 21.0, 24.0, 36.0, 44.0, 66.0, 97.0, 126.0, 190.0, 276.0, 430.0, 835.0, 2827.0, 13082.0, 65420.0, 489034.0, 406361.0, 54177.0, 10874.0, 2460.0, 807.0, 407.0, 268.0, 184.0, 122.0, 88.0, 64.0, 43.0, 40.0, 33.0, 21.0, 12.0, 7.0, 11.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.296875, -8.0450439453125, -7.793212890625, -7.5413818359375, -7.28955078125, -7.0377197265625, -6.785888671875, -6.5340576171875, -6.2822265625, -6.0303955078125, -5.778564453125, -5.5267333984375, -5.27490234375, -5.0230712890625, -4.771240234375, -4.5194091796875, -4.267578125, -4.0157470703125, -3.763916015625, -3.5120849609375, -3.26025390625, -3.0084228515625, -2.756591796875, -2.5047607421875, -2.2529296875, -2.0010986328125, -1.749267578125, -1.4974365234375, -1.24560546875, -0.9937744140625, -0.741943359375, -0.4901123046875, -0.23828125, 0.0135498046875, 0.265380859375, 0.5172119140625, 0.76904296875, 1.0208740234375, 1.272705078125, 1.5245361328125, 1.7763671875, 2.0281982421875, 2.280029296875, 2.5318603515625, 2.78369140625, 3.0355224609375, 3.287353515625, 3.5391845703125, 3.791015625, 4.0428466796875, 4.294677734375, 4.5465087890625, 4.79833984375, 5.0501708984375, 5.302001953125, 5.5538330078125, 5.8056640625, 6.0574951171875, 6.309326171875, 6.5611572265625, 6.81298828125, 7.0648193359375, 7.316650390625, 7.5684814453125, 7.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 12.0, 12.0, 10.0, 10.0, 18.0, 17.0, 21.0, 23.0, 29.0, 30.0, 43.0, 42.0, 56.0, 58.0, 75.0, 134.0, 391.0, 1411.0, 168.0, 69.0, 52.0, 46.0, 40.0, 41.0, 36.0, 23.0, 28.0, 20.0, 17.0, 12.0, 17.0, 11.0, 14.0, 11.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.5960693359375, -12.176513671875, -11.7569580078125, -11.33740234375, -10.9178466796875, -10.498291015625, -10.0787353515625, -9.6591796875, -9.2396240234375, -8.820068359375, -8.4005126953125, -7.98095703125, -7.5614013671875, -7.141845703125, -6.7222900390625, -6.302734375, -5.8831787109375, -5.463623046875, -5.0440673828125, -4.62451171875, -4.2049560546875, -3.785400390625, -3.3658447265625, -2.9462890625, -2.5267333984375, -2.107177734375, -1.6876220703125, -1.26806640625, -0.8485107421875, -0.428955078125, -0.0093994140625, 0.41015625, 0.8297119140625, 1.249267578125, 1.6688232421875, 2.08837890625, 2.5079345703125, 2.927490234375, 3.3470458984375, 3.7666015625, 4.1861572265625, 4.605712890625, 5.0252685546875, 5.44482421875, 5.8643798828125, 6.283935546875, 6.7034912109375, 7.123046875, 7.5426025390625, 7.962158203125, 8.3817138671875, 8.80126953125, 9.2208251953125, 9.640380859375, 10.0599365234375, 10.4794921875, 10.8990478515625, 11.318603515625, 11.7381591796875, 12.15771484375, 12.5772705078125, 12.996826171875, 13.4163818359375, 13.8359375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 3.0, 9.0, 10.0, 14.0, 23.0, 24.0, 20.0, 21.0, 38.0, 49.0, 49.0, 82.0, 119.0, 192.0, 254.0, 505.0, 1212.0, 7902.0, 2965328.0, 165133.0, 2709.0, 812.0, 384.0, 235.0, 121.0, 83.0, 70.0, 63.0, 41.0, 45.0, 21.0, 24.0, 20.0, 16.0, 10.0, 11.0, 11.0, 9.0, 4.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.08349609375, -28.0732421875, -27.06298828125, -26.052734375, -25.04248046875, -24.0322265625, -23.02197265625, -22.01171875, -21.00146484375, -19.9912109375, -18.98095703125, -17.970703125, -16.96044921875, -15.9501953125, -14.93994140625, -13.9296875, -12.91943359375, -11.9091796875, -10.89892578125, -9.888671875, -8.87841796875, -7.8681640625, -6.85791015625, -5.84765625, -4.83740234375, -3.8271484375, -2.81689453125, -1.806640625, -0.79638671875, 0.2138671875, 1.22412109375, 2.234375, 3.24462890625, 4.2548828125, 5.26513671875, 6.275390625, 7.28564453125, 8.2958984375, 9.30615234375, 10.31640625, 11.32666015625, 12.3369140625, 13.34716796875, 14.357421875, 15.36767578125, 16.3779296875, 17.38818359375, 18.3984375, 19.40869140625, 20.4189453125, 21.42919921875, 22.439453125, 23.44970703125, 24.4599609375, 25.47021484375, 26.48046875, 27.49072265625, 28.5009765625, 29.51123046875, 30.521484375, 31.53173828125, 32.5419921875, 33.55224609375, 34.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 364.0, 639.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.357666015625, -178.4025115966797, -174.44735717773438, -170.49220275878906, -166.53704833984375, -162.58189392089844, -158.62673950195312, -154.6715850830078, -150.7164306640625, -146.7612762451172, -142.80612182617188, -138.85096740722656, -134.89581298828125, -130.94065856933594, -126.98550415039062, -123.03034973144531, -119.0751953125, -115.12004089355469, -111.16488647460938, -107.20973205566406, -103.25457763671875, -99.29942321777344, -95.34426879882812, -91.38911437988281, -87.43396759033203, -83.47881317138672, -79.5236587524414, -75.5685043334961, -71.61334991455078, -67.65819549560547, -63.703041076660156, -59.747886657714844, -55.79273223876953, -51.83757781982422, -47.882423400878906, -43.927268981933594, -39.97211456298828, -36.01696014404297, -32.061805725097656, -28.106653213500977, -24.151498794555664, -20.19634437561035, -16.24118995666504, -12.286036491394043, -8.33088207244873, -4.375728607177734, -0.4205741882324219, 3.5345802307128906, 7.489734649658203, 11.444889068603516, 15.400043487548828, 19.35519790649414, 23.310352325439453, 27.265504837036133, 31.220659255981445, 35.175811767578125, 39.13096618652344, 43.08612060546875, 47.04127502441406, 50.996429443359375, 54.95158386230469, 58.90673828125, 62.86189270019531, 66.81704711914062, 70.77220153808594]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 9.0, 5.0, 9.0, 5.0, 10.0, 14.0, 18.0, 21.0, 35.0, 27.0, 22.0, 31.0, 37.0, 32.0, 45.0, 61.0, 34.0, 42.0, 38.0, 39.0, 28.0, 43.0, 38.0, 33.0, 30.0, 35.0, 23.0, 23.0, 34.0, 22.0, 24.0, 17.0, 11.0, 17.0, 9.0, 7.0, 8.0, 10.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.35193634033203, -27.443452835083008, -26.534971237182617, -25.626487731933594, -24.71800422668457, -23.809520721435547, -22.901039123535156, -21.992555618286133, -21.08407211303711, -20.175588607788086, -19.267107009887695, -18.358623504638672, -17.45013999938965, -16.541656494140625, -15.633174896240234, -14.724691390991211, -13.81620979309082, -12.907727241516113, -11.99924373626709, -11.090761184692383, -10.18227767944336, -9.273795127868652, -8.365312576293945, -7.45682954788208, -6.548346519470215, -5.63986349105835, -4.731380462646484, -3.8228979110717773, -2.914414882659912, -2.005931854248047, -1.0974493026733398, -0.1889662742614746, 0.7195186614990234, 1.6280015707015991, 2.536484479904175, 3.444967269897461, 4.353450298309326, 5.261933326721191, 6.170415878295898, 7.078898906707764, 7.987381935119629, 8.895864486694336, 9.80434799194336, 10.712830543518066, 11.621313095092773, 12.529796600341797, 13.438279151916504, 14.346761703491211, 15.255245208740234, 16.163728713989258, 17.07221031188965, 17.980693817138672, 18.889177322387695, 19.79766082763672, 20.70614242553711, 21.614625930786133, 22.523109436035156, 23.43159294128418, 24.34007453918457, 25.248558044433594, 26.157041549682617, 27.06552505493164, 27.97400665283203, 28.882490158081055, 29.790971755981445]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 9.0, 9.0, 16.0, 9.0, 22.0, 20.0, 28.0, 23.0, 38.0, 31.0, 21.0, 31.0, 33.0, 45.0, 40.0, 40.0, 41.0, 44.0, 44.0, 40.0, 38.0, 38.0, 30.0, 35.0, 36.0, 29.0, 26.0, 22.0, 14.0, 21.0, 13.0, 12.0, 9.0, 11.0, 17.0, 6.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.03515625, -3.90496826171875, -3.7747802734375, -3.64459228515625, -3.514404296875, -3.38421630859375, -3.2540283203125, -3.12384033203125, -2.99365234375, -2.86346435546875, -2.7332763671875, -2.60308837890625, -2.472900390625, -2.34271240234375, -2.2125244140625, -2.08233642578125, -1.9521484375, -1.82196044921875, -1.6917724609375, -1.56158447265625, -1.431396484375, -1.30120849609375, -1.1710205078125, -1.04083251953125, -0.91064453125, -0.78045654296875, -0.6502685546875, -0.52008056640625, -0.389892578125, -0.25970458984375, -0.1295166015625, 0.00067138671875, 0.130859375, 0.26104736328125, 0.3912353515625, 0.52142333984375, 0.651611328125, 0.78179931640625, 0.9119873046875, 1.04217529296875, 1.17236328125, 1.30255126953125, 1.4327392578125, 1.56292724609375, 1.693115234375, 1.82330322265625, 1.9534912109375, 2.08367919921875, 2.2138671875, 2.34405517578125, 2.4742431640625, 2.60443115234375, 2.734619140625, 2.86480712890625, 2.9949951171875, 3.12518310546875, 3.25537109375, 3.38555908203125, 3.5157470703125, 3.64593505859375, 3.776123046875, 3.90631103515625, 4.0364990234375, 4.16668701171875, 4.296875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 9.0, 13.0, 14.0, 16.0, 29.0, 22.0, 24.0, 47.0, 47.0, 61.0, 82.0, 135.0, 203.0, 562.0, 2274.0, 33292.0, 874831.0, 2891512.0, 375191.0, 13414.0, 1408.0, 405.0, 190.0, 109.0, 80.0, 50.0, 47.0, 33.0, 24.0, 22.0, 15.0, 17.0, 16.0, 8.0, 13.0, 7.0, 6.0, 9.0, 3.0, 5.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-11.125, -10.79150390625, -10.4580078125, -10.12451171875, -9.791015625, -9.45751953125, -9.1240234375, -8.79052734375, -8.45703125, -8.12353515625, -7.7900390625, -7.45654296875, -7.123046875, -6.78955078125, -6.4560546875, -6.12255859375, -5.7890625, -5.45556640625, -5.1220703125, -4.78857421875, -4.455078125, -4.12158203125, -3.7880859375, -3.45458984375, -3.12109375, -2.78759765625, -2.4541015625, -2.12060546875, -1.787109375, -1.45361328125, -1.1201171875, -0.78662109375, -0.453125, -0.11962890625, 0.2138671875, 0.54736328125, 0.880859375, 1.21435546875, 1.5478515625, 1.88134765625, 2.21484375, 2.54833984375, 2.8818359375, 3.21533203125, 3.548828125, 3.88232421875, 4.2158203125, 4.54931640625, 4.8828125, 5.21630859375, 5.5498046875, 5.88330078125, 6.216796875, 6.55029296875, 6.8837890625, 7.21728515625, 7.55078125, 7.88427734375, 8.2177734375, 8.55126953125, 8.884765625, 9.21826171875, 9.5517578125, 9.88525390625, 10.21875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 12.0, 9.0, 15.0, 18.0, 17.0, 32.0, 31.0, 66.0, 70.0, 109.0, 145.0, 194.0, 209.0, 297.0, 348.0, 351.0, 408.0, 367.0, 275.0, 223.0, 213.0, 158.0, 106.0, 85.0, 75.0, 50.0, 36.0, 33.0, 16.0, 16.0, 13.0, 13.0, 21.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.10546875, -5.92706298828125, -5.7486572265625, -5.57025146484375, -5.391845703125, -5.21343994140625, -5.0350341796875, -4.85662841796875, -4.67822265625, -4.49981689453125, -4.3214111328125, -4.14300537109375, -3.964599609375, -3.78619384765625, -3.6077880859375, -3.42938232421875, -3.2509765625, -3.07257080078125, -2.8941650390625, -2.71575927734375, -2.537353515625, -2.35894775390625, -2.1805419921875, -2.00213623046875, -1.82373046875, -1.64532470703125, -1.4669189453125, -1.28851318359375, -1.110107421875, -0.93170166015625, -0.7532958984375, -0.57489013671875, -0.396484375, -0.21807861328125, -0.0396728515625, 0.13873291015625, 0.317138671875, 0.49554443359375, 0.6739501953125, 0.85235595703125, 1.03076171875, 1.20916748046875, 1.3875732421875, 1.56597900390625, 1.744384765625, 1.92279052734375, 2.1011962890625, 2.27960205078125, 2.4580078125, 2.63641357421875, 2.8148193359375, 2.99322509765625, 3.171630859375, 3.35003662109375, 3.5284423828125, 3.70684814453125, 3.88525390625, 4.06365966796875, 4.2420654296875, 4.42047119140625, 4.598876953125, 4.77728271484375, 4.9556884765625, 5.13409423828125, 5.3125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 10.0, 7.0, 16.0, 19.0, 23.0, 26.0, 54.0, 70.0, 77.0, 96.0, 130.0, 176.0, 261.0, 433.0, 759.0, 2264.0, 28945.0, 2603854.0, 1535414.0, 17784.0, 1820.0, 729.0, 416.0, 238.0, 169.0, 123.0, 73.0, 62.0, 56.0, 47.0, 38.0, 30.0, 14.0, 13.0, 12.0, 12.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.423095703125, -16.79931640625, -16.175537109375, -15.5517578125, -14.927978515625, -14.30419921875, -13.680419921875, -13.056640625, -12.432861328125, -11.80908203125, -11.185302734375, -10.5615234375, -9.937744140625, -9.31396484375, -8.690185546875, -8.06640625, -7.442626953125, -6.81884765625, -6.195068359375, -5.5712890625, -4.947509765625, -4.32373046875, -3.699951171875, -3.076171875, -2.452392578125, -1.82861328125, -1.204833984375, -0.5810546875, 0.042724609375, 0.66650390625, 1.290283203125, 1.9140625, 2.537841796875, 3.16162109375, 3.785400390625, 4.4091796875, 5.032958984375, 5.65673828125, 6.280517578125, 6.904296875, 7.528076171875, 8.15185546875, 8.775634765625, 9.3994140625, 10.023193359375, 10.64697265625, 11.270751953125, 11.89453125, 12.518310546875, 13.14208984375, 13.765869140625, 14.3896484375, 15.013427734375, 15.63720703125, 16.260986328125, 16.884765625, 17.508544921875, 18.13232421875, 18.756103515625, 19.3798828125, 20.003662109375, 20.62744140625, 21.251220703125, 21.875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 25.0, 129.0, 367.0, 356.0, 115.0, 22.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.33060455322266, -105.81037902832031, -103.2901611328125, -100.76993560791016, -98.24971008300781, -95.7294921875, -93.20926666259766, -90.68904113769531, -88.1688232421875, -85.64859771728516, -83.12837982177734, -80.608154296875, -78.08793640136719, -75.56771087646484, -73.0474853515625, -70.52726745605469, -68.00704193115234, -65.48681640625, -62.96659851074219, -60.446372985839844, -57.926151275634766, -55.40592956542969, -52.885704040527344, -50.365482330322266, -47.84526062011719, -45.32503890991211, -42.80481719970703, -40.28459167480469, -37.76436996459961, -35.24414825439453, -32.72392272949219, -30.20370101928711, -27.6834716796875, -25.163249969482422, -22.64302635192871, -20.122802734375, -17.602581024169922, -15.082358360290527, -12.562135696411133, -10.041912078857422, -7.521690368652344, -5.001467704772949, -2.4812450408935547, 0.038977622985839844, 2.5592002868652344, 5.079422950744629, 7.599645614624023, 10.119869232177734, 12.640090942382812, 15.160313606262207, 17.6805362701416, 20.200759887695312, 22.72098159790039, 25.24120330810547, 27.76142692565918, 30.28165054321289, 32.80187225341797, 35.32209396362305, 37.842315673828125, 40.36254119873047, 42.88276290893555, 45.402984619140625, 47.92321014404297, 50.44343185424805, 52.963653564453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 7.0, 7.0, 13.0, 10.0, 16.0, 11.0, 13.0, 25.0, 27.0, 25.0, 21.0, 32.0, 41.0, 41.0, 42.0, 30.0, 43.0, 39.0, 42.0, 41.0, 33.0, 30.0, 35.0, 34.0, 35.0, 24.0, 38.0, 32.0, 30.0, 22.0, 25.0, 16.0, 11.0, 15.0, 14.0, 11.0, 14.0, 6.0, 7.0, 5.0, 4.0, 7.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.28722381591797, -19.64261245727539, -18.998001098632812, -18.353389739990234, -17.708778381347656, -17.064167022705078, -16.4195556640625, -15.774945259094238, -15.13033390045166, -14.485722541809082, -13.841111183166504, -13.196499824523926, -12.551889419555664, -11.907278060913086, -11.262666702270508, -10.61805534362793, -9.973443984985352, -9.328832626342773, -8.684221267700195, -8.039609909057617, -7.394999027252197, -6.750387668609619, -6.105776786804199, -5.461165428161621, -4.816554069519043, -4.171942710876465, -3.527331590652466, -2.882720470428467, -2.2381091117858887, -1.5934977531433105, -0.9488866329193115, -0.3042755126953125, 0.3403358459472656, 0.9849470853805542, 1.6295583248138428, 2.274169445037842, 2.91878080368042, 3.563392162322998, 4.208003044128418, 4.852614402770996, 5.497225761413574, 6.141837120056152, 6.7864484786987305, 7.43105936050415, 8.07567024230957, 8.720281600952148, 9.364892959594727, 10.009504318237305, 10.654115676879883, 11.298727035522461, 11.943338394165039, 12.587949752807617, 13.232561111450195, 13.877172470092773, 14.521782875061035, 15.166394233703613, 15.811005592346191, 16.455615997314453, 17.10022735595703, 17.74483871459961, 18.389450073242188, 19.034061431884766, 19.678672790527344, 20.323284149169922, 20.9678955078125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 8.0, 3.0, 7.0, 11.0, 11.0, 14.0, 23.0, 22.0, 19.0, 20.0, 29.0, 26.0, 24.0, 30.0, 39.0, 40.0, 42.0, 30.0, 36.0, 41.0, 50.0, 54.0, 43.0, 37.0, 44.0, 25.0, 30.0, 44.0, 20.0, 20.0, 25.0, 22.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93505859375, -3.7998046875, -3.66455078125, -3.529296875, -3.39404296875, -3.2587890625, -3.12353515625, -2.98828125, -2.85302734375, -2.7177734375, -2.58251953125, -2.447265625, -2.31201171875, -2.1767578125, -2.04150390625, -1.90625, -1.77099609375, -1.6357421875, -1.50048828125, -1.365234375, -1.22998046875, -1.0947265625, -0.95947265625, -0.82421875, -0.68896484375, -0.5537109375, -0.41845703125, -0.283203125, -0.14794921875, -0.0126953125, 0.12255859375, 0.2578125, 0.39306640625, 0.5283203125, 0.66357421875, 0.798828125, 0.93408203125, 1.0693359375, 1.20458984375, 1.33984375, 1.47509765625, 1.6103515625, 1.74560546875, 1.880859375, 2.01611328125, 2.1513671875, 2.28662109375, 2.421875, 2.55712890625, 2.6923828125, 2.82763671875, 2.962890625, 3.09814453125, 3.2333984375, 3.36865234375, 3.50390625, 3.63916015625, 3.7744140625, 3.90966796875, 4.044921875, 4.18017578125, 4.3154296875, 4.45068359375, 4.5859375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 22.0, 33.0, 35.0, 53.0, 77.0, 88.0, 145.0, 197.0, 299.0, 445.0, 591.0, 846.0, 1119.0, 1700.0, 2478.0, 3691.0, 5147.0, 7644.0, 11462.0, 16878.0, 25331.0, 39336.0, 63173.0, 111476.0, 227193.0, 232062.0, 113448.0, 64365.0, 39703.0, 26063.0, 17163.0, 11343.0, 7709.0, 5298.0, 3700.0, 2454.0, 1723.0, 1136.0, 876.0, 596.0, 449.0, 273.0, 205.0, 157.0, 112.0, 92.0, 47.0, 26.0, 32.0, 19.0, 8.0, 3.0, 8.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.63818359375, -0.6176071166992188, -0.5970306396484375, -0.5764541625976562, -0.555877685546875, -0.5353012084960938, -0.5147247314453125, -0.49414825439453125, -0.47357177734375, -0.45299530029296875, -0.4324188232421875, -0.41184234619140625, -0.391265869140625, -0.37068939208984375, -0.3501129150390625, -0.32953643798828125, -0.3089599609375, -0.28838348388671875, -0.2678070068359375, -0.24723052978515625, -0.226654052734375, -0.20607757568359375, -0.1855010986328125, -0.16492462158203125, -0.14434814453125, -0.12377166748046875, -0.1031951904296875, -0.08261871337890625, -0.062042236328125, -0.04146575927734375, -0.0208892822265625, -0.00031280517578125, 0.020263671875, 0.04084014892578125, 0.0614166259765625, 0.08199310302734375, 0.102569580078125, 0.12314605712890625, 0.1437225341796875, 0.16429901123046875, 0.18487548828125, 0.20545196533203125, 0.2260284423828125, 0.24660491943359375, 0.267181396484375, 0.28775787353515625, 0.3083343505859375, 0.32891082763671875, 0.3494873046875, 0.37006378173828125, 0.3906402587890625, 0.41121673583984375, 0.431793212890625, 0.45236968994140625, 0.4729461669921875, 0.49352264404296875, 0.51409912109375, 0.5346755981445312, 0.5552520751953125, 0.5758285522460938, 0.596405029296875, 0.6169815063476562, 0.6375579833984375, 0.6581344604492188, 0.6787109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 6.0, 12.0, 13.0, 6.0, 18.0, 15.0, 20.0, 19.0, 29.0, 27.0, 32.0, 29.0, 28.0, 34.0, 32.0, 43.0, 32.0, 43.0, 34.0, 1062.0, 33.0, 42.0, 31.0, 27.0, 44.0, 32.0, 31.0, 32.0, 29.0, 26.0, 14.0, 19.0, 14.0, 19.0, 18.0, 9.0, 6.0, 10.0, 7.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55078125, -2.46875, -2.38671875, -2.3046875, -2.22265625, -2.140625, -2.05859375, -1.9765625, -1.89453125, -1.8125, -1.73046875, -1.6484375, -1.56640625, -1.484375, -1.40234375, -1.3203125, -1.23828125, -1.15625, -1.07421875, -0.9921875, -0.91015625, -0.828125, -0.74609375, -0.6640625, -0.58203125, -0.5, -0.41796875, -0.3359375, -0.25390625, -0.171875, -0.08984375, -0.0078125, 0.07421875, 0.15625, 0.23828125, 0.3203125, 0.40234375, 0.484375, 0.56640625, 0.6484375, 0.73046875, 0.8125, 0.89453125, 0.9765625, 1.05859375, 1.140625, 1.22265625, 1.3046875, 1.38671875, 1.46875, 1.55078125, 1.6328125, 1.71484375, 1.796875, 1.87890625, 1.9609375, 2.04296875, 2.125, 2.20703125, 2.2890625, 2.37109375, 2.453125, 2.53515625, 2.6171875, 2.69921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 8.0, 9.0, 15.0, 27.0, 35.0, 47.0, 90.0, 96.0, 161.0, 230.0, 350.0, 457.0, 631.0, 919.0, 1223.0, 1695.0, 2372.0, 3250.0, 4538.0, 6129.0, 8601.0, 12288.0, 17421.0, 24979.0, 36658.0, 55438.0, 88723.0, 162438.0, 1294168.0, 136133.0, 78001.0, 49088.0, 32632.0, 22693.0, 15733.0, 11342.0, 8061.0, 5804.0, 4123.0, 2940.0, 2132.0, 1559.0, 1095.0, 827.0, 595.0, 421.0, 274.0, 210.0, 155.0, 101.0, 74.0, 56.0, 38.0, 23.0, 17.0, 8.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.5810546875, -0.5631027221679688, -0.5451507568359375, -0.5271987915039062, -0.509246826171875, -0.49129486083984375, -0.4733428955078125, -0.45539093017578125, -0.43743896484375, -0.41948699951171875, -0.4015350341796875, -0.38358306884765625, -0.365631103515625, -0.34767913818359375, -0.3297271728515625, -0.31177520751953125, -0.2938232421875, -0.27587127685546875, -0.2579193115234375, -0.23996734619140625, -0.222015380859375, -0.20406341552734375, -0.1861114501953125, -0.16815948486328125, -0.15020751953125, -0.13225555419921875, -0.1143035888671875, -0.09635162353515625, -0.078399658203125, -0.06044769287109375, -0.0424957275390625, -0.02454376220703125, -0.006591796875, 0.01136016845703125, 0.0293121337890625, 0.04726409912109375, 0.065216064453125, 0.08316802978515625, 0.1011199951171875, 0.11907196044921875, 0.13702392578125, 0.15497589111328125, 0.1729278564453125, 0.19087982177734375, 0.208831787109375, 0.22678375244140625, 0.2447357177734375, 0.26268768310546875, 0.2806396484375, 0.29859161376953125, 0.3165435791015625, 0.33449554443359375, 0.352447509765625, 0.37039947509765625, 0.3883514404296875, 0.40630340576171875, 0.42425537109375, 0.44220733642578125, 0.4601593017578125, 0.47811126708984375, 0.496063232421875, 0.5140151977539062, 0.5319671630859375, 0.5499191284179688, 0.56787109375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 10.0, 8.0, 10.0, 11.0, 16.0, 18.0, 15.0, 29.0, 26.0, 42.0, 50.0, 44.0, 58.0, 76.0, 51.0, 65.0, 56.0, 64.0, 51.0, 49.0, 60.0, 46.0, 27.0, 26.0, 17.0, 11.0, 10.0, 9.0, 9.0, 5.0, 3.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018531642854213715, -0.00017942115664482117, -0.0001735258847475052, -0.0001676306128501892, -0.00016173534095287323, -0.00015584006905555725, -0.00014994479715824127, -0.0001440495252609253, -0.00013815425336360931, -0.00013225898146629333, -0.00012636370956897736, -0.00012046843767166138, -0.0001145731657743454, -0.00010867789387702942, -0.00010278262197971344, -9.688735008239746e-05, -9.099207818508148e-05, -8.50968062877655e-05, -7.920153439044952e-05, -7.330626249313354e-05, -6.741099059581757e-05, -6.151571869850159e-05, -5.562044680118561e-05, -4.972517490386963e-05, -4.382990300655365e-05, -3.793463110923767e-05, -3.203935921192169e-05, -2.6144087314605713e-05, -2.0248815417289734e-05, -1.4353543519973755e-05, -8.458271622657776e-06, -2.562999725341797e-06, 3.332272171974182e-06, 9.227544069290161e-06, 1.512281596660614e-05, 2.101808786392212e-05, 2.6913359761238098e-05, 3.280863165855408e-05, 3.8703903555870056e-05, 4.4599175453186035e-05, 5.0494447350502014e-05, 5.638971924781799e-05, 6.228499114513397e-05, 6.818026304244995e-05, 7.407553493976593e-05, 7.997080683708191e-05, 8.586607873439789e-05, 9.176135063171387e-05, 9.765662252902985e-05, 0.00010355189442634583, 0.0001094471663236618, 0.00011534243822097778, 0.00012123771011829376, 0.00012713298201560974, 0.00013302825391292572, 0.0001389235258102417, 0.00014481879770755768, 0.00015071406960487366, 0.00015660934150218964, 0.00016250461339950562, 0.0001683998852968216, 0.00017429515719413757, 0.00018019042909145355, 0.00018608570098876953]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 7.0, 12.0, 17.0, 17.0, 24.0, 26.0, 39.0, 57.0, 91.0, 147.0, 224.0, 341.0, 674.0, 2570.0, 1036095.0, 6239.0, 818.0, 396.0, 214.0, 162.0, 76.0, 73.0, 50.0, 33.0, 37.0, 23.0, 19.0, 22.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.004034161567687988, -0.0039064884185791016, -0.003778815269470215, -0.003651142120361328, -0.0035234689712524414, -0.0033957958221435547, -0.003268122673034668, -0.0031404495239257812, -0.0030127763748168945, -0.002885103225708008, -0.002757430076599121, -0.0026297569274902344, -0.0025020837783813477, -0.002374410629272461, -0.0022467374801635742, -0.0021190643310546875, -0.0019913911819458008, -0.001863718032836914, -0.0017360448837280273, -0.0016083717346191406, -0.001480698585510254, -0.0013530254364013672, -0.0012253522872924805, -0.0010976791381835938, -0.000970005989074707, -0.0008423328399658203, -0.0007146596908569336, -0.0005869865417480469, -0.00045931339263916016, -0.00033164024353027344, -0.00020396709442138672, -7.62939453125e-05, 5.137920379638672e-05, 0.00017905235290527344, 0.00030672550201416016, 0.0004343986511230469, 0.0005620718002319336, 0.0006897449493408203, 0.000817418098449707, 0.0009450912475585938, 0.0010727643966674805, 0.0012004375457763672, 0.001328110694885254, 0.0014557838439941406, 0.0015834569931030273, 0.001711130142211914, 0.0018388032913208008, 0.0019664764404296875, 0.0020941495895385742, 0.002221822738647461, 0.0023494958877563477, 0.0024771690368652344, 0.002604842185974121, 0.002732515335083008, 0.0028601884841918945, 0.0029878616333007812, 0.003115534782409668, 0.0032432079315185547, 0.0033708810806274414, 0.003498554229736328, 0.003626227378845215, 0.0037539005279541016, 0.0038815736770629883, 0.004009246826171875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 34.0, 154.0, 245.0, 302.0, 182.0, 71.0, 16.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027681791107170284, -0.0002701149496715516, -0.0002634120173752308, -0.00025670905597507954, -0.00025000612367875874, -0.0002433031622786075, -0.00023660021543037146, -0.00022989726858213544, -0.00022319432173389941, -0.0002164913748856634, -0.00020978842803742737, -0.00020308548118919134, -0.0001963825197890401, -0.0001896795874927193, -0.00018297662609256804, -0.00017627367924433202, -0.000169570732396096, -0.00016286778554785997, -0.00015616483869962394, -0.00014946189185138792, -0.0001427589450031519, -0.00013605598360300064, -0.00012935303675476462, -0.0001226500899065286, -0.00011594714305829257, -0.00010924419621005654, -0.00010254124936182052, -9.583829523762688e-05, -8.913534838939086e-05, -8.243240154115483e-05, -7.572944741696119e-05, -6.902650056872517e-05, -6.232355372048914e-05, -5.562060687225312e-05, -4.891765638603829e-05, -4.221470589982346e-05, -3.551175905158743e-05, -2.8808812203351408e-05, -2.2105861717136577e-05, -1.5402911230921745e-05, -8.699964382685721e-06, -1.997015715460293e-06, 4.705932951765135e-06, 1.1408881618990563e-05, 1.811183028621599e-05, 2.4814777134452015e-05, 3.151772762066685e-05, 3.822067810688168e-05, 4.49236249551177e-05, 5.162657180335373e-05, 5.832952228956856e-05, 6.503247277578339e-05, 7.173541962401941e-05, 7.843836647225544e-05, 8.514132059644908e-05, 9.18442674446851e-05, 9.854721429292113e-05, 0.00010525016114115715, 0.00011195310798939317, 0.00011865606211358681, 0.00012535901623778045, 0.00013206194853410125, 0.0001387649099342525, 0.00014546785678248852, 0.00015217080363072455]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 20.0, 14.0, 26.0, 27.0, 29.0, 22.0, 35.0, 35.0, 35.0, 48.0, 56.0, 47.0, 59.0, 45.0, 54.0, 52.0, 43.0, 42.0, 50.0, 38.0, 26.0, 37.0, 31.0, 20.0, 20.0, 16.0, 10.0, 14.0, 6.0, 2.0, 6.0, 5.0, 1.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011771917343139648, -0.00011443905532360077, -0.00011115893721580505, -0.00010787881910800934, -0.00010459870100021362, -0.00010131858289241791, -9.803846478462219e-05, -9.475834667682648e-05, -9.147822856903076e-05, -8.819811046123505e-05, -8.491799235343933e-05, -8.163787424564362e-05, -7.83577561378479e-05, -7.507763803005219e-05, -7.179751992225647e-05, -6.851740181446075e-05, -6.523728370666504e-05, -6.195716559886932e-05, -5.867704749107361e-05, -5.539692938327789e-05, -5.211681127548218e-05, -4.883669316768646e-05, -4.555657505989075e-05, -4.227645695209503e-05, -3.8996338844299316e-05, -3.57162207365036e-05, -3.2436102628707886e-05, -2.915598452091217e-05, -2.5875866413116455e-05, -2.259574830532074e-05, -1.9315630197525024e-05, -1.603551208972931e-05, -1.2755393981933594e-05, -9.475275874137878e-06, -6.195157766342163e-06, -2.9150396585464478e-06, 3.650784492492676e-07, 3.645196557044983e-06, 6.925314664840698e-06, 1.0205432772636414e-05, 1.3485550880432129e-05, 1.6765668988227844e-05, 2.004578709602356e-05, 2.3325905203819275e-05, 2.660602331161499e-05, 2.9886141419410706e-05, 3.316625952720642e-05, 3.6446377635002136e-05, 3.972649574279785e-05, 4.300661385059357e-05, 4.628673195838928e-05, 4.9566850066185e-05, 5.284696817398071e-05, 5.612708628177643e-05, 5.9407204389572144e-05, 6.268732249736786e-05, 6.596744060516357e-05, 6.924755871295929e-05, 7.2527676820755e-05, 7.580779492855072e-05, 7.908791303634644e-05, 8.236803114414215e-05, 8.564814925193787e-05, 8.892826735973358e-05, 9.22083854675293e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 8.0, 3.0, 7.0, 11.0, 11.0, 14.0, 23.0, 22.0, 19.0, 20.0, 29.0, 26.0, 24.0, 30.0, 39.0, 40.0, 42.0, 30.0, 36.0, 41.0, 50.0, 54.0, 43.0, 37.0, 44.0, 25.0, 30.0, 44.0, 20.0, 20.0, 25.0, 22.0, 16.0, 20.0, 15.0, 12.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93505859375, -3.7998046875, -3.66455078125, -3.529296875, -3.39404296875, -3.2587890625, -3.12353515625, -2.98828125, -2.85302734375, -2.7177734375, -2.58251953125, -2.447265625, -2.31201171875, -2.1767578125, -2.04150390625, -1.90625, -1.77099609375, -1.6357421875, -1.50048828125, -1.365234375, -1.22998046875, -1.0947265625, -0.95947265625, -0.82421875, -0.68896484375, -0.5537109375, -0.41845703125, -0.283203125, -0.14794921875, -0.0126953125, 0.12255859375, 0.2578125, 0.39306640625, 0.5283203125, 0.66357421875, 0.798828125, 0.93408203125, 1.0693359375, 1.20458984375, 1.33984375, 1.47509765625, 1.6103515625, 1.74560546875, 1.880859375, 2.01611328125, 2.1513671875, 2.28662109375, 2.421875, 2.55712890625, 2.6923828125, 2.82763671875, 2.962890625, 3.09814453125, 3.2333984375, 3.36865234375, 3.50390625, 3.63916015625, 3.7744140625, 3.90966796875, 4.044921875, 4.18017578125, 4.3154296875, 4.45068359375, 4.5859375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 2.0, 2.0, 13.0, 3.0, 8.0, 26.0, 20.0, 39.0, 57.0, 76.0, 88.0, 104.0, 149.0, 189.0, 258.0, 351.0, 503.0, 707.0, 1485.0, 5258.0, 28272.0, 287266.0, 658501.0, 51419.0, 8833.0, 2008.0, 821.0, 571.0, 387.0, 292.0, 219.0, 134.0, 122.0, 93.0, 70.0, 48.0, 41.0, 26.0, 22.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.887451171875, -9.54833984375, -9.209228515625, -8.8701171875, -8.531005859375, -8.19189453125, -7.852783203125, -7.513671875, -7.174560546875, -6.83544921875, -6.496337890625, -6.1572265625, -5.818115234375, -5.47900390625, -5.139892578125, -4.80078125, -4.461669921875, -4.12255859375, -3.783447265625, -3.4443359375, -3.105224609375, -2.76611328125, -2.427001953125, -2.087890625, -1.748779296875, -1.40966796875, -1.070556640625, -0.7314453125, -0.392333984375, -0.05322265625, 0.285888671875, 0.625, 0.964111328125, 1.30322265625, 1.642333984375, 1.9814453125, 2.320556640625, 2.65966796875, 2.998779296875, 3.337890625, 3.677001953125, 4.01611328125, 4.355224609375, 4.6943359375, 5.033447265625, 5.37255859375, 5.711669921875, 6.05078125, 6.389892578125, 6.72900390625, 7.068115234375, 7.4072265625, 7.746337890625, 8.08544921875, 8.424560546875, 8.763671875, 9.102783203125, 9.44189453125, 9.781005859375, 10.1201171875, 10.459228515625, 10.79833984375, 11.137451171875, 11.4765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 3.0, 4.0, 7.0, 10.0, 5.0, 12.0, 17.0, 25.0, 32.0, 38.0, 45.0, 56.0, 59.0, 68.0, 91.0, 315.0, 1663.0, 153.0, 72.0, 65.0, 57.0, 37.0, 41.0, 30.0, 33.0, 22.0, 16.0, 17.0, 10.0, 9.0, 11.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.734375, -19.158447265625, -18.58251953125, -18.006591796875, -17.4306640625, -16.854736328125, -16.27880859375, -15.702880859375, -15.126953125, -14.551025390625, -13.97509765625, -13.399169921875, -12.8232421875, -12.247314453125, -11.67138671875, -11.095458984375, -10.51953125, -9.943603515625, -9.36767578125, -8.791748046875, -8.2158203125, -7.639892578125, -7.06396484375, -6.488037109375, -5.912109375, -5.336181640625, -4.76025390625, -4.184326171875, -3.6083984375, -3.032470703125, -2.45654296875, -1.880615234375, -1.3046875, -0.728759765625, -0.15283203125, 0.423095703125, 0.9990234375, 1.574951171875, 2.15087890625, 2.726806640625, 3.302734375, 3.878662109375, 4.45458984375, 5.030517578125, 5.6064453125, 6.182373046875, 6.75830078125, 7.334228515625, 7.91015625, 8.486083984375, 9.06201171875, 9.637939453125, 10.2138671875, 10.789794921875, 11.36572265625, 11.941650390625, 12.517578125, 13.093505859375, 13.66943359375, 14.245361328125, 14.8212890625, 15.397216796875, 15.97314453125, 16.549072265625, 17.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 13.0, 17.0, 28.0, 56.0, 50.0, 85.0, 160.0, 344.0, 1796.0, 2785039.0, 355834.0, 1523.0, 324.0, 157.0, 102.0, 49.0, 38.0, 24.0, 19.0, 9.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.625, -92.3232421875, -89.021484375, -85.7197265625, -82.41796875, -79.1162109375, -75.814453125, -72.5126953125, -69.2109375, -65.9091796875, -62.607421875, -59.3056640625, -56.00390625, -52.7021484375, -49.400390625, -46.0986328125, -42.796875, -39.4951171875, -36.193359375, -32.8916015625, -29.58984375, -26.2880859375, -22.986328125, -19.6845703125, -16.3828125, -13.0810546875, -9.779296875, -6.4775390625, -3.17578125, 0.1259765625, 3.427734375, 6.7294921875, 10.03125, 13.3330078125, 16.634765625, 19.9365234375, 23.23828125, 26.5400390625, 29.841796875, 33.1435546875, 36.4453125, 39.7470703125, 43.048828125, 46.3505859375, 49.65234375, 52.9541015625, 56.255859375, 59.5576171875, 62.859375, 66.1611328125, 69.462890625, 72.7646484375, 76.06640625, 79.3681640625, 82.669921875, 85.9716796875, 89.2734375, 92.5751953125, 95.876953125, 99.1787109375, 102.48046875, 105.7822265625, 109.083984375, 112.3857421875, 115.6875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 57.0, 283.0, 473.0, 155.0, 32.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.85395812988281, -62.91175079345703, -60.969547271728516, -59.027339935302734, -57.08513259887695, -55.14292907714844, -53.200721740722656, -51.258514404296875, -49.316307067871094, -47.37409973144531, -45.4318962097168, -43.489688873291016, -41.547481536865234, -39.60527801513672, -37.66307067871094, -35.720863342285156, -33.77865982055664, -31.836454391479492, -29.89424705505371, -27.952041625976562, -26.00983428955078, -24.067628860473633, -22.125423431396484, -20.183216094970703, -18.241010665893555, -16.298805236816406, -14.356597900390625, -12.414392471313477, -10.472186088562012, -8.529979705810547, -6.587774276733398, -4.645567893981934, -2.703357696533203, -0.7611515522003174, 1.1810545921325684, 3.123260498046875, 5.06546688079834, 7.007673263549805, 8.949878692626953, 10.892085075378418, 12.834291458129883, 14.776497840881348, 16.718704223632812, 18.66090965270996, 20.60311508178711, 22.54532241821289, 24.48752784729004, 26.429733276367188, 28.37194061279297, 30.314146041870117, 32.256351470947266, 34.19855880737305, 36.14076614379883, 38.082969665527344, 40.025177001953125, 41.967384338378906, 43.90959167480469, 45.85179901123047, 47.794002532958984, 49.736209869384766, 51.67841720581055, 53.62062072753906, 55.562828063964844, 57.505035400390625, 59.44723892211914]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 4.0, 12.0, 8.0, 5.0, 15.0, 14.0, 15.0, 17.0, 23.0, 25.0, 20.0, 35.0, 37.0, 38.0, 37.0, 31.0, 37.0, 38.0, 48.0, 41.0, 40.0, 45.0, 38.0, 41.0, 51.0, 40.0, 23.0, 23.0, 24.0, 22.0, 31.0, 20.0, 25.0, 10.0, 8.0, 12.0, 14.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.744325637817383, -28.76934242248535, -27.794361114501953, -26.819377899169922, -25.84439468383789, -24.869413375854492, -23.89443016052246, -22.919448852539062, -21.94446563720703, -20.969482421875, -19.9945011138916, -19.01951789855957, -18.044536590576172, -17.06955337524414, -16.09457015991211, -15.119587898254395, -14.14460563659668, -13.169623374938965, -12.19464111328125, -11.219657897949219, -10.244675636291504, -9.269693374633789, -8.294710159301758, -7.319727897644043, -6.344745635986328, -5.369763374328613, -4.39478063583374, -3.4197981357574463, -2.4448156356811523, -1.4698333740234375, -0.49485063552856445, 0.4801321029663086, 1.4551162719726562, 2.43009877204895, 3.405081272125244, 4.380064010620117, 5.355046272277832, 6.330028533935547, 7.30501127243042, 8.279994010925293, 9.254976272583008, 10.229958534240723, 11.204940795898438, 12.179924011230469, 13.154906272888184, 14.129888534545898, 15.10487174987793, 16.079853057861328, 17.05483627319336, 18.02981948852539, 19.00480079650879, 19.97978401184082, 20.95476531982422, 21.92974853515625, 22.90473175048828, 23.879714965820312, 24.85469627380371, 25.829679489135742, 26.80466079711914, 27.779644012451172, 28.754627227783203, 29.7296085357666, 30.704591751098633, 31.67957305908203, 32.65455627441406]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 6.0, 6.0, 4.0, 6.0, 11.0, 12.0, 13.0, 17.0, 14.0, 19.0, 39.0, 24.0, 27.0, 31.0, 22.0, 46.0, 45.0, 42.0, 49.0, 45.0, 52.0, 49.0, 36.0, 33.0, 41.0, 34.0, 34.0, 27.0, 20.0, 26.0, 25.0, 18.0, 20.0, 19.0, 13.0, 16.0, 16.0, 6.0, 8.0, 8.0, 4.0, 8.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.24755859375, -4.1044921875, -3.96142578125, -3.818359375, -3.67529296875, -3.5322265625, -3.38916015625, -3.24609375, -3.10302734375, -2.9599609375, -2.81689453125, -2.673828125, -2.53076171875, -2.3876953125, -2.24462890625, -2.1015625, -1.95849609375, -1.8154296875, -1.67236328125, -1.529296875, -1.38623046875, -1.2431640625, -1.10009765625, -0.95703125, -0.81396484375, -0.6708984375, -0.52783203125, -0.384765625, -0.24169921875, -0.0986328125, 0.04443359375, 0.1875, 0.33056640625, 0.4736328125, 0.61669921875, 0.759765625, 0.90283203125, 1.0458984375, 1.18896484375, 1.33203125, 1.47509765625, 1.6181640625, 1.76123046875, 1.904296875, 2.04736328125, 2.1904296875, 2.33349609375, 2.4765625, 2.61962890625, 2.7626953125, 2.90576171875, 3.048828125, 3.19189453125, 3.3349609375, 3.47802734375, 3.62109375, 3.76416015625, 3.9072265625, 4.05029296875, 4.193359375, 4.33642578125, 4.4794921875, 4.62255859375, 4.765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 11.0, 12.0, 21.0, 30.0, 38.0, 32.0, 53.0, 66.0, 74.0, 102.0, 119.0, 182.0, 253.0, 381.0, 704.0, 1891.0, 9696.0, 113570.0, 1128531.0, 2375736.0, 515372.0, 39855.0, 4585.0, 1121.0, 559.0, 320.0, 211.0, 184.0, 122.0, 94.0, 71.0, 48.0, 49.0, 45.0, 32.0, 23.0, 16.0, 16.0, 9.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.63671875, -7.37615966796875, -7.1156005859375, -6.85504150390625, -6.594482421875, -6.33392333984375, -6.0733642578125, -5.81280517578125, -5.55224609375, -5.29168701171875, -5.0311279296875, -4.77056884765625, -4.510009765625, -4.24945068359375, -3.9888916015625, -3.72833251953125, -3.4677734375, -3.20721435546875, -2.9466552734375, -2.68609619140625, -2.425537109375, -2.16497802734375, -1.9044189453125, -1.64385986328125, -1.38330078125, -1.12274169921875, -0.8621826171875, -0.60162353515625, -0.341064453125, -0.08050537109375, 0.1800537109375, 0.44061279296875, 0.701171875, 0.96173095703125, 1.2222900390625, 1.48284912109375, 1.743408203125, 2.00396728515625, 2.2645263671875, 2.52508544921875, 2.78564453125, 3.04620361328125, 3.3067626953125, 3.56732177734375, 3.827880859375, 4.08843994140625, 4.3489990234375, 4.60955810546875, 4.8701171875, 5.13067626953125, 5.3912353515625, 5.65179443359375, 5.912353515625, 6.17291259765625, 6.4334716796875, 6.69403076171875, 6.95458984375, 7.21514892578125, 7.4757080078125, 7.73626708984375, 7.996826171875, 8.25738525390625, 8.5179443359375, 8.77850341796875, 9.0390625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 6.0, 19.0, 21.0, 26.0, 41.0, 49.0, 99.0, 107.0, 166.0, 224.0, 327.0, 407.0, 457.0, 444.0, 406.0, 332.0, 236.0, 197.0, 122.0, 96.0, 76.0, 61.0, 34.0, 31.0, 20.0, 17.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53515625, -5.33050537109375, -5.1258544921875, -4.92120361328125, -4.716552734375, -4.51190185546875, -4.3072509765625, -4.10260009765625, -3.89794921875, -3.69329833984375, -3.4886474609375, -3.28399658203125, -3.079345703125, -2.87469482421875, -2.6700439453125, -2.46539306640625, -2.2607421875, -2.05609130859375, -1.8514404296875, -1.64678955078125, -1.442138671875, -1.23748779296875, -1.0328369140625, -0.82818603515625, -0.62353515625, -0.41888427734375, -0.2142333984375, -0.00958251953125, 0.195068359375, 0.39971923828125, 0.6043701171875, 0.80902099609375, 1.013671875, 1.21832275390625, 1.4229736328125, 1.62762451171875, 1.832275390625, 2.03692626953125, 2.2415771484375, 2.44622802734375, 2.65087890625, 2.85552978515625, 3.0601806640625, 3.26483154296875, 3.469482421875, 3.67413330078125, 3.8787841796875, 4.08343505859375, 4.2880859375, 4.49273681640625, 4.6973876953125, 4.90203857421875, 5.106689453125, 5.31134033203125, 5.5159912109375, 5.72064208984375, 5.92529296875, 6.12994384765625, 6.3345947265625, 6.53924560546875, 6.743896484375, 6.94854736328125, 7.1531982421875, 7.35784912109375, 7.5625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 8.0, 18.0, 11.0, 22.0, 28.0, 37.0, 46.0, 62.0, 60.0, 87.0, 141.0, 180.0, 284.0, 431.0, 739.0, 1584.0, 6721.0, 88911.0, 3037941.0, 1020543.0, 29854.0, 3638.0, 1121.0, 569.0, 373.0, 240.0, 148.0, 125.0, 73.0, 61.0, 54.0, 41.0, 27.0, 29.0, 14.0, 14.0, 9.0, 4.0, 4.0, 3.0, 8.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6484375, -15.1566162109375, -14.664794921875, -14.1729736328125, -13.68115234375, -13.1893310546875, -12.697509765625, -12.2056884765625, -11.7138671875, -11.2220458984375, -10.730224609375, -10.2384033203125, -9.74658203125, -9.2547607421875, -8.762939453125, -8.2711181640625, -7.779296875, -7.2874755859375, -6.795654296875, -6.3038330078125, -5.81201171875, -5.3201904296875, -4.828369140625, -4.3365478515625, -3.8447265625, -3.3529052734375, -2.861083984375, -2.3692626953125, -1.87744140625, -1.3856201171875, -0.893798828125, -0.4019775390625, 0.08984375, 0.5816650390625, 1.073486328125, 1.5653076171875, 2.05712890625, 2.5489501953125, 3.040771484375, 3.5325927734375, 4.0244140625, 4.5162353515625, 5.008056640625, 5.4998779296875, 5.99169921875, 6.4835205078125, 6.975341796875, 7.4671630859375, 7.958984375, 8.4508056640625, 8.942626953125, 9.4344482421875, 9.92626953125, 10.4180908203125, 10.909912109375, 11.4017333984375, 11.8935546875, 12.3853759765625, 12.877197265625, 13.3690185546875, 13.86083984375, 14.3526611328125, 14.844482421875, 15.3363037109375, 15.828125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 56.0, 401.0, 436.0, 111.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4868392944336, -84.95323181152344, -81.41963195800781, -77.88602447509766, -74.35242462158203, -70.81881713867188, -67.28521728515625, -63.751609802246094, -60.2180061340332, -56.68440246582031, -53.15079879760742, -49.61719512939453, -46.083587646484375, -42.54998779296875, -39.016380310058594, -35.4827766418457, -31.949172973632812, -28.415569305419922, -24.88196563720703, -21.348360061645508, -17.814756393432617, -14.281152725219727, -10.747547149658203, -7.2139434814453125, -3.680339813232422, -0.14673566818237305, 3.386868476867676, 6.920473098754883, 10.454076766967773, 13.987680435180664, 17.521286010742188, 21.054889678955078, 24.5885009765625, 28.12210464477539, 31.65570831298828, 35.18931579589844, 38.72291564941406, 42.25652313232422, 45.79012680053711, 49.32373046875, 52.85733413696289, 56.39093780517578, 59.92454147338867, 63.45814514160156, 66.99175262451172, 70.52535247802734, 74.0589599609375, 77.59255981445312, 81.12616729736328, 84.65977478027344, 88.19337463378906, 91.72698211669922, 95.26058197021484, 98.794189453125, 102.32778930664062, 105.86139678955078, 109.39500427246094, 112.9286117553711, 116.46221160888672, 119.99581909179688, 123.5294189453125, 127.06302642822266, 130.5966339111328, 134.13023376464844, 137.66383361816406]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 12.0, 7.0, 4.0, 8.0, 13.0, 10.0, 12.0, 14.0, 23.0, 16.0, 26.0, 24.0, 21.0, 20.0, 29.0, 33.0, 40.0, 34.0, 45.0, 37.0, 36.0, 42.0, 33.0, 42.0, 37.0, 38.0, 41.0, 36.0, 32.0, 34.0, 39.0, 19.0, 28.0, 10.0, 14.0, 22.0, 13.0, 10.0, 9.0, 7.0, 3.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.181427001953125, -20.560644149780273, -19.93985939025879, -19.319076538085938, -18.698291778564453, -18.0775089263916, -17.456724166870117, -16.835941314697266, -16.21515655517578, -15.594372749328613, -14.973588943481445, -14.352805137634277, -13.73202133178711, -13.111237525939941, -12.490453720092773, -11.869670867919922, -11.248887062072754, -10.628103256225586, -10.007319450378418, -9.38653564453125, -8.765751838684082, -8.144968032836914, -7.524184703826904, -6.903400897979736, -6.282617092132568, -5.6618332862854, -5.041049480438232, -4.420266151428223, -3.7994821071624756, -3.1786983013153076, -2.5579147338867188, -1.9371309280395508, -1.3163471221923828, -0.6955633759498596, -0.07477962970733643, 0.546004056930542, 1.16678786277771, 1.787571668624878, 2.408355236053467, 3.0291390419006348, 3.6499228477478027, 4.270706653594971, 4.891490459442139, 5.512273788452148, 6.133057594299316, 6.753841400146484, 7.374625205993652, 7.99540901184082, 8.616192817687988, 9.236976623535156, 9.857760429382324, 10.478544235229492, 11.09932804107666, 11.720111846923828, 12.34089469909668, 12.961679458618164, 13.582462310791016, 14.203246116638184, 14.824029922485352, 15.44481372833252, 16.065597534179688, 16.68638038635254, 17.307165145874023, 17.927947998046875, 18.54873275756836]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 10.0, 12.0, 13.0, 12.0, 14.0, 18.0, 15.0, 20.0, 22.0, 28.0, 25.0, 25.0, 31.0, 40.0, 41.0, 39.0, 44.0, 43.0, 46.0, 51.0, 50.0, 31.0, 38.0, 29.0, 40.0, 23.0, 31.0, 20.0, 19.0, 22.0, 22.0, 12.0, 16.0, 13.0, 6.0, 12.0, 10.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.998046875, -3.866058349609375, -3.73406982421875, -3.602081298828125, -3.4700927734375, -3.338104248046875, -3.20611572265625, -3.074127197265625, -2.942138671875, -2.810150146484375, -2.67816162109375, -2.546173095703125, -2.4141845703125, -2.282196044921875, -2.15020751953125, -2.018218994140625, -1.88623046875, -1.754241943359375, -1.62225341796875, -1.490264892578125, -1.3582763671875, -1.226287841796875, -1.09429931640625, -0.962310791015625, -0.830322265625, -0.698333740234375, -0.56634521484375, -0.434356689453125, -0.3023681640625, -0.170379638671875, -0.03839111328125, 0.093597412109375, 0.2255859375, 0.357574462890625, 0.48956298828125, 0.621551513671875, 0.7535400390625, 0.885528564453125, 1.01751708984375, 1.149505615234375, 1.281494140625, 1.413482666015625, 1.54547119140625, 1.677459716796875, 1.8094482421875, 1.941436767578125, 2.07342529296875, 2.205413818359375, 2.33740234375, 2.469390869140625, 2.60137939453125, 2.733367919921875, 2.8653564453125, 2.997344970703125, 3.12933349609375, 3.261322021484375, 3.393310546875, 3.525299072265625, 3.65728759765625, 3.789276123046875, 3.9212646484375, 4.053253173828125, 4.18524169921875, 4.317230224609375, 4.44921875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 10.0, 15.0, 10.0, 18.0, 28.0, 62.0, 65.0, 95.0, 116.0, 193.0, 272.0, 386.0, 555.0, 808.0, 1175.0, 1706.0, 2307.0, 3343.0, 4906.0, 6985.0, 10183.0, 14410.0, 21493.0, 32622.0, 51399.0, 88973.0, 173683.0, 273284.0, 144206.0, 77320.0, 45575.0, 29187.0, 19608.0, 13146.0, 9155.0, 6410.0, 4516.0, 3137.0, 2180.0, 1536.0, 1033.0, 763.0, 527.0, 369.0, 263.0, 153.0, 120.0, 75.0, 64.0, 36.0, 27.0, 17.0, 13.0, 7.0, 6.0, 7.0, 2.0], "bins": [-0.7099609375, -0.6893081665039062, -0.6686553955078125, -0.6480026245117188, -0.627349853515625, -0.6066970825195312, -0.5860443115234375, -0.5653915405273438, -0.54473876953125, -0.5240859985351562, -0.5034332275390625, -0.48278045654296875, -0.462127685546875, -0.44147491455078125, -0.4208221435546875, -0.40016937255859375, -0.3795166015625, -0.35886383056640625, -0.3382110595703125, -0.31755828857421875, -0.296905517578125, -0.27625274658203125, -0.2555999755859375, -0.23494720458984375, -0.21429443359375, -0.19364166259765625, -0.1729888916015625, -0.15233612060546875, -0.131683349609375, -0.11103057861328125, -0.0903778076171875, -0.06972503662109375, -0.049072265625, -0.02841949462890625, -0.0077667236328125, 0.01288604736328125, 0.033538818359375, 0.05419158935546875, 0.0748443603515625, 0.09549713134765625, 0.11614990234375, 0.13680267333984375, 0.1574554443359375, 0.17810821533203125, 0.198760986328125, 0.21941375732421875, 0.2400665283203125, 0.26071929931640625, 0.2813720703125, 0.30202484130859375, 0.3226776123046875, 0.34333038330078125, 0.363983154296875, 0.38463592529296875, 0.4052886962890625, 0.42594146728515625, 0.44659423828125, 0.46724700927734375, 0.4878997802734375, 0.5085525512695312, 0.529205322265625, 0.5498580932617188, 0.5705108642578125, 0.5911636352539062, 0.61181640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 6.0, 10.0, 7.0, 13.0, 15.0, 15.0, 16.0, 15.0, 21.0, 36.0, 24.0, 27.0, 32.0, 21.0, 28.0, 29.0, 39.0, 39.0, 43.0, 1066.0, 48.0, 41.0, 40.0, 35.0, 33.0, 37.0, 40.0, 24.0, 34.0, 24.0, 26.0, 17.0, 15.0, 15.0, 17.0, 10.0, 13.0, 7.0, 5.0, 8.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.65234375, -2.57147216796875, -2.4906005859375, -2.40972900390625, -2.328857421875, -2.24798583984375, -2.1671142578125, -2.08624267578125, -2.00537109375, -1.92449951171875, -1.8436279296875, -1.76275634765625, -1.681884765625, -1.60101318359375, -1.5201416015625, -1.43927001953125, -1.3583984375, -1.27752685546875, -1.1966552734375, -1.11578369140625, -1.034912109375, -0.95404052734375, -0.8731689453125, -0.79229736328125, -0.71142578125, -0.63055419921875, -0.5496826171875, -0.46881103515625, -0.387939453125, -0.30706787109375, -0.2261962890625, -0.14532470703125, -0.064453125, 0.01641845703125, 0.0972900390625, 0.17816162109375, 0.259033203125, 0.33990478515625, 0.4207763671875, 0.50164794921875, 0.58251953125, 0.66339111328125, 0.7442626953125, 0.82513427734375, 0.906005859375, 0.98687744140625, 1.0677490234375, 1.14862060546875, 1.2294921875, 1.31036376953125, 1.3912353515625, 1.47210693359375, 1.552978515625, 1.63385009765625, 1.7147216796875, 1.79559326171875, 1.87646484375, 1.95733642578125, 2.0382080078125, 2.11907958984375, 2.199951171875, 2.28082275390625, 2.3616943359375, 2.44256591796875, 2.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 5.0, 5.0, 11.0, 24.0, 33.0, 48.0, 70.0, 95.0, 155.0, 196.0, 304.0, 406.0, 589.0, 830.0, 1164.0, 1562.0, 2259.0, 3053.0, 4276.0, 5930.0, 8246.0, 11620.0, 16549.0, 23908.0, 34651.0, 51949.0, 83824.0, 156674.0, 1299881.0, 147336.0, 79667.0, 50167.0, 33188.0, 22601.0, 15993.0, 11285.0, 8066.0, 5751.0, 4084.0, 3018.0, 2191.0, 1529.0, 1165.0, 782.0, 565.0, 440.0, 301.0, 202.0, 161.0, 114.0, 77.0, 41.0, 27.0, 28.0, 17.0, 9.0, 10.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.54638671875, -0.5290145874023438, -0.5116424560546875, -0.49427032470703125, -0.476898193359375, -0.45952606201171875, -0.4421539306640625, -0.42478179931640625, -0.40740966796875, -0.39003753662109375, -0.3726654052734375, -0.35529327392578125, -0.337921142578125, -0.32054901123046875, -0.3031768798828125, -0.28580474853515625, -0.2684326171875, -0.25106048583984375, -0.2336883544921875, -0.21631622314453125, -0.198944091796875, -0.18157196044921875, -0.1641998291015625, -0.14682769775390625, -0.12945556640625, -0.11208343505859375, -0.0947113037109375, -0.07733917236328125, -0.059967041015625, -0.04259490966796875, -0.0252227783203125, -0.00785064697265625, 0.009521484375, 0.02689361572265625, 0.0442657470703125, 0.06163787841796875, 0.079010009765625, 0.09638214111328125, 0.1137542724609375, 0.13112640380859375, 0.14849853515625, 0.16587066650390625, 0.1832427978515625, 0.20061492919921875, 0.217987060546875, 0.23535919189453125, 0.2527313232421875, 0.27010345458984375, 0.2874755859375, 0.30484771728515625, 0.3222198486328125, 0.33959197998046875, 0.356964111328125, 0.37433624267578125, 0.3917083740234375, 0.40908050537109375, 0.42645263671875, 0.44382476806640625, 0.4611968994140625, 0.47856903076171875, 0.495941162109375, 0.5133132934570312, 0.5306854248046875, 0.5480575561523438, 0.5654296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 6.0, 9.0, 11.0, 16.0, 6.0, 18.0, 12.0, 31.0, 28.0, 35.0, 32.0, 46.0, 63.0, 47.0, 61.0, 85.0, 79.0, 64.0, 72.0, 41.0, 44.0, 37.0, 33.0, 22.0, 12.0, 20.0, 17.0, 9.0, 8.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020456314086914062, -0.00019867345690727234, -0.00019278377294540405, -0.00018689408898353577, -0.00018100440502166748, -0.0001751147210597992, -0.0001692250370979309, -0.00016333535313606262, -0.00015744566917419434, -0.00015155598521232605, -0.00014566630125045776, -0.00013977661728858948, -0.0001338869333267212, -0.0001279972493648529, -0.00012210756540298462, -0.00011621788144111633, -0.00011032819747924805, -0.00010443851351737976, -9.854882955551147e-05, -9.265914559364319e-05, -8.67694616317749e-05, -8.087977766990662e-05, -7.499009370803833e-05, -6.910040974617004e-05, -6.321072578430176e-05, -5.732104182243347e-05, -5.1431357860565186e-05, -4.55416738986969e-05, -3.965198993682861e-05, -3.376230597496033e-05, -2.787262201309204e-05, -2.1982938051223755e-05, -1.609325408935547e-05, -1.0203570127487183e-05, -4.3138861656188965e-06, 1.5757977962493896e-06, 7.465481758117676e-06, 1.3355165719985962e-05, 1.9244849681854248e-05, 2.5134533643722534e-05, 3.102421760559082e-05, 3.6913901567459106e-05, 4.280358552932739e-05, 4.869326949119568e-05, 5.4582953453063965e-05, 6.047263741493225e-05, 6.636232137680054e-05, 7.225200533866882e-05, 7.814168930053711e-05, 8.40313732624054e-05, 8.992105722427368e-05, 9.581074118614197e-05, 0.00010170042514801025, 0.00010759010910987854, 0.00011347979307174683, 0.00011936947703361511, 0.0001252591609954834, 0.00013114884495735168, 0.00013703852891921997, 0.00014292821288108826, 0.00014881789684295654, 0.00015470758080482483, 0.00016059726476669312, 0.0001664869487285614, 0.0001723766326904297]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 8.0, 11.0, 12.0, 21.0, 33.0, 34.0, 34.0, 44.0, 76.0, 102.0, 128.0, 169.0, 326.0, 570.0, 1350.0, 642215.0, 400605.0, 1194.0, 552.0, 284.0, 192.0, 134.0, 104.0, 79.0, 48.0, 33.0, 40.0, 25.0, 22.0, 13.0, 17.0, 15.0, 11.0, 12.0, 6.0, 9.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032215118408203125, -0.0031140148639678955, -0.0030065178871154785, -0.0028990209102630615, -0.0027915239334106445, -0.0026840269565582275, -0.0025765299797058105, -0.0024690330028533936, -0.0023615360260009766, -0.0022540390491485596, -0.0021465420722961426, -0.0020390450954437256, -0.0019315481185913086, -0.0018240511417388916, -0.0017165541648864746, -0.0016090571880340576, -0.0015015602111816406, -0.0013940632343292236, -0.0012865662574768066, -0.0011790692806243896, -0.0010715723037719727, -0.0009640753269195557, -0.0008565783500671387, -0.0007490813732147217, -0.0006415843963623047, -0.0005340874195098877, -0.0004265904426574707, -0.0003190934658050537, -0.00021159648895263672, -0.00010409951210021973, 3.3974647521972656e-06, 0.00011089444160461426, 0.00021839141845703125, 0.00032588839530944824, 0.00043338537216186523, 0.0005408823490142822, 0.0006483793258666992, 0.0007558763027191162, 0.0008633732795715332, 0.0009708702564239502, 0.0010783672332763672, 0.0011858642101287842, 0.0012933611869812012, 0.0014008581638336182, 0.0015083551406860352, 0.0016158521175384521, 0.0017233490943908691, 0.0018308460712432861, 0.0019383430480957031, 0.00204584002494812, 0.002153337001800537, 0.002260833978652954, 0.002368330955505371, 0.002475827932357788, 0.002583324909210205, 0.002690821886062622, 0.002798318862915039, 0.002905815839767456, 0.003013312816619873, 0.00312080979347229, 0.003228306770324707, 0.003335803747177124, 0.003443300724029541, 0.003550797700881958, 0.003658294677734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 14.0, 402.0, 562.0, 32.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0011356903705745935, -0.0011161316651850939, -0.0010965729597955942, -0.0010770141379907727, -0.001057455432601273, -0.0010378967272117734, -0.0010183380218222737, -0.0009987792000174522, -0.0009792204946279526, -0.0009596617892384529, -0.0009401030256412923, -0.0009205443202517927, -0.0009009855566546321, -0.0008814268512651324, -0.0008618680876679718, -0.0008423093822784722, -0.0008227506186813116, -0.0008031919132918119, -0.0007836331496946514, -0.0007640744443051517, -0.0007445156807079911, -0.0007249569753184915, -0.0007053982117213309, -0.0006858395063318312, -0.0006662808009423316, -0.0006467220955528319, -0.0006271633319556713, -0.0006076046265661716, -0.0005880458629690111, -0.0005684871575795114, -0.0005489283939823508, -0.0005293696885928512, -0.0005098109249956906, -0.0004902522196061909, -0.00047069345600903034, -0.0004511347215157002, -0.0004315759870223701, -0.00041201725252904, -0.00039245851803570986, -0.0003728998126462102, -0.00035334107815288007, -0.00033378234365954995, -0.00031422360916621983, -0.0002946648746728897, -0.0002751061401795596, -0.00025554740568622947, -0.00023598868574481457, -0.00021642995125148445, -0.00019687121675815433, -0.0001773124822648242, -0.0001577537477714941, -0.0001381950278300792, -0.00011863628606079146, -9.907755156746134e-05, -7.951882435008883e-05, -5.9960089856758714e-05, -4.040135536342859e-05, -2.0842622689087875e-05, -1.2838900147471577e-06, 1.8274840840604156e-05, 3.783357533393428e-05, 5.73923098272644e-05, 7.69510370446369e-05, 9.650977153796703e-05, 0.00011606850603129715]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 2.0, 10.0, 8.0, 14.0, 14.0, 10.0, 14.0, 24.0, 17.0, 29.0, 14.0, 39.0, 35.0, 27.0, 28.0, 32.0, 44.0, 44.0, 37.0, 31.0, 34.0, 39.0, 43.0, 28.0, 41.0, 26.0, 41.0, 23.0, 38.0, 28.0, 16.0, 21.0, 21.0, 24.0, 14.0, 19.0, 11.0, 10.0, 12.0, 11.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.445978164672852e-05, -8.176174014806747e-05, -7.906369864940643e-05, -7.636565715074539e-05, -7.366761565208435e-05, -7.096957415342331e-05, -6.827153265476227e-05, -6.557349115610123e-05, -6.287544965744019e-05, -6.0177408158779144e-05, -5.74793666601181e-05, -5.478132516145706e-05, -5.208328366279602e-05, -4.938524216413498e-05, -4.668720066547394e-05, -4.39891591668129e-05, -4.1291117668151855e-05, -3.8593076169490814e-05, -3.589503467082977e-05, -3.319699317216873e-05, -3.049895167350769e-05, -2.780091017484665e-05, -2.5102868676185608e-05, -2.2404827177524567e-05, -1.9706785678863525e-05, -1.7008744180202484e-05, -1.4310702681541443e-05, -1.1612661182880402e-05, -8.91461968421936e-06, -6.216578185558319e-06, -3.518536686897278e-06, -8.204951882362366e-07, 1.8775463104248047e-06, 4.575587809085846e-06, 7.273629307746887e-06, 9.971670806407928e-06, 1.266971230506897e-05, 1.536775380373001e-05, 1.8065795302391052e-05, 2.0763836801052094e-05, 2.3461878299713135e-05, 2.6159919798374176e-05, 2.8857961297035217e-05, 3.155600279569626e-05, 3.42540442943573e-05, 3.695208579301834e-05, 3.965012729167938e-05, 4.2348168790340424e-05, 4.5046210289001465e-05, 4.7744251787662506e-05, 5.044229328632355e-05, 5.314033478498459e-05, 5.583837628364563e-05, 5.853641778230667e-05, 6.123445928096771e-05, 6.393250077962875e-05, 6.66305422782898e-05, 6.932858377695084e-05, 7.202662527561188e-05, 7.472466677427292e-05, 7.742270827293396e-05, 8.0120749771595e-05, 8.281879127025604e-05, 8.551683276891708e-05, 8.821487426757812e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 10.0, 12.0, 13.0, 12.0, 14.0, 18.0, 15.0, 20.0, 22.0, 28.0, 25.0, 25.0, 31.0, 40.0, 41.0, 39.0, 44.0, 43.0, 46.0, 51.0, 50.0, 31.0, 38.0, 29.0, 40.0, 23.0, 31.0, 20.0, 19.0, 22.0, 22.0, 12.0, 16.0, 13.0, 6.0, 12.0, 10.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.998046875, -3.866058349609375, -3.73406982421875, -3.602081298828125, -3.4700927734375, -3.338104248046875, -3.20611572265625, -3.074127197265625, -2.942138671875, -2.810150146484375, -2.67816162109375, -2.546173095703125, -2.4141845703125, -2.282196044921875, -2.15020751953125, -2.018218994140625, -1.88623046875, -1.754241943359375, -1.62225341796875, -1.490264892578125, -1.3582763671875, -1.226287841796875, -1.09429931640625, -0.962310791015625, -0.830322265625, -0.698333740234375, -0.56634521484375, -0.434356689453125, -0.3023681640625, -0.170379638671875, -0.03839111328125, 0.093597412109375, 0.2255859375, 0.357574462890625, 0.48956298828125, 0.621551513671875, 0.7535400390625, 0.885528564453125, 1.01751708984375, 1.149505615234375, 1.281494140625, 1.413482666015625, 1.54547119140625, 1.677459716796875, 1.8094482421875, 1.941436767578125, 2.07342529296875, 2.205413818359375, 2.33740234375, 2.469390869140625, 2.60137939453125, 2.733367919921875, 2.8653564453125, 2.997344970703125, 3.12933349609375, 3.261322021484375, 3.393310546875, 3.525299072265625, 3.65728759765625, 3.789276123046875, 3.9212646484375, 4.053253173828125, 4.18524169921875, 4.317230224609375, 4.44921875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 6.0, 16.0, 16.0, 27.0, 38.0, 42.0, 46.0, 73.0, 88.0, 119.0, 166.0, 261.0, 383.0, 617.0, 1319.0, 2698.0, 6302.0, 15533.0, 39812.0, 104766.0, 293639.0, 360212.0, 136816.0, 50866.0, 19676.0, 7780.0, 3447.0, 1536.0, 803.0, 467.0, 256.0, 189.0, 137.0, 102.0, 74.0, 46.0, 39.0, 37.0, 29.0, 18.0, 13.0, 7.0, 10.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.171875, -5.0057373046875, -4.839599609375, -4.6734619140625, -4.50732421875, -4.3411865234375, -4.175048828125, -4.0089111328125, -3.8427734375, -3.6766357421875, -3.510498046875, -3.3443603515625, -3.17822265625, -3.0120849609375, -2.845947265625, -2.6798095703125, -2.513671875, -2.3475341796875, -2.181396484375, -2.0152587890625, -1.84912109375, -1.6829833984375, -1.516845703125, -1.3507080078125, -1.1845703125, -1.0184326171875, -0.852294921875, -0.6861572265625, -0.52001953125, -0.3538818359375, -0.187744140625, -0.0216064453125, 0.14453125, 0.3106689453125, 0.476806640625, 0.6429443359375, 0.80908203125, 0.9752197265625, 1.141357421875, 1.3074951171875, 1.4736328125, 1.6397705078125, 1.805908203125, 1.9720458984375, 2.13818359375, 2.3043212890625, 2.470458984375, 2.6365966796875, 2.802734375, 2.9688720703125, 3.135009765625, 3.3011474609375, 3.46728515625, 3.6334228515625, 3.799560546875, 3.9656982421875, 4.1318359375, 4.2979736328125, 4.464111328125, 4.6302490234375, 4.79638671875, 4.9625244140625, 5.128662109375, 5.2947998046875, 5.4609375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 12.0, 8.0, 17.0, 15.0, 34.0, 23.0, 25.0, 34.0, 28.0, 33.0, 54.0, 59.0, 64.0, 91.0, 244.0, 1514.0, 264.0, 127.0, 73.0, 56.0, 42.0, 31.0, 36.0, 42.0, 25.0, 16.0, 23.0, 11.0, 8.0, 7.0, 4.0, 9.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.6475830078125, -11.193603515625, -10.7396240234375, -10.28564453125, -9.8316650390625, -9.377685546875, -8.9237060546875, -8.4697265625, -8.0157470703125, -7.561767578125, -7.1077880859375, -6.65380859375, -6.1998291015625, -5.745849609375, -5.2918701171875, -4.837890625, -4.3839111328125, -3.929931640625, -3.4759521484375, -3.02197265625, -2.5679931640625, -2.114013671875, -1.6600341796875, -1.2060546875, -0.7520751953125, -0.298095703125, 0.1558837890625, 0.60986328125, 1.0638427734375, 1.517822265625, 1.9718017578125, 2.42578125, 2.8797607421875, 3.333740234375, 3.7877197265625, 4.24169921875, 4.6956787109375, 5.149658203125, 5.6036376953125, 6.0576171875, 6.5115966796875, 6.965576171875, 7.4195556640625, 7.87353515625, 8.3275146484375, 8.781494140625, 9.2354736328125, 9.689453125, 10.1434326171875, 10.597412109375, 11.0513916015625, 11.50537109375, 11.9593505859375, 12.413330078125, 12.8673095703125, 13.3212890625, 13.7752685546875, 14.229248046875, 14.6832275390625, 15.13720703125, 15.5911865234375, 16.045166015625, 16.4991455078125, 16.953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 7.0, 14.0, 17.0, 21.0, 27.0, 34.0, 54.0, 92.0, 127.0, 217.0, 349.0, 636.0, 1489.0, 24383.0, 2959476.0, 153736.0, 2895.0, 881.0, 425.0, 275.0, 184.0, 119.0, 73.0, 43.0, 27.0, 23.0, 10.0, 12.0, 7.0, 12.0, 9.0, 2.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.265625, -28.39697265625, -27.5283203125, -26.65966796875, -25.791015625, -24.92236328125, -24.0537109375, -23.18505859375, -22.31640625, -21.44775390625, -20.5791015625, -19.71044921875, -18.841796875, -17.97314453125, -17.1044921875, -16.23583984375, -15.3671875, -14.49853515625, -13.6298828125, -12.76123046875, -11.892578125, -11.02392578125, -10.1552734375, -9.28662109375, -8.41796875, -7.54931640625, -6.6806640625, -5.81201171875, -4.943359375, -4.07470703125, -3.2060546875, -2.33740234375, -1.46875, -0.60009765625, 0.2685546875, 1.13720703125, 2.005859375, 2.87451171875, 3.7431640625, 4.61181640625, 5.48046875, 6.34912109375, 7.2177734375, 8.08642578125, 8.955078125, 9.82373046875, 10.6923828125, 11.56103515625, 12.4296875, 13.29833984375, 14.1669921875, 15.03564453125, 15.904296875, 16.77294921875, 17.6416015625, 18.51025390625, 19.37890625, 20.24755859375, 21.1162109375, 21.98486328125, 22.853515625, 23.72216796875, 24.5908203125, 25.45947265625, 26.328125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 22.0, 102.0, 259.0, 361.0, 198.0, 52.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.3653564453125, -27.031261444091797, -25.69716453552246, -24.363067626953125, -23.028972625732422, -21.69487762451172, -20.360780715942383, -19.026683807373047, -17.692588806152344, -16.35849380493164, -15.024396896362305, -13.690300941467285, -12.356204986572266, -11.022109031677246, -9.688013076782227, -8.353917121887207, -7.0198211669921875, -5.685725212097168, -4.351629257202148, -3.017533302307129, -1.6834373474121094, -0.34934139251708984, 0.9847545623779297, 2.318850517272949, 3.6529464721679688, 4.987042427062988, 6.321138381958008, 7.655234336853027, 8.989330291748047, 10.323426246643066, 11.657522201538086, 12.991618156433105, 14.32571029663086, 15.659806251525879, 16.9939022064209, 18.327999114990234, 19.662094116210938, 20.99618911743164, 22.330286026000977, 23.664382934570312, 24.998477935791016, 26.33257293701172, 27.666669845581055, 29.00076675415039, 30.334861755371094, 31.668956756591797, 33.0030517578125, 34.33715057373047, 35.67124557495117, 37.005340576171875, 38.339439392089844, 39.67353439331055, 41.00762939453125, 42.34172439575195, 43.675819396972656, 45.009918212890625, 46.34401321411133, 47.67810821533203, 49.01220703125, 50.3463020324707, 51.680397033691406, 53.01449203491211, 54.34858703613281, 55.68268585205078, 57.016780853271484]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 10.0, 10.0, 9.0, 13.0, 12.0, 19.0, 21.0, 25.0, 30.0, 26.0, 24.0, 25.0, 34.0, 34.0, 55.0, 29.0, 27.0, 44.0, 42.0, 41.0, 44.0, 44.0, 34.0, 32.0, 32.0, 23.0, 33.0, 28.0, 17.0, 22.0, 16.0, 17.0, 14.0, 17.0, 19.0, 12.0, 12.0, 6.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.375974655151367, -25.584087371826172, -24.79220199584961, -24.000316619873047, -23.20842933654785, -22.416542053222656, -21.624656677246094, -20.83277130126953, -20.040884017944336, -19.24899673461914, -18.457111358642578, -17.665225982666016, -16.87333869934082, -16.081451416015625, -15.289566040039062, -14.497679710388184, -13.705793380737305, -12.913907051086426, -12.122020721435547, -11.330134391784668, -10.538248062133789, -9.74636173248291, -8.954475402832031, -8.162589073181152, -7.370702743530273, -6.5788164138793945, -5.786930084228516, -4.995043754577637, -4.203157424926758, -3.411271095275879, -2.619384765625, -1.827498435974121, -1.035614013671875, -0.2437276840209961, 0.5481586456298828, 1.3400449752807617, 2.1319313049316406, 2.9238176345825195, 3.7157039642333984, 4.507590293884277, 5.299476623535156, 6.091362953186035, 6.883249282836914, 7.675135612487793, 8.467021942138672, 9.25890827178955, 10.05079460144043, 10.842680931091309, 11.634567260742188, 12.426453590393066, 13.218339920043945, 14.010226249694824, 14.802112579345703, 15.593998908996582, 16.38588523864746, 17.177772521972656, 17.96965789794922, 18.76154327392578, 19.553430557250977, 20.345317840576172, 21.137203216552734, 21.929088592529297, 22.720975875854492, 23.512863159179688, 24.30474853515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 17.0, 13.0, 19.0, 14.0, 17.0, 21.0, 18.0, 26.0, 23.0, 24.0, 39.0, 39.0, 46.0, 49.0, 40.0, 51.0, 47.0, 42.0, 41.0, 34.0, 34.0, 30.0, 34.0, 32.0, 27.0, 20.0, 23.0, 22.0, 17.0, 16.0, 17.0, 17.0, 4.0, 8.0, 11.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.873779296875, -3.73974609375, -3.605712890625, -3.4716796875, -3.337646484375, -3.20361328125, -3.069580078125, -2.935546875, -2.801513671875, -2.66748046875, -2.533447265625, -2.3994140625, -2.265380859375, -2.13134765625, -1.997314453125, -1.86328125, -1.729248046875, -1.59521484375, -1.461181640625, -1.3271484375, -1.193115234375, -1.05908203125, -0.925048828125, -0.791015625, -0.656982421875, -0.52294921875, -0.388916015625, -0.2548828125, -0.120849609375, 0.01318359375, 0.147216796875, 0.28125, 0.415283203125, 0.54931640625, 0.683349609375, 0.8173828125, 0.951416015625, 1.08544921875, 1.219482421875, 1.353515625, 1.487548828125, 1.62158203125, 1.755615234375, 1.8896484375, 2.023681640625, 2.15771484375, 2.291748046875, 2.42578125, 2.559814453125, 2.69384765625, 2.827880859375, 2.9619140625, 3.095947265625, 3.22998046875, 3.364013671875, 3.498046875, 3.632080078125, 3.76611328125, 3.900146484375, 4.0341796875, 4.168212890625, 4.30224609375, 4.436279296875, 4.5703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 6.0, 5.0, 8.0, 5.0, 10.0, 8.0, 14.0, 18.0, 26.0, 37.0, 40.0, 65.0, 114.0, 180.0, 349.0, 854.0, 3003.0, 23423.0, 317797.0, 2213932.0, 1476141.0, 143437.0, 11528.0, 1891.0, 614.0, 279.0, 135.0, 89.0, 65.0, 40.0, 22.0, 20.0, 29.0, 17.0, 19.0, 9.0, 7.0, 7.0, 4.0, 6.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.734375, -9.46282958984375, -9.1912841796875, -8.91973876953125, -8.648193359375, -8.37664794921875, -8.1051025390625, -7.83355712890625, -7.56201171875, -7.29046630859375, -7.0189208984375, -6.74737548828125, -6.475830078125, -6.20428466796875, -5.9327392578125, -5.66119384765625, -5.3896484375, -5.11810302734375, -4.8465576171875, -4.57501220703125, -4.303466796875, -4.03192138671875, -3.7603759765625, -3.48883056640625, -3.21728515625, -2.94573974609375, -2.6741943359375, -2.40264892578125, -2.131103515625, -1.85955810546875, -1.5880126953125, -1.31646728515625, -1.044921875, -0.77337646484375, -0.5018310546875, -0.23028564453125, 0.041259765625, 0.31280517578125, 0.5843505859375, 0.85589599609375, 1.12744140625, 1.39898681640625, 1.6705322265625, 1.94207763671875, 2.213623046875, 2.48516845703125, 2.7567138671875, 3.02825927734375, 3.2998046875, 3.57135009765625, 3.8428955078125, 4.11444091796875, 4.385986328125, 4.65753173828125, 4.9290771484375, 5.20062255859375, 5.47216796875, 5.74371337890625, 6.0152587890625, 6.28680419921875, 6.558349609375, 6.82989501953125, 7.1014404296875, 7.37298583984375, 7.64453125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 7.0, 5.0, 9.0, 12.0, 16.0, 26.0, 36.0, 58.0, 68.0, 89.0, 143.0, 193.0, 311.0, 387.0, 521.0, 501.0, 453.0, 372.0, 262.0, 187.0, 139.0, 79.0, 57.0, 44.0, 27.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.81640625, -7.6064453125, -7.396484375, -7.1865234375, -6.9765625, -6.7666015625, -6.556640625, -6.3466796875, -6.13671875, -5.9267578125, -5.716796875, -5.5068359375, -5.296875, -5.0869140625, -4.876953125, -4.6669921875, -4.45703125, -4.2470703125, -4.037109375, -3.8271484375, -3.6171875, -3.4072265625, -3.197265625, -2.9873046875, -2.77734375, -2.5673828125, -2.357421875, -2.1474609375, -1.9375, -1.7275390625, -1.517578125, -1.3076171875, -1.09765625, -0.8876953125, -0.677734375, -0.4677734375, -0.2578125, -0.0478515625, 0.162109375, 0.3720703125, 0.58203125, 0.7919921875, 1.001953125, 1.2119140625, 1.421875, 1.6318359375, 1.841796875, 2.0517578125, 2.26171875, 2.4716796875, 2.681640625, 2.8916015625, 3.1015625, 3.3115234375, 3.521484375, 3.7314453125, 3.94140625, 4.1513671875, 4.361328125, 4.5712890625, 4.78125, 4.9912109375, 5.201171875, 5.4111328125, 5.62109375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 15.0, 12.0, 15.0, 20.0, 19.0, 31.0, 52.0, 58.0, 86.0, 148.0, 272.0, 433.0, 831.0, 1994.0, 6699.0, 34452.0, 300883.0, 2794559.0, 952082.0, 82890.0, 12979.0, 3232.0, 1144.0, 512.0, 281.0, 171.0, 129.0, 75.0, 47.0, 33.0, 18.0, 19.0, 20.0, 19.0, 2.0, 14.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.6796875, -9.37451171875, -9.0693359375, -8.76416015625, -8.458984375, -8.15380859375, -7.8486328125, -7.54345703125, -7.23828125, -6.93310546875, -6.6279296875, -6.32275390625, -6.017578125, -5.71240234375, -5.4072265625, -5.10205078125, -4.796875, -4.49169921875, -4.1865234375, -3.88134765625, -3.576171875, -3.27099609375, -2.9658203125, -2.66064453125, -2.35546875, -2.05029296875, -1.7451171875, -1.43994140625, -1.134765625, -0.82958984375, -0.5244140625, -0.21923828125, 0.0859375, 0.39111328125, 0.6962890625, 1.00146484375, 1.306640625, 1.61181640625, 1.9169921875, 2.22216796875, 2.52734375, 2.83251953125, 3.1376953125, 3.44287109375, 3.748046875, 4.05322265625, 4.3583984375, 4.66357421875, 4.96875, 5.27392578125, 5.5791015625, 5.88427734375, 6.189453125, 6.49462890625, 6.7998046875, 7.10498046875, 7.41015625, 7.71533203125, 8.0205078125, 8.32568359375, 8.630859375, 8.93603515625, 9.2412109375, 9.54638671875, 9.8515625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 16.0, 49.0, 76.0, 154.0, 205.0, 198.0, 148.0, 95.0, 43.0, 13.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.798091888427734, -50.645545959472656, -49.49299621582031, -48.34044647216797, -47.18790054321289, -46.03535461425781, -44.88280487060547, -43.730255126953125, -42.57770919799805, -41.42516326904297, -40.272613525390625, -39.12006378173828, -37.9675178527832, -36.814971923828125, -35.66242218017578, -34.50987243652344, -33.35732650756836, -32.20478057861328, -31.052230834960938, -29.899682998657227, -28.747135162353516, -27.594587326049805, -26.442039489746094, -25.289491653442383, -24.136943817138672, -22.98439598083496, -21.83184814453125, -20.67930030822754, -19.526752471923828, -18.374204635620117, -17.221656799316406, -16.069108963012695, -14.916557312011719, -13.764009475708008, -12.611461639404297, -11.458913803100586, -10.306365966796875, -9.153818130493164, -8.001270294189453, -6.848722457885742, -5.696174621582031, -4.54362678527832, -3.3910789489746094, -2.2385311126708984, -1.0859832763671875, 0.06656455993652344, 1.2191123962402344, 2.3716602325439453, 3.5242080688476562, 4.676755905151367, 5.829303741455078, 6.981851577758789, 8.1343994140625, 9.286947250366211, 10.439495086669922, 11.592042922973633, 12.744590759277344, 13.897138595581055, 15.049686431884766, 16.202234268188477, 17.354782104492188, 18.5073299407959, 19.65987777709961, 20.81242561340332, 21.96497344970703]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 3.0, 9.0, 5.0, 10.0, 13.0, 13.0, 10.0, 16.0, 17.0, 22.0, 19.0, 21.0, 43.0, 26.0, 27.0, 35.0, 38.0, 30.0, 32.0, 41.0, 43.0, 31.0, 55.0, 45.0, 30.0, 36.0, 28.0, 32.0, 24.0, 29.0, 22.0, 27.0, 27.0, 20.0, 17.0, 20.0, 14.0, 11.0, 12.0, 13.0, 7.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.560039520263672, -16.944480895996094, -16.328920364379883, -15.713360786437988, -15.097801208496094, -14.4822416305542, -13.866682052612305, -13.25112247467041, -12.635562896728516, -12.020003318786621, -11.404443740844727, -10.788884162902832, -10.173324584960938, -9.557765007019043, -8.942205429077148, -8.326645851135254, -7.711086273193359, -7.095526695251465, -6.47996711730957, -5.864407539367676, -5.248847961425781, -4.633288383483887, -4.017728805541992, -3.4021692276000977, -2.786609649658203, -2.1710500717163086, -1.555490493774414, -0.9399309158325195, -0.324371337890625, 0.29118824005126953, 0.9067478179931641, 1.5223073959350586, 2.1378650665283203, 2.753424644470215, 3.3689842224121094, 3.984543800354004, 4.600103378295898, 5.215662956237793, 5.8312225341796875, 6.446782112121582, 7.062341690063477, 7.677901268005371, 8.293460845947266, 8.90902042388916, 9.524580001831055, 10.14013957977295, 10.755699157714844, 11.371258735656738, 11.986818313598633, 12.602377891540527, 13.217937469482422, 13.833497047424316, 14.449056625366211, 15.064616203308105, 15.68017578125, 16.295734405517578, 16.91129493713379, 17.52685546875, 18.142414093017578, 18.757972717285156, 19.373533248901367, 19.989093780517578, 20.604652404785156, 21.220211029052734, 21.835771560668945]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 8.0, 11.0, 9.0, 7.0, 11.0, 12.0, 16.0, 12.0, 21.0, 22.0, 26.0, 24.0, 21.0, 33.0, 40.0, 35.0, 35.0, 52.0, 45.0, 52.0, 42.0, 44.0, 55.0, 32.0, 31.0, 28.0, 30.0, 33.0, 23.0, 32.0, 27.0, 25.0, 23.0, 14.0, 13.0, 7.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817779541015625, -3.67657470703125, -3.535369873046875, -3.3941650390625, -3.252960205078125, -3.11175537109375, -2.970550537109375, -2.829345703125, -2.688140869140625, -2.54693603515625, -2.405731201171875, -2.2645263671875, -2.123321533203125, -1.98211669921875, -1.840911865234375, -1.69970703125, -1.558502197265625, -1.41729736328125, -1.276092529296875, -1.1348876953125, -0.993682861328125, -0.85247802734375, -0.711273193359375, -0.570068359375, -0.428863525390625, -0.28765869140625, -0.146453857421875, -0.0052490234375, 0.135955810546875, 0.27716064453125, 0.418365478515625, 0.5595703125, 0.700775146484375, 0.84197998046875, 0.983184814453125, 1.1243896484375, 1.265594482421875, 1.40679931640625, 1.548004150390625, 1.689208984375, 1.830413818359375, 1.97161865234375, 2.112823486328125, 2.2540283203125, 2.395233154296875, 2.53643798828125, 2.677642822265625, 2.81884765625, 2.960052490234375, 3.10125732421875, 3.242462158203125, 3.3836669921875, 3.524871826171875, 3.66607666015625, 3.807281494140625, 3.948486328125, 4.089691162109375, 4.23089599609375, 4.372100830078125, 4.5133056640625, 4.654510498046875, 4.79571533203125, 4.936920166015625, 5.078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 13.0, 9.0, 34.0, 37.0, 53.0, 66.0, 104.0, 124.0, 197.0, 284.0, 407.0, 639.0, 980.0, 1485.0, 2391.0, 3576.0, 5662.0, 8590.0, 13762.0, 22120.0, 37738.0, 68805.0, 146387.0, 338385.0, 195465.0, 85335.0, 45172.0, 26877.0, 16042.0, 9828.0, 6109.0, 4041.0, 2577.0, 1662.0, 1168.0, 813.0, 542.0, 361.0, 262.0, 149.0, 113.0, 67.0, 36.0, 31.0, 20.0, 12.0, 6.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.723358154296875, -0.69720458984375, -0.671051025390625, -0.6448974609375, -0.618743896484375, -0.59259033203125, -0.566436767578125, -0.540283203125, -0.514129638671875, -0.48797607421875, -0.461822509765625, -0.4356689453125, -0.409515380859375, -0.38336181640625, -0.357208251953125, -0.3310546875, -0.304901123046875, -0.27874755859375, -0.252593994140625, -0.2264404296875, -0.200286865234375, -0.17413330078125, -0.147979736328125, -0.121826171875, -0.095672607421875, -0.06951904296875, -0.043365478515625, -0.0172119140625, 0.008941650390625, 0.03509521484375, 0.061248779296875, 0.08740234375, 0.113555908203125, 0.13970947265625, 0.165863037109375, 0.1920166015625, 0.218170166015625, 0.24432373046875, 0.270477294921875, 0.296630859375, 0.322784423828125, 0.34893798828125, 0.375091552734375, 0.4012451171875, 0.427398681640625, 0.45355224609375, 0.479705810546875, 0.505859375, 0.532012939453125, 0.55816650390625, 0.584320068359375, 0.6104736328125, 0.636627197265625, 0.66278076171875, 0.688934326171875, 0.715087890625, 0.741241455078125, 0.76739501953125, 0.793548583984375, 0.8197021484375, 0.845855712890625, 0.87200927734375, 0.898162841796875, 0.92431640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 5.0, 8.0, 14.0, 19.0, 15.0, 14.0, 24.0, 16.0, 28.0, 30.0, 23.0, 29.0, 36.0, 36.0, 39.0, 42.0, 47.0, 35.0, 1059.0, 42.0, 43.0, 42.0, 34.0, 43.0, 28.0, 29.0, 27.0, 32.0, 21.0, 27.0, 19.0, 17.0, 14.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.771484375, -2.683319091796875, -2.59515380859375, -2.506988525390625, -2.4188232421875, -2.330657958984375, -2.24249267578125, -2.154327392578125, -2.066162109375, -1.977996826171875, -1.88983154296875, -1.801666259765625, -1.7135009765625, -1.625335693359375, -1.53717041015625, -1.449005126953125, -1.36083984375, -1.272674560546875, -1.18450927734375, -1.096343994140625, -1.0081787109375, -0.920013427734375, -0.83184814453125, -0.743682861328125, -0.655517578125, -0.567352294921875, -0.47918701171875, -0.391021728515625, -0.3028564453125, -0.214691162109375, -0.12652587890625, -0.038360595703125, 0.0498046875, 0.137969970703125, 0.22613525390625, 0.314300537109375, 0.4024658203125, 0.490631103515625, 0.57879638671875, 0.666961669921875, 0.755126953125, 0.843292236328125, 0.93145751953125, 1.019622802734375, 1.1077880859375, 1.195953369140625, 1.28411865234375, 1.372283935546875, 1.46044921875, 1.548614501953125, 1.63677978515625, 1.724945068359375, 1.8131103515625, 1.901275634765625, 1.98944091796875, 2.077606201171875, 2.165771484375, 2.253936767578125, 2.34210205078125, 2.430267333984375, 2.5184326171875, 2.606597900390625, 2.69476318359375, 2.782928466796875, 2.87109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 7.0, 5.0, 18.0, 25.0, 31.0, 44.0, 71.0, 108.0, 145.0, 173.0, 276.0, 438.0, 538.0, 840.0, 1106.0, 1594.0, 2130.0, 3022.0, 4334.0, 5965.0, 8396.0, 11791.0, 17051.0, 24694.0, 36409.0, 56100.0, 93852.0, 178821.0, 1294533.0, 133273.0, 73839.0, 45952.0, 30884.0, 20708.0, 14551.0, 10255.0, 7274.0, 5114.0, 3603.0, 2629.0, 1942.0, 1343.0, 943.0, 628.0, 486.0, 354.0, 278.0, 167.0, 124.0, 96.0, 61.0, 42.0, 23.0, 18.0, 12.0, 8.0, 4.0, 3.0, 0.0, 6.0], "bins": [-0.61572265625, -0.596649169921875, -0.57757568359375, -0.558502197265625, -0.5394287109375, -0.520355224609375, -0.50128173828125, -0.482208251953125, -0.463134765625, -0.444061279296875, -0.42498779296875, -0.405914306640625, -0.3868408203125, -0.367767333984375, -0.34869384765625, -0.329620361328125, -0.310546875, -0.291473388671875, -0.27239990234375, -0.253326416015625, -0.2342529296875, -0.215179443359375, -0.19610595703125, -0.177032470703125, -0.157958984375, -0.138885498046875, -0.11981201171875, -0.100738525390625, -0.0816650390625, -0.062591552734375, -0.04351806640625, -0.024444580078125, -0.00537109375, 0.013702392578125, 0.03277587890625, 0.051849365234375, 0.0709228515625, 0.089996337890625, 0.10906982421875, 0.128143310546875, 0.147216796875, 0.166290283203125, 0.18536376953125, 0.204437255859375, 0.2235107421875, 0.242584228515625, 0.26165771484375, 0.280731201171875, 0.2998046875, 0.318878173828125, 0.33795166015625, 0.357025146484375, 0.3760986328125, 0.395172119140625, 0.41424560546875, 0.433319091796875, 0.452392578125, 0.471466064453125, 0.49053955078125, 0.509613037109375, 0.5286865234375, 0.547760009765625, 0.56683349609375, 0.585906982421875, 0.60498046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 4.0, 10.0, 8.0, 5.0, 8.0, 20.0, 17.0, 24.0, 20.0, 20.0, 32.0, 31.0, 44.0, 45.0, 54.0, 55.0, 62.0, 75.0, 58.0, 66.0, 49.0, 39.0, 44.0, 42.0, 36.0, 22.0, 20.0, 18.0, 12.0, 11.0, 9.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015115737915039062, -0.0001463666558265686, -0.00014157593250274658, -0.00013678520917892456, -0.00013199448585510254, -0.00012720376253128052, -0.0001224130392074585, -0.00011762231588363647, -0.00011283159255981445, -0.00010804086923599243, -0.00010325014591217041, -9.845942258834839e-05, -9.366869926452637e-05, -8.887797594070435e-05, -8.408725261688232e-05, -7.92965292930603e-05, -7.450580596923828e-05, -6.971508264541626e-05, -6.492435932159424e-05, -6.013363599777222e-05, -5.5342912673950195e-05, -5.0552189350128174e-05, -4.576146602630615e-05, -4.097074270248413e-05, -3.618001937866211e-05, -3.138929605484009e-05, -2.6598572731018066e-05, -2.1807849407196045e-05, -1.7017126083374023e-05, -1.2226402759552002e-05, -7.4356794357299805e-06, -2.644956111907959e-06, 2.1457672119140625e-06, 6.936490535736084e-06, 1.1727213859558105e-05, 1.6517937183380127e-05, 2.130866050720215e-05, 2.609938383102417e-05, 3.089010715484619e-05, 3.568083047866821e-05, 4.0471553802490234e-05, 4.5262277126312256e-05, 5.005300045013428e-05, 5.48437237739563e-05, 5.963444709777832e-05, 6.442517042160034e-05, 6.921589374542236e-05, 7.400661706924438e-05, 7.87973403930664e-05, 8.358806371688843e-05, 8.837878704071045e-05, 9.316951036453247e-05, 9.796023368835449e-05, 0.00010275095701217651, 0.00010754168033599854, 0.00011233240365982056, 0.00011712312698364258, 0.0001219138503074646, 0.00012670457363128662, 0.00013149529695510864, 0.00013628602027893066, 0.00014107674360275269, 0.0001458674669265747, 0.00015065819025039673, 0.00015544891357421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 7.0, 12.0, 7.0, 9.0, 21.0, 18.0, 33.0, 30.0, 53.0, 63.0, 104.0, 114.0, 202.0, 276.0, 526.0, 1109.0, 119431.0, 922748.0, 1920.0, 683.0, 350.0, 230.0, 137.0, 86.0, 86.0, 60.0, 42.0, 45.0, 31.0, 24.0, 10.0, 19.0, 12.0, 13.0, 6.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.003078460693359375, -0.002985656261444092, -0.0028928518295288086, -0.0028000473976135254, -0.002707242965698242, -0.002614438533782959, -0.0025216341018676758, -0.0024288296699523926, -0.0023360252380371094, -0.002243220806121826, -0.002150416374206543, -0.0020576119422912598, -0.0019648075103759766, -0.0018720030784606934, -0.0017791986465454102, -0.001686394214630127, -0.0015935897827148438, -0.0015007853507995605, -0.0014079809188842773, -0.0013151764869689941, -0.001222372055053711, -0.0011295676231384277, -0.0010367631912231445, -0.0009439587593078613, -0.0008511543273925781, -0.0007583498954772949, -0.0006655454635620117, -0.0005727410316467285, -0.0004799365997314453, -0.0003871321678161621, -0.0002943277359008789, -0.0002015233039855957, -0.0001087188720703125, -1.5914440155029297e-05, 7.68899917602539e-05, 0.0001696944236755371, 0.0002624988555908203, 0.0003553032875061035, 0.0004481077194213867, 0.0005409121513366699, 0.0006337165832519531, 0.0007265210151672363, 0.0008193254470825195, 0.0009121298789978027, 0.001004934310913086, 0.0010977387428283691, 0.0011905431747436523, 0.0012833476066589355, 0.0013761520385742188, 0.001468956470489502, 0.0015617609024047852, 0.0016545653343200684, 0.0017473697662353516, 0.0018401741981506348, 0.001932978630065918, 0.002025783061981201, 0.0021185874938964844, 0.0022113919258117676, 0.0023041963577270508, 0.002397000789642334, 0.002489805221557617, 0.0025826096534729004, 0.0026754140853881836, 0.002768218517303467, 0.00286102294921875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 43.0, 173.0, 395.0, 281.0, 103.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014769290282856673, -0.0001383087655995041, -0.00012892464292235672, -0.00011954050569329411, -0.00011015638301614672, -0.0001007722457870841, -9.13881158339791e-05, -8.20039858808741e-05, -7.26198559277691e-05, -6.323572597466409e-05, -5.385159602155909e-05, -4.446746243047528e-05, -3.508333247737028e-05, -2.5699202524265274e-05, -1.6315068933181465e-05, -6.930938980076462e-06, 2.4531909730285406e-06, 1.1837321835628245e-05, 2.122145269822795e-05, 3.0605584470322356e-05, 3.998971442342736e-05, 4.937384437653236e-05, 5.875797796761617e-05, 6.814210792072117e-05, 7.752623787382618e-05, 8.691036782693118e-05, 9.629449778003618e-05, 0.00010567862773314118, 0.0001150627649622038, 0.0001244468876393512, 0.0001338310248684138, 0.0001432151475455612, 0.00015259927022270858, 0.0001619834074517712, 0.0001713675301289186, 0.0001807516673579812, 0.0001901357900351286, 0.0001995199272641912, 0.00020890406449325383, 0.00021828818717040122, 0.0002276723098475486, 0.00023705644707661122, 0.00024644058430567384, 0.0002558247069828212, 0.0002652088296599686, 0.000274592952337116, 0.00028397710411809385, 0.00029336122679524124, 0.0003027453785762191, 0.00031212950125336647, 0.0003215136530343443, 0.0003308977757114917, 0.0003402818983886391, 0.0003496660210657865, 0.0003590501728467643, 0.0003684342955239117, 0.0003778184182010591, 0.0003872025408782065, 0.00039658669265918434, 0.0004059708153363317, 0.0004153549380134791, 0.0004247390606906265, 0.00043412321247160435, 0.00044350733514875174, 0.0004528914578258991]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 16.0, 10.0, 11.0, 14.0, 17.0, 11.0, 23.0, 22.0, 25.0, 22.0, 27.0, 26.0, 36.0, 51.0, 40.0, 42.0, 49.0, 41.0, 44.0, 38.0, 36.0, 35.0, 33.0, 34.0, 35.0, 42.0, 36.0, 24.0, 32.0, 27.0, 18.0, 16.0, 16.0, 6.0, 6.0, 11.0, 13.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.143352508544922e-05, -8.877180516719818e-05, -8.611008524894714e-05, -8.34483653306961e-05, -8.078664541244507e-05, -7.812492549419403e-05, -7.546320557594299e-05, -7.280148565769196e-05, -7.013976573944092e-05, -6.747804582118988e-05, -6.481632590293884e-05, -6.21546059846878e-05, -5.949288606643677e-05, -5.683116614818573e-05, -5.416944622993469e-05, -5.1507726311683655e-05, -4.884600639343262e-05, -4.618428647518158e-05, -4.352256655693054e-05, -4.0860846638679504e-05, -3.819912672042847e-05, -3.553740680217743e-05, -3.287568688392639e-05, -3.0213966965675354e-05, -2.7552247047424316e-05, -2.489052712917328e-05, -2.222880721092224e-05, -1.9567087292671204e-05, -1.6905367374420166e-05, -1.4243647456169128e-05, -1.158192753791809e-05, -8.920207619667053e-06, -6.258487701416016e-06, -3.596767783164978e-06, -9.350478649139404e-07, 1.7266720533370972e-06, 4.388391971588135e-06, 7.050111889839172e-06, 9.71183180809021e-06, 1.2373551726341248e-05, 1.5035271644592285e-05, 1.7696991562843323e-05, 2.035871148109436e-05, 2.3020431399345398e-05, 2.5682151317596436e-05, 2.8343871235847473e-05, 3.100559115409851e-05, 3.366731107234955e-05, 3.6329030990600586e-05, 3.8990750908851624e-05, 4.165247082710266e-05, 4.43141907453537e-05, 4.6975910663604736e-05, 4.9637630581855774e-05, 5.229935050010681e-05, 5.496107041835785e-05, 5.762279033660889e-05, 6.0284510254859924e-05, 6.294623017311096e-05, 6.5607950091362e-05, 6.826967000961304e-05, 7.093138992786407e-05, 7.359310984611511e-05, 7.625482976436615e-05, 7.891654968261719e-05]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 2.0, 8.0, 11.0, 9.0, 7.0, 11.0, 12.0, 16.0, 12.0, 21.0, 22.0, 26.0, 24.0, 21.0, 33.0, 40.0, 35.0, 35.0, 52.0, 45.0, 52.0, 42.0, 44.0, 55.0, 32.0, 31.0, 28.0, 30.0, 33.0, 23.0, 32.0, 27.0, 25.0, 23.0, 14.0, 13.0, 7.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.817779541015625, -3.67657470703125, -3.535369873046875, -3.3941650390625, -3.252960205078125, -3.11175537109375, -2.970550537109375, -2.829345703125, -2.688140869140625, -2.54693603515625, -2.405731201171875, -2.2645263671875, -2.123321533203125, -1.98211669921875, -1.840911865234375, -1.69970703125, -1.558502197265625, -1.41729736328125, -1.276092529296875, -1.1348876953125, -0.993682861328125, -0.85247802734375, -0.711273193359375, -0.570068359375, -0.428863525390625, -0.28765869140625, -0.146453857421875, -0.0052490234375, 0.135955810546875, 0.27716064453125, 0.418365478515625, 0.5595703125, 0.700775146484375, 0.84197998046875, 0.983184814453125, 1.1243896484375, 1.265594482421875, 1.40679931640625, 1.548004150390625, 1.689208984375, 1.830413818359375, 1.97161865234375, 2.112823486328125, 2.2540283203125, 2.395233154296875, 2.53643798828125, 2.677642822265625, 2.81884765625, 2.960052490234375, 3.10125732421875, 3.242462158203125, 3.3836669921875, 3.524871826171875, 3.66607666015625, 3.807281494140625, 3.948486328125, 4.089691162109375, 4.23089599609375, 4.372100830078125, 4.5133056640625, 4.654510498046875, 4.79571533203125, 4.936920166015625, 5.078125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 10.0, 17.0, 26.0, 33.0, 33.0, 53.0, 70.0, 112.0, 152.0, 164.0, 228.0, 289.0, 473.0, 762.0, 1406.0, 3040.0, 8072.0, 27515.0, 97773.0, 301902.0, 389639.0, 152294.0, 43365.0, 12243.0, 4185.0, 1858.0, 904.0, 542.0, 357.0, 245.0, 226.0, 145.0, 112.0, 69.0, 57.0, 57.0, 30.0, 22.0, 11.0, 13.0, 12.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-6.8046875, -6.61126708984375, -6.4178466796875, -6.22442626953125, -6.031005859375, -5.83758544921875, -5.6441650390625, -5.45074462890625, -5.25732421875, -5.06390380859375, -4.8704833984375, -4.67706298828125, -4.483642578125, -4.29022216796875, -4.0968017578125, -3.90338134765625, -3.7099609375, -3.51654052734375, -3.3231201171875, -3.12969970703125, -2.936279296875, -2.74285888671875, -2.5494384765625, -2.35601806640625, -2.16259765625, -1.96917724609375, -1.7757568359375, -1.58233642578125, -1.388916015625, -1.19549560546875, -1.0020751953125, -0.80865478515625, -0.615234375, -0.42181396484375, -0.2283935546875, -0.03497314453125, 0.158447265625, 0.35186767578125, 0.5452880859375, 0.73870849609375, 0.93212890625, 1.12554931640625, 1.3189697265625, 1.51239013671875, 1.705810546875, 1.89923095703125, 2.0926513671875, 2.28607177734375, 2.4794921875, 2.67291259765625, 2.8663330078125, 3.05975341796875, 3.253173828125, 3.44659423828125, 3.6400146484375, 3.83343505859375, 4.02685546875, 4.22027587890625, 4.4136962890625, 4.60711669921875, 4.800537109375, 4.99395751953125, 5.1873779296875, 5.38079833984375, 5.57421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 11.0, 18.0, 29.0, 25.0, 21.0, 45.0, 40.0, 36.0, 74.0, 92.0, 157.0, 358.0, 1460.0, 173.0, 90.0, 70.0, 53.0, 46.0, 43.0, 35.0, 27.0, 19.0, 23.0, 12.0, 8.0, 12.0, 6.0, 17.0, 5.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.578125, -13.1263427734375, -12.674560546875, -12.2227783203125, -11.77099609375, -11.3192138671875, -10.867431640625, -10.4156494140625, -9.9638671875, -9.5120849609375, -9.060302734375, -8.6085205078125, -8.15673828125, -7.7049560546875, -7.253173828125, -6.8013916015625, -6.349609375, -5.8978271484375, -5.446044921875, -4.9942626953125, -4.54248046875, -4.0906982421875, -3.638916015625, -3.1871337890625, -2.7353515625, -2.2835693359375, -1.831787109375, -1.3800048828125, -0.92822265625, -0.4764404296875, -0.024658203125, 0.4271240234375, 0.87890625, 1.3306884765625, 1.782470703125, 2.2342529296875, 2.68603515625, 3.1378173828125, 3.589599609375, 4.0413818359375, 4.4931640625, 4.9449462890625, 5.396728515625, 5.8485107421875, 6.30029296875, 6.7520751953125, 7.203857421875, 7.6556396484375, 8.107421875, 8.5592041015625, 9.010986328125, 9.4627685546875, 9.91455078125, 10.3663330078125, 10.818115234375, 11.2698974609375, 11.7216796875, 12.1734619140625, 12.625244140625, 13.0770263671875, 13.52880859375, 13.9805908203125, 14.432373046875, 14.8841552734375, 15.3359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 12.0, 15.0, 25.0, 27.0, 41.0, 41.0, 93.0, 75.0, 104.0, 146.0, 204.0, 309.0, 434.0, 716.0, 1402.0, 11715.0, 2271148.0, 848604.0, 7320.0, 1223.0, 643.0, 361.0, 269.0, 210.0, 132.0, 123.0, 61.0, 35.0, 42.0, 29.0, 30.0, 24.0, 9.0, 8.0, 8.0, 8.0, 8.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-26.03125, -25.306640625, -24.58203125, -23.857421875, -23.1328125, -22.408203125, -21.68359375, -20.958984375, -20.234375, -19.509765625, -18.78515625, -18.060546875, -17.3359375, -16.611328125, -15.88671875, -15.162109375, -14.4375, -13.712890625, -12.98828125, -12.263671875, -11.5390625, -10.814453125, -10.08984375, -9.365234375, -8.640625, -7.916015625, -7.19140625, -6.466796875, -5.7421875, -5.017578125, -4.29296875, -3.568359375, -2.84375, -2.119140625, -1.39453125, -0.669921875, 0.0546875, 0.779296875, 1.50390625, 2.228515625, 2.953125, 3.677734375, 4.40234375, 5.126953125, 5.8515625, 6.576171875, 7.30078125, 8.025390625, 8.75, 9.474609375, 10.19921875, 10.923828125, 11.6484375, 12.373046875, 13.09765625, 13.822265625, 14.546875, 15.271484375, 15.99609375, 16.720703125, 17.4453125, 18.169921875, 18.89453125, 19.619140625, 20.34375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 41.0, 79.0, 191.0, 248.0, 255.0, 125.0, 54.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.88557243347168, -22.83837127685547, -21.79117202758789, -20.74397087097168, -19.69676971435547, -18.649568557739258, -17.602367401123047, -16.55516815185547, -15.507966995239258, -14.460765838623047, -13.413565635681152, -12.366365432739258, -11.319164276123047, -10.271963119506836, -9.224762916564941, -8.177562713623047, -7.130361557006836, -6.083160877227783, -5.0359601974487305, -3.9887595176696777, -2.941558837890625, -1.8943581581115723, -0.8471574783325195, 0.2000432014465332, 1.247243881225586, 2.2944445610046387, 3.3416452407836914, 4.388845920562744, 5.436046600341797, 6.48324728012085, 7.530447959899902, 8.577648162841797, 9.624847412109375, 10.672048568725586, 11.71924877166748, 12.766448974609375, 13.813650131225586, 14.860851287841797, 15.908051490783691, 16.955251693725586, 18.002452850341797, 19.049654006958008, 20.09685516357422, 21.144054412841797, 22.191255569458008, 23.23845672607422, 24.285655975341797, 25.332857131958008, 26.38005828857422, 27.42725944519043, 28.47446060180664, 29.52165985107422, 30.56886100769043, 31.61606216430664, 32.66326141357422, 33.71046447753906, 34.75766372680664, 35.80486297607422, 36.85206604003906, 37.89926528930664, 38.94646453857422, 39.99366760253906, 41.04086685180664, 42.088069915771484, 43.13526916503906]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 8.0, 3.0, 7.0, 7.0, 10.0, 10.0, 8.0, 13.0, 17.0, 20.0, 23.0, 23.0, 25.0, 27.0, 25.0, 30.0, 31.0, 40.0, 45.0, 38.0, 39.0, 31.0, 30.0, 35.0, 33.0, 38.0, 27.0, 41.0, 34.0, 31.0, 21.0, 23.0, 20.0, 20.0, 23.0, 16.0, 19.0, 22.0, 8.0, 15.0, 10.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.802602767944336, -21.121204376220703, -20.43980598449707, -19.758407592773438, -19.077009201049805, -18.395610809326172, -17.714214324951172, -17.03281593322754, -16.351417541503906, -15.670019149780273, -14.98862075805664, -14.307222366333008, -13.625824928283691, -12.944426536560059, -12.263028144836426, -11.58163070678711, -10.90023136138916, -10.218832969665527, -9.537434577941895, -8.856037139892578, -8.174638748168945, -7.4932403564453125, -6.81184196472168, -6.130444049835205, -5.449045658111572, -4.7676472663879395, -4.086249351501465, -3.404850959777832, -2.7234528064727783, -2.0420546531677246, -1.3606562614440918, -0.6792583465576172, 0.002140045166015625, 0.6835382580757141, 1.3649364709854126, 2.046334743499756, 2.7277328968048096, 3.4091310501098633, 4.090529441833496, 4.771927356719971, 5.4533257484436035, 6.134724140167236, 6.816122055053711, 7.497520446777344, 8.178918838500977, 8.86031723022461, 9.541715621948242, 10.223113059997559, 10.904511451721191, 11.585909843444824, 12.267308235168457, 12.948705673217773, 13.630104064941406, 14.311502456665039, 14.992900848388672, 15.674299240112305, 16.355697631835938, 17.03709602355957, 17.718494415283203, 18.399892807006836, 19.08129119873047, 19.76268768310547, 20.444087982177734, 21.125484466552734, 21.806882858276367]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 4.0, 7.0, 7.0, 1.0, 11.0, 10.0, 10.0, 20.0, 13.0, 14.0, 19.0, 12.0, 19.0, 22.0, 29.0, 25.0, 31.0, 40.0, 39.0, 54.0, 30.0, 37.0, 35.0, 57.0, 38.0, 37.0, 36.0, 28.0, 26.0, 34.0, 33.0, 31.0, 14.0, 33.0, 15.0, 17.0, 18.0, 18.0, 11.0, 14.0, 10.0, 7.0, 6.0, 7.0, 3.0, 5.0, 1.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.0078125, -3.874267578125, -3.74072265625, -3.607177734375, -3.4736328125, -3.340087890625, -3.20654296875, -3.072998046875, -2.939453125, -2.805908203125, -2.67236328125, -2.538818359375, -2.4052734375, -2.271728515625, -2.13818359375, -2.004638671875, -1.87109375, -1.737548828125, -1.60400390625, -1.470458984375, -1.3369140625, -1.203369140625, -1.06982421875, -0.936279296875, -0.802734375, -0.669189453125, -0.53564453125, -0.402099609375, -0.2685546875, -0.135009765625, -0.00146484375, 0.132080078125, 0.265625, 0.399169921875, 0.53271484375, 0.666259765625, 0.7998046875, 0.933349609375, 1.06689453125, 1.200439453125, 1.333984375, 1.467529296875, 1.60107421875, 1.734619140625, 1.8681640625, 2.001708984375, 2.13525390625, 2.268798828125, 2.40234375, 2.535888671875, 2.66943359375, 2.802978515625, 2.9365234375, 3.070068359375, 3.20361328125, 3.337158203125, 3.470703125, 3.604248046875, 3.73779296875, 3.871337890625, 4.0048828125, 4.138427734375, 4.27197265625, 4.405517578125, 4.5390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 7.0, 7.0, 12.0, 3.0, 8.0, 12.0, 21.0, 26.0, 30.0, 40.0, 43.0, 65.0, 93.0, 115.0, 135.0, 185.0, 280.0, 382.0, 532.0, 4753.0, 4183987.0, 1605.0, 469.0, 369.0, 257.0, 216.0, 149.0, 106.0, 83.0, 70.0, 38.0, 29.0, 26.0, 28.0, 24.0, 15.0, 11.0, 10.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-80.0625, -77.80078125, -75.5390625, -73.27734375, -71.015625, -68.75390625, -66.4921875, -64.23046875, -61.96875, -59.70703125, -57.4453125, -55.18359375, -52.921875, -50.66015625, -48.3984375, -46.13671875, -43.875, -41.61328125, -39.3515625, -37.08984375, -34.828125, -32.56640625, -30.3046875, -28.04296875, -25.78125, -23.51953125, -21.2578125, -18.99609375, -16.734375, -14.47265625, -12.2109375, -9.94921875, -7.6875, -5.42578125, -3.1640625, -0.90234375, 1.359375, 3.62109375, 5.8828125, 8.14453125, 10.40625, 12.66796875, 14.9296875, 17.19140625, 19.453125, 21.71484375, 23.9765625, 26.23828125, 28.5, 30.76171875, 33.0234375, 35.28515625, 37.546875, 39.80859375, 42.0703125, 44.33203125, 46.59375, 48.85546875, 51.1171875, 53.37890625, 55.640625, 57.90234375, 60.1640625, 62.42578125, 64.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 11.0, 11.0, 9.0, 22.0, 36.0, 36.0, 52.0, 57.0, 86.0, 118.0, 180.0, 231.0, 352.0, 456.0, 513.0, 487.0, 402.0, 273.0, 214.0, 130.0, 87.0, 69.0, 48.0, 47.0, 26.0, 30.0, 8.0, 13.0, 13.0, 6.0, 4.0, 10.0, 2.0, 4.0, 0.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.23046875, -7.021484375, -6.8125, -6.603515625, -6.39453125, -6.185546875, -5.9765625, -5.767578125, -5.55859375, -5.349609375, -5.140625, -4.931640625, -4.72265625, -4.513671875, -4.3046875, -4.095703125, -3.88671875, -3.677734375, -3.46875, -3.259765625, -3.05078125, -2.841796875, -2.6328125, -2.423828125, -2.21484375, -2.005859375, -1.796875, -1.587890625, -1.37890625, -1.169921875, -0.9609375, -0.751953125, -0.54296875, -0.333984375, -0.125, 0.083984375, 0.29296875, 0.501953125, 0.7109375, 0.919921875, 1.12890625, 1.337890625, 1.546875, 1.755859375, 1.96484375, 2.173828125, 2.3828125, 2.591796875, 2.80078125, 3.009765625, 3.21875, 3.427734375, 3.63671875, 3.845703125, 4.0546875, 4.263671875, 4.47265625, 4.681640625, 4.890625, 5.099609375, 5.30859375, 5.517578125, 5.7265625, 5.935546875, 6.14453125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 11.0, 7.0, 19.0, 26.0, 31.0, 35.0, 47.0, 63.0, 82.0, 159.0, 603.0, 57261.0, 4132131.0, 3075.0, 334.0, 117.0, 75.0, 44.0, 36.0, 42.0, 24.0, 25.0, 16.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-68.4375, -66.7392578125, -65.041015625, -63.3427734375, -61.64453125, -59.9462890625, -58.248046875, -56.5498046875, -54.8515625, -53.1533203125, -51.455078125, -49.7568359375, -48.05859375, -46.3603515625, -44.662109375, -42.9638671875, -41.265625, -39.5673828125, -37.869140625, -36.1708984375, -34.47265625, -32.7744140625, -31.076171875, -29.3779296875, -27.6796875, -25.9814453125, -24.283203125, -22.5849609375, -20.88671875, -19.1884765625, -17.490234375, -15.7919921875, -14.09375, -12.3955078125, -10.697265625, -8.9990234375, -7.30078125, -5.6025390625, -3.904296875, -2.2060546875, -0.5078125, 1.1904296875, 2.888671875, 4.5869140625, 6.28515625, 7.9833984375, 9.681640625, 11.3798828125, 13.078125, 14.7763671875, 16.474609375, 18.1728515625, 19.87109375, 21.5693359375, 23.267578125, 24.9658203125, 26.6640625, 28.3623046875, 30.060546875, 31.7587890625, 33.45703125, 35.1552734375, 36.853515625, 38.5517578125, 40.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 33.0, 90.0, 174.0, 269.0, 257.0, 123.0, 41.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.711305618286133, -30.176977157592773, -28.642648696899414, -27.108318328857422, -25.573989868164062, -24.039661407470703, -22.505332946777344, -20.971004486083984, -19.436676025390625, -17.902347564697266, -16.368019104003906, -14.83368968963623, -13.299361228942871, -11.765032768249512, -10.230703353881836, -8.696374893188477, -7.162046432495117, -5.627717971801758, -4.09338903427124, -2.5590600967407227, -1.0247316360473633, 0.5095968246459961, 2.043926239013672, 3.5782546997070312, 5.112583160400391, 6.64691162109375, 8.18124008178711, 9.715569496154785, 11.249897956848145, 12.784226417541504, 14.31855583190918, 15.852884292602539, 17.38721466064453, 18.92154312133789, 20.45587158203125, 21.99020004272461, 23.52452850341797, 25.058856964111328, 26.59318733215332, 28.12751579284668, 29.66184425354004, 31.1961727142334, 32.73050308227539, 34.26483154296875, 35.79916000366211, 37.33348846435547, 38.86781692504883, 40.40214538574219, 41.93647384643555, 43.470802307128906, 45.005130767822266, 46.539459228515625, 48.073787689208984, 49.608116149902344, 51.14244842529297, 52.67677307128906, 54.21110534667969, 55.74543380737305, 57.279762268066406, 58.814090728759766, 60.348419189453125, 61.882747650146484, 63.417076110839844, 64.95140838623047, 66.48573303222656]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 2.0, 1.0, 7.0, 5.0, 11.0, 14.0, 14.0, 12.0, 13.0, 17.0, 32.0, 18.0, 23.0, 21.0, 37.0, 40.0, 40.0, 43.0, 41.0, 31.0, 44.0, 38.0, 44.0, 38.0, 36.0, 39.0, 33.0, 38.0, 35.0, 30.0, 26.0, 29.0, 24.0, 20.0, 17.0, 19.0, 14.0, 14.0, 6.0, 5.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.36933135986328, -19.69687271118164, -19.024415969848633, -18.351957321166992, -17.679500579833984, -17.007041931152344, -16.334583282470703, -15.662125587463379, -14.989667892456055, -14.31721019744873, -13.644752502441406, -12.972293853759766, -12.299836158752441, -11.627378463745117, -10.954919815063477, -10.282462120056152, -9.610004425048828, -8.937546730041504, -8.26508903503418, -7.592630386352539, -6.920172691345215, -6.247714996337891, -5.575256824493408, -4.902798652648926, -4.230340957641602, -3.5578830242156982, -2.885425090789795, -2.2129671573638916, -1.5405092239379883, -0.868051290512085, -0.19559335708618164, 0.4768648147583008, 1.1493244171142578, 1.8217823505401611, 2.4942402839660645, 3.1666982173919678, 3.839156150817871, 4.511613845825195, 5.184072017669678, 5.85653018951416, 6.528987884521484, 7.201445579528809, 7.873903751373291, 8.546361923217773, 9.218819618225098, 9.891277313232422, 10.563735961914062, 11.236193656921387, 11.908651351928711, 12.581109046936035, 13.25356674194336, 13.926025390625, 14.598483085632324, 15.270940780639648, 15.943399429321289, 16.615856170654297, 17.288314819335938, 17.960773468017578, 18.633230209350586, 19.305688858032227, 19.978145599365234, 20.650604248046875, 21.323062896728516, 21.995521545410156, 22.667978286743164]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 29.0, 28.0, 41.0, 49.0, 37.0, 41.0, 45.0, 49.0, 48.0, 56.0, 45.0, 43.0, 37.0, 27.0, 28.0, 40.0, 28.0, 23.0, 24.0, 35.0, 23.0, 18.0, 8.0, 11.0, 20.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5816650390625, -4.432861328125, -4.2840576171875, -4.13525390625, -3.9864501953125, -3.837646484375, -3.6888427734375, -3.5400390625, -3.3912353515625, -3.242431640625, -3.0936279296875, -2.94482421875, -2.7960205078125, -2.647216796875, -2.4984130859375, -2.349609375, -2.2008056640625, -2.052001953125, -1.9031982421875, -1.75439453125, -1.6055908203125, -1.456787109375, -1.3079833984375, -1.1591796875, -1.0103759765625, -0.861572265625, -0.7127685546875, -0.56396484375, -0.4151611328125, -0.266357421875, -0.1175537109375, 0.03125, 0.1800537109375, 0.328857421875, 0.4776611328125, 0.62646484375, 0.7752685546875, 0.924072265625, 1.0728759765625, 1.2216796875, 1.3704833984375, 1.519287109375, 1.6680908203125, 1.81689453125, 1.9656982421875, 2.114501953125, 2.2633056640625, 2.412109375, 2.5609130859375, 2.709716796875, 2.8585205078125, 3.00732421875, 3.1561279296875, 3.304931640625, 3.4537353515625, 3.6025390625, 3.7513427734375, 3.900146484375, 4.0489501953125, 4.19775390625, 4.3465576171875, 4.495361328125, 4.6441650390625, 4.79296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 13.0, 16.0, 20.0, 20.0, 42.0, 61.0, 107.0, 176.0, 287.0, 441.0, 682.0, 1094.0, 1808.0, 2872.0, 4967.0, 8218.0, 14205.0, 24703.0, 45471.0, 88549.0, 211727.0, 355444.0, 140102.0, 65701.0, 34644.0, 19234.0, 11110.0, 6573.0, 3967.0, 2435.0, 1484.0, 880.0, 510.0, 345.0, 229.0, 162.0, 92.0, 52.0, 37.0, 15.0, 20.0, 18.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.8867340087890625, -0.857452392578125, -0.8281707763671875, -0.79888916015625, -0.7696075439453125, -0.740325927734375, -0.7110443115234375, -0.6817626953125, -0.6524810791015625, -0.623199462890625, -0.5939178466796875, -0.56463623046875, -0.5353546142578125, -0.506072998046875, -0.4767913818359375, -0.447509765625, -0.4182281494140625, -0.388946533203125, -0.3596649169921875, -0.33038330078125, -0.3011016845703125, -0.271820068359375, -0.2425384521484375, -0.2132568359375, -0.1839752197265625, -0.154693603515625, -0.1254119873046875, -0.09613037109375, -0.0668487548828125, -0.037567138671875, -0.0082855224609375, 0.02099609375, 0.0502777099609375, 0.079559326171875, 0.1088409423828125, 0.13812255859375, 0.1674041748046875, 0.196685791015625, 0.2259674072265625, 0.2552490234375, 0.2845306396484375, 0.313812255859375, 0.3430938720703125, 0.37237548828125, 0.4016571044921875, 0.430938720703125, 0.4602203369140625, 0.489501953125, 0.5187835693359375, 0.548065185546875, 0.5773468017578125, 0.60662841796875, 0.6359100341796875, 0.665191650390625, 0.6944732666015625, 0.7237548828125, 0.7530364990234375, 0.782318115234375, 0.8115997314453125, 0.84088134765625, 0.8701629638671875, 0.899444580078125, 0.9287261962890625, 0.9580078125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 1.0, 5.0, 4.0, 7.0, 9.0, 12.0, 11.0, 13.0, 21.0, 11.0, 15.0, 22.0, 24.0, 17.0, 30.0, 36.0, 29.0, 31.0, 40.0, 19.0, 27.0, 36.0, 35.0, 1063.0, 27.0, 34.0, 47.0, 40.0, 24.0, 23.0, 29.0, 20.0, 32.0, 26.0, 30.0, 26.0, 18.0, 17.0, 12.0, 24.0, 13.0, 7.0, 8.0, 7.0, 9.0, 4.0, 5.0, 5.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.453125, -2.380157470703125, -2.30718994140625, -2.234222412109375, -2.1612548828125, -2.088287353515625, -2.01531982421875, -1.942352294921875, -1.869384765625, -1.796417236328125, -1.72344970703125, -1.650482177734375, -1.5775146484375, -1.504547119140625, -1.43157958984375, -1.358612060546875, -1.28564453125, -1.212677001953125, -1.13970947265625, -1.066741943359375, -0.9937744140625, -0.920806884765625, -0.84783935546875, -0.774871826171875, -0.701904296875, -0.628936767578125, -0.55596923828125, -0.483001708984375, -0.4100341796875, -0.337066650390625, -0.26409912109375, -0.191131591796875, -0.1181640625, -0.045196533203125, 0.02777099609375, 0.100738525390625, 0.1737060546875, 0.246673583984375, 0.31964111328125, 0.392608642578125, 0.465576171875, 0.538543701171875, 0.61151123046875, 0.684478759765625, 0.7574462890625, 0.830413818359375, 0.90338134765625, 0.976348876953125, 1.04931640625, 1.122283935546875, 1.19525146484375, 1.268218994140625, 1.3411865234375, 1.414154052734375, 1.48712158203125, 1.560089111328125, 1.633056640625, 1.706024169921875, 1.77899169921875, 1.851959228515625, 1.9249267578125, 1.997894287109375, 2.07086181640625, 2.143829345703125, 2.216796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 8.0, 8.0, 14.0, 12.0, 25.0, 47.0, 70.0, 103.0, 147.0, 209.0, 294.0, 399.0, 607.0, 792.0, 1069.0, 1427.0, 2007.0, 2809.0, 3647.0, 5212.0, 7164.0, 9896.0, 13937.0, 19318.0, 28089.0, 40646.0, 60953.0, 98211.0, 185831.0, 1271084.0, 118985.0, 70079.0, 45654.0, 31314.0, 21984.0, 15521.0, 10995.0, 7936.0, 5678.0, 4133.0, 2934.0, 2211.0, 1576.0, 1152.0, 789.0, 616.0, 443.0, 286.0, 237.0, 180.0, 110.0, 88.0, 70.0, 48.0, 38.0, 17.0, 15.0, 10.0, 6.0, 3.0, 2.0], "bins": [-0.541015625, -0.5241928100585938, -0.5073699951171875, -0.49054718017578125, -0.473724365234375, -0.45690155029296875, -0.4400787353515625, -0.42325592041015625, -0.40643310546875, -0.38961029052734375, -0.3727874755859375, -0.35596466064453125, -0.339141845703125, -0.32231903076171875, -0.3054962158203125, -0.28867340087890625, -0.2718505859375, -0.25502777099609375, -0.2382049560546875, -0.22138214111328125, -0.204559326171875, -0.18773651123046875, -0.1709136962890625, -0.15409088134765625, -0.13726806640625, -0.12044525146484375, -0.1036224365234375, -0.08679962158203125, -0.069976806640625, -0.05315399169921875, -0.0363311767578125, -0.01950836181640625, -0.002685546875, 0.01413726806640625, 0.0309600830078125, 0.04778289794921875, 0.064605712890625, 0.08142852783203125, 0.0982513427734375, 0.11507415771484375, 0.13189697265625, 0.14871978759765625, 0.1655426025390625, 0.18236541748046875, 0.199188232421875, 0.21601104736328125, 0.2328338623046875, 0.24965667724609375, 0.2664794921875, 0.28330230712890625, 0.3001251220703125, 0.31694793701171875, 0.333770751953125, 0.35059356689453125, 0.3674163818359375, 0.38423919677734375, 0.40106201171875, 0.41788482666015625, 0.4347076416015625, 0.45153045654296875, 0.468353271484375, 0.48517608642578125, 0.5019989013671875, 0.5188217163085938, 0.53564453125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 4.0, 11.0, 8.0, 14.0, 14.0, 11.0, 18.0, 27.0, 43.0, 44.0, 52.0, 42.0, 69.0, 70.0, 54.0, 68.0, 60.0, 66.0, 54.0, 49.0, 42.0, 49.0, 33.0, 19.0, 15.0, 18.0, 8.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013589859008789062, -0.00013083219528198242, -0.00012576580047607422, -0.00012069940567016602, -0.00011563301086425781, -0.00011056661605834961, -0.0001055002212524414, -0.0001004338264465332, -9.5367431640625e-05, -9.03010368347168e-05, -8.52346420288086e-05, -8.016824722290039e-05, -7.510185241699219e-05, -7.003545761108398e-05, -6.496906280517578e-05, -5.990266799926758e-05, -5.4836273193359375e-05, -4.976987838745117e-05, -4.470348358154297e-05, -3.9637088775634766e-05, -3.457069396972656e-05, -2.950429916381836e-05, -2.4437904357910156e-05, -1.9371509552001953e-05, -1.430511474609375e-05, -9.238719940185547e-06, -4.172325134277344e-06, 8.940696716308594e-07, 5.9604644775390625e-06, 1.1026859283447266e-05, 1.609325408935547e-05, 2.1159648895263672e-05, 2.6226043701171875e-05, 3.129243850708008e-05, 3.635883331298828e-05, 4.1425228118896484e-05, 4.649162292480469e-05, 5.155801773071289e-05, 5.6624412536621094e-05, 6.16908073425293e-05, 6.67572021484375e-05, 7.18235969543457e-05, 7.68899917602539e-05, 8.195638656616211e-05, 8.702278137207031e-05, 9.208917617797852e-05, 9.715557098388672e-05, 0.00010222196578979492, 0.00010728836059570312, 0.00011235475540161133, 0.00011742115020751953, 0.00012248754501342773, 0.00012755393981933594, 0.00013262033462524414, 0.00013768672943115234, 0.00014275312423706055, 0.00014781951904296875, 0.00015288591384887695, 0.00015795230865478516, 0.00016301870346069336, 0.00016808509826660156, 0.00017315149307250977, 0.00017821788787841797, 0.00018328428268432617, 0.00018835067749023438]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 11.0, 7.0, 10.0, 8.0, 17.0, 15.0, 27.0, 29.0, 36.0, 67.0, 97.0, 128.0, 195.0, 258.0, 432.0, 774.0, 1519.0, 472519.0, 568710.0, 1632.0, 766.0, 413.0, 274.0, 195.0, 104.0, 75.0, 54.0, 37.0, 30.0, 30.0, 21.0, 11.0, 10.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030765533447265625, -0.0029861032962799072, -0.002895653247833252, -0.0028052031993865967, -0.0027147531509399414, -0.002624303102493286, -0.002533853054046631, -0.0024434030055999756, -0.0023529529571533203, -0.002262502908706665, -0.0021720528602600098, -0.0020816028118133545, -0.0019911527633666992, -0.001900702714920044, -0.0018102526664733887, -0.0017198026180267334, -0.0016293525695800781, -0.0015389025211334229, -0.0014484524726867676, -0.0013580024242401123, -0.001267552375793457, -0.0011771023273468018, -0.0010866522789001465, -0.0009962022304534912, -0.0009057521820068359, -0.0008153021335601807, -0.0007248520851135254, -0.0006344020366668701, -0.0005439519882202148, -0.00045350193977355957, -0.0003630518913269043, -0.000272601842880249, -0.00018215179443359375, -9.170174598693848e-05, -1.2516975402832031e-06, 8.919835090637207e-05, 0.00017964839935302734, 0.0002700984477996826, 0.0003605484962463379, 0.00045099854469299316, 0.0005414485931396484, 0.0006318986415863037, 0.000722348690032959, 0.0008127987384796143, 0.0009032487869262695, 0.0009936988353729248, 0.00108414888381958, 0.0011745989322662354, 0.0012650489807128906, 0.001355499029159546, 0.0014459490776062012, 0.0015363991260528564, 0.0016268491744995117, 0.001717299222946167, 0.0018077492713928223, 0.0018981993198394775, 0.001988649368286133, 0.002079099416732788, 0.0021695494651794434, 0.0022599995136260986, 0.002350449562072754, 0.002440899610519409, 0.0025313496589660645, 0.0026217997074127197, 0.002712249755859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 8.0, 25.0, 100.0, 281.0, 348.0, 175.0, 59.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003797558892983943, -0.00037220411468297243, -0.00036465234006755054, -0.00035710056545212865, -0.00034954879083670676, -0.00034199701622128487, -0.000334445241605863, -0.0003268934669904411, -0.0003193416923750192, -0.0003117899177595973, -0.0003042381431441754, -0.0002966863685287535, -0.00028913459391333163, -0.00028158281929790974, -0.00027403104468248785, -0.00026647927006706595, -0.0002589275245554745, -0.00025137574994005263, -0.00024382397532463074, -0.00023627220070920885, -0.00022872042609378695, -0.00022116865147836506, -0.00021361687686294317, -0.00020606510224752128, -0.0001985133276320994, -0.0001909615530166775, -0.0001834097784012556, -0.00017585800378583372, -0.00016830622917041183, -0.00016075445455498993, -0.00015320267993956804, -0.00014565090532414615, -0.0001380991452606395, -0.0001305473706452176, -0.0001229955960297957, -0.00011544382141437382, -0.00010789204679895192, -0.00010034027218353003, -9.278850484406576e-05, -8.523673022864386e-05, -7.768495561322197e-05, -7.013318099780008e-05, -6.258140638237819e-05, -5.502963540493511e-05, -4.7477860789513215e-05, -3.9926086174091324e-05, -3.237431519664824e-05, -2.482254058122635e-05, -1.7270765965804458e-05, -9.718992259877268e-06, -2.1672185539500788e-06, 5.384554242482409e-06, 1.29363288579043e-05, 2.048810347332619e-05, 2.8039874450769275e-05, 3.559164906619117e-05, 4.314342368161306e-05, 5.069519829703495e-05, 5.824697291245684e-05, 6.579874025192112e-05, 7.335051486734301e-05, 8.09022894827649e-05, 8.845406409818679e-05, 9.600583871360868e-05, 0.00010355761332903057]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 5.0, 6.0, 8.0, 2.0, 6.0, 11.0, 12.0, 12.0, 22.0, 21.0, 24.0, 28.0, 28.0, 32.0, 27.0, 46.0, 37.0, 42.0, 48.0, 41.0, 49.0, 40.0, 38.0, 51.0, 39.0, 41.0, 46.0, 39.0, 34.0, 38.0, 22.0, 26.0, 19.0, 11.0, 10.0, 13.0, 4.0, 7.0, 8.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.176399230957031e-05, -6.916001439094543e-05, -6.655603647232056e-05, -6.395205855369568e-05, -6.13480806350708e-05, -5.874410271644592e-05, -5.6140124797821045e-05, -5.353614687919617e-05, -5.093216896057129e-05, -4.832819104194641e-05, -4.572421312332153e-05, -4.3120235204696655e-05, -4.051625728607178e-05, -3.79122793674469e-05, -3.530830144882202e-05, -3.2704323530197144e-05, -3.0100345611572266e-05, -2.7496367692947388e-05, -2.489238977432251e-05, -2.2288411855697632e-05, -1.9684433937072754e-05, -1.7080456018447876e-05, -1.4476478099822998e-05, -1.187250018119812e-05, -9.268522262573242e-06, -6.664544343948364e-06, -4.060566425323486e-06, -1.4565885066986084e-06, 1.1473894119262695e-06, 3.7513673305511475e-06, 6.355345249176025e-06, 8.959323167800903e-06, 1.1563301086425781e-05, 1.416727900505066e-05, 1.6771256923675537e-05, 1.9375234842300415e-05, 2.1979212760925293e-05, 2.458319067955017e-05, 2.718716859817505e-05, 2.9791146516799927e-05, 3.2395124435424805e-05, 3.499910235404968e-05, 3.760308027267456e-05, 4.020705819129944e-05, 4.2811036109924316e-05, 4.5415014028549194e-05, 4.801899194717407e-05, 5.062296986579895e-05, 5.322694778442383e-05, 5.5830925703048706e-05, 5.8434903621673584e-05, 6.103888154029846e-05, 6.364285945892334e-05, 6.624683737754822e-05, 6.88508152961731e-05, 7.145479321479797e-05, 7.405877113342285e-05, 7.666274905204773e-05, 7.926672697067261e-05, 8.187070488929749e-05, 8.447468280792236e-05, 8.707866072654724e-05, 8.968263864517212e-05, 9.2286616563797e-05, 9.489059448242188e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 10.0, 15.0, 21.0, 23.0, 28.0, 29.0, 28.0, 41.0, 49.0, 37.0, 41.0, 45.0, 49.0, 48.0, 56.0, 45.0, 43.0, 37.0, 27.0, 28.0, 40.0, 28.0, 23.0, 24.0, 35.0, 23.0, 18.0, 8.0, 11.0, 20.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.5816650390625, -4.432861328125, -4.2840576171875, -4.13525390625, -3.9864501953125, -3.837646484375, -3.6888427734375, -3.5400390625, -3.3912353515625, -3.242431640625, -3.0936279296875, -2.94482421875, -2.7960205078125, -2.647216796875, -2.4984130859375, -2.349609375, -2.2008056640625, -2.052001953125, -1.9031982421875, -1.75439453125, -1.6055908203125, -1.456787109375, -1.3079833984375, -1.1591796875, -1.0103759765625, -0.861572265625, -0.7127685546875, -0.56396484375, -0.4151611328125, -0.266357421875, -0.1175537109375, 0.03125, 0.1800537109375, 0.328857421875, 0.4776611328125, 0.62646484375, 0.7752685546875, 0.924072265625, 1.0728759765625, 1.2216796875, 1.3704833984375, 1.519287109375, 1.6680908203125, 1.81689453125, 1.9656982421875, 2.114501953125, 2.2633056640625, 2.412109375, 2.5609130859375, 2.709716796875, 2.8585205078125, 3.00732421875, 3.1561279296875, 3.304931640625, 3.4537353515625, 3.6025390625, 3.7513427734375, 3.900146484375, 4.0489501953125, 4.19775390625, 4.3465576171875, 4.495361328125, 4.6441650390625, 4.79296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 12.0, 16.0, 19.0, 19.0, 18.0, 26.0, 43.0, 62.0, 68.0, 90.0, 122.0, 179.0, 239.0, 318.0, 472.0, 610.0, 846.0, 1183.0, 1632.0, 3414.0, 18014.0, 152932.0, 598307.0, 230494.0, 28526.0, 4403.0, 1937.0, 1221.0, 888.0, 654.0, 446.0, 360.0, 257.0, 190.0, 135.0, 95.0, 99.0, 58.0, 47.0, 23.0, 25.0, 15.0, 12.0, 12.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.4609375, -9.1707763671875, -8.880615234375, -8.5904541015625, -8.30029296875, -8.0101318359375, -7.719970703125, -7.4298095703125, -7.1396484375, -6.8494873046875, -6.559326171875, -6.2691650390625, -5.97900390625, -5.6888427734375, -5.398681640625, -5.1085205078125, -4.818359375, -4.5281982421875, -4.238037109375, -3.9478759765625, -3.65771484375, -3.3675537109375, -3.077392578125, -2.7872314453125, -2.4970703125, -2.2069091796875, -1.916748046875, -1.6265869140625, -1.33642578125, -1.0462646484375, -0.756103515625, -0.4659423828125, -0.17578125, 0.1143798828125, 0.404541015625, 0.6947021484375, 0.98486328125, 1.2750244140625, 1.565185546875, 1.8553466796875, 2.1455078125, 2.4356689453125, 2.725830078125, 3.0159912109375, 3.30615234375, 3.5963134765625, 3.886474609375, 4.1766357421875, 4.466796875, 4.7569580078125, 5.047119140625, 5.3372802734375, 5.62744140625, 5.9176025390625, 6.207763671875, 6.4979248046875, 6.7880859375, 7.0782470703125, 7.368408203125, 7.6585693359375, 7.94873046875, 8.2388916015625, 8.529052734375, 8.8192138671875, 9.109375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 10.0, 11.0, 12.0, 25.0, 16.0, 17.0, 19.0, 25.0, 26.0, 35.0, 46.0, 48.0, 43.0, 45.0, 73.0, 188.0, 1437.0, 354.0, 169.0, 81.0, 54.0, 60.0, 32.0, 29.0, 28.0, 17.0, 11.0, 22.0, 17.0, 16.0, 9.0, 14.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-11.2890625, -10.9656982421875, -10.642333984375, -10.3189697265625, -9.99560546875, -9.6722412109375, -9.348876953125, -9.0255126953125, -8.7021484375, -8.3787841796875, -8.055419921875, -7.7320556640625, -7.40869140625, -7.0853271484375, -6.761962890625, -6.4385986328125, -6.115234375, -5.7918701171875, -5.468505859375, -5.1451416015625, -4.82177734375, -4.4984130859375, -4.175048828125, -3.8516845703125, -3.5283203125, -3.2049560546875, -2.881591796875, -2.5582275390625, -2.23486328125, -1.9114990234375, -1.588134765625, -1.2647705078125, -0.94140625, -0.6180419921875, -0.294677734375, 0.0286865234375, 0.35205078125, 0.6754150390625, 0.998779296875, 1.3221435546875, 1.6455078125, 1.9688720703125, 2.292236328125, 2.6156005859375, 2.93896484375, 3.2623291015625, 3.585693359375, 3.9090576171875, 4.232421875, 4.5557861328125, 4.879150390625, 5.2025146484375, 5.52587890625, 5.8492431640625, 6.172607421875, 6.4959716796875, 6.8193359375, 7.1427001953125, 7.466064453125, 7.7894287109375, 8.11279296875, 8.4361572265625, 8.759521484375, 9.0828857421875, 9.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 9.0, 5.0, 14.0, 19.0, 30.0, 34.0, 55.0, 63.0, 98.0, 131.0, 209.0, 354.0, 569.0, 1210.0, 10126.0, 3127372.0, 2985.0, 980.0, 458.0, 301.0, 194.0, 121.0, 98.0, 59.0, 58.0, 32.0, 16.0, 27.0, 9.0, 11.0, 9.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.107421875, -47.43359375, -45.759765625, -44.0859375, -42.412109375, -40.73828125, -39.064453125, -37.390625, -35.716796875, -34.04296875, -32.369140625, -30.6953125, -29.021484375, -27.34765625, -25.673828125, -24.0, -22.326171875, -20.65234375, -18.978515625, -17.3046875, -15.630859375, -13.95703125, -12.283203125, -10.609375, -8.935546875, -7.26171875, -5.587890625, -3.9140625, -2.240234375, -0.56640625, 1.107421875, 2.78125, 4.455078125, 6.12890625, 7.802734375, 9.4765625, 11.150390625, 12.82421875, 14.498046875, 16.171875, 17.845703125, 19.51953125, 21.193359375, 22.8671875, 24.541015625, 26.21484375, 27.888671875, 29.5625, 31.236328125, 32.91015625, 34.583984375, 36.2578125, 37.931640625, 39.60546875, 41.279296875, 42.953125, 44.626953125, 46.30078125, 47.974609375, 49.6484375, 51.322265625, 52.99609375, 54.669921875, 56.34375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 18.0, 61.0, 138.0, 180.0, 224.0, 186.0, 109.0, 52.0, 17.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.63885498046875, -28.664894104003906, -27.690933227539062, -26.71697425842285, -25.743013381958008, -24.769052505493164, -23.795093536376953, -22.82113265991211, -21.847171783447266, -20.873210906982422, -19.899250030517578, -18.925291061401367, -17.951330184936523, -16.97736930847168, -16.00341033935547, -15.029449462890625, -14.055488586425781, -13.081527709960938, -12.10756778717041, -11.133607864379883, -10.159646987915039, -9.185686111450195, -8.211726188659668, -7.237765789031982, -6.263805389404297, -5.289844989776611, -4.315884590148926, -3.3419241905212402, -2.3679637908935547, -1.3940033912658691, -0.4200429916381836, 0.553917407989502, 1.5278778076171875, 2.501838207244873, 3.4757986068725586, 4.449759006500244, 5.42371940612793, 6.397679805755615, 7.371640205383301, 8.345600128173828, 9.319561004638672, 10.293521881103516, 11.267481803894043, 12.24144172668457, 13.215402603149414, 14.189363479614258, 15.163323402404785, 16.137283325195312, 17.111244201660156, 18.085205078125, 19.059165954589844, 20.033124923706055, 21.0070858001709, 21.981046676635742, 22.955005645751953, 23.928966522216797, 24.90292739868164, 25.876888275146484, 26.850849151611328, 27.82480812072754, 28.798768997192383, 29.772729873657227, 30.746688842773438, 31.72064971923828, 32.694610595703125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 10.0, 9.0, 14.0, 16.0, 26.0, 19.0, 24.0, 31.0, 24.0, 28.0, 27.0, 29.0, 37.0, 55.0, 44.0, 46.0, 51.0, 46.0, 50.0, 48.0, 30.0, 49.0, 26.0, 34.0, 31.0, 23.0, 19.0, 19.0, 26.0, 12.0, 15.0, 14.0, 12.0, 3.0, 8.0, 10.0, 5.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.97964096069336, -22.160324096679688, -21.341007232666016, -20.521690368652344, -19.702373504638672, -18.883056640625, -18.06374168395996, -17.24442481994629, -16.425107955932617, -15.605791091918945, -14.786474227905273, -13.967158317565918, -13.147841453552246, -12.328524589538574, -11.509208679199219, -10.689891815185547, -9.870574951171875, -9.051258087158203, -8.231941223144531, -7.412625312805176, -6.593308448791504, -5.773991584777832, -4.954675197601318, -4.135358810424805, -3.316041946411133, -2.49672532081604, -1.6774086952209473, -0.8580920696258545, -0.03877544403076172, 0.7805414199829102, 1.5998578071594238, 2.4191741943359375, 3.2384910583496094, 4.057807922363281, 4.877124309539795, 5.696440696716309, 6.5157575607299805, 7.335074424743652, 8.154390335083008, 8.97370719909668, 9.793024063110352, 10.612340927124023, 11.431657791137695, 12.25097370147705, 13.070290565490723, 13.889607429504395, 14.70892333984375, 15.528240203857422, 16.347557067871094, 17.166873931884766, 17.986190795898438, 18.80550765991211, 19.62482452392578, 20.444141387939453, 21.263456344604492, 22.082773208618164, 22.902090072631836, 23.721406936645508, 24.54072380065918, 25.36004066467285, 26.17935562133789, 26.998672485351562, 27.817989349365234, 28.637306213378906, 29.456623077392578]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 19.0, 11.0, 16.0, 26.0, 28.0, 30.0, 32.0, 40.0, 41.0, 37.0, 34.0, 54.0, 43.0, 41.0, 48.0, 44.0, 42.0, 29.0, 39.0, 31.0, 32.0, 38.0, 30.0, 22.0, 17.0, 24.0, 26.0, 12.0, 19.0, 12.0, 6.0, 14.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5714111328125, -4.424072265625, -4.2767333984375, -4.12939453125, -3.9820556640625, -3.834716796875, -3.6873779296875, -3.5400390625, -3.3927001953125, -3.245361328125, -3.0980224609375, -2.95068359375, -2.8033447265625, -2.656005859375, -2.5086669921875, -2.361328125, -2.2139892578125, -2.066650390625, -1.9193115234375, -1.77197265625, -1.6246337890625, -1.477294921875, -1.3299560546875, -1.1826171875, -1.0352783203125, -0.887939453125, -0.7406005859375, -0.59326171875, -0.4459228515625, -0.298583984375, -0.1512451171875, -0.00390625, 0.1434326171875, 0.290771484375, 0.4381103515625, 0.58544921875, 0.7327880859375, 0.880126953125, 1.0274658203125, 1.1748046875, 1.3221435546875, 1.469482421875, 1.6168212890625, 1.76416015625, 1.9114990234375, 2.058837890625, 2.2061767578125, 2.353515625, 2.5008544921875, 2.648193359375, 2.7955322265625, 2.94287109375, 3.0902099609375, 3.237548828125, 3.3848876953125, 3.5322265625, 3.6795654296875, 3.826904296875, 3.9742431640625, 4.12158203125, 4.2689208984375, 4.416259765625, 4.5635986328125, 4.7109375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 14.0, 13.0, 7.0, 17.0, 24.0, 21.0, 21.0, 44.0, 39.0, 45.0, 60.0, 77.0, 113.0, 155.0, 249.0, 479.0, 924.0, 2442.0, 7143.0, 28631.0, 184307.0, 1103989.0, 2109387.0, 638601.0, 92257.0, 16847.0, 4689.0, 1660.0, 765.0, 384.0, 217.0, 150.0, 113.0, 81.0, 68.0, 48.0, 51.0, 32.0, 23.0, 29.0, 11.0, 15.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.64453125, -7.4151611328125, -7.185791015625, -6.9564208984375, -6.72705078125, -6.4976806640625, -6.268310546875, -6.0389404296875, -5.8095703125, -5.5802001953125, -5.350830078125, -5.1214599609375, -4.89208984375, -4.6627197265625, -4.433349609375, -4.2039794921875, -3.974609375, -3.7452392578125, -3.515869140625, -3.2864990234375, -3.05712890625, -2.8277587890625, -2.598388671875, -2.3690185546875, -2.1396484375, -1.9102783203125, -1.680908203125, -1.4515380859375, -1.22216796875, -0.9927978515625, -0.763427734375, -0.5340576171875, -0.3046875, -0.0753173828125, 0.154052734375, 0.3834228515625, 0.61279296875, 0.8421630859375, 1.071533203125, 1.3009033203125, 1.5302734375, 1.7596435546875, 1.989013671875, 2.2183837890625, 2.44775390625, 2.6771240234375, 2.906494140625, 3.1358642578125, 3.365234375, 3.5946044921875, 3.823974609375, 4.0533447265625, 4.28271484375, 4.5120849609375, 4.741455078125, 4.9708251953125, 5.2001953125, 5.4295654296875, 5.658935546875, 5.8883056640625, 6.11767578125, 6.3470458984375, 6.576416015625, 6.8057861328125, 7.03515625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 13.0, 22.0, 33.0, 35.0, 43.0, 65.0, 78.0, 75.0, 94.0, 134.0, 174.0, 237.0, 321.0, 391.0, 468.0, 423.0, 352.0, 292.0, 186.0, 147.0, 88.0, 88.0, 57.0, 46.0, 47.0, 33.0, 26.0, 22.0, 14.0, 14.0, 6.0, 4.0, 6.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.696533203125, -5.48291015625, -5.269287109375, -5.0556640625, -4.842041015625, -4.62841796875, -4.414794921875, -4.201171875, -3.987548828125, -3.77392578125, -3.560302734375, -3.3466796875, -3.133056640625, -2.91943359375, -2.705810546875, -2.4921875, -2.278564453125, -2.06494140625, -1.851318359375, -1.6376953125, -1.424072265625, -1.21044921875, -0.996826171875, -0.783203125, -0.569580078125, -0.35595703125, -0.142333984375, 0.0712890625, 0.284912109375, 0.49853515625, 0.712158203125, 0.92578125, 1.139404296875, 1.35302734375, 1.566650390625, 1.7802734375, 1.993896484375, 2.20751953125, 2.421142578125, 2.634765625, 2.848388671875, 3.06201171875, 3.275634765625, 3.4892578125, 3.702880859375, 3.91650390625, 4.130126953125, 4.34375, 4.557373046875, 4.77099609375, 4.984619140625, 5.1982421875, 5.411865234375, 5.62548828125, 5.839111328125, 6.052734375, 6.266357421875, 6.47998046875, 6.693603515625, 6.9072265625, 7.120849609375, 7.33447265625, 7.548095703125, 7.76171875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 7.0, 14.0, 30.0, 37.0, 68.0, 99.0, 175.0, 243.0, 477.0, 900.0, 1992.0, 8836.0, 222658.0, 3645602.0, 297902.0, 10776.0, 2266.0, 959.0, 488.0, 302.0, 153.0, 104.0, 69.0, 43.0, 31.0, 14.0, 14.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.84375, -15.307373046875, -14.77099609375, -14.234619140625, -13.6982421875, -13.161865234375, -12.62548828125, -12.089111328125, -11.552734375, -11.016357421875, -10.47998046875, -9.943603515625, -9.4072265625, -8.870849609375, -8.33447265625, -7.798095703125, -7.26171875, -6.725341796875, -6.18896484375, -5.652587890625, -5.1162109375, -4.579833984375, -4.04345703125, -3.507080078125, -2.970703125, -2.434326171875, -1.89794921875, -1.361572265625, -0.8251953125, -0.288818359375, 0.24755859375, 0.783935546875, 1.3203125, 1.856689453125, 2.39306640625, 2.929443359375, 3.4658203125, 4.002197265625, 4.53857421875, 5.074951171875, 5.611328125, 6.147705078125, 6.68408203125, 7.220458984375, 7.7568359375, 8.293212890625, 8.82958984375, 9.365966796875, 9.90234375, 10.438720703125, 10.97509765625, 11.511474609375, 12.0478515625, 12.584228515625, 13.12060546875, 13.656982421875, 14.193359375, 14.729736328125, 15.26611328125, 15.802490234375, 16.3388671875, 16.875244140625, 17.41162109375, 17.947998046875, 18.484375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 26.0, 199.0, 446.0, 270.0, 64.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.316314697265625, -53.8779182434082, -50.43952178955078, -47.00112533569336, -43.56272888183594, -40.124332427978516, -36.685935974121094, -33.24753952026367, -29.80914306640625, -26.370746612548828, -22.932350158691406, -19.493953704833984, -16.055557250976562, -12.61716079711914, -9.178764343261719, -5.740367889404297, -2.301971435546875, 1.1364250183105469, 4.574821472167969, 8.01321792602539, 11.451614379882812, 14.890010833740234, 18.328407287597656, 21.766803741455078, 25.2052001953125, 28.643596649169922, 32.081993103027344, 35.520389556884766, 38.95878601074219, 42.39718246459961, 45.83557891845703, 49.27397537231445, 52.712371826171875, 56.1507682800293, 59.58916473388672, 63.02756118774414, 66.46595764160156, 69.90435791015625, 73.3427505493164, 76.78114318847656, 80.21954345703125, 83.65794372558594, 87.0963363647461, 90.53472900390625, 93.97312927246094, 97.41152954101562, 100.84992218017578, 104.28831481933594, 107.72671508789062, 111.16511535644531, 114.60350799560547, 118.04190063476562, 121.48030090332031, 124.918701171875, 128.35708618164062, 131.7954864501953, 135.23388671875, 138.6722869873047, 142.11068725585938, 145.549072265625, 148.9874725341797, 152.42587280273438, 155.8642578125, 159.3026580810547, 162.74105834960938]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 13.0, 10.0, 19.0, 17.0, 19.0, 25.0, 32.0, 31.0, 34.0, 28.0, 33.0, 31.0, 35.0, 41.0, 36.0, 60.0, 52.0, 45.0, 38.0, 30.0, 51.0, 33.0, 32.0, 27.0, 25.0, 25.0, 29.0, 26.0, 17.0, 16.0, 7.0, 9.0, 14.0, 5.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.326858520507812, -23.46636390686035, -22.605867385864258, -21.745372772216797, -20.884876251220703, -20.024381637573242, -19.16388702392578, -18.303390502929688, -17.442893981933594, -16.582399368286133, -15.721902847290039, -14.861408233642578, -14.000911712646484, -13.140417098999023, -12.279921531677246, -11.419425964355469, -10.558931350708008, -9.69843578338623, -8.837940216064453, -7.977445125579834, -7.116949558258057, -6.256453990936279, -5.39595890045166, -4.535463333129883, -3.6749677658081055, -2.814472198486328, -1.9539768695831299, -1.0934815406799316, -0.2329859733581543, 0.627509593963623, 1.4880046844482422, 2.3485002517700195, 3.208995819091797, 4.069491386413574, 4.929986953735352, 5.790482044219971, 6.650977611541748, 7.511473178863525, 8.371968269348145, 9.232463836669922, 10.0929594039917, 10.953454971313477, 11.813950538635254, 12.674446105957031, 13.534940719604492, 14.395437240600586, 15.255931854248047, 16.11642837524414, 16.9769229888916, 17.837417602539062, 18.697914123535156, 19.558408737182617, 20.41890525817871, 21.279399871826172, 22.139896392822266, 23.000391006469727, 23.860885620117188, 24.72138023376465, 25.581876754760742, 26.442371368408203, 27.302867889404297, 28.163362503051758, 29.02385711669922, 29.884353637695312, 30.744850158691406]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 8.0, 16.0, 17.0, 19.0, 22.0, 22.0, 28.0, 30.0, 38.0, 28.0, 40.0, 32.0, 44.0, 46.0, 43.0, 46.0, 43.0, 39.0, 41.0, 28.0, 33.0, 39.0, 32.0, 29.0, 34.0, 33.0, 28.0, 24.0, 16.0, 11.0, 8.0, 15.0, 9.0, 12.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.75, -3.642120361328125, -3.53424072265625, -3.426361083984375, -3.3184814453125, -3.210601806640625, -3.10272216796875, -2.994842529296875, -2.886962890625, -2.779083251953125, -2.67120361328125, -2.563323974609375, -2.4554443359375, -2.347564697265625, -2.23968505859375, -2.131805419921875, -2.02392578125, -1.916046142578125, -1.80816650390625, -1.700286865234375, -1.5924072265625, -1.484527587890625, -1.37664794921875, -1.268768310546875, -1.160888671875, -1.053009033203125, -0.94512939453125, -0.837249755859375, -0.7293701171875, -0.621490478515625, -0.51361083984375, -0.405731201171875, -0.2978515625, -0.189971923828125, -0.08209228515625, 0.025787353515625, 0.1336669921875, 0.241546630859375, 0.34942626953125, 0.457305908203125, 0.565185546875, 0.673065185546875, 0.78094482421875, 0.888824462890625, 0.9967041015625, 1.104583740234375, 1.21246337890625, 1.320343017578125, 1.42822265625, 1.536102294921875, 1.64398193359375, 1.751861572265625, 1.8597412109375, 1.967620849609375, 2.07550048828125, 2.183380126953125, 2.291259765625, 2.399139404296875, 2.50701904296875, 2.614898681640625, 2.7227783203125, 2.830657958984375, 2.93853759765625, 3.046417236328125, 3.154296875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 13.0, 17.0, 12.0, 27.0, 34.0, 54.0, 72.0, 97.0, 140.0, 200.0, 303.0, 390.0, 618.0, 846.0, 1261.0, 1798.0, 2649.0, 4028.0, 5927.0, 9059.0, 13681.0, 20999.0, 32979.0, 52282.0, 87002.0, 162845.0, 273763.0, 152757.0, 82898.0, 49863.0, 31667.0, 20475.0, 13361.0, 8658.0, 5738.0, 3786.0, 2630.0, 1734.0, 1176.0, 870.0, 586.0, 388.0, 251.0, 187.0, 128.0, 91.0, 63.0, 62.0, 40.0, 14.0, 19.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.53955078125, -0.5229263305664062, -0.5063018798828125, -0.48967742919921875, -0.473052978515625, -0.45642852783203125, -0.4398040771484375, -0.42317962646484375, -0.40655517578125, -0.38993072509765625, -0.3733062744140625, -0.35668182373046875, -0.340057373046875, -0.32343292236328125, -0.3068084716796875, -0.29018402099609375, -0.2735595703125, -0.25693511962890625, -0.2403106689453125, -0.22368621826171875, -0.207061767578125, -0.19043731689453125, -0.1738128662109375, -0.15718841552734375, -0.14056396484375, -0.12393951416015625, -0.1073150634765625, -0.09069061279296875, -0.074066162109375, -0.05744171142578125, -0.0408172607421875, -0.02419281005859375, -0.007568359375, 0.00905609130859375, 0.0256805419921875, 0.04230499267578125, 0.058929443359375, 0.07555389404296875, 0.0921783447265625, 0.10880279541015625, 0.12542724609375, 0.14205169677734375, 0.1586761474609375, 0.17530059814453125, 0.191925048828125, 0.20854949951171875, 0.2251739501953125, 0.24179840087890625, 0.2584228515625, 0.27504730224609375, 0.2916717529296875, 0.30829620361328125, 0.324920654296875, 0.34154510498046875, 0.3581695556640625, 0.37479400634765625, 0.39141845703125, 0.40804290771484375, 0.4246673583984375, 0.44129180908203125, 0.457916259765625, 0.47454071044921875, 0.4911651611328125, 0.5077896118164062, 0.5244140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 5.0, 10.0, 8.0, 10.0, 16.0, 16.0, 25.0, 13.0, 23.0, 31.0, 26.0, 26.0, 32.0, 35.0, 39.0, 26.0, 47.0, 35.0, 26.0, 1057.0, 37.0, 31.0, 39.0, 27.0, 41.0, 28.0, 28.0, 31.0, 32.0, 22.0, 18.0, 24.0, 21.0, 18.0, 9.0, 19.0, 14.0, 8.0, 12.0, 6.0, 6.0, 6.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.8974609375, -1.8379364013671875, -1.778411865234375, -1.7188873291015625, -1.65936279296875, -1.5998382568359375, -1.540313720703125, -1.4807891845703125, -1.4212646484375, -1.3617401123046875, -1.302215576171875, -1.2426910400390625, -1.18316650390625, -1.1236419677734375, -1.064117431640625, -1.0045928955078125, -0.945068359375, -0.8855438232421875, -0.826019287109375, -0.7664947509765625, -0.70697021484375, -0.6474456787109375, -0.587921142578125, -0.5283966064453125, -0.4688720703125, -0.4093475341796875, -0.349822998046875, -0.2902984619140625, -0.23077392578125, -0.1712493896484375, -0.111724853515625, -0.0522003173828125, 0.00732421875, 0.0668487548828125, 0.126373291015625, 0.1858978271484375, 0.24542236328125, 0.3049468994140625, 0.364471435546875, 0.4239959716796875, 0.4835205078125, 0.5430450439453125, 0.602569580078125, 0.6620941162109375, 0.72161865234375, 0.7811431884765625, 0.840667724609375, 0.9001922607421875, 0.959716796875, 1.0192413330078125, 1.078765869140625, 1.1382904052734375, 1.19781494140625, 1.2573394775390625, 1.316864013671875, 1.3763885498046875, 1.4359130859375, 1.4954376220703125, 1.554962158203125, 1.6144866943359375, 1.67401123046875, 1.7335357666015625, 1.793060302734375, 1.8525848388671875, 1.912109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 9.0, 10.0, 10.0, 28.0, 32.0, 56.0, 61.0, 98.0, 129.0, 165.0, 220.0, 311.0, 451.0, 597.0, 867.0, 1146.0, 1628.0, 2249.0, 3137.0, 4200.0, 5771.0, 7903.0, 10796.0, 14930.0, 21391.0, 30365.0, 44537.0, 68000.0, 111024.0, 1249338.0, 194253.0, 108419.0, 66211.0, 43511.0, 30001.0, 20944.0, 14915.0, 10754.0, 7745.0, 5613.0, 4149.0, 3028.0, 2179.0, 1611.0, 1139.0, 887.0, 688.0, 469.0, 365.0, 239.0, 182.0, 112.0, 79.0, 64.0, 37.0, 37.0, 18.0, 15.0, 7.0, 5.0, 2.0, 6.0], "bins": [-0.4130859375, -0.4001655578613281, -0.38724517822265625, -0.3743247985839844, -0.3614044189453125, -0.3484840393066406, -0.33556365966796875, -0.3226432800292969, -0.309722900390625, -0.2968025207519531, -0.28388214111328125, -0.2709617614746094, -0.2580413818359375, -0.24512100219726562, -0.23220062255859375, -0.21928024291992188, -0.20635986328125, -0.19343948364257812, -0.18051910400390625, -0.16759872436523438, -0.1546783447265625, -0.14175796508789062, -0.12883758544921875, -0.11591720581054688, -0.102996826171875, -0.09007644653320312, -0.07715606689453125, -0.06423568725585938, -0.0513153076171875, -0.038394927978515625, -0.02547454833984375, -0.012554168701171875, 0.0003662109375, 0.013286590576171875, 0.02620697021484375, 0.039127349853515625, 0.0520477294921875, 0.06496810913085938, 0.07788848876953125, 0.09080886840820312, 0.103729248046875, 0.11664962768554688, 0.12957000732421875, 0.14249038696289062, 0.1554107666015625, 0.16833114624023438, 0.18125152587890625, 0.19417190551757812, 0.20709228515625, 0.22001266479492188, 0.23293304443359375, 0.24585342407226562, 0.2587738037109375, 0.2716941833496094, 0.28461456298828125, 0.2975349426269531, 0.310455322265625, 0.3233757019042969, 0.33629608154296875, 0.3492164611816406, 0.3621368408203125, 0.3750572204589844, 0.38797760009765625, 0.4008979797363281, 0.413818359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 3.0, 8.0, 12.0, 9.0, 18.0, 29.0, 26.0, 25.0, 29.0, 39.0, 38.0, 46.0, 58.0, 64.0, 54.0, 61.0, 70.0, 38.0, 54.0, 42.0, 39.0, 40.0, 35.0, 37.0, 24.0, 13.0, 20.0, 14.0, 17.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28640365600586e-05, -8.961278945207596e-05, -8.636154234409332e-05, -8.311029523611069e-05, -7.985904812812805e-05, -7.660780102014542e-05, -7.335655391216278e-05, -7.010530680418015e-05, -6.685405969619751e-05, -6.360281258821487e-05, -6.035156548023224e-05, -5.71003183722496e-05, -5.384907126426697e-05, -5.059782415628433e-05, -4.73465770483017e-05, -4.409532994031906e-05, -4.0844082832336426e-05, -3.759283572435379e-05, -3.4341588616371155e-05, -3.109034150838852e-05, -2.7839094400405884e-05, -2.4587847292423248e-05, -2.1336600184440613e-05, -1.8085353076457977e-05, -1.4834105968475342e-05, -1.1582858860492706e-05, -8.33161175251007e-06, -5.080364644527435e-06, -1.8291175365447998e-06, 1.4221295714378357e-06, 4.673376679420471e-06, 7.924623787403107e-06, 1.1175870895385742e-05, 1.4427118003368378e-05, 1.7678365111351013e-05, 2.092961221933365e-05, 2.4180859327316284e-05, 2.743210643529892e-05, 3.0683353543281555e-05, 3.393460065126419e-05, 3.7185847759246826e-05, 4.043709486722946e-05, 4.36883419752121e-05, 4.693958908319473e-05, 5.019083619117737e-05, 5.3442083299160004e-05, 5.669333040714264e-05, 5.9944577515125275e-05, 6.319582462310791e-05, 6.644707173109055e-05, 6.969831883907318e-05, 7.294956594705582e-05, 7.620081305503845e-05, 7.945206016302109e-05, 8.270330727100372e-05, 8.595455437898636e-05, 8.9205801486969e-05, 9.245704859495163e-05, 9.570829570293427e-05, 9.89595428109169e-05, 0.00010221078991889954, 0.00010546203702688217, 0.00010871328413486481, 0.00011196453124284744, 0.00011521577835083008]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 6.0, 6.0, 5.0, 7.0, 16.0, 11.0, 19.0, 28.0, 26.0, 44.0, 52.0, 65.0, 101.0, 135.0, 179.0, 273.0, 409.0, 677.0, 1531.0, 184699.0, 854589.0, 3281.0, 839.0, 486.0, 311.0, 205.0, 127.0, 117.0, 80.0, 65.0, 41.0, 31.0, 24.0, 15.0, 12.0, 9.0, 7.0, 12.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0023288726806640625, -0.0022678375244140625, -0.0022068023681640625, -0.0021457672119140625, -0.0020847320556640625, -0.0020236968994140625, -0.0019626617431640625, -0.0019016265869140625, -0.0018405914306640625, -0.0017795562744140625, -0.0017185211181640625, -0.0016574859619140625, -0.0015964508056640625, -0.0015354156494140625, -0.0014743804931640625, -0.0014133453369140625, -0.0013523101806640625, -0.0012912750244140625, -0.0012302398681640625, -0.0011692047119140625, -0.0011081695556640625, -0.0010471343994140625, -0.0009860992431640625, -0.0009250640869140625, -0.0008640289306640625, -0.0008029937744140625, -0.0007419586181640625, -0.0006809234619140625, -0.0006198883056640625, -0.0005588531494140625, -0.0004978179931640625, -0.0004367828369140625, -0.0003757476806640625, -0.0003147125244140625, -0.0002536773681640625, -0.0001926422119140625, -0.0001316070556640625, -7.05718994140625e-05, -9.5367431640625e-06, 5.14984130859375e-05, 0.0001125335693359375, 0.0001735687255859375, 0.0002346038818359375, 0.0002956390380859375, 0.0003566741943359375, 0.0004177093505859375, 0.0004787445068359375, 0.0005397796630859375, 0.0006008148193359375, 0.0006618499755859375, 0.0007228851318359375, 0.0007839202880859375, 0.0008449554443359375, 0.0009059906005859375, 0.0009670257568359375, 0.0010280609130859375, 0.0010890960693359375, 0.0011501312255859375, 0.0012111663818359375, 0.0012722015380859375, 0.0013332366943359375, 0.0013942718505859375, 0.0014553070068359375, 0.0015163421630859375, 0.0015773773193359375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 26.0, 76.0, 176.0, 256.0, 246.0, 140.0, 58.0, 16.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.349190516630188e-05, -5.8578654716257006e-05, -5.3665404266212136e-05, -4.875215017818846e-05, -4.383889972814359e-05, -3.892564927809872e-05, -3.401239519007504e-05, -2.909914474003017e-05, -2.41858942899853e-05, -1.927264383994043e-05, -1.4359391570906155e-05, -9.446140211366583e-06, -4.5328888518270105e-06, 3.8036159821785986e-07, 5.293613867252134e-06, 1.0206866136286408e-05, 1.5120116586331278e-05, 2.003336703637615e-05, 2.4946619305410422e-05, 2.9859871574444696e-05, 3.477312202448957e-05, 3.968637247453444e-05, 4.4599626562558115e-05, 4.9512877012602985e-05, 5.4426127462647855e-05, 5.9339377912692726e-05, 6.42526283627376e-05, 6.916587881278247e-05, 7.407912926282734e-05, 7.899237971287221e-05, 8.390563743887469e-05, 8.881888788891956e-05, 9.373214561492205e-05, 9.864539606496692e-05, 0.00010355864651501179, 0.00010847189696505666, 0.00011338514741510153, 0.0001182983978651464, 0.00012321164831519127, 0.00012812489876523614, 0.000133038149215281, 0.00013795139966532588, 0.00014286465011537075, 0.00014777790056541562, 0.0001526911510154605, 0.00015760440146550536, 0.00016251765191555023, 0.0001674309023655951, 0.0001723441673675552, 0.00017725741781760007, 0.00018217066826764494, 0.0001870839187176898, 0.00019199716916773468, 0.00019691041961777955, 0.00020182367006782442, 0.00020673693506978452, 0.0002116501855198294, 0.00021656343596987426, 0.00022147668641991913, 0.000226389936869964, 0.00023130318732000887, 0.00023621643777005374, 0.00024112968822009861, 0.0002460429386701435, 0.00025095618912018836]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 2.0, 11.0, 12.0, 14.0, 21.0, 17.0, 18.0, 29.0, 31.0, 19.0, 37.0, 37.0, 32.0, 43.0, 39.0, 50.0, 46.0, 48.0, 42.0, 38.0, 47.0, 40.0, 38.0, 30.0, 34.0, 36.0, 27.0, 26.0, 19.0, 26.0, 12.0, 9.0, 17.0, 11.0, 8.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.0558319091796875e-05, -5.88512048125267e-05, -5.714409053325653e-05, -5.543697625398636e-05, -5.3729861974716187e-05, -5.2022747695446014e-05, -5.031563341617584e-05, -4.860851913690567e-05, -4.69014048576355e-05, -4.5194290578365326e-05, -4.3487176299095154e-05, -4.178006201982498e-05, -4.007294774055481e-05, -3.836583346128464e-05, -3.6658719182014465e-05, -3.495160490274429e-05, -3.324449062347412e-05, -3.153737634420395e-05, -2.9830262064933777e-05, -2.8123147785663605e-05, -2.6416033506393433e-05, -2.470891922712326e-05, -2.300180494785309e-05, -2.1294690668582916e-05, -1.9587576389312744e-05, -1.7880462110042572e-05, -1.61733478307724e-05, -1.4466233551502228e-05, -1.2759119272232056e-05, -1.1052004992961884e-05, -9.344890713691711e-06, -7.63777643442154e-06, -5.930662155151367e-06, -4.223547875881195e-06, -2.516433596611023e-06, -8.093193173408508e-07, 8.977949619293213e-07, 2.6049092411994934e-06, 4.3120235204696655e-06, 6.019137799739838e-06, 7.72625207901001e-06, 9.433366358280182e-06, 1.1140480637550354e-05, 1.2847594916820526e-05, 1.4554709196090698e-05, 1.626182347536087e-05, 1.7968937754631042e-05, 1.9676052033901215e-05, 2.1383166313171387e-05, 2.309028059244156e-05, 2.479739487171173e-05, 2.6504509150981903e-05, 2.8211623430252075e-05, 2.9918737709522247e-05, 3.162585198879242e-05, 3.333296626806259e-05, 3.5040080547332764e-05, 3.6747194826602936e-05, 3.845430910587311e-05, 4.016142338514328e-05, 4.186853766441345e-05, 4.3575651943683624e-05, 4.5282766222953796e-05, 4.698988050222397e-05, 4.869699478149414e-05]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 8.0, 16.0, 17.0, 19.0, 22.0, 22.0, 28.0, 30.0, 38.0, 28.0, 40.0, 32.0, 44.0, 46.0, 43.0, 46.0, 43.0, 39.0, 41.0, 28.0, 33.0, 39.0, 32.0, 29.0, 34.0, 33.0, 28.0, 24.0, 16.0, 11.0, 8.0, 15.0, 9.0, 12.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.75, -3.642120361328125, -3.53424072265625, -3.426361083984375, -3.3184814453125, -3.210601806640625, -3.10272216796875, -2.994842529296875, -2.886962890625, -2.779083251953125, -2.67120361328125, -2.563323974609375, -2.4554443359375, -2.347564697265625, -2.23968505859375, -2.131805419921875, -2.02392578125, -1.916046142578125, -1.80816650390625, -1.700286865234375, -1.5924072265625, -1.484527587890625, -1.37664794921875, -1.268768310546875, -1.160888671875, -1.053009033203125, -0.94512939453125, -0.837249755859375, -0.7293701171875, -0.621490478515625, -0.51361083984375, -0.405731201171875, -0.2978515625, -0.189971923828125, -0.08209228515625, 0.025787353515625, 0.1336669921875, 0.241546630859375, 0.34942626953125, 0.457305908203125, 0.565185546875, 0.673065185546875, 0.78094482421875, 0.888824462890625, 0.9967041015625, 1.104583740234375, 1.21246337890625, 1.320343017578125, 1.42822265625, 1.536102294921875, 1.64398193359375, 1.751861572265625, 1.8597412109375, 1.967620849609375, 2.07550048828125, 2.183380126953125, 2.291259765625, 2.399139404296875, 2.50701904296875, 2.614898681640625, 2.7227783203125, 2.830657958984375, 2.93853759765625, 3.046417236328125, 3.154296875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 5.0, 9.0, 9.0, 14.0, 19.0, 33.0, 34.0, 62.0, 77.0, 82.0, 128.0, 163.0, 227.0, 302.0, 364.0, 536.0, 718.0, 1019.0, 1341.0, 1891.0, 2771.0, 4779.0, 15921.0, 155685.0, 698751.0, 135045.0, 14263.0, 4526.0, 2775.0, 1932.0, 1316.0, 984.0, 734.0, 530.0, 385.0, 265.0, 238.0, 156.0, 111.0, 85.0, 65.0, 53.0, 43.0, 26.0, 20.0, 19.0, 17.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3282470703125, -8.054931640625, -7.7816162109375, -7.50830078125, -7.2349853515625, -6.961669921875, -6.6883544921875, -6.4150390625, -6.1417236328125, -5.868408203125, -5.5950927734375, -5.32177734375, -5.0484619140625, -4.775146484375, -4.5018310546875, -4.228515625, -3.9552001953125, -3.681884765625, -3.4085693359375, -3.13525390625, -2.8619384765625, -2.588623046875, -2.3153076171875, -2.0419921875, -1.7686767578125, -1.495361328125, -1.2220458984375, -0.94873046875, -0.6754150390625, -0.402099609375, -0.1287841796875, 0.14453125, 0.4178466796875, 0.691162109375, 0.9644775390625, 1.23779296875, 1.5111083984375, 1.784423828125, 2.0577392578125, 2.3310546875, 2.6043701171875, 2.877685546875, 3.1510009765625, 3.42431640625, 3.6976318359375, 3.970947265625, 4.2442626953125, 4.517578125, 4.7908935546875, 5.064208984375, 5.3375244140625, 5.61083984375, 5.8841552734375, 6.157470703125, 6.4307861328125, 6.7041015625, 6.9774169921875, 7.250732421875, 7.5240478515625, 7.79736328125, 8.0706787109375, 8.343994140625, 8.6173095703125, 8.890625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 7.0, 9.0, 12.0, 19.0, 15.0, 16.0, 17.0, 32.0, 28.0, 37.0, 56.0, 61.0, 78.0, 119.0, 370.0, 1576.0, 153.0, 85.0, 52.0, 53.0, 41.0, 40.0, 34.0, 29.0, 25.0, 16.0, 11.0, 10.0, 16.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.510498046875, -10.16162109375, -9.812744140625, -9.4638671875, -9.114990234375, -8.76611328125, -8.417236328125, -8.068359375, -7.719482421875, -7.37060546875, -7.021728515625, -6.6728515625, -6.323974609375, -5.97509765625, -5.626220703125, -5.27734375, -4.928466796875, -4.57958984375, -4.230712890625, -3.8818359375, -3.532958984375, -3.18408203125, -2.835205078125, -2.486328125, -2.137451171875, -1.78857421875, -1.439697265625, -1.0908203125, -0.741943359375, -0.39306640625, -0.044189453125, 0.3046875, 0.653564453125, 1.00244140625, 1.351318359375, 1.7001953125, 2.049072265625, 2.39794921875, 2.746826171875, 3.095703125, 3.444580078125, 3.79345703125, 4.142333984375, 4.4912109375, 4.840087890625, 5.18896484375, 5.537841796875, 5.88671875, 6.235595703125, 6.58447265625, 6.933349609375, 7.2822265625, 7.631103515625, 7.97998046875, 8.328857421875, 8.677734375, 9.026611328125, 9.37548828125, 9.724365234375, 10.0732421875, 10.422119140625, 10.77099609375, 11.119873046875, 11.46875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 19.0, 42.0, 33.0, 33.0, 48.0, 72.0, 92.0, 178.0, 222.0, 432.0, 799.0, 2312.0, 249036.0, 2887497.0, 2622.0, 971.0, 425.0, 259.0, 173.0, 100.0, 81.0, 66.0, 47.0, 24.0, 17.0, 16.0, 22.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.07568359375, -37.7763671875, -36.47705078125, -35.177734375, -33.87841796875, -32.5791015625, -31.27978515625, -29.98046875, -28.68115234375, -27.3818359375, -26.08251953125, -24.783203125, -23.48388671875, -22.1845703125, -20.88525390625, -19.5859375, -18.28662109375, -16.9873046875, -15.68798828125, -14.388671875, -13.08935546875, -11.7900390625, -10.49072265625, -9.19140625, -7.89208984375, -6.5927734375, -5.29345703125, -3.994140625, -2.69482421875, -1.3955078125, -0.09619140625, 1.203125, 2.50244140625, 3.8017578125, 5.10107421875, 6.400390625, 7.69970703125, 8.9990234375, 10.29833984375, 11.59765625, 12.89697265625, 14.1962890625, 15.49560546875, 16.794921875, 18.09423828125, 19.3935546875, 20.69287109375, 21.9921875, 23.29150390625, 24.5908203125, 25.89013671875, 27.189453125, 28.48876953125, 29.7880859375, 31.08740234375, 32.38671875, 33.68603515625, 34.9853515625, 36.28466796875, 37.583984375, 38.88330078125, 40.1826171875, 41.48193359375, 42.78125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 24.0, 45.0, 97.0, 208.0, 263.0, 231.0, 86.0, 37.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.93561553955078, -46.724857330322266, -45.514095306396484, -44.30333709716797, -43.09257888793945, -41.88181686401367, -40.671058654785156, -39.460296630859375, -38.24953842163086, -37.038780212402344, -35.82801818847656, -34.61725997924805, -33.40650177001953, -32.19573974609375, -30.984981536865234, -29.774221420288086, -28.56346321105957, -27.352703094482422, -26.141944885253906, -24.931184768676758, -23.72042465209961, -22.509666442871094, -21.298906326293945, -20.088146209716797, -18.87738800048828, -17.666627883911133, -16.455869674682617, -15.245109558105469, -14.03434944152832, -12.823590278625488, -11.612831115722656, -10.402070999145508, -9.19131088256836, -7.980551242828369, -6.769791603088379, -5.559032440185547, -4.348272800445557, -3.1375131607055664, -1.9267539978027344, -0.7159938812255859, 0.4947652816772461, 1.7055248022079468, 2.9162843227386475, 4.127043724060059, 5.337803363800049, 6.548563003540039, 7.759322166442871, 8.97008228302002, 10.180841445922852, 11.391600608825684, 12.602360725402832, 13.813119888305664, 15.023880004882812, 16.234638214111328, 17.445398330688477, 18.656158447265625, 19.86691665649414, 21.07767677307129, 22.288434982299805, 23.499195098876953, 24.7099552154541, 25.92071533203125, 27.131473541259766, 28.342233657836914, 29.552993774414062]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 16.0, 10.0, 11.0, 9.0, 12.0, 12.0, 11.0, 22.0, 16.0, 16.0, 33.0, 28.0, 30.0, 27.0, 27.0, 34.0, 31.0, 41.0, 29.0, 40.0, 40.0, 37.0, 39.0, 29.0, 25.0, 34.0, 25.0, 29.0, 30.0, 36.0, 31.0, 27.0, 30.0, 19.0, 20.0, 8.0, 20.0, 10.0, 11.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.995271682739258, -18.326915740966797, -17.658557891845703, -16.990201950073242, -16.32184600830078, -15.65349006652832, -14.985133171081543, -14.316776275634766, -13.648420333862305, -12.980064392089844, -12.311707496643066, -11.643350601196289, -10.974994659423828, -10.306638717651367, -9.63828182220459, -8.969924926757812, -8.301568984985352, -7.633212566375732, -6.964856147766113, -6.296499729156494, -5.628143310546875, -4.959786891937256, -4.291430473327637, -3.6230740547180176, -2.9547176361083984, -2.2863612174987793, -1.6180047988891602, -0.949648380279541, -0.2812919616699219, 0.38706445693969727, 1.0554208755493164, 1.7237772941589355, 2.392131805419922, 3.060488224029541, 3.72884464263916, 4.397201061248779, 5.065557479858398, 5.733913898468018, 6.402270317077637, 7.070626735687256, 7.738983154296875, 8.407339096069336, 9.075695991516113, 9.74405288696289, 10.412408828735352, 11.080764770507812, 11.74912166595459, 12.417478561401367, 13.085834503173828, 13.754190444946289, 14.422547340393066, 15.090904235839844, 15.759260177612305, 16.427616119384766, 17.09597396850586, 17.76432991027832, 18.43268585205078, 19.101041793823242, 19.769397735595703, 20.437755584716797, 21.106111526489258, 21.77446746826172, 22.442825317382812, 23.111181259155273, 23.779537200927734]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 8.0, 6.0, 5.0, 5.0, 6.0, 12.0, 17.0, 18.0, 16.0, 24.0, 18.0, 26.0, 31.0, 23.0, 38.0, 26.0, 37.0, 43.0, 29.0, 41.0, 30.0, 42.0, 42.0, 48.0, 38.0, 32.0, 32.0, 36.0, 38.0, 35.0, 19.0, 23.0, 26.0, 26.0, 19.0, 13.0, 12.0, 17.0, 13.0, 4.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.40234375, -3.29425048828125, -3.1861572265625, -3.07806396484375, -2.969970703125, -2.86187744140625, -2.7537841796875, -2.64569091796875, -2.53759765625, -2.42950439453125, -2.3214111328125, -2.21331787109375, -2.105224609375, -1.99713134765625, -1.8890380859375, -1.78094482421875, -1.6728515625, -1.56475830078125, -1.4566650390625, -1.34857177734375, -1.240478515625, -1.13238525390625, -1.0242919921875, -0.91619873046875, -0.80810546875, -0.70001220703125, -0.5919189453125, -0.48382568359375, -0.375732421875, -0.26763916015625, -0.1595458984375, -0.05145263671875, 0.056640625, 0.16473388671875, 0.2728271484375, 0.38092041015625, 0.489013671875, 0.59710693359375, 0.7052001953125, 0.81329345703125, 0.92138671875, 1.02947998046875, 1.1375732421875, 1.24566650390625, 1.353759765625, 1.46185302734375, 1.5699462890625, 1.67803955078125, 1.7861328125, 1.89422607421875, 2.0023193359375, 2.11041259765625, 2.218505859375, 2.32659912109375, 2.4346923828125, 2.54278564453125, 2.65087890625, 2.75897216796875, 2.8670654296875, 2.97515869140625, 3.083251953125, 3.19134521484375, 3.2994384765625, 3.40753173828125, 3.515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 10.0, 11.0, 18.0, 13.0, 15.0, 20.0, 29.0, 32.0, 36.0, 44.0, 57.0, 74.0, 92.0, 156.0, 370.0, 1081.0, 3979.0, 26213.0, 529249.0, 3153552.0, 450069.0, 23380.0, 3776.0, 1027.0, 340.0, 148.0, 94.0, 82.0, 65.0, 50.0, 29.0, 28.0, 30.0, 31.0, 16.0, 8.0, 15.0, 7.0, 10.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.5390625, -10.2042236328125, -9.869384765625, -9.5345458984375, -9.19970703125, -8.8648681640625, -8.530029296875, -8.1951904296875, -7.8603515625, -7.5255126953125, -7.190673828125, -6.8558349609375, -6.52099609375, -6.1861572265625, -5.851318359375, -5.5164794921875, -5.181640625, -4.8468017578125, -4.511962890625, -4.1771240234375, -3.84228515625, -3.5074462890625, -3.172607421875, -2.8377685546875, -2.5029296875, -2.1680908203125, -1.833251953125, -1.4984130859375, -1.16357421875, -0.8287353515625, -0.493896484375, -0.1590576171875, 0.17578125, 0.5106201171875, 0.845458984375, 1.1802978515625, 1.51513671875, 1.8499755859375, 2.184814453125, 2.5196533203125, 2.8544921875, 3.1893310546875, 3.524169921875, 3.8590087890625, 4.19384765625, 4.5286865234375, 4.863525390625, 5.1983642578125, 5.533203125, 5.8680419921875, 6.202880859375, 6.5377197265625, 6.87255859375, 7.2073974609375, 7.542236328125, 7.8770751953125, 8.2119140625, 8.5467529296875, 8.881591796875, 9.2164306640625, 9.55126953125, 9.8861083984375, 10.220947265625, 10.5557861328125, 10.890625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 10.0, 19.0, 33.0, 148.0, 409.0, 1057.0, 1474.0, 622.0, 193.0, 83.0, 27.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.322509765625, -21.62939453125, -20.936279296875, -20.2431640625, -19.550048828125, -18.85693359375, -18.163818359375, -17.470703125, -16.777587890625, -16.08447265625, -15.391357421875, -14.6982421875, -14.005126953125, -13.31201171875, -12.618896484375, -11.92578125, -11.232666015625, -10.53955078125, -9.846435546875, -9.1533203125, -8.460205078125, -7.76708984375, -7.073974609375, -6.380859375, -5.687744140625, -4.99462890625, -4.301513671875, -3.6083984375, -2.915283203125, -2.22216796875, -1.529052734375, -0.8359375, -0.142822265625, 0.55029296875, 1.243408203125, 1.9365234375, 2.629638671875, 3.32275390625, 4.015869140625, 4.708984375, 5.402099609375, 6.09521484375, 6.788330078125, 7.4814453125, 8.174560546875, 8.86767578125, 9.560791015625, 10.25390625, 10.947021484375, 11.64013671875, 12.333251953125, 13.0263671875, 13.719482421875, 14.41259765625, 15.105712890625, 15.798828125, 16.491943359375, 17.18505859375, 17.878173828125, 18.5712890625, 19.264404296875, 19.95751953125, 20.650634765625, 21.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 25.0, 103.0, 313.0, 1417.0, 24152.0, 4161408.0, 5648.0, 842.0, 225.0, 61.0, 22.0, 15.0, 6.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.1875, -43.74560546875, -42.3037109375, -40.86181640625, -39.419921875, -37.97802734375, -36.5361328125, -35.09423828125, -33.65234375, -32.21044921875, -30.7685546875, -29.32666015625, -27.884765625, -26.44287109375, -25.0009765625, -23.55908203125, -22.1171875, -20.67529296875, -19.2333984375, -17.79150390625, -16.349609375, -14.90771484375, -13.4658203125, -12.02392578125, -10.58203125, -9.14013671875, -7.6982421875, -6.25634765625, -4.814453125, -3.37255859375, -1.9306640625, -0.48876953125, 0.953125, 2.39501953125, 3.8369140625, 5.27880859375, 6.720703125, 8.16259765625, 9.6044921875, 11.04638671875, 12.48828125, 13.93017578125, 15.3720703125, 16.81396484375, 18.255859375, 19.69775390625, 21.1396484375, 22.58154296875, 24.0234375, 25.46533203125, 26.9072265625, 28.34912109375, 29.791015625, 31.23291015625, 32.6748046875, 34.11669921875, 35.55859375, 37.00048828125, 38.4423828125, 39.88427734375, 41.326171875, 42.76806640625, 44.2099609375, 45.65185546875, 47.09375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 25.0, 98.0, 249.0, 301.0, 227.0, 90.0, 11.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.73889923095703, -73.76427459716797, -71.78964233398438, -69.81501770019531, -67.84038543701172, -65.86576080322266, -63.89113235473633, -61.91650390625, -59.94187545776367, -57.967247009277344, -55.992618560791016, -54.01799011230469, -52.043365478515625, -50.06873321533203, -48.09410858154297, -46.11948013305664, -44.14485168457031, -42.170223236083984, -40.195594787597656, -38.22096633911133, -36.246337890625, -34.27171325683594, -32.29708480834961, -30.32245635986328, -28.347827911376953, -26.373199462890625, -24.398571014404297, -22.4239444732666, -20.449316024780273, -18.474687576293945, -16.50006103515625, -14.525432586669922, -12.550804138183594, -10.576175689697266, -8.601548194885254, -6.626920223236084, -4.652292251586914, -2.677663803100586, -0.7030363082885742, 1.2715911865234375, 3.2462196350097656, 5.2208476066589355, 7.1954755783081055, 9.170103073120117, 11.144731521606445, 13.119359970092773, 15.093987464904785, 17.068614959716797, 19.043243408203125, 21.017871856689453, 22.99250030517578, 24.967126846313477, 26.941755294799805, 28.916383743286133, 30.891010284423828, 32.865638732910156, 34.840267181396484, 36.81489562988281, 38.78952407836914, 40.76415252685547, 42.73877716064453, 44.713409423828125, 46.68803405761719, 48.662662506103516, 50.637290954589844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 8.0, 7.0, 13.0, 11.0, 15.0, 20.0, 22.0, 18.0, 23.0, 26.0, 29.0, 31.0, 39.0, 32.0, 44.0, 40.0, 34.0, 38.0, 45.0, 39.0, 40.0, 36.0, 34.0, 30.0, 50.0, 26.0, 24.0, 23.0, 31.0, 24.0, 20.0, 22.0, 14.0, 11.0, 8.0, 13.0, 10.0, 8.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.18072509765625, -21.426908493041992, -20.6730899810791, -19.919273376464844, -19.165454864501953, -18.411638259887695, -17.657821655273438, -16.904003143310547, -16.15018653869629, -15.396368980407715, -14.64255142211914, -13.888734817504883, -13.134917259216309, -12.381099700927734, -11.62728214263916, -10.873464584350586, -10.119647026062012, -9.365829467773438, -8.612011909484863, -7.858194828033447, -7.104377746582031, -6.350560188293457, -5.596742630004883, -4.842925548553467, -4.089107990264893, -3.3352906703948975, -2.5814733505249023, -1.8276557922363281, -1.073838472366333, -0.3200211524963379, 0.43379640579223633, 1.1876134872436523, 1.9414310455322266, 2.6952483654022217, 3.449065685272217, 4.202883243560791, 4.956700325012207, 5.710517883300781, 6.4643354415893555, 7.2181525230407715, 7.971970081329346, 8.725787162780762, 9.479604721069336, 10.23342227935791, 10.987239837646484, 11.741056442260742, 12.494874954223633, 13.24869155883789, 14.002509117126465, 14.756326675415039, 15.510144233703613, 16.263961791992188, 17.017778396606445, 17.771595001220703, 18.525413513183594, 19.27923011779785, 20.033048629760742, 20.786865234375, 21.54068374633789, 22.29450035095215, 23.04831886291504, 23.802135467529297, 24.555953979492188, 25.309770584106445, 26.063587188720703]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 5.0, 13.0, 16.0, 13.0, 15.0, 14.0, 28.0, 24.0, 29.0, 28.0, 28.0, 31.0, 41.0, 33.0, 39.0, 46.0, 42.0, 39.0, 52.0, 40.0, 39.0, 36.0, 37.0, 40.0, 45.0, 32.0, 19.0, 18.0, 23.0, 25.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62640380859375, -2.5379638671875, -2.44952392578125, -2.361083984375, -2.27264404296875, -2.1842041015625, -2.09576416015625, -2.00732421875, -1.91888427734375, -1.8304443359375, -1.74200439453125, -1.653564453125, -1.56512451171875, -1.4766845703125, -1.38824462890625, -1.2998046875, -1.21136474609375, -1.1229248046875, -1.03448486328125, -0.946044921875, -0.85760498046875, -0.7691650390625, -0.68072509765625, -0.59228515625, -0.50384521484375, -0.4154052734375, -0.32696533203125, -0.238525390625, -0.15008544921875, -0.0616455078125, 0.02679443359375, 0.115234375, 0.20367431640625, 0.2921142578125, 0.38055419921875, 0.468994140625, 0.55743408203125, 0.6458740234375, 0.73431396484375, 0.82275390625, 0.91119384765625, 0.9996337890625, 1.08807373046875, 1.176513671875, 1.26495361328125, 1.3533935546875, 1.44183349609375, 1.5302734375, 1.61871337890625, 1.7071533203125, 1.79559326171875, 1.884033203125, 1.97247314453125, 2.0609130859375, 2.14935302734375, 2.23779296875, 2.32623291015625, 2.4146728515625, 2.50311279296875, 2.591552734375, 2.67999267578125, 2.7684326171875, 2.85687255859375, 2.9453125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 8.0, 14.0, 19.0, 34.0, 50.0, 85.0, 113.0, 142.0, 244.0, 349.0, 481.0, 759.0, 1043.0, 1478.0, 2217.0, 3054.0, 4492.0, 6541.0, 9466.0, 14099.0, 21297.0, 32713.0, 51102.0, 84628.0, 152448.0, 267379.0, 155269.0, 87134.0, 52010.0, 32948.0, 21476.0, 14252.0, 9725.0, 6584.0, 4666.0, 3179.0, 2149.0, 1536.0, 1031.0, 739.0, 454.0, 384.0, 248.0, 175.0, 104.0, 83.0, 50.0, 31.0, 25.0, 17.0, 16.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.414794921875, -0.4012031555175781, -0.38761138916015625, -0.3740196228027344, -0.3604278564453125, -0.3468360900878906, -0.33324432373046875, -0.3196525573730469, -0.306060791015625, -0.2924690246582031, -0.27887725830078125, -0.2652854919433594, -0.2516937255859375, -0.23810195922851562, -0.22451019287109375, -0.21091842651367188, -0.19732666015625, -0.18373489379882812, -0.17014312744140625, -0.15655136108398438, -0.1429595947265625, -0.12936782836914062, -0.11577606201171875, -0.10218429565429688, -0.088592529296875, -0.07500076293945312, -0.06140899658203125, -0.047817230224609375, -0.0342254638671875, -0.020633697509765625, -0.00704193115234375, 0.006549835205078125, 0.0201416015625, 0.033733367919921875, 0.04732513427734375, 0.060916900634765625, 0.0745086669921875, 0.08810043334960938, 0.10169219970703125, 0.11528396606445312, 0.128875732421875, 0.14246749877929688, 0.15605926513671875, 0.16965103149414062, 0.1832427978515625, 0.19683456420898438, 0.21042633056640625, 0.22401809692382812, 0.23760986328125, 0.2512016296386719, 0.26479339599609375, 0.2783851623535156, 0.2919769287109375, 0.3055686950683594, 0.31916046142578125, 0.3327522277832031, 0.346343994140625, 0.3599357604980469, 0.37352752685546875, 0.3871192932128906, 0.4007110595703125, 0.4143028259277344, 0.42789459228515625, 0.4414863586425781, 0.455078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 8.0, 8.0, 9.0, 15.0, 16.0, 21.0, 23.0, 20.0, 34.0, 27.0, 35.0, 49.0, 41.0, 43.0, 43.0, 51.0, 48.0, 1067.0, 46.0, 46.0, 51.0, 28.0, 36.0, 40.0, 33.0, 24.0, 17.0, 28.0, 14.0, 15.0, 15.0, 9.0, 16.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.078125, -2.0189208984375, -1.959716796875, -1.9005126953125, -1.84130859375, -1.7821044921875, -1.722900390625, -1.6636962890625, -1.6044921875, -1.5452880859375, -1.486083984375, -1.4268798828125, -1.36767578125, -1.3084716796875, -1.249267578125, -1.1900634765625, -1.130859375, -1.0716552734375, -1.012451171875, -0.9532470703125, -0.89404296875, -0.8348388671875, -0.775634765625, -0.7164306640625, -0.6572265625, -0.5980224609375, -0.538818359375, -0.4796142578125, -0.42041015625, -0.3612060546875, -0.302001953125, -0.2427978515625, -0.18359375, -0.1243896484375, -0.065185546875, -0.0059814453125, 0.05322265625, 0.1124267578125, 0.171630859375, 0.2308349609375, 0.2900390625, 0.3492431640625, 0.408447265625, 0.4676513671875, 0.52685546875, 0.5860595703125, 0.645263671875, 0.7044677734375, 0.763671875, 0.8228759765625, 0.882080078125, 0.9412841796875, 1.00048828125, 1.0596923828125, 1.118896484375, 1.1781005859375, 1.2373046875, 1.2965087890625, 1.355712890625, 1.4149169921875, 1.47412109375, 1.5333251953125, 1.592529296875, 1.6517333984375, 1.7109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 15.0, 21.0, 31.0, 44.0, 77.0, 108.0, 149.0, 215.0, 301.0, 476.0, 662.0, 1026.0, 1524.0, 2226.0, 3255.0, 4953.0, 7405.0, 10884.0, 16957.0, 26524.0, 43096.0, 74261.0, 146227.0, 1347372.0, 183777.0, 88480.0, 49971.0, 30054.0, 19195.0, 12542.0, 8164.0, 5553.0, 3660.0, 2634.0, 1704.0, 1120.0, 821.0, 523.0, 397.0, 239.0, 172.0, 112.0, 64.0, 44.0, 29.0, 21.0, 11.0, 12.0, 6.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.4375, -0.4236717224121094, -0.40984344482421875, -0.3960151672363281, -0.3821868896484375, -0.3683586120605469, -0.35453033447265625, -0.3407020568847656, -0.326873779296875, -0.3130455017089844, -0.29921722412109375, -0.2853889465332031, -0.2715606689453125, -0.2577323913574219, -0.24390411376953125, -0.23007583618164062, -0.21624755859375, -0.20241928100585938, -0.18859100341796875, -0.17476272583007812, -0.1609344482421875, -0.14710617065429688, -0.13327789306640625, -0.11944961547851562, -0.105621337890625, -0.09179306030273438, -0.07796478271484375, -0.06413650512695312, -0.0503082275390625, -0.036479949951171875, -0.02265167236328125, -0.008823394775390625, 0.0050048828125, 0.018833160400390625, 0.03266143798828125, 0.046489715576171875, 0.0603179931640625, 0.07414627075195312, 0.08797454833984375, 0.10180282592773438, 0.115631103515625, 0.12945938110351562, 0.14328765869140625, 0.15711593627929688, 0.1709442138671875, 0.18477249145507812, 0.19860076904296875, 0.21242904663085938, 0.22625732421875, 0.24008560180664062, 0.25391387939453125, 0.2677421569824219, 0.2815704345703125, 0.2953987121582031, 0.30922698974609375, 0.3230552673339844, 0.336883544921875, 0.3507118225097656, 0.36454010009765625, 0.3783683776855469, 0.3921966552734375, 0.4060249328613281, 0.41985321044921875, 0.4336814880371094, 0.447509765625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 5.0, 9.0, 6.0, 13.0, 9.0, 11.0, 21.0, 32.0, 44.0, 49.0, 62.0, 56.0, 67.0, 67.0, 82.0, 78.0, 61.0, 63.0, 48.0, 50.0, 33.0, 27.0, 24.0, 23.0, 10.0, 6.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010216236114501953, -9.889528155326843e-05, -9.562820196151733e-05, -9.236112236976624e-05, -8.909404277801514e-05, -8.582696318626404e-05, -8.255988359451294e-05, -7.929280400276184e-05, -7.602572441101074e-05, -7.275864481925964e-05, -6.949156522750854e-05, -6.622448563575745e-05, -6.295740604400635e-05, -5.969032645225525e-05, -5.642324686050415e-05, -5.315616726875305e-05, -4.988908767700195e-05, -4.6622008085250854e-05, -4.3354928493499756e-05, -4.008784890174866e-05, -3.682076930999756e-05, -3.355368971824646e-05, -3.028661012649536e-05, -2.7019530534744263e-05, -2.3752450942993164e-05, -2.0485371351242065e-05, -1.7218291759490967e-05, -1.3951212167739868e-05, -1.068413257598877e-05, -7.417052984237671e-06, -4.149973392486572e-06, -8.828938007354736e-07, 2.384185791015625e-06, 5.651265382766724e-06, 8.918344974517822e-06, 1.2185424566268921e-05, 1.545250415802002e-05, 1.8719583749771118e-05, 2.1986663341522217e-05, 2.5253742933273315e-05, 2.8520822525024414e-05, 3.178790211677551e-05, 3.505498170852661e-05, 3.832206130027771e-05, 4.158914089202881e-05, 4.485622048377991e-05, 4.8123300075531006e-05, 5.1390379667282104e-05, 5.46574592590332e-05, 5.79245388507843e-05, 6.11916184425354e-05, 6.44586980342865e-05, 6.77257776260376e-05, 7.09928572177887e-05, 7.42599368095398e-05, 7.75270164012909e-05, 8.079409599304199e-05, 8.406117558479309e-05, 8.732825517654419e-05, 9.059533476829529e-05, 9.386241436004639e-05, 9.712949395179749e-05, 0.00010039657354354858, 0.00010366365313529968, 0.00010693073272705078]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 3.0, 16.0, 10.0, 15.0, 22.0, 30.0, 35.0, 45.0, 80.0, 102.0, 160.0, 257.0, 453.0, 850.0, 2394.0, 1013478.0, 27970.0, 1150.0, 548.0, 315.0, 198.0, 134.0, 72.0, 44.0, 44.0, 25.0, 16.0, 21.0, 15.0, 11.0, 13.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.0020042061805725098, -0.001938939094543457, -0.0018736720085144043, -0.0018084049224853516, -0.0017431378364562988, -0.001677870750427246, -0.0016126036643981934, -0.0015473365783691406, -0.0014820694923400879, -0.0014168024063110352, -0.0013515353202819824, -0.0012862682342529297, -0.001221001148223877, -0.0011557340621948242, -0.0010904669761657715, -0.0010251998901367188, -0.000959932804107666, -0.0008946657180786133, -0.0008293986320495605, -0.0007641315460205078, -0.0006988644599914551, -0.0006335973739624023, -0.0005683302879333496, -0.0005030632019042969, -0.00043779611587524414, -0.0003725290298461914, -0.00030726194381713867, -0.00024199485778808594, -0.0001767277717590332, -0.00011146068572998047, -4.6193599700927734e-05, 1.9073486328125e-05, 8.434057235717773e-05, 0.00014960765838623047, 0.0002148747444152832, 0.00028014183044433594, 0.00034540891647338867, 0.0004106760025024414, 0.00047594308853149414, 0.0005412101745605469, 0.0006064772605895996, 0.0006717443466186523, 0.0007370114326477051, 0.0008022785186767578, 0.0008675456047058105, 0.0009328126907348633, 0.000998079776763916, 0.0010633468627929688, 0.0011286139488220215, 0.0011938810348510742, 0.001259148120880127, 0.0013244152069091797, 0.0013896822929382324, 0.0014549493789672852, 0.0015202164649963379, 0.0015854835510253906, 0.0016507506370544434, 0.001716017723083496, 0.0017812848091125488, 0.0018465518951416016, 0.0019118189811706543, 0.001977086067199707, 0.0020423531532287598, 0.0021076202392578125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 15.0, 488.0, 489.0, 19.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006496733985841274, -0.000637414981611073, -0.0006251565064303577, -0.0006128980894573033, -0.0006006396724842489, -0.0005883811973035336, -0.0005761227803304791, -0.0005638643633574247, -0.0005516059463843703, -0.0005393475294113159, -0.0005270890542306006, -0.0005148306372575462, -0.0005025722202844918, -0.0004903137451037765, -0.00047805532813072205, -0.00046579691115766764, -0.0004535384359769523, -0.00044127998990006745, -0.00042902157292701304, -0.0004167631268501282, -0.00040450470987707376, -0.0003922462638001889, -0.00037998781772330403, -0.0003677294007502496, -0.00035547095467336476, -0.0003432125085964799, -0.0003309540916234255, -0.0003186956455465406, -0.00030643719946965575, -0.00029417878249660134, -0.0002819203364197165, -0.0002696618903428316, -0.00025740344426594675, -0.0002451449981890619, -0.00023288658121600747, -0.0002206281351391226, -0.00020836970361415297, -0.00019611127208918333, -0.00018385282601229846, -0.00017159439448732883, -0.0001593359629623592, -0.00014707753143738955, -0.00013481909991241992, -0.00012256065383553505, -0.00011030222231056541, -9.804379078559577e-05, -8.578535198466852e-05, -7.352691318374127e-05, -6.126848165877163e-05, -4.901004649582319e-05, -3.6751611332874745e-05, -2.44931761699263e-05, -1.2234741006977856e-05, 2.3690517991781235e-08, 1.2282129318919033e-05, 2.4540568119846284e-05, 3.679899964481592e-05, 4.9057434807764366e-05, 6.131586997071281e-05, 7.357430877164006e-05, 8.58327402966097e-05, 9.809117182157934e-05, 0.00011034961062250659, 0.00012260804942343384, 0.00013486648094840348]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 9.0, 6.0, 11.0, 9.0, 9.0, 20.0, 7.0, 20.0, 25.0, 22.0, 36.0, 30.0, 33.0, 20.0, 48.0, 25.0, 35.0, 38.0, 39.0, 50.0, 49.0, 38.0, 41.0, 37.0, 47.0, 38.0, 39.0, 22.0, 27.0, 31.0, 24.0, 27.0, 18.0, 15.0, 15.0, 11.0, 11.0, 4.0, 3.0, 1.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.225224256515503e-05, -4.081428050994873e-05, -3.937631845474243e-05, -3.793835639953613e-05, -3.6500394344329834e-05, -3.5062432289123535e-05, -3.3624470233917236e-05, -3.218650817871094e-05, -3.074854612350464e-05, -2.931058406829834e-05, -2.787262201309204e-05, -2.6434659957885742e-05, -2.4996697902679443e-05, -2.3558735847473145e-05, -2.2120773792266846e-05, -2.0682811737060547e-05, -1.9244849681854248e-05, -1.780688762664795e-05, -1.636892557144165e-05, -1.4930963516235352e-05, -1.3493001461029053e-05, -1.2055039405822754e-05, -1.0617077350616455e-05, -9.179115295410156e-06, -7.741153240203857e-06, -6.303191184997559e-06, -4.86522912979126e-06, -3.427267074584961e-06, -1.989305019378662e-06, -5.513429641723633e-07, 8.866190910339355e-07, 2.3245811462402344e-06, 3.762543201446533e-06, 5.200505256652832e-06, 6.638467311859131e-06, 8.07642936706543e-06, 9.514391422271729e-06, 1.0952353477478027e-05, 1.2390315532684326e-05, 1.3828277587890625e-05, 1.5266239643096924e-05, 1.6704201698303223e-05, 1.814216375350952e-05, 1.958012580871582e-05, 2.101808786392212e-05, 2.2456049919128418e-05, 2.3894011974334717e-05, 2.5331974029541016e-05, 2.6769936084747314e-05, 2.8207898139953613e-05, 2.9645860195159912e-05, 3.108382225036621e-05, 3.252178430557251e-05, 3.395974636077881e-05, 3.539770841598511e-05, 3.6835670471191406e-05, 3.8273632526397705e-05, 3.9711594581604004e-05, 4.11495566368103e-05, 4.25875186920166e-05, 4.40254807472229e-05, 4.54634428024292e-05, 4.69014048576355e-05, 4.83393669128418e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 5.0, 13.0, 16.0, 13.0, 15.0, 14.0, 28.0, 24.0, 29.0, 28.0, 28.0, 31.0, 41.0, 33.0, 39.0, 46.0, 42.0, 39.0, 52.0, 40.0, 39.0, 36.0, 37.0, 40.0, 45.0, 32.0, 19.0, 18.0, 23.0, 25.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.62640380859375, -2.5379638671875, -2.44952392578125, -2.361083984375, -2.27264404296875, -2.1842041015625, -2.09576416015625, -2.00732421875, -1.91888427734375, -1.8304443359375, -1.74200439453125, -1.653564453125, -1.56512451171875, -1.4766845703125, -1.38824462890625, -1.2998046875, -1.21136474609375, -1.1229248046875, -1.03448486328125, -0.946044921875, -0.85760498046875, -0.7691650390625, -0.68072509765625, -0.59228515625, -0.50384521484375, -0.4154052734375, -0.32696533203125, -0.238525390625, -0.15008544921875, -0.0616455078125, 0.02679443359375, 0.115234375, 0.20367431640625, 0.2921142578125, 0.38055419921875, 0.468994140625, 0.55743408203125, 0.6458740234375, 0.73431396484375, 0.82275390625, 0.91119384765625, 0.9996337890625, 1.08807373046875, 1.176513671875, 1.26495361328125, 1.3533935546875, 1.44183349609375, 1.5302734375, 1.61871337890625, 1.7071533203125, 1.79559326171875, 1.884033203125, 1.97247314453125, 2.0609130859375, 2.14935302734375, 2.23779296875, 2.32623291015625, 2.4146728515625, 2.50311279296875, 2.591552734375, 2.67999267578125, 2.7684326171875, 2.85687255859375, 2.9453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 17.0, 29.0, 33.0, 44.0, 79.0, 92.0, 122.0, 146.0, 182.0, 265.0, 395.0, 589.0, 952.0, 1611.0, 3097.0, 7088.0, 22185.0, 115969.0, 604598.0, 234183.0, 37133.0, 10169.0, 4086.0, 2049.0, 1138.0, 656.0, 460.0, 317.0, 215.0, 157.0, 113.0, 90.0, 63.0, 49.0, 58.0, 36.0, 15.0, 14.0, 13.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.49072265625, -5.3173828125, -5.14404296875, -4.970703125, -4.79736328125, -4.6240234375, -4.45068359375, -4.27734375, -4.10400390625, -3.9306640625, -3.75732421875, -3.583984375, -3.41064453125, -3.2373046875, -3.06396484375, -2.890625, -2.71728515625, -2.5439453125, -2.37060546875, -2.197265625, -2.02392578125, -1.8505859375, -1.67724609375, -1.50390625, -1.33056640625, -1.1572265625, -0.98388671875, -0.810546875, -0.63720703125, -0.4638671875, -0.29052734375, -0.1171875, 0.05615234375, 0.2294921875, 0.40283203125, 0.576171875, 0.74951171875, 0.9228515625, 1.09619140625, 1.26953125, 1.44287109375, 1.6162109375, 1.78955078125, 1.962890625, 2.13623046875, 2.3095703125, 2.48291015625, 2.65625, 2.82958984375, 3.0029296875, 3.17626953125, 3.349609375, 3.52294921875, 3.6962890625, 3.86962890625, 4.04296875, 4.21630859375, 4.3896484375, 4.56298828125, 4.736328125, 4.90966796875, 5.0830078125, 5.25634765625, 5.4296875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 12.0, 6.0, 11.0, 3.0, 14.0, 18.0, 28.0, 24.0, 40.0, 39.0, 62.0, 62.0, 95.0, 140.0, 394.0, 1517.0, 166.0, 86.0, 60.0, 58.0, 43.0, 34.0, 32.0, 22.0, 22.0, 7.0, 13.0, 9.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.140625, -11.813232421875, -11.48583984375, -11.158447265625, -10.8310546875, -10.503662109375, -10.17626953125, -9.848876953125, -9.521484375, -9.194091796875, -8.86669921875, -8.539306640625, -8.2119140625, -7.884521484375, -7.55712890625, -7.229736328125, -6.90234375, -6.574951171875, -6.24755859375, -5.920166015625, -5.5927734375, -5.265380859375, -4.93798828125, -4.610595703125, -4.283203125, -3.955810546875, -3.62841796875, -3.301025390625, -2.9736328125, -2.646240234375, -2.31884765625, -1.991455078125, -1.6640625, -1.336669921875, -1.00927734375, -0.681884765625, -0.3544921875, -0.027099609375, 0.30029296875, 0.627685546875, 0.955078125, 1.282470703125, 1.60986328125, 1.937255859375, 2.2646484375, 2.592041015625, 2.91943359375, 3.246826171875, 3.57421875, 3.901611328125, 4.22900390625, 4.556396484375, 4.8837890625, 5.211181640625, 5.53857421875, 5.865966796875, 6.193359375, 6.520751953125, 6.84814453125, 7.175537109375, 7.5029296875, 7.830322265625, 8.15771484375, 8.485107421875, 8.8125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 8.0, 6.0, 5.0, 15.0, 8.0, 11.0, 24.0, 35.0, 29.0, 64.0, 67.0, 101.0, 132.0, 202.0, 339.0, 778.0, 2494.0, 1414444.0, 1722491.0, 2597.0, 764.0, 371.0, 216.0, 129.0, 117.0, 59.0, 62.0, 31.0, 27.0, 25.0, 13.0, 10.0, 10.0, 11.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.90625, -17.266845703125, -16.62744140625, -15.988037109375, -15.3486328125, -14.709228515625, -14.06982421875, -13.430419921875, -12.791015625, -12.151611328125, -11.51220703125, -10.872802734375, -10.2333984375, -9.593994140625, -8.95458984375, -8.315185546875, -7.67578125, -7.036376953125, -6.39697265625, -5.757568359375, -5.1181640625, -4.478759765625, -3.83935546875, -3.199951171875, -2.560546875, -1.921142578125, -1.28173828125, -0.642333984375, -0.0029296875, 0.636474609375, 1.27587890625, 1.915283203125, 2.5546875, 3.194091796875, 3.83349609375, 4.472900390625, 5.1123046875, 5.751708984375, 6.39111328125, 7.030517578125, 7.669921875, 8.309326171875, 8.94873046875, 9.588134765625, 10.2275390625, 10.866943359375, 11.50634765625, 12.145751953125, 12.78515625, 13.424560546875, 14.06396484375, 14.703369140625, 15.3427734375, 15.982177734375, 16.62158203125, 17.260986328125, 17.900390625, 18.539794921875, 19.17919921875, 19.818603515625, 20.4580078125, 21.097412109375, 21.73681640625, 22.376220703125, 23.015625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 44.0, 489.0, 446.0, 33.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.157018661499023, -27.982383728027344, -25.807750701904297, -23.63311767578125, -21.45848274230957, -19.28384780883789, -17.109214782714844, -14.93458080291748, -12.759946823120117, -10.585312843322754, -8.41067886352539, -6.236044883728027, -4.061410903930664, -1.8867769241333008, 0.2878570556640625, 2.462491035461426, 4.637125015258789, 6.811758995056152, 8.986392974853516, 11.161026954650879, 13.335660934448242, 15.510294914245605, 17.68492889404297, 19.859561920166016, 22.034196853637695, 24.208831787109375, 26.383464813232422, 28.55809783935547, 30.73273277282715, 32.90736770629883, 35.082000732421875, 37.25663375854492, 39.4312744140625, 41.60590744018555, 43.780540466308594, 45.955177307128906, 48.12981033325195, 50.304443359375, 52.47908020019531, 54.65371322631836, 56.828346252441406, 59.00297927856445, 61.1776123046875, 63.35224914550781, 65.52688598632812, 67.7015151977539, 69.87615203857422, 72.05078125, 74.22541809082031, 76.40005493164062, 78.5746841430664, 80.74932098388672, 82.9239501953125, 85.09858703613281, 87.27322387695312, 89.4478530883789, 91.62248992919922, 93.79712677001953, 95.97175598144531, 98.14639282226562, 100.32102966308594, 102.49565887451172, 104.67029571533203, 106.84492492675781, 109.01956176757812]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 6.0, 12.0, 9.0, 7.0, 14.0, 11.0, 25.0, 24.0, 25.0, 31.0, 25.0, 26.0, 31.0, 27.0, 36.0, 34.0, 28.0, 28.0, 43.0, 35.0, 41.0, 43.0, 50.0, 37.0, 34.0, 30.0, 26.0, 30.0, 33.0, 25.0, 24.0, 28.0, 17.0, 13.0, 6.0, 17.0, 10.0, 10.0, 9.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-17.1634521484375, -16.640655517578125, -16.11785888671875, -15.595062255859375, -15.072265625, -14.549468994140625, -14.02667236328125, -13.503875732421875, -12.9810791015625, -12.458282470703125, -11.93548583984375, -11.412689208984375, -10.889892578125, -10.367095947265625, -9.84429931640625, -9.321502685546875, -8.798705101013184, -8.275908470153809, -7.753111839294434, -7.230315208435059, -6.707518577575684, -6.184721946716309, -5.661924839019775, -5.1391282081604, -4.616331577301025, -4.09353494644165, -3.5707383155822754, -3.0479414463043213, -2.5251448154449463, -2.0023481845855713, -1.4795513153076172, -0.9567546844482422, -0.4339580535888672, 0.08883863687515259, 0.6116353273391724, 1.134432077407837, 1.657228708267212, 2.180025339126587, 2.702822208404541, 3.225618839263916, 3.748415470123291, 4.271212100982666, 4.794008731842041, 5.316805839538574, 5.839602470397949, 6.362399101257324, 6.885195732116699, 7.407992362976074, 7.930788993835449, 8.453585624694824, 8.9763822555542, 9.499178886413574, 10.02197551727295, 10.544772148132324, 11.067569732666016, 11.59036636352539, 12.113162994384766, 12.63595962524414, 13.158756256103516, 13.68155288696289, 14.204349517822266, 14.72714614868164, 15.249942779541016, 15.77273941040039, 16.295536041259766]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 11.0, 10.0, 10.0, 14.0, 8.0, 13.0, 12.0, 16.0, 19.0, 26.0, 13.0, 30.0, 26.0, 31.0, 31.0, 39.0, 39.0, 38.0, 44.0, 38.0, 38.0, 36.0, 44.0, 34.0, 48.0, 32.0, 21.0, 26.0, 24.0, 26.0, 24.0, 25.0, 27.0, 19.0, 14.0, 18.0, 14.0, 9.0, 8.0, 2.0, 12.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.7576904296875, -2.663818359375, -2.5699462890625, -2.47607421875, -2.3822021484375, -2.288330078125, -2.1944580078125, -2.1005859375, -2.0067138671875, -1.912841796875, -1.8189697265625, -1.72509765625, -1.6312255859375, -1.537353515625, -1.4434814453125, -1.349609375, -1.2557373046875, -1.161865234375, -1.0679931640625, -0.97412109375, -0.8802490234375, -0.786376953125, -0.6925048828125, -0.5986328125, -0.5047607421875, -0.410888671875, -0.3170166015625, -0.22314453125, -0.1292724609375, -0.035400390625, 0.0584716796875, 0.15234375, 0.2462158203125, 0.340087890625, 0.4339599609375, 0.52783203125, 0.6217041015625, 0.715576171875, 0.8094482421875, 0.9033203125, 0.9971923828125, 1.091064453125, 1.1849365234375, 1.27880859375, 1.3726806640625, 1.466552734375, 1.5604248046875, 1.654296875, 1.7481689453125, 1.842041015625, 1.9359130859375, 2.02978515625, 2.1236572265625, 2.217529296875, 2.3114013671875, 2.4052734375, 2.4991455078125, 2.593017578125, 2.6868896484375, 2.78076171875, 2.8746337890625, 2.968505859375, 3.0623779296875, 3.15625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 8.0, 9.0, 7.0, 12.0, 15.0, 23.0, 23.0, 43.0, 47.0, 66.0, 78.0, 116.0, 130.0, 212.0, 253.0, 356.0, 593.0, 969.0, 1852.0, 5855.0, 135751.0, 3630405.0, 402897.0, 9023.0, 2229.0, 1074.0, 614.0, 423.0, 317.0, 237.0, 156.0, 108.0, 78.0, 64.0, 47.0, 35.0, 39.0, 14.0, 25.0, 16.0, 8.0, 11.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-16.328125, -15.8115234375, -15.294921875, -14.7783203125, -14.26171875, -13.7451171875, -13.228515625, -12.7119140625, -12.1953125, -11.6787109375, -11.162109375, -10.6455078125, -10.12890625, -9.6123046875, -9.095703125, -8.5791015625, -8.0625, -7.5458984375, -7.029296875, -6.5126953125, -5.99609375, -5.4794921875, -4.962890625, -4.4462890625, -3.9296875, -3.4130859375, -2.896484375, -2.3798828125, -1.86328125, -1.3466796875, -0.830078125, -0.3134765625, 0.203125, 0.7197265625, 1.236328125, 1.7529296875, 2.26953125, 2.7861328125, 3.302734375, 3.8193359375, 4.3359375, 4.8525390625, 5.369140625, 5.8857421875, 6.40234375, 6.9189453125, 7.435546875, 7.9521484375, 8.46875, 8.9853515625, 9.501953125, 10.0185546875, 10.53515625, 11.0517578125, 11.568359375, 12.0849609375, 12.6015625, 13.1181640625, 13.634765625, 14.1513671875, 14.66796875, 15.1845703125, 15.701171875, 16.2177734375, 16.734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 3.0, 15.0, 37.0, 62.0, 159.0, 396.0, 933.0, 1196.0, 737.0, 309.0, 130.0, 41.0, 22.0, 11.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.5001220703125, -13.054931640625, -12.6097412109375, -12.16455078125, -11.7193603515625, -11.274169921875, -10.8289794921875, -10.3837890625, -9.9385986328125, -9.493408203125, -9.0482177734375, -8.60302734375, -8.1578369140625, -7.712646484375, -7.2674560546875, -6.822265625, -6.3770751953125, -5.931884765625, -5.4866943359375, -5.04150390625, -4.5963134765625, -4.151123046875, -3.7059326171875, -3.2607421875, -2.8155517578125, -2.370361328125, -1.9251708984375, -1.47998046875, -1.0347900390625, -0.589599609375, -0.1444091796875, 0.30078125, 0.7459716796875, 1.191162109375, 1.6363525390625, 2.08154296875, 2.5267333984375, 2.971923828125, 3.4171142578125, 3.8623046875, 4.3074951171875, 4.752685546875, 5.1978759765625, 5.64306640625, 6.0882568359375, 6.533447265625, 6.9786376953125, 7.423828125, 7.8690185546875, 8.314208984375, 8.7593994140625, 9.20458984375, 9.6497802734375, 10.094970703125, 10.5401611328125, 10.9853515625, 11.4305419921875, 11.875732421875, 12.3209228515625, 12.76611328125, 13.2113037109375, 13.656494140625, 14.1016845703125, 14.546875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 10.0, 29.0, 36.0, 63.0, 70.0, 124.0, 164.0, 290.0, 402.0, 801.0, 1511.0, 3937.0, 14198.0, 118092.0, 2119326.0, 1816272.0, 99516.0, 12480.0, 3510.0, 1501.0, 742.0, 396.0, 274.0, 157.0, 117.0, 76.0, 60.0, 25.0, 24.0, 17.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-9.4375, -9.17510986328125, -8.9127197265625, -8.65032958984375, -8.387939453125, -8.12554931640625, -7.8631591796875, -7.60076904296875, -7.33837890625, -7.07598876953125, -6.8135986328125, -6.55120849609375, -6.288818359375, -6.02642822265625, -5.7640380859375, -5.50164794921875, -5.2392578125, -4.97686767578125, -4.7144775390625, -4.45208740234375, -4.189697265625, -3.92730712890625, -3.6649169921875, -3.40252685546875, -3.14013671875, -2.87774658203125, -2.6153564453125, -2.35296630859375, -2.090576171875, -1.82818603515625, -1.5657958984375, -1.30340576171875, -1.041015625, -0.77862548828125, -0.5162353515625, -0.25384521484375, 0.008544921875, 0.27093505859375, 0.5333251953125, 0.79571533203125, 1.05810546875, 1.32049560546875, 1.5828857421875, 1.84527587890625, 2.107666015625, 2.37005615234375, 2.6324462890625, 2.89483642578125, 3.1572265625, 3.41961669921875, 3.6820068359375, 3.94439697265625, 4.206787109375, 4.46917724609375, 4.7315673828125, 4.99395751953125, 5.25634765625, 5.51873779296875, 5.7811279296875, 6.04351806640625, 6.305908203125, 6.56829833984375, 6.8306884765625, 7.09307861328125, 7.35546875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 8.0, 13.0, 22.0, 27.0, 21.0, 31.0, 42.0, 50.0, 58.0, 61.0, 71.0, 84.0, 88.0, 75.0, 53.0, 48.0, 55.0, 37.0, 47.0, 23.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.53204345703125, -39.5267219543457, -38.521400451660156, -37.51607894897461, -36.51075744628906, -35.505435943603516, -34.50011444091797, -33.49479293823242, -32.489471435546875, -31.484149932861328, -30.47882843017578, -29.473506927490234, -28.468185424804688, -27.46286392211914, -26.457542419433594, -25.452220916748047, -24.446901321411133, -23.441579818725586, -22.43625831604004, -21.430936813354492, -20.425615310668945, -19.4202938079834, -18.414974212646484, -17.409652709960938, -16.40433120727539, -15.399009704589844, -14.393688201904297, -13.38836669921875, -12.383045196533203, -11.377723693847656, -10.372403144836426, -9.367081642150879, -8.361759185791016, -7.356437683105469, -6.351116180419922, -5.345795154571533, -4.340473651885986, -3.3351521492004395, -2.329831123352051, -1.324509620666504, -0.31918811798095703, 0.6861332654953003, 1.6914546489715576, 2.6967759132385254, 3.7020974159240723, 4.707418918609619, 5.712739944458008, 6.718061447143555, 7.723382949829102, 8.728704452514648, 9.734025955200195, 10.739347457885742, 11.744668960571289, 12.749990463256836, 13.755311012268066, 14.760632514953613, 15.76595401763916, 16.77127456665039, 17.776596069335938, 18.781917572021484, 19.78723907470703, 20.792560577392578, 21.797882080078125, 22.803203582763672, 23.80852508544922]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 10.0, 2.0, 4.0, 9.0, 4.0, 9.0, 11.0, 13.0, 18.0, 21.0, 19.0, 26.0, 21.0, 34.0, 21.0, 32.0, 39.0, 35.0, 46.0, 47.0, 37.0, 43.0, 42.0, 49.0, 55.0, 37.0, 34.0, 26.0, 35.0, 27.0, 22.0, 32.0, 23.0, 22.0, 18.0, 16.0, 11.0, 13.0, 9.0, 11.0, 7.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.17300796508789, -20.441434860229492, -19.70985984802246, -18.978286743164062, -18.24671173095703, -17.515138626098633, -16.783565521240234, -16.051990509033203, -15.320416450500488, -14.588842391967773, -13.857268333435059, -13.125694274902344, -12.394121170043945, -11.662546157836914, -10.930973052978516, -10.1993989944458, -9.467824935913086, -8.736250877380371, -8.004676818847656, -7.2731032371521, -6.541529178619385, -5.80995512008667, -5.078381538391113, -4.346807479858398, -3.6152334213256836, -2.8836593627929688, -2.152085542678833, -1.4205117225646973, -0.6889376640319824, 0.04263639450073242, 0.7742099761962891, 1.505784034729004, 2.2373580932617188, 2.9689321517944336, 3.7005059719085693, 4.432079792022705, 5.16365385055542, 5.895227909088135, 6.626801490783691, 7.358375549316406, 8.089949607849121, 8.821523666381836, 9.55309772491455, 10.284671783447266, 11.016244888305664, 11.747819900512695, 12.479393005371094, 13.210967063903809, 13.942541122436523, 14.674115180969238, 15.405689239501953, 16.13726234436035, 16.868837356567383, 17.60041046142578, 18.331985473632812, 19.06355857849121, 19.79513168334961, 20.526704788208008, 21.25827980041504, 21.989852905273438, 22.72142791748047, 23.453001022338867, 24.184574127197266, 24.916149139404297, 25.647724151611328]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 14.0, 17.0, 9.0, 19.0, 24.0, 17.0, 33.0, 28.0, 39.0, 35.0, 38.0, 42.0, 45.0, 45.0, 44.0, 51.0, 51.0, 47.0, 42.0, 36.0, 39.0, 33.0, 26.0, 24.0, 26.0, 25.0, 24.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.6982421875, -37.365234375, -36.0322265625, -34.69921875, -33.3662109375, -32.033203125, -30.7001953125, -29.3671875, -28.0341796875, -26.701171875, -25.3681640625, -24.03515625, -22.7021484375, -21.369140625, -20.0361328125, -18.703125, -17.3701171875, -16.037109375, -14.7041015625, -13.37109375, -12.0380859375, -10.705078125, -9.3720703125, -8.0390625, -6.7060546875, -5.373046875, -4.0400390625, -2.70703125, -1.3740234375, -0.041015625, 1.2919921875, 2.625, 3.9580078125, 5.291015625, 6.6240234375, 7.95703125, 9.2900390625, 10.623046875, 11.9560546875, 13.2890625, 14.6220703125, 15.955078125, 17.2880859375, 18.62109375, 19.9541015625, 21.287109375, 22.6201171875, 23.953125, 25.2861328125, 26.619140625, 27.9521484375, 29.28515625, 30.6181640625, 31.951171875, 33.2841796875, 34.6171875, 35.9501953125, 37.283203125, 38.6162109375, 39.94921875, 41.2822265625, 42.615234375, 43.9482421875, 45.28125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 14.0, 12.0, 36.0, 36.0, 62.0, 103.0, 129.0, 188.0, 300.0, 398.0, 739.0, 1096.0, 1734.0, 2803.0, 4443.0, 7127.0, 11427.0, 19079.0, 32460.0, 58592.0, 117305.0, 273891.0, 264318.0, 113915.0, 57322.0, 32053.0, 18850.0, 11281.0, 6910.0, 4395.0, 2700.0, 1793.0, 1058.0, 690.0, 398.0, 283.0, 160.0, 143.0, 101.0, 75.0, 43.0, 27.0, 9.0, 13.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-7.54296875, -7.31427001953125, -7.0855712890625, -6.85687255859375, -6.628173828125, -6.39947509765625, -6.1707763671875, -5.94207763671875, -5.71337890625, -5.48468017578125, -5.2559814453125, -5.02728271484375, -4.798583984375, -4.56988525390625, -4.3411865234375, -4.11248779296875, -3.8837890625, -3.65509033203125, -3.4263916015625, -3.19769287109375, -2.968994140625, -2.74029541015625, -2.5115966796875, -2.28289794921875, -2.05419921875, -1.82550048828125, -1.5968017578125, -1.36810302734375, -1.139404296875, -0.91070556640625, -0.6820068359375, -0.45330810546875, -0.224609375, 0.00408935546875, 0.2327880859375, 0.46148681640625, 0.690185546875, 0.91888427734375, 1.1475830078125, 1.37628173828125, 1.60498046875, 1.83367919921875, 2.0623779296875, 2.29107666015625, 2.519775390625, 2.74847412109375, 2.9771728515625, 3.20587158203125, 3.4345703125, 3.66326904296875, 3.8919677734375, 4.12066650390625, 4.349365234375, 4.57806396484375, 4.8067626953125, 5.03546142578125, 5.26416015625, 5.49285888671875, 5.7215576171875, 5.95025634765625, 6.178955078125, 6.40765380859375, 6.6363525390625, 6.86505126953125, 7.09375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 17.0, 13.0, 17.0, 14.0, 22.0, 21.0, 25.0, 32.0, 38.0, 34.0, 44.0, 23.0, 34.0, 51.0, 27.0, 36.0, 1059.0, 35.0, 48.0, 41.0, 33.0, 33.0, 28.0, 31.0, 39.0, 35.0, 21.0, 25.0, 12.0, 18.0, 10.0, 13.0, 10.0, 9.0, 11.0, 4.0, 11.0, 1.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.9375, -23.15625, -22.375, -21.59375, -20.8125, -20.03125, -19.25, -18.46875, -17.6875, -16.90625, -16.125, -15.34375, -14.5625, -13.78125, -13.0, -12.21875, -11.4375, -10.65625, -9.875, -9.09375, -8.3125, -7.53125, -6.75, -5.96875, -5.1875, -4.40625, -3.625, -2.84375, -2.0625, -1.28125, -0.5, 0.28125, 1.0625, 1.84375, 2.625, 3.40625, 4.1875, 4.96875, 5.75, 6.53125, 7.3125, 8.09375, 8.875, 9.65625, 10.4375, 11.21875, 12.0, 12.78125, 13.5625, 14.34375, 15.125, 15.90625, 16.6875, 17.46875, 18.25, 19.03125, 19.8125, 20.59375, 21.375, 22.15625, 22.9375, 23.71875, 24.5, 25.28125, 26.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 7.0, 9.0, 18.0, 17.0, 27.0, 42.0, 65.0, 86.0, 145.0, 186.0, 253.0, 356.0, 515.0, 752.0, 955.0, 1461.0, 1942.0, 2662.0, 3878.0, 5390.0, 7601.0, 11165.0, 16238.0, 23634.0, 35329.0, 54334.0, 88722.0, 163968.0, 1301107.0, 142143.0, 79405.0, 49557.0, 33055.0, 21890.0, 14980.0, 10248.0, 7179.0, 5064.0, 3624.0, 2631.0, 1850.0, 1389.0, 904.0, 681.0, 516.0, 356.0, 234.0, 189.0, 101.0, 102.0, 75.0, 43.0, 21.0, 18.0, 16.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.609375, -5.43621826171875, -5.2630615234375, -5.08990478515625, -4.916748046875, -4.74359130859375, -4.5704345703125, -4.39727783203125, -4.22412109375, -4.05096435546875, -3.8778076171875, -3.70465087890625, -3.531494140625, -3.35833740234375, -3.1851806640625, -3.01202392578125, -2.8388671875, -2.66571044921875, -2.4925537109375, -2.31939697265625, -2.146240234375, -1.97308349609375, -1.7999267578125, -1.62677001953125, -1.45361328125, -1.28045654296875, -1.1072998046875, -0.93414306640625, -0.760986328125, -0.58782958984375, -0.4146728515625, -0.24151611328125, -0.068359375, 0.10479736328125, 0.2779541015625, 0.45111083984375, 0.624267578125, 0.79742431640625, 0.9705810546875, 1.14373779296875, 1.31689453125, 1.49005126953125, 1.6632080078125, 1.83636474609375, 2.009521484375, 2.18267822265625, 2.3558349609375, 2.52899169921875, 2.7021484375, 2.87530517578125, 3.0484619140625, 3.22161865234375, 3.394775390625, 3.56793212890625, 3.7410888671875, 3.91424560546875, 4.08740234375, 4.26055908203125, 4.4337158203125, 4.60687255859375, 4.780029296875, 4.95318603515625, 5.1263427734375, 5.29949951171875, 5.47265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 12.0, 19.0, 27.0, 17.0, 30.0, 37.0, 58.0, 59.0, 66.0, 74.0, 77.0, 80.0, 87.0, 60.0, 59.0, 40.0, 29.0, 20.0, 14.0, 21.0, 18.0, 13.0, 6.0, 11.0, 3.0, 10.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0030040740966796875, -0.002924621105194092, -0.002845168113708496, -0.0027657151222229004, -0.0026862621307373047, -0.002606809139251709, -0.0025273561477661133, -0.0024479031562805176, -0.002368450164794922, -0.002288997173309326, -0.0022095441818237305, -0.0021300911903381348, -0.002050638198852539, -0.0019711852073669434, -0.0018917322158813477, -0.001812279224395752, -0.0017328262329101562, -0.0016533732414245605, -0.0015739202499389648, -0.0014944672584533691, -0.0014150142669677734, -0.0013355612754821777, -0.001256108283996582, -0.0011766552925109863, -0.0010972023010253906, -0.001017749309539795, -0.0009382963180541992, -0.0008588433265686035, -0.0007793903350830078, -0.0006999373435974121, -0.0006204843521118164, -0.0005410313606262207, -0.000461578369140625, -0.0003821253776550293, -0.0003026723861694336, -0.0002232193946838379, -0.0001437664031982422, -6.431341171264648e-05, 1.5139579772949219e-05, 9.459257125854492e-05, 0.00017404556274414062, 0.00025349855422973633, 0.00033295154571533203, 0.00041240453720092773, 0.0004918575286865234, 0.0005713105201721191, 0.0006507635116577148, 0.0007302165031433105, 0.0008096694946289062, 0.000889122486114502, 0.0009685754776000977, 0.0010480284690856934, 0.001127481460571289, 0.0012069344520568848, 0.0012863874435424805, 0.0013658404350280762, 0.0014452934265136719, 0.0015247464179992676, 0.0016041994094848633, 0.001683652400970459, 0.0017631053924560547, 0.0018425583839416504, 0.001922011375427246, 0.002001464366912842, 0.0020809173583984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 9.0, 4.0, 11.0, 14.0, 20.0, 20.0, 48.0, 45.0, 54.0, 92.0, 135.0, 246.0, 368.0, 692.0, 1432.0, 3556.0, 11108.0, 43637.0, 245876.0, 552097.0, 147490.0, 28343.0, 7791.0, 2757.0, 1159.0, 619.0, 302.0, 197.0, 130.0, 79.0, 64.0, 38.0, 31.0, 23.0, 8.0, 21.0, 17.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01285552978515625, -0.012402176856994629, -0.011948823928833008, -0.011495471000671387, -0.011042118072509766, -0.010588765144348145, -0.010135412216186523, -0.009682059288024902, -0.009228706359863281, -0.00877535343170166, -0.008322000503540039, -0.007868647575378418, -0.007415294647216797, -0.006961941719055176, -0.006508588790893555, -0.006055235862731934, -0.0056018829345703125, -0.005148530006408691, -0.00469517707824707, -0.004241824150085449, -0.003788471221923828, -0.003335118293762207, -0.002881765365600586, -0.002428412437438965, -0.0019750595092773438, -0.0015217065811157227, -0.0010683536529541016, -0.0006150007247924805, -0.00016164779663085938, 0.0002917051315307617, 0.0007450580596923828, 0.001198410987854004, 0.001651763916015625, 0.002105116844177246, 0.002558469772338867, 0.0030118227005004883, 0.0034651756286621094, 0.0039185285568237305, 0.0043718814849853516, 0.004825234413146973, 0.005278587341308594, 0.005731940269470215, 0.006185293197631836, 0.006638646125793457, 0.007091999053955078, 0.007545351982116699, 0.00799870491027832, 0.008452057838439941, 0.008905410766601562, 0.009358763694763184, 0.009812116622924805, 0.010265469551086426, 0.010718822479248047, 0.011172175407409668, 0.011625528335571289, 0.01207888126373291, 0.012532234191894531, 0.012985587120056152, 0.013438940048217773, 0.013892292976379395, 0.014345645904541016, 0.014798998832702637, 0.015252351760864258, 0.01570570468902588, 0.0161590576171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 19.0, 37.0, 70.0, 99.0, 142.0, 177.0, 145.0, 126.0, 70.0, 50.0, 18.0, 19.0, 10.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012861154973506927, -0.0011907619191333652, -0.0010954084573313594, -0.0010000548791140318, -0.000904701417312026, -0.0008093478390946984, -0.0007139943190850317, -0.0006186407990753651, -0.0005232872790656984, -0.0004279337590560317, -0.000332580239046365, -0.00023722668993286788, -0.0001418731699232012, -4.651964991353452e-05, 4.8833899199962616e-05, 0.0001441874192096293, 0.00023954093921929598, 0.00033489445922896266, 0.00043024797923862934, 0.0005256015574559569, 0.0006209550192579627, 0.0007163085974752903, 0.000811662117484957, 0.0009070156374946237, 0.0010023692157119513, 0.0010977227939292789, 0.0011930762557312846, 0.0012884298339486122, 0.001383783295750618, 0.0014791368739679456, 0.0015744904521852732, 0.001669843913987279, 0.0017651973757892847, 0.0018605509540066123, 0.00195590453222394, 0.0020512579940259457, 0.0021466114558279514, 0.002241964917629957, 0.0023373186122626066, 0.0024326720740646124, 0.002528025535866618, 0.002623378997668624, 0.0027187326923012733, 0.002814086154103279, 0.002909439615905285, 0.0030047930777072906, 0.00310014677233994, 0.003195500234141946, 0.0032908539287745953, 0.003386207390576601, 0.0034815610852092505, 0.0035769145470112562, 0.003672268008813262, 0.0037676214706152678, 0.003862975165247917, 0.003958328627049923, 0.004053682088851929, 0.0041490355506539345, 0.00424438901245594, 0.004339742474257946, 0.004435096401721239, 0.004530449863523245, 0.004625803325325251, 0.004721156787127256, 0.004816510248929262]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 9.0, 18.0, 17.0, 28.0, 26.0, 23.0, 26.0, 30.0, 38.0, 34.0, 49.0, 58.0, 48.0, 39.0, 36.0, 33.0, 53.0, 41.0, 40.0, 35.0, 32.0, 30.0, 36.0, 30.0, 29.0, 27.0, 26.0, 15.0, 17.0, 12.0, 5.0, 6.0, 4.0, 4.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011513829231262207, -0.0011114394292235374, -0.0010714959353208542, -0.001031552441418171, -0.0009916089475154877, -0.0009516654536128044, -0.0009117219597101212, -0.0008717784658074379, -0.0008318349719047546, -0.0007918914780020714, -0.0007519479840993881, -0.0007120044901967049, -0.0006720609962940216, -0.0006321175023913383, -0.0005921740084886551, -0.0005522305145859718, -0.0005122870206832886, -0.0004723435267806053, -0.00043240003287792206, -0.0003924565389752388, -0.00035251304507255554, -0.0003125695511698723, -0.000272626057267189, -0.00023268256336450577, -0.0001927390694618225, -0.00015279557555913925, -0.000112852081656456, -7.290858775377274e-05, -3.296509385108948e-05, 6.9784000515937805e-06, 4.692189395427704e-05, 8.68653878569603e-05, 0.00012680888175964355, 0.0001667523756623268, 0.00020669586956501007, 0.00024663936346769333, 0.0002865828573703766, 0.00032652635127305984, 0.0003664698451757431, 0.00040641333907842636, 0.0004463568329811096, 0.0004863003268837929, 0.0005262438207864761, 0.0005661873146891594, 0.0006061308085918427, 0.0006460743024945259, 0.0006860177963972092, 0.0007259612902998924, 0.0007659047842025757, 0.0008058482781052589, 0.0008457917720079422, 0.0008857352659106255, 0.0009256787598133087, 0.000965622253715992, 0.0010055657476186752, 0.0010455092415213585, 0.0010854527354240417, 0.001125396229326725, 0.0011653397232294083, 0.0012052832171320915, 0.0012452267110347748, 0.001285170204937458, 0.0013251136988401413, 0.0013650571927428246, 0.0014050006866455078]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 14.0, 17.0, 9.0, 19.0, 24.0, 17.0, 33.0, 28.0, 39.0, 35.0, 38.0, 43.0, 44.0, 45.0, 44.0, 51.0, 51.0, 46.0, 43.0, 36.0, 39.0, 33.0, 26.0, 24.0, 26.0, 25.0, 24.0, 18.0, 13.0, 16.0, 8.0, 7.0, 9.0, 4.0, 11.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.6982421875, -37.365234375, -36.0322265625, -34.69921875, -33.3662109375, -32.033203125, -30.7001953125, -29.3671875, -28.0341796875, -26.701171875, -25.3681640625, -24.03515625, -22.7021484375, -21.369140625, -20.0361328125, -18.703125, -17.3701171875, -16.037109375, -14.7041015625, -13.37109375, -12.0380859375, -10.705078125, -9.3720703125, -8.0390625, -6.7060546875, -5.373046875, -4.0400390625, -2.70703125, -1.3740234375, -0.041015625, 1.2919921875, 2.625, 3.9580078125, 5.291015625, 6.6240234375, 7.95703125, 9.2900390625, 10.623046875, 11.9560546875, 13.2890625, 14.6220703125, 15.955078125, 17.2880859375, 18.62109375, 19.9541015625, 21.287109375, 22.6201171875, 23.953125, 25.2861328125, 26.619140625, 27.9521484375, 29.28515625, 30.6181640625, 31.951171875, 33.2841796875, 34.6171875, 35.9501953125, 37.283203125, 38.6162109375, 39.94921875, 41.2822265625, 42.615234375, 43.9482421875, 45.28125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 6.0, 6.0, 20.0, 22.0, 25.0, 52.0, 52.0, 98.0, 142.0, 239.0, 398.0, 684.0, 1265.0, 2582.0, 6308.0, 19585.0, 83851.0, 404437.0, 410750.0, 86228.0, 19923.0, 6230.0, 2633.0, 1224.0, 648.0, 398.0, 241.0, 150.0, 101.0, 74.0, 49.0, 27.0, 40.0, 12.0, 11.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.109375, -8.86322021484375, -8.6170654296875, -8.37091064453125, -8.124755859375, -7.87860107421875, -7.6324462890625, -7.38629150390625, -7.14013671875, -6.89398193359375, -6.6478271484375, -6.40167236328125, -6.155517578125, -5.90936279296875, -5.6632080078125, -5.41705322265625, -5.1708984375, -4.92474365234375, -4.6785888671875, -4.43243408203125, -4.186279296875, -3.94012451171875, -3.6939697265625, -3.44781494140625, -3.20166015625, -2.95550537109375, -2.7093505859375, -2.46319580078125, -2.217041015625, -1.97088623046875, -1.7247314453125, -1.47857666015625, -1.232421875, -0.98626708984375, -0.7401123046875, -0.49395751953125, -0.247802734375, -0.00164794921875, 0.2445068359375, 0.49066162109375, 0.73681640625, 0.98297119140625, 1.2291259765625, 1.47528076171875, 1.721435546875, 1.96759033203125, 2.2137451171875, 2.45989990234375, 2.7060546875, 2.95220947265625, 3.1983642578125, 3.44451904296875, 3.690673828125, 3.93682861328125, 4.1829833984375, 4.42913818359375, 4.67529296875, 4.92144775390625, 5.1676025390625, 5.41375732421875, 5.659912109375, 5.90606689453125, 6.1522216796875, 6.39837646484375, 6.64453125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 5.0, 13.0, 17.0, 16.0, 25.0, 27.0, 35.0, 38.0, 32.0, 48.0, 59.0, 52.0, 66.0, 2113.0, 64.0, 60.0, 57.0, 63.0, 50.0, 37.0, 37.0, 27.0, 22.0, 19.0, 10.0, 14.0, 12.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.625, -73.0703125, -70.515625, -67.9609375, -65.40625, -62.8515625, -60.296875, -57.7421875, -55.1875, -52.6328125, -50.078125, -47.5234375, -44.96875, -42.4140625, -39.859375, -37.3046875, -34.75, -32.1953125, -29.640625, -27.0859375, -24.53125, -21.9765625, -19.421875, -16.8671875, -14.3125, -11.7578125, -9.203125, -6.6484375, -4.09375, -1.5390625, 1.015625, 3.5703125, 6.125, 8.6796875, 11.234375, 13.7890625, 16.34375, 18.8984375, 21.453125, 24.0078125, 26.5625, 29.1171875, 31.671875, 34.2265625, 36.78125, 39.3359375, 41.890625, 44.4453125, 47.0, 49.5546875, 52.109375, 54.6640625, 57.21875, 59.7734375, 62.328125, 64.8828125, 67.4375, 69.9921875, 72.546875, 75.1015625, 77.65625, 80.2109375, 82.765625, 85.3203125, 87.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 5.0, 4.0, 9.0, 8.0, 20.0, 29.0, 35.0, 66.0, 87.0, 121.0, 171.0, 264.0, 347.0, 582.0, 949.0, 2060.0, 5759.0, 38899.0, 2370507.0, 681233.0, 34807.0, 5205.0, 1840.0, 955.0, 560.0, 376.0, 228.0, 167.0, 127.0, 74.0, 59.0, 40.0, 26.0, 17.0, 8.0, 8.0, 9.0, 8.0, 3.0, 2.0, 10.0, 1.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-12.6875, -12.302734375, -11.91796875, -11.533203125, -11.1484375, -10.763671875, -10.37890625, -9.994140625, -9.609375, -9.224609375, -8.83984375, -8.455078125, -8.0703125, -7.685546875, -7.30078125, -6.916015625, -6.53125, -6.146484375, -5.76171875, -5.376953125, -4.9921875, -4.607421875, -4.22265625, -3.837890625, -3.453125, -3.068359375, -2.68359375, -2.298828125, -1.9140625, -1.529296875, -1.14453125, -0.759765625, -0.375, 0.009765625, 0.39453125, 0.779296875, 1.1640625, 1.548828125, 1.93359375, 2.318359375, 2.703125, 3.087890625, 3.47265625, 3.857421875, 4.2421875, 4.626953125, 5.01171875, 5.396484375, 5.78125, 6.166015625, 6.55078125, 6.935546875, 7.3203125, 7.705078125, 8.08984375, 8.474609375, 8.859375, 9.244140625, 9.62890625, 10.013671875, 10.3984375, 10.783203125, 11.16796875, 11.552734375, 11.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 8.0, 20.0, 27.0, 56.0, 81.0, 108.0, 156.0, 154.0, 127.0, 92.0, 55.0, 34.0, 18.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-111.04193878173828, -107.97674560546875, -104.91155242919922, -101.84636688232422, -98.78117370605469, -95.71598052978516, -92.65078735351562, -89.58560180664062, -86.5204086303711, -83.45521545410156, -80.39002227783203, -77.32483673095703, -74.2596435546875, -71.19445037841797, -68.12925720214844, -65.06407165527344, -61.99887466430664, -58.93368148803711, -55.868492126464844, -52.80329895019531, -49.73810958862305, -46.672916412353516, -43.60772705078125, -40.54253387451172, -37.47734069824219, -34.412147521972656, -31.34695816040039, -28.28176498413086, -25.216575622558594, -22.151382446289062, -19.086191177368164, -16.020999908447266, -12.955810546875, -9.890619277954102, -6.825427532196045, -3.7602357864379883, -0.6950445175170898, 2.3701467514038086, 5.435338973999023, 8.500530242919922, 11.56572151184082, 14.630912780761719, 17.696104049682617, 20.761295318603516, 23.826488494873047, 26.891677856445312, 29.956871032714844, 33.022064208984375, 36.08725357055664, 39.15244674682617, 42.21763610839844, 45.28282928466797, 48.348018646240234, 51.413211822509766, 54.47840118408203, 57.54359436035156, 60.608787536621094, 63.673980712890625, 66.73917388916016, 69.80435943603516, 72.86955261230469, 75.93474578857422, 78.99993896484375, 82.06512451171875, 85.13031768798828]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 8.0, 3.0, 4.0, 8.0, 5.0, 8.0, 16.0, 13.0, 22.0, 34.0, 27.0, 29.0, 33.0, 31.0, 34.0, 55.0, 55.0, 56.0, 51.0, 59.0, 51.0, 55.0, 51.0, 40.0, 41.0, 35.0, 27.0, 29.0, 24.0, 20.0, 18.0, 9.0, 7.0, 11.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.08335876464844, -81.07108306884766, -78.05879974365234, -75.04652404785156, -72.03424072265625, -69.02196502685547, -66.00968933105469, -62.99740982055664, -59.985130310058594, -56.97285079956055, -53.9605712890625, -50.94829559326172, -47.93601608276367, -44.923736572265625, -41.911460876464844, -38.8991813659668, -35.88690185546875, -32.8746223449707, -29.86234474182129, -26.850067138671875, -23.837787628173828, -20.82550811767578, -17.813230514526367, -14.800952911376953, -11.788673400878906, -8.776394844055176, -5.764116287231445, -2.751837730407715, 0.2604408264160156, 3.272719383239746, 6.284997940063477, 9.29727554321289, 12.309555053710938, 15.321833610534668, 18.3341121673584, 21.346389770507812, 24.35866928100586, 27.370948791503906, 30.38322639465332, 33.395503997802734, 36.40778350830078, 39.42006301879883, 42.432342529296875, 45.444618225097656, 48.4568977355957, 51.46917724609375, 54.48145294189453, 57.49373245239258, 60.506011962890625, 63.51829147338867, 66.53057098388672, 69.5428466796875, 72.55513000488281, 75.5674057006836, 78.57968139648438, 81.59196472167969, 84.60424041748047, 87.61651611328125, 90.62879943847656, 93.64107513427734, 96.65335083007812, 99.66563415527344, 102.67790985107422, 105.690185546875, 108.70246887207031]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 18.0, 13.0, 15.0, 30.0, 33.0, 62.0, 79.0, 128.0, 216.0, 364.0, 578.0, 1003.0, 1629.0, 2505.0, 4026.0, 6529.0, 1014182.0, 6573.0, 3903.0, 2553.0, 1560.0, 973.0, 572.0, 330.0, 214.0, 150.0, 105.0, 69.0, 38.0, 37.0, 14.0, 20.0, 10.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.47530746459961, -21.875869750976562, -21.276432037353516, -20.67699432373047, -20.077556610107422, -19.478118896484375, -18.878681182861328, -18.27924346923828, -17.679805755615234, -17.080368041992188, -16.48093032836914, -15.881492614746094, -15.282054901123047, -14.6826171875, -14.083179473876953, -13.483741760253906, -12.884303092956543, -12.284865379333496, -11.68542766571045, -11.085989952087402, -10.486552238464355, -9.887114524841309, -9.287675857543945, -8.688238143920898, -8.088800430297852, -7.489362716674805, -6.889925003051758, -6.290487289428711, -5.691049575805664, -5.091611862182617, -4.492173671722412, -3.8927359580993652, -3.2932987213134766, -2.6938610076904297, -2.094423294067383, -1.4949853420257568, -0.89554762840271, -0.2961099147796631, 0.3033280372619629, 0.9027657508850098, 1.5022034645080566, 2.1016411781311035, 2.7010788917541504, 3.3005168437957764, 3.8999545574188232, 4.499392509460449, 5.098830223083496, 5.698267936706543, 6.29770565032959, 6.897143363952637, 7.496581077575684, 8.09601879119873, 8.695456504821777, 9.294894218444824, 9.894332885742188, 10.493770599365234, 11.093208312988281, 11.692646026611328, 12.292083740234375, 12.891521453857422, 13.490959167480469, 14.090396881103516, 14.689834594726562, 15.28927230834961, 15.888710021972656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 19.0, 23.0, 44.0, 56.0, 61.0, 141.0, 3677.0, 51458920.0, 193.0, 74.0, 31.0, 25.0, 21.0, 29.0, 21.0, 16.0, 18.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2878.673095703125, -2727.9326171875, -2577.192138671875, -2426.45166015625, -2275.71142578125, -2124.970703125, -1974.23046875, -1823.489990234375, -1672.74951171875, -1522.009033203125, -1371.2685546875, -1220.5281982421875, -1069.7877197265625, -919.0472412109375, -768.3068237304688, -617.56640625, -466.825927734375, -316.0854797363281, -165.34503173828125, -14.604583740234375, 136.1358642578125, 286.8763427734375, 437.61676025390625, 588.357177734375, 739.09765625, 889.838134765625, 1040.57861328125, 1191.3189697265625, 1342.0594482421875, 1492.7999267578125, 1643.540283203125, 1794.28076171875, 1945.02099609375, 2095.761474609375, 2246.501953125, 2397.242431640625, 2547.98291015625, 2698.72314453125, 2849.463623046875, 3000.2041015625, 3150.944580078125, 3301.68505859375, 3452.425537109375, 3603.166015625, 3753.90625, 3904.64697265625, 4055.38720703125, 4206.1279296875, 4356.8681640625, 4507.6083984375, 4658.34912109375, 4809.08935546875, 4959.830078125, 5110.5703125, 5261.31103515625, 5412.05126953125, 5562.7919921875, 5713.5322265625, 5864.27294921875, 6015.01318359375, 6165.75390625, 6316.494140625, 6467.23486328125, 6617.97509765625, 6768.71533203125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 3.0, 8.0, 9.0, 17.0, 18.0, 45.0, 66.0, 105.0, 147.0, 197.0, 290.0, 412.0, 640.0, 950.0, 1282.0, 1937.0, 2784.0, 4204.0, 6218.0, 9463.0, 14161.0, 21730.0, 33251.0, 52523.0, 85826.0, 145477.0, 268958.0, 670255.0, 3980681.0, 449581.0, 218233.0, 120667.0, 71686.0, 44560.0, 28543.0, 18471.0, 12185.0, 8070.0, 5657.0, 3669.0, 2647.0, 1753.0, 1293.0, 881.0, 541.0, 471.0, 238.0, 226.0, 104.0, 100.0, 68.0, 43.0, 20.0, 27.0, 19.0, 3.0, 16.0, 6.0, 3.0, 0.0, 6.0], "bins": [-3.53515625, -3.422332763671875, -3.30950927734375, -3.196685791015625, -3.0838623046875, -2.971038818359375, -2.85821533203125, -2.745391845703125, -2.632568359375, -2.519744873046875, -2.40692138671875, -2.294097900390625, -2.1812744140625, -2.068450927734375, -1.95562744140625, -1.842803955078125, -1.72998046875, -1.617156982421875, -1.50433349609375, -1.391510009765625, -1.2786865234375, -1.165863037109375, -1.05303955078125, -0.940216064453125, -0.827392578125, -0.714569091796875, -0.60174560546875, -0.488922119140625, -0.3760986328125, -0.263275146484375, -0.15045166015625, -0.037628173828125, 0.0751953125, 0.188018798828125, 0.30084228515625, 0.413665771484375, 0.5264892578125, 0.639312744140625, 0.75213623046875, 0.864959716796875, 0.977783203125, 1.090606689453125, 1.20343017578125, 1.316253662109375, 1.4290771484375, 1.541900634765625, 1.65472412109375, 1.767547607421875, 1.88037109375, 1.993194580078125, 2.10601806640625, 2.218841552734375, 2.3316650390625, 2.444488525390625, 2.55731201171875, 2.670135498046875, 2.782958984375, 2.895782470703125, 3.00860595703125, 3.121429443359375, 3.2342529296875, 3.347076416015625, 3.45989990234375, 3.572723388671875, 3.685546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 6.0, 1.0, 4.0, 6.0, 4.0, 2.0, 10.0, 10.0, 14.0, 11.0, 8.0, 13.0, 17.0, 16.0, 24.0, 34.0, 27.0, 43.0, 25.0, 34.0, 38.0, 31.0, 52.0, 71.0, 224.0, 702.0, 158.0, 47.0, 41.0, 41.0, 45.0, 32.0, 28.0, 26.0, 24.0, 20.0, 25.0, 23.0, 11.0, 13.0, 14.0, 10.0, 10.0, 6.0, 9.0, 3.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.1484375, -6.877685546875, -6.60693359375, -6.336181640625, -6.0654296875, -5.794677734375, -5.52392578125, -5.253173828125, -4.982421875, -4.711669921875, -4.44091796875, -4.170166015625, -3.8994140625, -3.628662109375, -3.35791015625, -3.087158203125, -2.81640625, -2.545654296875, -2.27490234375, -2.004150390625, -1.7333984375, -1.462646484375, -1.19189453125, -0.921142578125, -0.650390625, -0.379638671875, -0.10888671875, 0.161865234375, 0.4326171875, 0.703369140625, 0.97412109375, 1.244873046875, 1.515625, 1.786376953125, 2.05712890625, 2.327880859375, 2.5986328125, 2.869384765625, 3.14013671875, 3.410888671875, 3.681640625, 3.952392578125, 4.22314453125, 4.493896484375, 4.7646484375, 5.035400390625, 5.30615234375, 5.576904296875, 5.84765625, 6.118408203125, 6.38916015625, 6.659912109375, 6.9306640625, 7.201416015625, 7.47216796875, 7.742919921875, 8.013671875, 8.284423828125, 8.55517578125, 8.825927734375, 9.0966796875, 9.367431640625, 9.63818359375, 9.908935546875, 10.1796875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 9.0, 14.0, 9.0, 6.0, 26.0, 31.0, 32.0, 71.0, 85.0, 131.0, 185.0, 327.0, 462.0, 733.0, 1179.0, 1789.0, 2884.0, 4955.0, 8276.0, 14839.0, 25292.0, 45872.0, 87943.0, 175064.0, 413169.0, 4056166.0, 903253.0, 274324.0, 126114.0, 64995.0, 34977.0, 19790.0, 11287.0, 6506.0, 3972.0, 2333.0, 1562.0, 943.0, 644.0, 409.0, 229.0, 177.0, 117.0, 76.0, 67.0, 38.0, 25.0, 11.0, 14.0, 9.0, 7.0, 1.0, 8.0, 3.0, 0.0, 0.0, 3.0], "bins": [-6.0234375, -5.83966064453125, -5.6558837890625, -5.47210693359375, -5.288330078125, -5.10455322265625, -4.9207763671875, -4.73699951171875, -4.55322265625, -4.36944580078125, -4.1856689453125, -4.00189208984375, -3.818115234375, -3.63433837890625, -3.4505615234375, -3.26678466796875, -3.0830078125, -2.89923095703125, -2.7154541015625, -2.53167724609375, -2.347900390625, -2.16412353515625, -1.9803466796875, -1.79656982421875, -1.61279296875, -1.42901611328125, -1.2452392578125, -1.06146240234375, -0.877685546875, -0.69390869140625, -0.5101318359375, -0.32635498046875, -0.142578125, 0.04119873046875, 0.2249755859375, 0.40875244140625, 0.592529296875, 0.77630615234375, 0.9600830078125, 1.14385986328125, 1.32763671875, 1.51141357421875, 1.6951904296875, 1.87896728515625, 2.062744140625, 2.24652099609375, 2.4302978515625, 2.61407470703125, 2.7978515625, 2.98162841796875, 3.1654052734375, 3.34918212890625, 3.532958984375, 3.71673583984375, 3.9005126953125, 4.08428955078125, 4.26806640625, 4.45184326171875, 4.6356201171875, 4.81939697265625, 5.003173828125, 5.18695068359375, 5.3707275390625, 5.55450439453125, 5.73828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 13.0, 16.0, 7.0, 14.0, 27.0, 20.0, 38.0, 27.0, 26.0, 39.0, 50.0, 59.0, 79.0, 144.0, 560.0, 388.0, 101.0, 61.0, 46.0, 40.0, 40.0, 36.0, 36.0, 33.0, 20.0, 21.0, 19.0, 11.0, 10.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.4537353515625, -8.188720703125, -7.9237060546875, -7.65869140625, -7.3936767578125, -7.128662109375, -6.8636474609375, -6.5986328125, -6.3336181640625, -6.068603515625, -5.8035888671875, -5.53857421875, -5.2735595703125, -5.008544921875, -4.7435302734375, -4.478515625, -4.2135009765625, -3.948486328125, -3.6834716796875, -3.41845703125, -3.1534423828125, -2.888427734375, -2.6234130859375, -2.3583984375, -2.0933837890625, -1.828369140625, -1.5633544921875, -1.29833984375, -1.0333251953125, -0.768310546875, -0.5032958984375, -0.23828125, 0.0267333984375, 0.291748046875, 0.5567626953125, 0.82177734375, 1.0867919921875, 1.351806640625, 1.6168212890625, 1.8818359375, 2.1468505859375, 2.411865234375, 2.6768798828125, 2.94189453125, 3.2069091796875, 3.471923828125, 3.7369384765625, 4.001953125, 4.2669677734375, 4.531982421875, 4.7969970703125, 5.06201171875, 5.3270263671875, 5.592041015625, 5.8570556640625, 6.1220703125, 6.3870849609375, 6.652099609375, 6.9171142578125, 7.18212890625, 7.4471435546875, 7.712158203125, 7.9771728515625, 8.2421875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 7.0, 0.0, 22.0, 32.0, 27.0, 23.0, 37.0, 36.0, 52.0, 110.0, 139.0, 207.0, 201.0, 197.0, 350.0, 550.0, 713.0, 900.0, 1481.0, 2248.0, 3271.0, 6101.0, 11756.0, 26628.0, 86872.0, 5900256.0, 174958.0, 38521.0, 15504.0, 7640.0, 4237.0, 2670.0, 1566.0, 1210.0, 785.0, 505.0, 387.0, 313.0, 244.0, 130.0, 136.0, 88.0, 83.0, 85.0, 39.0, 47.0, 8.0, 12.0, 4.0, 10.0, 23.0, 12.0, 0.0, 0.0, 3.0, 6.0], "bins": [-14.4296875, -14.0013427734375, -13.572998046875, -13.1446533203125, -12.71630859375, -12.2879638671875, -11.859619140625, -11.4312744140625, -11.0029296875, -10.5745849609375, -10.146240234375, -9.7178955078125, -9.28955078125, -8.8612060546875, -8.432861328125, -8.0045166015625, -7.576171875, -7.1478271484375, -6.719482421875, -6.2911376953125, -5.86279296875, -5.4344482421875, -5.006103515625, -4.5777587890625, -4.1494140625, -3.7210693359375, -3.292724609375, -2.8643798828125, -2.43603515625, -2.0076904296875, -1.579345703125, -1.1510009765625, -0.72265625, -0.2943115234375, 0.134033203125, 0.5623779296875, 0.99072265625, 1.4190673828125, 1.847412109375, 2.2757568359375, 2.7041015625, 3.1324462890625, 3.560791015625, 3.9891357421875, 4.41748046875, 4.8458251953125, 5.274169921875, 5.7025146484375, 6.130859375, 6.5592041015625, 6.987548828125, 7.4158935546875, 7.84423828125, 8.2725830078125, 8.700927734375, 9.1292724609375, 9.5576171875, 9.9859619140625, 10.414306640625, 10.8426513671875, 11.27099609375, 11.6993408203125, 12.127685546875, 12.5560302734375, 12.984375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 5.0, 3.0, 10.0, 7.0, 12.0, 17.0, 16.0, 21.0, 16.0, 22.0, 22.0, 23.0, 35.0, 45.0, 41.0, 50.0, 71.0, 103.0, 190.0, 460.0, 251.0, 126.0, 68.0, 50.0, 44.0, 44.0, 37.0, 30.0, 25.0, 21.0, 23.0, 26.0, 21.0, 8.0, 11.0, 13.0, 16.0, 12.0, 9.0, 5.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-5.18359375, -5.0343017578125, -4.885009765625, -4.7357177734375, -4.58642578125, -4.4371337890625, -4.287841796875, -4.1385498046875, -3.9892578125, -3.8399658203125, -3.690673828125, -3.5413818359375, -3.39208984375, -3.2427978515625, -3.093505859375, -2.9442138671875, -2.794921875, -2.6456298828125, -2.496337890625, -2.3470458984375, -2.19775390625, -2.0484619140625, -1.899169921875, -1.7498779296875, -1.6005859375, -1.4512939453125, -1.302001953125, -1.1527099609375, -1.00341796875, -0.8541259765625, -0.704833984375, -0.5555419921875, -0.40625, -0.2569580078125, -0.107666015625, 0.0416259765625, 0.19091796875, 0.3402099609375, 0.489501953125, 0.6387939453125, 0.7880859375, 0.9373779296875, 1.086669921875, 1.2359619140625, 1.38525390625, 1.5345458984375, 1.683837890625, 1.8331298828125, 1.982421875, 2.1317138671875, 2.281005859375, 2.4302978515625, 2.57958984375, 2.7288818359375, 2.878173828125, 3.0274658203125, 3.1767578125, 3.3260498046875, 3.475341796875, 3.6246337890625, 3.77392578125, 3.9232177734375, 4.072509765625, 4.2218017578125, 4.37109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 16.0, 29.0, 50.0, 69.0, 131.0, 364.0, 170.0, 68.0, 53.0, 20.0, 4.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03418731689453, -19.437789916992188, -18.84139060974121, -18.244993209838867, -17.648595809936523, -17.052196502685547, -16.455799102783203, -15.85940170288086, -15.2630033493042, -14.666604995727539, -14.070207595825195, -13.473809242248535, -12.877410888671875, -12.281013488769531, -11.684615135192871, -11.088216781616211, -10.491819381713867, -9.895421028137207, -9.299023628234863, -8.702625274658203, -8.10622787475586, -7.509829521179199, -6.913431167602539, -6.317033290863037, -5.720635414123535, -5.124237537384033, -4.527839660644531, -3.931441307067871, -3.335043430328369, -2.738645553588867, -2.142247438430786, -1.545849323272705, -0.9494514465332031, -0.3530534505844116, 0.24334454536437988, 0.8397425413131714, 1.436140537261963, 2.032538414001465, 2.628936529159546, 3.225334644317627, 3.821732521057129, 4.418130397796631, 5.014528274536133, 5.610926628112793, 6.207324504852295, 6.803722381591797, 7.400120735168457, 7.996518611907959, 8.592916488647461, 9.189314842224121, 9.785712242126465, 10.382110595703125, 10.978507995605469, 11.574906349182129, 12.171304702758789, 12.767702102661133, 13.364100456237793, 13.960498809814453, 14.556896209716797, 15.153294563293457, 15.749692916870117, 16.34609031677246, 16.942487716674805, 17.53888702392578, 18.135284423828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 6.0, 8.0, 16.0, 20.0, 19.0, 21.0, 22.0, 26.0, 23.0, 30.0, 41.0, 36.0, 42.0, 48.0, 48.0, 42.0, 49.0, 43.0, 32.0, 37.0, 39.0, 40.0, 29.0, 40.0, 24.0, 34.0, 22.0, 26.0, 19.0, 16.0, 20.0, 17.0, 13.0, 13.0, 3.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.480586051940918, -6.259017467498779, -6.037448406219482, -5.815879821777344, -5.594310760498047, -5.372742176055908, -5.151173114776611, -4.929604530334473, -4.708035469055176, -4.486466884613037, -4.26489782333374, -4.043329238891602, -3.8217601776123047, -3.600191593170166, -3.378622531890869, -3.1570539474487305, -2.9354851245880127, -2.713916301727295, -2.492347478866577, -2.2707786560058594, -2.0492098331451416, -1.8276411294937134, -1.6060723066329956, -1.3845034837722778, -1.16293466091156, -0.9413658380508423, -0.7197970151901245, -0.4982282519340515, -0.27665942907333374, -0.05509066581726074, 0.16647815704345703, 0.3880469799041748, 0.6096158027648926, 0.8311846256256104, 1.0527534484863281, 1.274322271347046, 1.4958910942077637, 1.717459797859192, 1.9390286207199097, 2.160597324371338, 2.3821663856506348, 2.6037352085113525, 2.8253040313720703, 3.046872854232788, 3.268441677093506, 3.4900102615356445, 3.7115793228149414, 3.93314790725708, 4.154716491699219, 4.376285076141357, 4.597854137420654, 4.819422721862793, 5.04099178314209, 5.2625603675842285, 5.484129428863525, 5.705698013305664, 5.927267074584961, 6.1488356590271, 6.3704047203063965, 6.591973304748535, 6.813542366027832, 7.035110950469971, 7.256680011749268, 7.478248596191406, 7.699817657470703]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 6.0, 15.0, 9.0, 17.0, 23.0, 26.0, 25.0, 42.0, 84.0, 80.0, 113.0, 164.0, 264.0, 376.0, 535.0, 871.0, 1559.0, 3267.0, 8737.0, 32905.0, 3847217.0, 263781.0, 22978.0, 5919.0, 2298.0, 1127.0, 632.0, 369.0, 265.0, 167.0, 100.0, 83.0, 63.0, 42.0, 26.0, 14.0, 28.0, 12.0, 6.0, 7.0, 4.0, 7.0, 5.0, 5.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0196533203125, -0.01894974708557129, -0.018246173858642578, -0.017542600631713867, -0.016839027404785156, -0.016135454177856445, -0.015431880950927734, -0.014728307723999023, -0.014024734497070312, -0.013321161270141602, -0.01261758804321289, -0.01191401481628418, -0.011210441589355469, -0.010506868362426758, -0.009803295135498047, -0.009099721908569336, -0.008396148681640625, -0.007692575454711914, -0.006989002227783203, -0.006285429000854492, -0.005581855773925781, -0.00487828254699707, -0.004174709320068359, -0.0034711360931396484, -0.0027675628662109375, -0.0020639896392822266, -0.0013604164123535156, -0.0006568431854248047, 4.673004150390625e-05, 0.0007503032684326172, 0.0014538764953613281, 0.002157449722290039, 0.00286102294921875, 0.003564596176147461, 0.004268169403076172, 0.004971742630004883, 0.005675315856933594, 0.006378889083862305, 0.007082462310791016, 0.0077860355377197266, 0.008489608764648438, 0.009193181991577148, 0.00989675521850586, 0.01060032844543457, 0.011303901672363281, 0.012007474899291992, 0.012711048126220703, 0.013414621353149414, 0.014118194580078125, 0.014821767807006836, 0.015525341033935547, 0.016228914260864258, 0.01693248748779297, 0.01763606071472168, 0.01833963394165039, 0.0190432071685791, 0.019746780395507812, 0.020450353622436523, 0.021153926849365234, 0.021857500076293945, 0.022561073303222656, 0.023264646530151367, 0.023968219757080078, 0.02467179298400879, 0.0253753662109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 10.0, 7.0, 12.0, 10.0, 15.0, 13.0, 31.0, 753.0, 22.0, 12.0, 7.0, 14.0, 10.0, 4.0, 6.0, 7.0, 5.0, 4.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014944076538085938, -0.0014466643333435059, -0.001398921012878418, -0.00135117769241333, -0.0013034343719482422, -0.0012556910514831543, -0.0012079477310180664, -0.0011602044105529785, -0.0011124610900878906, -0.0010647177696228027, -0.0010169744491577148, -0.000969231128692627, -0.0009214878082275391, -0.0008737444877624512, -0.0008260011672973633, -0.0007782578468322754, -0.0007305145263671875, -0.0006827712059020996, -0.0006350278854370117, -0.0005872845649719238, -0.0005395412445068359, -0.000491797924041748, -0.00044405460357666016, -0.00039631128311157227, -0.0003485679626464844, -0.0003008246421813965, -0.0002530813217163086, -0.0002053380012512207, -0.0001575946807861328, -0.00010985136032104492, -6.210803985595703e-05, -1.436471939086914e-05, 3.337860107421875e-05, 8.112192153930664e-05, 0.00012886524200439453, 0.00017660856246948242, 0.0002243518829345703, 0.0002720952033996582, 0.0003198385238647461, 0.000367581844329834, 0.0004153251647949219, 0.00046306848526000977, 0.0005108118057250977, 0.0005585551261901855, 0.0006062984466552734, 0.0006540417671203613, 0.0007017850875854492, 0.0007495284080505371, 0.000797271728515625, 0.0008450150489807129, 0.0008927583694458008, 0.0009405016899108887, 0.0009882450103759766, 0.0010359883308410645, 0.0010837316513061523, 0.0011314749717712402, 0.0011792182922363281, 0.001226961612701416, 0.001274704933166504, 0.0013224482536315918, 0.0013701915740966797, 0.0014179348945617676, 0.0014656782150268555, 0.0015134215354919434, 0.0015611648559570312]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 6.0, 11.0, 14.0, 21.0, 26.0, 38.0, 49.0, 58.0, 73.0, 118.0, 179.0, 275.0, 421.0, 762.0, 1422.0, 3273.0, 11801.0, 133313.0, 3877668.0, 145607.0, 12274.0, 3382.0, 1412.0, 754.0, 423.0, 252.0, 188.0, 127.0, 91.0, 68.0, 34.0, 30.0, 25.0, 21.0, 14.0, 9.0, 9.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.024169921875, -0.023448705673217773, -0.022727489471435547, -0.02200627326965332, -0.021285057067871094, -0.020563840866088867, -0.01984262466430664, -0.019121408462524414, -0.018400192260742188, -0.01767897605895996, -0.016957759857177734, -0.016236543655395508, -0.015515327453613281, -0.014794111251831055, -0.014072895050048828, -0.013351678848266602, -0.012630462646484375, -0.011909246444702148, -0.011188030242919922, -0.010466814041137695, -0.009745597839355469, -0.009024381637573242, -0.008303165435791016, -0.007581949234008789, -0.0068607330322265625, -0.006139516830444336, -0.005418300628662109, -0.004697084426879883, -0.003975868225097656, -0.0032546520233154297, -0.002533435821533203, -0.0018122196197509766, -0.00109100341796875, -0.00036978721618652344, 0.0003514289855957031, 0.0010726451873779297, 0.0017938613891601562, 0.002515077590942383, 0.0032362937927246094, 0.003957509994506836, 0.0046787261962890625, 0.005399942398071289, 0.006121158599853516, 0.006842374801635742, 0.007563591003417969, 0.008284807205200195, 0.009006023406982422, 0.009727239608764648, 0.010448455810546875, 0.011169672012329102, 0.011890888214111328, 0.012612104415893555, 0.013333320617675781, 0.014054536819458008, 0.014775753021240234, 0.015496969223022461, 0.016218185424804688, 0.016939401626586914, 0.01766061782836914, 0.018381834030151367, 0.019103050231933594, 0.01982426643371582, 0.020545482635498047, 0.021266698837280273, 0.0219879150390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 9.0, 9.0, 15.0, 12.0, 22.0, 21.0, 36.0, 32.0, 51.0, 66.0, 104.0, 120.0, 167.0, 193.0, 302.0, 570.0, 967.0, 401.0, 239.0, 183.0, 144.0, 79.0, 69.0, 55.0, 51.0, 29.0, 40.0, 22.0, 10.0, 8.0, 9.0, 10.0, 8.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0025920867919921875, -0.0025163888931274414, -0.0024406909942626953, -0.0023649930953979492, -0.002289295196533203, -0.002213597297668457, -0.002137899398803711, -0.002062201499938965, -0.0019865036010742188, -0.0019108057022094727, -0.0018351078033447266, -0.0017594099044799805, -0.0016837120056152344, -0.0016080141067504883, -0.0015323162078857422, -0.001456618309020996, -0.00138092041015625, -0.001305222511291504, -0.0012295246124267578, -0.0011538267135620117, -0.0010781288146972656, -0.0010024309158325195, -0.0009267330169677734, -0.0008510351181030273, -0.0007753372192382812, -0.0006996393203735352, -0.0006239414215087891, -0.000548243522644043, -0.0004725456237792969, -0.0003968477249145508, -0.0003211498260498047, -0.0002454519271850586, -0.0001697540283203125, -9.40561294555664e-05, -1.8358230590820312e-05, 5.733966827392578e-05, 0.00013303756713867188, 0.00020873546600341797, 0.00028443336486816406, 0.00036013126373291016, 0.00043582916259765625, 0.0005115270614624023, 0.0005872249603271484, 0.0006629228591918945, 0.0007386207580566406, 0.0008143186569213867, 0.0008900165557861328, 0.0009657144546508789, 0.001041412353515625, 0.001117110252380371, 0.0011928081512451172, 0.0012685060501098633, 0.0013442039489746094, 0.0014199018478393555, 0.0014955997467041016, 0.0015712976455688477, 0.0016469955444335938, 0.0017226934432983398, 0.001798391342163086, 0.001874089241027832, 0.0019497871398925781, 0.0020254850387573242, 0.0021011829376220703, 0.0021768808364868164, 0.0022525787353515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 21.0, 24.0, 56.0, 145.0, 251.0, 268.0, 123.0, 55.0, 23.0, 12.0, 5.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887498751282692, -0.03776520863175392, -0.036655426025390625, -0.03554564714431763, -0.03443586453795433, -0.03332608565688133, -0.032216303050518036, -0.031106524169445038, -0.02999674342572689, -0.028886962682008743, -0.027777181938290596, -0.02666740119457245, -0.02555762231349945, -0.024447839707136154, -0.023338060826063156, -0.02222828008234501, -0.02111849933862686, -0.020008718594908714, -0.018898937851190567, -0.01778915710747242, -0.016679376363754272, -0.0155695965513587, -0.014459816738963127, -0.01335003599524498, -0.012240255251526833, -0.011130474507808685, -0.010020693764090538, -0.008910913951694965, -0.007801133207976818, -0.006691352464258671, -0.005581572186201811, -0.004471791908144951, -0.003362007439136505, -0.0022522269282490015, -0.0011424464173614979, -3.2665906473994255e-05, 0.0010771146044135094, 0.0021868953481316566, 0.0032966756261885166, 0.004406455904245377, 0.005516236647963524, 0.006626017391681671, 0.007735797669738531, 0.008845577947795391, 0.009955358691513538, 0.011065139435231686, 0.012174919247627258, 0.013284699991345406, 0.014394480735063553, 0.0155042614787817, 0.016614042222499847, 0.017723822966217995, 0.018833603709936142, 0.01994338259100914, 0.021053163334727287, 0.022162944078445435, 0.023272724822163582, 0.02438250556588173, 0.025492286309599876, 0.026602067053318024, 0.02771184593439102, 0.028821628540754318, 0.029931407421827316, 0.031041188165545464, 0.03215096890926361]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 7.0, 5.0, 4.0, 5.0, 7.0, 5.0, 12.0, 14.0, 10.0, 13.0, 12.0, 40.0, 28.0, 28.0, 47.0, 31.0, 49.0, 45.0, 33.0, 45.0, 54.0, 56.0, 47.0, 56.0, 46.0, 38.0, 39.0, 43.0, 29.0, 24.0, 26.0, 25.0, 17.0, 12.0, 8.0, 7.0, 4.0, 14.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010569870471954346, -0.010247211903333664, -0.009924553334712982, -0.0096018947660923, -0.009279236197471619, -0.008956577628850937, -0.008633919060230255, -0.008311260491609573, -0.007988601922988892, -0.00766594335436821, -0.007343284785747528, -0.007020626217126846, -0.0066979676485061646, -0.006375309079885483, -0.006052650511264801, -0.005729991942644119, -0.0054073333740234375, -0.005084674805402756, -0.004762016236782074, -0.004439357668161392, -0.0041166990995407104, -0.0037940405309200287, -0.003471381962299347, -0.003148723393678665, -0.0028260648250579834, -0.0025034062564373016, -0.00218074768781662, -0.0018580891191959381, -0.0015354305505752563, -0.0012127719819545746, -0.0008901134133338928, -0.0005674548447132111, -0.0002447962760925293, 7.786229252815247e-05, 0.00040052086114883423, 0.000723179429769516, 0.0010458379983901978, 0.0013684965670108795, 0.0016911551356315613, 0.002013813704252243, 0.002336472272872925, 0.0026591308414936066, 0.0029817894101142883, 0.00330444797873497, 0.003627106547355652, 0.003949765115976334, 0.004272423684597015, 0.004595082253217697, 0.004917740821838379, 0.005240399390459061, 0.005563057959079742, 0.005885716527700424, 0.006208375096321106, 0.006531033664941788, 0.0068536922335624695, 0.007176350802183151, 0.007499009370803833, 0.007821667939424515, 0.008144326508045197, 0.008466985076665878, 0.00878964364528656, 0.009112302213907242, 0.009434960782527924, 0.009757619351148605, 0.010080277919769287]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 17.0, 14.0, 24.0, 34.0, 38.0, 58.0, 90.0, 117.0, 147.0, 204.0, 290.0, 390.0, 628.0, 902.0, 1330.0, 2223.0, 3608.0, 6576.0, 13349.0, 35932.0, 873521.0, 71017.0, 17790.0, 8226.0, 4489.0, 2699.0, 1569.0, 988.0, 684.0, 476.0, 319.0, 210.0, 131.0, 112.0, 87.0, 64.0, 45.0, 28.0, 27.0, 23.0, 14.0, 12.0, 7.0, 15.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0169677734375, -0.01643204689025879, -0.015896320343017578, -0.015360593795776367, -0.014824867248535156, -0.014289140701293945, -0.013753414154052734, -0.013217687606811523, -0.012681961059570312, -0.012146234512329102, -0.01161050796508789, -0.01107478141784668, -0.010539054870605469, -0.010003328323364258, -0.009467601776123047, -0.008931875228881836, -0.008396148681640625, -0.007860422134399414, -0.007324695587158203, -0.006788969039916992, -0.006253242492675781, -0.00571751594543457, -0.005181789398193359, -0.0046460628509521484, -0.0041103363037109375, -0.0035746097564697266, -0.0030388832092285156, -0.0025031566619873047, -0.0019674301147460938, -0.0014317035675048828, -0.0008959770202636719, -0.00036025047302246094, 0.00017547607421875, 0.0007112026214599609, 0.0012469291687011719, 0.0017826557159423828, 0.0023183822631835938, 0.0028541088104248047, 0.0033898353576660156, 0.0039255619049072266, 0.0044612884521484375, 0.0049970149993896484, 0.005532741546630859, 0.00606846809387207, 0.006604194641113281, 0.007139921188354492, 0.007675647735595703, 0.008211374282836914, 0.008747100830078125, 0.009282827377319336, 0.009818553924560547, 0.010354280471801758, 0.010890007019042969, 0.01142573356628418, 0.01196146011352539, 0.012497186660766602, 0.013032913208007812, 0.013568639755249023, 0.014104366302490234, 0.014640092849731445, 0.015175819396972656, 0.015711545944213867, 0.016247272491455078, 0.01678299903869629, 0.0173187255859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 7.0, 4.0, 6.0, 8.0, 4.0, 7.0, 7.0, 12.0, 16.0, 29.0, 131.0, 377.0, 245.0, 45.0, 21.0, 14.0, 7.0, 9.0, 5.0, 2.0, 9.0, 4.0, 1.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015516281127929688, -0.0015009045600891113, -0.001450181007385254, -0.0013994574546813965, -0.001348733901977539, -0.0012980103492736816, -0.0012472867965698242, -0.0011965632438659668, -0.0011458396911621094, -0.001095116138458252, -0.0010443925857543945, -0.0009936690330505371, -0.0009429454803466797, -0.0008922219276428223, -0.0008414983749389648, -0.0007907748222351074, -0.00074005126953125, -0.0006893277168273926, -0.0006386041641235352, -0.0005878806114196777, -0.0005371570587158203, -0.0004864335060119629, -0.00043570995330810547, -0.00038498640060424805, -0.0003342628479003906, -0.0002835392951965332, -0.00023281574249267578, -0.00018209218978881836, -0.00013136863708496094, -8.064508438110352e-05, -2.9921531677246094e-05, 2.0802021026611328e-05, 7.152557373046875e-05, 0.00012224912643432617, 0.0001729726791381836, 0.00022369623184204102, 0.00027441978454589844, 0.00032514333724975586, 0.0003758668899536133, 0.0004265904426574707, 0.0004773139953613281, 0.0005280375480651855, 0.000578761100769043, 0.0006294846534729004, 0.0006802082061767578, 0.0007309317588806152, 0.0007816553115844727, 0.0008323788642883301, 0.0008831024169921875, 0.0009338259696960449, 0.0009845495223999023, 0.0010352730751037598, 0.0010859966278076172, 0.0011367201805114746, 0.001187443733215332, 0.0012381672859191895, 0.0012888908386230469, 0.0013396143913269043, 0.0013903379440307617, 0.0014410614967346191, 0.0014917850494384766, 0.001542508602142334, 0.0015932321548461914, 0.0016439557075500488, 0.0016946792602539062]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 8.0, 9.0, 15.0, 17.0, 18.0, 34.0, 50.0, 48.0, 88.0, 93.0, 164.0, 252.0, 342.0, 531.0, 761.0, 1231.0, 2167.0, 4180.0, 10363.0, 50879.0, 840122.0, 110396.0, 14726.0, 5235.0, 2656.0, 1446.0, 863.0, 535.0, 386.0, 271.0, 187.0, 141.0, 92.0, 67.0, 48.0, 41.0, 25.0, 17.0, 14.0, 10.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0266876220703125, -0.025870084762573242, -0.025052547454833984, -0.024235010147094727, -0.02341747283935547, -0.02259993553161621, -0.021782398223876953, -0.020964860916137695, -0.020147323608398438, -0.01932978630065918, -0.018512248992919922, -0.017694711685180664, -0.016877174377441406, -0.01605963706970215, -0.01524209976196289, -0.014424562454223633, -0.013607025146484375, -0.012789487838745117, -0.01197195053100586, -0.011154413223266602, -0.010336875915527344, -0.009519338607788086, -0.008701801300048828, -0.00788426399230957, -0.0070667266845703125, -0.006249189376831055, -0.005431652069091797, -0.004614114761352539, -0.0037965774536132812, -0.0029790401458740234, -0.0021615028381347656, -0.0013439655303955078, -0.00052642822265625, 0.0002911090850830078, 0.0011086463928222656, 0.0019261837005615234, 0.0027437210083007812, 0.003561258316040039, 0.004378795623779297, 0.005196332931518555, 0.0060138702392578125, 0.00683140754699707, 0.007648944854736328, 0.008466482162475586, 0.009284019470214844, 0.010101556777954102, 0.01091909408569336, 0.011736631393432617, 0.012554168701171875, 0.013371706008911133, 0.01418924331665039, 0.015006780624389648, 0.015824317932128906, 0.016641855239868164, 0.017459392547607422, 0.01827692985534668, 0.019094467163085938, 0.019912004470825195, 0.020729541778564453, 0.02154707908630371, 0.02236461639404297, 0.023182153701782227, 0.023999691009521484, 0.024817228317260742, 0.025634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 2.0, 6.0, 11.0, 24.0, 17.0, 24.0, 20.0, 17.0, 35.0, 29.0, 30.0, 35.0, 37.0, 41.0, 40.0, 32.0, 44.0, 27.0, 46.0, 43.0, 45.0, 48.0, 50.0, 37.0, 31.0, 32.0, 27.0, 26.0, 20.0, 10.0, 25.0, 15.0, 11.0, 11.0, 4.0, 7.0, 3.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006847381591796875, -0.006637156009674072, -0.0064269304275512695, -0.006216704845428467, -0.006006479263305664, -0.005796253681182861, -0.005586028099060059, -0.005375802516937256, -0.005165576934814453, -0.00495535135269165, -0.004745125770568848, -0.004534900188446045, -0.004324674606323242, -0.0041144490242004395, -0.0039042234420776367, -0.003693997859954834, -0.0034837722778320312, -0.0032735466957092285, -0.0030633211135864258, -0.002853095531463623, -0.0026428699493408203, -0.0024326443672180176, -0.002222418785095215, -0.002012193202972412, -0.0018019676208496094, -0.0015917420387268066, -0.001381516456604004, -0.0011712908744812012, -0.0009610652923583984, -0.0007508397102355957, -0.000540614128112793, -0.00033038854598999023, -0.0001201629638671875, 9.006261825561523e-05, 0.00030028820037841797, 0.0005105137825012207, 0.0007207393646240234, 0.0009309649467468262, 0.001141190528869629, 0.0013514161109924316, 0.0015616416931152344, 0.0017718672752380371, 0.00198209285736084, 0.0021923184394836426, 0.0024025440216064453, 0.002612769603729248, 0.0028229951858520508, 0.0030332207679748535, 0.0032434463500976562, 0.003453671932220459, 0.0036638975143432617, 0.0038741230964660645, 0.004084348678588867, 0.00429457426071167, 0.004504799842834473, 0.004715025424957275, 0.004925251007080078, 0.005135476589202881, 0.005345702171325684, 0.005555927753448486, 0.005766153335571289, 0.005976378917694092, 0.0061866044998168945, 0.006396830081939697, 0.0066070556640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 11.0, 21.0, 33.0, 49.0, 82.0, 126.0, 235.0, 591.0, 1517.0, 6355.0, 153795.0, 872177.0, 10137.0, 2012.0, 735.0, 309.0, 154.0, 78.0, 45.0, 25.0, 27.0, 11.0, 7.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03720664978027344, -0.036083221435546875, -0.03495979309082031, -0.03383636474609375, -0.03271293640136719, -0.031589508056640625, -0.030466079711914062, -0.0293426513671875, -0.028219223022460938, -0.027095794677734375, -0.025972366333007812, -0.02484893798828125, -0.023725509643554688, -0.022602081298828125, -0.021478652954101562, -0.020355224609375, -0.019231796264648438, -0.018108367919921875, -0.016984939575195312, -0.01586151123046875, -0.014738082885742188, -0.013614654541015625, -0.012491226196289062, -0.0113677978515625, -0.010244369506835938, -0.009120941162109375, -0.007997512817382812, -0.00687408447265625, -0.0057506561279296875, -0.004627227783203125, -0.0035037994384765625, -0.00238037109375, -0.0012569427490234375, -0.000133514404296875, 0.0009899139404296875, 0.00211334228515625, 0.0032367706298828125, 0.004360198974609375, 0.0054836273193359375, 0.0066070556640625, 0.0077304840087890625, 0.008853912353515625, 0.009977340698242188, 0.01110076904296875, 0.012224197387695312, 0.013347625732421875, 0.014471054077148438, 0.015594482421875, 0.016717910766601562, 0.017841339111328125, 0.018964767456054688, 0.02008819580078125, 0.021211624145507812, 0.022335052490234375, 0.023458480834960938, 0.0245819091796875, 0.025705337524414062, 0.026828765869140625, 0.027952194213867188, 0.02907562255859375, 0.030199050903320312, 0.031322479248046875, 0.03244590759277344, 0.0335693359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 8.0, 2.0, 9.0, 6.0, 18.0, 15.0, 30.0, 24.0, 34.0, 38.0, 54.0, 80.0, 148.0, 154.0, 83.0, 63.0, 50.0, 45.0, 30.0, 21.0, 21.0, 8.0, 15.0, 9.0, 4.0, 7.0, 0.0, 3.0, 5.0, 3.0, 1.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003353118896484375, -0.0032486021518707275, -0.00314408540725708, -0.0030395686626434326, -0.002935051918029785, -0.0028305351734161377, -0.0027260184288024902, -0.0026215016841888428, -0.0025169849395751953, -0.002412468194961548, -0.0023079514503479004, -0.002203434705734253, -0.0020989179611206055, -0.001994401216506958, -0.0018898844718933105, -0.001785367727279663, -0.0016808509826660156, -0.0015763342380523682, -0.0014718174934387207, -0.0013673007488250732, -0.0012627840042114258, -0.0011582672595977783, -0.0010537505149841309, -0.0009492337703704834, -0.0008447170257568359, -0.0007402002811431885, -0.000635683536529541, -0.0005311667919158936, -0.0004266500473022461, -0.00032213330268859863, -0.00021761655807495117, -0.00011309981346130371, -8.58306884765625e-06, 9.593367576599121e-05, 0.00020045042037963867, 0.00030496716499328613, 0.0004094839096069336, 0.0005140006542205811, 0.0006185173988342285, 0.000723034143447876, 0.0008275508880615234, 0.0009320676326751709, 0.0010365843772888184, 0.0011411011219024658, 0.0012456178665161133, 0.0013501346111297607, 0.0014546513557434082, 0.0015591681003570557, 0.0016636848449707031, 0.0017682015895843506, 0.001872718334197998, 0.0019772350788116455, 0.002081751823425293, 0.0021862685680389404, 0.002290785312652588, 0.0023953020572662354, 0.002499818801879883, 0.0026043355464935303, 0.0027088522911071777, 0.002813369035720825, 0.0029178857803344727, 0.00302240252494812, 0.0031269192695617676, 0.003231436014175415, 0.0033359527587890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 13.0, 25.0, 28.0, 35.0, 58.0, 83.0, 104.0, 178.0, 455.0, 806.0, 2521.0, 12330.0, 904569.0, 116749.0, 7190.0, 1893.0, 641.0, 331.0, 179.0, 119.0, 78.0, 38.0, 24.0, 14.0, 19.0, 15.0, 21.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.039581298828125, -0.03805065155029297, -0.03652000427246094, -0.034989356994628906, -0.033458709716796875, -0.031928062438964844, -0.030397415161132812, -0.02886676788330078, -0.02733612060546875, -0.02580547332763672, -0.024274826049804688, -0.022744178771972656, -0.021213531494140625, -0.019682884216308594, -0.018152236938476562, -0.01662158966064453, -0.0150909423828125, -0.013560295104980469, -0.012029647827148438, -0.010499000549316406, -0.008968353271484375, -0.007437705993652344, -0.0059070587158203125, -0.004376411437988281, -0.00284576416015625, -0.0013151168823242188, 0.0002155303955078125, 0.0017461776733398438, 0.003276824951171875, 0.004807472229003906, 0.0063381195068359375, 0.007868766784667969, 0.0093994140625, 0.010930061340332031, 0.012460708618164062, 0.013991355895996094, 0.015522003173828125, 0.017052650451660156, 0.018583297729492188, 0.02011394500732422, 0.02164459228515625, 0.02317523956298828, 0.024705886840820312, 0.026236534118652344, 0.027767181396484375, 0.029297828674316406, 0.030828475952148438, 0.03235912322998047, 0.0338897705078125, 0.03542041778564453, 0.03695106506347656, 0.038481712341308594, 0.040012359619140625, 0.041543006896972656, 0.04307365417480469, 0.04460430145263672, 0.04613494873046875, 0.04766559600830078, 0.04919624328613281, 0.050726890563964844, 0.052257537841796875, 0.053788185119628906, 0.05531883239746094, 0.05684947967529297, 0.058380126953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 9.0, 18.0, 20.0, 42.0, 152.0, 334.0, 206.0, 78.0, 29.0, 22.0, 16.0, 13.0, 14.0, 5.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271453857421875, -0.026406288146972656, -0.025667190551757812, -0.02492809295654297, -0.024188995361328125, -0.02344989776611328, -0.022710800170898438, -0.021971702575683594, -0.02123260498046875, -0.020493507385253906, -0.019754409790039062, -0.01901531219482422, -0.018276214599609375, -0.01753711700439453, -0.016798019409179688, -0.016058921813964844, -0.01531982421875, -0.014580726623535156, -0.013841629028320312, -0.013102531433105469, -0.012363433837890625, -0.011624336242675781, -0.010885238647460938, -0.010146141052246094, -0.00940704345703125, -0.008667945861816406, -0.007928848266601562, -0.007189750671386719, -0.006450653076171875, -0.005711555480957031, -0.0049724578857421875, -0.004233360290527344, -0.0034942626953125, -0.0027551651000976562, -0.0020160675048828125, -0.0012769699096679688, -0.000537872314453125, 0.00020122528076171875, 0.0009403228759765625, 0.0016794204711914062, 0.00241851806640625, 0.0031576156616210938, 0.0038967132568359375, 0.004635810852050781, 0.005374908447265625, 0.006114006042480469, 0.0068531036376953125, 0.007592201232910156, 0.008331298828125, 0.009070396423339844, 0.009809494018554688, 0.010548591613769531, 0.011287689208984375, 0.012026786804199219, 0.012765884399414062, 0.013504981994628906, 0.01424407958984375, 0.014983177185058594, 0.015722274780273438, 0.01646137237548828, 0.017200469970703125, 0.01793956756591797, 0.018678665161132812, 0.019417762756347656, 0.0201568603515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 26.0, 59.0, 207.0, 542.0, 93.0, 22.0, 12.0, 5.0, 4.0, 0.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.38651442527770996, -0.3774142563343048, -0.36831408739089966, -0.3592139184474945, -0.35011374950408936, -0.3410135805606842, -0.33191341161727905, -0.3228132426738739, -0.31371307373046875, -0.3046129047870636, -0.29551273584365845, -0.2864125669002533, -0.27731239795684814, -0.268212229013443, -0.25911206007003784, -0.2500118911266327, -0.24091173708438873, -0.23181156814098358, -0.22271139919757843, -0.21361123025417328, -0.20451106131076813, -0.19541089236736298, -0.18631073832511902, -0.17721056938171387, -0.16811040043830872, -0.15901023149490356, -0.1499100625514984, -0.14080989360809326, -0.1317097246646881, -0.12260955572128296, -0.1135093942284584, -0.10440922528505325, -0.0953090488910675, -0.08620887994766235, -0.0771087110042572, -0.06800854206085205, -0.0589083768427372, -0.049808207899332047, -0.040708042681217194, -0.03160787373781204, -0.02250770479440689, -0.013407536782324314, -0.004307368770241737, 0.004792798310518265, 0.013892967253923416, 0.022993136197328568, 0.03209330141544342, 0.04119347035884857, 0.05029363930225372, 0.059393808245658875, 0.06849397718906403, 0.07759414613246918, 0.08669431507587433, 0.09579448401927948, 0.10489464551210403, 0.11399481445550919, 0.12309498339891434, 0.1321951448917389, 0.14129531383514404, 0.1503954827785492, 0.15949565172195435, 0.1685958206653595, 0.17769598960876465, 0.1867961585521698, 0.19589632749557495]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 2.0, 4.0, 7.0, 9.0, 7.0, 17.0, 21.0, 33.0, 59.0, 73.0, 107.0, 105.0, 139.0, 118.0, 65.0, 72.0, 20.0, 38.0, 17.0, 11.0, 9.0, 12.0, 4.0, 9.0, 9.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12486505508422852, -0.12102162837982178, -0.11717820912599564, -0.1133347824215889, -0.10949136316776276, -0.10564793646335602, -0.10180450975894928, -0.09796108305454254, -0.0941176638007164, -0.09027423709630966, -0.08643081784248352, -0.08258739113807678, -0.07874396443367004, -0.0749005451798439, -0.07105711847543716, -0.06721369922161102, -0.06337027251720428, -0.059526849538087845, -0.055683426558971405, -0.05183999985456467, -0.04799657687544823, -0.04415315389633179, -0.04030972719192505, -0.03646630421280861, -0.03262288123369217, -0.02877945825457573, -0.02493603341281414, -0.02109260857105255, -0.01724918559193611, -0.013405762612819672, -0.009562337771058083, -0.0057189129292964935, -0.0018754899501800537, 0.0019679339602589607, 0.005811357870697975, 0.00965478178113699, 0.013498205691576004, 0.017341628670692444, 0.021185053512454033, 0.025028478354215622, 0.028871901333332062, 0.0327153243124485, 0.03655874729156494, 0.04040217399597168, 0.04424559697508812, 0.04808901995420456, 0.0519324466586113, 0.05577586963772774, 0.05961929261684418, 0.06346271932125092, 0.06730613857507706, 0.0711495652794838, 0.07499298453330994, 0.07883641123771667, 0.08267983794212341, 0.08652326464653015, 0.09036668390035629, 0.09421011060476303, 0.09805352985858917, 0.10189695656299591, 0.10574038326740265, 0.10958380252122879, 0.11342722922563553, 0.11727064847946167, 0.12111407518386841]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 9.0, 10.0, 17.0, 19.0, 21.0, 26.0, 47.0, 169.0, 2220.0, 4129894.0, 60744.0, 791.0, 112.0, 47.0, 37.0, 17.0, 18.0, 21.0, 8.0, 3.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.962127685546875, -1.88909912109375, -1.816070556640625, -1.7430419921875, -1.670013427734375, -1.59698486328125, -1.523956298828125, -1.450927734375, -1.377899169921875, -1.30487060546875, -1.231842041015625, -1.1588134765625, -1.085784912109375, -1.01275634765625, -0.939727783203125, -0.86669921875, -0.793670654296875, -0.72064208984375, -0.647613525390625, -0.5745849609375, -0.501556396484375, -0.42852783203125, -0.355499267578125, -0.282470703125, -0.209442138671875, -0.13641357421875, -0.063385009765625, 0.0096435546875, 0.082672119140625, 0.15570068359375, 0.228729248046875, 0.3017578125, 0.374786376953125, 0.44781494140625, 0.520843505859375, 0.5938720703125, 0.666900634765625, 0.73992919921875, 0.812957763671875, 0.885986328125, 0.959014892578125, 1.03204345703125, 1.105072021484375, 1.1781005859375, 1.251129150390625, 1.32415771484375, 1.397186279296875, 1.47021484375, 1.543243408203125, 1.61627197265625, 1.689300537109375, 1.7623291015625, 1.835357666015625, 1.90838623046875, 1.981414794921875, 2.054443359375, 2.127471923828125, 2.20050048828125, 2.273529052734375, 2.3465576171875, 2.419586181640625, 2.49261474609375, 2.565643310546875, 2.638671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 2.0, 0.0, 6.0, 6.0, 7.0, 5.0, 4.0, 15.0, 17.0, 30.0, 54.0, 124.0, 178.0, 217.0, 109.0, 71.0, 46.0, 18.0, 17.0, 5.0, 7.0, 7.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010204315185546875, -0.0009855031967163086, -0.0009505748748779297, -0.0009156465530395508, -0.0008807182312011719, -0.000845789909362793, -0.0008108615875244141, -0.0007759332656860352, -0.0007410049438476562, -0.0007060766220092773, -0.0006711483001708984, -0.0006362199783325195, -0.0006012916564941406, -0.0005663633346557617, -0.0005314350128173828, -0.0004965066909790039, -0.000461578369140625, -0.0004266500473022461, -0.0003917217254638672, -0.0003567934036254883, -0.0003218650817871094, -0.00028693675994873047, -0.00025200843811035156, -0.00021708011627197266, -0.00018215179443359375, -0.00014722347259521484, -0.00011229515075683594, -7.736682891845703e-05, -4.2438507080078125e-05, -7.510185241699219e-06, 2.7418136596679688e-05, 6.23464584350586e-05, 9.72747802734375e-05, 0.0001322031021118164, 0.0001671314239501953, 0.00020205974578857422, 0.00023698806762695312, 0.00027191638946533203, 0.00030684471130371094, 0.00034177303314208984, 0.00037670135498046875, 0.00041162967681884766, 0.00044655799865722656, 0.00048148632049560547, 0.0005164146423339844, 0.0005513429641723633, 0.0005862712860107422, 0.0006211996078491211, 0.0006561279296875, 0.0006910562515258789, 0.0007259845733642578, 0.0007609128952026367, 0.0007958412170410156, 0.0008307695388793945, 0.0008656978607177734, 0.0009006261825561523, 0.0009355545043945312, 0.0009704828262329102, 0.001005411148071289, 0.001040339469909668, 0.0010752677917480469, 0.0011101961135864258, 0.0011451244354248047, 0.0011800527572631836, 0.0012149810791015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 8.0, 16.0, 21.0, 22.0, 29.0, 42.0, 54.0, 72.0, 85.0, 133.0, 201.0, 2060.0, 4170460.0, 19588.0, 565.0, 182.0, 139.0, 124.0, 86.0, 78.0, 63.0, 55.0, 46.0, 36.0, 28.0, 19.0, 17.0, 9.0, 4.0, 9.0, 5.0, 3.0, 1.0, 6.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3271484375, -0.31390380859375, -0.3006591796875, -0.28741455078125, -0.274169921875, -0.26092529296875, -0.2476806640625, -0.23443603515625, -0.22119140625, -0.20794677734375, -0.1947021484375, -0.18145751953125, -0.168212890625, -0.15496826171875, -0.1417236328125, -0.12847900390625, -0.115234375, -0.10198974609375, -0.0887451171875, -0.07550048828125, -0.062255859375, -0.04901123046875, -0.0357666015625, -0.02252197265625, -0.00927734375, 0.00396728515625, 0.0172119140625, 0.03045654296875, 0.043701171875, 0.05694580078125, 0.0701904296875, 0.08343505859375, 0.0966796875, 0.10992431640625, 0.1231689453125, 0.13641357421875, 0.149658203125, 0.16290283203125, 0.1761474609375, 0.18939208984375, 0.20263671875, 0.21588134765625, 0.2291259765625, 0.24237060546875, 0.255615234375, 0.26885986328125, 0.2821044921875, 0.29534912109375, 0.30859375, 0.32183837890625, 0.3350830078125, 0.34832763671875, 0.361572265625, 0.37481689453125, 0.3880615234375, 0.40130615234375, 0.41455078125, 0.42779541015625, 0.4410400390625, 0.45428466796875, 0.467529296875, 0.48077392578125, 0.4940185546875, 0.50726318359375, 0.5205078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 13.0, 19.0, 28.0, 30.0, 45.0, 72.0, 81.0, 106.0, 150.0, 220.0, 289.0, 1346.0, 479.0, 242.0, 168.0, 143.0, 118.0, 97.0, 78.0, 68.0, 59.0, 47.0, 37.0, 29.0, 25.0, 12.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002529144287109375, -0.0024268031120300293, -0.0023244619369506836, -0.002222120761871338, -0.002119779586791992, -0.0020174384117126465, -0.0019150972366333008, -0.001812756061553955, -0.0017104148864746094, -0.0016080737113952637, -0.001505732536315918, -0.0014033913612365723, -0.0013010501861572266, -0.0011987090110778809, -0.0010963678359985352, -0.0009940266609191895, -0.0008916854858398438, -0.000789344310760498, -0.0006870031356811523, -0.0005846619606018066, -0.00048232078552246094, -0.00037997961044311523, -0.00027763843536376953, -0.00017529726028442383, -7.295608520507812e-05, 2.9385089874267578e-05, 0.00013172626495361328, 0.00023406744003295898, 0.0003364086151123047, 0.0004387497901916504, 0.0005410909652709961, 0.0006434321403503418, 0.0007457733154296875, 0.0008481144905090332, 0.0009504556655883789, 0.0010527968406677246, 0.0011551380157470703, 0.001257479190826416, 0.0013598203659057617, 0.0014621615409851074, 0.0015645027160644531, 0.0016668438911437988, 0.0017691850662231445, 0.0018715262413024902, 0.001973867416381836, 0.0020762085914611816, 0.0021785497665405273, 0.002280890941619873, 0.0023832321166992188, 0.0024855732917785645, 0.00258791446685791, 0.002690255641937256, 0.0027925968170166016, 0.0028949379920959473, 0.002997279167175293, 0.0030996203422546387, 0.0032019615173339844, 0.00330430269241333, 0.0034066438674926758, 0.0035089850425720215, 0.003611326217651367, 0.003713667392730713, 0.0038160085678100586, 0.003918349742889404, 0.00402069091796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 734.0, 249.0, 25.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09924425184726715, -0.06409721076488495, -0.028950177133083344, 0.006196856498718262, 0.041343897581100464, 0.07649093866348267, 0.11163796484470367, 0.14678500592708588, 0.18193204700946808, 0.21707908809185028, 0.2522261142730713, 0.2873731553554535, 0.3225201964378357, 0.3576672375202179, 0.3928142786026001, 0.4279612898826599, 0.4631083607673645, 0.4982554018497467, 0.5334024429321289, 0.5685494542121887, 0.6036965250968933, 0.6388435363769531, 0.6739906072616577, 0.7091376185417175, 0.7442846298217773, 0.7794316411018372, 0.8145787119865417, 0.8497257232666016, 0.8848727941513062, 0.920019805431366, 0.9551668167114258, 0.9903138875961304, 1.0254608392715454, 1.06060791015625, 1.095754861831665, 1.1309019327163696, 1.1660490036010742, 1.2011960744857788, 1.2363430261611938, 1.2714900970458984, 1.306637167930603, 1.3417842388153076, 1.3769311904907227, 1.4120782613754272, 1.4472253322601318, 1.4823724031448364, 1.5175193548202515, 1.552666425704956, 1.587813377380371, 1.6229604482650757, 1.6581073999404907, 1.6932544708251953, 1.7284015417099, 1.7635486125946045, 1.7986955642700195, 1.8338426351547241, 1.8689897060394287, 1.9041367769241333, 1.9392837285995483, 1.974430799484253, 2.009577751159668, 2.044724941253662, 2.079871892929077, 2.115018844604492, 2.1501660346984863]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 11.0, 12.0, 16.0, 14.0, 36.0, 46.0, 65.0, 84.0, 106.0, 100.0, 121.0, 92.0, 82.0, 69.0, 56.0, 39.0, 17.0, 11.0, 5.0, 11.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771322250366211, -0.07387250661849976, -0.07061278820037842, -0.06735306978225708, -0.06409335136413574, -0.060833629220724106, -0.05757390707731247, -0.05431418865919113, -0.051054470241069794, -0.047794751822948456, -0.04453503340482712, -0.04127531126141548, -0.038015592843294144, -0.034755874425172806, -0.03149615228176117, -0.02823643386363983, -0.024976715445518494, -0.021716997027397156, -0.01845727674663067, -0.015197557397186756, -0.011937838047742844, -0.008678119629621506, -0.005418399348855019, -0.0021586790680885315, 0.0011010393500328064, 0.004360758699476719, 0.007620478048920631, 0.010880197398364544, 0.014139916747808456, 0.017399635165929794, 0.02065935544669628, 0.02391907572746277, 0.027178794145584106, 0.030438512563705444, 0.03369823098182678, 0.03695795312523842, 0.040217671543359756, 0.043477389961481094, 0.04673711210489273, 0.04999683052301407, 0.053256548941135406, 0.056516267359256744, 0.05977598577737808, 0.06303570419549942, 0.06629543006420135, 0.06955514848232269, 0.07281486690044403, 0.07607458531856537, 0.0793343037366867, 0.08259402215480804, 0.08585374057292938, 0.08911345899105072, 0.09237317740917206, 0.0956328958272934, 0.09889262169599533, 0.10215234011411667, 0.105412058532238, 0.10867177695035934, 0.11193149536848068, 0.11519121378660202, 0.11845093965530396, 0.12171065807342529, 0.12497037649154663, 0.12823009490966797, 0.1314898133277893]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 9.0, 8.0, 13.0, 14.0, 27.0, 28.0, 28.0, 52.0, 76.0, 92.0, 107.0, 196.0, 235.0, 315.0, 458.0, 673.0, 990.0, 1485.0, 2446.0, 4091.0, 7072.0, 14600.0, 48956.0, 818299.0, 106689.0, 19515.0, 8881.0, 4802.0, 2794.0, 1767.0, 1146.0, 750.0, 505.0, 413.0, 253.0, 192.0, 155.0, 113.0, 67.0, 70.0, 51.0, 31.0, 18.0, 17.0, 22.0, 10.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0219268798828125, -0.0212554931640625, -0.0205841064453125, -0.0199127197265625, -0.0192413330078125, -0.0185699462890625, -0.0178985595703125, -0.0172271728515625, -0.0165557861328125, -0.0158843994140625, -0.0152130126953125, -0.0145416259765625, -0.0138702392578125, -0.0131988525390625, -0.0125274658203125, -0.0118560791015625, -0.0111846923828125, -0.0105133056640625, -0.0098419189453125, -0.0091705322265625, -0.0084991455078125, -0.0078277587890625, -0.0071563720703125, -0.0064849853515625, -0.0058135986328125, -0.0051422119140625, -0.0044708251953125, -0.0037994384765625, -0.0031280517578125, -0.0024566650390625, -0.0017852783203125, -0.0011138916015625, -0.0004425048828125, 0.0002288818359375, 0.0009002685546875, 0.0015716552734375, 0.0022430419921875, 0.0029144287109375, 0.0035858154296875, 0.0042572021484375, 0.0049285888671875, 0.0055999755859375, 0.0062713623046875, 0.0069427490234375, 0.0076141357421875, 0.0082855224609375, 0.0089569091796875, 0.0096282958984375, 0.0102996826171875, 0.0109710693359375, 0.0116424560546875, 0.0123138427734375, 0.0129852294921875, 0.0136566162109375, 0.0143280029296875, 0.0149993896484375, 0.0156707763671875, 0.0163421630859375, 0.0170135498046875, 0.0176849365234375, 0.0183563232421875, 0.0190277099609375, 0.0196990966796875, 0.0203704833984375, 0.0210418701171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 3.0, 5.0, 7.0, 8.0, 8.0, 8.0, 11.0, 18.0, 33.0, 67.0, 130.0, 213.0, 200.0, 114.0, 55.0, 25.0, 11.0, 10.0, 6.0, 10.0, 5.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011262893676757812, -0.0010872185230255127, -0.0010481476783752441, -0.0010090768337249756, -0.000970005989074707, -0.0009309351444244385, -0.0008918642997741699, -0.0008527934551239014, -0.0008137226104736328, -0.0007746517658233643, -0.0007355809211730957, -0.0006965100765228271, -0.0006574392318725586, -0.00061836838722229, -0.0005792975425720215, -0.0005402266979217529, -0.0005011558532714844, -0.0004620850086212158, -0.00042301416397094727, -0.0003839433193206787, -0.00034487247467041016, -0.0003058016300201416, -0.00026673078536987305, -0.0002276599407196045, -0.00018858909606933594, -0.00014951825141906738, -0.00011044740676879883, -7.137656211853027e-05, -3.230571746826172e-05, 6.765127182006836e-06, 4.583597183227539e-05, 8.490681648254395e-05, 0.0001239776611328125, 0.00016304850578308105, 0.0002021193504333496, 0.00024119019508361816, 0.0002802610397338867, 0.0003193318843841553, 0.00035840272903442383, 0.0003974735736846924, 0.00043654441833496094, 0.0004756152629852295, 0.000514686107635498, 0.0005537569522857666, 0.0005928277969360352, 0.0006318986415863037, 0.0006709694862365723, 0.0007100403308868408, 0.0007491111755371094, 0.0007881820201873779, 0.0008272528648376465, 0.000866323709487915, 0.0009053945541381836, 0.0009444653987884521, 0.0009835362434387207, 0.0010226070880889893, 0.0010616779327392578, 0.0011007487773895264, 0.001139819622039795, 0.0011788904666900635, 0.001217961311340332, 0.0012570321559906006, 0.0012961030006408691, 0.0013351738452911377, 0.0013742446899414062]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 16.0, 16.0, 16.0, 11.0, 13.0, 23.0, 24.0, 30.0, 35.0, 39.0, 40.0, 122.0, 627.0, 4079.0, 196423.0, 838584.0, 7055.0, 855.0, 176.0, 59.0, 34.0, 33.0, 25.0, 20.0, 17.0, 24.0, 11.0, 17.0, 13.0, 8.0, 12.0, 6.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.05023193359375, -0.04856395721435547, -0.04689598083496094, -0.045228004455566406, -0.043560028076171875, -0.041892051696777344, -0.04022407531738281, -0.03855609893798828, -0.03688812255859375, -0.03522014617919922, -0.03355216979980469, -0.031884193420410156, -0.030216217041015625, -0.028548240661621094, -0.026880264282226562, -0.02521228790283203, -0.0235443115234375, -0.02187633514404297, -0.020208358764648438, -0.018540382385253906, -0.016872406005859375, -0.015204429626464844, -0.013536453247070312, -0.011868476867675781, -0.01020050048828125, -0.008532524108886719, -0.0068645477294921875, -0.005196571350097656, -0.003528594970703125, -0.0018606185913085938, -0.0001926422119140625, 0.0014753341674804688, 0.003143310546875, 0.004811286926269531, 0.0064792633056640625, 0.008147239685058594, 0.009815216064453125, 0.011483192443847656, 0.013151168823242188, 0.014819145202636719, 0.01648712158203125, 0.01815509796142578, 0.019823074340820312, 0.021491050720214844, 0.023159027099609375, 0.024827003479003906, 0.026494979858398438, 0.02816295623779297, 0.0298309326171875, 0.03149890899658203, 0.03316688537597656, 0.034834861755371094, 0.036502838134765625, 0.038170814514160156, 0.03983879089355469, 0.04150676727294922, 0.04317474365234375, 0.04484272003173828, 0.04651069641113281, 0.048178672790527344, 0.049846649169921875, 0.051514625549316406, 0.05318260192871094, 0.05485057830810547, 0.0565185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 11.0, 11.0, 11.0, 18.0, 20.0, 15.0, 19.0, 28.0, 31.0, 24.0, 20.0, 27.0, 29.0, 31.0, 38.0, 36.0, 36.0, 35.0, 42.0, 32.0, 41.0, 38.0, 41.0, 49.0, 34.0, 30.0, 30.0, 22.0, 30.0, 22.0, 22.0, 18.0, 21.0, 4.0, 9.0, 9.0, 8.0, 13.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.004161834716796875, -0.004039019346237183, -0.00391620397567749, -0.003793388605117798, -0.0036705732345581055, -0.003547757863998413, -0.0034249424934387207, -0.0033021271228790283, -0.003179311752319336, -0.0030564963817596436, -0.002933681011199951, -0.002810865640640259, -0.0026880502700805664, -0.002565234899520874, -0.0024424195289611816, -0.0023196041584014893, -0.002196788787841797, -0.0020739734172821045, -0.0019511580467224121, -0.0018283426761627197, -0.0017055273056030273, -0.001582711935043335, -0.0014598965644836426, -0.0013370811939239502, -0.0012142658233642578, -0.0010914504528045654, -0.000968635082244873, -0.0008458197116851807, -0.0007230043411254883, -0.0006001889705657959, -0.0004773736000061035, -0.00035455822944641113, -0.00023174285888671875, -0.00010892748832702637, 1.3887882232666016e-05, 0.0001367032527923584, 0.0002595186233520508, 0.00038233399391174316, 0.0005051493644714355, 0.0006279647350311279, 0.0007507801055908203, 0.0008735954761505127, 0.000996410846710205, 0.0011192262172698975, 0.0012420415878295898, 0.0013648569583892822, 0.0014876723289489746, 0.001610487699508667, 0.0017333030700683594, 0.0018561184406280518, 0.001978933811187744, 0.0021017491817474365, 0.002224564552307129, 0.0023473799228668213, 0.0024701952934265137, 0.002593010663986206, 0.0027158260345458984, 0.002838641405105591, 0.002961456775665283, 0.0030842721462249756, 0.003207087516784668, 0.0033299028873443604, 0.0034527182579040527, 0.003575533628463745, 0.0036983489990234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 17.0, 30.0, 29.0, 59.0, 140.0, 508.0, 2911.0, 123239.0, 915083.0, 5427.0, 684.0, 215.0, 77.0, 35.0, 22.0, 10.0, 15.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038360595703125, -0.03694629669189453, -0.03553199768066406, -0.034117698669433594, -0.032703399658203125, -0.031289100646972656, -0.029874801635742188, -0.02846050262451172, -0.02704620361328125, -0.02563190460205078, -0.024217605590820312, -0.022803306579589844, -0.021389007568359375, -0.019974708557128906, -0.018560409545898438, -0.01714611053466797, -0.0157318115234375, -0.014317512512207031, -0.012903213500976562, -0.011488914489746094, -0.010074615478515625, -0.008660316467285156, -0.0072460174560546875, -0.005831718444824219, -0.00441741943359375, -0.0030031204223632812, -0.0015888214111328125, -0.00017452239990234375, 0.001239776611328125, 0.0026540756225585938, 0.0040683746337890625, 0.005482673645019531, 0.00689697265625, 0.008311271667480469, 0.009725570678710938, 0.011139869689941406, 0.012554168701171875, 0.013968467712402344, 0.015382766723632812, 0.01679706573486328, 0.01821136474609375, 0.01962566375732422, 0.021039962768554688, 0.022454261779785156, 0.023868560791015625, 0.025282859802246094, 0.026697158813476562, 0.02811145782470703, 0.0295257568359375, 0.03094005584716797, 0.03235435485839844, 0.033768653869628906, 0.035182952880859375, 0.036597251892089844, 0.03801155090332031, 0.03942584991455078, 0.04084014892578125, 0.04225444793701172, 0.04366874694824219, 0.045083045959472656, 0.046497344970703125, 0.047911643981933594, 0.04932594299316406, 0.05074024200439453, 0.052154541015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 4.0, 6.0, 3.0, 4.0, 10.0, 8.0, 18.0, 16.0, 27.0, 56.0, 158.0, 359.0, 162.0, 52.0, 18.0, 16.0, 11.0, 14.0, 8.0, 11.0, 2.0, 5.0, 3.0, 3.0, 5.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008607730269432068, -0.0008208006620407104, -0.0007808282971382141, -0.0007408559322357178, -0.0007008835673332214, -0.0006609112024307251, -0.0006209388375282288, -0.0005809664726257324, -0.0005409941077232361, -0.0005010217428207397, -0.0004610493779182434, -0.00042107701301574707, -0.00038110464811325073, -0.0003411322832107544, -0.00030115991830825806, -0.0002611875534057617, -0.00022121518850326538, -0.00018124282360076904, -0.0001412704586982727, -0.00010129809379577637, -6.132572889328003e-05, -2.135336399078369e-05, 1.8619000911712646e-05, 5.8591365814208984e-05, 9.856373071670532e-05, 0.00013853609561920166, 0.000178508460521698, 0.00021848082542419434, 0.0002584531903266907, 0.000298425555229187, 0.00033839792013168335, 0.0003783702850341797, 0.000418342649936676, 0.00045831501483917236, 0.0004982873797416687, 0.000538259744644165, 0.0005782321095466614, 0.0006182044744491577, 0.000658176839351654, 0.0006981492042541504, 0.0007381215691566467, 0.0007780939340591431, 0.0008180662989616394, 0.0008580386638641357, 0.0008980110287666321, 0.0009379833936691284, 0.0009779557585716248, 0.001017928123474121, 0.0010579004883766174, 0.0010978728532791138, 0.00113784521818161, 0.0011778175830841064, 0.0012177899479866028, 0.0012577623128890991, 0.0012977346777915955, 0.0013377070426940918, 0.0013776794075965881, 0.0014176517724990845, 0.0014576241374015808, 0.0014975965023040771, 0.0015375688672065735, 0.0015775412321090698, 0.0016175135970115662, 0.0016574859619140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 8.0, 13.0, 9.0, 23.0, 24.0, 51.0, 126.0, 473.0, 3267.0, 823387.0, 218284.0, 2304.0, 339.0, 117.0, 50.0, 27.0, 22.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031158447265625, -0.02973794937133789, -0.02831745147705078, -0.026896953582763672, -0.025476455688476562, -0.024055957794189453, -0.022635459899902344, -0.021214962005615234, -0.019794464111328125, -0.018373966217041016, -0.016953468322753906, -0.015532970428466797, -0.014112472534179688, -0.012691974639892578, -0.011271476745605469, -0.00985097885131836, -0.00843048095703125, -0.007009983062744141, -0.005589485168457031, -0.004168987274169922, -0.0027484893798828125, -0.0013279914855957031, 9.250640869140625e-05, 0.0015130043029785156, 0.002933502197265625, 0.004354000091552734, 0.005774497985839844, 0.007194995880126953, 0.008615493774414062, 0.010035991668701172, 0.011456489562988281, 0.01287698745727539, 0.0142974853515625, 0.01571798324584961, 0.01713848114013672, 0.018558979034423828, 0.019979476928710938, 0.021399974822998047, 0.022820472717285156, 0.024240970611572266, 0.025661468505859375, 0.027081966400146484, 0.028502464294433594, 0.029922962188720703, 0.03134346008300781, 0.03276395797729492, 0.03418445587158203, 0.03560495376586914, 0.03702545166015625, 0.03844594955444336, 0.03986644744873047, 0.04128694534301758, 0.04270744323730469, 0.0441279411315918, 0.045548439025878906, 0.046968936920166016, 0.048389434814453125, 0.049809932708740234, 0.051230430603027344, 0.05265092849731445, 0.05407142639160156, 0.05549192428588867, 0.05691242218017578, 0.05833292007446289, 0.05975341796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 16.0, 18.0, 18.0, 34.0, 36.0, 68.0, 71.0, 121.0, 164.0, 124.0, 102.0, 54.0, 37.0, 26.0, 22.0, 20.0, 8.0, 6.0, 9.0, 4.0, 2.0, 8.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004147708415985107, -0.003984808921813965, -0.0038219094276428223, -0.0036590099334716797, -0.003496110439300537, -0.0033332109451293945, -0.003170311450958252, -0.0030074119567871094, -0.002844512462615967, -0.0026816129684448242, -0.0025187134742736816, -0.002355813980102539, -0.0021929144859313965, -0.002030014991760254, -0.0018671154975891113, -0.0017042160034179688, -0.0015413165092468262, -0.0013784170150756836, -0.001215517520904541, -0.0010526180267333984, -0.0008897185325622559, -0.0007268190383911133, -0.0005639195442199707, -0.0004010200500488281, -0.00023812055587768555, -7.522106170654297e-05, 8.767843246459961e-05, 0.0002505779266357422, 0.00041347742080688477, 0.0005763769149780273, 0.0007392764091491699, 0.0009021759033203125, 0.001065075397491455, 0.0012279748916625977, 0.0013908743858337402, 0.0015537738800048828, 0.0017166733741760254, 0.001879572868347168, 0.0020424723625183105, 0.002205371856689453, 0.0023682713508605957, 0.0025311708450317383, 0.002694070339202881, 0.0028569698333740234, 0.003019869327545166, 0.0031827688217163086, 0.003345668315887451, 0.0035085678100585938, 0.0036714673042297363, 0.003834366798400879, 0.0039972662925720215, 0.004160165786743164, 0.004323065280914307, 0.004485964775085449, 0.004648864269256592, 0.004811763763427734, 0.004974663257598877, 0.0051375627517700195, 0.005300462245941162, 0.005463361740112305, 0.005626261234283447, 0.00578916072845459, 0.005952060222625732, 0.006114959716796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 10.0, 3.0, 7.0, 12.0, 37.0, 190.0, 404.0, 219.0, 64.0, 25.0, 11.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14002105593681335, -0.1365664303302765, -0.13311180472373962, -0.12965716421604156, -0.1262025386095047, -0.12274791300296783, -0.11929328739643097, -0.1158386617898941, -0.11238402873277664, -0.10892940312623978, -0.10547477006912231, -0.10202014446258545, -0.09856551885604858, -0.09511088579893112, -0.09165626019239426, -0.0882016271352768, -0.08474700152873993, -0.08129237592220306, -0.0778377428650856, -0.07438311725854874, -0.07092848420143127, -0.06747385859489441, -0.06401923298835754, -0.06056460365653038, -0.05710997432470322, -0.05365534499287605, -0.05020071566104889, -0.046746090054512024, -0.04329146072268486, -0.0398368313908577, -0.03638220578432083, -0.03292757645249367, -0.029472939670085907, -0.026018310338258743, -0.02256368286907673, -0.019109055399894714, -0.01565442606806755, -0.012199796736240387, -0.008745169267058372, -0.005290541797876358, -0.0018359124660491943, 0.0016187159344553947, 0.005073344334959984, 0.008527972735464573, 0.011982601135969162, 0.015437230467796326, 0.01889185793697834, 0.022346485406160355, 0.02580111473798752, 0.029255744069814682, 0.032710373401641846, 0.03616499900817871, 0.039619628340005875, 0.04307425767183304, 0.046528883278369904, 0.04998351261019707, 0.05343814194202423, 0.056892771273851395, 0.06034740060567856, 0.06380202621221542, 0.06725665926933289, 0.07071128487586975, 0.07416591048240662, 0.07762053608894348, 0.08107516914606094]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 11.0, 27.0, 25.0, 44.0, 45.0, 54.0, 57.0, 85.0, 69.0, 80.0, 76.0, 73.0, 57.0, 48.0, 36.0, 35.0, 28.0, 21.0, 20.0, 16.0, 5.0, 8.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04657745361328125, -0.0452071912586689, -0.04383692890405655, -0.0424666702747345, -0.04109640792012215, -0.039726145565509796, -0.038355886936187744, -0.036985624581575394, -0.03561536222696304, -0.03424509987235069, -0.03287483751773834, -0.03150457888841629, -0.03013431653380394, -0.02876405417919159, -0.027393793687224388, -0.026023533195257187, -0.024653270840644836, -0.023283008486032486, -0.021912747994065285, -0.020542487502098083, -0.019172225147485733, -0.017801962792873383, -0.01643170230090618, -0.015061440877616405, -0.01369117945432663, -0.012320918031036854, -0.010950656607747078, -0.009580395184457302, -0.008210133761167526, -0.00683987233787775, -0.0054696109145879745, -0.004099349491298199, -0.002729088068008423, -0.001358826644718647, 1.1434778571128845e-05, 0.0013816962018609047, 0.0027519576251506805, 0.004122219048440456, 0.005492480471730232, 0.006862741895020008, 0.008233003318309784, 0.00960326474159956, 0.010973526164889336, 0.012343787588179111, 0.013714049011468887, 0.015084310434758663, 0.01645457185804844, 0.01782483235001564, 0.01919509470462799, 0.02056535705924034, 0.021935617551207542, 0.023305878043174744, 0.024676140397787094, 0.026046402752399445, 0.027416663244366646, 0.028786923736333847, 0.030157186090946198, 0.03152744844555855, 0.0328977108001709, 0.03426796942949295, 0.0356382317841053, 0.03700849413871765, 0.0383787527680397, 0.039749015122652054, 0.041119277477264404]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 0.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 6.0, 14.0, 13.0, 7.0, 8.0, 16.0, 14.0, 18.0, 32.0, 64.0, 322.0, 4193249.0, 263.0, 54.0, 22.0, 17.0, 33.0, 12.0, 20.0, 16.0, 8.0, 8.0, 14.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.8828125, -0.8495025634765625, -0.816192626953125, -0.7828826904296875, -0.74957275390625, -0.7162628173828125, -0.682952880859375, -0.6496429443359375, -0.6163330078125, -0.5830230712890625, -0.549713134765625, -0.5164031982421875, -0.48309326171875, -0.4497833251953125, -0.416473388671875, -0.3831634521484375, -0.349853515625, -0.3165435791015625, -0.283233642578125, -0.2499237060546875, -0.21661376953125, -0.1833038330078125, -0.149993896484375, -0.1166839599609375, -0.0833740234375, -0.0500640869140625, -0.016754150390625, 0.0165557861328125, 0.04986572265625, 0.0831756591796875, 0.116485595703125, 0.1497955322265625, 0.18310546875, 0.2164154052734375, 0.249725341796875, 0.2830352783203125, 0.31634521484375, 0.3496551513671875, 0.382965087890625, 0.4162750244140625, 0.4495849609375, 0.4828948974609375, 0.516204833984375, 0.5495147705078125, 0.58282470703125, 0.6161346435546875, 0.649444580078125, 0.6827545166015625, 0.716064453125, 0.7493743896484375, 0.782684326171875, 0.8159942626953125, 0.84930419921875, 0.8826141357421875, 0.915924072265625, 0.9492340087890625, 0.9825439453125, 1.0158538818359375, 1.049163818359375, 1.0824737548828125, 1.11578369140625, 1.1490936279296875, 1.182403564453125, 1.2157135009765625, 1.2490234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 13.0, 22.0, 25.0, 33.0, 83.0, 122.0, 171.0, 148.0, 107.0, 88.0, 43.0, 26.0, 12.0, 9.0, 7.0, 6.0, 12.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00107574462890625, -0.0010420680046081543, -0.0010083913803100586, -0.0009747147560119629, -0.0009410381317138672, -0.0009073615074157715, -0.0008736848831176758, -0.0008400082588195801, -0.0008063316345214844, -0.0007726550102233887, -0.000738978385925293, -0.0007053017616271973, -0.0006716251373291016, -0.0006379485130310059, -0.0006042718887329102, -0.0005705952644348145, -0.0005369186401367188, -0.000503242015838623, -0.00046956539154052734, -0.00043588876724243164, -0.00040221214294433594, -0.00036853551864624023, -0.00033485889434814453, -0.00030118227005004883, -0.0002675056457519531, -0.00023382902145385742, -0.00020015239715576172, -0.00016647577285766602, -0.0001327991485595703, -9.912252426147461e-05, -6.54458999633789e-05, -3.17692756652832e-05, 1.9073486328125e-06, 3.55839729309082e-05, 6.92605972290039e-05, 0.00010293722152709961, 0.0001366138458251953, 0.00017029047012329102, 0.00020396709442138672, 0.00023764371871948242, 0.0002713203430175781, 0.00030499696731567383, 0.00033867359161376953, 0.00037235021591186523, 0.00040602684020996094, 0.00043970346450805664, 0.00047338008880615234, 0.000507056713104248, 0.0005407333374023438, 0.0005744099617004395, 0.0006080865859985352, 0.0006417632102966309, 0.0006754398345947266, 0.0007091164588928223, 0.000742793083190918, 0.0007764697074890137, 0.0008101463317871094, 0.0008438229560852051, 0.0008774995803833008, 0.0009111762046813965, 0.0009448528289794922, 0.0009785294532775879, 0.0010122060775756836, 0.0010458827018737793, 0.001079559326171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 17.0, 39.0, 138.0, 23876.0, 4170048.0, 122.0, 24.0, 7.0, 7.0, 3.0, 1.0, 4.0], "bins": [-1.498046875, -1.4713134765625, -1.444580078125, -1.4178466796875, -1.39111328125, -1.3643798828125, -1.337646484375, -1.3109130859375, -1.2841796875, -1.2574462890625, -1.230712890625, -1.2039794921875, -1.17724609375, -1.1505126953125, -1.123779296875, -1.0970458984375, -1.0703125, -1.0435791015625, -1.016845703125, -0.9901123046875, -0.96337890625, -0.9366455078125, -0.909912109375, -0.8831787109375, -0.8564453125, -0.8297119140625, -0.802978515625, -0.7762451171875, -0.74951171875, -0.7227783203125, -0.696044921875, -0.6693115234375, -0.642578125, -0.6158447265625, -0.589111328125, -0.5623779296875, -0.53564453125, -0.5089111328125, -0.482177734375, -0.4554443359375, -0.4287109375, -0.4019775390625, -0.375244140625, -0.3485107421875, -0.32177734375, -0.2950439453125, -0.268310546875, -0.2415771484375, -0.21484375, -0.1881103515625, -0.161376953125, -0.1346435546875, -0.10791015625, -0.0811767578125, -0.054443359375, -0.0277099609375, -0.0009765625, 0.0257568359375, 0.052490234375, 0.0792236328125, 0.10595703125, 0.1326904296875, 0.159423828125, 0.1861572265625, 0.212890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 11.0, 32.0, 108.0, 412.0, 2929.0, 461.0, 83.0, 20.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0138397216796875, -0.013581395149230957, -0.013323068618774414, -0.013064742088317871, -0.012806415557861328, -0.012548089027404785, -0.012289762496948242, -0.0120314359664917, -0.011773109436035156, -0.011514782905578613, -0.01125645637512207, -0.010998129844665527, -0.010739803314208984, -0.010481476783752441, -0.010223150253295898, -0.009964823722839355, -0.009706497192382812, -0.00944817066192627, -0.009189844131469727, -0.008931517601013184, -0.00867319107055664, -0.008414864540100098, -0.008156538009643555, -0.007898211479187012, -0.007639884948730469, -0.007381558418273926, -0.007123231887817383, -0.00686490535736084, -0.006606578826904297, -0.006348252296447754, -0.006089925765991211, -0.005831599235534668, -0.005573272705078125, -0.005314946174621582, -0.005056619644165039, -0.004798293113708496, -0.004539966583251953, -0.00428164005279541, -0.004023313522338867, -0.0037649869918823242, -0.0035066604614257812, -0.0032483339309692383, -0.0029900074005126953, -0.0027316808700561523, -0.0024733543395996094, -0.0022150278091430664, -0.0019567012786865234, -0.0016983747482299805, -0.0014400482177734375, -0.0011817216873168945, -0.0009233951568603516, -0.0006650686264038086, -0.0004067420959472656, -0.00014841556549072266, 0.00010991096496582031, 0.0003682374954223633, 0.0006265640258789062, 0.0008848905563354492, 0.0011432170867919922, 0.0014015436172485352, 0.0016598701477050781, 0.001918196678161621, 0.002176523208618164, 0.002434849739074707, 0.00269317626953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1002.0, 18.0, 1.0], "bins": [-3.636082410812378, -3.577230930328369, -3.5183792114257812, -3.4595277309417725, -3.4006762504577637, -3.341824531555176, -3.282973051071167, -3.224121332168579, -3.1652698516845703, -3.1064183712005615, -3.0475666522979736, -2.988715171813965, -2.929863452911377, -2.871011972427368, -2.8121604919433594, -2.7533087730407715, -2.6944572925567627, -2.635605812072754, -2.576754093170166, -2.5179026126861572, -2.4590511322021484, -2.4001994132995605, -2.3413479328155518, -2.282496213912964, -2.223644733428955, -2.1647932529449463, -2.1059415340423584, -2.0470900535583496, -1.9882384538650513, -1.929386854171753, -1.8705353736877441, -1.8116837739944458, -1.7528321743011475, -1.6939805746078491, -1.6351289749145508, -1.576277494430542, -1.5174258947372437, -1.4585742950439453, -1.3997228145599365, -1.3408712148666382, -1.2820196151733398, -1.2231680154800415, -1.1643164157867432, -1.1054649353027344, -1.046613335609436, -0.9877617359161377, -0.9289101958274841, -0.8700586557388306, -0.811207115650177, -0.7523555755615234, -0.6935039758682251, -0.6346523761749268, -0.5758008360862732, -0.5169492959976196, -0.4580976963043213, -0.39924612641334534, -0.3403945565223694, -0.28154298663139343, -0.22269141674041748, -0.16383984684944153, -0.10498827695846558, -0.046136707067489624, 0.012714862823486328, 0.07156643271446228, 0.13041800260543823]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 11.0, 25.0, 66.0, 151.0, 254.0, 238.0, 161.0, 69.0, 28.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28930211067199707, -0.28349003195762634, -0.2776779532432556, -0.2718658745288849, -0.26605379581451416, -0.26024168729782104, -0.2544296383857727, -0.24861754477024078, -0.24280545115470886, -0.23699337244033813, -0.2311812937259674, -0.22536921501159668, -0.21955712139606476, -0.21374504268169403, -0.2079329639673233, -0.20212088525295258, -0.19630880653858185, -0.19049672782421112, -0.1846846491098404, -0.17887255549430847, -0.17306047677993774, -0.16724839806556702, -0.1614363193511963, -0.15562424063682556, -0.14981216192245483, -0.1440000832080841, -0.13818800449371338, -0.13237592577934265, -0.12656383216381073, -0.12075175344944, -0.11493967473506927, -0.10912759602069855, -0.10331550240516663, -0.0975034236907959, -0.09169133752584457, -0.08587925881147385, -0.08006717264652252, -0.0742550939321518, -0.06844301521778107, -0.06263093650341034, -0.056818850338459015, -0.05100676789879799, -0.04519468545913696, -0.039382606744766235, -0.03357052430510521, -0.027758441865444183, -0.021946363151073456, -0.01613428071141243, -0.010322198271751404, -0.004510116763412952, 0.001301964744925499, 0.007114045321941376, 0.012926127761602402, 0.018738210201263428, 0.024550288915634155, 0.03036237135529518, 0.03617445379495621, 0.04198653623461723, 0.04779861867427826, 0.05361069738864899, 0.05942277982831001, 0.06523486226797104, 0.07104694098234177, 0.07685902714729309, 0.08267110586166382]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 6.0, 14.0, 18.0, 14.0, 21.0, 26.0, 39.0, 43.0, 39.0, 36.0, 59.0, 44.0, 73.0, 3148.0, 1043755.0, 780.0, 58.0, 55.0, 43.0, 49.0, 44.0, 30.0, 35.0, 16.0, 15.0, 17.0, 14.0, 9.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.26618194580078125, -0.2577056884765625, -0.24922943115234375, -0.240753173828125, -0.23227691650390625, -0.2238006591796875, -0.21532440185546875, -0.20684814453125, -0.19837188720703125, -0.1898956298828125, -0.18141937255859375, -0.172943115234375, -0.16446685791015625, -0.1559906005859375, -0.14751434326171875, -0.1390380859375, -0.13056182861328125, -0.1220855712890625, -0.11360931396484375, -0.105133056640625, -0.09665679931640625, -0.0881805419921875, -0.07970428466796875, -0.07122802734375, -0.06275177001953125, -0.0542755126953125, -0.04579925537109375, -0.037322998046875, -0.02884674072265625, -0.0203704833984375, -0.01189422607421875, -0.00341796875, 0.00505828857421875, 0.0135345458984375, 0.02201080322265625, 0.030487060546875, 0.03896331787109375, 0.0474395751953125, 0.05591583251953125, 0.06439208984375, 0.07286834716796875, 0.0813446044921875, 0.08982086181640625, 0.098297119140625, 0.10677337646484375, 0.1152496337890625, 0.12372589111328125, 0.1322021484375, 0.14067840576171875, 0.1491546630859375, 0.15763092041015625, 0.166107177734375, 0.17458343505859375, 0.1830596923828125, 0.19153594970703125, 0.20001220703125, 0.20848846435546875, 0.2169647216796875, 0.22544097900390625, 0.233917236328125, 0.24239349365234375, 0.2508697509765625, 0.25934600830078125, 0.267822265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 118.0, 565.0, 306.0, 24.0, 3.0], "bins": [-0.07366943359375, -0.07245504856109619, -0.07124066352844238, -0.07002627849578857, -0.06881189346313477, -0.06759750843048096, -0.06638312339782715, -0.06516873836517334, -0.06395435333251953, -0.06273996829986572, -0.061525583267211914, -0.060311198234558105, -0.0590968132019043, -0.05788242816925049, -0.05666804313659668, -0.05545365810394287, -0.05423927307128906, -0.053024888038635254, -0.051810503005981445, -0.05059611797332764, -0.04938173294067383, -0.04816734790802002, -0.04695296287536621, -0.0457385778427124, -0.044524192810058594, -0.043309807777404785, -0.04209542274475098, -0.04088103771209717, -0.03966665267944336, -0.03845226764678955, -0.03723788261413574, -0.036023497581481934, -0.034809112548828125, -0.033594727516174316, -0.03238034248352051, -0.0311659574508667, -0.02995157241821289, -0.028737187385559082, -0.027522802352905273, -0.026308417320251465, -0.025094032287597656, -0.023879647254943848, -0.02266526222229004, -0.02145087718963623, -0.020236492156982422, -0.019022107124328613, -0.017807722091674805, -0.016593337059020996, -0.015378952026367188, -0.014164566993713379, -0.01295018196105957, -0.011735796928405762, -0.010521411895751953, -0.009307026863098145, -0.008092641830444336, -0.006878256797790527, -0.005663871765136719, -0.00444948673248291, -0.0032351016998291016, -0.002020716667175293, -0.0008063316345214844, 0.0004080533981323242, 0.0016224384307861328, 0.0028368234634399414, 0.00405120849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 6.0, 2.0, 8.0, 10.0, 13.0, 14.0, 17.0, 27.0, 35.0, 39.0, 45.0, 79.0, 110.0, 176.0, 269.0, 861.0, 4597.0, 67812.0, 922823.0, 46351.0, 3672.0, 750.0, 283.0, 163.0, 111.0, 76.0, 47.0, 36.0, 23.0, 30.0, 16.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10801887512207031, -0.10422134399414062, -0.10042381286621094, -0.09662628173828125, -0.09282875061035156, -0.08903121948242188, -0.08523368835449219, -0.0814361572265625, -0.07763862609863281, -0.07384109497070312, -0.07004356384277344, -0.06624603271484375, -0.06244850158691406, -0.058650970458984375, -0.05485343933105469, -0.051055908203125, -0.04725837707519531, -0.043460845947265625, -0.03966331481933594, -0.03586578369140625, -0.03206825256347656, -0.028270721435546875, -0.024473190307617188, -0.0206756591796875, -0.016878128051757812, -0.013080596923828125, -0.009283065795898438, -0.00548553466796875, -0.0016880035400390625, 0.002109527587890625, 0.0059070587158203125, 0.00970458984375, 0.013502120971679688, 0.017299652099609375, 0.021097183227539062, 0.02489471435546875, 0.028692245483398438, 0.032489776611328125, 0.03628730773925781, 0.0400848388671875, 0.04388236999511719, 0.047679901123046875, 0.05147743225097656, 0.05527496337890625, 0.05907249450683594, 0.06287002563476562, 0.06666755676269531, 0.070465087890625, 0.07426261901855469, 0.07806015014648438, 0.08185768127441406, 0.08565521240234375, 0.08945274353027344, 0.09325027465820312, 0.09704780578613281, 0.1008453369140625, 0.10464286804199219, 0.10844039916992188, 0.11223793029785156, 0.11603546142578125, 0.11983299255371094, 0.12363052368164062, 0.1274280548095703, 0.1312255859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 7.0, 13.0, 21.0, 14.0, 17.0, 23.0, 24.0, 40.0, 40.0, 54.0, 54.0, 60.0, 73.0, 59.0, 59.0, 65.0, 73.0, 46.0, 41.0, 49.0, 39.0, 29.0, 19.0, 18.0, 12.0, 12.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0494384765625, -0.04771757125854492, -0.045996665954589844, -0.044275760650634766, -0.04255485534667969, -0.04083395004272461, -0.03911304473876953, -0.03739213943481445, -0.035671234130859375, -0.0339503288269043, -0.03222942352294922, -0.03050851821899414, -0.028787612915039062, -0.027066707611083984, -0.025345802307128906, -0.023624897003173828, -0.02190399169921875, -0.020183086395263672, -0.018462181091308594, -0.016741275787353516, -0.015020370483398438, -0.01329946517944336, -0.011578559875488281, -0.009857654571533203, -0.008136749267578125, -0.006415843963623047, -0.004694938659667969, -0.0029740333557128906, -0.0012531280517578125, 0.0004677772521972656, 0.0021886825561523438, 0.003909587860107422, 0.0056304931640625, 0.007351398468017578, 0.009072303771972656, 0.010793209075927734, 0.012514114379882812, 0.01423501968383789, 0.01595592498779297, 0.017676830291748047, 0.019397735595703125, 0.021118640899658203, 0.02283954620361328, 0.02456045150756836, 0.026281356811523438, 0.028002262115478516, 0.029723167419433594, 0.03144407272338867, 0.03316497802734375, 0.03488588333129883, 0.036606788635253906, 0.038327693939208984, 0.04004859924316406, 0.04176950454711914, 0.04349040985107422, 0.0452113151550293, 0.046932220458984375, 0.04865312576293945, 0.05037403106689453, 0.05209493637084961, 0.05381584167480469, 0.055536746978759766, 0.057257652282714844, 0.05897855758666992, 0.060699462890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 6.0, 4.0, 12.0, 10.0, 18.0, 22.0, 24.0, 34.0, 43.0, 97.0, 181.0, 523.0, 2548.0, 27013.0, 1006834.0, 9064.0, 1322.0, 361.0, 147.0, 72.0, 32.0, 33.0, 23.0, 20.0, 19.0, 5.0, 8.0, 12.0, 4.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.41650390625, -0.4040031433105469, -0.39150238037109375, -0.3790016174316406, -0.3665008544921875, -0.3540000915527344, -0.34149932861328125, -0.3289985656738281, -0.316497802734375, -0.3039970397949219, -0.29149627685546875, -0.2789955139160156, -0.2664947509765625, -0.2539939880371094, -0.24149322509765625, -0.22899246215820312, -0.21649169921875, -0.20399093627929688, -0.19149017333984375, -0.17898941040039062, -0.1664886474609375, -0.15398788452148438, -0.14148712158203125, -0.12898635864257812, -0.116485595703125, -0.10398483276367188, -0.09148406982421875, -0.07898330688476562, -0.0664825439453125, -0.053981781005859375, -0.04148101806640625, -0.028980255126953125, -0.0164794921875, -0.003978729248046875, 0.00852203369140625, 0.021022796630859375, 0.0335235595703125, 0.046024322509765625, 0.05852508544921875, 0.07102584838867188, 0.083526611328125, 0.09602737426757812, 0.10852813720703125, 0.12102890014648438, 0.1335296630859375, 0.14603042602539062, 0.15853118896484375, 0.17103195190429688, 0.18353271484375, 0.19603347778320312, 0.20853424072265625, 0.22103500366210938, 0.2335357666015625, 0.24603652954101562, 0.25853729248046875, 0.2710380554199219, 0.283538818359375, 0.2960395812988281, 0.30854034423828125, 0.3210411071777344, 0.3335418701171875, 0.3460426330566406, 0.35854339599609375, 0.3710441589355469, 0.383544921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 13.0, 14.0, 10.0, 8.0, 11.0, 10.0, 21.0, 19.0, 31.0, 51.0, 63.0, 74.0, 111.0, 165.0, 92.0, 78.0, 55.0, 41.0, 20.0, 27.0, 18.0, 9.0, 12.0, 5.0, 8.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003249645233154297, -0.00031453371047973633, -0.00030410289764404297, -0.0002936720848083496, -0.00028324127197265625, -0.0002728104591369629, -0.00026237964630126953, -0.00025194883346557617, -0.0002415180206298828, -0.00023108720779418945, -0.0002206563949584961, -0.00021022558212280273, -0.00019979476928710938, -0.00018936395645141602, -0.00017893314361572266, -0.0001685023307800293, -0.00015807151794433594, -0.00014764070510864258, -0.00013720989227294922, -0.00012677907943725586, -0.0001163482666015625, -0.00010591745376586914, -9.548664093017578e-05, -8.505582809448242e-05, -7.462501525878906e-05, -6.41942024230957e-05, -5.3763389587402344e-05, -4.3332576751708984e-05, -3.2901763916015625e-05, -2.2470951080322266e-05, -1.2040138244628906e-05, -1.6093254089355469e-06, 8.821487426757812e-06, 1.9252300262451172e-05, 2.968311309814453e-05, 4.011392593383789e-05, 5.054473876953125e-05, 6.097555160522461e-05, 7.140636444091797e-05, 8.183717727661133e-05, 9.226799011230469e-05, 0.00010269880294799805, 0.0001131296157836914, 0.00012356042861938477, 0.00013399124145507812, 0.00014442205429077148, 0.00015485286712646484, 0.0001652836799621582, 0.00017571449279785156, 0.00018614530563354492, 0.00019657611846923828, 0.00020700693130493164, 0.000217437744140625, 0.00022786855697631836, 0.00023829936981201172, 0.0002487301826477051, 0.00025916099548339844, 0.0002695918083190918, 0.00028002262115478516, 0.0002904534339904785, 0.0003008842468261719, 0.00031131505966186523, 0.0003217458724975586, 0.00033217668533325195, 0.0003426074981689453]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 2.0, 6.0, 8.0, 10.0, 12.0, 31.0, 78.0, 282.0, 1410.0, 10726.0, 981798.0, 49198.0, 3969.0, 687.0, 185.0, 52.0, 20.0, 19.0, 14.0, 4.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.4586982727050781, -0.44425201416015625, -0.4298057556152344, -0.4153594970703125, -0.4009132385253906, -0.38646697998046875, -0.3720207214355469, -0.357574462890625, -0.3431282043457031, -0.32868194580078125, -0.3142356872558594, -0.2997894287109375, -0.2853431701660156, -0.27089691162109375, -0.2564506530761719, -0.24200439453125, -0.22755813598632812, -0.21311187744140625, -0.19866561889648438, -0.1842193603515625, -0.16977310180664062, -0.15532684326171875, -0.14088058471679688, -0.126434326171875, -0.11198806762695312, -0.09754180908203125, -0.08309555053710938, -0.0686492919921875, -0.054203033447265625, -0.03975677490234375, -0.025310516357421875, -0.0108642578125, 0.003582000732421875, 0.01802825927734375, 0.032474517822265625, 0.0469207763671875, 0.061367034912109375, 0.07581329345703125, 0.09025955200195312, 0.104705810546875, 0.11915206909179688, 0.13359832763671875, 0.14804458618164062, 0.1624908447265625, 0.17693710327148438, 0.19138336181640625, 0.20582962036132812, 0.22027587890625, 0.23472213745117188, 0.24916839599609375, 0.2636146545410156, 0.2780609130859375, 0.2925071716308594, 0.30695343017578125, 0.3213996887207031, 0.335845947265625, 0.3502922058105469, 0.36473846435546875, 0.3791847229003906, 0.3936309814453125, 0.4080772399902344, 0.42252349853515625, 0.4369697570800781, 0.451416015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 7.0, 13.0, 16.0, 32.0, 39.0, 124.0, 455.0, 142.0, 45.0, 28.0, 18.0, 14.0, 2.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1637554168701172, -0.15856552124023438, -0.15337562561035156, -0.14818572998046875, -0.14299583435058594, -0.13780593872070312, -0.1326160430908203, -0.1274261474609375, -0.12223625183105469, -0.11704635620117188, -0.11185646057128906, -0.10666656494140625, -0.10147666931152344, -0.09628677368164062, -0.09109687805175781, -0.085906982421875, -0.08071708679199219, -0.07552719116210938, -0.07033729553222656, -0.06514739990234375, -0.05995750427246094, -0.054767608642578125, -0.04957771301269531, -0.0443878173828125, -0.03919792175292969, -0.034008026123046875, -0.028818130493164062, -0.02362823486328125, -0.018438339233398438, -0.013248443603515625, -0.008058547973632812, -0.00286865234375, 0.0023212432861328125, 0.007511138916015625, 0.012701034545898438, 0.01789093017578125, 0.023080825805664062, 0.028270721435546875, 0.03346061706542969, 0.0386505126953125, 0.04384040832519531, 0.049030303955078125, 0.05422019958496094, 0.05941009521484375, 0.06459999084472656, 0.06978988647460938, 0.07497978210449219, 0.080169677734375, 0.08535957336425781, 0.09054946899414062, 0.09573936462402344, 0.10092926025390625, 0.10611915588378906, 0.11130905151367188, 0.11649894714355469, 0.1216888427734375, 0.1268787384033203, 0.13206863403320312, 0.13725852966308594, 0.14244842529296875, 0.14763832092285156, 0.15282821655273438, 0.1580181121826172, 0.1632080078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 984.0, 28.0, 4.0, 1.0], "bins": [-35.275917053222656, -34.69390106201172, -34.11188888549805, -33.52987289428711, -32.94785690307617, -32.3658447265625, -31.783828735351562, -31.201814651489258, -30.619800567626953, -30.03778648376465, -29.45577049255371, -28.873756408691406, -28.2917423248291, -27.709728240966797, -27.12771224975586, -26.545698165893555, -25.96368408203125, -25.381669998168945, -24.799654006958008, -24.217639923095703, -23.6356258392334, -23.053611755371094, -22.471595764160156, -21.88958168029785, -21.307565689086914, -20.72555160522461, -20.143535614013672, -19.561521530151367, -18.979507446289062, -18.397493362426758, -17.81547737121582, -17.233463287353516, -16.65144920349121, -16.069435119628906, -15.487420082092285, -14.905405044555664, -14.32339096069336, -13.741375923156738, -13.159360885620117, -12.577346801757812, -11.995332717895508, -11.413317680358887, -10.831303596496582, -10.249288558959961, -9.667274475097656, -9.085259437561035, -8.503244400024414, -7.921230316162109, -7.339215278625488, -6.757200717926025, -6.1751861572265625, -5.593171119689941, -5.011157035827637, -4.429141998291016, -3.8471274375915527, -3.26511287689209, -2.683098316192627, -2.101083755493164, -1.5190690755844116, -0.9370543956756592, -0.3550398349761963, 0.2269747257232666, 0.8089895248413086, 1.3910040855407715, 1.9730185270309448]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 25.0, 50.0, 115.0, 184.0, 179.0, 199.0, 131.0, 77.0, 33.0, 12.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587221622467041, -2.5386786460876465, -2.490135431289673, -2.4415924549102783, -2.3930492401123047, -2.34450626373291, -2.2959632873535156, -2.247420072555542, -2.1988770961761475, -2.150334119796753, -2.1017909049987793, -2.0532479286193848, -2.004704713821411, -1.9561617374420166, -1.9076186418533325, -1.8590755462646484, -1.8105324506759644, -1.7619893550872803, -1.7134462594985962, -1.664903163909912, -1.6163601875305176, -1.5678170919418335, -1.5192739963531494, -1.4707309007644653, -1.4221878051757812, -1.3736447095870972, -1.325101613998413, -1.2765586376190186, -1.2280155420303345, -1.1794724464416504, -1.1309293508529663, -1.0823862552642822, -1.0338433980941772, -0.9853003025054932, -0.9367572665214539, -0.8882141709327698, -0.8396711349487305, -0.7911280393600464, -0.7425849437713623, -0.6940418481826782, -0.6454988121986389, -0.5969557166099548, -0.5484126806259155, -0.49986958503723145, -0.45132651925086975, -0.40278345346450806, -0.354240357875824, -0.3056972920894623, -0.2571542263031006, -0.2086111605167389, -0.160068079829216, -0.11152499914169312, -0.06298193335533142, -0.014438867568969727, 0.034104228019714355, 0.08264729380607605, 0.13119035959243774, 0.17973342537879944, 0.22827650606632233, 0.2768195867538452, 0.3253626525402069, 0.3739057183265686, 0.4224488139152527, 0.4709918797016144, 0.5195349454879761]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 18.0, 38.0, 75.0, 150.0, 498.0, 42257.0, 4150998.0, 205.0, 41.0, 6.0, 1.0], "bins": [-3.6875, -3.625072479248047, -3.5626449584960938, -3.5002174377441406, -3.4377899169921875, -3.3753623962402344, -3.3129348754882812, -3.250507354736328, -3.188079833984375, -3.125652313232422, -3.0632247924804688, -3.0007972717285156, -2.9383697509765625, -2.8759422302246094, -2.8135147094726562, -2.751087188720703, -2.68865966796875, -2.626232147216797, -2.5638046264648438, -2.5013771057128906, -2.4389495849609375, -2.3765220642089844, -2.3140945434570312, -2.251667022705078, -2.189239501953125, -2.126811981201172, -2.0643844604492188, -2.0019569396972656, -1.9395294189453125, -1.8771018981933594, -1.8146743774414062, -1.7522468566894531, -1.6898193359375, -1.6273918151855469, -1.5649642944335938, -1.5025367736816406, -1.4401092529296875, -1.3776817321777344, -1.3152542114257812, -1.2528266906738281, -1.190399169921875, -1.1279716491699219, -1.0655441284179688, -1.0031166076660156, -0.9406890869140625, -0.8782615661621094, -0.8158340454101562, -0.7534065246582031, -0.69097900390625, -0.6285514831542969, -0.5661239624023438, -0.5036964416503906, -0.4412689208984375, -0.3788414001464844, -0.31641387939453125, -0.2539863586425781, -0.191558837890625, -0.12913131713867188, -0.06670379638671875, -0.004276275634765625, 0.0581512451171875, 0.12057876586914062, 0.18300628662109375, 0.24543380737304688, 0.307861328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 58.0, 247.0, 377.0, 234.0, 76.0, 14.0, 3.0, 1.0], "bins": [-0.0992431640625, -0.09754598140716553, -0.09584879875183105, -0.09415161609649658, -0.09245443344116211, -0.09075725078582764, -0.08906006813049316, -0.08736288547515869, -0.08566570281982422, -0.08396852016448975, -0.08227133750915527, -0.0805741548538208, -0.07887697219848633, -0.07717978954315186, -0.07548260688781738, -0.07378542423248291, -0.07208824157714844, -0.07039105892181396, -0.06869387626647949, -0.06699669361114502, -0.06529951095581055, -0.06360232830047607, -0.0619051456451416, -0.06020796298980713, -0.058510780334472656, -0.056813597679138184, -0.05511641502380371, -0.05341923236846924, -0.051722049713134766, -0.05002486705780029, -0.04832768440246582, -0.04663050174713135, -0.044933319091796875, -0.0432361364364624, -0.04153895378112793, -0.03984177112579346, -0.038144588470458984, -0.03644740581512451, -0.03475022315979004, -0.033053040504455566, -0.031355857849121094, -0.02965867519378662, -0.02796149253845215, -0.026264309883117676, -0.024567127227783203, -0.02286994457244873, -0.021172761917114258, -0.019475579261779785, -0.017778396606445312, -0.01608121395111084, -0.014384031295776367, -0.012686848640441895, -0.010989665985107422, -0.00929248332977295, -0.0075953006744384766, -0.005898118019104004, -0.004200935363769531, -0.0025037527084350586, -0.0008065700531005859, 0.0008906126022338867, 0.0025877952575683594, 0.004284977912902832, 0.005982160568237305, 0.007679343223571777, 0.00937652587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 18.0, 38.0, 79.0, 202.0, 237.0, 382.0, 4186524.0, 6212.0, 304.0, 154.0, 85.0, 37.0, 5.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.015625, -4.91497802734375, -4.8143310546875, -4.71368408203125, -4.613037109375, -4.51239013671875, -4.4117431640625, -4.31109619140625, -4.21044921875, -4.10980224609375, -4.0091552734375, -3.90850830078125, -3.807861328125, -3.70721435546875, -3.6065673828125, -3.50592041015625, -3.4052734375, -3.30462646484375, -3.2039794921875, -3.10333251953125, -3.002685546875, -2.90203857421875, -2.8013916015625, -2.70074462890625, -2.60009765625, -2.49945068359375, -2.3988037109375, -2.29815673828125, -2.197509765625, -2.09686279296875, -1.9962158203125, -1.89556884765625, -1.794921875, -1.69427490234375, -1.5936279296875, -1.49298095703125, -1.392333984375, -1.29168701171875, -1.1910400390625, -1.09039306640625, -0.98974609375, -0.88909912109375, -0.7884521484375, -0.68780517578125, -0.587158203125, -0.48651123046875, -0.3858642578125, -0.28521728515625, -0.1845703125, -0.08392333984375, 0.0167236328125, 0.11737060546875, 0.218017578125, 0.31866455078125, 0.4193115234375, 0.51995849609375, 0.62060546875, 0.72125244140625, 0.8218994140625, 0.92254638671875, 1.023193359375, 1.12384033203125, 1.2244873046875, 1.32513427734375, 1.42578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 112.0, 3858.0, 88.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47607421875, -0.46661949157714844, -0.4571647644042969, -0.4477100372314453, -0.43825531005859375, -0.4288005828857422, -0.4193458557128906, -0.40989112854003906, -0.4004364013671875, -0.39098167419433594, -0.3815269470214844, -0.3720722198486328, -0.36261749267578125, -0.3531627655029297, -0.3437080383300781, -0.33425331115722656, -0.324798583984375, -0.31534385681152344, -0.3058891296386719, -0.2964344024658203, -0.28697967529296875, -0.2775249481201172, -0.2680702209472656, -0.25861549377441406, -0.2491607666015625, -0.23970603942871094, -0.23025131225585938, -0.2207965850830078, -0.21134185791015625, -0.2018871307373047, -0.19243240356445312, -0.18297767639160156, -0.17352294921875, -0.16406822204589844, -0.15461349487304688, -0.1451587677001953, -0.13570404052734375, -0.1262493133544922, -0.11679458618164062, -0.10733985900878906, -0.0978851318359375, -0.08843040466308594, -0.07897567749023438, -0.06952095031738281, -0.06006622314453125, -0.05061149597167969, -0.041156768798828125, -0.03170204162597656, -0.022247314453125, -0.012792587280273438, -0.003337860107421875, 0.0061168670654296875, 0.01557159423828125, 0.025026321411132812, 0.034481048583984375, 0.04393577575683594, 0.0533905029296875, 0.06284523010253906, 0.07229995727539062, 0.08175468444824219, 0.09120941162109375, 0.10066413879394531, 0.11011886596679688, 0.11957359313964844, 0.1290283203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 15.0, 38.0, 736.0, 185.0, 27.0, 8.0, 3.0, 2.0], "bins": [-5.6812028884887695, -5.584517002105713, -5.487830638885498, -5.391144752502441, -5.294458389282227, -5.19777250289917, -5.101086139678955, -5.004400253295898, -4.907713890075684, -4.811028003692627, -4.714341640472412, -4.6176557540893555, -4.520969390869141, -4.424283504486084, -4.327597141265869, -4.2309112548828125, -4.134225368499756, -4.037539482116699, -3.9408531188964844, -3.8441669940948486, -3.747480869293213, -3.6507949829101562, -3.5541088581085205, -3.4574227333068848, -3.360736608505249, -3.2640504837036133, -3.1673643589019775, -3.070678234100342, -2.973992347717285, -2.8773062229156494, -2.7806200981140137, -2.683933973312378, -2.587247848510742, -2.4905617237091064, -2.3938755989074707, -2.297189474105835, -2.200503349304199, -2.1038174629211426, -2.007131338119507, -1.910445213317871, -1.8137590885162354, -1.7170729637145996, -1.6203868389129639, -1.5237008333206177, -1.427014708518982, -1.3303285837173462, -1.233642578125, -1.1369564533233643, -1.0402703285217285, -0.9435842037200928, -0.8468981385231018, -0.7502120733261108, -0.6535259485244751, -0.5568398237228394, -0.4601537585258484, -0.3634676933288574, -0.2667815685272217, -0.17009547352790833, -0.07340937852859497, 0.023276716470718384, 0.11996281147003174, 0.2166489064693451, 0.31333500146865845, 0.4100210666656494, 0.5067071914672852]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 21.0, 38.0, 58.0, 122.0, 144.0, 158.0, 164.0, 108.0, 82.0, 57.0, 19.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633592128753662, -1.581588864326477, -1.5295854806900024, -1.4775822162628174, -1.4255788326263428, -1.3735755681991577, -1.3215723037719727, -1.269568920135498, -1.217565655708313, -1.165562391281128, -1.1135590076446533, -1.0615557432174683, -1.0095523595809937, -0.9575490951538086, -0.9055457711219788, -0.8535424470901489, -0.8015391230583191, -0.7495357990264893, -0.6975324749946594, -0.6455291509628296, -0.5935258865356445, -0.5415225625038147, -0.48951923847198486, -0.4375159442424774, -0.3855126202106476, -0.33350929617881775, -0.2815060019493103, -0.22950267791748047, -0.17749936878681183, -0.1254960596561432, -0.07349273562431335, -0.021489441394805908, 0.030513882637023926, 0.08251719176769257, 0.1345205008983612, 0.18652382493019104, 0.23852713406085968, 0.2905304431915283, 0.34253376722335815, 0.3945370614528656, 0.44654038548469543, 0.49854370951652527, 0.5505470037460327, 0.6025503277778625, 0.6545536518096924, 0.7065569162368774, 0.758560299873352, 0.8105635643005371, 0.8625668883323669, 0.9145702123641968, 0.9665735363960266, 1.0185768604278564, 1.0705801248550415, 1.1225833892822266, 1.1745867729187012, 1.2265900373458862, 1.2785934209823608, 1.330596685409546, 1.3826000690460205, 1.4346033334732056, 1.4866067171096802, 1.5386099815368652, 1.5906133651733398, 1.642616629600525, 1.69461989402771]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 15.0, 28.0, 27.0, 49.0, 85.0, 202.0, 603.0, 2058.0, 23305.0, 974635.0, 43625.0, 2660.0, 740.0, 248.0, 83.0, 52.0, 39.0, 30.0, 16.0, 9.0, 10.0, 9.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212890625, -0.7975387573242188, -0.7737884521484375, -0.7500381469726562, -0.726287841796875, -0.7025375366210938, -0.6787872314453125, -0.6550369262695312, -0.63128662109375, -0.6075363159179688, -0.5837860107421875, -0.5600357055664062, -0.536285400390625, -0.5125350952148438, -0.4887847900390625, -0.46503448486328125, -0.4412841796875, -0.41753387451171875, -0.3937835693359375, -0.37003326416015625, -0.346282958984375, -0.32253265380859375, -0.2987823486328125, -0.27503204345703125, -0.25128173828125, -0.22753143310546875, -0.2037811279296875, -0.18003082275390625, -0.156280517578125, -0.13253021240234375, -0.1087799072265625, -0.08502960205078125, -0.061279296875, -0.03752899169921875, -0.0137786865234375, 0.00997161865234375, 0.033721923828125, 0.05747222900390625, 0.0812225341796875, 0.10497283935546875, 0.12872314453125, 0.15247344970703125, 0.1762237548828125, 0.19997406005859375, 0.223724365234375, 0.24747467041015625, 0.2712249755859375, 0.29497528076171875, 0.3187255859375, 0.34247589111328125, 0.3662261962890625, 0.38997650146484375, 0.413726806640625, 0.43747711181640625, 0.4612274169921875, 0.48497772216796875, 0.50872802734375, 0.5324783325195312, 0.5562286376953125, 0.5799789428710938, 0.603729248046875, 0.6274795532226562, 0.6512298583984375, 0.6749801635742188, 0.69873046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 25.0, 41.0, 75.0, 139.0, 174.0, 188.0, 151.0, 87.0, 71.0, 27.0, 14.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.1394186019897461, -0.1362590789794922, -0.13309955596923828, -0.12994003295898438, -0.12678050994873047, -0.12362098693847656, -0.12046146392822266, -0.11730194091796875, -0.11414241790771484, -0.11098289489746094, -0.10782337188720703, -0.10466384887695312, -0.10150432586669922, -0.09834480285644531, -0.0951852798461914, -0.0920257568359375, -0.0888662338256836, -0.08570671081542969, -0.08254718780517578, -0.07938766479492188, -0.07622814178466797, -0.07306861877441406, -0.06990909576416016, -0.06674957275390625, -0.06359004974365234, -0.06043052673339844, -0.05727100372314453, -0.054111480712890625, -0.05095195770263672, -0.04779243469238281, -0.044632911682128906, -0.041473388671875, -0.038313865661621094, -0.03515434265136719, -0.03199481964111328, -0.028835296630859375, -0.02567577362060547, -0.022516250610351562, -0.019356727600097656, -0.01619720458984375, -0.013037681579589844, -0.009878158569335938, -0.006718635559082031, -0.003559112548828125, -0.00039958953857421875, 0.0027599334716796875, 0.005919456481933594, 0.0090789794921875, 0.012238502502441406, 0.015398025512695312, 0.01855754852294922, 0.021717071533203125, 0.02487659454345703, 0.028036117553710938, 0.031195640563964844, 0.03435516357421875, 0.037514686584472656, 0.04067420959472656, 0.04383373260498047, 0.046993255615234375, 0.05015277862548828, 0.05331230163574219, 0.056471824645996094, 0.05963134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 19.0, 15.0, 22.0, 34.0, 35.0, 46.0, 87.0, 180.0, 420.0, 2552.0, 62169.0, 961949.0, 19033.0, 1308.0, 283.0, 109.0, 67.0, 50.0, 39.0, 17.0, 25.0, 18.0, 8.0, 13.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.4306373596191406, -0.41645050048828125, -0.4022636413574219, -0.3880767822265625, -0.3738899230957031, -0.35970306396484375, -0.3455162048339844, -0.331329345703125, -0.3171424865722656, -0.30295562744140625, -0.2887687683105469, -0.2745819091796875, -0.2603950500488281, -0.24620819091796875, -0.23202133178710938, -0.21783447265625, -0.20364761352539062, -0.18946075439453125, -0.17527389526367188, -0.1610870361328125, -0.14690017700195312, -0.13271331787109375, -0.11852645874023438, -0.104339599609375, -0.09015274047851562, -0.07596588134765625, -0.061779022216796875, -0.0475921630859375, -0.033405303955078125, -0.01921844482421875, -0.005031585693359375, 0.0091552734375, 0.023342132568359375, 0.03752899169921875, 0.051715850830078125, 0.0659027099609375, 0.08008956909179688, 0.09427642822265625, 0.10846328735351562, 0.122650146484375, 0.13683700561523438, 0.15102386474609375, 0.16521072387695312, 0.1793975830078125, 0.19358444213867188, 0.20777130126953125, 0.22195816040039062, 0.23614501953125, 0.2503318786621094, 0.26451873779296875, 0.2787055969238281, 0.2928924560546875, 0.3070793151855469, 0.32126617431640625, 0.3354530334472656, 0.349639892578125, 0.3638267517089844, 0.37801361083984375, 0.3922004699707031, 0.4063873291015625, 0.4205741882324219, 0.43476104736328125, 0.4489479064941406, 0.463134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 10.0, 12.0, 15.0, 26.0, 24.0, 36.0, 26.0, 39.0, 48.0, 61.0, 58.0, 63.0, 56.0, 69.0, 67.0, 49.0, 58.0, 41.0, 40.0, 34.0, 31.0, 25.0, 29.0, 11.0, 11.0, 13.0, 11.0, 3.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.1636638641357422, -0.15838241577148438, -0.15310096740722656, -0.14781951904296875, -0.14253807067871094, -0.13725662231445312, -0.1319751739501953, -0.1266937255859375, -0.12141227722167969, -0.11613082885742188, -0.11084938049316406, -0.10556793212890625, -0.10028648376464844, -0.09500503540039062, -0.08972358703613281, -0.084442138671875, -0.07916069030761719, -0.07387924194335938, -0.06859779357910156, -0.06331634521484375, -0.05803489685058594, -0.052753448486328125, -0.04747200012207031, -0.0421905517578125, -0.03690910339355469, -0.031627655029296875, -0.026346206665039062, -0.02106475830078125, -0.015783309936523438, -0.010501861572265625, -0.0052204132080078125, 6.103515625e-05, 0.0053424835205078125, 0.010623931884765625, 0.015905380249023438, 0.02118682861328125, 0.026468276977539062, 0.031749725341796875, 0.03703117370605469, 0.0423126220703125, 0.04759407043457031, 0.052875518798828125, 0.05815696716308594, 0.06343841552734375, 0.06871986389160156, 0.07400131225585938, 0.07928276062011719, 0.084564208984375, 0.08984565734863281, 0.09512710571289062, 0.10040855407714844, 0.10569000244140625, 0.11097145080566406, 0.11625289916992188, 0.12153434753417969, 0.1268157958984375, 0.1320972442626953, 0.13737869262695312, 0.14266014099121094, 0.14794158935546875, 0.15322303771972656, 0.15850448608398438, 0.1637859344482422, 0.1690673828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 18.0, 34.0, 46.0, 121.0, 237.0, 489.0, 1250.0, 5862.0, 152218.0, 873167.0, 11871.0, 1927.0, 638.0, 296.0, 140.0, 86.0, 41.0, 22.0, 16.0, 15.0, 9.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24560546875, -0.23917007446289062, -0.23273468017578125, -0.22629928588867188, -0.2198638916015625, -0.21342849731445312, -0.20699310302734375, -0.20055770874023438, -0.194122314453125, -0.18768692016601562, -0.18125152587890625, -0.17481613159179688, -0.1683807373046875, -0.16194534301757812, -0.15550994873046875, -0.14907455444335938, -0.14263916015625, -0.13620376586914062, -0.12976837158203125, -0.12333297729492188, -0.1168975830078125, -0.11046218872070312, -0.10402679443359375, -0.09759140014648438, -0.091156005859375, -0.08472061157226562, -0.07828521728515625, -0.07184982299804688, -0.0654144287109375, -0.058979034423828125, -0.05254364013671875, -0.046108245849609375, -0.0396728515625, -0.033237457275390625, -0.02680206298828125, -0.020366668701171875, -0.0139312744140625, -0.007495880126953125, -0.00106048583984375, 0.005374908447265625, 0.011810302734375, 0.018245697021484375, 0.02468109130859375, 0.031116485595703125, 0.0375518798828125, 0.043987274169921875, 0.05042266845703125, 0.056858062744140625, 0.06329345703125, 0.06972885131835938, 0.07616424560546875, 0.08259963989257812, 0.0890350341796875, 0.09547042846679688, 0.10190582275390625, 0.10834121704101562, 0.114776611328125, 0.12121200561523438, 0.12764739990234375, 0.13408279418945312, 0.1405181884765625, 0.14695358276367188, 0.15338897705078125, 0.15982437133789062, 0.166259765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 1.0, 3.0, 6.0, 8.0, 8.0, 17.0, 14.0, 12.0, 16.0, 29.0, 34.0, 60.0, 66.0, 95.0, 132.0, 113.0, 73.0, 71.0, 41.0, 39.0, 28.0, 32.0, 16.0, 13.0, 20.0, 6.0, 8.0, 11.0, 2.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002493858337402344, -0.00024043768644332886, -0.00023148953914642334, -0.00022254139184951782, -0.0002135932445526123, -0.0002046450972557068, -0.00019569694995880127, -0.00018674880266189575, -0.00017780065536499023, -0.00016885250806808472, -0.0001599043607711792, -0.00015095621347427368, -0.00014200806617736816, -0.00013305991888046265, -0.00012411177158355713, -0.00011516362428665161, -0.0001062154769897461, -9.726732969284058e-05, -8.831918239593506e-05, -7.937103509902954e-05, -7.042288780212402e-05, -6.14747405052185e-05, -5.252659320831299e-05, -4.357844591140747e-05, -3.463029861450195e-05, -2.5682151317596436e-05, -1.6734004020690918e-05, -7.7858567237854e-06, 1.1622905731201172e-06, 1.0110437870025635e-05, 1.9058585166931152e-05, 2.800673246383667e-05, 3.695487976074219e-05, 4.5903027057647705e-05, 5.485117435455322e-05, 6.379932165145874e-05, 7.274746894836426e-05, 8.169561624526978e-05, 9.064376354217529e-05, 9.959191083908081e-05, 0.00010854005813598633, 0.00011748820543289185, 0.00012643635272979736, 0.00013538450002670288, 0.0001443326473236084, 0.00015328079462051392, 0.00016222894191741943, 0.00017117708921432495, 0.00018012523651123047, 0.00018907338380813599, 0.0001980215311050415, 0.00020696967840194702, 0.00021591782569885254, 0.00022486597299575806, 0.00023381412029266357, 0.0002427622675895691, 0.0002517104148864746, 0.0002606585621833801, 0.00026960670948028564, 0.00027855485677719116, 0.0002875030040740967, 0.0002964511513710022, 0.0003053992986679077, 0.00031434744596481323, 0.00032329559326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 16.0, 20.0, 38.0, 54.0, 147.0, 380.0, 1668.0, 20007.0, 1003969.0, 19747.0, 1692.0, 419.0, 172.0, 75.0, 41.0, 18.0, 21.0, 13.0, 13.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28125, -0.2723197937011719, -0.26338958740234375, -0.2544593811035156, -0.2455291748046875, -0.23659896850585938, -0.22766876220703125, -0.21873855590820312, -0.209808349609375, -0.20087814331054688, -0.19194793701171875, -0.18301773071289062, -0.1740875244140625, -0.16515731811523438, -0.15622711181640625, -0.14729690551757812, -0.13836669921875, -0.12943649291992188, -0.12050628662109375, -0.11157608032226562, -0.1026458740234375, -0.09371566772460938, -0.08478546142578125, -0.07585525512695312, -0.066925048828125, -0.057994842529296875, -0.04906463623046875, -0.040134429931640625, -0.0312042236328125, -0.022274017333984375, -0.01334381103515625, -0.004413604736328125, 0.0045166015625, 0.013446807861328125, 0.02237701416015625, 0.031307220458984375, 0.0402374267578125, 0.049167633056640625, 0.05809783935546875, 0.06702804565429688, 0.075958251953125, 0.08488845825195312, 0.09381866455078125, 0.10274887084960938, 0.1116790771484375, 0.12060928344726562, 0.12953948974609375, 0.13846969604492188, 0.14739990234375, 0.15633010864257812, 0.16526031494140625, 0.17419052124023438, 0.1831207275390625, 0.19205093383789062, 0.20098114013671875, 0.20991134643554688, 0.218841552734375, 0.22777175903320312, 0.23670196533203125, 0.24563217163085938, 0.2545623779296875, 0.2634925842285156, 0.27242279052734375, 0.2813529968261719, 0.290283203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 16.0, 22.0, 19.0, 39.0, 59.0, 122.0, 169.0, 190.0, 131.0, 78.0, 39.0, 32.0, 21.0, 12.0, 8.0, 9.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1055908203125, -0.10196685791015625, -0.0983428955078125, -0.09471893310546875, -0.091094970703125, -0.08747100830078125, -0.0838470458984375, -0.08022308349609375, -0.07659912109375, -0.07297515869140625, -0.0693511962890625, -0.06572723388671875, -0.062103271484375, -0.05847930908203125, -0.0548553466796875, -0.05123138427734375, -0.047607421875, -0.04398345947265625, -0.0403594970703125, -0.03673553466796875, -0.033111572265625, -0.02948760986328125, -0.0258636474609375, -0.02223968505859375, -0.01861572265625, -0.01499176025390625, -0.0113677978515625, -0.00774383544921875, -0.004119873046875, -0.00049591064453125, 0.0031280517578125, 0.00675201416015625, 0.0103759765625, 0.01399993896484375, 0.0176239013671875, 0.02124786376953125, 0.024871826171875, 0.02849578857421875, 0.0321197509765625, 0.03574371337890625, 0.03936767578125, 0.04299163818359375, 0.0466156005859375, 0.05023956298828125, 0.053863525390625, 0.05748748779296875, 0.0611114501953125, 0.06473541259765625, 0.068359375, 0.07198333740234375, 0.0756072998046875, 0.07923126220703125, 0.082855224609375, 0.08647918701171875, 0.0901031494140625, 0.09372711181640625, 0.09735107421875, 0.10097503662109375, 0.1045989990234375, 0.10822296142578125, 0.111846923828125, 0.11547088623046875, 0.1190948486328125, 0.12271881103515625, 0.1263427734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 84.0, 755.0, 124.0, 27.0, 10.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53749942779541, -5.410022258758545, -5.28254508972168, -5.155067443847656, -5.027590274810791, -4.900113105773926, -4.772635459899902, -4.645158290863037, -4.517681121826172, -4.390203952789307, -4.262726783752441, -4.135249137878418, -4.007771968841553, -3.8802947998046875, -3.752817392349243, -3.625339984893799, -3.4978628158569336, -3.3703856468200684, -3.242908239364624, -3.1154308319091797, -2.9879536628723145, -2.860476493835449, -2.732999086380005, -2.6055216789245605, -2.4780445098876953, -2.35056734085083, -2.2230899333953857, -2.0956125259399414, -1.9681353569030762, -1.8406580686569214, -1.7131807804107666, -1.5857034921646118, -1.458226203918457, -1.3307489156723022, -1.2032716274261475, -1.0757943391799927, -0.9483170509338379, -0.8208397626876831, -0.6933624744415283, -0.5658851861953735, -0.43840789794921875, -0.31093060970306396, -0.18345332145690918, -0.055976033210754395, 0.07150125503540039, 0.19897854328155518, 0.32645583152770996, 0.45393311977386475, 0.5814104080200195, 0.7088876962661743, 0.8363649845123291, 0.9638422727584839, 1.0913195610046387, 1.2187968492507935, 1.3462741374969482, 1.473751425743103, 1.6012287139892578, 1.7287060022354126, 1.8561832904815674, 1.9836605787277222, 2.111137866973877, 2.238615036010742, 2.3660924434661865, 2.493569850921631, 2.621047019958496]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 13.0, 7.0, 17.0, 18.0, 22.0, 19.0, 33.0, 38.0, 48.0, 42.0, 49.0, 66.0, 74.0, 69.0, 55.0, 69.0, 49.0, 48.0, 50.0, 37.0, 32.0, 28.0, 26.0, 20.0, 19.0, 14.0, 9.0, 12.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9222455024719238, -0.8873699307441711, -0.8524943590164185, -0.8176187872886658, -0.7827432155609131, -0.7478677034378052, -0.7129921317100525, -0.6781165599822998, -0.6432409882545471, -0.6083654165267944, -0.5734898447990417, -0.5386142730712891, -0.5037387609481812, -0.4688631594181061, -0.4339876174926758, -0.3991120457649231, -0.3642364740371704, -0.3293609023094177, -0.29448533058166504, -0.25960978865623474, -0.22473421692848206, -0.18985864520072937, -0.15498308837413788, -0.12010753154754639, -0.0852319598197937, -0.05035639554262161, -0.015480831265449524, 0.019394733011722565, 0.05427029728889465, 0.08914586901664734, 0.12402142584323883, 0.15889698266983032, 0.19377243518829346, 0.22864800691604614, 0.26352357864379883, 0.2983991205692291, 0.3332746922969818, 0.3681502640247345, 0.4030258059501648, 0.4379013776779175, 0.47277694940567017, 0.5076525211334229, 0.5425280928611755, 0.5774036645889282, 0.6122791767120361, 0.6471548080444336, 0.6820303201675415, 0.7169058918952942, 0.7517814636230469, 0.7866570353507996, 0.8215326070785522, 0.8564081788063049, 0.8912837505340576, 0.9261592626571655, 0.9610348343849182, 0.9959104061126709, 1.0307860374450684, 1.0656615495681763, 1.1005371809005737, 1.1354126930236816, 1.170288324356079, 1.205163836479187, 1.2400394678115845, 1.2749149799346924, 1.3097904920578003]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 2.0, 3.0, 3.0, 6.0, 12.0, 7.0, 8.0, 11.0, 17.0, 22.0, 19.0, 23.0, 30.0, 48.0, 56.0, 79.0, 125.0, 152.0, 268.0, 535.0, 1258.0, 4077.0, 25681.0, 3612346.0, 526275.0, 18891.0, 3099.0, 787.0, 280.0, 94.0, 34.0, 20.0, 13.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.9873046875, -0.9679145812988281, -0.9485244750976562, -0.9291343688964844, -0.9097442626953125, -0.8903541564941406, -0.8709640502929688, -0.8515739440917969, -0.832183837890625, -0.8127937316894531, -0.7934036254882812, -0.7740135192871094, -0.7546234130859375, -0.7352333068847656, -0.7158432006835938, -0.6964530944824219, -0.67706298828125, -0.6576728820800781, -0.6382827758789062, -0.6188926696777344, -0.5995025634765625, -0.5801124572753906, -0.5607223510742188, -0.5413322448730469, -0.521942138671875, -0.5025520324707031, -0.48316192626953125, -0.4637718200683594, -0.4443817138671875, -0.4249916076660156, -0.40560150146484375, -0.3862113952636719, -0.3668212890625, -0.3474311828613281, -0.32804107666015625, -0.3086509704589844, -0.2892608642578125, -0.2698707580566406, -0.25048065185546875, -0.23109054565429688, -0.211700439453125, -0.19231033325195312, -0.17292022705078125, -0.15353012084960938, -0.1341400146484375, -0.11474990844726562, -0.09535980224609375, -0.07596969604492188, -0.05657958984375, -0.037189483642578125, -0.01779937744140625, 0.001590728759765625, 0.0209808349609375, 0.040370941162109375, 0.05976104736328125, 0.07915115356445312, 0.098541259765625, 0.11793136596679688, 0.13732147216796875, 0.15671157836914062, 0.1761016845703125, 0.19549179077148438, 0.21488189697265625, 0.23427200317382812, 0.253662109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 33.0, 61.0, 102.0, 123.0, 178.0, 157.0, 132.0, 79.0, 50.0, 34.0, 19.0, 8.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.149658203125, -0.14671659469604492, -0.14377498626708984, -0.14083337783813477, -0.1378917694091797, -0.1349501609802246, -0.13200855255126953, -0.12906694412231445, -0.12612533569335938, -0.1231837272644043, -0.12024211883544922, -0.11730051040649414, -0.11435890197753906, -0.11141729354858398, -0.1084756851196289, -0.10553407669067383, -0.10259246826171875, -0.09965085983276367, -0.0967092514038086, -0.09376764297485352, -0.09082603454589844, -0.08788442611694336, -0.08494281768798828, -0.0820012092590332, -0.07905960083007812, -0.07611799240112305, -0.07317638397216797, -0.07023477554321289, -0.06729316711425781, -0.06435155868530273, -0.061409950256347656, -0.05846834182739258, -0.0555267333984375, -0.05258512496948242, -0.049643516540527344, -0.046701908111572266, -0.04376029968261719, -0.04081869125366211, -0.03787708282470703, -0.03493547439575195, -0.031993865966796875, -0.029052257537841797, -0.02611064910888672, -0.02316904067993164, -0.020227432250976562, -0.017285823822021484, -0.014344215393066406, -0.011402606964111328, -0.00846099853515625, -0.005519390106201172, -0.0025777816772460938, 0.0003638267517089844, 0.0033054351806640625, 0.006247043609619141, 0.009188652038574219, 0.012130260467529297, 0.015071868896484375, 0.018013477325439453, 0.02095508575439453, 0.02389669418334961, 0.026838302612304688, 0.029779911041259766, 0.032721519470214844, 0.03566312789916992, 0.038604736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 22.0, 70.0, 151.0, 544.0, 105600.0, 4087409.0, 346.0, 89.0, 34.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.6368865966796875, -6.504241943359375, -6.3715972900390625, -6.23895263671875, -6.1063079833984375, -5.973663330078125, -5.8410186767578125, -5.7083740234375, -5.5757293701171875, -5.443084716796875, -5.3104400634765625, -5.17779541015625, -5.0451507568359375, -4.912506103515625, -4.7798614501953125, -4.647216796875, -4.5145721435546875, -4.381927490234375, -4.2492828369140625, -4.11663818359375, -3.9839935302734375, -3.851348876953125, -3.7187042236328125, -3.5860595703125, -3.4534149169921875, -3.320770263671875, -3.1881256103515625, -3.05548095703125, -2.9228363037109375, -2.790191650390625, -2.6575469970703125, -2.52490234375, -2.3922576904296875, -2.259613037109375, -2.1269683837890625, -1.99432373046875, -1.8616790771484375, -1.729034423828125, -1.5963897705078125, -1.4637451171875, -1.3311004638671875, -1.198455810546875, -1.0658111572265625, -0.93316650390625, -0.8005218505859375, -0.667877197265625, -0.5352325439453125, -0.402587890625, -0.2699432373046875, -0.137298583984375, -0.0046539306640625, 0.12799072265625, 0.2606353759765625, 0.393280029296875, 0.5259246826171875, 0.6585693359375, 0.7912139892578125, 0.923858642578125, 1.0565032958984375, 1.18914794921875, 1.3217926025390625, 1.454437255859375, 1.5870819091796875, 1.7197265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 16.0, 53.0, 467.0, 3381.0, 112.0, 31.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.62646484375, -0.6151199340820312, -0.6037750244140625, -0.5924301147460938, -0.581085205078125, -0.5697402954101562, -0.5583953857421875, -0.5470504760742188, -0.53570556640625, -0.5243606567382812, -0.5130157470703125, -0.5016708374023438, -0.490325927734375, -0.47898101806640625, -0.4676361083984375, -0.45629119873046875, -0.4449462890625, -0.43360137939453125, -0.4222564697265625, -0.41091156005859375, -0.399566650390625, -0.38822174072265625, -0.3768768310546875, -0.36553192138671875, -0.35418701171875, -0.34284210205078125, -0.3314971923828125, -0.32015228271484375, -0.308807373046875, -0.29746246337890625, -0.2861175537109375, -0.27477264404296875, -0.263427734375, -0.25208282470703125, -0.2407379150390625, -0.22939300537109375, -0.218048095703125, -0.20670318603515625, -0.1953582763671875, -0.18401336669921875, -0.17266845703125, -0.16132354736328125, -0.1499786376953125, -0.13863372802734375, -0.127288818359375, -0.11594390869140625, -0.1045989990234375, -0.09325408935546875, -0.0819091796875, -0.07056427001953125, -0.0592193603515625, -0.04787445068359375, -0.036529541015625, -0.02518463134765625, -0.0138397216796875, -0.00249481201171875, 0.00885009765625, 0.02019500732421875, 0.0315399169921875, 0.04288482666015625, 0.054229736328125, 0.06557464599609375, 0.0769195556640625, 0.08826446533203125, 0.099609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 6.0, 24.0, 128.0, 780.0, 60.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548156499862671, -3.4421892166137695, -3.3362221717834473, -3.230254888534546, -3.1242876052856445, -3.0183205604553223, -2.912353277206421, -2.8063859939575195, -2.7004189491271973, -2.594451665878296, -2.4884846210479736, -2.3825173377990723, -2.27655029296875, -2.1705830097198486, -2.0646157264709473, -1.9586485624313354, -1.8526813983917236, -1.7467142343521118, -1.6407470703125, -1.5347797870635986, -1.4288126230239868, -1.322845458984375, -1.2168781757354736, -1.1109110116958618, -1.00494384765625, -0.8989766836166382, -0.7930094599723816, -0.687042236328125, -0.5810750722885132, -0.47510790824890137, -0.3691406846046448, -0.2631734609603882, -0.15720605850219727, -0.05123886466026306, 0.05472832918167114, 0.16069552302360535, 0.26666271686553955, 0.37262988090515137, 0.47859710454940796, 0.5845643281936646, 0.6905314922332764, 0.7964986562728882, 0.9024658799171448, 1.0084331035614014, 1.1144002676010132, 1.220367431640625, 1.3263347148895264, 1.4323018789291382, 1.53826904296875, 1.6442362070083618, 1.7502033710479736, 1.856170654296875, 1.9621378183364868, 2.0681049823760986, 2.174072265625, 2.2800393104553223, 2.3860065937042236, 2.491973876953125, 2.5979409217834473, 2.7039082050323486, 2.80987548828125, 2.9158425331115723, 3.0218098163604736, 3.127777099609375, 3.2337441444396973]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 8.0, 13.0, 28.0, 41.0, 53.0, 78.0, 95.0, 106.0, 129.0, 100.0, 96.0, 94.0, 70.0, 35.0, 19.0, 21.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.502690315246582, -1.4595664739608765, -1.4164427518844604, -1.3733189105987549, -1.3301951885223389, -1.2870713472366333, -1.2439475059509277, -1.2008237838745117, -1.1576999425888062, -1.1145761013031006, -1.0714523792266846, -1.028328537940979, -0.9852047562599182, -0.9420809745788574, -0.8989571928977966, -0.8558334112167358, -0.812709629535675, -0.7695858478546143, -0.7264620661735535, -0.6833382844924927, -0.6402144432067871, -0.5970906615257263, -0.5539668798446655, -0.51084303855896, -0.46771928668022156, -0.42459550499916077, -0.3814716935157776, -0.3383479118347168, -0.295224130153656, -0.2521003186702728, -0.20897653698921204, -0.16585272550582886, -0.12272894382476807, -0.07960514724254608, -0.036481358110904694, 0.006642431020736694, 0.04976622760295868, 0.09289002418518066, 0.13601380586624146, 0.17913761734962463, 0.22226139903068542, 0.2653851807117462, 0.3085089921951294, 0.3516327738761902, 0.394756555557251, 0.43788036704063416, 0.48100414872169495, 0.5241279602050781, 0.5672517418861389, 0.6103755235671997, 0.6534993052482605, 0.6966230869293213, 0.7397469282150269, 0.7828707098960876, 0.8259944915771484, 0.869118332862854, 0.91224205493927, 0.9553658366203308, 0.9984896183013916, 1.0416134595870972, 1.0847371816635132, 1.1278610229492188, 1.1709847450256348, 1.2141085863113403, 1.257232427597046]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 7.0, 11.0, 12.0, 18.0, 20.0, 23.0, 40.0, 40.0, 53.0, 90.0, 102.0, 178.0, 303.0, 487.0, 975.0, 2264.0, 6958.0, 27766.0, 171432.0, 717394.0, 93601.0, 18000.0, 4936.0, 1749.0, 762.0, 403.0, 274.0, 177.0, 142.0, 90.0, 67.0, 38.0, 40.0, 28.0, 23.0, 11.0, 8.0, 11.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.34521484375, -0.33516693115234375, -0.3251190185546875, -0.31507110595703125, -0.305023193359375, -0.29497528076171875, -0.2849273681640625, -0.27487945556640625, -0.26483154296875, -0.25478363037109375, -0.2447357177734375, -0.23468780517578125, -0.224639892578125, -0.21459197998046875, -0.2045440673828125, -0.19449615478515625, -0.1844482421875, -0.17440032958984375, -0.1643524169921875, -0.15430450439453125, -0.144256591796875, -0.13420867919921875, -0.1241607666015625, -0.11411285400390625, -0.10406494140625, -0.09401702880859375, -0.0839691162109375, -0.07392120361328125, -0.063873291015625, -0.05382537841796875, -0.0437774658203125, -0.03372955322265625, -0.023681640625, -0.01363372802734375, -0.0035858154296875, 0.00646209716796875, 0.016510009765625, 0.02655792236328125, 0.0366058349609375, 0.04665374755859375, 0.05670166015625, 0.06674957275390625, 0.0767974853515625, 0.08684539794921875, 0.096893310546875, 0.10694122314453125, 0.1169891357421875, 0.12703704833984375, 0.1370849609375, 0.14713287353515625, 0.1571807861328125, 0.16722869873046875, 0.177276611328125, 0.18732452392578125, 0.1973724365234375, 0.20742034912109375, 0.21746826171875, 0.22751617431640625, 0.2375640869140625, 0.24761199951171875, 0.257659912109375, 0.26770782470703125, 0.2777557373046875, 0.28780364990234375, 0.2978515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 8.0, 17.0, 28.0, 38.0, 57.0, 83.0, 80.0, 95.0, 124.0, 112.0, 93.0, 84.0, 52.0, 45.0, 37.0, 22.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.14599609375, -0.14256668090820312, -0.13913726806640625, -0.13570785522460938, -0.1322784423828125, -0.12884902954101562, -0.12541961669921875, -0.12199020385742188, -0.118560791015625, -0.11513137817382812, -0.11170196533203125, -0.10827255249023438, -0.1048431396484375, -0.10141372680664062, -0.09798431396484375, -0.09455490112304688, -0.09112548828125, -0.08769607543945312, -0.08426666259765625, -0.08083724975585938, -0.0774078369140625, -0.07397842407226562, -0.07054901123046875, -0.06711959838867188, -0.063690185546875, -0.060260772705078125, -0.05683135986328125, -0.053401947021484375, -0.0499725341796875, -0.046543121337890625, -0.04311370849609375, -0.039684295654296875, -0.0362548828125, -0.032825469970703125, -0.02939605712890625, -0.025966644287109375, -0.0225372314453125, -0.019107818603515625, -0.01567840576171875, -0.012248992919921875, -0.008819580078125, -0.005390167236328125, -0.00196075439453125, 0.001468658447265625, 0.0048980712890625, 0.008327484130859375, 0.01175689697265625, 0.015186309814453125, 0.01861572265625, 0.022045135498046875, 0.02547454833984375, 0.028903961181640625, 0.0323333740234375, 0.035762786865234375, 0.03919219970703125, 0.042621612548828125, 0.046051025390625, 0.049480438232421875, 0.05290985107421875, 0.056339263916015625, 0.0597686767578125, 0.06319808959960938, 0.06662750244140625, 0.07005691528320312, 0.073486328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 2.0, 13.0, 14.0, 8.0, 13.0, 31.0, 35.0, 32.0, 57.0, 89.0, 178.0, 338.0, 1403.0, 8092.0, 109582.0, 876361.0, 46058.0, 4629.0, 899.0, 292.0, 122.0, 81.0, 51.0, 47.0, 30.0, 19.0, 17.0, 19.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.399658203125, -0.3864936828613281, -0.37332916259765625, -0.3601646423339844, -0.3470001220703125, -0.3338356018066406, -0.32067108154296875, -0.3075065612792969, -0.294342041015625, -0.2811775207519531, -0.26801300048828125, -0.2548484802246094, -0.2416839599609375, -0.22851943969726562, -0.21535491943359375, -0.20219039916992188, -0.18902587890625, -0.17586135864257812, -0.16269683837890625, -0.14953231811523438, -0.1363677978515625, -0.12320327758789062, -0.11003875732421875, -0.09687423706054688, -0.083709716796875, -0.07054519653320312, -0.05738067626953125, -0.044216156005859375, -0.0310516357421875, -0.017887115478515625, -0.00472259521484375, 0.008441925048828125, 0.0216064453125, 0.034770965576171875, 0.04793548583984375, 0.061100006103515625, 0.0742645263671875, 0.08742904663085938, 0.10059356689453125, 0.11375808715820312, 0.126922607421875, 0.14008712768554688, 0.15325164794921875, 0.16641616821289062, 0.1795806884765625, 0.19274520874023438, 0.20590972900390625, 0.21907424926757812, 0.23223876953125, 0.24540328979492188, 0.25856781005859375, 0.2717323303222656, 0.2848968505859375, 0.2980613708496094, 0.31122589111328125, 0.3243904113769531, 0.337554931640625, 0.3507194519042969, 0.36388397216796875, 0.3770484924316406, 0.3902130126953125, 0.4033775329589844, 0.41654205322265625, 0.4297065734863281, 0.44287109375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 10.0, 14.0, 18.0, 24.0, 21.0, 28.0, 41.0, 47.0, 44.0, 64.0, 65.0, 58.0, 64.0, 69.0, 51.0, 63.0, 57.0, 37.0, 38.0, 28.0, 29.0, 24.0, 21.0, 11.0, 14.0, 10.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2578125, -0.24934005737304688, -0.24086761474609375, -0.23239517211914062, -0.2239227294921875, -0.21545028686523438, -0.20697784423828125, -0.19850540161132812, -0.190032958984375, -0.18156051635742188, -0.17308807373046875, -0.16461563110351562, -0.1561431884765625, -0.14767074584960938, -0.13919830322265625, -0.13072586059570312, -0.12225341796875, -0.11378097534179688, -0.10530853271484375, -0.09683609008789062, -0.0883636474609375, -0.07989120483398438, -0.07141876220703125, -0.06294631958007812, -0.054473876953125, -0.046001434326171875, -0.03752899169921875, -0.029056549072265625, -0.0205841064453125, -0.012111663818359375, -0.00363922119140625, 0.004833221435546875, 0.0133056640625, 0.021778106689453125, 0.03025054931640625, 0.038722991943359375, 0.0471954345703125, 0.055667877197265625, 0.06414031982421875, 0.07261276245117188, 0.081085205078125, 0.08955764770507812, 0.09803009033203125, 0.10650253295898438, 0.1149749755859375, 0.12344741821289062, 0.13191986083984375, 0.14039230346679688, 0.14886474609375, 0.15733718872070312, 0.16580963134765625, 0.17428207397460938, 0.1827545166015625, 0.19122695922851562, 0.19969940185546875, 0.20817184448242188, 0.216644287109375, 0.22511672973632812, 0.23358917236328125, 0.24206161499023438, 0.2505340576171875, 0.2590065002441406, 0.26747894287109375, 0.2759513854980469, 0.284423828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 27.0, 41.0, 75.0, 133.0, 370.0, 992.0, 3711.0, 27125.0, 937379.0, 70653.0, 5676.0, 1451.0, 464.0, 158.0, 76.0, 50.0, 35.0, 10.0, 17.0, 7.0, 6.0, 11.0, 4.0, 9.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1434326171875, -0.13916778564453125, -0.1349029541015625, -0.13063812255859375, -0.126373291015625, -0.12210845947265625, -0.1178436279296875, -0.11357879638671875, -0.10931396484375, -0.10504913330078125, -0.1007843017578125, -0.09651947021484375, -0.092254638671875, -0.08798980712890625, -0.0837249755859375, -0.07946014404296875, -0.0751953125, -0.07093048095703125, -0.0666656494140625, -0.06240081787109375, -0.058135986328125, -0.05387115478515625, -0.0496063232421875, -0.04534149169921875, -0.04107666015625, -0.03681182861328125, -0.0325469970703125, -0.02828216552734375, -0.024017333984375, -0.01975250244140625, -0.0154876708984375, -0.01122283935546875, -0.0069580078125, -0.00269317626953125, 0.0015716552734375, 0.00583648681640625, 0.010101318359375, 0.01436614990234375, 0.0186309814453125, 0.02289581298828125, 0.02716064453125, 0.03142547607421875, 0.0356903076171875, 0.03995513916015625, 0.044219970703125, 0.04848480224609375, 0.0527496337890625, 0.05701446533203125, 0.061279296875, 0.06554412841796875, 0.0698089599609375, 0.07407379150390625, 0.078338623046875, 0.08260345458984375, 0.0868682861328125, 0.09113311767578125, 0.09539794921875, 0.09966278076171875, 0.1039276123046875, 0.10819244384765625, 0.112457275390625, 0.11672210693359375, 0.1209869384765625, 0.12525177001953125, 0.1295166015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 11.0, 24.0, 29.0, 37.0, 50.0, 54.0, 68.0, 96.0, 102.0, 89.0, 85.0, 77.0, 56.0, 50.0, 30.0, 23.0, 35.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.361002594232559e-05, -8.98856669664383e-05, -8.6161307990551e-05, -8.24369490146637e-05, -7.87125900387764e-05, -7.49882310628891e-05, -7.12638720870018e-05, -6.75395131111145e-05, -6.38151541352272e-05, -6.0090795159339905e-05, -5.6366436183452606e-05, -5.264207720756531e-05, -4.891771823167801e-05, -4.519335925579071e-05, -4.146900027990341e-05, -3.774464130401611e-05, -3.4020282328128815e-05, -3.0295923352241516e-05, -2.6571564376354218e-05, -2.284720540046692e-05, -1.912284642457962e-05, -1.5398487448692322e-05, -1.1674128472805023e-05, -7.949769496917725e-06, -4.225410521030426e-06, -5.010515451431274e-07, 3.223307430744171e-06, 6.94766640663147e-06, 1.0672025382518768e-05, 1.4396384358406067e-05, 1.8120743334293365e-05, 2.1845102310180664e-05, 2.5569461286067963e-05, 2.929382026195526e-05, 3.301817923784256e-05, 3.674253821372986e-05, 4.046689718961716e-05, 4.4191256165504456e-05, 4.7915615141391754e-05, 5.163997411727905e-05, 5.536433309316635e-05, 5.908869206905365e-05, 6.281305104494095e-05, 6.653741002082825e-05, 7.026176899671555e-05, 7.398612797260284e-05, 7.771048694849014e-05, 8.143484592437744e-05, 8.515920490026474e-05, 8.888356387615204e-05, 9.260792285203934e-05, 9.633228182792664e-05, 0.00010005664080381393, 0.00010378099977970123, 0.00010750535875558853, 0.00011122971773147583, 0.00011495407670736313, 0.00011867843568325043, 0.00012240279465913773, 0.00012612715363502502, 0.00012985151261091232, 0.00013357587158679962, 0.00013730023056268692, 0.00014102458953857422]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 3.0, 10.0, 12.0, 28.0, 47.0, 86.0, 139.0, 281.0, 809.0, 3284.0, 21482.0, 757184.0, 251412.0, 10706.0, 1973.0, 537.0, 249.0, 110.0, 73.0, 40.0, 21.0, 13.0, 16.0, 7.0, 8.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.1130533218383789, -0.10971260070800781, -0.10637187957763672, -0.10303115844726562, -0.09969043731689453, -0.09634971618652344, -0.09300899505615234, -0.08966827392578125, -0.08632755279541016, -0.08298683166503906, -0.07964611053466797, -0.07630538940429688, -0.07296466827392578, -0.06962394714355469, -0.0662832260131836, -0.0629425048828125, -0.059601783752441406, -0.05626106262207031, -0.05292034149169922, -0.049579620361328125, -0.04623889923095703, -0.04289817810058594, -0.039557456970214844, -0.03621673583984375, -0.032876014709472656, -0.029535293579101562, -0.02619457244873047, -0.022853851318359375, -0.01951313018798828, -0.016172409057617188, -0.012831687927246094, -0.009490966796875, -0.006150245666503906, -0.0028095245361328125, 0.0005311965942382812, 0.003871917724609375, 0.007212638854980469, 0.010553359985351562, 0.013894081115722656, 0.01723480224609375, 0.020575523376464844, 0.023916244506835938, 0.02725696563720703, 0.030597686767578125, 0.03393840789794922, 0.03727912902832031, 0.040619850158691406, 0.0439605712890625, 0.047301292419433594, 0.05064201354980469, 0.05398273468017578, 0.057323455810546875, 0.06066417694091797, 0.06400489807128906, 0.06734561920166016, 0.07068634033203125, 0.07402706146240234, 0.07736778259277344, 0.08070850372314453, 0.08404922485351562, 0.08738994598388672, 0.09073066711425781, 0.0940713882446289, 0.097412109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 7.0, 18.0, 25.0, 31.0, 59.0, 85.0, 123.0, 142.0, 137.0, 123.0, 78.0, 48.0, 34.0, 16.0, 17.0, 8.0, 6.0, 8.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07315254211425781, -0.07092666625976562, -0.06870079040527344, -0.06647491455078125, -0.06424903869628906, -0.062023162841796875, -0.05979728698730469, -0.0575714111328125, -0.05534553527832031, -0.053119659423828125, -0.05089378356933594, -0.04866790771484375, -0.04644203186035156, -0.044216156005859375, -0.04199028015136719, -0.039764404296875, -0.03753852844238281, -0.035312652587890625, -0.03308677673339844, -0.03086090087890625, -0.028635025024414062, -0.026409149169921875, -0.024183273315429688, -0.0219573974609375, -0.019731521606445312, -0.017505645751953125, -0.015279769897460938, -0.01305389404296875, -0.010828018188476562, -0.008602142333984375, -0.0063762664794921875, -0.004150390625, -0.0019245147705078125, 0.000301361083984375, 0.0025272369384765625, 0.00475311279296875, 0.0069789886474609375, 0.009204864501953125, 0.011430740356445312, 0.0136566162109375, 0.015882492065429688, 0.018108367919921875, 0.020334243774414062, 0.02256011962890625, 0.024785995483398438, 0.027011871337890625, 0.029237747192382812, 0.031463623046875, 0.03368949890136719, 0.035915374755859375, 0.03814125061035156, 0.04036712646484375, 0.04259300231933594, 0.044818878173828125, 0.04704475402832031, 0.0492706298828125, 0.05149650573730469, 0.053722381591796875, 0.05594825744628906, 0.05817413330078125, 0.06040000915527344, 0.06262588500976562, 0.06485176086425781, 0.06707763671875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 13.0, 31.0, 74.0, 333.0, 378.0, 108.0, 36.0, 20.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3696460723876953, -3.2929718494415283, -3.2162978649139404, -3.1396236419677734, -3.0629496574401855, -2.9862754344940186, -2.9096014499664307, -2.8329272270202637, -2.756253242492676, -2.679579019546509, -2.602905035018921, -2.526230812072754, -2.449556827545166, -2.372882604598999, -2.296208620071411, -2.219534397125244, -2.142860174179077, -2.06618595123291, -1.9895119667053223, -1.9128378629684448, -1.8361637592315674, -1.7594895362854004, -1.682815432548523, -1.6061413288116455, -1.529467225074768, -1.4527931213378906, -1.3761190176010132, -1.2994449138641357, -1.2227706909179688, -1.1460967063903809, -1.0694224834442139, -0.9927483797073364, -0.9160740375518799, -0.8393999338150024, -0.762725830078125, -0.6860516667366028, -0.6093775629997253, -0.5327034592628479, -0.45602932572364807, -0.37935519218444824, -0.3026810884475708, -0.22600696980953217, -0.14933285117149353, -0.0726587325334549, 0.00401538610458374, 0.08068948984146118, 0.157363623380661, 0.23403775691986084, 0.3107118606567383, 0.3873859643936157, 0.46406009793281555, 0.5407342314720154, 0.6174083352088928, 0.6940824389457703, 0.7707566022872925, 0.8474307060241699, 0.9241048097610474, 1.0007789134979248, 1.0774530172348022, 1.1541271209716797, 1.2308013439178467, 1.3074753284454346, 1.3841495513916016, 1.460823655128479, 1.5374977588653564]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 9.0, 14.0, 7.0, 15.0, 25.0, 17.0, 27.0, 27.0, 26.0, 32.0, 43.0, 52.0, 40.0, 56.0, 59.0, 45.0, 73.0, 59.0, 60.0, 42.0, 44.0, 37.0, 35.0, 23.0, 22.0, 20.0, 14.0, 18.0, 6.0, 16.0, 6.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.36531400680542, -1.323684573173523, -1.282055139541626, -1.2404258251190186, -1.1987963914871216, -1.1571669578552246, -1.1155375242233276, -1.0739080905914307, -1.0322786569595337, -0.9906492233276367, -0.9490198493003845, -0.9073904156684875, -0.8657609820365906, -0.8241316080093384, -0.7825021743774414, -0.7408727407455444, -0.6992433667182922, -0.6576139330863953, -0.6159845590591431, -0.5743551254272461, -0.5327256917953491, -0.49109628796577454, -0.44946688413619995, -0.407837450504303, -0.3662080466747284, -0.3245786428451538, -0.28294920921325684, -0.24131980538368225, -0.19969038665294647, -0.1580609679222107, -0.11643156409263611, -0.07480213046073914, -0.03317272663116455, 0.00845668837428093, 0.05008610337972641, 0.09171551465988159, 0.13334493339061737, 0.17497435212135315, 0.21660375595092773, 0.2582331895828247, 0.2998625934123993, 0.3414919972419739, 0.38312143087387085, 0.42475083470344543, 0.46638023853302, 0.508009672164917, 0.549639105796814, 0.5912685394287109, 0.6328979134559631, 0.6745273470878601, 0.7161567211151123, 0.7577861547470093, 0.7994155883789062, 0.8410450220108032, 0.8826743960380554, 0.9243038296699524, 0.9659332036972046, 1.0075626373291016, 1.0491920709609985, 1.0908215045928955, 1.132450819015503, 1.1740802526474, 1.2157096862792969, 1.2573391199111938, 1.2989685535430908]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 6.0, 4.0, 10.0, 14.0, 21.0, 26.0, 24.0, 39.0, 51.0, 65.0, 81.0, 115.0, 165.0, 265.0, 403.0, 747.0, 1616.0, 4115.0, 13727.0, 88205.0, 3905189.0, 153854.0, 18077.0, 4543.0, 1523.0, 671.0, 337.0, 172.0, 85.0, 46.0, 29.0, 13.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.548828125, -0.5362358093261719, -0.5236434936523438, -0.5110511779785156, -0.4984588623046875, -0.4858665466308594, -0.47327423095703125, -0.4606819152832031, -0.448089599609375, -0.4354972839355469, -0.42290496826171875, -0.4103126525878906, -0.3977203369140625, -0.3851280212402344, -0.37253570556640625, -0.3599433898925781, -0.34735107421875, -0.3347587585449219, -0.32216644287109375, -0.3095741271972656, -0.2969818115234375, -0.2843894958496094, -0.27179718017578125, -0.2592048645019531, -0.246612548828125, -0.23402023315429688, -0.22142791748046875, -0.20883560180664062, -0.1962432861328125, -0.18365097045898438, -0.17105865478515625, -0.15846633911132812, -0.1458740234375, -0.13328170776367188, -0.12068939208984375, -0.10809707641601562, -0.0955047607421875, -0.08291244506835938, -0.07032012939453125, -0.057727813720703125, -0.045135498046875, -0.032543182373046875, -0.01995086669921875, -0.007358551025390625, 0.0052337646484375, 0.017826080322265625, 0.03041839599609375, 0.043010711669921875, 0.05560302734375, 0.06819534301757812, 0.08078765869140625, 0.09337997436523438, 0.1059722900390625, 0.11856460571289062, 0.13115692138671875, 0.14374923706054688, 0.156341552734375, 0.16893386840820312, 0.18152618408203125, 0.19411849975585938, 0.2067108154296875, 0.21930313110351562, 0.23189544677734375, 0.24448776245117188, 0.257080078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 10.0, 23.0, 21.0, 50.0, 63.0, 70.0, 99.0, 97.0, 113.0, 89.0, 80.0, 79.0, 77.0, 46.0, 32.0, 16.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.1444253921508789, -0.1410236358642578, -0.13762187957763672, -0.13422012329101562, -0.13081836700439453, -0.12741661071777344, -0.12401485443115234, -0.12061309814453125, -0.11721134185791016, -0.11380958557128906, -0.11040782928466797, -0.10700607299804688, -0.10360431671142578, -0.10020256042480469, -0.0968008041381836, -0.0933990478515625, -0.0899972915649414, -0.08659553527832031, -0.08319377899169922, -0.07979202270507812, -0.07639026641845703, -0.07298851013183594, -0.06958675384521484, -0.06618499755859375, -0.06278324127197266, -0.05938148498535156, -0.05597972869873047, -0.052577972412109375, -0.04917621612548828, -0.04577445983886719, -0.042372703552246094, -0.038970947265625, -0.035569190979003906, -0.03216743469238281, -0.02876567840576172, -0.025363922119140625, -0.02196216583251953, -0.018560409545898438, -0.015158653259277344, -0.01175689697265625, -0.008355140686035156, -0.0049533843994140625, -0.0015516281127929688, 0.001850128173828125, 0.005251884460449219, 0.008653640747070312, 0.012055397033691406, 0.0154571533203125, 0.018858909606933594, 0.022260665893554688, 0.02566242218017578, 0.029064178466796875, 0.03246593475341797, 0.03586769104003906, 0.039269447326660156, 0.04267120361328125, 0.046072959899902344, 0.04947471618652344, 0.05287647247314453, 0.056278228759765625, 0.05967998504638672, 0.06308174133300781, 0.0664834976196289, 0.06988525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 17.0, 61.0, 107.0, 275.0, 898.0, 4101483.0, 90266.0, 759.0, 271.0, 92.0, 26.0, 13.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9515228271484375, -1.897186279296875, -1.8428497314453125, -1.78851318359375, -1.7341766357421875, -1.679840087890625, -1.6255035400390625, -1.5711669921875, -1.5168304443359375, -1.462493896484375, -1.4081573486328125, -1.35382080078125, -1.2994842529296875, -1.245147705078125, -1.1908111572265625, -1.136474609375, -1.0821380615234375, -1.027801513671875, -0.9734649658203125, -0.91912841796875, -0.8647918701171875, -0.810455322265625, -0.7561187744140625, -0.7017822265625, -0.6474456787109375, -0.593109130859375, -0.5387725830078125, -0.48443603515625, -0.4300994873046875, -0.375762939453125, -0.3214263916015625, -0.26708984375, -0.2127532958984375, -0.158416748046875, -0.1040802001953125, -0.04974365234375, 0.0045928955078125, 0.058929443359375, 0.1132659912109375, 0.1676025390625, 0.2219390869140625, 0.276275634765625, 0.3306121826171875, 0.38494873046875, 0.4392852783203125, 0.493621826171875, 0.5479583740234375, 0.602294921875, 0.6566314697265625, 0.710968017578125, 0.7653045654296875, 0.81964111328125, 0.8739776611328125, 0.928314208984375, 0.9826507568359375, 1.0369873046875, 1.0913238525390625, 1.145660400390625, 1.1999969482421875, 1.25433349609375, 1.3086700439453125, 1.363006591796875, 1.4173431396484375, 1.4716796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 9.0, 22.0, 77.0, 735.0, 3081.0, 125.0, 23.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.32141876220703125, -0.3122711181640625, -0.30312347412109375, -0.293975830078125, -0.28482818603515625, -0.2756805419921875, -0.26653289794921875, -0.25738525390625, -0.24823760986328125, -0.2390899658203125, -0.22994232177734375, -0.220794677734375, -0.21164703369140625, -0.2024993896484375, -0.19335174560546875, -0.1842041015625, -0.17505645751953125, -0.1659088134765625, -0.15676116943359375, -0.147613525390625, -0.13846588134765625, -0.1293182373046875, -0.12017059326171875, -0.11102294921875, -0.10187530517578125, -0.0927276611328125, -0.08358001708984375, -0.074432373046875, -0.06528472900390625, -0.0561370849609375, -0.04698944091796875, -0.037841796875, -0.02869415283203125, -0.0195465087890625, -0.01039886474609375, -0.001251220703125, 0.00789642333984375, 0.0170440673828125, 0.02619171142578125, 0.03533935546875, 0.04448699951171875, 0.0536346435546875, 0.06278228759765625, 0.071929931640625, 0.08107757568359375, 0.0902252197265625, 0.09937286376953125, 0.1085205078125, 0.11766815185546875, 0.1268157958984375, 0.13596343994140625, 0.145111083984375, 0.15425872802734375, 0.1634063720703125, 0.17255401611328125, 0.18170166015625, 0.19084930419921875, 0.1999969482421875, 0.20914459228515625, 0.218292236328125, 0.22743988037109375, 0.2365875244140625, 0.24573516845703125, 0.2548828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 26.0, 779.0, 192.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.393536329269409, -3.316080093383789, -3.23862361907959, -3.1611673831939697, -3.0837111473083496, -3.0062546730041504, -2.9287984371185303, -2.85134220123291, -2.773885726928711, -2.696429491043091, -2.6189730167388916, -2.5415167808532715, -2.4640605449676514, -2.3866043090820312, -2.309147834777832, -2.231691598892212, -2.154235363006592, -2.0767791271209717, -1.999322772026062, -1.9218664169311523, -1.8444101810455322, -1.7669538259506226, -1.689497470855713, -1.6120412349700928, -1.534584879875183, -1.4571285247802734, -1.3796722888946533, -1.3022159337997437, -1.224759578704834, -1.1473033428192139, -1.0698469877243042, -0.9923906922340393, -0.9149341583251953, -0.8374778628349304, -0.7600215673446655, -0.6825652122497559, -0.605108916759491, -0.5276526212692261, -0.4501962959766388, -0.3727399706840515, -0.2952836751937866, -0.21782736480236053, -0.14037105441093445, -0.06291474401950836, 0.014541566371917725, 0.09199786186218262, 0.1694541871547699, 0.24691051244735718, 0.32436680793762207, 0.40182310342788696, 0.47927942872047424, 0.5567357540130615, 0.6341920495033264, 0.7116483449935913, 0.789104700088501, 0.8665609955787659, 0.9440172910690308, 1.0214736461639404, 1.0989298820495605, 1.1763862371444702, 1.2538425922393799, 1.331298828125, 1.4087551832199097, 1.4862115383148193, 1.5636677742004395]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 9.0, 4.0, 17.0, 20.0, 28.0, 30.0, 42.0, 61.0, 59.0, 81.0, 74.0, 91.0, 79.0, 81.0, 63.0, 47.0, 41.0, 31.0, 48.0, 29.0, 16.0, 8.0, 9.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4426233172416687, -0.4294520616531372, -0.4162808060646057, -0.4031095504760742, -0.3899383246898651, -0.3767670691013336, -0.3635958135128021, -0.35042455792427063, -0.3372533321380615, -0.32408207654953003, -0.31091082096099854, -0.29773956537246704, -0.28456833958625793, -0.27139708399772644, -0.25822582840919495, -0.24505457282066345, -0.23188331723213196, -0.21871206164360046, -0.20554082095623016, -0.19236956536769867, -0.17919832468032837, -0.16602706909179688, -0.15285581350326538, -0.1396845579147339, -0.1265133172273636, -0.11334206908941269, -0.10017082095146179, -0.0869995653629303, -0.0738283172249794, -0.0606570690870285, -0.04748581349849701, -0.03431456536054611, -0.021143317222595215, -0.007972067221999168, 0.005199182778596878, 0.018370434641838074, 0.03154168277978897, 0.04471293091773987, 0.05788418650627136, 0.07105543464422226, 0.08422668278217316, 0.09739793092012405, 0.11056917905807495, 0.12374043464660645, 0.13691169023513794, 0.15008293092250824, 0.16325418651103973, 0.17642542719841003, 0.18959668278694153, 0.20276793837547302, 0.21593917906284332, 0.22911043465137482, 0.24228167533874512, 0.2554529309272766, 0.2686241865158081, 0.2817954421043396, 0.2949666976928711, 0.3081379532814026, 0.3213092088699341, 0.3344804644584656, 0.3476516902446747, 0.3608229458332062, 0.37399420142173767, 0.38716545701026917, 0.40033668279647827]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 7.0, 14.0, 15.0, 20.0, 40.0, 64.0, 87.0, 136.0, 163.0, 290.0, 463.0, 783.0, 1835.0, 5165.0, 20206.0, 120450.0, 722843.0, 143078.0, 23003.0, 5635.0, 2030.0, 902.0, 472.0, 261.0, 184.0, 113.0, 74.0, 64.0, 26.0, 32.0, 16.0, 22.0, 16.0, 8.0, 5.0, 8.0, 5.0, 3.0, 0.0, 4.0, 2.0], "bins": [-0.37255859375, -0.36313629150390625, -0.3537139892578125, -0.34429168701171875, -0.334869384765625, -0.32544708251953125, -0.3160247802734375, -0.30660247802734375, -0.29718017578125, -0.28775787353515625, -0.2783355712890625, -0.26891326904296875, -0.259490966796875, -0.25006866455078125, -0.2406463623046875, -0.23122406005859375, -0.2218017578125, -0.21237945556640625, -0.2029571533203125, -0.19353485107421875, -0.184112548828125, -0.17469024658203125, -0.1652679443359375, -0.15584564208984375, -0.14642333984375, -0.13700103759765625, -0.1275787353515625, -0.11815643310546875, -0.108734130859375, -0.09931182861328125, -0.0898895263671875, -0.08046722412109375, -0.071044921875, -0.06162261962890625, -0.0522003173828125, -0.04277801513671875, -0.033355712890625, -0.02393341064453125, -0.0145111083984375, -0.00508880615234375, 0.00433349609375, 0.01375579833984375, 0.0231781005859375, 0.03260040283203125, 0.042022705078125, 0.05144500732421875, 0.0608673095703125, 0.07028961181640625, 0.0797119140625, 0.08913421630859375, 0.0985565185546875, 0.10797882080078125, 0.117401123046875, 0.12682342529296875, 0.1362457275390625, 0.14566802978515625, 0.15509033203125, 0.16451263427734375, 0.1739349365234375, 0.18335723876953125, 0.192779541015625, 0.20220184326171875, 0.2116241455078125, 0.22104644775390625, 0.23046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 8.0, 15.0, 25.0, 43.0, 41.0, 56.0, 74.0, 86.0, 86.0, 95.0, 95.0, 68.0, 66.0, 73.0, 54.0, 32.0, 30.0, 17.0, 17.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.1339111328125, -0.13083744049072266, -0.1277637481689453, -0.12469005584716797, -0.12161636352539062, -0.11854267120361328, -0.11546897888183594, -0.1123952865600586, -0.10932159423828125, -0.1062479019165039, -0.10317420959472656, -0.10010051727294922, -0.09702682495117188, -0.09395313262939453, -0.09087944030761719, -0.08780574798583984, -0.0847320556640625, -0.08165836334228516, -0.07858467102050781, -0.07551097869873047, -0.07243728637695312, -0.06936359405517578, -0.06628990173339844, -0.0632162094116211, -0.06014251708984375, -0.057068824768066406, -0.05399513244628906, -0.05092144012451172, -0.047847747802734375, -0.04477405548095703, -0.04170036315917969, -0.038626670837402344, -0.035552978515625, -0.032479286193847656, -0.029405593872070312, -0.02633190155029297, -0.023258209228515625, -0.02018451690673828, -0.017110824584960938, -0.014037132263183594, -0.01096343994140625, -0.007889747619628906, -0.0048160552978515625, -0.0017423629760742188, 0.001331329345703125, 0.004405021667480469, 0.0074787139892578125, 0.010552406311035156, 0.0136260986328125, 0.016699790954589844, 0.019773483276367188, 0.02284717559814453, 0.025920867919921875, 0.02899456024169922, 0.03206825256347656, 0.035141944885253906, 0.03821563720703125, 0.041289329528808594, 0.04436302185058594, 0.04743671417236328, 0.050510406494140625, 0.05358409881591797, 0.05665779113769531, 0.059731483459472656, 0.06280517578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 10.0, 13.0, 26.0, 41.0, 52.0, 101.0, 212.0, 493.0, 1785.0, 10293.0, 232058.0, 778949.0, 20526.0, 2649.0, 745.0, 265.0, 126.0, 59.0, 45.0, 28.0, 12.0, 12.0, 10.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65625, -0.6394844055175781, -0.6227188110351562, -0.6059532165527344, -0.5891876220703125, -0.5724220275878906, -0.5556564331054688, -0.5388908386230469, -0.522125244140625, -0.5053596496582031, -0.48859405517578125, -0.4718284606933594, -0.4550628662109375, -0.4382972717285156, -0.42153167724609375, -0.4047660827636719, -0.38800048828125, -0.3712348937988281, -0.35446929931640625, -0.3377037048339844, -0.3209381103515625, -0.3041725158691406, -0.28740692138671875, -0.2706413269042969, -0.253875732421875, -0.23711013793945312, -0.22034454345703125, -0.20357894897460938, -0.1868133544921875, -0.17004776000976562, -0.15328216552734375, -0.13651657104492188, -0.1197509765625, -0.10298538208007812, -0.08621978759765625, -0.06945419311523438, -0.0526885986328125, -0.035923004150390625, -0.01915740966796875, -0.002391815185546875, 0.014373779296875, 0.031139373779296875, 0.04790496826171875, 0.06467056274414062, 0.0814361572265625, 0.09820175170898438, 0.11496734619140625, 0.13173294067382812, 0.14849853515625, 0.16526412963867188, 0.18202972412109375, 0.19879531860351562, 0.2155609130859375, 0.23232650756835938, 0.24909210205078125, 0.2658576965332031, 0.282623291015625, 0.2993888854980469, 0.31615447998046875, 0.3329200744628906, 0.3496856689453125, 0.3664512634277344, 0.38321685791015625, 0.3999824523925781, 0.416748046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 5.0, 12.0, 21.0, 30.0, 36.0, 36.0, 53.0, 67.0, 85.0, 95.0, 102.0, 81.0, 74.0, 69.0, 60.0, 42.0, 21.0, 30.0, 19.0, 9.0, 7.0, 9.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5166015625, -0.5034751892089844, -0.49034881591796875, -0.4772224426269531, -0.4640960693359375, -0.4509696960449219, -0.43784332275390625, -0.4247169494628906, -0.411590576171875, -0.3984642028808594, -0.38533782958984375, -0.3722114562988281, -0.3590850830078125, -0.3459587097167969, -0.33283233642578125, -0.3197059631347656, -0.30657958984375, -0.2934532165527344, -0.28032684326171875, -0.2672004699707031, -0.2540740966796875, -0.24094772338867188, -0.22782135009765625, -0.21469497680664062, -0.201568603515625, -0.18844223022460938, -0.17531585693359375, -0.16218948364257812, -0.1490631103515625, -0.13593673706054688, -0.12281036376953125, -0.10968399047851562, -0.0965576171875, -0.08343124389648438, -0.07030487060546875, -0.057178497314453125, -0.0440521240234375, -0.030925750732421875, -0.01779937744140625, -0.004673004150390625, 0.008453369140625, 0.021579742431640625, 0.03470611572265625, 0.047832489013671875, 0.0609588623046875, 0.07408523559570312, 0.08721160888671875, 0.10033798217773438, 0.11346435546875, 0.12659072875976562, 0.13971710205078125, 0.15284347534179688, 0.1659698486328125, 0.17909622192382812, 0.19222259521484375, 0.20534896850585938, 0.218475341796875, 0.23160171508789062, 0.24472808837890625, 0.2578544616699219, 0.2709808349609375, 0.2841072082519531, 0.29723358154296875, 0.3103599548339844, 0.323486328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 12.0, 8.0, 11.0, 27.0, 32.0, 45.0, 86.0, 145.0, 272.0, 579.0, 1224.0, 3774.0, 22868.0, 785909.0, 219029.0, 10277.0, 2364.0, 861.0, 429.0, 213.0, 132.0, 81.0, 57.0, 26.0, 21.0, 11.0, 8.0, 6.0, 7.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.0994415283203125, -0.095733642578125, -0.0920257568359375, -0.08831787109375, -0.0846099853515625, -0.080902099609375, -0.0771942138671875, -0.073486328125, -0.0697784423828125, -0.066070556640625, -0.0623626708984375, -0.05865478515625, -0.0549468994140625, -0.051239013671875, -0.0475311279296875, -0.0438232421875, -0.0401153564453125, -0.036407470703125, -0.0326995849609375, -0.02899169921875, -0.0252838134765625, -0.021575927734375, -0.0178680419921875, -0.01416015625, -0.0104522705078125, -0.006744384765625, -0.0030364990234375, 0.00067138671875, 0.0043792724609375, 0.008087158203125, 0.0117950439453125, 0.0155029296875, 0.0192108154296875, 0.022918701171875, 0.0266265869140625, 0.03033447265625, 0.0340423583984375, 0.037750244140625, 0.0414581298828125, 0.045166015625, 0.0488739013671875, 0.052581787109375, 0.0562896728515625, 0.05999755859375, 0.0637054443359375, 0.067413330078125, 0.0711212158203125, 0.0748291015625, 0.0785369873046875, 0.082244873046875, 0.0859527587890625, 0.08966064453125, 0.0933685302734375, 0.097076416015625, 0.1007843017578125, 0.1044921875, 0.1082000732421875, 0.111907958984375, 0.1156158447265625, 0.11932373046875, 0.1230316162109375, 0.126739501953125, 0.1304473876953125, 0.1341552734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 13.0, 17.0, 29.0, 40.0, 50.0, 75.0, 97.0, 95.0, 146.0, 111.0, 93.0, 69.0, 54.0, 39.0, 20.0, 17.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001747608184814453, -0.00017011724412441254, -0.00016547366976737976, -0.00016083009541034698, -0.0001561865210533142, -0.00015154294669628143, -0.00014689937233924866, -0.00014225579798221588, -0.0001376122236251831, -0.00013296864926815033, -0.00012832507491111755, -0.00012368150055408478, -0.000119037926197052, -0.00011439435184001923, -0.00010975077748298645, -0.00010510720312595367, -0.0001004636287689209, -9.582005441188812e-05, -9.117648005485535e-05, -8.653290569782257e-05, -8.18893313407898e-05, -7.724575698375702e-05, -7.260218262672424e-05, -6.795860826969147e-05, -6.331503391265869e-05, -5.8671459555625916e-05, -5.402788519859314e-05, -4.9384310841560364e-05, -4.474073648452759e-05, -4.009716212749481e-05, -3.5453587770462036e-05, -3.081001341342926e-05, -2.6166439056396484e-05, -2.152286469936371e-05, -1.6879290342330933e-05, -1.2235715985298157e-05, -7.592141628265381e-06, -2.948567271232605e-06, 1.695007085800171e-06, 6.338581442832947e-06, 1.0982155799865723e-05, 1.56257301568985e-05, 2.0269304513931274e-05, 2.491287887096405e-05, 2.9556453227996826e-05, 3.42000275850296e-05, 3.884360194206238e-05, 4.3487176299095154e-05, 4.813075065612793e-05, 5.2774325013160706e-05, 5.741789937019348e-05, 6.206147372722626e-05, 6.670504808425903e-05, 7.134862244129181e-05, 7.599219679832458e-05, 8.063577115535736e-05, 8.527934551239014e-05, 8.992291986942291e-05, 9.456649422645569e-05, 9.921006858348846e-05, 0.00010385364294052124, 0.00010849721729755402, 0.00011314079165458679, 0.00011778436601161957, 0.00012242794036865234]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 16.0, 33.0, 68.0, 160.0, 449.0, 1396.0, 10040.0, 781470.0, 248022.0, 5270.0, 982.0, 353.0, 131.0, 61.0, 29.0, 20.0, 13.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0999755859375, -0.09494590759277344, -0.08991622924804688, -0.08488655090332031, -0.07985687255859375, -0.07482719421386719, -0.06979751586914062, -0.06476783752441406, -0.0597381591796875, -0.05470848083496094, -0.049678802490234375, -0.04464912414550781, -0.03961944580078125, -0.03458976745605469, -0.029560089111328125, -0.024530410766601562, -0.019500732421875, -0.014471054077148438, -0.009441375732421875, -0.0044116973876953125, 0.00061798095703125, 0.0056476593017578125, 0.010677337646484375, 0.015707015991210938, 0.0207366943359375, 0.025766372680664062, 0.030796051025390625, 0.03582572937011719, 0.04085540771484375, 0.04588508605957031, 0.050914764404296875, 0.05594444274902344, 0.06097412109375, 0.06600379943847656, 0.07103347778320312, 0.07606315612792969, 0.08109283447265625, 0.08612251281738281, 0.09115219116210938, 0.09618186950683594, 0.1012115478515625, 0.10624122619628906, 0.11127090454101562, 0.11630058288574219, 0.12133026123046875, 0.1263599395751953, 0.13138961791992188, 0.13641929626464844, 0.141448974609375, 0.14647865295410156, 0.15150833129882812, 0.1565380096435547, 0.16156768798828125, 0.1665973663330078, 0.17162704467773438, 0.17665672302246094, 0.1816864013671875, 0.18671607971191406, 0.19174575805664062, 0.1967754364013672, 0.20180511474609375, 0.2068347930908203, 0.21186447143554688, 0.21689414978027344, 0.221923828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 31.0, 49.0, 107.0, 148.0, 222.0, 180.0, 105.0, 51.0, 32.0, 18.0, 11.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08183860778808594, -0.07822799682617188, -0.07461738586425781, -0.07100677490234375, -0.06739616394042969, -0.06378555297851562, -0.06017494201660156, -0.0565643310546875, -0.05295372009277344, -0.049343109130859375, -0.04573249816894531, -0.04212188720703125, -0.03851127624511719, -0.034900665283203125, -0.03129005432128906, -0.027679443359375, -0.024068832397460938, -0.020458221435546875, -0.016847610473632812, -0.01323699951171875, -0.009626388549804688, -0.006015777587890625, -0.0024051666259765625, 0.0012054443359375, 0.0048160552978515625, 0.008426666259765625, 0.012037277221679688, 0.01564788818359375, 0.019258499145507812, 0.022869110107421875, 0.026479721069335938, 0.03009033203125, 0.03370094299316406, 0.037311553955078125, 0.04092216491699219, 0.04453277587890625, 0.04814338684082031, 0.051753997802734375, 0.05536460876464844, 0.0589752197265625, 0.06258583068847656, 0.06619644165039062, 0.06980705261230469, 0.07341766357421875, 0.07702827453613281, 0.08063888549804688, 0.08424949645996094, 0.087860107421875, 0.09147071838378906, 0.09508132934570312, 0.09869194030761719, 0.10230255126953125, 0.10591316223144531, 0.10952377319335938, 0.11313438415527344, 0.1167449951171875, 0.12035560607910156, 0.12396621704101562, 0.1275768280029297, 0.13118743896484375, 0.1347980499267578, 0.13840866088867188, 0.14201927185058594, 0.1456298828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 10.0, 32.0, 129.0, 630.0, 181.0, 25.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.594270706176758, -8.424546241760254, -8.254822731018066, -8.085098266601562, -7.915374755859375, -7.745650768280029, -7.575926780700684, -7.406202793121338, -7.236478805541992, -7.0667548179626465, -6.897030830383301, -6.727306842803955, -6.557582855224609, -6.387858867645264, -6.218134880065918, -6.048410892486572, -5.878686904907227, -5.708962917327881, -5.539238929748535, -5.3695149421691895, -5.199790954589844, -5.030066967010498, -4.860342979431152, -4.690618991851807, -4.520894527435303, -4.351170539855957, -4.181446552276611, -4.011722564697266, -3.84199857711792, -3.672274589538574, -3.5025506019592285, -3.332826614379883, -3.163102388381958, -2.9933784008026123, -2.8236544132232666, -2.653930425643921, -2.484206438064575, -2.3144824504852295, -2.1447582244873047, -1.9750343561172485, -1.8053103685379028, -1.6355863809585571, -1.4658623933792114, -1.2961382865905762, -1.1264142990112305, -0.9566903710365295, -0.7869663238525391, -0.6172423362731934, -0.44751834869384766, -0.27779436111450195, -0.10807034373283386, 0.06165367364883423, 0.23137766122817993, 0.40110164880752563, 0.5708256959915161, 0.7405496835708618, 0.9102736711502075, 1.0799976587295532, 1.249721646308899, 1.4194457530975342, 1.5891697406768799, 1.7588937282562256, 1.9286177158355713, 2.098341703414917, 2.2680656909942627]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 9.0, 9.0, 10.0, 18.0, 24.0, 18.0, 24.0, 27.0, 29.0, 35.0, 36.0, 34.0, 45.0, 39.0, 44.0, 61.0, 56.0, 37.0, 52.0, 44.0, 44.0, 35.0, 28.0, 33.0, 32.0, 22.0, 31.0, 19.0, 23.0, 9.0, 14.0, 4.0, 8.0, 5.0, 7.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4786643981933594, -1.433106541633606, -1.3875486850738525, -1.3419908285140991, -1.2964329719543457, -1.2508751153945923, -1.2053172588348389, -1.1597594022750854, -1.114201545715332, -1.0686436891555786, -1.0230858325958252, -0.9775279760360718, -0.9319701194763184, -0.8864122629165649, -0.8408544063568115, -0.7952965497970581, -0.7497387528419495, -0.704180896282196, -0.6586230397224426, -0.6130651831626892, -0.5675073266029358, -0.5219494700431824, -0.47639164328575134, -0.4308337867259979, -0.3852759301662445, -0.3397180736064911, -0.29416021704673767, -0.24860237538814545, -0.20304451882839203, -0.1574866622686386, -0.11192882061004639, -0.06637096405029297, -0.02081310749053955, 0.02474474534392357, 0.07030259817838669, 0.11586044728755951, 0.16141830384731293, 0.20697616040706635, 0.25253400206565857, 0.298091858625412, 0.3436497151851654, 0.3892075717449188, 0.43476542830467224, 0.48032325506210327, 0.5258811116218567, 0.5714389681816101, 0.6169968247413635, 0.6625546813011169, 0.7081125378608704, 0.7536703944206238, 0.7992282509803772, 0.8447861075401306, 0.890343964099884, 0.9359018206596375, 0.9814596176147461, 1.0270174741744995, 1.072575330734253, 1.1181331872940063, 1.1636910438537598, 1.2092489004135132, 1.2548067569732666, 1.30036461353302, 1.3459224700927734, 1.3914803266525269, 1.4370381832122803]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 6.0, 1.0, 9.0, 9.0, 5.0, 6.0, 8.0, 10.0, 13.0, 24.0, 25.0, 36.0, 64.0, 85.0, 122.0, 209.0, 347.0, 615.0, 1304.0, 2743.0, 7491.0, 36287.0, 3054392.0, 1047091.0, 32023.0, 6908.0, 2353.0, 1023.0, 479.0, 274.0, 132.0, 63.0, 52.0, 22.0, 17.0, 19.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.72998046875, -0.7133750915527344, -0.6967697143554688, -0.6801643371582031, -0.6635589599609375, -0.6469535827636719, -0.6303482055664062, -0.6137428283691406, -0.597137451171875, -0.5805320739746094, -0.5639266967773438, -0.5473213195800781, -0.5307159423828125, -0.5141105651855469, -0.49750518798828125, -0.4808998107910156, -0.46429443359375, -0.4476890563964844, -0.43108367919921875, -0.4144783020019531, -0.3978729248046875, -0.3812675476074219, -0.36466217041015625, -0.3480567932128906, -0.331451416015625, -0.3148460388183594, -0.29824066162109375, -0.2816352844238281, -0.2650299072265625, -0.24842453002929688, -0.23181915283203125, -0.21521377563476562, -0.1986083984375, -0.18200302124023438, -0.16539764404296875, -0.14879226684570312, -0.1321868896484375, -0.11558151245117188, -0.09897613525390625, -0.08237075805664062, -0.065765380859375, -0.049160003662109375, -0.03255462646484375, -0.015949249267578125, 0.0006561279296875, 0.017261505126953125, 0.03386688232421875, 0.050472259521484375, 0.06707763671875, 0.08368301391601562, 0.10028839111328125, 0.11689376831054688, 0.1334991455078125, 0.15010452270507812, 0.16670989990234375, 0.18331527709960938, 0.199920654296875, 0.21652603149414062, 0.23313140869140625, 0.24973678588867188, 0.2663421630859375, 0.2829475402832031, 0.29955291748046875, 0.3161582946777344, 0.332763671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 9.0, 21.0, 26.0, 47.0, 45.0, 46.0, 69.0, 95.0, 94.0, 91.0, 79.0, 90.0, 68.0, 58.0, 44.0, 41.0, 19.0, 15.0, 14.0, 11.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.1396484375, -0.13650083541870117, -0.13335323333740234, -0.13020563125610352, -0.1270580291748047, -0.12391042709350586, -0.12076282501220703, -0.1176152229309082, -0.11446762084960938, -0.11132001876831055, -0.10817241668701172, -0.10502481460571289, -0.10187721252441406, -0.09872961044311523, -0.0955820083618164, -0.09243440628051758, -0.08928680419921875, -0.08613920211791992, -0.0829916000366211, -0.07984399795532227, -0.07669639587402344, -0.07354879379272461, -0.07040119171142578, -0.06725358963012695, -0.06410598754882812, -0.0609583854675293, -0.05781078338623047, -0.05466318130493164, -0.05151557922363281, -0.048367977142333984, -0.045220375061035156, -0.04207277297973633, -0.0389251708984375, -0.03577756881713867, -0.032629966735839844, -0.029482364654541016, -0.026334762573242188, -0.02318716049194336, -0.02003955841064453, -0.016891956329345703, -0.013744354248046875, -0.010596752166748047, -0.007449150085449219, -0.004301548004150391, -0.0011539459228515625, 0.0019936561584472656, 0.005141258239746094, 0.008288860321044922, 0.01143646240234375, 0.014584064483642578, 0.017731666564941406, 0.020879268646240234, 0.024026870727539062, 0.02717447280883789, 0.03032207489013672, 0.03346967697143555, 0.036617279052734375, 0.0397648811340332, 0.04291248321533203, 0.04606008529663086, 0.04920768737792969, 0.052355289459228516, 0.055502891540527344, 0.05865049362182617, 0.061798095703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 1.0, 13.0, 19.0, 28.0, 37.0, 72.0, 125.0, 275.0, 1075.0, 10511.0, 4162900.0, 17565.0, 1213.0, 241.0, 103.0, 47.0, 20.0, 15.0, 9.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052734375, -2.0066909790039062, -1.9606475830078125, -1.9146041870117188, -1.868560791015625, -1.8225173950195312, -1.7764739990234375, -1.7304306030273438, -1.68438720703125, -1.6383438110351562, -1.5923004150390625, -1.5462570190429688, -1.500213623046875, -1.4541702270507812, -1.4081268310546875, -1.3620834350585938, -1.3160400390625, -1.2699966430664062, -1.2239532470703125, -1.1779098510742188, -1.131866455078125, -1.0858230590820312, -1.0397796630859375, -0.9937362670898438, -0.94769287109375, -0.9016494750976562, -0.8556060791015625, -0.8095626831054688, -0.763519287109375, -0.7174758911132812, -0.6714324951171875, -0.6253890991210938, -0.579345703125, -0.5333023071289062, -0.4872589111328125, -0.44121551513671875, -0.395172119140625, -0.34912872314453125, -0.3030853271484375, -0.25704193115234375, -0.21099853515625, -0.16495513916015625, -0.1189117431640625, -0.07286834716796875, -0.026824951171875, 0.01921844482421875, 0.0652618408203125, 0.11130523681640625, 0.1573486328125, 0.20339202880859375, 0.2494354248046875, 0.29547882080078125, 0.341522216796875, 0.38756561279296875, 0.4336090087890625, 0.47965240478515625, 0.52569580078125, 0.5717391967773438, 0.6177825927734375, 0.6638259887695312, 0.709869384765625, 0.7559127807617188, 0.8019561767578125, 0.8479995727539062, 0.89404296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 13.0, 40.0, 151.0, 2782.0, 907.0, 84.0, 38.0, 13.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.6329746246337891, -0.6194648742675781, -0.6059551239013672, -0.5924453735351562, -0.5789356231689453, -0.5654258728027344, -0.5519161224365234, -0.5384063720703125, -0.5248966217041016, -0.5113868713378906, -0.4978771209716797, -0.48436737060546875, -0.4708576202392578, -0.4573478698730469, -0.44383811950683594, -0.430328369140625, -0.41681861877441406, -0.4033088684082031, -0.3897991180419922, -0.37628936767578125, -0.3627796173095703, -0.3492698669433594, -0.33576011657714844, -0.3222503662109375, -0.30874061584472656, -0.2952308654785156, -0.2817211151123047, -0.26821136474609375, -0.2547016143798828, -0.24119186401367188, -0.22768211364746094, -0.21417236328125, -0.20066261291503906, -0.18715286254882812, -0.1736431121826172, -0.16013336181640625, -0.1466236114501953, -0.13311386108398438, -0.11960411071777344, -0.1060943603515625, -0.09258460998535156, -0.07907485961914062, -0.06556510925292969, -0.05205535888671875, -0.03854560852050781, -0.025035858154296875, -0.011526107788085938, 0.001983642578125, 0.015493392944335938, 0.029003143310546875, 0.04251289367675781, 0.05602264404296875, 0.06953239440917969, 0.08304214477539062, 0.09655189514160156, 0.1100616455078125, 0.12357139587402344, 0.13708114624023438, 0.1505908966064453, 0.16410064697265625, 0.1776103973388672, 0.19112014770507812, 0.20462989807128906, 0.2181396484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 12.0, 35.0, 179.0, 538.0, 179.0, 31.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-3.164594888687134, -3.105350971221924, -3.046107292175293, -2.986863613128662, -2.927619695663452, -2.868375778198242, -2.8091320991516113, -2.7498884201049805, -2.6906445026397705, -2.6314005851745605, -2.5721569061279297, -2.512913227081299, -2.453669309616089, -2.394425392150879, -2.335181713104248, -2.275938034057617, -2.2166941165924072, -2.1574501991271973, -2.0982065200805664, -2.0389628410339355, -1.9797189235687256, -1.9204751253128052, -1.8612313270568848, -1.8019875288009644, -1.742743730545044, -1.6834999322891235, -1.6242561340332031, -1.5650123357772827, -1.5057685375213623, -1.446524739265442, -1.3872809410095215, -1.328037142753601, -1.2687932252883911, -1.2095494270324707, -1.1503056287765503, -1.0910618305206299, -1.0318180322647095, -0.9725742340087891, -0.9133304357528687, -0.8540866374969482, -0.7948428392410278, -0.7355990409851074, -0.676355242729187, -0.6171114444732666, -0.5578676462173462, -0.4986238479614258, -0.43938004970550537, -0.38013625144958496, -0.32089245319366455, -0.26164865493774414, -0.20240485668182373, -0.14316105842590332, -0.08391726016998291, -0.0246734619140625, 0.03457033634185791, 0.09381413459777832, 0.15305793285369873, 0.21230173110961914, 0.27154552936553955, 0.33078932762145996, 0.39003312587738037, 0.4492769241333008, 0.5085207223892212, 0.5677645206451416, 0.627008318901062]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 16.0, 31.0, 43.0, 70.0, 103.0, 131.0, 129.0, 111.0, 112.0, 85.0, 56.0, 54.0, 19.0, 18.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5089569091796875, -1.4624419212341309, -1.4159269332885742, -1.3694119453430176, -1.322896957397461, -1.2763819694519043, -1.2298669815063477, -1.183351993560791, -1.1368370056152344, -1.0903220176696777, -1.043807029724121, -0.9972920417785645, -0.9507770538330078, -0.9042620658874512, -0.8577470183372498, -0.8112320303916931, -0.7647169828414917, -0.7182019948959351, -0.6716870069503784, -0.6251720190048218, -0.5786570310592651, -0.5321420431137085, -0.4856269955635071, -0.43911200761795044, -0.3925970196723938, -0.34608203172683716, -0.2995670437812805, -0.2530520260334015, -0.20653703808784485, -0.1600220501422882, -0.11350703239440918, -0.06699204444885254, -0.020476937294006348, 0.02603805810213089, 0.07255305349826813, 0.11906805634498596, 0.1655830442905426, 0.21209803223609924, 0.25861304998397827, 0.3051280379295349, 0.35164302587509155, 0.3981580138206482, 0.44467300176620483, 0.49118801951408386, 0.5377030372619629, 0.5842180252075195, 0.6307330131530762, 0.6772480010986328, 0.7237629890441895, 0.7702779769897461, 0.8167929649353027, 0.8633079528808594, 0.909822940826416, 0.9563379287719727, 1.0028529167175293, 1.049367904663086, 1.0958828926086426, 1.1423978805541992, 1.1889128684997559, 1.2354278564453125, 1.2819428443908691, 1.3284578323364258, 1.3749728202819824, 1.421487808227539, 1.4680029153823853]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 10.0, 10.0, 15.0, 22.0, 24.0, 51.0, 66.0, 106.0, 172.0, 314.0, 604.0, 1590.0, 5636.0, 43905.0, 757039.0, 217950.0, 16196.0, 2872.0, 953.0, 408.0, 223.0, 110.0, 82.0, 65.0, 24.0, 33.0, 18.0, 10.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5045356750488281, -0.49002838134765625, -0.4755210876464844, -0.4610137939453125, -0.4465065002441406, -0.43199920654296875, -0.4174919128417969, -0.402984619140625, -0.3884773254394531, -0.37397003173828125, -0.3594627380371094, -0.3449554443359375, -0.3304481506347656, -0.31594085693359375, -0.3014335632324219, -0.28692626953125, -0.2724189758300781, -0.25791168212890625, -0.24340438842773438, -0.2288970947265625, -0.21438980102539062, -0.19988250732421875, -0.18537521362304688, -0.170867919921875, -0.15636062622070312, -0.14185333251953125, -0.12734603881835938, -0.1128387451171875, -0.09833145141601562, -0.08382415771484375, -0.06931686401367188, -0.0548095703125, -0.040302276611328125, -0.02579498291015625, -0.011287689208984375, 0.0032196044921875, 0.017726898193359375, 0.03223419189453125, 0.046741485595703125, 0.061248779296875, 0.07575607299804688, 0.09026336669921875, 0.10477066040039062, 0.1192779541015625, 0.13378524780273438, 0.14829254150390625, 0.16279983520507812, 0.17730712890625, 0.19181442260742188, 0.20632171630859375, 0.22082901000976562, 0.2353363037109375, 0.24984359741210938, 0.26435089111328125, 0.2788581848144531, 0.293365478515625, 0.3078727722167969, 0.32238006591796875, 0.3368873596191406, 0.3513946533203125, 0.3659019470214844, 0.38040924072265625, 0.3949165344238281, 0.409423828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 10.0, 8.0, 22.0, 43.0, 65.0, 100.0, 107.0, 129.0, 137.0, 122.0, 106.0, 65.0, 45.0, 25.0, 11.0, 5.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.20030498504638672, -0.19565391540527344, -0.19100284576416016, -0.18635177612304688, -0.1817007064819336, -0.1770496368408203, -0.17239856719970703, -0.16774749755859375, -0.16309642791748047, -0.1584453582763672, -0.1537942886352539, -0.14914321899414062, -0.14449214935302734, -0.13984107971191406, -0.13519001007080078, -0.1305389404296875, -0.12588787078857422, -0.12123680114746094, -0.11658573150634766, -0.11193466186523438, -0.1072835922241211, -0.10263252258300781, -0.09798145294189453, -0.09333038330078125, -0.08867931365966797, -0.08402824401855469, -0.0793771743774414, -0.07472610473632812, -0.07007503509521484, -0.06542396545410156, -0.06077289581298828, -0.056121826171875, -0.05147075653076172, -0.04681968688964844, -0.042168617248535156, -0.037517547607421875, -0.032866477966308594, -0.028215408325195312, -0.02356433868408203, -0.01891326904296875, -0.014262199401855469, -0.009611129760742188, -0.004960060119628906, -0.000308990478515625, 0.004342079162597656, 0.008993148803710938, 0.013644218444824219, 0.0182952880859375, 0.02294635772705078, 0.027597427368164062, 0.032248497009277344, 0.036899566650390625, 0.041550636291503906, 0.04620170593261719, 0.05085277557373047, 0.05550384521484375, 0.06015491485595703, 0.06480598449707031, 0.0694570541381836, 0.07410812377929688, 0.07875919342041016, 0.08341026306152344, 0.08806133270263672, 0.09271240234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 20.0, 20.0, 37.0, 40.0, 66.0, 96.0, 149.0, 283.0, 481.0, 1049.0, 2470.0, 6880.0, 23034.0, 93815.0, 537750.0, 304715.0, 54966.0, 14380.0, 4669.0, 1773.0, 781.0, 397.0, 254.0, 132.0, 91.0, 46.0, 31.0, 27.0, 24.0, 7.0, 14.0, 11.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1915283203125, -0.18551063537597656, -0.17949295043945312, -0.1734752655029297, -0.16745758056640625, -0.1614398956298828, -0.15542221069335938, -0.14940452575683594, -0.1433868408203125, -0.13736915588378906, -0.13135147094726562, -0.1253337860107422, -0.11931610107421875, -0.11329841613769531, -0.10728073120117188, -0.10126304626464844, -0.095245361328125, -0.08922767639160156, -0.08320999145507812, -0.07719230651855469, -0.07117462158203125, -0.06515693664550781, -0.059139251708984375, -0.05312156677246094, -0.0471038818359375, -0.04108619689941406, -0.035068511962890625, -0.029050827026367188, -0.02303314208984375, -0.017015457153320312, -0.010997772216796875, -0.0049800872802734375, 0.00103759765625, 0.0070552825927734375, 0.013072967529296875, 0.019090652465820312, 0.02510833740234375, 0.031126022338867188, 0.037143707275390625, 0.04316139221191406, 0.0491790771484375, 0.05519676208496094, 0.061214447021484375, 0.06723213195800781, 0.07324981689453125, 0.07926750183105469, 0.08528518676757812, 0.09130287170410156, 0.097320556640625, 0.10333824157714844, 0.10935592651367188, 0.11537361145019531, 0.12139129638671875, 0.1274089813232422, 0.13342666625976562, 0.13944435119628906, 0.1454620361328125, 0.15147972106933594, 0.15749740600585938, 0.1635150909423828, 0.16953277587890625, 0.1755504608154297, 0.18156814575195312, 0.18758583068847656, 0.193603515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 17.0, 19.0, 23.0, 17.0, 22.0, 34.0, 41.0, 31.0, 46.0, 51.0, 41.0, 53.0, 55.0, 42.0, 46.0, 52.0, 46.0, 43.0, 43.0, 29.0, 47.0, 32.0, 27.0, 34.0, 21.0, 14.0, 17.0, 11.0, 8.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210693359375, -0.20326614379882812, -0.19583892822265625, -0.18841171264648438, -0.1809844970703125, -0.17355728149414062, -0.16613006591796875, -0.15870285034179688, -0.151275634765625, -0.14384841918945312, -0.13642120361328125, -0.12899398803710938, -0.1215667724609375, -0.11413955688476562, -0.10671234130859375, -0.09928512573242188, -0.09185791015625, -0.08443069458007812, -0.07700347900390625, -0.06957626342773438, -0.0621490478515625, -0.054721832275390625, -0.04729461669921875, -0.039867401123046875, -0.032440185546875, -0.025012969970703125, -0.01758575439453125, -0.010158538818359375, -0.0027313232421875, 0.004695892333984375, 0.01212310791015625, 0.019550323486328125, 0.0269775390625, 0.034404754638671875, 0.04183197021484375, 0.049259185791015625, 0.0566864013671875, 0.06411361694335938, 0.07154083251953125, 0.07896804809570312, 0.086395263671875, 0.09382247924804688, 0.10124969482421875, 0.10867691040039062, 0.1161041259765625, 0.12353134155273438, 0.13095855712890625, 0.13838577270507812, 0.14581298828125, 0.15324020385742188, 0.16066741943359375, 0.16809463500976562, 0.1755218505859375, 0.18294906616210938, 0.19037628173828125, 0.19780349731445312, 0.205230712890625, 0.21265792846679688, 0.22008514404296875, 0.22751235961914062, 0.2349395751953125, 0.24236679077148438, 0.24979400634765625, 0.2572212219238281, 0.2646484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 7.0, 11.0, 21.0, 16.0, 17.0, 21.0, 26.0, 34.0, 51.0, 68.0, 94.0, 173.0, 310.0, 706.0, 1747.0, 5656.0, 37510.0, 752021.0, 231332.0, 13307.0, 3211.0, 1062.0, 472.0, 222.0, 119.0, 82.0, 52.0, 29.0, 26.0, 41.0, 16.0, 18.0, 14.0, 7.0, 6.0, 9.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08026123046875, -0.07726287841796875, -0.0742645263671875, -0.07126617431640625, -0.068267822265625, -0.06526947021484375, -0.0622711181640625, -0.05927276611328125, -0.0562744140625, -0.05327606201171875, -0.0502777099609375, -0.04727935791015625, -0.044281005859375, -0.04128265380859375, -0.0382843017578125, -0.03528594970703125, -0.03228759765625, -0.02928924560546875, -0.0262908935546875, -0.02329254150390625, -0.020294189453125, -0.01729583740234375, -0.0142974853515625, -0.01129913330078125, -0.00830078125, -0.00530242919921875, -0.0023040771484375, 0.00069427490234375, 0.003692626953125, 0.00669097900390625, 0.0096893310546875, 0.01268768310546875, 0.01568603515625, 0.01868438720703125, 0.0216827392578125, 0.02468109130859375, 0.027679443359375, 0.03067779541015625, 0.0336761474609375, 0.03667449951171875, 0.0396728515625, 0.04267120361328125, 0.0456695556640625, 0.04866790771484375, 0.051666259765625, 0.05466461181640625, 0.0576629638671875, 0.06066131591796875, 0.06365966796875, 0.06665802001953125, 0.0696563720703125, 0.07265472412109375, 0.075653076171875, 0.07865142822265625, 0.0816497802734375, 0.08464813232421875, 0.087646484375, 0.09064483642578125, 0.0936431884765625, 0.09664154052734375, 0.099639892578125, 0.10263824462890625, 0.1056365966796875, 0.10863494873046875, 0.11163330078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 14.0, 13.0, 24.0, 34.0, 66.0, 141.0, 245.0, 207.0, 129.0, 59.0, 33.0, 17.0, 17.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00043272972106933594, -0.0004240460693836212, -0.0004153624176979065, -0.00040667876601219177, -0.00039799511432647705, -0.00038931146264076233, -0.0003806278109550476, -0.0003719441592693329, -0.00036326050758361816, -0.00035457685589790344, -0.0003458932042121887, -0.000337209552526474, -0.0003285259008407593, -0.00031984224915504456, -0.00031115859746932983, -0.0003024749457836151, -0.0002937912940979004, -0.00028510764241218567, -0.00027642399072647095, -0.0002677403390407562, -0.0002590566873550415, -0.0002503730356693268, -0.00024168938398361206, -0.00023300573229789734, -0.00022432208061218262, -0.0002156384289264679, -0.00020695477724075317, -0.00019827112555503845, -0.00018958747386932373, -0.000180903822183609, -0.0001722201704978943, -0.00016353651881217957, -0.00015485286712646484, -0.00014616921544075012, -0.0001374855637550354, -0.00012880191206932068, -0.00012011826038360596, -0.00011143460869789124, -0.00010275095701217651, -9.406730532646179e-05, -8.538365364074707e-05, -7.670000195503235e-05, -6.801635026931763e-05, -5.9332698583602905e-05, -5.0649046897888184e-05, -4.196539521217346e-05, -3.328174352645874e-05, -2.459809184074402e-05, -1.5914440155029297e-05, -7.230788469314575e-06, 1.4528632164001465e-06, 1.0136514902114868e-05, 1.882016658782959e-05, 2.750381827354431e-05, 3.618746995925903e-05, 4.4871121644973755e-05, 5.3554773330688477e-05, 6.22384250164032e-05, 7.092207670211792e-05, 7.960572838783264e-05, 8.828938007354736e-05, 9.697303175926208e-05, 0.0001056566834449768, 0.00011434033513069153, 0.00012302398681640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 14.0, 19.0, 35.0, 86.0, 187.0, 958.0, 88151.0, 954967.0, 3542.0, 319.0, 123.0, 71.0, 41.0, 25.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.354736328125, -0.346710205078125, -0.33868408203125, -0.330657958984375, -0.3226318359375, -0.314605712890625, -0.30657958984375, -0.298553466796875, -0.29052734375, -0.282501220703125, -0.27447509765625, -0.266448974609375, -0.2584228515625, -0.250396728515625, -0.24237060546875, -0.234344482421875, -0.226318359375, -0.218292236328125, -0.21026611328125, -0.202239990234375, -0.1942138671875, -0.186187744140625, -0.17816162109375, -0.170135498046875, -0.162109375, -0.154083251953125, -0.14605712890625, -0.138031005859375, -0.1300048828125, -0.121978759765625, -0.11395263671875, -0.105926513671875, -0.097900390625, -0.089874267578125, -0.08184814453125, -0.073822021484375, -0.0657958984375, -0.057769775390625, -0.04974365234375, -0.041717529296875, -0.03369140625, -0.025665283203125, -0.01763916015625, -0.009613037109375, -0.0015869140625, 0.006439208984375, 0.01446533203125, 0.022491455078125, 0.030517578125, 0.038543701171875, 0.04656982421875, 0.054595947265625, 0.0626220703125, 0.070648193359375, 0.07867431640625, 0.086700439453125, 0.0947265625, 0.102752685546875, 0.11077880859375, 0.118804931640625, 0.1268310546875, 0.134857177734375, 0.14288330078125, 0.150909423828125, 0.158935546875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 9.0, 13.0, 21.0, 20.0, 75.0, 175.0, 263.0, 222.0, 114.0, 49.0, 20.0, 15.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2851533889770508, -0.27953529357910156, -0.27391719818115234, -0.2682991027832031, -0.2626810073852539, -0.2570629119873047, -0.25144481658935547, -0.24582672119140625, -0.24020862579345703, -0.2345905303955078, -0.2289724349975586, -0.22335433959960938, -0.21773624420166016, -0.21211814880371094, -0.20650005340576172, -0.2008819580078125, -0.19526386260986328, -0.18964576721191406, -0.18402767181396484, -0.17840957641601562, -0.1727914810180664, -0.1671733856201172, -0.16155529022216797, -0.15593719482421875, -0.15031909942626953, -0.1447010040283203, -0.1390829086303711, -0.13346481323242188, -0.12784671783447266, -0.12222862243652344, -0.11661052703857422, -0.110992431640625, -0.10537433624267578, -0.09975624084472656, -0.09413814544677734, -0.08852005004882812, -0.0829019546508789, -0.07728385925292969, -0.07166576385498047, -0.06604766845703125, -0.06042957305908203, -0.05481147766113281, -0.049193382263183594, -0.043575286865234375, -0.037957191467285156, -0.03233909606933594, -0.02672100067138672, -0.0211029052734375, -0.015484809875488281, -0.009866714477539062, -0.004248619079589844, 0.001369476318359375, 0.006987571716308594, 0.012605667114257812, 0.01822376251220703, 0.02384185791015625, 0.02945995330810547, 0.03507804870605469, 0.040696144104003906, 0.046314239501953125, 0.051932334899902344, 0.05755043029785156, 0.06316852569580078, 0.06878662109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 16.0, 51.0, 289.0, 497.0, 109.0, 36.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4458900690078735, -1.3271595239639282, -1.2084288597106934, -1.089698314666748, -0.9709676504135132, -0.8522371053695679, -0.7335065007209778, -0.6147758960723877, -0.4960452914237976, -0.3773146867752075, -0.25858408212661743, -0.13985350728034973, -0.021122902631759644, 0.09760767221450806, 0.21633827686309814, 0.33506888151168823, 0.4537994861602783, 0.5725300908088684, 0.6912606954574585, 0.8099912405014038, 0.9287219047546387, 1.047452449798584, 1.1661829948425293, 1.2849136590957642, 1.403644323348999, 1.5223748683929443, 1.6411055326461792, 1.7598360776901245, 1.8785667419433594, 1.9972972869873047, 2.11602783203125, 2.2347583770751953, 2.3534891605377197, 2.472219705581665, 2.5909502506256104, 2.7096810340881348, 2.82841157913208, 2.9471421241760254, 3.0658726692199707, 3.184603214263916, 3.3033339977264404, 3.4220645427703857, 3.540795087814331, 3.6595258712768555, 3.778256416320801, 3.896986961364746, 4.015717506408691, 4.134448051452637, 4.253178596496582, 4.371909141540527, 4.490639686584473, 4.609370231628418, 4.728100776672363, 4.846831321716309, 4.965562343597412, 5.084292888641357, 5.203023433685303, 5.321753978729248, 5.440484523773193, 5.559215068817139, 5.677945613861084, 5.7966766357421875, 5.915407180786133, 6.034137725830078, 6.152868270874023]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 4.0, 14.0, 9.0, 20.0, 21.0, 29.0, 30.0, 29.0, 22.0, 23.0, 37.0, 40.0, 37.0, 35.0, 34.0, 51.0, 57.0, 39.0, 52.0, 58.0, 38.0, 41.0, 49.0, 35.0, 37.0, 27.0, 28.0, 21.0, 10.0, 12.0, 9.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.4333292245864868, -1.3927112817764282, -1.3520934581756592, -1.3114755153656006, -1.270857572555542, -1.2302396297454834, -1.1896216869354248, -1.1490038633346558, -1.1083859205245972, -1.0677679777145386, -1.0271501541137695, -0.9865322113037109, -0.9459142684936523, -0.9052963256835938, -0.8646784424781799, -0.8240605592727661, -0.7834426164627075, -0.7428246736526489, -0.7022067904472351, -0.6615889072418213, -0.6209709644317627, -0.5803530216217041, -0.5397351384162903, -0.4991172254085541, -0.45849931240081787, -0.41788139939308167, -0.37726348638534546, -0.33664557337760925, -0.29602766036987305, -0.25540974736213684, -0.21479183435440063, -0.17417392134666443, -0.13355612754821777, -0.09293821454048157, -0.05232030153274536, -0.011702388525009155, 0.02891552448272705, 0.06953343749046326, 0.11015135049819946, 0.15076926350593567, 0.19138717651367188, 0.23200508952140808, 0.2726230025291443, 0.3132409155368805, 0.3538588285446167, 0.3944767415523529, 0.4350946545600891, 0.4757125675678253, 0.5163304805755615, 0.5569484233856201, 0.5975663065910339, 0.6381841897964478, 0.6788021326065063, 0.7194200754165649, 0.7600379586219788, 0.8006558418273926, 0.8412737846374512, 0.8818917274475098, 0.9225096106529236, 0.9631274938583374, 1.003745436668396, 1.0443633794784546, 1.0849812030792236, 1.1255991458892822, 1.1662170886993408]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 0.0, 1.0, 8.0, 2.0, 4.0, 3.0, 9.0, 7.0, 14.0, 9.0, 15.0, 17.0, 21.0, 32.0, 40.0, 55.0, 72.0, 86.0, 142.0, 178.0, 336.0, 493.0, 1107.0, 2482.0, 7372.0, 31182.0, 627146.0, 3462332.0, 46805.0, 9338.0, 2823.0, 1070.0, 482.0, 275.0, 131.0, 79.0, 33.0, 35.0, 13.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.35498046875, -0.3471088409423828, -0.3392372131347656, -0.33136558532714844, -0.32349395751953125, -0.31562232971191406, -0.3077507019042969, -0.2998790740966797, -0.2920074462890625, -0.2841358184814453, -0.2762641906738281, -0.26839256286621094, -0.26052093505859375, -0.25264930725097656, -0.24477767944335938, -0.2369060516357422, -0.229034423828125, -0.2211627960205078, -0.21329116821289062, -0.20541954040527344, -0.19754791259765625, -0.18967628479003906, -0.18180465698242188, -0.1739330291748047, -0.1660614013671875, -0.1581897735595703, -0.15031814575195312, -0.14244651794433594, -0.13457489013671875, -0.12670326232910156, -0.11883163452148438, -0.11096000671386719, -0.10308837890625, -0.09521675109863281, -0.08734512329101562, -0.07947349548339844, -0.07160186767578125, -0.06373023986816406, -0.055858612060546875, -0.04798698425292969, -0.0401153564453125, -0.03224372863769531, -0.024372100830078125, -0.016500473022460938, -0.00862884521484375, -0.0007572174072265625, 0.007114410400390625, 0.014986038208007812, 0.022857666015625, 0.030729293823242188, 0.038600921630859375, 0.04647254943847656, 0.05434417724609375, 0.06221580505371094, 0.07008743286132812, 0.07795906066894531, 0.0858306884765625, 0.09370231628417969, 0.10157394409179688, 0.10944557189941406, 0.11731719970703125, 0.12518882751464844, 0.13306045532226562, 0.1409320831298828, 0.1488037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 8.0, 12.0, 29.0, 47.0, 78.0, 80.0, 100.0, 123.0, 121.0, 120.0, 110.0, 65.0, 53.0, 26.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.1969614028930664, -0.1923847198486328, -0.18780803680419922, -0.18323135375976562, -0.17865467071533203, -0.17407798767089844, -0.16950130462646484, -0.16492462158203125, -0.16034793853759766, -0.15577125549316406, -0.15119457244873047, -0.14661788940429688, -0.14204120635986328, -0.1374645233154297, -0.1328878402709961, -0.1283111572265625, -0.1237344741821289, -0.11915779113769531, -0.11458110809326172, -0.11000442504882812, -0.10542774200439453, -0.10085105895996094, -0.09627437591552734, -0.09169769287109375, -0.08712100982666016, -0.08254432678222656, -0.07796764373779297, -0.07339096069335938, -0.06881427764892578, -0.06423759460449219, -0.059660911560058594, -0.055084228515625, -0.050507545471191406, -0.04593086242675781, -0.04135417938232422, -0.036777496337890625, -0.03220081329345703, -0.027624130249023438, -0.023047447204589844, -0.01847076416015625, -0.013894081115722656, -0.009317398071289062, -0.004740715026855469, -0.000164031982421875, 0.004412651062011719, 0.008989334106445312, 0.013566017150878906, 0.0181427001953125, 0.022719383239746094, 0.027296066284179688, 0.03187274932861328, 0.036449432373046875, 0.04102611541748047, 0.04560279846191406, 0.050179481506347656, 0.05475616455078125, 0.059332847595214844, 0.06390953063964844, 0.06848621368408203, 0.07306289672851562, 0.07763957977294922, 0.08221626281738281, 0.0867929458618164, 0.09136962890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 12.0, 8.0, 23.0, 24.0, 31.0, 71.0, 156.0, 339.0, 877.0, 2361.0, 7894.0, 52221.0, 3983862.0, 129421.0, 11767.0, 3139.0, 1112.0, 506.0, 206.0, 118.0, 43.0, 28.0, 16.0, 11.0, 4.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.2284717559814453, -0.22049331665039062, -0.21251487731933594, -0.20453643798828125, -0.19655799865722656, -0.18857955932617188, -0.1806011199951172, -0.1726226806640625, -0.1646442413330078, -0.15666580200195312, -0.14868736267089844, -0.14070892333984375, -0.13273048400878906, -0.12475204467773438, -0.11677360534667969, -0.108795166015625, -0.10081672668457031, -0.09283828735351562, -0.08485984802246094, -0.07688140869140625, -0.06890296936035156, -0.060924530029296875, -0.05294609069824219, -0.0449676513671875, -0.03698921203613281, -0.029010772705078125, -0.021032333374023438, -0.01305389404296875, -0.0050754547119140625, 0.002902984619140625, 0.010881423950195312, 0.01885986328125, 0.026838302612304688, 0.034816741943359375, 0.04279518127441406, 0.05077362060546875, 0.05875205993652344, 0.06673049926757812, 0.07470893859863281, 0.0826873779296875, 0.09066581726074219, 0.09864425659179688, 0.10662269592285156, 0.11460113525390625, 0.12257957458496094, 0.13055801391601562, 0.1385364532470703, 0.146514892578125, 0.1544933319091797, 0.16247177124023438, 0.17045021057128906, 0.17842864990234375, 0.18640708923339844, 0.19438552856445312, 0.2023639678955078, 0.2103424072265625, 0.2183208465576172, 0.22629928588867188, 0.23427772521972656, 0.24225616455078125, 0.25023460388183594, 0.2582130432128906, 0.2661914825439453, 0.274169921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 12.0, 13.0, 15.0, 25.0, 42.0, 81.0, 137.0, 648.0, 2427.0, 360.0, 134.0, 64.0, 25.0, 26.0, 11.0, 10.0, 4.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.0873250961303711, -0.08444023132324219, -0.08155536651611328, -0.07867050170898438, -0.07578563690185547, -0.07290077209472656, -0.07001590728759766, -0.06713104248046875, -0.06424617767333984, -0.06136131286621094, -0.05847644805908203, -0.055591583251953125, -0.05270671844482422, -0.04982185363769531, -0.046936988830566406, -0.0440521240234375, -0.041167259216308594, -0.03828239440917969, -0.03539752960205078, -0.032512664794921875, -0.02962779998779297, -0.026742935180664062, -0.023858070373535156, -0.02097320556640625, -0.018088340759277344, -0.015203475952148438, -0.012318611145019531, -0.009433746337890625, -0.006548881530761719, -0.0036640167236328125, -0.0007791519165039062, 0.002105712890625, 0.004990577697753906, 0.007875442504882812, 0.010760307312011719, 0.013645172119140625, 0.01653003692626953, 0.019414901733398438, 0.022299766540527344, 0.02518463134765625, 0.028069496154785156, 0.030954360961914062, 0.03383922576904297, 0.036724090576171875, 0.03960895538330078, 0.04249382019042969, 0.045378684997558594, 0.0482635498046875, 0.051148414611816406, 0.05403327941894531, 0.05691814422607422, 0.059803009033203125, 0.06268787384033203, 0.06557273864746094, 0.06845760345458984, 0.07134246826171875, 0.07422733306884766, 0.07711219787597656, 0.07999706268310547, 0.08288192749023438, 0.08576679229736328, 0.08865165710449219, 0.0915365219116211, 0.09442138671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 55.0, 261.0, 459.0, 167.0, 33.0, 12.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32473528385162354, -0.29798340797424316, -0.2712315618991852, -0.244479700922966, -0.21772783994674683, -0.19097597897052765, -0.16422411799430847, -0.1374722570180893, -0.11072039604187012, -0.08396853506565094, -0.05721667408943176, -0.030464813113212585, -0.003712952136993408, 0.02303890883922577, 0.049790769815444946, 0.07654263079166412, 0.1032944917678833, 0.13004635274410248, 0.15679821372032166, 0.18355007469654083, 0.21030193567276, 0.2370537966489792, 0.26380565762519836, 0.29055750370025635, 0.3173093795776367, 0.3440612554550171, 0.3708131015300751, 0.39756494760513306, 0.4243168234825134, 0.4510686993598938, 0.4778205454349518, 0.5045723915100098, 0.5313242673873901, 0.5580761432647705, 0.5848280191421509, 0.6115798354148865, 0.6383317112922668, 0.6650835871696472, 0.6918354034423828, 0.7185872793197632, 0.7453391551971436, 0.7720910310745239, 0.7988429069519043, 0.8255947232246399, 0.8523465991020203, 0.8790984749794006, 0.9058502912521362, 0.9326021671295166, 0.959354043006897, 0.9861059188842773, 1.0128577947616577, 1.039609670639038, 1.066361427307129, 1.0931133031845093, 1.1198651790618896, 1.14661705493927, 1.1733689308166504, 1.2001208066940308, 1.2268726825714111, 1.2536245584487915, 1.2803764343261719, 1.3071281909942627, 1.333880066871643, 1.3606319427490234, 1.3873838186264038]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 9.0, 4.0, 6.0, 9.0, 13.0, 9.0, 20.0, 23.0, 29.0, 29.0, 20.0, 44.0, 35.0, 44.0, 46.0, 47.0, 56.0, 48.0, 44.0, 42.0, 41.0, 54.0, 29.0, 46.0, 40.0, 30.0, 25.0, 22.0, 21.0, 13.0, 23.0, 15.0, 7.0, 8.0, 9.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.21170544624328613, -0.20439811050891876, -0.1970907747745514, -0.18978342413902283, -0.18247608840465546, -0.17516875267028809, -0.16786141693592072, -0.16055408120155334, -0.15324673056602478, -0.1459393948316574, -0.13863205909729004, -0.13132470846176147, -0.1240173727273941, -0.11671003699302673, -0.10940270125865936, -0.10209536552429199, -0.09478802978992462, -0.08748069405555725, -0.08017335087060928, -0.07286601513624191, -0.06555867195129395, -0.058251336216926575, -0.050944000482559204, -0.043636661022901535, -0.036329321563243866, -0.029021982103586197, -0.021714644506573677, -0.014407306909561157, -0.007099967449903488, 0.0002073720097541809, 0.0075147077441215515, 0.01482204720377922, 0.02212938666343689, 0.02943672612309456, 0.03674406558275223, 0.0440514013171196, 0.05135874077677727, 0.058666080236434937, 0.06597341597080231, 0.07328075170516968, 0.08058809489011765, 0.08789543062448502, 0.09520277380943298, 0.10251010954380035, 0.10981744527816772, 0.11712478846311569, 0.12443212419748306, 0.13173946738243103, 0.1390468031167984, 0.14635413885116577, 0.15366147458553314, 0.1609688103199005, 0.16827616095542908, 0.17558349668979645, 0.18289083242416382, 0.1901981681585312, 0.19750550389289856, 0.20481283962726593, 0.2121201753616333, 0.21942752599716187, 0.22673486173152924, 0.2340421974658966, 0.24134953320026398, 0.24865686893463135, 0.2559642195701599]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 27.0, 13.0, 15.0, 25.0, 34.0, 76.0, 74.0, 121.0, 216.0, 342.0, 711.0, 1839.0, 6566.0, 34943.0, 345368.0, 588396.0, 55990.0, 9270.0, 2515.0, 913.0, 426.0, 217.0, 145.0, 84.0, 56.0, 34.0, 33.0, 28.0, 9.0, 9.0, 9.0, 6.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23150634765625, -0.2222900390625, -0.21307373046875, -0.203857421875, -0.19464111328125, -0.1854248046875, -0.17620849609375, -0.1669921875, -0.15777587890625, -0.1485595703125, -0.13934326171875, -0.130126953125, -0.12091064453125, -0.1116943359375, -0.10247802734375, -0.09326171875, -0.08404541015625, -0.0748291015625, -0.06561279296875, -0.056396484375, -0.04718017578125, -0.0379638671875, -0.02874755859375, -0.01953125, -0.01031494140625, -0.0010986328125, 0.00811767578125, 0.017333984375, 0.02655029296875, 0.0357666015625, 0.04498291015625, 0.05419921875, 0.06341552734375, 0.0726318359375, 0.08184814453125, 0.091064453125, 0.10028076171875, 0.1094970703125, 0.11871337890625, 0.1279296875, 0.13714599609375, 0.1463623046875, 0.15557861328125, 0.164794921875, 0.17401123046875, 0.1832275390625, 0.19244384765625, 0.20166015625, 0.21087646484375, 0.2200927734375, 0.22930908203125, 0.238525390625, 0.24774169921875, 0.2569580078125, 0.26617431640625, 0.275390625, 0.28460693359375, 0.2938232421875, 0.30303955078125, 0.312255859375, 0.32147216796875, 0.3306884765625, 0.33990478515625, 0.34912109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 17.0, 37.0, 37.0, 67.0, 81.0, 98.0, 115.0, 139.0, 111.0, 105.0, 73.0, 51.0, 35.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18673419952392578, -0.18230628967285156, -0.17787837982177734, -0.17345046997070312, -0.1690225601196289, -0.1645946502685547, -0.16016674041748047, -0.15573883056640625, -0.15131092071533203, -0.1468830108642578, -0.1424551010131836, -0.13802719116210938, -0.13359928131103516, -0.12917137145996094, -0.12474346160888672, -0.1203155517578125, -0.11588764190673828, -0.11145973205566406, -0.10703182220458984, -0.10260391235351562, -0.0981760025024414, -0.09374809265136719, -0.08932018280029297, -0.08489227294921875, -0.08046436309814453, -0.07603645324707031, -0.0716085433959961, -0.06718063354492188, -0.06275272369384766, -0.05832481384277344, -0.05389690399169922, -0.049468994140625, -0.04504108428955078, -0.04061317443847656, -0.036185264587402344, -0.031757354736328125, -0.027329444885253906, -0.022901535034179688, -0.01847362518310547, -0.01404571533203125, -0.009617805480957031, -0.0051898956298828125, -0.0007619857788085938, 0.003665924072265625, 0.008093833923339844, 0.012521743774414062, 0.01694965362548828, 0.0213775634765625, 0.02580547332763672, 0.030233383178710938, 0.034661293029785156, 0.039089202880859375, 0.043517112731933594, 0.04794502258300781, 0.05237293243408203, 0.05680084228515625, 0.06122875213623047, 0.06565666198730469, 0.0700845718383789, 0.07451248168945312, 0.07894039154052734, 0.08336830139160156, 0.08779621124267578, 0.09222412109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 8.0, 5.0, 12.0, 8.0, 20.0, 22.0, 29.0, 34.0, 37.0, 56.0, 70.0, 82.0, 106.0, 131.0, 201.0, 318.0, 574.0, 1164.0, 2380.0, 5627.0, 13819.0, 37207.0, 115464.0, 426185.0, 314018.0, 83049.0, 28068.0, 10952.0, 4478.0, 1939.0, 943.0, 527.0, 311.0, 180.0, 106.0, 83.0, 78.0, 57.0, 42.0, 45.0, 25.0, 25.0, 25.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.127197265625, -0.12320518493652344, -0.11921310424804688, -0.11522102355957031, -0.11122894287109375, -0.10723686218261719, -0.10324478149414062, -0.09925270080566406, -0.0952606201171875, -0.09126853942871094, -0.08727645874023438, -0.08328437805175781, -0.07929229736328125, -0.07530021667480469, -0.07130813598632812, -0.06731605529785156, -0.063323974609375, -0.05933189392089844, -0.055339813232421875, -0.05134773254394531, -0.04735565185546875, -0.04336357116699219, -0.039371490478515625, -0.03537940979003906, -0.0313873291015625, -0.027395248413085938, -0.023403167724609375, -0.019411087036132812, -0.01541900634765625, -0.011426925659179688, -0.007434844970703125, -0.0034427642822265625, 0.00054931640625, 0.0045413970947265625, 0.008533477783203125, 0.012525558471679688, 0.01651763916015625, 0.020509719848632812, 0.024501800537109375, 0.028493881225585938, 0.0324859619140625, 0.03647804260253906, 0.040470123291015625, 0.04446220397949219, 0.04845428466796875, 0.05244636535644531, 0.056438446044921875, 0.06043052673339844, 0.064422607421875, 0.06841468811035156, 0.07240676879882812, 0.07639884948730469, 0.08039093017578125, 0.08438301086425781, 0.08837509155273438, 0.09236717224121094, 0.0963592529296875, 0.10035133361816406, 0.10434341430664062, 0.10833549499511719, 0.11232757568359375, 0.11631965637207031, 0.12031173706054688, 0.12430381774902344, 0.1282958984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 13.0, 6.0, 16.0, 21.0, 20.0, 17.0, 16.0, 30.0, 37.0, 20.0, 30.0, 24.0, 48.0, 35.0, 34.0, 28.0, 41.0, 33.0, 40.0, 39.0, 36.0, 38.0, 35.0, 28.0, 37.0, 30.0, 32.0, 27.0, 23.0, 11.0, 23.0, 14.0, 12.0, 13.0, 10.0, 2.0, 12.0, 13.0, 7.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18722152709960938, -0.18132781982421875, -0.17543411254882812, -0.1695404052734375, -0.16364669799804688, -0.15775299072265625, -0.15185928344726562, -0.145965576171875, -0.14007186889648438, -0.13417816162109375, -0.12828445434570312, -0.1223907470703125, -0.11649703979492188, -0.11060333251953125, -0.10470962524414062, -0.09881591796875, -0.09292221069335938, -0.08702850341796875, -0.08113479614257812, -0.0752410888671875, -0.06934738159179688, -0.06345367431640625, -0.057559967041015625, -0.051666259765625, -0.045772552490234375, -0.03987884521484375, -0.033985137939453125, -0.0280914306640625, -0.022197723388671875, -0.01630401611328125, -0.010410308837890625, -0.0045166015625, 0.001377105712890625, 0.00727081298828125, 0.013164520263671875, 0.0190582275390625, 0.024951934814453125, 0.03084564208984375, 0.036739349365234375, 0.042633056640625, 0.048526763916015625, 0.05442047119140625, 0.060314178466796875, 0.0662078857421875, 0.07210159301757812, 0.07799530029296875, 0.08388900756835938, 0.08978271484375, 0.09567642211914062, 0.10157012939453125, 0.10746383666992188, 0.1133575439453125, 0.11925125122070312, 0.12514495849609375, 0.13103866577148438, 0.136932373046875, 0.14282608032226562, 0.14871978759765625, 0.15461349487304688, 0.1605072021484375, 0.16640090942382812, 0.17229461669921875, 0.17818832397460938, 0.18408203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 23.0, 25.0, 32.0, 71.0, 106.0, 206.0, 394.0, 769.0, 1757.0, 4843.0, 20293.0, 244252.0, 703290.0, 58143.0, 9139.0, 2803.0, 1160.0, 549.0, 275.0, 168.0, 89.0, 38.0, 38.0, 17.0, 10.0, 15.0, 2.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0733642578125, -0.07085609436035156, -0.06834793090820312, -0.06583976745605469, -0.06333160400390625, -0.06082344055175781, -0.058315277099609375, -0.05580711364746094, -0.0532989501953125, -0.05079078674316406, -0.048282623291015625, -0.04577445983886719, -0.04326629638671875, -0.04075813293457031, -0.038249969482421875, -0.03574180603027344, -0.033233642578125, -0.030725479125976562, -0.028217315673828125, -0.025709152221679688, -0.02320098876953125, -0.020692825317382812, -0.018184661865234375, -0.015676498413085938, -0.0131683349609375, -0.010660171508789062, -0.008152008056640625, -0.0056438446044921875, -0.00313568115234375, -0.0006275177001953125, 0.001880645751953125, 0.0043888092041015625, 0.00689697265625, 0.009405136108398438, 0.011913299560546875, 0.014421463012695312, 0.01692962646484375, 0.019437789916992188, 0.021945953369140625, 0.024454116821289062, 0.0269622802734375, 0.029470443725585938, 0.031978607177734375, 0.03448677062988281, 0.03699493408203125, 0.03950309753417969, 0.042011260986328125, 0.04451942443847656, 0.047027587890625, 0.04953575134277344, 0.052043914794921875, 0.05455207824707031, 0.05706024169921875, 0.05956840515136719, 0.062076568603515625, 0.06458473205566406, 0.0670928955078125, 0.06960105895996094, 0.07210922241210938, 0.07461738586425781, 0.07712554931640625, 0.07963371276855469, 0.08214187622070312, 0.08465003967285156, 0.087158203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 6.0, 20.0, 14.0, 15.0, 19.0, 35.0, 37.0, 68.0, 70.0, 108.0, 107.0, 104.0, 75.0, 71.0, 43.0, 40.0, 26.0, 22.0, 16.0, 22.0, 8.0, 8.0, 11.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00011348724365234375, -0.00011000689119100571, -0.00010652653872966766, -0.00010304618626832962, -9.956583380699158e-05, -9.608548134565353e-05, -9.260512888431549e-05, -8.912477642297745e-05, -8.56444239616394e-05, -8.216407150030136e-05, -7.868371903896332e-05, -7.520336657762527e-05, -7.172301411628723e-05, -6.824266165494919e-05, -6.476230919361115e-05, -6.12819567322731e-05, -5.780160427093506e-05, -5.4321251809597015e-05, -5.084089934825897e-05, -4.736054688692093e-05, -4.3880194425582886e-05, -4.039984196424484e-05, -3.69194895029068e-05, -3.3439137041568756e-05, -2.9958784580230713e-05, -2.647843211889267e-05, -2.2998079657554626e-05, -1.9517727196216583e-05, -1.603737473487854e-05, -1.2557022273540497e-05, -9.076669812202454e-06, -5.59631735086441e-06, -2.115964889526367e-06, 1.364387571811676e-06, 4.844740033149719e-06, 8.325092494487762e-06, 1.1805444955825806e-05, 1.528579741716385e-05, 1.8766149878501892e-05, 2.2246502339839935e-05, 2.572685480117798e-05, 2.9207207262516022e-05, 3.2687559723854065e-05, 3.616791218519211e-05, 3.964826464653015e-05, 4.3128617107868195e-05, 4.660896956920624e-05, 5.008932203054428e-05, 5.3569674491882324e-05, 5.705002695322037e-05, 6.053037941455841e-05, 6.401073187589645e-05, 6.74910843372345e-05, 7.097143679857254e-05, 7.445178925991058e-05, 7.793214172124863e-05, 8.141249418258667e-05, 8.489284664392471e-05, 8.837319910526276e-05, 9.18535515666008e-05, 9.533390402793884e-05, 9.881425648927689e-05, 0.00010229460895061493, 0.00010577496141195297, 0.00010925531387329102]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 9.0, 14.0, 24.0, 14.0, 43.0, 55.0, 81.0, 149.0, 266.0, 531.0, 1192.0, 2987.0, 10243.0, 60028.0, 552983.0, 370827.0, 37256.0, 7405.0, 2415.0, 962.0, 450.0, 226.0, 135.0, 76.0, 36.0, 38.0, 23.0, 25.0, 20.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0819091796875, -0.07968854904174805, -0.0774679183959961, -0.07524728775024414, -0.07302665710449219, -0.07080602645874023, -0.06858539581298828, -0.06636476516723633, -0.06414413452148438, -0.06192350387573242, -0.05970287322998047, -0.057482242584228516, -0.05526161193847656, -0.05304098129272461, -0.050820350646972656, -0.0485997200012207, -0.04637908935546875, -0.0441584587097168, -0.041937828063964844, -0.03971719741821289, -0.03749656677246094, -0.035275936126708984, -0.03305530548095703, -0.030834674835205078, -0.028614044189453125, -0.026393413543701172, -0.02417278289794922, -0.021952152252197266, -0.019731521606445312, -0.01751089096069336, -0.015290260314941406, -0.013069629669189453, -0.0108489990234375, -0.008628368377685547, -0.006407737731933594, -0.004187107086181641, -0.0019664764404296875, 0.0002541542053222656, 0.0024747848510742188, 0.004695415496826172, 0.006916046142578125, 0.009136676788330078, 0.011357307434082031, 0.013577938079833984, 0.015798568725585938, 0.01801919937133789, 0.020239830017089844, 0.022460460662841797, 0.02468109130859375, 0.026901721954345703, 0.029122352600097656, 0.03134298324584961, 0.03356361389160156, 0.035784244537353516, 0.03800487518310547, 0.04022550582885742, 0.042446136474609375, 0.04466676712036133, 0.04688739776611328, 0.049108028411865234, 0.05132865905761719, 0.05354928970336914, 0.055769920349121094, 0.05799055099487305, 0.060211181640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 14.0, 13.0, 34.0, 37.0, 50.0, 91.0, 99.0, 96.0, 119.0, 107.0, 95.0, 66.0, 41.0, 26.0, 33.0, 28.0, 9.0, 9.0, 9.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.09991455078125, -0.09750843048095703, -0.09510231018066406, -0.0926961898803711, -0.09029006958007812, -0.08788394927978516, -0.08547782897949219, -0.08307170867919922, -0.08066558837890625, -0.07825946807861328, -0.07585334777832031, -0.07344722747802734, -0.07104110717773438, -0.0686349868774414, -0.06622886657714844, -0.06382274627685547, -0.0614166259765625, -0.05901050567626953, -0.05660438537597656, -0.054198265075683594, -0.051792144775390625, -0.049386024475097656, -0.04697990417480469, -0.04457378387451172, -0.04216766357421875, -0.03976154327392578, -0.03735542297363281, -0.034949302673339844, -0.032543182373046875, -0.030137062072753906, -0.027730941772460938, -0.02532482147216797, -0.022918701171875, -0.02051258087158203, -0.018106460571289062, -0.015700340270996094, -0.013294219970703125, -0.010888099670410156, -0.008481979370117188, -0.006075859069824219, -0.00366973876953125, -0.0012636184692382812, 0.0011425018310546875, 0.0035486221313476562, 0.005954742431640625, 0.008360862731933594, 0.010766983032226562, 0.013173103332519531, 0.0155792236328125, 0.01798534393310547, 0.020391464233398438, 0.022797584533691406, 0.025203704833984375, 0.027609825134277344, 0.030015945434570312, 0.03242206573486328, 0.03482818603515625, 0.03723430633544922, 0.03964042663574219, 0.042046546936035156, 0.044452667236328125, 0.046858787536621094, 0.04926490783691406, 0.05167102813720703, 0.0540771484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 29.0, 245.0, 570.0, 125.0, 26.0, 9.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.828999996185303, -6.695713043212891, -6.56242561340332, -6.429138660430908, -6.295851230621338, -6.162564277648926, -6.0292768478393555, -5.895989894866943, -5.762702941894531, -5.629415988922119, -5.496128559112549, -5.362841606140137, -5.229554176330566, -5.096267223358154, -4.962980270385742, -4.829692840576172, -4.696405410766602, -4.5631184577941895, -4.429831027984619, -4.296544075012207, -4.163256645202637, -4.029969692230225, -3.8966825008392334, -3.763395309448242, -3.63010835647583, -3.496821165084839, -3.3635339736938477, -3.2302470207214355, -3.0969598293304443, -2.963672637939453, -2.830385446548462, -2.6970982551574707, -2.5638108253479004, -2.430523633956909, -2.297236442565918, -2.163949489593506, -2.0306622982025146, -1.8973751068115234, -1.7640879154205322, -1.630800724029541, -1.497513771057129, -1.3642265796661377, -1.230939507484436, -1.0976523160934448, -0.9643651843070984, -0.831078052520752, -0.6977908611297607, -0.5645037293434143, -0.43121659755706787, -0.29792946577072144, -0.1646423041820526, -0.03135514259338379, 0.10193198919296265, 0.23521912097930908, 0.3685063123703003, 0.5017934441566467, 0.6350805759429932, 0.7683677077293396, 0.901654839515686, 1.0349420309066772, 1.168229103088379, 1.3015162944793701, 1.4348034858703613, 1.5680906772613525, 1.7013777494430542]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 6.0, 9.0, 10.0, 14.0, 18.0, 21.0, 24.0, 21.0, 35.0, 34.0, 34.0, 38.0, 33.0, 33.0, 35.0, 42.0, 49.0, 43.0, 50.0, 45.0, 42.0, 38.0, 36.0, 32.0, 29.0, 18.0, 25.0, 27.0, 20.0, 19.0, 23.0, 14.0, 16.0, 8.0, 11.0, 8.0, 4.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0462589263916016, -1.0107876062393188, -0.9753163456916809, -0.939845085144043, -0.9043737649917603, -0.8689024448394775, -0.8334311842918396, -0.7979599237442017, -0.762488603591919, -0.7270172834396362, -0.6915460228919983, -0.6560747623443604, -0.6206034421920776, -0.5851321220397949, -0.549660861492157, -0.514189600944519, -0.47871828079223633, -0.443246990442276, -0.4077757000923157, -0.37230440974235535, -0.336833119392395, -0.3013618290424347, -0.26589053869247437, -0.23041924834251404, -0.1949479579925537, -0.15947666764259338, -0.12400537729263306, -0.08853408694267273, -0.0530627965927124, -0.017591506242752075, 0.017879784107208252, 0.05335107445716858, 0.08882224559783936, 0.12429353594779968, 0.15976482629776, 0.19523611664772034, 0.23070740699768066, 0.266178697347641, 0.3016499876976013, 0.33712127804756165, 0.372592568397522, 0.4080638587474823, 0.4435351490974426, 0.47900643944740295, 0.5144777297973633, 0.549949049949646, 0.5854203104972839, 0.6208915710449219, 0.6563628911972046, 0.6918342113494873, 0.7273054718971252, 0.7627767324447632, 0.7982480525970459, 0.8337193727493286, 0.8691906332969666, 0.9046618938446045, 0.9401332139968872, 0.9756045341491699, 1.011075735092163, 1.0465470552444458, 1.0820183753967285, 1.1174896955490112, 1.152961015701294, 1.188432216644287, 1.2239035367965698]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 10.0, 10.0, 22.0, 23.0, 28.0, 40.0, 52.0, 79.0, 146.0, 242.0, 518.0, 1190.0, 3286.0, 12614.0, 96002.0, 3967201.0, 95484.0, 12129.0, 3224.0, 1097.0, 448.0, 204.0, 94.0, 60.0, 22.0, 18.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4305419921875, -0.420166015625, -0.4097900390625, -0.3994140625, -0.3890380859375, -0.378662109375, -0.3682861328125, -0.35791015625, -0.3475341796875, -0.337158203125, -0.3267822265625, -0.31640625, -0.3060302734375, -0.295654296875, -0.2852783203125, -0.27490234375, -0.2645263671875, -0.254150390625, -0.2437744140625, -0.2333984375, -0.2230224609375, -0.212646484375, -0.2022705078125, -0.19189453125, -0.1815185546875, -0.171142578125, -0.1607666015625, -0.150390625, -0.1400146484375, -0.129638671875, -0.1192626953125, -0.10888671875, -0.0985107421875, -0.088134765625, -0.0777587890625, -0.0673828125, -0.0570068359375, -0.046630859375, -0.0362548828125, -0.02587890625, -0.0155029296875, -0.005126953125, 0.0052490234375, 0.015625, 0.0260009765625, 0.036376953125, 0.0467529296875, 0.05712890625, 0.0675048828125, 0.077880859375, 0.0882568359375, 0.0986328125, 0.1090087890625, 0.119384765625, 0.1297607421875, 0.14013671875, 0.1505126953125, 0.160888671875, 0.1712646484375, 0.181640625, 0.1920166015625, 0.202392578125, 0.2127685546875, 0.22314453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 14.0, 18.0, 35.0, 49.0, 63.0, 80.0, 78.0, 114.0, 107.0, 90.0, 87.0, 94.0, 57.0, 44.0, 26.0, 17.0, 7.0, 6.0, 6.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.1780719757080078, -0.17377090454101562, -0.16946983337402344, -0.16516876220703125, -0.16086769104003906, -0.15656661987304688, -0.1522655487060547, -0.1479644775390625, -0.1436634063720703, -0.13936233520507812, -0.13506126403808594, -0.13076019287109375, -0.12645912170410156, -0.12215805053710938, -0.11785697937011719, -0.113555908203125, -0.10925483703613281, -0.10495376586914062, -0.10065269470214844, -0.09635162353515625, -0.09205055236816406, -0.08774948120117188, -0.08344841003417969, -0.0791473388671875, -0.07484626770019531, -0.07054519653320312, -0.06624412536621094, -0.06194305419921875, -0.05764198303222656, -0.053340911865234375, -0.04903984069824219, -0.04473876953125, -0.04043769836425781, -0.036136627197265625, -0.03183555603027344, -0.02753448486328125, -0.023233413696289062, -0.018932342529296875, -0.014631271362304688, -0.0103302001953125, -0.0060291290283203125, -0.001728057861328125, 0.0025730133056640625, 0.00687408447265625, 0.011175155639648438, 0.015476226806640625, 0.019777297973632812, 0.024078369140625, 0.028379440307617188, 0.032680511474609375, 0.03698158264160156, 0.04128265380859375, 0.04558372497558594, 0.049884796142578125, 0.05418586730957031, 0.0584869384765625, 0.06278800964355469, 0.06708908081054688, 0.07139015197753906, 0.07569122314453125, 0.07999229431152344, 0.08429336547851562, 0.08859443664550781, 0.0928955078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 20.0, 21.0, 33.0, 56.0, 87.0, 183.0, 388.0, 1158.0, 4386.0, 21449.0, 587428.0, 3539031.0, 31787.0, 5737.0, 1552.0, 468.0, 187.0, 101.0, 63.0, 42.0, 33.0, 17.0, 15.0, 12.0, 3.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24746322631835938, -0.23833465576171875, -0.22920608520507812, -0.2200775146484375, -0.21094894409179688, -0.20182037353515625, -0.19269180297851562, -0.183563232421875, -0.17443466186523438, -0.16530609130859375, -0.15617752075195312, -0.1470489501953125, -0.13792037963867188, -0.12879180908203125, -0.11966323852539062, -0.11053466796875, -0.10140609741210938, -0.09227752685546875, -0.08314895629882812, -0.0740203857421875, -0.06489181518554688, -0.05576324462890625, -0.046634674072265625, -0.037506103515625, -0.028377532958984375, -0.01924896240234375, -0.010120391845703125, -0.0009918212890625, 0.008136749267578125, 0.01726531982421875, 0.026393890380859375, 0.0355224609375, 0.044651031494140625, 0.05377960205078125, 0.06290817260742188, 0.0720367431640625, 0.08116531372070312, 0.09029388427734375, 0.09942245483398438, 0.108551025390625, 0.11767959594726562, 0.12680816650390625, 0.13593673706054688, 0.1450653076171875, 0.15419387817382812, 0.16332244873046875, 0.17245101928710938, 0.18157958984375, 0.19070816040039062, 0.19983673095703125, 0.20896530151367188, 0.2180938720703125, 0.22722244262695312, 0.23635101318359375, 0.24547958374023438, 0.254608154296875, 0.2637367248535156, 0.27286529541015625, 0.2819938659667969, 0.2911224365234375, 0.3002510070800781, 0.30937957763671875, 0.3185081481933594, 0.32763671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 6.0, 8.0, 12.0, 29.0, 48.0, 67.0, 145.0, 400.0, 2549.0, 540.0, 129.0, 56.0, 26.0, 21.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09259033203125, -0.0878610610961914, -0.08313179016113281, -0.07840251922607422, -0.07367324829101562, -0.06894397735595703, -0.06421470642089844, -0.059485435485839844, -0.05475616455078125, -0.050026893615722656, -0.04529762268066406, -0.04056835174560547, -0.035839080810546875, -0.03110980987548828, -0.026380538940429688, -0.021651268005371094, -0.0169219970703125, -0.012192726135253906, -0.0074634552001953125, -0.0027341842651367188, 0.001995086669921875, 0.006724357604980469, 0.011453628540039062, 0.016182899475097656, 0.02091217041015625, 0.025641441345214844, 0.030370712280273438, 0.03509998321533203, 0.039829254150390625, 0.04455852508544922, 0.04928779602050781, 0.054017066955566406, 0.058746337890625, 0.0634756088256836, 0.06820487976074219, 0.07293415069580078, 0.07766342163085938, 0.08239269256591797, 0.08712196350097656, 0.09185123443603516, 0.09658050537109375, 0.10130977630615234, 0.10603904724121094, 0.11076831817626953, 0.11549758911132812, 0.12022686004638672, 0.12495613098144531, 0.1296854019165039, 0.1344146728515625, 0.1391439437866211, 0.1438732147216797, 0.14860248565673828, 0.15333175659179688, 0.15806102752685547, 0.16279029846191406, 0.16751956939697266, 0.17224884033203125, 0.17697811126708984, 0.18170738220214844, 0.18643665313720703, 0.19116592407226562, 0.19589519500732422, 0.2006244659423828, 0.2053537368774414, 0.2100830078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 22.0, 110.0, 476.0, 316.0, 55.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0404784679412842, -0.9969796538352966, -0.9534808397293091, -0.9099820852279663, -0.866483211517334, -0.8229844570159912, -0.7794856429100037, -0.7359868288040161, -0.6924880146980286, -0.648989200592041, -0.6054903864860535, -0.5619915723800659, -0.5184928178787231, -0.4749939739704132, -0.43149518966674805, -0.3879963755607605, -0.34449756145477295, -0.3009987473487854, -0.25749993324279785, -0.2140011489391327, -0.17050233483314514, -0.1270035207271576, -0.08350473642349243, -0.04000592231750488, 0.003492891788482666, 0.04699169844388962, 0.09049050509929657, 0.13398930430412292, 0.17748811841011047, 0.22098693251609802, 0.2644857168197632, 0.30798453092575073, 0.3514833450317383, 0.39498215913772583, 0.4384809732437134, 0.48197975754737854, 0.5254786014556885, 0.5689773559570312, 0.6124761700630188, 0.6559749841690063, 0.6994737982749939, 0.7429726123809814, 0.786471426486969, 0.8299702405929565, 0.8734689950942993, 0.9169678688049316, 0.9604666233062744, 1.0039653778076172, 1.0474642515182495, 1.0909630060195923, 1.1344618797302246, 1.1779606342315674, 1.2214595079421997, 1.2649582624435425, 1.3084571361541748, 1.3519558906555176, 1.3954546451568604, 1.4389533996582031, 1.4824522733688354, 1.5259510278701782, 1.5694499015808105, 1.6129486560821533, 1.656447410583496, 1.6999462842941284, 1.7434451580047607]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 11.0, 15.0, 9.0, 13.0, 18.0, 27.0, 20.0, 19.0, 27.0, 41.0, 40.0, 49.0, 31.0, 44.0, 58.0, 51.0, 48.0, 55.0, 47.0, 55.0, 36.0, 46.0, 44.0, 28.0, 26.0, 20.0, 27.0, 15.0, 15.0, 18.0, 13.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301017701625824, -0.29016268253326416, -0.27930769324302673, -0.2684526741504669, -0.2575976550579071, -0.24674266576766968, -0.23588764667510986, -0.22503264248371124, -0.21417763829231262, -0.203322634100914, -0.1924676150083542, -0.18161261081695557, -0.17075760662555695, -0.15990260243415833, -0.1490475833415985, -0.1381925791501999, -0.12733756005764008, -0.11648254841566086, -0.10562754422426224, -0.09477253258228302, -0.0839175283908844, -0.07306251674890518, -0.062207505106925964, -0.051352500915527344, -0.040497489273548126, -0.029642481356859207, -0.01878747157752514, -0.00793246179819107, 0.0029225461184978485, 0.013777554035186768, 0.024632565677165985, 0.035487569868564606, 0.04634258151054382, 0.05719758942723274, 0.06805259734392166, 0.07890760898590088, 0.0897626131772995, 0.10061762481927872, 0.11147263646125793, 0.12232764065265656, 0.13318264484405518, 0.1440376490354538, 0.1548926681280136, 0.16574767231941223, 0.17660267651081085, 0.18745768070220947, 0.1983126997947693, 0.2091677039861679, 0.22002272307872772, 0.23087772727012634, 0.24173274636268616, 0.2525877356529236, 0.2634427547454834, 0.2742977738380432, 0.285152792930603, 0.29600778222084045, 0.30686280131340027, 0.3177178204059601, 0.3285728096961975, 0.3394278287887573, 0.35028284788131714, 0.36113783717155457, 0.3719928562641144, 0.3828478455543518, 0.3937028646469116]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 6.0, 4.0, 1.0, 10.0, 11.0, 17.0, 12.0, 31.0, 44.0, 64.0, 99.0, 189.0, 399.0, 791.0, 1879.0, 5812.0, 25884.0, 272724.0, 674975.0, 51667.0, 9031.0, 2822.0, 1006.0, 481.0, 218.0, 151.0, 61.0, 54.0, 31.0, 31.0, 15.0, 6.0, 5.0, 3.0, 7.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.466796875, -0.4535255432128906, -0.44025421142578125, -0.4269828796386719, -0.4137115478515625, -0.4004402160644531, -0.38716888427734375, -0.3738975524902344, -0.360626220703125, -0.3473548889160156, -0.33408355712890625, -0.3208122253417969, -0.3075408935546875, -0.2942695617675781, -0.28099822998046875, -0.2677268981933594, -0.25445556640625, -0.24118423461914062, -0.22791290283203125, -0.21464157104492188, -0.2013702392578125, -0.18809890747070312, -0.17482757568359375, -0.16155624389648438, -0.148284912109375, -0.13501358032226562, -0.12174224853515625, -0.10847091674804688, -0.0951995849609375, -0.08192825317382812, -0.06865692138671875, -0.055385589599609375, -0.0421142578125, -0.028842926025390625, -0.01557159423828125, -0.002300262451171875, 0.0109710693359375, 0.024242401123046875, 0.03751373291015625, 0.050785064697265625, 0.064056396484375, 0.07732772827148438, 0.09059906005859375, 0.10387039184570312, 0.1171417236328125, 0.13041305541992188, 0.14368438720703125, 0.15695571899414062, 0.17022705078125, 0.18349838256835938, 0.19676971435546875, 0.21004104614257812, 0.2233123779296875, 0.23658370971679688, 0.24985504150390625, 0.2631263732910156, 0.276397705078125, 0.2896690368652344, 0.30294036865234375, 0.3162117004394531, 0.3294830322265625, 0.3427543640136719, 0.35602569580078125, 0.3692970275878906, 0.382568359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 10.0, 37.0, 36.0, 54.0, 62.0, 91.0, 93.0, 113.0, 103.0, 99.0, 82.0, 74.0, 46.0, 45.0, 18.0, 8.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17944908142089844, -0.17506027221679688, -0.1706714630126953, -0.16628265380859375, -0.1618938446044922, -0.15750503540039062, -0.15311622619628906, -0.1487274169921875, -0.14433860778808594, -0.13994979858398438, -0.1355609893798828, -0.13117218017578125, -0.1267833709716797, -0.12239456176757812, -0.11800575256347656, -0.113616943359375, -0.10922813415527344, -0.10483932495117188, -0.10045051574707031, -0.09606170654296875, -0.09167289733886719, -0.08728408813476562, -0.08289527893066406, -0.0785064697265625, -0.07411766052246094, -0.06972885131835938, -0.06534004211425781, -0.06095123291015625, -0.05656242370605469, -0.052173614501953125, -0.04778480529785156, -0.04339599609375, -0.03900718688964844, -0.034618377685546875, -0.030229568481445312, -0.02584075927734375, -0.021451950073242188, -0.017063140869140625, -0.012674331665039062, -0.0082855224609375, -0.0038967132568359375, 0.000492095947265625, 0.0048809051513671875, 0.00926971435546875, 0.013658523559570312, 0.018047332763671875, 0.022436141967773438, 0.026824951171875, 0.031213760375976562, 0.035602569580078125, 0.03999137878417969, 0.04438018798828125, 0.04876899719238281, 0.053157806396484375, 0.05754661560058594, 0.0619354248046875, 0.06632423400878906, 0.07071304321289062, 0.07510185241699219, 0.07949066162109375, 0.08387947082519531, 0.08826828002929688, 0.09265708923339844, 0.0970458984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 4.0, 6.0, 17.0, 17.0, 32.0, 55.0, 75.0, 126.0, 199.0, 349.0, 617.0, 1257.0, 2511.0, 6265.0, 20116.0, 98876.0, 675917.0, 194776.0, 32014.0, 8711.0, 3275.0, 1477.0, 759.0, 403.0, 252.0, 137.0, 97.0, 58.0, 35.0, 37.0, 24.0, 16.0, 7.0, 4.0, 9.0, 5.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.21531295776367188, -0.20723724365234375, -0.19916152954101562, -0.1910858154296875, -0.18301010131835938, -0.17493438720703125, -0.16685867309570312, -0.158782958984375, -0.15070724487304688, -0.14263153076171875, -0.13455581665039062, -0.1264801025390625, -0.11840438842773438, -0.11032867431640625, -0.10225296020507812, -0.09417724609375, -0.08610153198242188, -0.07802581787109375, -0.06995010375976562, -0.0618743896484375, -0.053798675537109375, -0.04572296142578125, -0.037647247314453125, -0.029571533203125, -0.021495819091796875, -0.01342010498046875, -0.005344390869140625, 0.0027313232421875, 0.010807037353515625, 0.01888275146484375, 0.026958465576171875, 0.0350341796875, 0.043109893798828125, 0.05118560791015625, 0.059261322021484375, 0.0673370361328125, 0.07541275024414062, 0.08348846435546875, 0.09156417846679688, 0.099639892578125, 0.10771560668945312, 0.11579132080078125, 0.12386703491210938, 0.1319427490234375, 0.14001846313476562, 0.14809417724609375, 0.15616989135742188, 0.16424560546875, 0.17232131958007812, 0.18039703369140625, 0.18847274780273438, 0.1965484619140625, 0.20462417602539062, 0.21269989013671875, 0.22077560424804688, 0.228851318359375, 0.23692703247070312, 0.24500274658203125, 0.2530784606933594, 0.2611541748046875, 0.2692298889160156, 0.27730560302734375, 0.2853813171386719, 0.29345703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 10.0, 6.0, 17.0, 14.0, 18.0, 23.0, 27.0, 25.0, 33.0, 36.0, 24.0, 35.0, 32.0, 48.0, 54.0, 59.0, 44.0, 55.0, 48.0, 52.0, 43.0, 34.0, 32.0, 26.0, 22.0, 26.0, 24.0, 16.0, 17.0, 13.0, 11.0, 11.0, 5.0, 6.0, 8.0, 3.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.280029296875, -0.27203369140625, -0.2640380859375, -0.25604248046875, -0.248046875, -0.24005126953125, -0.2320556640625, -0.22406005859375, -0.216064453125, -0.20806884765625, -0.2000732421875, -0.19207763671875, -0.18408203125, -0.17608642578125, -0.1680908203125, -0.16009521484375, -0.152099609375, -0.14410400390625, -0.1361083984375, -0.12811279296875, -0.1201171875, -0.11212158203125, -0.1041259765625, -0.09613037109375, -0.088134765625, -0.08013916015625, -0.0721435546875, -0.06414794921875, -0.05615234375, -0.04815673828125, -0.0401611328125, -0.03216552734375, -0.024169921875, -0.01617431640625, -0.0081787109375, -0.00018310546875, 0.0078125, 0.01580810546875, 0.0238037109375, 0.03179931640625, 0.039794921875, 0.04779052734375, 0.0557861328125, 0.06378173828125, 0.07177734375, 0.07977294921875, 0.0877685546875, 0.09576416015625, 0.103759765625, 0.11175537109375, 0.1197509765625, 0.12774658203125, 0.1357421875, 0.14373779296875, 0.1517333984375, 0.15972900390625, 0.167724609375, 0.17572021484375, 0.1837158203125, 0.19171142578125, 0.19970703125, 0.20770263671875, 0.2156982421875, 0.22369384765625, 0.231689453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 19.0, 46.0, 71.0, 139.0, 334.0, 961.0, 7452.0, 1008083.0, 29138.0, 1487.0, 445.0, 191.0, 88.0, 40.0, 33.0, 13.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.22625160217285156, -0.21776199340820312, -0.2092723846435547, -0.20078277587890625, -0.1922931671142578, -0.18380355834960938, -0.17531394958496094, -0.1668243408203125, -0.15833473205566406, -0.14984512329101562, -0.1413555145263672, -0.13286590576171875, -0.12437629699707031, -0.11588668823242188, -0.10739707946777344, -0.098907470703125, -0.09041786193847656, -0.08192825317382812, -0.07343864440917969, -0.06494903564453125, -0.05645942687988281, -0.047969818115234375, -0.03948020935058594, -0.0309906005859375, -0.022500991821289062, -0.014011383056640625, -0.0055217742919921875, 0.00296783447265625, 0.011457443237304688, 0.019947052001953125, 0.028436660766601562, 0.03692626953125, 0.04541587829589844, 0.053905487060546875, 0.06239509582519531, 0.07088470458984375, 0.07937431335449219, 0.08786392211914062, 0.09635353088378906, 0.1048431396484375, 0.11333274841308594, 0.12182235717773438, 0.1303119659423828, 0.13880157470703125, 0.1472911834716797, 0.15578079223632812, 0.16427040100097656, 0.172760009765625, 0.18124961853027344, 0.18973922729492188, 0.1982288360595703, 0.20671844482421875, 0.2152080535888672, 0.22369766235351562, 0.23218727111816406, 0.2406768798828125, 0.24916648864746094, 0.2576560974121094, 0.2661457061767578, 0.27463531494140625, 0.2831249237060547, 0.2916145324707031, 0.30010414123535156, 0.30859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 23.0, 30.0, 58.0, 117.0, 218.0, 247.0, 131.0, 76.0, 47.0, 16.0, 12.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004241466522216797, -0.00041430629789829254, -0.0004044659435749054, -0.00039462558925151825, -0.0003847852349281311, -0.00037494488060474396, -0.0003651045262813568, -0.00035526417195796967, -0.0003454238176345825, -0.0003355834633111954, -0.00032574310898780823, -0.0003159027546644211, -0.00030606240034103394, -0.0002962220460176468, -0.00028638169169425964, -0.0002765413373708725, -0.00026670098304748535, -0.0002568606287240982, -0.00024702027440071106, -0.00023717992007732391, -0.00022733956575393677, -0.00021749921143054962, -0.00020765885710716248, -0.00019781850278377533, -0.00018797814846038818, -0.00017813779413700104, -0.0001682974398136139, -0.00015845708549022675, -0.0001486167311668396, -0.00013877637684345245, -0.0001289360225200653, -0.00011909566819667816, -0.00010925531387329102, -9.941495954990387e-05, -8.957460522651672e-05, -7.973425090312958e-05, -6.989389657974243e-05, -6.0053542256355286e-05, -5.021318793296814e-05, -4.0372833609580994e-05, -3.053247928619385e-05, -2.06921249628067e-05, -1.0851770639419556e-05, -1.0114163160324097e-06, 8.828938007354736e-06, 1.8669292330741882e-05, 2.850964665412903e-05, 3.8350000977516174e-05, 4.819035530090332e-05, 5.8030709624290466e-05, 6.787106394767761e-05, 7.771141827106476e-05, 8.75517725944519e-05, 9.739212691783905e-05, 0.0001072324812412262, 0.00011707283556461334, 0.0001269131898880005, 0.00013675354421138763, 0.00014659389853477478, 0.00015643425285816193, 0.00016627460718154907, 0.00017611496150493622, 0.00018595531582832336, 0.0001957956701517105, 0.00020563602447509766]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 11.0, 39.0, 65.0, 135.0, 386.0, 1537.0, 241195.0, 802309.0, 2206.0, 383.0, 140.0, 78.0, 36.0, 15.0, 13.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3083362579345703, -0.3000221252441406, -0.29170799255371094, -0.28339385986328125, -0.27507972717285156, -0.2667655944824219, -0.2584514617919922, -0.2501373291015625, -0.2418231964111328, -0.23350906372070312, -0.22519493103027344, -0.21688079833984375, -0.20856666564941406, -0.20025253295898438, -0.1919384002685547, -0.183624267578125, -0.1753101348876953, -0.16699600219726562, -0.15868186950683594, -0.15036773681640625, -0.14205360412597656, -0.13373947143554688, -0.1254253387451172, -0.1171112060546875, -0.10879707336425781, -0.10048294067382812, -0.09216880798339844, -0.08385467529296875, -0.07554054260253906, -0.06722640991210938, -0.05891227722167969, -0.05059814453125, -0.04228401184082031, -0.033969879150390625, -0.025655746459960938, -0.01734161376953125, -0.009027481079101562, -0.000713348388671875, 0.0076007843017578125, 0.0159149169921875, 0.024229049682617188, 0.032543182373046875, 0.04085731506347656, 0.04917144775390625, 0.05748558044433594, 0.06579971313476562, 0.07411384582519531, 0.082427978515625, 0.09074211120605469, 0.09905624389648438, 0.10737037658691406, 0.11568450927734375, 0.12399864196777344, 0.13231277465820312, 0.1406269073486328, 0.1489410400390625, 0.1572551727294922, 0.16556930541992188, 0.17388343811035156, 0.18219757080078125, 0.19051170349121094, 0.19882583618164062, 0.2071399688720703, 0.2154541015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 13.0, 10.0, 51.0, 127.0, 253.0, 305.0, 136.0, 69.0, 22.0, 15.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.31689453125, -0.31017398834228516, -0.3034534454345703, -0.29673290252685547, -0.2900123596191406, -0.2832918167114258, -0.27657127380371094, -0.2698507308959961, -0.26313018798828125, -0.2564096450805664, -0.24968910217285156, -0.24296855926513672, -0.23624801635742188, -0.22952747344970703, -0.2228069305419922, -0.21608638763427734, -0.2093658447265625, -0.20264530181884766, -0.1959247589111328, -0.18920421600341797, -0.18248367309570312, -0.17576313018798828, -0.16904258728027344, -0.1623220443725586, -0.15560150146484375, -0.1488809585571289, -0.14216041564941406, -0.13543987274169922, -0.12871932983398438, -0.12199878692626953, -0.11527824401855469, -0.10855770111083984, -0.101837158203125, -0.09511661529541016, -0.08839607238769531, -0.08167552947998047, -0.07495498657226562, -0.06823444366455078, -0.06151390075683594, -0.054793357849121094, -0.04807281494140625, -0.041352272033691406, -0.03463172912597656, -0.02791118621826172, -0.021190643310546875, -0.014470100402832031, -0.0077495574951171875, -0.0010290145874023438, 0.0056915283203125, 0.012412071228027344, 0.019132614135742188, 0.02585315704345703, 0.032573699951171875, 0.03929424285888672, 0.04601478576660156, 0.052735328674316406, 0.05945587158203125, 0.0661764144897461, 0.07289695739746094, 0.07961750030517578, 0.08633804321289062, 0.09305858612060547, 0.09977912902832031, 0.10649967193603516, 0.11322021484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 59.0, 330.0, 473.0, 115.0, 16.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.055200576782227, -9.869478225708008, -9.683755874633789, -9.49803352355957, -9.312312126159668, -9.12658977508545, -8.94086742401123, -8.755145072937012, -8.569422721862793, -8.383700370788574, -8.197978019714355, -8.012255668640137, -7.826533794403076, -7.640811443328857, -7.455089569091797, -7.269367218017578, -7.083644866943359, -6.897922515869141, -6.71220064163208, -6.526478290557861, -6.340755939483643, -6.155033588409424, -5.969311714172363, -5.7835893630981445, -5.597867488861084, -5.412145137786865, -5.226423263549805, -5.040700912475586, -4.854978561401367, -4.669256210327148, -4.483534336090088, -4.297811985015869, -4.112089157104492, -3.9263670444488525, -3.740644693374634, -3.554922580718994, -3.3692002296447754, -3.1834781169891357, -2.997756004333496, -2.8120336532592773, -2.626311779022217, -2.440589666366577, -2.2548673152923584, -2.0691452026367188, -1.8834228515625, -1.6977007389068604, -1.5119785070419312, -1.326256275177002, -1.1405339241027832, -0.954811692237854, -0.7690894603729248, -0.5833672881126404, -0.3976450562477112, -0.21192282438278198, -0.02620065212249756, 0.15952157974243164, 0.34524381160736084, 0.53096604347229, 0.7166882753372192, 0.9024104475975037, 1.088132619857788, 1.2738549709320068, 1.4595770835876465, 1.6452993154525757, 1.8310215473175049]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 6.0, 7.0, 9.0, 9.0, 13.0, 13.0, 26.0, 23.0, 27.0, 24.0, 20.0, 34.0, 35.0, 40.0, 32.0, 27.0, 33.0, 37.0, 46.0, 44.0, 46.0, 34.0, 37.0, 39.0, 33.0, 20.0, 31.0, 27.0, 25.0, 26.0, 18.0, 24.0, 12.0, 21.0, 19.0, 12.0, 6.0, 9.0, 6.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0], "bins": [-1.1482033729553223, -1.113869547843933, -1.079535722732544, -1.0452018976211548, -1.0108680725097656, -0.9765341877937317, -0.9422003626823425, -0.9078665375709534, -0.8735326528549194, -0.8391988277435303, -0.8048650026321411, -0.770531177520752, -0.736197292804718, -0.7018634676933289, -0.6675296425819397, -0.6331958174705505, -0.5988619923591614, -0.5645281672477722, -0.5301943421363831, -0.4958604872226715, -0.46152663230895996, -0.4271928071975708, -0.39285898208618164, -0.3585251569747925, -0.32419130206108093, -0.2898574769496918, -0.2555236220359802, -0.22118979692459106, -0.1868559569120407, -0.15252211689949036, -0.1181882917881012, -0.08385445177555084, -0.04952061176300049, -0.015186775475740433, 0.019147060811519623, 0.05348089337348938, 0.08781473338603973, 0.12214857339859009, 0.15648239850997925, 0.1908162385225296, 0.22515007853507996, 0.2594839036464691, 0.29381775856018066, 0.3281515836715698, 0.362485408782959, 0.39681926369667053, 0.4311530888080597, 0.46548694372177124, 0.4998207688331604, 0.5341545939445496, 0.5684884190559387, 0.6028223037719727, 0.6371561288833618, 0.671489953994751, 0.7058237791061401, 0.7401576042175293, 0.7744914293289185, 0.8088252544403076, 0.8431590795516968, 0.8774929046630859, 0.9118267893791199, 0.946160614490509, 0.9804944396018982, 1.0148283243179321, 1.0491621494293213]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 9.0, 6.0, 15.0, 18.0, 21.0, 36.0, 36.0, 50.0, 60.0, 61.0, 98.0, 102.0, 165.0, 217.0, 316.0, 595.0, 1275.0, 2955.0, 9457.0, 47426.0, 3599948.0, 490952.0, 28807.0, 6702.0, 2362.0, 1037.0, 515.0, 332.0, 178.0, 114.0, 98.0, 66.0, 54.0, 40.0, 36.0, 27.0, 12.0, 16.0, 10.0, 14.0, 7.0, 6.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.275390625, -0.2677116394042969, -0.26003265380859375, -0.2523536682128906, -0.2446746826171875, -0.23699569702148438, -0.22931671142578125, -0.22163772583007812, -0.213958740234375, -0.20627975463867188, -0.19860076904296875, -0.19092178344726562, -0.1832427978515625, -0.17556381225585938, -0.16788482666015625, -0.16020584106445312, -0.15252685546875, -0.14484786987304688, -0.13716888427734375, -0.12948989868164062, -0.1218109130859375, -0.11413192749023438, -0.10645294189453125, -0.09877395629882812, -0.091094970703125, -0.08341598510742188, -0.07573699951171875, -0.06805801391601562, -0.0603790283203125, -0.052700042724609375, -0.04502105712890625, -0.037342071533203125, -0.0296630859375, -0.021984100341796875, -0.01430511474609375, -0.006626129150390625, 0.0010528564453125, 0.008731842041015625, 0.01641082763671875, 0.024089813232421875, 0.031768798828125, 0.039447784423828125, 0.04712677001953125, 0.054805755615234375, 0.0624847412109375, 0.07016372680664062, 0.07784271240234375, 0.08552169799804688, 0.09320068359375, 0.10087966918945312, 0.10855865478515625, 0.11623764038085938, 0.1239166259765625, 0.13159561157226562, 0.13927459716796875, 0.14695358276367188, 0.154632568359375, 0.16231155395507812, 0.16999053955078125, 0.17766952514648438, 0.1853485107421875, 0.19302749633789062, 0.20070648193359375, 0.20838546752929688, 0.216064453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 14.0, 21.0, 20.0, 37.0, 48.0, 71.0, 80.0, 88.0, 106.0, 103.0, 85.0, 79.0, 83.0, 57.0, 32.0, 28.0, 18.0, 11.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197021484375, -0.1923351287841797, -0.18764877319335938, -0.18296241760253906, -0.17827606201171875, -0.17358970642089844, -0.16890335083007812, -0.1642169952392578, -0.1595306396484375, -0.1548442840576172, -0.15015792846679688, -0.14547157287597656, -0.14078521728515625, -0.13609886169433594, -0.13141250610351562, -0.1267261505126953, -0.122039794921875, -0.11735343933105469, -0.11266708374023438, -0.10798072814941406, -0.10329437255859375, -0.09860801696777344, -0.09392166137695312, -0.08923530578613281, -0.0845489501953125, -0.07986259460449219, -0.07517623901367188, -0.07048988342285156, -0.06580352783203125, -0.06111717224121094, -0.056430816650390625, -0.05174446105957031, -0.04705810546875, -0.04237174987792969, -0.037685394287109375, -0.03299903869628906, -0.02831268310546875, -0.023626327514648438, -0.018939971923828125, -0.014253616333007812, -0.0095672607421875, -0.0048809051513671875, -0.000194549560546875, 0.0044918060302734375, 0.00917816162109375, 0.013864517211914062, 0.018550872802734375, 0.023237228393554688, 0.027923583984375, 0.03260993957519531, 0.037296295166015625, 0.04198265075683594, 0.04666900634765625, 0.05135536193847656, 0.056041717529296875, 0.06072807312011719, 0.0654144287109375, 0.07010078430175781, 0.07478713989257812, 0.07947349548339844, 0.08415985107421875, 0.08884620666503906, 0.09353256225585938, 0.09821891784667969, 0.1029052734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 16.0, 20.0, 28.0, 39.0, 64.0, 90.0, 147.0, 240.0, 358.0, 626.0, 1063.0, 2009.0, 4623.0, 14166.0, 83679.0, 3892036.0, 163224.0, 20183.0, 5893.0, 2499.0, 1326.0, 734.0, 430.0, 275.0, 160.0, 117.0, 80.0, 36.0, 26.0, 23.0, 21.0, 6.0, 12.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.201904296875, -0.19402313232421875, -0.1861419677734375, -0.17826080322265625, -0.170379638671875, -0.16249847412109375, -0.1546173095703125, -0.14673614501953125, -0.13885498046875, -0.13097381591796875, -0.1230926513671875, -0.11521148681640625, -0.107330322265625, -0.09944915771484375, -0.0915679931640625, -0.08368682861328125, -0.0758056640625, -0.06792449951171875, -0.0600433349609375, -0.05216217041015625, -0.044281005859375, -0.03639984130859375, -0.0285186767578125, -0.02063751220703125, -0.01275634765625, -0.00487518310546875, 0.0030059814453125, 0.01088714599609375, 0.018768310546875, 0.02664947509765625, 0.0345306396484375, 0.04241180419921875, 0.05029296875, 0.05817413330078125, 0.0660552978515625, 0.07393646240234375, 0.081817626953125, 0.08969879150390625, 0.0975799560546875, 0.10546112060546875, 0.11334228515625, 0.12122344970703125, 0.1291046142578125, 0.13698577880859375, 0.144866943359375, 0.15274810791015625, 0.1606292724609375, 0.16851043701171875, 0.1763916015625, 0.18427276611328125, 0.1921539306640625, 0.20003509521484375, 0.207916259765625, 0.21579742431640625, 0.2236785888671875, 0.23155975341796875, 0.23944091796875, 0.24732208251953125, 0.2552032470703125, 0.26308441162109375, 0.270965576171875, 0.27884674072265625, 0.2867279052734375, 0.29460906982421875, 0.302490234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 9.0, 8.0, 28.0, 49.0, 74.0, 188.0, 980.0, 2304.0, 214.0, 90.0, 49.0, 32.0, 10.0, 7.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09460735321044922, -0.09052085876464844, -0.08643436431884766, -0.08234786987304688, -0.0782613754272461, -0.07417488098144531, -0.07008838653564453, -0.06600189208984375, -0.06191539764404297, -0.05782890319824219, -0.053742408752441406, -0.049655914306640625, -0.045569419860839844, -0.04148292541503906, -0.03739643096923828, -0.0333099365234375, -0.02922344207763672, -0.025136947631835938, -0.021050453186035156, -0.016963958740234375, -0.012877464294433594, -0.008790969848632812, -0.004704475402832031, -0.00061798095703125, 0.0034685134887695312, 0.0075550079345703125, 0.011641502380371094, 0.015727996826171875, 0.019814491271972656, 0.023900985717773438, 0.02798748016357422, 0.032073974609375, 0.03616046905517578, 0.04024696350097656, 0.044333457946777344, 0.048419952392578125, 0.052506446838378906, 0.05659294128417969, 0.06067943572998047, 0.06476593017578125, 0.06885242462158203, 0.07293891906738281, 0.0770254135131836, 0.08111190795898438, 0.08519840240478516, 0.08928489685058594, 0.09337139129638672, 0.0974578857421875, 0.10154438018798828, 0.10563087463378906, 0.10971736907958984, 0.11380386352539062, 0.1178903579711914, 0.12197685241699219, 0.12606334686279297, 0.13014984130859375, 0.13423633575439453, 0.1383228302001953, 0.1424093246459961, 0.14649581909179688, 0.15058231353759766, 0.15466880798339844, 0.15875530242919922, 0.162841796875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 10.0, 18.0, 65.0, 200.0, 427.0, 212.0, 53.0, 11.0, 6.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2805880308151245, -0.24361862242221832, -0.20664921402931213, -0.16967980563640594, -0.13271039724349976, -0.09574098885059357, -0.05877158045768738, -0.021802186965942383, 0.015167236328125, 0.05213664472103119, 0.08910605311393738, 0.12607546150684357, 0.16304486989974976, 0.20001427829265594, 0.23698368668556213, 0.27395308017730713, 0.3109225034713745, 0.3478919267654419, 0.3848613202571869, 0.4218307137489319, 0.45880013704299927, 0.49576956033706665, 0.5327389240264893, 0.5697083473205566, 0.606677770614624, 0.6436471939086914, 0.6806166172027588, 0.7175859808921814, 0.7545554041862488, 0.7915248274803162, 0.8284941911697388, 0.8654636144638062, 0.902432918548584, 0.9394023418426514, 0.9763717651367188, 1.0133411884307861, 1.0503106117248535, 1.0872799158096313, 1.1242493391036987, 1.1612187623977661, 1.1981881856918335, 1.2351576089859009, 1.2721270322799683, 1.3090964555740356, 1.3460657596588135, 1.3830351829528809, 1.4200046062469482, 1.4569740295410156, 1.493943452835083, 1.5309128761291504, 1.5678822994232178, 1.6048517227172852, 1.6418211460113525, 1.6787904500961304, 1.7157598733901978, 1.7527292966842651, 1.7896987199783325, 1.8266681432724, 1.8636375665664673, 1.9006069898605347, 1.9375762939453125, 1.9745457172393799, 2.0115151405334473, 2.0484845638275146, 2.085453987121582]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 11.0, 20.0, 25.0, 29.0, 35.0, 52.0, 59.0, 62.0, 74.0, 85.0, 85.0, 77.0, 84.0, 61.0, 42.0, 47.0, 43.0, 25.0, 20.0, 16.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4367576241493225, -0.42403900623321533, -0.41132041811943054, -0.39860180020332336, -0.3858831822872162, -0.3731645941734314, -0.3604459762573242, -0.34772735834121704, -0.33500877022743225, -0.3222901523113251, -0.3095715641975403, -0.2968529462814331, -0.2841343283653259, -0.27141574025154114, -0.25869712233543396, -0.24597851932048798, -0.2332599014043808, -0.22054129838943481, -0.20782268047332764, -0.19510407745838165, -0.18238547444343567, -0.1696668565273285, -0.1569482535123825, -0.14422965049743652, -0.13151103258132935, -0.11879242211580276, -0.10607381910085678, -0.0933552086353302, -0.08063660562038422, -0.06791799515485764, -0.055199384689331055, -0.04248078167438507, -0.029762178659439087, -0.017043571919202805, -0.004324963316321373, 0.008393645286560059, 0.02111225202679634, 0.03383085876703262, 0.046549469232559204, 0.05926807224750519, 0.07198668271303177, 0.08470529317855835, 0.09742389619350433, 0.11014250665903091, 0.1228611171245575, 0.13557972013950348, 0.14829832315444946, 0.16101694107055664, 0.17373554408550262, 0.1864541471004486, 0.1991727650165558, 0.21189136803150177, 0.22460997104644775, 0.23732858896255493, 0.2500472068786621, 0.2627657949924469, 0.2754844129085541, 0.28820303082466125, 0.30092161893844604, 0.3136402368545532, 0.3263588547706604, 0.3390774428844452, 0.35179606080055237, 0.36451464891433716, 0.37723326683044434]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 14.0, 21.0, 30.0, 51.0, 116.0, 226.0, 557.0, 1371.0, 4812.0, 21550.0, 181307.0, 722858.0, 96116.0, 14257.0, 3374.0, 1078.0, 397.0, 188.0, 88.0, 55.0, 27.0, 17.0, 6.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.49365234375, -0.481719970703125, -0.46978759765625, -0.457855224609375, -0.4459228515625, -0.433990478515625, -0.42205810546875, -0.410125732421875, -0.398193359375, -0.386260986328125, -0.37432861328125, -0.362396240234375, -0.3504638671875, -0.338531494140625, -0.32659912109375, -0.314666748046875, -0.302734375, -0.290802001953125, -0.27886962890625, -0.266937255859375, -0.2550048828125, -0.243072509765625, -0.23114013671875, -0.219207763671875, -0.207275390625, -0.195343017578125, -0.18341064453125, -0.171478271484375, -0.1595458984375, -0.147613525390625, -0.13568115234375, -0.123748779296875, -0.11181640625, -0.099884033203125, -0.08795166015625, -0.076019287109375, -0.0640869140625, -0.052154541015625, -0.04022216796875, -0.028289794921875, -0.016357421875, -0.004425048828125, 0.00750732421875, 0.019439697265625, 0.0313720703125, 0.043304443359375, 0.05523681640625, 0.067169189453125, 0.0791015625, 0.091033935546875, 0.10296630859375, 0.114898681640625, 0.1268310546875, 0.138763427734375, 0.15069580078125, 0.162628173828125, 0.174560546875, 0.186492919921875, 0.19842529296875, 0.210357666015625, 0.2222900390625, 0.234222412109375, 0.24615478515625, 0.258087158203125, 0.27001953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 19.0, 13.0, 23.0, 35.0, 38.0, 63.0, 72.0, 85.0, 94.0, 100.0, 86.0, 82.0, 80.0, 58.0, 53.0, 29.0, 29.0, 13.0, 6.0, 10.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.188568115234375, -0.18402099609375, -0.179473876953125, -0.1749267578125, -0.170379638671875, -0.16583251953125, -0.161285400390625, -0.15673828125, -0.152191162109375, -0.14764404296875, -0.143096923828125, -0.1385498046875, -0.134002685546875, -0.12945556640625, -0.124908447265625, -0.120361328125, -0.115814208984375, -0.11126708984375, -0.106719970703125, -0.1021728515625, -0.097625732421875, -0.09307861328125, -0.088531494140625, -0.083984375, -0.079437255859375, -0.07489013671875, -0.070343017578125, -0.0657958984375, -0.061248779296875, -0.05670166015625, -0.052154541015625, -0.047607421875, -0.043060302734375, -0.03851318359375, -0.033966064453125, -0.0294189453125, -0.024871826171875, -0.02032470703125, -0.015777587890625, -0.01123046875, -0.006683349609375, -0.00213623046875, 0.002410888671875, 0.0069580078125, 0.011505126953125, 0.01605224609375, 0.020599365234375, 0.025146484375, 0.029693603515625, 0.03424072265625, 0.038787841796875, 0.0433349609375, 0.047882080078125, 0.05242919921875, 0.056976318359375, 0.0615234375, 0.066070556640625, 0.07061767578125, 0.075164794921875, 0.0797119140625, 0.084259033203125, 0.08880615234375, 0.093353271484375, 0.097900390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 8.0, 12.0, 8.0, 12.0, 23.0, 33.0, 50.0, 71.0, 124.0, 215.0, 341.0, 654.0, 1353.0, 2812.0, 6963.0, 19483.0, 68093.0, 331146.0, 474962.0, 99506.0, 26700.0, 8982.0, 3537.0, 1591.0, 784.0, 421.0, 219.0, 152.0, 98.0, 47.0, 30.0, 29.0, 24.0, 20.0, 13.0, 10.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242431640625, -0.23553085327148438, -0.22863006591796875, -0.22172927856445312, -0.2148284912109375, -0.20792770385742188, -0.20102691650390625, -0.19412612915039062, -0.187225341796875, -0.18032455444335938, -0.17342376708984375, -0.16652297973632812, -0.1596221923828125, -0.15272140502929688, -0.14582061767578125, -0.13891983032226562, -0.13201904296875, -0.12511825561523438, -0.11821746826171875, -0.11131668090820312, -0.1044158935546875, -0.09751510620117188, -0.09061431884765625, -0.08371353149414062, -0.076812744140625, -0.06991195678710938, -0.06301116943359375, -0.056110382080078125, -0.0492095947265625, -0.042308807373046875, -0.03540802001953125, -0.028507232666015625, -0.0216064453125, -0.014705657958984375, -0.00780487060546875, -0.000904083251953125, 0.0059967041015625, 0.012897491455078125, 0.01979827880859375, 0.026699066162109375, 0.033599853515625, 0.040500640869140625, 0.04740142822265625, 0.054302215576171875, 0.0612030029296875, 0.06810379028320312, 0.07500457763671875, 0.08190536499023438, 0.08880615234375, 0.09570693969726562, 0.10260772705078125, 0.10950851440429688, 0.1164093017578125, 0.12331008911132812, 0.13021087646484375, 0.13711166381835938, 0.144012451171875, 0.15091323852539062, 0.15781402587890625, 0.16471481323242188, 0.1716156005859375, 0.17851638793945312, 0.18541717529296875, 0.19231796264648438, 0.19921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 9.0, 9.0, 20.0, 22.0, 17.0, 29.0, 27.0, 31.0, 36.0, 32.0, 27.0, 48.0, 43.0, 43.0, 50.0, 38.0, 66.0, 35.0, 37.0, 44.0, 42.0, 48.0, 38.0, 29.0, 30.0, 32.0, 14.0, 20.0, 22.0, 11.0, 12.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.328857421875, -0.31906890869140625, -0.3092803955078125, -0.29949188232421875, -0.289703369140625, -0.27991485595703125, -0.2701263427734375, -0.26033782958984375, -0.25054931640625, -0.24076080322265625, -0.2309722900390625, -0.22118377685546875, -0.211395263671875, -0.20160675048828125, -0.1918182373046875, -0.18202972412109375, -0.1722412109375, -0.16245269775390625, -0.1526641845703125, -0.14287567138671875, -0.133087158203125, -0.12329864501953125, -0.1135101318359375, -0.10372161865234375, -0.09393310546875, -0.08414459228515625, -0.0743560791015625, -0.06456756591796875, -0.054779052734375, -0.04499053955078125, -0.0352020263671875, -0.02541351318359375, -0.015625, -0.00583648681640625, 0.0039520263671875, 0.01374053955078125, 0.023529052734375, 0.03331756591796875, 0.0431060791015625, 0.05289459228515625, 0.06268310546875, 0.07247161865234375, 0.0822601318359375, 0.09204864501953125, 0.101837158203125, 0.11162567138671875, 0.1214141845703125, 0.13120269775390625, 0.1409912109375, 0.15077972412109375, 0.1605682373046875, 0.17035675048828125, 0.180145263671875, 0.18993377685546875, 0.1997222900390625, 0.20951080322265625, 0.21929931640625, 0.22908782958984375, 0.2388763427734375, 0.24866485595703125, 0.258453369140625, 0.26824188232421875, 0.2780303955078125, 0.28781890869140625, 0.297607421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 10.0, 7.0, 5.0, 9.0, 24.0, 36.0, 45.0, 68.0, 132.0, 207.0, 495.0, 1403.0, 4518.0, 19792.0, 213737.0, 755597.0, 40979.0, 7902.0, 2205.0, 696.0, 303.0, 142.0, 86.0, 55.0, 32.0, 26.0, 13.0, 11.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.267333984375, -0.2608451843261719, -0.25435638427734375, -0.24786758422851562, -0.2413787841796875, -0.23488998413085938, -0.22840118408203125, -0.22191238403320312, -0.215423583984375, -0.20893478393554688, -0.20244598388671875, -0.19595718383789062, -0.1894683837890625, -0.18297958374023438, -0.17649078369140625, -0.17000198364257812, -0.16351318359375, -0.15702438354492188, -0.15053558349609375, -0.14404678344726562, -0.1375579833984375, -0.13106918334960938, -0.12458038330078125, -0.11809158325195312, -0.111602783203125, -0.10511398315429688, -0.09862518310546875, -0.09213638305664062, -0.0856475830078125, -0.07915878295898438, -0.07266998291015625, -0.06618118286132812, -0.0596923828125, -0.053203582763671875, -0.04671478271484375, -0.040225982666015625, -0.0337371826171875, -0.027248382568359375, -0.02075958251953125, -0.014270782470703125, -0.007781982421875, -0.001293182373046875, 0.00519561767578125, 0.011684417724609375, 0.0181732177734375, 0.024662017822265625, 0.03115081787109375, 0.037639617919921875, 0.04412841796875, 0.050617218017578125, 0.05710601806640625, 0.06359481811523438, 0.0700836181640625, 0.07657241821289062, 0.08306121826171875, 0.08955001831054688, 0.096038818359375, 0.10252761840820312, 0.10901641845703125, 0.11550521850585938, 0.1219940185546875, 0.12848281860351562, 0.13497161865234375, 0.14146041870117188, 0.14794921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 10.0, 15.0, 38.0, 151.0, 378.0, 276.0, 89.0, 35.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005335807800292969, -0.0005232710391283035, -0.0005129612982273102, -0.0005026515573263168, -0.0004923418164253235, -0.00048203207552433014, -0.0004717223346233368, -0.00046141259372234344, -0.0004511028528213501, -0.00044079311192035675, -0.0004304833710193634, -0.00042017363011837006, -0.0004098638892173767, -0.00039955414831638336, -0.00038924440741539, -0.00037893466651439667, -0.0003686249256134033, -0.00035831518471241, -0.0003480054438114166, -0.0003376957029104233, -0.00032738596200942993, -0.0003170762211084366, -0.00030676648020744324, -0.0002964567393064499, -0.00028614699840545654, -0.0002758372575044632, -0.00026552751660346985, -0.0002552177757024765, -0.00024490803480148315, -0.0002345982939004898, -0.00022428855299949646, -0.0002139788120985031, -0.00020366907119750977, -0.00019335933029651642, -0.00018304958939552307, -0.00017273984849452972, -0.00016243010759353638, -0.00015212036669254303, -0.00014181062579154968, -0.00013150088489055634, -0.00012119114398956299, -0.00011088140308856964, -0.0001005716621875763, -9.026192128658295e-05, -7.99521803855896e-05, -6.964243948459625e-05, -5.9332698583602905e-05, -4.902295768260956e-05, -3.871321678161621e-05, -2.8403475880622864e-05, -1.8093734979629517e-05, -7.78399407863617e-06, 2.5257468223571777e-06, 1.2835487723350525e-05, 2.3145228624343872e-05, 3.345496952533722e-05, 4.3764710426330566e-05, 5.4074451327323914e-05, 6.438419222831726e-05, 7.469393312931061e-05, 8.500367403030396e-05, 9.53134149312973e-05, 0.00010562315583229065, 0.000115932896733284, 0.00012624263763427734]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 24.0, 67.0, 151.0, 385.0, 1278.0, 5440.0, 33291.0, 797426.0, 192295.0, 14252.0, 2827.0, 731.0, 228.0, 93.0, 33.0, 17.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.1303882598876953, -0.12344741821289062, -0.11650657653808594, -0.10956573486328125, -0.10262489318847656, -0.09568405151367188, -0.08874320983886719, -0.0818023681640625, -0.07486152648925781, -0.06792068481445312, -0.06097984313964844, -0.05403900146484375, -0.04709815979003906, -0.040157318115234375, -0.03321647644042969, -0.026275634765625, -0.019334793090820312, -0.012393951416015625, -0.0054531097412109375, 0.00148773193359375, 0.008428573608398438, 0.015369415283203125, 0.022310256958007812, 0.0292510986328125, 0.03619194030761719, 0.043132781982421875, 0.05007362365722656, 0.05701446533203125, 0.06395530700683594, 0.07089614868164062, 0.07783699035644531, 0.08477783203125, 0.09171867370605469, 0.09865951538085938, 0.10560035705566406, 0.11254119873046875, 0.11948204040527344, 0.12642288208007812, 0.1333637237548828, 0.1403045654296875, 0.1472454071044922, 0.15418624877929688, 0.16112709045410156, 0.16806793212890625, 0.17500877380371094, 0.18194961547851562, 0.1888904571533203, 0.195831298828125, 0.2027721405029297, 0.20971298217773438, 0.21665382385253906, 0.22359466552734375, 0.23053550720214844, 0.23747634887695312, 0.2444171905517578, 0.2513580322265625, 0.2582988739013672, 0.2652397155761719, 0.27218055725097656, 0.27912139892578125, 0.28606224060058594, 0.2930030822753906, 0.2999439239501953, 0.306884765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 8.0, 6.0, 12.0, 17.0, 21.0, 35.0, 69.0, 114.0, 160.0, 145.0, 129.0, 106.0, 65.0, 47.0, 21.0, 19.0, 12.0, 3.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.09825706481933594, -0.09287643432617188, -0.08749580383300781, -0.08211517333984375, -0.07673454284667969, -0.07135391235351562, -0.06597328186035156, -0.0605926513671875, -0.05521202087402344, -0.049831390380859375, -0.04445075988769531, -0.03907012939453125, -0.03368949890136719, -0.028308868408203125, -0.022928237915039062, -0.017547607421875, -0.012166976928710938, -0.006786346435546875, -0.0014057159423828125, 0.00397491455078125, 0.009355545043945312, 0.014736175537109375, 0.020116806030273438, 0.0254974365234375, 0.030878067016601562, 0.036258697509765625, 0.04163932800292969, 0.04701995849609375, 0.05240058898925781, 0.057781219482421875, 0.06316184997558594, 0.06854248046875, 0.07392311096191406, 0.07930374145507812, 0.08468437194824219, 0.09006500244140625, 0.09544563293457031, 0.10082626342773438, 0.10620689392089844, 0.1115875244140625, 0.11696815490722656, 0.12234878540039062, 0.1277294158935547, 0.13311004638671875, 0.1384906768798828, 0.14387130737304688, 0.14925193786621094, 0.154632568359375, 0.16001319885253906, 0.16539382934570312, 0.1707744598388672, 0.17615509033203125, 0.1815357208251953, 0.18691635131835938, 0.19229698181152344, 0.1976776123046875, 0.20305824279785156, 0.20843887329101562, 0.2138195037841797, 0.21920013427734375, 0.2245807647705078, 0.22996139526367188, 0.23534202575683594, 0.24072265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 21.0, 36.0, 88.0, 185.0, 316.0, 197.0, 102.0, 44.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1654329299926758, -1.063624620437622, -0.9618163108825684, -0.8600080609321594, -0.7581997513771057, -0.656391441822052, -0.5545831918716431, -0.45277488231658936, -0.35096657276153564, -0.24915827810764313, -0.1473499834537506, -0.04554170370101929, 0.056266605854034424, 0.15807491540908813, 0.25988316535949707, 0.3616914749145508, 0.4634997844696045, 0.5653080940246582, 0.6671164035797119, 0.7689246535301208, 0.8707329630851746, 0.9725412726402283, 1.0743495225906372, 1.176157832145691, 1.2779661417007446, 1.3797744512557983, 1.481582760810852, 1.5833909511566162, 1.68519926071167, 1.7870075702667236, 1.8888158798217773, 1.990624189376831, 2.0924324989318848, 2.1942408084869385, 2.296049118041992, 2.397857427597046, 2.4996657371520996, 2.6014740467071533, 2.703282356262207, 2.8050904273986816, 2.9068989753723145, 3.008707284927368, 3.110515594482422, 3.2123239040374756, 3.3141322135925293, 3.415940523147583, 3.5177488327026367, 3.6195569038391113, 3.721365213394165, 3.8231735229492188, 3.9249818325042725, 4.026790142059326, 4.128598213195801, 4.230406761169434, 4.332214832305908, 4.434023380279541, 4.535831451416016, 4.63763952255249, 4.739448070526123, 4.841256141662598, 4.9430646896362305, 5.044872760772705, 5.146681308746338, 5.2484893798828125, 5.350297927856445]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 13.0, 10.0, 12.0, 8.0, 15.0, 14.0, 24.0, 22.0, 23.0, 29.0, 31.0, 32.0, 33.0, 40.0, 43.0, 51.0, 34.0, 49.0, 36.0, 46.0, 37.0, 45.0, 35.0, 35.0, 36.0, 39.0, 27.0, 27.0, 18.0, 27.0, 12.0, 15.0, 13.0, 10.0, 11.0, 13.0, 5.0, 9.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3125150203704834, -1.2703300714492798, -1.2281451225280762, -1.185960292816162, -1.1437753438949585, -1.1015903949737549, -1.0594055652618408, -1.0172206163406372, -0.9750356674194336, -0.93285071849823, -0.8906658291816711, -0.8484809398651123, -0.8062959909439087, -0.7641110420227051, -0.7219261527061462, -0.6797412633895874, -0.6375563144683838, -0.5953713655471802, -0.5531864762306213, -0.5110015869140625, -0.4688166379928589, -0.42663171887397766, -0.38444679975509644, -0.3422618806362152, -0.300076961517334, -0.25789204239845276, -0.21570712327957153, -0.1735222041606903, -0.13133728504180908, -0.08915236592292786, -0.04696744680404663, -0.004782527685165405, 0.03740251064300537, 0.0795874297618866, 0.12177234888076782, 0.16395726799964905, 0.20614218711853027, 0.2483271062374115, 0.2905120253562927, 0.33269694447517395, 0.3748818635940552, 0.4170667827129364, 0.4592517018318176, 0.5014365911483765, 0.5436215400695801, 0.5858064889907837, 0.6279913783073425, 0.6701762676239014, 0.712361216545105, 0.7545461654663086, 0.7967310547828674, 0.8389159440994263, 0.8811008930206299, 0.9232858419418335, 0.9654707312583923, 1.0076556205749512, 1.0498405694961548, 1.0920255184173584, 1.1342103481292725, 1.176395297050476, 1.2185802459716797, 1.2607651948928833, 1.302950143814087, 1.345134973526001, 1.3873199224472046]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 10.0, 7.0, 7.0, 6.0, 8.0, 18.0, 28.0, 27.0, 44.0, 53.0, 81.0, 137.0, 238.0, 465.0, 973.0, 2223.0, 5479.0, 16774.0, 118767.0, 3971166.0, 57651.0, 12024.0, 4364.0, 1863.0, 837.0, 465.0, 223.0, 136.0, 98.0, 50.0, 20.0, 14.0, 9.0, 0.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.405029296875, -0.3956890106201172, -0.3863487243652344, -0.37700843811035156, -0.36766815185546875, -0.35832786560058594, -0.3489875793457031, -0.3396472930908203, -0.3303070068359375, -0.3209667205810547, -0.3116264343261719, -0.30228614807128906, -0.29294586181640625, -0.28360557556152344, -0.2742652893066406, -0.2649250030517578, -0.255584716796875, -0.2462444305419922, -0.23690414428710938, -0.22756385803222656, -0.21822357177734375, -0.20888328552246094, -0.19954299926757812, -0.1902027130126953, -0.1808624267578125, -0.1715221405029297, -0.16218185424804688, -0.15284156799316406, -0.14350128173828125, -0.13416099548339844, -0.12482070922851562, -0.11548042297363281, -0.10614013671875, -0.09679985046386719, -0.08745956420898438, -0.07811927795410156, -0.06877899169921875, -0.05943870544433594, -0.050098419189453125, -0.04075813293457031, -0.0314178466796875, -0.022077560424804688, -0.012737274169921875, -0.0033969879150390625, 0.00594329833984375, 0.015283584594726562, 0.024623870849609375, 0.03396415710449219, 0.043304443359375, 0.05264472961425781, 0.061985015869140625, 0.07132530212402344, 0.08066558837890625, 0.09000587463378906, 0.09934616088867188, 0.10868644714355469, 0.1180267333984375, 0.1273670196533203, 0.13670730590820312, 0.14604759216308594, 0.15538787841796875, 0.16472816467285156, 0.17406845092773438, 0.1834087371826172, 0.1927490234375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 12.0, 12.0, 14.0, 19.0, 38.0, 47.0, 36.0, 56.0, 69.0, 77.0, 67.0, 68.0, 76.0, 71.0, 59.0, 67.0, 50.0, 34.0, 37.0, 20.0, 20.0, 16.0, 10.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.17138671875, -0.1673755645751953, -0.16336441040039062, -0.15935325622558594, -0.15534210205078125, -0.15133094787597656, -0.14731979370117188, -0.1433086395263672, -0.1392974853515625, -0.1352863311767578, -0.13127517700195312, -0.12726402282714844, -0.12325286865234375, -0.11924171447753906, -0.11523056030273438, -0.11121940612792969, -0.107208251953125, -0.10319709777832031, -0.09918594360351562, -0.09517478942871094, -0.09116363525390625, -0.08715248107910156, -0.08314132690429688, -0.07913017272949219, -0.0751190185546875, -0.07110786437988281, -0.06709671020507812, -0.06308555603027344, -0.05907440185546875, -0.05506324768066406, -0.051052093505859375, -0.04704093933105469, -0.04302978515625, -0.03901863098144531, -0.035007476806640625, -0.030996322631835938, -0.02698516845703125, -0.022974014282226562, -0.018962860107421875, -0.014951705932617188, -0.0109405517578125, -0.0069293975830078125, -0.002918243408203125, 0.0010929107666015625, 0.00510406494140625, 0.009115219116210938, 0.013126373291015625, 0.017137527465820312, 0.021148681640625, 0.025159835815429688, 0.029170989990234375, 0.03318214416503906, 0.03719329833984375, 0.04120445251464844, 0.045215606689453125, 0.04922676086425781, 0.0532379150390625, 0.05724906921386719, 0.061260223388671875, 0.06527137756347656, 0.06928253173828125, 0.07329368591308594, 0.07730484008789062, 0.08131599426269531, 0.0853271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 7.0, 12.0, 31.0, 39.0, 50.0, 67.0, 110.0, 171.0, 235.0, 482.0, 769.0, 1313.0, 2494.0, 4959.0, 12223.0, 46103.0, 3724894.0, 355081.0, 27429.0, 9063.0, 3963.0, 1990.0, 1085.0, 655.0, 380.0, 230.0, 152.0, 109.0, 49.0, 45.0, 31.0, 19.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.1887664794921875, -0.182220458984375, -0.1756744384765625, -0.16912841796875, -0.1625823974609375, -0.156036376953125, -0.1494903564453125, -0.1429443359375, -0.1363983154296875, -0.129852294921875, -0.1233062744140625, -0.11676025390625, -0.1102142333984375, -0.103668212890625, -0.0971221923828125, -0.090576171875, -0.0840301513671875, -0.077484130859375, -0.0709381103515625, -0.06439208984375, -0.0578460693359375, -0.051300048828125, -0.0447540283203125, -0.0382080078125, -0.0316619873046875, -0.025115966796875, -0.0185699462890625, -0.01202392578125, -0.0054779052734375, 0.001068115234375, 0.0076141357421875, 0.01416015625, 0.0207061767578125, 0.027252197265625, 0.0337982177734375, 0.04034423828125, 0.0468902587890625, 0.053436279296875, 0.0599822998046875, 0.0665283203125, 0.0730743408203125, 0.079620361328125, 0.0861663818359375, 0.09271240234375, 0.0992584228515625, 0.105804443359375, 0.1123504638671875, 0.118896484375, 0.1254425048828125, 0.131988525390625, 0.1385345458984375, 0.14508056640625, 0.1516265869140625, 0.158172607421875, 0.1647186279296875, 0.1712646484375, 0.1778106689453125, 0.184356689453125, 0.1909027099609375, 0.19744873046875, 0.2039947509765625, 0.210540771484375, 0.2170867919921875, 0.2236328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 5.0, 4.0, 6.0, 10.0, 11.0, 6.0, 20.0, 51.0, 94.0, 423.0, 2936.0, 285.0, 83.0, 42.0, 30.0, 16.0, 11.0, 9.0, 7.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.0965127944946289, -0.09311103820800781, -0.08970928192138672, -0.08630752563476562, -0.08290576934814453, -0.07950401306152344, -0.07610225677490234, -0.07270050048828125, -0.06929874420166016, -0.06589698791503906, -0.06249523162841797, -0.059093475341796875, -0.05569171905517578, -0.05228996276855469, -0.048888206481933594, -0.0454864501953125, -0.042084693908691406, -0.03868293762207031, -0.03528118133544922, -0.031879425048828125, -0.02847766876220703, -0.025075912475585938, -0.021674156188964844, -0.01827239990234375, -0.014870643615722656, -0.011468887329101562, -0.008067131042480469, -0.004665374755859375, -0.0012636184692382812, 0.0021381378173828125, 0.005539894104003906, 0.008941650390625, 0.012343406677246094, 0.015745162963867188, 0.01914691925048828, 0.022548675537109375, 0.02595043182373047, 0.029352188110351562, 0.032753944396972656, 0.03615570068359375, 0.039557456970214844, 0.04295921325683594, 0.04636096954345703, 0.049762725830078125, 0.05316448211669922, 0.05656623840332031, 0.059967994689941406, 0.0633697509765625, 0.0667715072631836, 0.07017326354980469, 0.07357501983642578, 0.07697677612304688, 0.08037853240966797, 0.08378028869628906, 0.08718204498291016, 0.09058380126953125, 0.09398555755615234, 0.09738731384277344, 0.10078907012939453, 0.10419082641601562, 0.10759258270263672, 0.11099433898925781, 0.1143960952758789, 0.1177978515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 13.0, 58.0, 174.0, 328.0, 255.0, 111.0, 39.0, 15.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4735005795955658, -0.4494094252586365, -0.42531827092170715, -0.40122711658477783, -0.3771359622478485, -0.3530448079109192, -0.3289536237716675, -0.30486249923706055, -0.28077131509780884, -0.2566801607608795, -0.2325890064239502, -0.20849785208702087, -0.18440669775009155, -0.16031554341316223, -0.13622437417507172, -0.1121332198381424, -0.08804208040237427, -0.06395092606544495, -0.03985976800322533, -0.015768609941005707, 0.008322544395923615, 0.032413698732852936, 0.056504860520362854, 0.08059601485729218, 0.1046871691942215, 0.12877832353115082, 0.15286947786808014, 0.17696064710617065, 0.20105180144309998, 0.2251429557800293, 0.24923411011695862, 0.27332526445388794, 0.2974163889884949, 0.3215075433254242, 0.3455986976623535, 0.36968985199928284, 0.39378100633621216, 0.4178721606731415, 0.4419633150100708, 0.4660544991493225, 0.49014562368392944, 0.5142368078231812, 0.5383279323577881, 0.5624191164970398, 0.5865102410316467, 0.6106014251708984, 0.6346925497055054, 0.6587837338447571, 0.6828749179840088, 0.7069661021232605, 0.7310572266578674, 0.7551484107971191, 0.7792395353317261, 0.8033307194709778, 0.8274218440055847, 0.8515130281448364, 0.8756041526794434, 0.8996953368186951, 0.923786461353302, 0.9478776454925537, 0.9719687700271606, 0.9960599541664124, 1.020151138305664, 1.044242262840271, 1.068333387374878]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 10.0, 10.0, 20.0, 37.0, 36.0, 43.0, 51.0, 63.0, 86.0, 79.0, 91.0, 75.0, 77.0, 71.0, 74.0, 55.0, 25.0, 30.0, 23.0, 15.0, 9.0, 12.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31004977226257324, -0.2992687523365021, -0.2884877026081085, -0.27770668268203735, -0.2669256329536438, -0.25614461302757263, -0.24536357820034027, -0.2345825433731079, -0.22380150854587555, -0.2130204737186432, -0.20223943889141083, -0.19145840406417847, -0.1806773841381073, -0.16989633440971375, -0.15911531448364258, -0.14833427965641022, -0.13755324482917786, -0.1267722100019455, -0.11599117517471313, -0.10521014779806137, -0.09442911297082901, -0.08364807814359665, -0.07286705076694489, -0.062086015939712524, -0.051304981112480164, -0.0405239462852478, -0.02974291518330574, -0.018961884081363678, -0.008180849254131317, 0.0026001855731010437, 0.013381212949752808, 0.02416224777698517, 0.03494328260421753, 0.04572431743144989, 0.05650534853339195, 0.06728637963533401, 0.07806741446256638, 0.08884844928979874, 0.0996294766664505, 0.11041051149368286, 0.12119154632091522, 0.13197258114814758, 0.14275361597537994, 0.1535346508026123, 0.16431567072868347, 0.17509672045707703, 0.1858777403831482, 0.19665877521038055, 0.20743981003761292, 0.21822084486484528, 0.22900187969207764, 0.2397828996181488, 0.25056394934654236, 0.2613449692726135, 0.2721260190010071, 0.28290703892707825, 0.2936880588531494, 0.3044690787792206, 0.31525012850761414, 0.3260311484336853, 0.33681219816207886, 0.34759321808815, 0.3583742380142212, 0.36915528774261475, 0.3799363374710083]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 8.0, 20.0, 28.0, 42.0, 59.0, 85.0, 159.0, 264.0, 488.0, 891.0, 1708.0, 3500.0, 7421.0, 17548.0, 47439.0, 152569.0, 419980.0, 267551.0, 80562.0, 27452.0, 10906.0, 4846.0, 2261.0, 1188.0, 654.0, 366.0, 217.0, 112.0, 75.0, 46.0, 26.0, 17.0, 12.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15387535095214844, -0.14832687377929688, -0.1427783966064453, -0.13722991943359375, -0.1316814422607422, -0.12613296508789062, -0.12058448791503906, -0.1150360107421875, -0.10948753356933594, -0.10393905639648438, -0.09839057922363281, -0.09284210205078125, -0.08729362487792969, -0.08174514770507812, -0.07619667053222656, -0.070648193359375, -0.06509971618652344, -0.059551239013671875, -0.05400276184082031, -0.04845428466796875, -0.04290580749511719, -0.037357330322265625, -0.03180885314941406, -0.0262603759765625, -0.020711898803710938, -0.015163421630859375, -0.009614944458007812, -0.00406646728515625, 0.0014820098876953125, 0.007030487060546875, 0.012578964233398438, 0.01812744140625, 0.023675918579101562, 0.029224395751953125, 0.03477287292480469, 0.04032135009765625, 0.04586982727050781, 0.051418304443359375, 0.05696678161621094, 0.0625152587890625, 0.06806373596191406, 0.07361221313476562, 0.07916069030761719, 0.08470916748046875, 0.09025764465332031, 0.09580612182617188, 0.10135459899902344, 0.106903076171875, 0.11245155334472656, 0.11800003051757812, 0.12354850769042969, 0.12909698486328125, 0.1346454620361328, 0.14019393920898438, 0.14574241638183594, 0.1512908935546875, 0.15683937072753906, 0.16238784790039062, 0.1679363250732422, 0.17348480224609375, 0.1790332794189453, 0.18458175659179688, 0.19013023376464844, 0.1956787109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 15.0, 12.0, 23.0, 28.0, 46.0, 49.0, 60.0, 64.0, 65.0, 79.0, 74.0, 73.0, 65.0, 70.0, 64.0, 44.0, 36.0, 34.0, 19.0, 19.0, 17.0, 14.0, 7.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.175537109375, -0.17142391204833984, -0.1673107147216797, -0.16319751739501953, -0.15908432006835938, -0.15497112274169922, -0.15085792541503906, -0.1467447280883789, -0.14263153076171875, -0.1385183334350586, -0.13440513610839844, -0.13029193878173828, -0.12617874145507812, -0.12206554412841797, -0.11795234680175781, -0.11383914947509766, -0.1097259521484375, -0.10561275482177734, -0.10149955749511719, -0.09738636016845703, -0.09327316284179688, -0.08915996551513672, -0.08504676818847656, -0.0809335708618164, -0.07682037353515625, -0.0727071762084961, -0.06859397888183594, -0.06448078155517578, -0.060367584228515625, -0.05625438690185547, -0.05214118957519531, -0.048027992248535156, -0.043914794921875, -0.039801597595214844, -0.03568840026855469, -0.03157520294189453, -0.027462005615234375, -0.02334880828857422, -0.019235610961914062, -0.015122413635253906, -0.01100921630859375, -0.006896018981933594, -0.0027828216552734375, 0.0013303756713867188, 0.005443572998046875, 0.009556770324707031, 0.013669967651367188, 0.017783164978027344, 0.0218963623046875, 0.026009559631347656, 0.030122756958007812, 0.03423595428466797, 0.038349151611328125, 0.04246234893798828, 0.04657554626464844, 0.050688743591308594, 0.05480194091796875, 0.058915138244628906, 0.06302833557128906, 0.06714153289794922, 0.07125473022460938, 0.07536792755126953, 0.07948112487792969, 0.08359432220458984, 0.08770751953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 4.0, 5.0, 15.0, 17.0, 17.0, 25.0, 22.0, 30.0, 36.0, 47.0, 67.0, 103.0, 164.0, 207.0, 389.0, 746.0, 1551.0, 4030.0, 11896.0, 42877.0, 240306.0, 605244.0, 104499.0, 23620.0, 7263.0, 2692.0, 1149.0, 558.0, 338.0, 186.0, 142.0, 77.0, 43.0, 44.0, 29.0, 40.0, 21.0, 14.0, 10.0, 7.0, 7.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.272705078125, -0.26497650146484375, -0.2572479248046875, -0.24951934814453125, -0.241790771484375, -0.23406219482421875, -0.2263336181640625, -0.21860504150390625, -0.21087646484375, -0.20314788818359375, -0.1954193115234375, -0.18769073486328125, -0.179962158203125, -0.17223358154296875, -0.1645050048828125, -0.15677642822265625, -0.1490478515625, -0.14131927490234375, -0.1335906982421875, -0.12586212158203125, -0.118133544921875, -0.11040496826171875, -0.1026763916015625, -0.09494781494140625, -0.08721923828125, -0.07949066162109375, -0.0717620849609375, -0.06403350830078125, -0.056304931640625, -0.04857635498046875, -0.0408477783203125, -0.03311920166015625, -0.025390625, -0.01766204833984375, -0.0099334716796875, -0.00220489501953125, 0.005523681640625, 0.01325225830078125, 0.0209808349609375, 0.02870941162109375, 0.03643798828125, 0.04416656494140625, 0.0518951416015625, 0.05962371826171875, 0.067352294921875, 0.07508087158203125, 0.0828094482421875, 0.09053802490234375, 0.0982666015625, 0.10599517822265625, 0.1137237548828125, 0.12145233154296875, 0.129180908203125, 0.13690948486328125, 0.1446380615234375, 0.15236663818359375, 0.16009521484375, 0.16782379150390625, 0.1755523681640625, 0.18328094482421875, 0.191009521484375, 0.19873809814453125, 0.2064666748046875, 0.21419525146484375, 0.221923828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 5.0, 9.0, 16.0, 12.0, 22.0, 15.0, 18.0, 16.0, 19.0, 17.0, 22.0, 29.0, 40.0, 30.0, 42.0, 31.0, 48.0, 34.0, 54.0, 46.0, 45.0, 29.0, 43.0, 33.0, 28.0, 30.0, 51.0, 37.0, 22.0, 20.0, 28.0, 21.0, 10.0, 11.0, 18.0, 8.0, 8.0, 3.0, 1.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.330810546875, -0.3211669921875, -0.3115234375, -0.3018798828125, -0.292236328125, -0.2825927734375, -0.27294921875, -0.2633056640625, -0.253662109375, -0.2440185546875, -0.234375, -0.2247314453125, -0.215087890625, -0.2054443359375, -0.19580078125, -0.1861572265625, -0.176513671875, -0.1668701171875, -0.1572265625, -0.1475830078125, -0.137939453125, -0.1282958984375, -0.11865234375, -0.1090087890625, -0.099365234375, -0.0897216796875, -0.080078125, -0.0704345703125, -0.060791015625, -0.0511474609375, -0.04150390625, -0.0318603515625, -0.022216796875, -0.0125732421875, -0.0029296875, 0.0067138671875, 0.016357421875, 0.0260009765625, 0.03564453125, 0.0452880859375, 0.054931640625, 0.0645751953125, 0.07421875, 0.0838623046875, 0.093505859375, 0.1031494140625, 0.11279296875, 0.1224365234375, 0.132080078125, 0.1417236328125, 0.1513671875, 0.1610107421875, 0.170654296875, 0.1802978515625, 0.18994140625, 0.1995849609375, 0.209228515625, 0.2188720703125, 0.228515625, 0.2381591796875, 0.247802734375, 0.2574462890625, 0.26708984375, 0.2767333984375, 0.286376953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 10.0, 12.0, 11.0, 20.0, 23.0, 43.0, 70.0, 92.0, 215.0, 327.0, 666.0, 1409.0, 3569.0, 10264.0, 38001.0, 312376.0, 601746.0, 57441.0, 13933.0, 4665.0, 1831.0, 854.0, 446.0, 212.0, 123.0, 74.0, 33.0, 34.0, 18.0, 13.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12773609161376953, -0.12388038635253906, -0.1200246810913086, -0.11616897583007812, -0.11231327056884766, -0.10845756530761719, -0.10460186004638672, -0.10074615478515625, -0.09689044952392578, -0.09303474426269531, -0.08917903900146484, -0.08532333374023438, -0.0814676284790039, -0.07761192321777344, -0.07375621795654297, -0.0699005126953125, -0.06604480743408203, -0.06218910217285156, -0.058333396911621094, -0.054477691650390625, -0.050621986389160156, -0.04676628112792969, -0.04291057586669922, -0.03905487060546875, -0.03519916534423828, -0.03134346008300781, -0.027487754821777344, -0.023632049560546875, -0.019776344299316406, -0.015920639038085938, -0.012064933776855469, -0.008209228515625, -0.004353523254394531, -0.0004978179931640625, 0.0033578872680664062, 0.007213592529296875, 0.011069297790527344, 0.014925003051757812, 0.01878070831298828, 0.02263641357421875, 0.02649211883544922, 0.030347824096679688, 0.034203529357910156, 0.038059234619140625, 0.041914939880371094, 0.04577064514160156, 0.04962635040283203, 0.0534820556640625, 0.05733776092529297, 0.06119346618652344, 0.0650491714477539, 0.06890487670898438, 0.07276058197021484, 0.07661628723144531, 0.08047199249267578, 0.08432769775390625, 0.08818340301513672, 0.09203910827636719, 0.09589481353759766, 0.09975051879882812, 0.1036062240600586, 0.10746192932128906, 0.11131763458251953, 0.11517333984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 22.0, 9.0, 10.0, 16.0, 24.0, 35.0, 23.0, 31.0, 43.0, 77.0, 114.0, 132.0, 120.0, 75.0, 60.0, 50.0, 38.0, 28.0, 19.0, 20.0, 14.0, 5.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5849552154541016e-05, -5.3017400205135345e-05, -5.0185248255729675e-05, -4.7353096306324005e-05, -4.4520944356918335e-05, -4.1688792407512665e-05, -3.8856640458106995e-05, -3.6024488508701324e-05, -3.3192336559295654e-05, -3.0360184609889984e-05, -2.7528032660484314e-05, -2.4695880711078644e-05, -2.1863728761672974e-05, -1.9031576812267303e-05, -1.6199424862861633e-05, -1.3367272913455963e-05, -1.0535120964050293e-05, -7.702969014644623e-06, -4.870817065238953e-06, -2.0386651158332825e-06, 7.934868335723877e-07, 3.625638782978058e-06, 6.457790732383728e-06, 9.289942681789398e-06, 1.2122094631195068e-05, 1.4954246580600739e-05, 1.778639853000641e-05, 2.061855047941208e-05, 2.345070242881775e-05, 2.628285437822342e-05, 2.911500632762909e-05, 3.194715827703476e-05, 3.477931022644043e-05, 3.76114621758461e-05, 4.044361412525177e-05, 4.327576607465744e-05, 4.610791802406311e-05, 4.894006997346878e-05, 5.177222192287445e-05, 5.460437387228012e-05, 5.743652582168579e-05, 6.026867777109146e-05, 6.310082972049713e-05, 6.59329816699028e-05, 6.876513361930847e-05, 7.159728556871414e-05, 7.442943751811981e-05, 7.726158946752548e-05, 8.009374141693115e-05, 8.292589336633682e-05, 8.575804531574249e-05, 8.859019726514816e-05, 9.142234921455383e-05, 9.42545011639595e-05, 9.708665311336517e-05, 9.991880506277084e-05, 0.00010275095701217651, 0.00010558310896158218, 0.00010841526091098785, 0.00011124741286039352, 0.0001140795648097992, 0.00011691171675920486, 0.00011974386870861053, 0.0001225760206580162, 0.00012540817260742188]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 3.0, 10.0, 10.0, 20.0, 20.0, 35.0, 50.0, 72.0, 96.0, 166.0, 322.0, 606.0, 1293.0, 2860.0, 7074.0, 20673.0, 74122.0, 415575.0, 417245.0, 74435.0, 20885.0, 7341.0, 2836.0, 1280.0, 635.0, 338.0, 189.0, 126.0, 78.0, 45.0, 33.0, 21.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.105712890625, -0.10277652740478516, -0.09984016418457031, -0.09690380096435547, -0.09396743774414062, -0.09103107452392578, -0.08809471130371094, -0.0851583480834961, -0.08222198486328125, -0.0792856216430664, -0.07634925842285156, -0.07341289520263672, -0.07047653198242188, -0.06754016876220703, -0.06460380554199219, -0.061667442321777344, -0.0587310791015625, -0.055794715881347656, -0.05285835266113281, -0.04992198944091797, -0.046985626220703125, -0.04404926300048828, -0.04111289978027344, -0.038176536560058594, -0.03524017333984375, -0.032303810119628906, -0.029367446899414062, -0.02643108367919922, -0.023494720458984375, -0.02055835723876953, -0.017621994018554688, -0.014685630798339844, -0.011749267578125, -0.008812904357910156, -0.0058765411376953125, -0.0029401779174804688, -3.814697265625e-06, 0.0029325485229492188, 0.0058689117431640625, 0.008805274963378906, 0.01174163818359375, 0.014678001403808594, 0.017614364624023438, 0.02055072784423828, 0.023487091064453125, 0.02642345428466797, 0.029359817504882812, 0.032296180725097656, 0.0352325439453125, 0.038168907165527344, 0.04110527038574219, 0.04404163360595703, 0.046977996826171875, 0.04991436004638672, 0.05285072326660156, 0.055787086486816406, 0.05872344970703125, 0.061659812927246094, 0.06459617614746094, 0.06753253936767578, 0.07046890258789062, 0.07340526580810547, 0.07634162902832031, 0.07927799224853516, 0.08221435546875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 4.0, 13.0, 19.0, 28.0, 25.0, 34.0, 52.0, 66.0, 92.0, 110.0, 139.0, 107.0, 80.0, 55.0, 57.0, 30.0, 29.0, 15.0, 9.0, 11.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.0774688720703125, -0.073638916015625, -0.0698089599609375, -0.06597900390625, -0.0621490478515625, -0.058319091796875, -0.0544891357421875, -0.0506591796875, -0.0468292236328125, -0.042999267578125, -0.0391693115234375, -0.03533935546875, -0.0315093994140625, -0.027679443359375, -0.0238494873046875, -0.02001953125, -0.0161895751953125, -0.012359619140625, -0.0085296630859375, -0.00469970703125, -0.0008697509765625, 0.002960205078125, 0.0067901611328125, 0.0106201171875, 0.0144500732421875, 0.018280029296875, 0.0221099853515625, 0.02593994140625, 0.0297698974609375, 0.033599853515625, 0.0374298095703125, 0.041259765625, 0.0450897216796875, 0.048919677734375, 0.0527496337890625, 0.05657958984375, 0.0604095458984375, 0.064239501953125, 0.0680694580078125, 0.0718994140625, 0.0757293701171875, 0.079559326171875, 0.0833892822265625, 0.08721923828125, 0.0910491943359375, 0.094879150390625, 0.0987091064453125, 0.1025390625, 0.1063690185546875, 0.110198974609375, 0.1140289306640625, 0.11785888671875, 0.1216888427734375, 0.125518798828125, 0.1293487548828125, 0.1331787109375, 0.1370086669921875, 0.140838623046875, 0.1446685791015625, 0.14849853515625, 0.1523284912109375, 0.156158447265625, 0.1599884033203125, 0.163818359375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 14.0, 62.0, 150.0, 400.0, 267.0, 94.0, 17.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.028061866760254, -0.8768825531005859, -0.7257032990455627, -0.5745240449905396, -0.4233447313308716, -0.2721654176712036, -0.12098616361618042, 0.030193090438842773, 0.18137240409851074, 0.3325516879558563, 0.4837309718132019, 0.6349102258682251, 0.7860895395278931, 0.937268853187561, 1.0884480476379395, 1.2396273612976074, 1.3908066749572754, 1.5419859886169434, 1.6931653022766113, 1.8443444967269897, 1.9955238103866577, 2.1467032432556152, 2.297882318496704, 2.449061632156372, 2.60024094581604, 2.751420259475708, 2.902599573135376, 3.053778886795044, 3.204957962036133, 3.356137275695801, 3.5073165893554688, 3.6584959030151367, 3.8096752166748047, 3.9608545303344727, 4.112033843994141, 4.263213157653809, 4.414392471313477, 4.5655717849731445, 4.7167510986328125, 4.8679304122924805, 5.019109725952148, 5.170289039611816, 5.321468353271484, 5.472647666931152, 5.62382698059082, 5.775006294250488, 5.926185607910156, 6.077364921569824, 6.228543758392334, 6.379723072052002, 6.53090238571167, 6.682081699371338, 6.833261013031006, 6.984440326690674, 7.135619640350342, 7.286798477172852, 7.4379777908325195, 7.5891571044921875, 7.7403364181518555, 7.891515731811523, 8.042695045471191, 8.19387435913086, 8.345053672790527, 8.496232986450195, 8.647412300109863]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 11.0, 4.0, 10.0, 10.0, 10.0, 12.0, 18.0, 15.0, 22.0, 28.0, 20.0, 28.0, 34.0, 25.0, 49.0, 40.0, 29.0, 37.0, 44.0, 48.0, 38.0, 46.0, 45.0, 30.0, 45.0, 36.0, 35.0, 28.0, 26.0, 39.0, 30.0, 22.0, 17.0, 11.0, 9.0, 17.0, 8.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5384279489517212, -1.4869585037231445, -1.4354890584945679, -1.3840196132659912, -1.3325501680374146, -1.281080722808838, -1.2296111583709717, -1.1781418323516846, -1.1266722679138184, -1.0752028226852417, -1.023733377456665, -0.9722639322280884, -0.9207944869995117, -0.8693250417709351, -0.8178555369377136, -0.766386091709137, -0.7149167060852051, -0.6634472608566284, -0.6119778156280518, -0.5605083703994751, -0.5090389251708984, -0.4575694501399994, -0.40609997510910034, -0.3546305298805237, -0.303161084651947, -0.25169163942337036, -0.2002221792936325, -0.14875271916389465, -0.097283273935318, -0.04581382870674133, 0.005655646324157715, 0.057125091552734375, 0.10859441757202148, 0.16006386280059814, 0.211533322930336, 0.26300278306007385, 0.3144722282886505, 0.3659416735172272, 0.4174111485481262, 0.4688805937767029, 0.5203500390052795, 0.5718194842338562, 0.6232889294624329, 0.6747584342956543, 0.726227879524231, 0.7776973247528076, 0.8291667699813843, 0.8806362152099609, 0.9321056604385376, 0.9835751056671143, 1.035044550895691, 1.0865139961242676, 1.1379834413528442, 1.189452886581421, 1.240922451019287, 1.2923917770385742, 1.3438613414764404, 1.395330786705017, 1.4468002319335938, 1.4982696771621704, 1.549739122390747, 1.6012085676193237, 1.6526780128479004, 1.7041475772857666, 1.7556169033050537]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 13.0, 12.0, 14.0, 13.0, 24.0, 22.0, 28.0, 40.0, 57.0, 79.0, 105.0, 158.0, 194.0, 333.0, 618.0, 1136.0, 1845.0, 3949.0, 9611.0, 33717.0, 3206375.0, 889245.0, 29866.0, 8674.0, 3703.0, 1861.0, 921.0, 575.0, 386.0, 204.0, 135.0, 100.0, 71.0, 45.0, 35.0, 30.0, 22.0, 13.0, 17.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0], "bins": [-0.2939453125, -0.2865886688232422, -0.2792320251464844, -0.27187538146972656, -0.26451873779296875, -0.25716209411621094, -0.24980545043945312, -0.2424488067626953, -0.2350921630859375, -0.2277355194091797, -0.22037887573242188, -0.21302223205566406, -0.20566558837890625, -0.19830894470214844, -0.19095230102539062, -0.1835956573486328, -0.176239013671875, -0.1688823699951172, -0.16152572631835938, -0.15416908264160156, -0.14681243896484375, -0.13945579528808594, -0.13209915161132812, -0.12474250793457031, -0.1173858642578125, -0.11002922058105469, -0.10267257690429688, -0.09531593322753906, -0.08795928955078125, -0.08060264587402344, -0.07324600219726562, -0.06588935852050781, -0.05853271484375, -0.05117607116699219, -0.043819427490234375, -0.03646278381347656, -0.02910614013671875, -0.021749496459960938, -0.014392852783203125, -0.0070362091064453125, 0.0003204345703125, 0.0076770782470703125, 0.015033721923828125, 0.022390365600585938, 0.02974700927734375, 0.03710365295410156, 0.044460296630859375, 0.05181694030761719, 0.059173583984375, 0.06653022766113281, 0.07388687133789062, 0.08124351501464844, 0.08860015869140625, 0.09595680236816406, 0.10331344604492188, 0.11067008972167969, 0.1180267333984375, 0.1253833770751953, 0.13274002075195312, 0.14009666442871094, 0.14745330810546875, 0.15480995178222656, 0.16216659545898438, 0.1695232391357422, 0.1768798828125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 17.0, 24.0, 25.0, 29.0, 40.0, 48.0, 38.0, 58.0, 75.0, 67.0, 69.0, 56.0, 72.0, 85.0, 57.0, 40.0, 51.0, 26.0, 24.0, 16.0, 18.0, 14.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1748046875, -0.17061710357666016, -0.1664295196533203, -0.16224193572998047, -0.15805435180664062, -0.15386676788330078, -0.14967918395996094, -0.1454916000366211, -0.14130401611328125, -0.1371164321899414, -0.13292884826660156, -0.12874126434326172, -0.12455368041992188, -0.12036609649658203, -0.11617851257324219, -0.11199092864990234, -0.1078033447265625, -0.10361576080322266, -0.09942817687988281, -0.09524059295654297, -0.09105300903320312, -0.08686542510986328, -0.08267784118652344, -0.0784902572631836, -0.07430267333984375, -0.0701150894165039, -0.06592750549316406, -0.06173992156982422, -0.057552337646484375, -0.05336475372314453, -0.04917716979980469, -0.044989585876464844, -0.040802001953125, -0.036614418029785156, -0.03242683410644531, -0.02823925018310547, -0.024051666259765625, -0.01986408233642578, -0.015676498413085938, -0.011488914489746094, -0.00730133056640625, -0.0031137466430664062, 0.0010738372802734375, 0.005261421203613281, 0.009449005126953125, 0.013636589050292969, 0.017824172973632812, 0.022011756896972656, 0.0261993408203125, 0.030386924743652344, 0.03457450866699219, 0.03876209259033203, 0.042949676513671875, 0.04713726043701172, 0.05132484436035156, 0.055512428283691406, 0.05970001220703125, 0.0638875961303711, 0.06807518005371094, 0.07226276397705078, 0.07645034790039062, 0.08063793182373047, 0.08482551574707031, 0.08901309967041016, 0.09320068359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 4.0, 9.0, 13.0, 15.0, 25.0, 52.0, 50.0, 106.0, 156.0, 265.0, 489.0, 859.0, 1601.0, 3082.0, 6960.0, 24987.0, 1295279.0, 2819737.0, 26576.0, 7230.0, 3065.0, 1612.0, 899.0, 493.0, 296.0, 176.0, 81.0, 62.0, 35.0, 15.0, 18.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17724609375, -0.17016220092773438, -0.16307830810546875, -0.15599441528320312, -0.1489105224609375, -0.14182662963867188, -0.13474273681640625, -0.12765884399414062, -0.120574951171875, -0.11349105834960938, -0.10640716552734375, -0.09932327270507812, -0.0922393798828125, -0.08515548706054688, -0.07807159423828125, -0.07098770141601562, -0.06390380859375, -0.056819915771484375, -0.04973602294921875, -0.042652130126953125, -0.0355682373046875, -0.028484344482421875, -0.02140045166015625, -0.014316558837890625, -0.007232666015625, -0.000148773193359375, 0.00693511962890625, 0.014019012451171875, 0.0211029052734375, 0.028186798095703125, 0.03527069091796875, 0.042354583740234375, 0.0494384765625, 0.056522369384765625, 0.06360626220703125, 0.07069015502929688, 0.0777740478515625, 0.08485794067382812, 0.09194183349609375, 0.09902572631835938, 0.106109619140625, 0.11319351196289062, 0.12027740478515625, 0.12736129760742188, 0.1344451904296875, 0.14152908325195312, 0.14861297607421875, 0.15569686889648438, 0.16278076171875, 0.16986465454101562, 0.17694854736328125, 0.18403244018554688, 0.1911163330078125, 0.19820022583007812, 0.20528411865234375, 0.21236801147460938, 0.219451904296875, 0.22653579711914062, 0.23361968994140625, 0.24070358276367188, 0.2477874755859375, 0.2548713684082031, 0.26195526123046875, 0.2690391540527344, 0.276123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 13.0, 14.0, 23.0, 50.0, 89.0, 676.0, 2880.0, 141.0, 60.0, 37.0, 23.0, 13.0, 8.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1478271484375, -0.14308929443359375, -0.1383514404296875, -0.13361358642578125, -0.128875732421875, -0.12413787841796875, -0.1194000244140625, -0.11466217041015625, -0.10992431640625, -0.10518646240234375, -0.1004486083984375, -0.09571075439453125, -0.090972900390625, -0.08623504638671875, -0.0814971923828125, -0.07675933837890625, -0.072021484375, -0.06728363037109375, -0.0625457763671875, -0.05780792236328125, -0.053070068359375, -0.04833221435546875, -0.0435943603515625, -0.03885650634765625, -0.03411865234375, -0.02938079833984375, -0.0246429443359375, -0.01990509033203125, -0.015167236328125, -0.01042938232421875, -0.0056915283203125, -0.00095367431640625, 0.0037841796875, 0.00852203369140625, 0.0132598876953125, 0.01799774169921875, 0.022735595703125, 0.02747344970703125, 0.0322113037109375, 0.03694915771484375, 0.04168701171875, 0.04642486572265625, 0.0511627197265625, 0.05590057373046875, 0.060638427734375, 0.06537628173828125, 0.0701141357421875, 0.07485198974609375, 0.07958984375, 0.08432769775390625, 0.0890655517578125, 0.09380340576171875, 0.098541259765625, 0.10327911376953125, 0.1080169677734375, 0.11275482177734375, 0.11749267578125, 0.12223052978515625, 0.1269683837890625, 0.13170623779296875, 0.136444091796875, 0.14118194580078125, 0.1459197998046875, 0.15065765380859375, 0.1553955078125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 65.0, 778.0, 141.0, 18.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8055806756019592, -0.7213149666786194, -0.6370493173599243, -0.5527836084365845, -0.46851789951324463, -0.3842521905899048, -0.2999865412712097, -0.21572083234786987, -0.13145512342453003, -0.04718942940235138, 0.03707626461982727, 0.12134194374084473, 0.20560765266418457, 0.2898733615875244, 0.3741390109062195, 0.4584047198295593, 0.5426704287528992, 0.626936137676239, 0.7112017869949341, 0.7954674959182739, 0.8797332048416138, 0.9639989137649536, 1.048264503479004, 1.1325302124023438, 1.2167959213256836, 1.3010616302490234, 1.3853273391723633, 1.4695930480957031, 1.553858757019043, 1.6381244659423828, 1.722390055656433, 1.806655764579773, 1.8909215927124023, 1.9751873016357422, 2.059453010559082, 2.143718719482422, 2.2279844284057617, 2.3122501373291016, 2.3965158462524414, 2.4807815551757812, 2.565047264099121, 2.649312973022461, 2.733578681945801, 2.8178443908691406, 2.9021100997924805, 2.9863758087158203, 3.07064151763916, 3.1549072265625, 3.2391726970672607, 3.3234384059906006, 3.4077041149139404, 3.4919698238372803, 3.57623553276062, 3.66050124168396, 3.7447667121887207, 3.8290324211120605, 3.9132981300354004, 3.9975638389587402, 4.08182954788208, 4.16609525680542, 4.25036096572876, 4.3346266746521, 4.4188923835754395, 4.503158092498779, 4.587423801422119]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 10.0, 11.0, 25.0, 31.0, 39.0, 41.0, 60.0, 65.0, 52.0, 75.0, 70.0, 69.0, 77.0, 67.0, 48.0, 63.0, 53.0, 28.0, 29.0, 20.0, 17.0, 11.0, 11.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3940753936767578, -0.3810008764266968, -0.36792638897895813, -0.3548518717288971, -0.34177735447883606, -0.3287028670310974, -0.3156283497810364, -0.30255383253097534, -0.2894793152809143, -0.27640479803085327, -0.2633303105831146, -0.2502557933330536, -0.23718127608299255, -0.2241067737340927, -0.21103227138519287, -0.19795775413513184, -0.1848832666873932, -0.17180876433849335, -0.1587342470884323, -0.14565974473953247, -0.13258522748947144, -0.1195107251405716, -0.10643622279167175, -0.09336171299219131, -0.08028720319271088, -0.06721269339323044, -0.0541381873190403, -0.04106368124485016, -0.02798917144536972, -0.014914661645889282, -0.001840159296989441, 0.011234350502490997, 0.024308860301971436, 0.037383370101451874, 0.050457876175642014, 0.06353238224983215, 0.07660689204931259, 0.08968140184879303, 0.10275590419769287, 0.11583041399717331, 0.12890492379665375, 0.1419794261455536, 0.15505394339561462, 0.16812844574451447, 0.1812029480934143, 0.19427746534347534, 0.20735196769237518, 0.22042647004127502, 0.23350098729133606, 0.2465754896402359, 0.25964999198913574, 0.2727245092391968, 0.2857990264892578, 0.29887354373931885, 0.3119480311870575, 0.32502254843711853, 0.3380970358848572, 0.3511715531349182, 0.36424604058265686, 0.3773205578327179, 0.39039507508277893, 0.4034695625305176, 0.4165440797805786, 0.42961859703063965, 0.4426931142807007]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 9.0, 26.0, 40.0, 55.0, 104.0, 188.0, 463.0, 1272.0, 3900.0, 14619.0, 70514.0, 523064.0, 366492.0, 51584.0, 11346.0, 3079.0, 1028.0, 386.0, 172.0, 79.0, 48.0, 16.0, 17.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.371826171875, -0.36250877380371094, -0.3531913757324219, -0.3438739776611328, -0.33455657958984375, -0.3252391815185547, -0.3159217834472656, -0.30660438537597656, -0.2972869873046875, -0.28796958923339844, -0.2786521911621094, -0.2693347930908203, -0.26001739501953125, -0.2506999969482422, -0.24138259887695312, -0.23206520080566406, -0.222747802734375, -0.21343040466308594, -0.20411300659179688, -0.1947956085205078, -0.18547821044921875, -0.1761608123779297, -0.16684341430664062, -0.15752601623535156, -0.1482086181640625, -0.13889122009277344, -0.12957382202148438, -0.12025642395019531, -0.11093902587890625, -0.10162162780761719, -0.09230422973632812, -0.08298683166503906, -0.07366943359375, -0.06435203552246094, -0.055034637451171875, -0.04571723937988281, -0.03639984130859375, -0.027082443237304688, -0.017765045166015625, -0.008447647094726562, 0.0008697509765625, 0.010187149047851562, 0.019504547119140625, 0.028821945190429688, 0.03813934326171875, 0.04745674133300781, 0.056774139404296875, 0.06609153747558594, 0.075408935546875, 0.08472633361816406, 0.09404373168945312, 0.10336112976074219, 0.11267852783203125, 0.12199592590332031, 0.13131332397460938, 0.14063072204589844, 0.1499481201171875, 0.15926551818847656, 0.16858291625976562, 0.1779003143310547, 0.18721771240234375, 0.1965351104736328, 0.20585250854492188, 0.21516990661621094, 0.2244873046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 5.0, 15.0, 11.0, 35.0, 23.0, 31.0, 34.0, 39.0, 58.0, 51.0, 62.0, 81.0, 67.0, 61.0, 74.0, 77.0, 59.0, 46.0, 27.0, 35.0, 25.0, 14.0, 17.0, 15.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.171142578125, -0.16692733764648438, -0.16271209716796875, -0.15849685668945312, -0.1542816162109375, -0.15006637573242188, -0.14585113525390625, -0.14163589477539062, -0.137420654296875, -0.13320541381835938, -0.12899017333984375, -0.12477493286132812, -0.1205596923828125, -0.11634445190429688, -0.11212921142578125, -0.10791397094726562, -0.10369873046875, -0.09948348999023438, -0.09526824951171875, -0.09105300903320312, -0.0868377685546875, -0.08262252807617188, -0.07840728759765625, -0.07419204711914062, -0.069976806640625, -0.06576156616210938, -0.06154632568359375, -0.057331085205078125, -0.0531158447265625, -0.048900604248046875, -0.04468536376953125, -0.040470123291015625, -0.0362548828125, -0.032039642333984375, -0.02782440185546875, -0.023609161376953125, -0.0193939208984375, -0.015178680419921875, -0.01096343994140625, -0.006748199462890625, -0.002532958984375, 0.001682281494140625, 0.00589752197265625, 0.010112762451171875, 0.0143280029296875, 0.018543243408203125, 0.02275848388671875, 0.026973724365234375, 0.03118896484375, 0.035404205322265625, 0.03961944580078125, 0.043834686279296875, 0.0480499267578125, 0.052265167236328125, 0.05648040771484375, 0.060695648193359375, 0.064910888671875, 0.06912612915039062, 0.07334136962890625, 0.07755661010742188, 0.0817718505859375, 0.08598709106445312, 0.09020233154296875, 0.09441757202148438, 0.0986328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 14.0, 15.0, 24.0, 20.0, 40.0, 52.0, 67.0, 83.0, 95.0, 149.0, 285.0, 487.0, 1242.0, 5165.0, 29484.0, 359840.0, 599026.0, 42496.0, 6896.0, 1537.0, 550.0, 295.0, 186.0, 133.0, 92.0, 62.0, 56.0, 33.0, 27.0, 23.0, 16.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3753776550292969, -0.36525726318359375, -0.3551368713378906, -0.3450164794921875, -0.3348960876464844, -0.32477569580078125, -0.3146553039550781, -0.304534912109375, -0.2944145202636719, -0.28429412841796875, -0.2741737365722656, -0.2640533447265625, -0.2539329528808594, -0.24381256103515625, -0.23369216918945312, -0.22357177734375, -0.21345138549804688, -0.20333099365234375, -0.19321060180664062, -0.1830902099609375, -0.17296981811523438, -0.16284942626953125, -0.15272903442382812, -0.142608642578125, -0.13248825073242188, -0.12236785888671875, -0.11224746704101562, -0.1021270751953125, -0.09200668334960938, -0.08188629150390625, -0.07176589965820312, -0.0616455078125, -0.051525115966796875, -0.04140472412109375, -0.031284332275390625, -0.0211639404296875, -0.011043548583984375, -0.00092315673828125, 0.009197235107421875, 0.019317626953125, 0.029438018798828125, 0.03955841064453125, 0.049678802490234375, 0.0597991943359375, 0.06991958618164062, 0.08003997802734375, 0.09016036987304688, 0.10028076171875, 0.11040115356445312, 0.12052154541015625, 0.13064193725585938, 0.1407623291015625, 0.15088272094726562, 0.16100311279296875, 0.17112350463867188, 0.181243896484375, 0.19136428833007812, 0.20148468017578125, 0.21160507202148438, 0.2217254638671875, 0.23184585571289062, 0.24196624755859375, 0.2520866394042969, 0.26220703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 6.0, 6.0, 5.0, 17.0, 2.0, 10.0, 10.0, 15.0, 15.0, 30.0, 20.0, 24.0, 24.0, 32.0, 28.0, 35.0, 27.0, 40.0, 37.0, 49.0, 32.0, 42.0, 48.0, 42.0, 33.0, 37.0, 24.0, 30.0, 29.0, 24.0, 24.0, 20.0, 28.0, 25.0, 18.0, 14.0, 14.0, 2.0, 12.0, 8.0, 7.0, 8.0, 8.0, 4.0, 7.0, 4.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.328125, -0.3183135986328125, -0.308502197265625, -0.2986907958984375, -0.28887939453125, -0.2790679931640625, -0.269256591796875, -0.2594451904296875, -0.2496337890625, -0.2398223876953125, -0.230010986328125, -0.2201995849609375, -0.21038818359375, -0.2005767822265625, -0.190765380859375, -0.1809539794921875, -0.171142578125, -0.1613311767578125, -0.151519775390625, -0.1417083740234375, -0.13189697265625, -0.1220855712890625, -0.112274169921875, -0.1024627685546875, -0.0926513671875, -0.0828399658203125, -0.073028564453125, -0.0632171630859375, -0.05340576171875, -0.0435943603515625, -0.033782958984375, -0.0239715576171875, -0.01416015625, -0.0043487548828125, 0.005462646484375, 0.0152740478515625, 0.02508544921875, 0.0348968505859375, 0.044708251953125, 0.0545196533203125, 0.0643310546875, 0.0741424560546875, 0.083953857421875, 0.0937652587890625, 0.10357666015625, 0.1133880615234375, 0.123199462890625, 0.1330108642578125, 0.142822265625, 0.1526336669921875, 0.162445068359375, 0.1722564697265625, 0.18206787109375, 0.1918792724609375, 0.201690673828125, 0.2115020751953125, 0.2213134765625, 0.2311248779296875, 0.240936279296875, 0.2507476806640625, 0.26055908203125, 0.2703704833984375, 0.280181884765625, 0.2899932861328125, 0.2998046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 14.0, 17.0, 43.0, 43.0, 43.0, 73.0, 133.0, 212.0, 306.0, 523.0, 759.0, 1376.0, 2532.0, 5005.0, 10865.0, 31268.0, 232107.0, 679824.0, 53790.0, 15404.0, 6683.0, 3149.0, 1724.0, 995.0, 618.0, 363.0, 213.0, 133.0, 108.0, 65.0, 47.0, 34.0, 18.0, 17.0, 10.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10758113861083984, -0.10401725769042969, -0.10045337677001953, -0.09688949584960938, -0.09332561492919922, -0.08976173400878906, -0.0861978530883789, -0.08263397216796875, -0.0790700912475586, -0.07550621032714844, -0.07194232940673828, -0.06837844848632812, -0.06481456756591797, -0.06125068664550781, -0.057686805725097656, -0.0541229248046875, -0.050559043884277344, -0.04699516296386719, -0.04343128204345703, -0.039867401123046875, -0.03630352020263672, -0.03273963928222656, -0.029175758361816406, -0.02561187744140625, -0.022047996520996094, -0.018484115600585938, -0.014920234680175781, -0.011356353759765625, -0.007792472839355469, -0.0042285919189453125, -0.0006647109985351562, 0.002899169921875, 0.006463050842285156, 0.010026931762695312, 0.013590812683105469, 0.017154693603515625, 0.02071857452392578, 0.024282455444335938, 0.027846336364746094, 0.03141021728515625, 0.034974098205566406, 0.03853797912597656, 0.04210186004638672, 0.045665740966796875, 0.04922962188720703, 0.05279350280761719, 0.056357383728027344, 0.0599212646484375, 0.06348514556884766, 0.06704902648925781, 0.07061290740966797, 0.07417678833007812, 0.07774066925048828, 0.08130455017089844, 0.0848684310913086, 0.08843231201171875, 0.0919961929321289, 0.09556007385253906, 0.09912395477294922, 0.10268783569335938, 0.10625171661376953, 0.10981559753417969, 0.11337947845458984, 0.116943359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 2.0, 8.0, 9.0, 10.0, 10.0, 21.0, 19.0, 29.0, 28.0, 38.0, 41.0, 66.0, 70.0, 82.0, 83.0, 101.0, 76.0, 63.0, 52.0, 40.0, 32.0, 28.0, 22.0, 16.0, 10.0, 11.0, 10.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.89897346496582e-05, -8.60951840877533e-05, -8.320063352584839e-05, -8.030608296394348e-05, -7.741153240203857e-05, -7.451698184013367e-05, -7.162243127822876e-05, -6.872788071632385e-05, -6.583333015441895e-05, -6.293877959251404e-05, -6.004422903060913e-05, -5.7149678468704224e-05, -5.4255127906799316e-05, -5.136057734489441e-05, -4.84660267829895e-05, -4.5571476221084595e-05, -4.267692565917969e-05, -3.978237509727478e-05, -3.688782453536987e-05, -3.3993273973464966e-05, -3.109872341156006e-05, -2.820417284965515e-05, -2.5309622287750244e-05, -2.2415071725845337e-05, -1.952052116394043e-05, -1.6625970602035522e-05, -1.3731420040130615e-05, -1.0836869478225708e-05, -7.9423189163208e-06, -5.0477683544158936e-06, -2.1532177925109863e-06, 7.413327693939209e-07, 3.635883331298828e-06, 6.530433893203735e-06, 9.424984455108643e-06, 1.231953501701355e-05, 1.5214085578918457e-05, 1.8108636140823364e-05, 2.100318670272827e-05, 2.389773726463318e-05, 2.6792287826538086e-05, 2.9686838388442993e-05, 3.25813889503479e-05, 3.547593951225281e-05, 3.8370490074157715e-05, 4.126504063606262e-05, 4.415959119796753e-05, 4.7054141759872437e-05, 4.9948692321777344e-05, 5.284324288368225e-05, 5.573779344558716e-05, 5.8632344007492065e-05, 6.152689456939697e-05, 6.442144513130188e-05, 6.731599569320679e-05, 7.02105462551117e-05, 7.31050968170166e-05, 7.599964737892151e-05, 7.889419794082642e-05, 8.178874850273132e-05, 8.468329906463623e-05, 8.757784962654114e-05, 9.047240018844604e-05, 9.336695075035095e-05, 9.626150131225586e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 14.0, 19.0, 16.0, 26.0, 44.0, 79.0, 113.0, 189.0, 305.0, 567.0, 957.0, 1631.0, 3173.0, 7040.0, 20140.0, 110660.0, 778897.0, 92848.0, 18414.0, 6488.0, 3046.0, 1615.0, 917.0, 586.0, 290.0, 171.0, 115.0, 73.0, 53.0, 18.0, 20.0, 12.0, 10.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1376953125, -0.1340198516845703, -0.13034439086914062, -0.12666893005371094, -0.12299346923828125, -0.11931800842285156, -0.11564254760742188, -0.11196708679199219, -0.1082916259765625, -0.10461616516113281, -0.10094070434570312, -0.09726524353027344, -0.09358978271484375, -0.08991432189941406, -0.08623886108398438, -0.08256340026855469, -0.078887939453125, -0.07521247863769531, -0.07153701782226562, -0.06786155700683594, -0.06418609619140625, -0.06051063537597656, -0.056835174560546875, -0.05315971374511719, -0.0494842529296875, -0.04580879211425781, -0.042133331298828125, -0.03845787048339844, -0.03478240966796875, -0.031106948852539062, -0.027431488037109375, -0.023756027221679688, -0.02008056640625, -0.016405105590820312, -0.012729644775390625, -0.009054183959960938, -0.00537872314453125, -0.0017032623291015625, 0.001972198486328125, 0.0056476593017578125, 0.0093231201171875, 0.012998580932617188, 0.016674041748046875, 0.020349502563476562, 0.02402496337890625, 0.027700424194335938, 0.031375885009765625, 0.03505134582519531, 0.038726806640625, 0.04240226745605469, 0.046077728271484375, 0.04975318908691406, 0.05342864990234375, 0.05710411071777344, 0.060779571533203125, 0.06445503234863281, 0.0681304931640625, 0.07180595397949219, 0.07548141479492188, 0.07915687561035156, 0.08283233642578125, 0.08650779724121094, 0.09018325805664062, 0.09385871887207031, 0.0975341796875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 5.0, 7.0, 14.0, 15.0, 23.0, 30.0, 56.0, 70.0, 118.0, 153.0, 153.0, 114.0, 82.0, 50.0, 26.0, 16.0, 12.0, 11.0, 3.0, 10.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.13057327270507812, -0.12662506103515625, -0.12267684936523438, -0.1187286376953125, -0.11478042602539062, -0.11083221435546875, -0.10688400268554688, -0.102935791015625, -0.09898757934570312, -0.09503936767578125, -0.09109115600585938, -0.0871429443359375, -0.08319473266601562, -0.07924652099609375, -0.07529830932617188, -0.07135009765625, -0.06740188598632812, -0.06345367431640625, -0.059505462646484375, -0.0555572509765625, -0.051609039306640625, -0.04766082763671875, -0.043712615966796875, -0.039764404296875, -0.035816192626953125, -0.03186798095703125, -0.027919769287109375, -0.0239715576171875, -0.020023345947265625, -0.01607513427734375, -0.012126922607421875, -0.0081787109375, -0.004230499267578125, -0.00028228759765625, 0.003665924072265625, 0.0076141357421875, 0.011562347412109375, 0.01551055908203125, 0.019458770751953125, 0.023406982421875, 0.027355194091796875, 0.03130340576171875, 0.035251617431640625, 0.0391998291015625, 0.043148040771484375, 0.04709625244140625, 0.051044464111328125, 0.05499267578125, 0.058940887451171875, 0.06288909912109375, 0.06683731079101562, 0.0707855224609375, 0.07473373413085938, 0.07868194580078125, 0.08263015747070312, 0.086578369140625, 0.09052658081054688, 0.09447479248046875, 0.09842300415039062, 0.1023712158203125, 0.10631942749023438, 0.11026763916015625, 0.11421585083007812, 0.1181640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 16.0, 60.0, 116.0, 180.0, 221.0, 192.0, 97.0, 59.0, 28.0, 16.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0002601146697998, -0.9190535545349121, -0.8378469944000244, -0.7566404342651367, -0.675433874130249, -0.5942273139953613, -0.5130207538604736, -0.43181419372558594, -0.35060763359069824, -0.26940107345581055, -0.18819451332092285, -0.10698795318603516, -0.02578139305114746, 0.055425167083740234, 0.13663172721862793, 0.21783828735351562, 0.2990448474884033, 0.380251407623291, 0.4614579677581787, 0.5426645278930664, 0.6238710880279541, 0.7050776481628418, 0.7862842082977295, 0.8674907684326172, 0.9486973285675049, 1.0299038887023926, 1.1111104488372803, 1.192317008972168, 1.2735235691070557, 1.3547301292419434, 1.435936689376831, 1.5171432495117188, 1.5983495712280273, 1.679556131362915, 1.7607626914978027, 1.8419692516326904, 1.9231758117675781, 2.004382371902466, 2.0855889320373535, 2.166795492172241, 2.248002052307129, 2.3292086124420166, 2.4104151725769043, 2.491621732711792, 2.5728282928466797, 2.6540348529815674, 2.735241413116455, 2.8164479732513428, 2.8976545333862305, 2.978861093521118, 3.060067653656006, 3.1412742137908936, 3.2224807739257812, 3.303687334060669, 3.3848938941955566, 3.4661004543304443, 3.547307014465332, 3.6285135746002197, 3.7097201347351074, 3.790926694869995, 3.872133255004883, 3.9533398151397705, 4.034546375274658, 4.115753173828125, 4.196959495544434]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 13.0, 19.0, 26.0, 23.0, 25.0, 34.0, 38.0, 43.0, 53.0, 46.0, 54.0, 67.0, 52.0, 64.0, 57.0, 55.0, 57.0, 32.0, 30.0, 43.0, 25.0, 27.0, 17.0, 19.0, 10.0, 13.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.409971237182617, -2.3364856243133545, -2.263000249862671, -2.189514636993408, -2.1160292625427246, -2.042543649673462, -1.9690580368041992, -1.895572543144226, -1.822087049484253, -1.7486015558242798, -1.6751160621643066, -1.601630449295044, -1.5281449556350708, -1.4546594619750977, -1.381173849105835, -1.3076883554458618, -1.2342028617858887, -1.1607173681259155, -1.0872318744659424, -1.0137462615966797, -0.9402607679367065, -0.8667752742767334, -0.7932897210121155, -0.7198041677474976, -0.6463186740875244, -0.5728331804275513, -0.49934762716293335, -0.4258621037006378, -0.3523765802383423, -0.27889105677604675, -0.20540553331375122, -0.1319199800491333, -0.05843472480773926, 0.015050798654556274, 0.0885363221168518, 0.16202184557914734, 0.23550736904144287, 0.3089928925037384, 0.38247841596603394, 0.45596396923065186, 0.529449462890625, 0.6029349565505981, 0.6764205098152161, 0.749906063079834, 0.8233915567398071, 0.8968770503997803, 0.9703626036643982, 1.0438481569290161, 1.1173336505889893, 1.1908191442489624, 1.2643046379089355, 1.3377902507781982, 1.4112757444381714, 1.4847612380981445, 1.5582468509674072, 1.6317323446273804, 1.7052178382873535, 1.7787033319473267, 1.8521888256072998, 1.9256744384765625, 1.9991599321365356, 2.072645425796509, 2.1461310386657715, 2.219616413116455, 2.2931020259857178]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 5.0, 24.0, 36.0, 86.0, 207.0, 704.0, 5970.0, 4136410.0, 48134.0, 2064.0, 378.0, 120.0, 50.0, 27.0, 16.0, 6.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.5380859375, -0.5270500183105469, -0.5160140991210938, -0.5049781799316406, -0.4939422607421875, -0.4829063415527344, -0.47187042236328125, -0.4608345031738281, -0.449798583984375, -0.4387626647949219, -0.42772674560546875, -0.4166908264160156, -0.4056549072265625, -0.3946189880371094, -0.38358306884765625, -0.3725471496582031, -0.36151123046875, -0.3504753112792969, -0.33943939208984375, -0.3284034729003906, -0.3173675537109375, -0.3063316345214844, -0.29529571533203125, -0.2842597961425781, -0.273223876953125, -0.2621879577636719, -0.25115203857421875, -0.24011611938476562, -0.2290802001953125, -0.21804428100585938, -0.20700836181640625, -0.19597244262695312, -0.1849365234375, -0.17390060424804688, -0.16286468505859375, -0.15182876586914062, -0.1407928466796875, -0.12975692749023438, -0.11872100830078125, -0.10768508911132812, -0.096649169921875, -0.08561325073242188, -0.07457733154296875, -0.06354141235351562, -0.0525054931640625, -0.041469573974609375, -0.03043365478515625, -0.019397735595703125, -0.00836181640625, 0.002674102783203125, 0.01371002197265625, 0.024745941162109375, 0.0357818603515625, 0.046817779541015625, 0.05785369873046875, 0.06888961791992188, 0.079925537109375, 0.09096145629882812, 0.10199737548828125, 0.11303329467773438, 0.1240692138671875, 0.13510513305664062, 0.14614105224609375, 0.15717697143554688, 0.168212890625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 6.0, 12.0, 13.0, 15.0, 28.0, 25.0, 38.0, 55.0, 44.0, 60.0, 54.0, 73.0, 66.0, 68.0, 56.0, 51.0, 47.0, 51.0, 44.0, 43.0, 27.0, 29.0, 15.0, 18.0, 17.0, 13.0, 6.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.17529296875, -0.17093753814697266, -0.1665821075439453, -0.16222667694091797, -0.15787124633789062, -0.15351581573486328, -0.14916038513183594, -0.1448049545288086, -0.14044952392578125, -0.1360940933227539, -0.13173866271972656, -0.12738323211669922, -0.12302780151367188, -0.11867237091064453, -0.11431694030761719, -0.10996150970458984, -0.1056060791015625, -0.10125064849853516, -0.09689521789550781, -0.09253978729248047, -0.08818435668945312, -0.08382892608642578, -0.07947349548339844, -0.0751180648803711, -0.07076263427734375, -0.0664072036743164, -0.06205177307128906, -0.05769634246826172, -0.053340911865234375, -0.04898548126220703, -0.04463005065917969, -0.040274620056152344, -0.035919189453125, -0.031563758850097656, -0.027208328247070312, -0.02285289764404297, -0.018497467041015625, -0.014142036437988281, -0.009786605834960938, -0.005431175231933594, -0.00107574462890625, 0.0032796859741210938, 0.0076351165771484375, 0.011990547180175781, 0.016345977783203125, 0.02070140838623047, 0.025056838989257812, 0.029412269592285156, 0.0337677001953125, 0.038123130798339844, 0.04247856140136719, 0.04683399200439453, 0.051189422607421875, 0.05554485321044922, 0.05990028381347656, 0.0642557144165039, 0.06861114501953125, 0.0729665756225586, 0.07732200622558594, 0.08167743682861328, 0.08603286743164062, 0.09038829803466797, 0.09474372863769531, 0.09909915924072266, 0.10345458984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 0.0, 8.0, 6.0, 8.0, 14.0, 17.0, 22.0, 23.0, 37.0, 70.0, 79.0, 113.0, 164.0, 276.0, 371.0, 694.0, 1628.0, 5222.0, 28842.0, 3970184.0, 168437.0, 12371.0, 2989.0, 1104.0, 530.0, 340.0, 227.0, 166.0, 112.0, 61.0, 49.0, 29.0, 24.0, 23.0, 15.0, 10.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.124267578125, -0.12122058868408203, -0.11817359924316406, -0.1151266098022461, -0.11207962036132812, -0.10903263092041016, -0.10598564147949219, -0.10293865203857422, -0.09989166259765625, -0.09684467315673828, -0.09379768371582031, -0.09075069427490234, -0.08770370483398438, -0.0846567153930664, -0.08160972595214844, -0.07856273651123047, -0.0755157470703125, -0.07246875762939453, -0.06942176818847656, -0.0663747787475586, -0.06332778930664062, -0.060280799865722656, -0.05723381042480469, -0.05418682098388672, -0.05113983154296875, -0.04809284210205078, -0.04504585266113281, -0.041998863220214844, -0.038951873779296875, -0.035904884338378906, -0.03285789489746094, -0.02981090545654297, -0.026763916015625, -0.02371692657470703, -0.020669937133789062, -0.017622947692871094, -0.014575958251953125, -0.011528968811035156, -0.008481979370117188, -0.005434989929199219, -0.00238800048828125, 0.0006589889526367188, 0.0037059783935546875, 0.006752967834472656, 0.009799957275390625, 0.012846946716308594, 0.015893936157226562, 0.01894092559814453, 0.0219879150390625, 0.02503490447998047, 0.028081893920898438, 0.031128883361816406, 0.034175872802734375, 0.037222862243652344, 0.04026985168457031, 0.04331684112548828, 0.04636383056640625, 0.04941082000732422, 0.05245780944824219, 0.055504798889160156, 0.058551788330078125, 0.061598777770996094, 0.06464576721191406, 0.06769275665283203, 0.07073974609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 8.0, 6.0, 17.0, 40.0, 110.0, 3269.0, 474.0, 79.0, 31.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209503173828125, -0.02013993263244629, -0.019329547882080078, -0.018519163131713867, -0.017708778381347656, -0.016898393630981445, -0.016088008880615234, -0.015277624130249023, -0.014467239379882812, -0.013656854629516602, -0.01284646987915039, -0.01203608512878418, -0.011225700378417969, -0.010415315628051758, -0.009604930877685547, -0.008794546127319336, -0.007984161376953125, -0.007173776626586914, -0.006363391876220703, -0.005553007125854492, -0.004742622375488281, -0.00393223762512207, -0.0031218528747558594, -0.0023114681243896484, -0.0015010833740234375, -0.0006906986236572266, 0.00011968612670898438, 0.0009300708770751953, 0.0017404556274414062, 0.002550840377807617, 0.003361225128173828, 0.004171609878540039, 0.00498199462890625, 0.005792379379272461, 0.006602764129638672, 0.007413148880004883, 0.008223533630371094, 0.009033918380737305, 0.009844303131103516, 0.010654687881469727, 0.011465072631835938, 0.012275457382202148, 0.01308584213256836, 0.01389622688293457, 0.014706611633300781, 0.015516996383666992, 0.016327381134033203, 0.017137765884399414, 0.017948150634765625, 0.018758535385131836, 0.019568920135498047, 0.020379304885864258, 0.02118968963623047, 0.02200007438659668, 0.02281045913696289, 0.0236208438873291, 0.024431228637695312, 0.025241613388061523, 0.026051998138427734, 0.026862382888793945, 0.027672767639160156, 0.028483152389526367, 0.029293537139892578, 0.03010392189025879, 0.030914306640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 13.0, 30.0, 180.0, 415.0, 293.0, 70.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35568585991859436, -0.34867897629737854, -0.3416720926761627, -0.3346652090549469, -0.3276583254337311, -0.32065144181251526, -0.31364455819129944, -0.3066376745700836, -0.2996307909488678, -0.292623907327652, -0.28561702370643616, -0.27861014008522034, -0.2716032564640045, -0.2645963728427887, -0.2575894892215729, -0.25058260560035706, -0.24357573688030243, -0.2365688532590866, -0.2295619696378708, -0.22255508601665497, -0.21554820239543915, -0.20854131877422333, -0.2015344500541687, -0.19452756643295288, -0.18752068281173706, -0.18051379919052124, -0.17350691556930542, -0.1665000319480896, -0.15949314832687378, -0.15248626470565796, -0.14547938108444214, -0.13847249746322632, -0.1314656287431717, -0.12445874512195587, -0.11745186150074005, -0.11044497787952423, -0.10343809425830841, -0.09643121063709259, -0.08942433446645737, -0.08241745084524155, -0.07541056722402573, -0.0684036836028099, -0.061396799981594086, -0.054389920085668564, -0.047383036464452744, -0.04037615284323692, -0.0333692729473114, -0.02636238932609558, -0.01935550570487976, -0.012348623014986515, -0.005341740325093269, 0.0016651414334774017, 0.008672025054693222, 0.015678908675909042, 0.022685788571834564, 0.029692672193050385, 0.036699555814266205, 0.043706439435482025, 0.050713323056697845, 0.05772020295262337, 0.06472708284854889, 0.07173396646976471, 0.07874085009098053, 0.08574773371219635, 0.09275461733341217]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 3.0, 5.0, 4.0, 10.0, 9.0, 15.0, 20.0, 10.0, 15.0, 18.0, 20.0, 27.0, 27.0, 23.0, 38.0, 37.0, 47.0, 48.0, 39.0, 56.0, 50.0, 54.0, 51.0, 56.0, 41.0, 50.0, 38.0, 31.0, 25.0, 25.0, 21.0, 21.0, 15.0, 9.0, 9.0, 12.0, 9.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04060918092727661, -0.03935711085796356, -0.03810504078865051, -0.03685297071933746, -0.035600900650024414, -0.034348830580711365, -0.033096760511398315, -0.031844690442085266, -0.030592620372772217, -0.029340550303459167, -0.028088480234146118, -0.02683641016483307, -0.02558434009552002, -0.02433227002620697, -0.02308019995689392, -0.02182812988758087, -0.020576059818267822, -0.019323989748954773, -0.018071919679641724, -0.016819849610328674, -0.015567779541015625, -0.014315709471702576, -0.013063639402389526, -0.011811569333076477, -0.010559499263763428, -0.009307429194450378, -0.008055359125137329, -0.00680328905582428, -0.0055512189865112305, -0.004299148917198181, -0.003047078847885132, -0.0017950087785720825, -0.0005429387092590332, 0.0007091313600540161, 0.0019612014293670654, 0.0032132714986801147, 0.004465341567993164, 0.005717411637306213, 0.006969481706619263, 0.008221551775932312, 0.009473621845245361, 0.01072569191455841, 0.01197776198387146, 0.01322983205318451, 0.014481902122497559, 0.015733972191810608, 0.016986042261123657, 0.018238112330436707, 0.019490182399749756, 0.020742252469062805, 0.021994322538375854, 0.023246392607688904, 0.024498462677001953, 0.025750532746315002, 0.027002602815628052, 0.0282546728849411, 0.02950674295425415, 0.0307588130235672, 0.03201088309288025, 0.0332629531621933, 0.03451502323150635, 0.0357670933008194, 0.037019163370132446, 0.038271233439445496, 0.039523303508758545]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 5.0, 12.0, 8.0, 16.0, 25.0, 41.0, 82.0, 126.0, 185.0, 357.0, 711.0, 1766.0, 4891.0, 17222.0, 78759.0, 494945.0, 370648.0, 58201.0, 13578.0, 4131.0, 1460.0, 629.0, 302.0, 164.0, 107.0, 59.0, 46.0, 27.0, 18.0, 12.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.3408203125, -0.332489013671875, -0.32415771484375, -0.315826416015625, -0.3074951171875, -0.299163818359375, -0.29083251953125, -0.282501220703125, -0.274169921875, -0.265838623046875, -0.25750732421875, -0.249176025390625, -0.2408447265625, -0.232513427734375, -0.22418212890625, -0.215850830078125, -0.20751953125, -0.199188232421875, -0.19085693359375, -0.182525634765625, -0.1741943359375, -0.165863037109375, -0.15753173828125, -0.149200439453125, -0.140869140625, -0.132537841796875, -0.12420654296875, -0.115875244140625, -0.1075439453125, -0.099212646484375, -0.09088134765625, -0.082550048828125, -0.07421875, -0.065887451171875, -0.05755615234375, -0.049224853515625, -0.0408935546875, -0.032562255859375, -0.02423095703125, -0.015899658203125, -0.007568359375, 0.000762939453125, 0.00909423828125, 0.017425537109375, 0.0257568359375, 0.034088134765625, 0.04241943359375, 0.050750732421875, 0.05908203125, 0.067413330078125, 0.07574462890625, 0.084075927734375, 0.0924072265625, 0.100738525390625, 0.10906982421875, 0.117401123046875, 0.125732421875, 0.134063720703125, 0.14239501953125, 0.150726318359375, 0.1590576171875, 0.167388916015625, 0.17572021484375, 0.184051513671875, 0.1923828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 5.0, 20.0, 11.0, 25.0, 29.0, 38.0, 46.0, 48.0, 46.0, 57.0, 65.0, 70.0, 68.0, 53.0, 46.0, 54.0, 49.0, 44.0, 45.0, 34.0, 34.0, 17.0, 16.0, 17.0, 15.0, 11.0, 6.0, 6.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.1724853515625, -0.1682415008544922, -0.16399765014648438, -0.15975379943847656, -0.15550994873046875, -0.15126609802246094, -0.14702224731445312, -0.1427783966064453, -0.1385345458984375, -0.1342906951904297, -0.13004684448242188, -0.12580299377441406, -0.12155914306640625, -0.11731529235839844, -0.11307144165039062, -0.10882759094238281, -0.104583740234375, -0.10033988952636719, -0.09609603881835938, -0.09185218811035156, -0.08760833740234375, -0.08336448669433594, -0.07912063598632812, -0.07487678527832031, -0.0706329345703125, -0.06638908386230469, -0.062145233154296875, -0.05790138244628906, -0.05365753173828125, -0.04941368103027344, -0.045169830322265625, -0.04092597961425781, -0.03668212890625, -0.03243827819824219, -0.028194427490234375, -0.023950576782226562, -0.01970672607421875, -0.015462875366210938, -0.011219024658203125, -0.0069751739501953125, -0.0027313232421875, 0.0015125274658203125, 0.005756378173828125, 0.010000228881835938, 0.01424407958984375, 0.018487930297851562, 0.022731781005859375, 0.026975631713867188, 0.031219482421875, 0.03546333312988281, 0.039707183837890625, 0.04395103454589844, 0.04819488525390625, 0.05243873596191406, 0.056682586669921875, 0.06092643737792969, 0.0651702880859375, 0.06941413879394531, 0.07365798950195312, 0.07790184020996094, 0.08214569091796875, 0.08638954162597656, 0.09063339233398438, 0.09487724304199219, 0.09912109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 17.0, 17.0, 19.0, 22.0, 37.0, 55.0, 64.0, 92.0, 178.0, 265.0, 497.0, 1279.0, 4871.0, 34055.0, 679603.0, 302323.0, 19794.0, 3279.0, 947.0, 415.0, 255.0, 136.0, 81.0, 82.0, 49.0, 35.0, 26.0, 14.0, 12.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33025360107421875, -0.3174896240234375, -0.30472564697265625, -0.291961669921875, -0.27919769287109375, -0.2664337158203125, -0.25366973876953125, -0.24090576171875, -0.22814178466796875, -0.2153778076171875, -0.20261383056640625, -0.189849853515625, -0.17708587646484375, -0.1643218994140625, -0.15155792236328125, -0.1387939453125, -0.12602996826171875, -0.1132659912109375, -0.10050201416015625, -0.087738037109375, -0.07497406005859375, -0.0622100830078125, -0.04944610595703125, -0.03668212890625, -0.02391815185546875, -0.0111541748046875, 0.00160980224609375, 0.014373779296875, 0.02713775634765625, 0.0399017333984375, 0.05266571044921875, 0.0654296875, 0.07819366455078125, 0.0909576416015625, 0.10372161865234375, 0.116485595703125, 0.12924957275390625, 0.1420135498046875, 0.15477752685546875, 0.16754150390625, 0.18030548095703125, 0.1930694580078125, 0.20583343505859375, 0.218597412109375, 0.23136138916015625, 0.2441253662109375, 0.25688934326171875, 0.2696533203125, 0.28241729736328125, 0.2951812744140625, 0.30794525146484375, 0.320709228515625, 0.33347320556640625, 0.3462371826171875, 0.35900115966796875, 0.37176513671875, 0.38452911376953125, 0.3972930908203125, 0.41005706787109375, 0.422821044921875, 0.43558502197265625, 0.4483489990234375, 0.46111297607421875, 0.473876953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 9.0, 5.0, 18.0, 13.0, 22.0, 20.0, 41.0, 35.0, 39.0, 52.0, 56.0, 70.0, 59.0, 62.0, 78.0, 56.0, 62.0, 60.0, 50.0, 44.0, 30.0, 20.0, 23.0, 18.0, 24.0, 5.0, 10.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6979942321777344, -0.6791915893554688, -0.6603889465332031, -0.6415863037109375, -0.6227836608886719, -0.6039810180664062, -0.5851783752441406, -0.566375732421875, -0.5475730895996094, -0.5287704467773438, -0.5099678039550781, -0.4911651611328125, -0.4723625183105469, -0.45355987548828125, -0.4347572326660156, -0.41595458984375, -0.3971519470214844, -0.37834930419921875, -0.3595466613769531, -0.3407440185546875, -0.3219413757324219, -0.30313873291015625, -0.2843360900878906, -0.265533447265625, -0.24673080444335938, -0.22792816162109375, -0.20912551879882812, -0.1903228759765625, -0.17152023315429688, -0.15271759033203125, -0.13391494750976562, -0.1151123046875, -0.09630966186523438, -0.07750701904296875, -0.058704376220703125, -0.0399017333984375, -0.021099090576171875, -0.00229644775390625, 0.016506195068359375, 0.035308837890625, 0.054111480712890625, 0.07291412353515625, 0.09171676635742188, 0.1105194091796875, 0.12932205200195312, 0.14812469482421875, 0.16692733764648438, 0.18572998046875, 0.20453262329101562, 0.22333526611328125, 0.24213790893554688, 0.2609405517578125, 0.2797431945800781, 0.29854583740234375, 0.3173484802246094, 0.336151123046875, 0.3549537658691406, 0.37375640869140625, 0.3925590515136719, 0.4113616943359375, 0.4301643371582031, 0.44896697998046875, 0.4677696228027344, 0.486572265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 9.0, 20.0, 37.0, 52.0, 102.0, 187.0, 448.0, 1375.0, 6197.0, 74370.0, 932338.0, 28167.0, 3673.0, 872.0, 320.0, 137.0, 80.0, 56.0, 37.0, 14.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33349609375, -0.32349395751953125, -0.3134918212890625, -0.30348968505859375, -0.293487548828125, -0.28348541259765625, -0.2734832763671875, -0.26348114013671875, -0.25347900390625, -0.24347686767578125, -0.2334747314453125, -0.22347259521484375, -0.213470458984375, -0.20346832275390625, -0.1934661865234375, -0.18346405029296875, -0.1734619140625, -0.16345977783203125, -0.1534576416015625, -0.14345550537109375, -0.133453369140625, -0.12345123291015625, -0.1134490966796875, -0.10344696044921875, -0.09344482421875, -0.08344268798828125, -0.0734405517578125, -0.06343841552734375, -0.053436279296875, -0.04343414306640625, -0.0334320068359375, -0.02342987060546875, -0.013427734375, -0.00342559814453125, 0.0065765380859375, 0.01657867431640625, 0.026580810546875, 0.03658294677734375, 0.0465850830078125, 0.05658721923828125, 0.06658935546875, 0.07659149169921875, 0.0865936279296875, 0.09659576416015625, 0.106597900390625, 0.11660003662109375, 0.1266021728515625, 0.13660430908203125, 0.1466064453125, 0.15660858154296875, 0.1666107177734375, 0.17661285400390625, 0.186614990234375, 0.19661712646484375, 0.2066192626953125, 0.21662139892578125, 0.22662353515625, 0.23662567138671875, 0.2466278076171875, 0.25662994384765625, 0.266632080078125, 0.27663421630859375, 0.2866363525390625, 0.29663848876953125, 0.306640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 11.0, 25.0, 15.0, 20.0, 21.0, 37.0, 46.0, 53.0, 72.0, 90.0, 79.0, 100.0, 75.0, 86.0, 48.0, 44.0, 38.0, 21.0, 29.0, 20.0, 11.0, 15.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.246566772460938e-05, -6.01746141910553e-05, -5.788356065750122e-05, -5.5592507123947144e-05, -5.3301453590393066e-05, -5.101040005683899e-05, -4.871934652328491e-05, -4.6428292989730835e-05, -4.413723945617676e-05, -4.184618592262268e-05, -3.9555132389068604e-05, -3.7264078855514526e-05, -3.497302532196045e-05, -3.268197178840637e-05, -3.0390918254852295e-05, -2.8099864721298218e-05, -2.580881118774414e-05, -2.3517757654190063e-05, -2.1226704120635986e-05, -1.893565058708191e-05, -1.6644597053527832e-05, -1.4353543519973755e-05, -1.2062489986419678e-05, -9.7714364528656e-06, -7.4803829193115234e-06, -5.189329385757446e-06, -2.898275852203369e-06, -6.07222318649292e-07, 1.6838312149047852e-06, 3.974884748458862e-06, 6.2659382820129395e-06, 8.556991815567017e-06, 1.0848045349121094e-05, 1.3139098882675171e-05, 1.5430152416229248e-05, 1.7721205949783325e-05, 2.0012259483337402e-05, 2.230331301689148e-05, 2.4594366550445557e-05, 2.6885420083999634e-05, 2.917647361755371e-05, 3.146752715110779e-05, 3.3758580684661865e-05, 3.604963421821594e-05, 3.834068775177002e-05, 4.06317412853241e-05, 4.2922794818878174e-05, 4.521384835243225e-05, 4.750490188598633e-05, 4.9795955419540405e-05, 5.208700895309448e-05, 5.437806248664856e-05, 5.666911602020264e-05, 5.8960169553756714e-05, 6.125122308731079e-05, 6.354227662086487e-05, 6.583333015441895e-05, 6.812438368797302e-05, 7.04154372215271e-05, 7.270649075508118e-05, 7.499754428863525e-05, 7.728859782218933e-05, 7.957965135574341e-05, 8.187070488929749e-05, 8.416175842285156e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 7.0, 7.0, 14.0, 23.0, 55.0, 77.0, 126.0, 314.0, 977.0, 5518.0, 139660.0, 886008.0, 13266.0, 1664.0, 474.0, 155.0, 86.0, 52.0, 26.0, 20.0, 12.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2637672424316406, -0.25238800048828125, -0.24100875854492188, -0.2296295166015625, -0.21825027465820312, -0.20687103271484375, -0.19549179077148438, -0.184112548828125, -0.17273330688476562, -0.16135406494140625, -0.14997482299804688, -0.1385955810546875, -0.12721633911132812, -0.11583709716796875, -0.10445785522460938, -0.09307861328125, -0.08169937133789062, -0.07032012939453125, -0.058940887451171875, -0.0475616455078125, -0.036182403564453125, -0.02480316162109375, -0.013423919677734375, -0.002044677734375, 0.009334564208984375, 0.02071380615234375, 0.032093048095703125, 0.0434722900390625, 0.054851531982421875, 0.06623077392578125, 0.07761001586914062, 0.0889892578125, 0.10036849975585938, 0.11174774169921875, 0.12312698364257812, 0.1345062255859375, 0.14588546752929688, 0.15726470947265625, 0.16864395141601562, 0.180023193359375, 0.19140243530273438, 0.20278167724609375, 0.21416091918945312, 0.2255401611328125, 0.23691940307617188, 0.24829864501953125, 0.2596778869628906, 0.27105712890625, 0.2824363708496094, 0.29381561279296875, 0.3051948547363281, 0.3165740966796875, 0.3279533386230469, 0.33933258056640625, 0.3507118225097656, 0.362091064453125, 0.3734703063964844, 0.38484954833984375, 0.3962287902832031, 0.4076080322265625, 0.4189872741699219, 0.43036651611328125, 0.4417457580566406, 0.453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 28.0, 61.0, 325.0, 473.0, 67.0, 20.0, 10.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.5167236328125, -0.494384765625, -0.4720458984375, -0.44970703125, -0.4273681640625, -0.405029296875, -0.3826904296875, -0.3603515625, -0.3380126953125, -0.315673828125, -0.2933349609375, -0.27099609375, -0.2486572265625, -0.226318359375, -0.2039794921875, -0.181640625, -0.1593017578125, -0.136962890625, -0.1146240234375, -0.09228515625, -0.0699462890625, -0.047607421875, -0.0252685546875, -0.0029296875, 0.0194091796875, 0.041748046875, 0.0640869140625, 0.08642578125, 0.1087646484375, 0.131103515625, 0.1534423828125, 0.17578125, 0.1981201171875, 0.220458984375, 0.2427978515625, 0.26513671875, 0.2874755859375, 0.309814453125, 0.3321533203125, 0.3544921875, 0.3768310546875, 0.399169921875, 0.4215087890625, 0.44384765625, 0.4661865234375, 0.488525390625, 0.5108642578125, 0.533203125, 0.5555419921875, 0.577880859375, 0.6002197265625, 0.62255859375, 0.6448974609375, 0.667236328125, 0.6895751953125, 0.7119140625, 0.7342529296875, 0.756591796875, 0.7789306640625, 0.80126953125, 0.8236083984375, 0.845947265625, 0.8682861328125, 0.890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 10.0, 28.0, 53.0, 100.0, 184.0, 213.0, 187.0, 127.0, 57.0, 20.0, 14.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9101192951202393, -2.815542221069336, -2.7209651470184326, -2.6263880729675293, -2.531810998916626, -2.4372339248657227, -2.3426566123962402, -2.248079776763916, -2.1535024642944336, -2.0589253902435303, -1.964348316192627, -1.8697712421417236, -1.7751941680908203, -1.680617094039917, -1.5860399007797241, -1.4914628267288208, -1.396885871887207, -1.3023087978363037, -1.2077317237854004, -1.113154649734497, -1.0185775756835938, -0.9240004420280457, -0.8294233083724976, -0.7348462343215942, -0.6402691602706909, -0.5456920862197876, -0.4511149823665619, -0.3565378785133362, -0.26196080446243286, -0.16738373041152954, -0.07280659675598145, 0.021770477294921875, 0.1163475513458252, 0.2109246402978897, 0.3055017292499542, 0.40007883310317993, 0.49465590715408325, 0.5892329812049866, 0.6838101148605347, 0.778387188911438, 0.8729642629623413, 0.9675413370132446, 1.062118411064148, 1.1566956043243408, 1.2512726783752441, 1.3458497524261475, 1.4404268264770508, 1.535003900527954, 1.6295809745788574, 1.7241580486297607, 1.818735122680664, 1.9133121967315674, 2.0078892707824707, 2.102466344833374, 2.1970434188842773, 2.2916207313537598, 2.386197566986084, 2.4807746410369873, 2.5753517150878906, 2.669928789138794, 2.7645058631896973, 2.8590829372406006, 2.953660011291504, 3.0482373237609863, 3.1428143978118896]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 3.0, 8.0, 8.0, 10.0, 9.0, 13.0, 21.0, 25.0, 22.0, 18.0, 28.0, 34.0, 29.0, 37.0, 36.0, 30.0, 45.0, 43.0, 36.0, 48.0, 42.0, 43.0, 49.0, 37.0, 37.0, 32.0, 43.0, 37.0, 24.0, 20.0, 21.0, 20.0, 17.0, 10.0, 8.0, 8.0, 5.0, 9.0, 4.0, 14.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-2.24587345123291, -2.182187795639038, -2.118502140045166, -2.054816484451294, -1.9911308288574219, -1.9274451732635498, -1.8637595176696777, -1.8000738620758057, -1.7363882064819336, -1.6727025508880615, -1.6090168952941895, -1.5453312397003174, -1.4816455841064453, -1.4179599285125732, -1.3542742729187012, -1.290588617324829, -1.2269030809402466, -1.1632174253463745, -1.0995317697525024, -1.0358461141586304, -0.9721604585647583, -0.9084748029708862, -0.8447892069816589, -0.7811035513877869, -0.7174178957939148, -0.6537322402000427, -0.5900465846061707, -0.5263609886169434, -0.4626753032207489, -0.39898964762687683, -0.33530402183532715, -0.2716183662414551, -0.207932710647583, -0.14424705505371094, -0.08056141436100006, -0.016875773668289185, 0.046809881925582886, 0.11049553751945496, 0.17418116331100464, 0.2378668189048767, 0.3015524744987488, 0.36523813009262085, 0.4289237856864929, 0.4926094114780426, 0.5562950372695923, 0.6199806928634644, 0.6836663484573364, 0.7473520040512085, 0.8110376596450806, 0.8747233152389526, 0.9384089708328247, 1.0020946264266968, 1.0657802820205688, 1.129465937614441, 1.1931514739990234, 1.2568371295928955, 1.3205227851867676, 1.3842084407806396, 1.4478940963745117, 1.5115797519683838, 1.5752654075622559, 1.638951063156128, 1.70263671875, 1.766322374343872, 1.8300080299377441]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 9.0, 15.0, 16.0, 44.0, 67.0, 136.0, 326.0, 849.0, 3269.0, 25192.0, 4104669.0, 52720.0, 5026.0, 1193.0, 430.0, 158.0, 73.0, 39.0, 21.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.369384765625, -0.3617868423461914, -0.3541889190673828, -0.3465909957885742, -0.3389930725097656, -0.33139514923095703, -0.32379722595214844, -0.31619930267333984, -0.30860137939453125, -0.30100345611572266, -0.29340553283691406, -0.28580760955810547, -0.2782096862792969, -0.2706117630004883, -0.2630138397216797, -0.2554159164428711, -0.2478179931640625, -0.2402200698852539, -0.2326221466064453, -0.22502422332763672, -0.21742630004882812, -0.20982837677001953, -0.20223045349121094, -0.19463253021240234, -0.18703460693359375, -0.17943668365478516, -0.17183876037597656, -0.16424083709716797, -0.15664291381835938, -0.14904499053955078, -0.1414470672607422, -0.1338491439819336, -0.126251220703125, -0.1186532974243164, -0.11105537414550781, -0.10345745086669922, -0.09585952758789062, -0.08826160430908203, -0.08066368103027344, -0.07306575775146484, -0.06546783447265625, -0.057869911193847656, -0.05027198791503906, -0.04267406463623047, -0.035076141357421875, -0.02747821807861328, -0.019880294799804688, -0.012282371520996094, -0.0046844482421875, 0.0029134750366210938, 0.010511398315429688, 0.01810932159423828, 0.025707244873046875, 0.03330516815185547, 0.04090309143066406, 0.048501014709472656, 0.05609893798828125, 0.06369686126708984, 0.07129478454589844, 0.07889270782470703, 0.08649063110351562, 0.09408855438232422, 0.10168647766113281, 0.1092844009399414, 0.11688232421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 8.0, 13.0, 22.0, 30.0, 32.0, 42.0, 43.0, 58.0, 54.0, 81.0, 57.0, 61.0, 67.0, 54.0, 66.0, 60.0, 47.0, 42.0, 29.0, 28.0, 20.0, 14.0, 9.0, 10.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16599273681640625, -0.1612091064453125, -0.15642547607421875, -0.151641845703125, -0.14685821533203125, -0.1420745849609375, -0.13729095458984375, -0.13250732421875, -0.12772369384765625, -0.1229400634765625, -0.11815643310546875, -0.113372802734375, -0.10858917236328125, -0.1038055419921875, -0.09902191162109375, -0.09423828125, -0.08945465087890625, -0.0846710205078125, -0.07988739013671875, -0.075103759765625, -0.07032012939453125, -0.0655364990234375, -0.06075286865234375, -0.05596923828125, -0.05118560791015625, -0.0464019775390625, -0.04161834716796875, -0.036834716796875, -0.03205108642578125, -0.0272674560546875, -0.02248382568359375, -0.0177001953125, -0.01291656494140625, -0.0081329345703125, -0.00334930419921875, 0.001434326171875, 0.00621795654296875, 0.0110015869140625, 0.01578521728515625, 0.02056884765625, 0.02535247802734375, 0.0301361083984375, 0.03491973876953125, 0.039703369140625, 0.04448699951171875, 0.0492706298828125, 0.05405426025390625, 0.058837890625, 0.06362152099609375, 0.0684051513671875, 0.07318878173828125, 0.077972412109375, 0.08275604248046875, 0.0875396728515625, 0.09232330322265625, 0.09710693359375, 0.10189056396484375, 0.1066741943359375, 0.11145782470703125, 0.116241455078125, 0.12102508544921875, 0.1258087158203125, 0.13059234619140625, 0.1353759765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 5.0, 10.0, 11.0, 9.0, 13.0, 20.0, 20.0, 25.0, 27.0, 32.0, 47.0, 63.0, 72.0, 74.0, 112.0, 164.0, 232.0, 428.0, 757.0, 1518.0, 3409.0, 12734.0, 237903.0, 3903507.0, 24090.0, 4767.0, 1781.0, 900.0, 506.0, 267.0, 174.0, 111.0, 88.0, 89.0, 57.0, 63.0, 33.0, 29.0, 24.0, 34.0, 12.0, 15.0, 8.0, 12.0, 7.0, 6.0, 9.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1446533203125, -0.1402912139892578, -0.13592910766601562, -0.13156700134277344, -0.12720489501953125, -0.12284278869628906, -0.11848068237304688, -0.11411857604980469, -0.1097564697265625, -0.10539436340332031, -0.10103225708007812, -0.09667015075683594, -0.09230804443359375, -0.08794593811035156, -0.08358383178710938, -0.07922172546386719, -0.074859619140625, -0.07049751281738281, -0.06613540649414062, -0.06177330017089844, -0.05741119384765625, -0.05304908752441406, -0.048686981201171875, -0.04432487487792969, -0.0399627685546875, -0.03560066223144531, -0.031238555908203125, -0.026876449584960938, -0.02251434326171875, -0.018152236938476562, -0.013790130615234375, -0.009428024291992188, -0.00506591796875, -0.0007038116455078125, 0.003658294677734375, 0.008020401000976562, 0.01238250732421875, 0.016744613647460938, 0.021106719970703125, 0.025468826293945312, 0.0298309326171875, 0.03419303894042969, 0.038555145263671875, 0.04291725158691406, 0.04727935791015625, 0.05164146423339844, 0.056003570556640625, 0.06036567687988281, 0.064727783203125, 0.06908988952636719, 0.07345199584960938, 0.07781410217285156, 0.08217620849609375, 0.08653831481933594, 0.09090042114257812, 0.09526252746582031, 0.0996246337890625, 0.10398674011230469, 0.10834884643554688, 0.11271095275878906, 0.11707305908203125, 0.12143516540527344, 0.12579727172851562, 0.1301593780517578, 0.134521484375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 19.0, 26.0, 64.0, 217.0, 3328.0, 280.0, 70.0, 22.0, 15.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0142974853515625, -0.013062238693237305, -0.01182699203491211, -0.010591745376586914, -0.009356498718261719, -0.008121252059936523, -0.006886005401611328, -0.005650758743286133, -0.0044155120849609375, -0.003180265426635742, -0.0019450187683105469, -0.0007097721099853516, 0.0005254745483398438, 0.001760721206665039, 0.0029959678649902344, 0.00423121452331543, 0.005466461181640625, 0.00670170783996582, 0.007936954498291016, 0.009172201156616211, 0.010407447814941406, 0.011642694473266602, 0.012877941131591797, 0.014113187789916992, 0.015348434448242188, 0.016583681106567383, 0.017818927764892578, 0.019054174423217773, 0.02028942108154297, 0.021524667739868164, 0.02275991439819336, 0.023995161056518555, 0.02523040771484375, 0.026465654373168945, 0.02770090103149414, 0.028936147689819336, 0.03017139434814453, 0.03140664100646973, 0.03264188766479492, 0.03387713432312012, 0.03511238098144531, 0.03634762763977051, 0.0375828742980957, 0.0388181209564209, 0.040053367614746094, 0.04128861427307129, 0.042523860931396484, 0.04375910758972168, 0.044994354248046875, 0.04622960090637207, 0.047464847564697266, 0.04870009422302246, 0.049935340881347656, 0.05117058753967285, 0.05240583419799805, 0.05364108085632324, 0.05487632751464844, 0.05611157417297363, 0.05734682083129883, 0.05858206748962402, 0.05981731414794922, 0.061052560806274414, 0.06228780746459961, 0.0635230541229248, 0.06475830078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 11.0, 9.0, 18.0, 27.0, 46.0, 52.0, 72.0, 93.0, 125.0, 111.0, 109.0, 83.0, 60.0, 48.0, 40.0, 23.0, 22.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1159844696521759, -0.11311082541942596, -0.11023718863725662, -0.10736354440450668, -0.10448990017175674, -0.1016162633895874, -0.09874261915683746, -0.09586897492408752, -0.09299533069133759, -0.09012168645858765, -0.0872480496764183, -0.08437440544366837, -0.08150076121091843, -0.07862712442874908, -0.07575348019599915, -0.0728798359632492, -0.07000619918107986, -0.06713255494832993, -0.06425891816616058, -0.061385273933410645, -0.058511629700660706, -0.055637989193201065, -0.052764348685741425, -0.049890704452991486, -0.047017063945531845, -0.044143423438072205, -0.041269779205322266, -0.038396138697862625, -0.035522498190402985, -0.032648853957653046, -0.029775213450193405, -0.026901571080088615, -0.024027928709983826, -0.021154286339879036, -0.018280643969774246, -0.015407003462314606, -0.012533361092209816, -0.009659718722105026, -0.006786078214645386, -0.003912435844540596, -0.0010387934744358063, 0.0018348484300076962, 0.004708490334451199, 0.007582131773233414, 0.010455774143338203, 0.013329416513442993, 0.016203057020902634, 0.019076699391007423, 0.021950341761112213, 0.024823984131217003, 0.027697626501321793, 0.030571267008781433, 0.03344491124153137, 0.03631855174899101, 0.03919219225645065, 0.04206583648920059, 0.04493947699666023, 0.04781311750411987, 0.05068676173686981, 0.05356040224432945, 0.05643404275178909, 0.05930768698453903, 0.06218132749199867, 0.06505496799945831, 0.06792861223220825]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 8.0, 8.0, 11.0, 13.0, 11.0, 20.0, 25.0, 32.0, 23.0, 41.0, 29.0, 35.0, 42.0, 42.0, 56.0, 45.0, 40.0, 46.0, 43.0, 49.0, 51.0, 36.0, 38.0, 33.0, 39.0, 26.0, 31.0, 18.0, 16.0, 15.0, 17.0, 20.0, 9.0, 14.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051313161849975586, -0.04919978976249695, -0.04708641767501831, -0.04497304558753967, -0.042859673500061035, -0.0407463014125824, -0.03863292932510376, -0.03651955723762512, -0.034406185150146484, -0.03229281306266785, -0.03017944097518921, -0.02806606888771057, -0.025952696800231934, -0.023839324712753296, -0.021725952625274658, -0.01961258053779602, -0.017499208450317383, -0.015385836362838745, -0.013272464275360107, -0.01115909218788147, -0.009045720100402832, -0.006932348012924194, -0.004818975925445557, -0.002705603837966919, -0.0005922317504882812, 0.0015211403369903564, 0.003634512424468994, 0.005747884511947632, 0.00786125659942627, 0.009974628686904907, 0.012088000774383545, 0.014201372861862183, 0.01631474494934082, 0.018428117036819458, 0.020541489124298096, 0.022654861211776733, 0.02476823329925537, 0.02688160538673401, 0.028994977474212646, 0.031108349561691284, 0.03322172164916992, 0.03533509373664856, 0.0374484658241272, 0.039561837911605835, 0.04167520999908447, 0.04378858208656311, 0.04590195417404175, 0.048015326261520386, 0.05012869834899902, 0.05224207043647766, 0.0543554425239563, 0.056468814611434937, 0.058582186698913574, 0.06069555878639221, 0.06280893087387085, 0.06492230296134949, 0.06703567504882812, 0.06914904713630676, 0.0712624192237854, 0.07337579131126404, 0.07548916339874268, 0.07760253548622131, 0.07971590757369995, 0.08182927966117859, 0.08394265174865723]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 15.0, 19.0, 21.0, 39.0, 70.0, 116.0, 146.0, 235.0, 427.0, 701.0, 1036.0, 1805.0, 3175.0, 6019.0, 11615.0, 26116.0, 73467.0, 271665.0, 441072.0, 133863.0, 41493.0, 17117.0, 8044.0, 4295.0, 2452.0, 1424.0, 771.0, 483.0, 296.0, 184.0, 130.0, 76.0, 51.0, 36.0, 27.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15576171875, -0.15077590942382812, -0.14579010009765625, -0.14080429077148438, -0.1358184814453125, -0.13083267211914062, -0.12584686279296875, -0.12086105346679688, -0.115875244140625, -0.11088943481445312, -0.10590362548828125, -0.10091781616210938, -0.0959320068359375, -0.09094619750976562, -0.08596038818359375, -0.08097457885742188, -0.07598876953125, -0.07100296020507812, -0.06601715087890625, -0.061031341552734375, -0.0560455322265625, -0.051059722900390625, -0.04607391357421875, -0.041088104248046875, -0.036102294921875, -0.031116485595703125, -0.02613067626953125, -0.021144866943359375, -0.0161590576171875, -0.011173248291015625, -0.00618743896484375, -0.001201629638671875, 0.0037841796875, 0.008769989013671875, 0.01375579833984375, 0.018741607666015625, 0.0237274169921875, 0.028713226318359375, 0.03369903564453125, 0.038684844970703125, 0.043670654296875, 0.048656463623046875, 0.05364227294921875, 0.058628082275390625, 0.0636138916015625, 0.06859970092773438, 0.07358551025390625, 0.07857131958007812, 0.08355712890625, 0.08854293823242188, 0.09352874755859375, 0.09851455688476562, 0.1035003662109375, 0.10848617553710938, 0.11347198486328125, 0.11845779418945312, 0.123443603515625, 0.12842941284179688, 0.13341522216796875, 0.13840103149414062, 0.1433868408203125, 0.14837265014648438, 0.15335845947265625, 0.15834426879882812, 0.163330078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 8.0, 7.0, 9.0, 13.0, 19.0, 25.0, 32.0, 29.0, 51.0, 57.0, 62.0, 54.0, 65.0, 75.0, 57.0, 69.0, 58.0, 66.0, 45.0, 41.0, 38.0, 23.0, 22.0, 18.0, 10.0, 15.0, 6.0, 9.0, 3.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.167724609375, -0.1629486083984375, -0.158172607421875, -0.1533966064453125, -0.14862060546875, -0.1438446044921875, -0.139068603515625, -0.1342926025390625, -0.1295166015625, -0.1247406005859375, -0.119964599609375, -0.1151885986328125, -0.11041259765625, -0.1056365966796875, -0.100860595703125, -0.0960845947265625, -0.09130859375, -0.0865325927734375, -0.081756591796875, -0.0769805908203125, -0.07220458984375, -0.0674285888671875, -0.062652587890625, -0.0578765869140625, -0.0531005859375, -0.0483245849609375, -0.043548583984375, -0.0387725830078125, -0.03399658203125, -0.0292205810546875, -0.024444580078125, -0.0196685791015625, -0.014892578125, -0.0101165771484375, -0.005340576171875, -0.0005645751953125, 0.00421142578125, 0.0089874267578125, 0.013763427734375, 0.0185394287109375, 0.0233154296875, 0.0280914306640625, 0.032867431640625, 0.0376434326171875, 0.04241943359375, 0.0471954345703125, 0.051971435546875, 0.0567474365234375, 0.0615234375, 0.0662994384765625, 0.071075439453125, 0.0758514404296875, 0.08062744140625, 0.0854034423828125, 0.090179443359375, 0.0949554443359375, 0.0997314453125, 0.1045074462890625, 0.109283447265625, 0.1140594482421875, 0.11883544921875, 0.1236114501953125, 0.128387451171875, 0.1331634521484375, 0.137939453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 7.0, 16.0, 14.0, 24.0, 23.0, 40.0, 43.0, 41.0, 91.0, 134.0, 200.0, 347.0, 845.0, 3411.0, 22778.0, 418962.0, 567610.0, 27995.0, 3931.0, 973.0, 405.0, 215.0, 124.0, 79.0, 52.0, 53.0, 32.0, 17.0, 8.0, 18.0, 9.0, 5.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3359222412109375, -0.323944091796875, -0.3119659423828125, -0.29998779296875, -0.2880096435546875, -0.276031494140625, -0.2640533447265625, -0.2520751953125, -0.2400970458984375, -0.228118896484375, -0.2161407470703125, -0.20416259765625, -0.1921844482421875, -0.180206298828125, -0.1682281494140625, -0.15625, -0.1442718505859375, -0.132293701171875, -0.1203155517578125, -0.10833740234375, -0.0963592529296875, -0.084381103515625, -0.0724029541015625, -0.0604248046875, -0.0484466552734375, -0.036468505859375, -0.0244903564453125, -0.01251220703125, -0.0005340576171875, 0.011444091796875, 0.0234222412109375, 0.035400390625, 0.0473785400390625, 0.059356689453125, 0.0713348388671875, 0.08331298828125, 0.0952911376953125, 0.107269287109375, 0.1192474365234375, 0.1312255859375, 0.1432037353515625, 0.155181884765625, 0.1671600341796875, 0.17913818359375, 0.1911163330078125, 0.203094482421875, 0.2150726318359375, 0.22705078125, 0.2390289306640625, 0.251007080078125, 0.2629852294921875, 0.27496337890625, 0.2869415283203125, 0.298919677734375, 0.3108978271484375, 0.3228759765625, 0.3348541259765625, 0.346832275390625, 0.3588104248046875, 0.37078857421875, 0.3827667236328125, 0.394744873046875, 0.4067230224609375, 0.418701171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 0.0, 7.0, 5.0, 7.0, 8.0, 16.0, 16.0, 19.0, 28.0, 18.0, 24.0, 31.0, 28.0, 29.0, 31.0, 31.0, 47.0, 47.0, 52.0, 43.0, 42.0, 41.0, 40.0, 42.0, 32.0, 49.0, 28.0, 33.0, 38.0, 24.0, 21.0, 18.0, 18.0, 18.0, 13.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.457763671875, -0.4443778991699219, -0.43099212646484375, -0.4176063537597656, -0.4042205810546875, -0.3908348083496094, -0.37744903564453125, -0.3640632629394531, -0.350677490234375, -0.3372917175292969, -0.32390594482421875, -0.3105201721191406, -0.2971343994140625, -0.2837486267089844, -0.27036285400390625, -0.2569770812988281, -0.24359130859375, -0.23020553588867188, -0.21681976318359375, -0.20343399047851562, -0.1900482177734375, -0.17666244506835938, -0.16327667236328125, -0.14989089965820312, -0.136505126953125, -0.12311935424804688, -0.10973358154296875, -0.09634780883789062, -0.0829620361328125, -0.06957626342773438, -0.05619049072265625, -0.042804718017578125, -0.0294189453125, -0.016033172607421875, -0.00264739990234375, 0.010738372802734375, 0.0241241455078125, 0.037509918212890625, 0.05089569091796875, 0.06428146362304688, 0.077667236328125, 0.09105300903320312, 0.10443878173828125, 0.11782455444335938, 0.1312103271484375, 0.14459609985351562, 0.15798187255859375, 0.17136764526367188, 0.18475341796875, 0.19813919067382812, 0.21152496337890625, 0.22491073608398438, 0.2382965087890625, 0.2516822814941406, 0.26506805419921875, 0.2784538269042969, 0.291839599609375, 0.3052253723144531, 0.31861114501953125, 0.3319969177246094, 0.3453826904296875, 0.3587684631347656, 0.37215423583984375, 0.3855400085449219, 0.39892578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 9.0, 17.0, 22.0, 36.0, 75.0, 140.0, 349.0, 927.0, 5780.0, 851982.0, 184420.0, 3506.0, 747.0, 238.0, 145.0, 68.0, 30.0, 25.0, 14.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51318359375, -0.5009346008300781, -0.48868560791015625, -0.4764366149902344, -0.4641876220703125, -0.4519386291503906, -0.43968963623046875, -0.4274406433105469, -0.415191650390625, -0.4029426574707031, -0.39069366455078125, -0.3784446716308594, -0.3661956787109375, -0.3539466857910156, -0.34169769287109375, -0.3294486999511719, -0.31719970703125, -0.3049507141113281, -0.29270172119140625, -0.2804527282714844, -0.2682037353515625, -0.2559547424316406, -0.24370574951171875, -0.23145675659179688, -0.219207763671875, -0.20695877075195312, -0.19470977783203125, -0.18246078491210938, -0.1702117919921875, -0.15796279907226562, -0.14571380615234375, -0.13346481323242188, -0.1212158203125, -0.10896682739257812, -0.09671783447265625, -0.08446884155273438, -0.0722198486328125, -0.059970855712890625, -0.04772186279296875, -0.035472869873046875, -0.023223876953125, -0.010974884033203125, 0.00127410888671875, 0.013523101806640625, 0.0257720947265625, 0.038021087646484375, 0.05027008056640625, 0.06251907348632812, 0.07476806640625, 0.08701705932617188, 0.09926605224609375, 0.11151504516601562, 0.1237640380859375, 0.13601303100585938, 0.14826202392578125, 0.16051101684570312, 0.172760009765625, 0.18500900268554688, 0.19725799560546875, 0.20950698852539062, 0.2217559814453125, 0.23400497436523438, 0.24625396728515625, 0.2585029602050781, 0.270751953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 5.0, 10.0, 4.0, 8.0, 13.0, 12.0, 17.0, 22.0, 31.0, 36.0, 42.0, 61.0, 80.0, 86.0, 85.0, 85.0, 64.0, 66.0, 48.0, 43.0, 47.0, 29.0, 21.0, 24.0, 21.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.309415817260742e-05, -4.1472725570201874e-05, -3.9851292967796326e-05, -3.822986036539078e-05, -3.660842776298523e-05, -3.498699516057968e-05, -3.336556255817413e-05, -3.1744129955768585e-05, -3.0122697353363037e-05, -2.850126475095749e-05, -2.687983214855194e-05, -2.5258399546146393e-05, -2.3636966943740845e-05, -2.2015534341335297e-05, -2.039410173892975e-05, -1.87726691365242e-05, -1.7151236534118652e-05, -1.5529803931713104e-05, -1.3908371329307556e-05, -1.2286938726902008e-05, -1.066550612449646e-05, -9.044073522090912e-06, -7.422640919685364e-06, -5.801208317279816e-06, -4.179775714874268e-06, -2.5583431124687195e-06, -9.369105100631714e-07, 6.845220923423767e-07, 2.305954694747925e-06, 3.927387297153473e-06, 5.548819899559021e-06, 7.170252501964569e-06, 8.791685104370117e-06, 1.0413117706775665e-05, 1.2034550309181213e-05, 1.3655982911586761e-05, 1.527741551399231e-05, 1.6898848116397858e-05, 1.8520280718803406e-05, 2.0141713321208954e-05, 2.1763145923614502e-05, 2.338457852602005e-05, 2.5006011128425598e-05, 2.6627443730831146e-05, 2.8248876333236694e-05, 2.9870308935642242e-05, 3.149174153804779e-05, 3.311317414045334e-05, 3.473460674285889e-05, 3.6356039345264435e-05, 3.797747194766998e-05, 3.959890455007553e-05, 4.122033715248108e-05, 4.284176975488663e-05, 4.4463202357292175e-05, 4.6084634959697723e-05, 4.770606756210327e-05, 4.932750016450882e-05, 5.094893276691437e-05, 5.2570365369319916e-05, 5.4191797971725464e-05, 5.581323057413101e-05, 5.743466317653656e-05, 5.905609577894211e-05, 6.0677528381347656e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 15.0, 23.0, 57.0, 90.0, 173.0, 471.0, 2241.0, 22833.0, 957955.0, 59986.0, 3587.0, 683.0, 209.0, 89.0, 49.0, 29.0, 19.0, 10.0, 4.0, 10.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2256908416748047, -0.21688461303710938, -0.20807838439941406, -0.19927215576171875, -0.19046592712402344, -0.18165969848632812, -0.1728534698486328, -0.1640472412109375, -0.1552410125732422, -0.14643478393554688, -0.13762855529785156, -0.12882232666015625, -0.12001609802246094, -0.11120986938476562, -0.10240364074707031, -0.093597412109375, -0.08479118347167969, -0.07598495483398438, -0.06717872619628906, -0.05837249755859375, -0.04956626892089844, -0.040760040283203125, -0.03195381164550781, -0.0231475830078125, -0.014341354370117188, -0.005535125732421875, 0.0032711029052734375, 0.01207733154296875, 0.020883560180664062, 0.029689788818359375, 0.03849601745605469, 0.04730224609375, 0.05610847473144531, 0.06491470336914062, 0.07372093200683594, 0.08252716064453125, 0.09133338928222656, 0.10013961791992188, 0.10894584655761719, 0.1177520751953125, 0.1265583038330078, 0.13536453247070312, 0.14417076110839844, 0.15297698974609375, 0.16178321838378906, 0.17058944702148438, 0.1793956756591797, 0.188201904296875, 0.1970081329345703, 0.20581436157226562, 0.21462059020996094, 0.22342681884765625, 0.23223304748535156, 0.24103927612304688, 0.2498455047607422, 0.2586517333984375, 0.2674579620361328, 0.2762641906738281, 0.28507041931152344, 0.29387664794921875, 0.30268287658691406, 0.3114891052246094, 0.3202953338623047, 0.3291015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 10.0, 9.0, 9.0, 16.0, 34.0, 52.0, 98.0, 219.0, 255.0, 147.0, 64.0, 25.0, 15.0, 19.0, 14.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286376953125, -0.2774620056152344, -0.26854705810546875, -0.2596321105957031, -0.2507171630859375, -0.24180221557617188, -0.23288726806640625, -0.22397232055664062, -0.215057373046875, -0.20614242553710938, -0.19722747802734375, -0.18831253051757812, -0.1793975830078125, -0.17048263549804688, -0.16156768798828125, -0.15265274047851562, -0.14373779296875, -0.13482284545898438, -0.12590789794921875, -0.11699295043945312, -0.1080780029296875, -0.09916305541992188, -0.09024810791015625, -0.08133316040039062, -0.072418212890625, -0.06350326538085938, -0.05458831787109375, -0.045673370361328125, -0.0367584228515625, -0.027843475341796875, -0.01892852783203125, -0.010013580322265625, -0.0010986328125, 0.007816314697265625, 0.01673126220703125, 0.025646209716796875, 0.0345611572265625, 0.043476104736328125, 0.05239105224609375, 0.061305999755859375, 0.070220947265625, 0.07913589477539062, 0.08805084228515625, 0.09696578979492188, 0.1058807373046875, 0.11479568481445312, 0.12371063232421875, 0.13262557983398438, 0.14154052734375, 0.15045547485351562, 0.15937042236328125, 0.16828536987304688, 0.1772003173828125, 0.18611526489257812, 0.19503021240234375, 0.20394515991210938, 0.212860107421875, 0.22177505493164062, 0.23069000244140625, 0.23960494995117188, 0.2485198974609375, 0.2574348449707031, 0.26634979248046875, 0.2752647399902344, 0.2841796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 34.0, 149.0, 380.0, 290.0, 99.0, 36.0, 11.0, 3.0, 1.0, 2.0, 3.0], "bins": [-9.787286758422852, -9.611881256103516, -9.43647575378418, -9.261070251464844, -9.085664749145508, -8.910259246826172, -8.734853744506836, -8.5594482421875, -8.384041786193848, -8.208636283874512, -8.033230781555176, -7.85782527923584, -7.682419300079346, -7.50701379776001, -7.331608295440674, -7.156202793121338, -6.98079776763916, -6.805392265319824, -6.629986763000488, -6.454581260681152, -6.279175281524658, -6.103769779205322, -5.928364276885986, -5.75295877456665, -5.577552795410156, -5.40214729309082, -5.226741790771484, -5.051336288452148, -4.875930309295654, -4.700524806976318, -4.525119304656982, -4.3497138023376465, -4.1743083000183105, -3.9989027976989746, -3.8234970569610596, -3.6480915546417236, -3.4726860523223877, -3.2972803115844727, -3.1218748092651367, -2.946469306945801, -2.771063804626465, -2.595658302307129, -2.420252561569214, -2.244847059249878, -2.069441556930542, -1.8940359354019165, -1.718630313873291, -1.543224811553955, -1.36781907081604, -1.1924134492874146, -1.0170079469680786, -0.8416023254394531, -0.6661967635154724, -0.4907912015914917, -0.3153855800628662, -0.13998007774353027, 0.035425543785095215, 0.21083112061023712, 0.38623669743537903, 0.5616422891616821, 0.7370478510856628, 0.9124534130096436, 1.087859034538269, 1.263264536857605, 1.4386701583862305]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 9.0, 17.0, 11.0, 9.0, 9.0, 12.0, 23.0, 18.0, 23.0, 34.0, 26.0, 39.0, 39.0, 38.0, 39.0, 34.0, 43.0, 41.0, 51.0, 50.0, 41.0, 44.0, 47.0, 32.0, 44.0, 39.0, 26.0, 25.0, 24.0, 12.0, 16.0, 15.0, 10.0, 9.0, 15.0, 6.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.28642201423645, -2.220757007598877, -2.1550920009613037, -2.0894269943237305, -2.023761749267578, -1.9580968618392944, -1.8924317359924316, -1.8267667293548584, -1.7611017227172852, -1.695436716079712, -1.6297717094421387, -1.5641065835952759, -1.4984415769577026, -1.4327765703201294, -1.3671114444732666, -1.3014464378356934, -1.2357814311981201, -1.1701164245605469, -1.1044514179229736, -1.0387862920761108, -0.9731212854385376, -0.9074562788009644, -0.8417912125587463, -0.7761261463165283, -0.7104611396789551, -0.6447961330413818, -0.5791310667991638, -0.5134660005569458, -0.44780099391937256, -0.38213595747947693, -0.3164709210395813, -0.25080588459968567, -0.18514108657836914, -0.11947605013847351, -0.05381101369857788, 0.011854022741317749, 0.07751905918121338, 0.143184095621109, 0.20884913206100464, 0.27451416850090027, 0.3401792049407959, 0.40584424138069153, 0.47150927782058716, 0.5371743440628052, 0.6028393507003784, 0.6685043573379517, 0.7341694235801697, 0.7998344898223877, 0.8654994964599609, 0.9311645030975342, 0.9968295693397522, 1.0624946355819702, 1.1281596422195435, 1.1938246488571167, 1.2594897747039795, 1.3251547813415527, 1.390819787979126, 1.4564847946166992, 1.5221498012542725, 1.5878149271011353, 1.6534799337387085, 1.7191449403762817, 1.7848100662231445, 1.8504750728607178, 1.916140079498291]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 2.0, 9.0, 13.0, 19.0, 37.0, 52.0, 78.0, 137.0, 197.0, 441.0, 940.0, 2582.0, 13675.0, 4113651.0, 55149.0, 4692.0, 1327.0, 534.0, 294.0, 164.0, 85.0, 71.0, 34.0, 27.0, 17.0, 18.0, 14.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3740234375, -0.3646068572998047, -0.3551902770996094, -0.34577369689941406, -0.33635711669921875, -0.32694053649902344, -0.3175239562988281, -0.3081073760986328, -0.2986907958984375, -0.2892742156982422, -0.2798576354980469, -0.27044105529785156, -0.26102447509765625, -0.25160789489746094, -0.24219131469726562, -0.2327747344970703, -0.223358154296875, -0.2139415740966797, -0.20452499389648438, -0.19510841369628906, -0.18569183349609375, -0.17627525329589844, -0.16685867309570312, -0.1574420928955078, -0.1480255126953125, -0.1386089324951172, -0.12919235229492188, -0.11977577209472656, -0.11035919189453125, -0.10094261169433594, -0.09152603149414062, -0.08210945129394531, -0.07269287109375, -0.06327629089355469, -0.053859710693359375, -0.04444313049316406, -0.03502655029296875, -0.025609970092773438, -0.016193389892578125, -0.0067768096923828125, 0.0026397705078125, 0.012056350708007812, 0.021472930908203125, 0.030889511108398438, 0.04030609130859375, 0.04972267150878906, 0.059139251708984375, 0.06855583190917969, 0.077972412109375, 0.08738899230957031, 0.09680557250976562, 0.10622215270996094, 0.11563873291015625, 0.12505531311035156, 0.13447189331054688, 0.1438884735107422, 0.1533050537109375, 0.1627216339111328, 0.17213821411132812, 0.18155479431152344, 0.19097137451171875, 0.20038795471191406, 0.20980453491210938, 0.2192211151123047, 0.2286376953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 5.0, 18.0, 17.0, 17.0, 26.0, 30.0, 25.0, 50.0, 46.0, 50.0, 55.0, 58.0, 66.0, 59.0, 60.0, 56.0, 61.0, 41.0, 46.0, 36.0, 26.0, 25.0, 26.0, 17.0, 12.0, 20.0, 13.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0], "bins": [-0.1773681640625, -0.17307567596435547, -0.16878318786621094, -0.1644906997680664, -0.16019821166992188, -0.15590572357177734, -0.1516132354736328, -0.14732074737548828, -0.14302825927734375, -0.13873577117919922, -0.1344432830810547, -0.13015079498291016, -0.12585830688476562, -0.1215658187866211, -0.11727333068847656, -0.11298084259033203, -0.1086883544921875, -0.10439586639404297, -0.10010337829589844, -0.0958108901977539, -0.09151840209960938, -0.08722591400146484, -0.08293342590332031, -0.07864093780517578, -0.07434844970703125, -0.07005596160888672, -0.06576347351074219, -0.061470985412597656, -0.057178497314453125, -0.052886009216308594, -0.04859352111816406, -0.04430103302001953, -0.040008544921875, -0.03571605682373047, -0.03142356872558594, -0.027131080627441406, -0.022838592529296875, -0.018546104431152344, -0.014253616333007812, -0.009961128234863281, -0.00566864013671875, -0.0013761520385742188, 0.0029163360595703125, 0.007208824157714844, 0.011501312255859375, 0.015793800354003906, 0.020086288452148438, 0.02437877655029297, 0.0286712646484375, 0.03296375274658203, 0.03725624084472656, 0.041548728942871094, 0.045841217041015625, 0.050133705139160156, 0.05442619323730469, 0.05871868133544922, 0.06301116943359375, 0.06730365753173828, 0.07159614562988281, 0.07588863372802734, 0.08018112182617188, 0.0844736099243164, 0.08876609802246094, 0.09305858612060547, 0.09735107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 10.0, 14.0, 16.0, 20.0, 36.0, 23.0, 45.0, 83.0, 93.0, 150.0, 229.0, 347.0, 469.0, 913.0, 1555.0, 3412.0, 10159.0, 84426.0, 4053152.0, 27178.0, 6193.0, 2456.0, 1202.0, 698.0, 439.0, 296.0, 214.0, 130.0, 83.0, 56.0, 47.0, 27.0, 15.0, 14.0, 13.0, 9.0, 8.0, 6.0, 11.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1888427734375, -0.18299484252929688, -0.17714691162109375, -0.17129898071289062, -0.1654510498046875, -0.15960311889648438, -0.15375518798828125, -0.14790725708007812, -0.142059326171875, -0.13621139526367188, -0.13036346435546875, -0.12451553344726562, -0.1186676025390625, -0.11281967163085938, -0.10697174072265625, -0.10112380981445312, -0.09527587890625, -0.08942794799804688, -0.08358001708984375, -0.07773208618164062, -0.0718841552734375, -0.06603622436523438, -0.06018829345703125, -0.054340362548828125, -0.048492431640625, -0.042644500732421875, -0.03679656982421875, -0.030948638916015625, -0.0251007080078125, -0.019252777099609375, -0.01340484619140625, -0.007556915283203125, -0.001708984375, 0.004138946533203125, 0.00998687744140625, 0.015834808349609375, 0.0216827392578125, 0.027530670166015625, 0.03337860107421875, 0.039226531982421875, 0.045074462890625, 0.050922393798828125, 0.05677032470703125, 0.06261825561523438, 0.0684661865234375, 0.07431411743164062, 0.08016204833984375, 0.08600997924804688, 0.09185791015625, 0.09770584106445312, 0.10355377197265625, 0.10940170288085938, 0.1152496337890625, 0.12109756469726562, 0.12694549560546875, 0.13279342651367188, 0.138641357421875, 0.14448928833007812, 0.15033721923828125, 0.15618515014648438, 0.1620330810546875, 0.16788101196289062, 0.17372894287109375, 0.17957687377929688, 0.1854248046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 18.0, 65.0, 606.0, 3237.0, 70.0, 23.0, 15.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.067474365234375, -0.06549072265625, -0.063507080078125, -0.0615234375, -0.059539794921875, -0.05755615234375, -0.055572509765625, -0.0535888671875, -0.051605224609375, -0.04962158203125, -0.047637939453125, -0.045654296875, -0.043670654296875, -0.04168701171875, -0.039703369140625, -0.0377197265625, -0.035736083984375, -0.03375244140625, -0.031768798828125, -0.02978515625, -0.027801513671875, -0.02581787109375, -0.023834228515625, -0.0218505859375, -0.019866943359375, -0.01788330078125, -0.015899658203125, -0.013916015625, -0.011932373046875, -0.00994873046875, -0.007965087890625, -0.0059814453125, -0.003997802734375, -0.00201416015625, -3.0517578125e-05, 0.001953125, 0.003936767578125, 0.00592041015625, 0.007904052734375, 0.0098876953125, 0.011871337890625, 0.01385498046875, 0.015838623046875, 0.017822265625, 0.019805908203125, 0.02178955078125, 0.023773193359375, 0.0257568359375, 0.027740478515625, 0.02972412109375, 0.031707763671875, 0.03369140625, 0.035675048828125, 0.03765869140625, 0.039642333984375, 0.0416259765625, 0.043609619140625, 0.04559326171875, 0.047576904296875, 0.049560546875, 0.051544189453125, 0.05352783203125, 0.055511474609375, 0.0574951171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 26.0, 53.0, 121.0, 204.0, 272.0, 154.0, 89.0, 39.0, 17.0, 7.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2907010018825531, -0.28236693143844604, -0.2740328907966614, -0.2656988203525543, -0.25736477971076965, -0.2490307092666626, -0.24069665372371674, -0.23236259818077087, -0.22402852773666382, -0.21569447219371796, -0.2073604166507721, -0.19902634620666504, -0.19069229066371918, -0.18235823512077332, -0.17402417957782745, -0.1656901240348816, -0.15735606849193573, -0.14902201294898987, -0.140687957406044, -0.13235390186309814, -0.12401983141899109, -0.11568577587604523, -0.10735172033309937, -0.0990176647901535, -0.09068360179662704, -0.08234954625368118, -0.07401548326015472, -0.06568142771720886, -0.0573473684489727, -0.04901330918073654, -0.04067925363779068, -0.03234519436955452, -0.02401113510131836, -0.0156770758330822, -0.007343018427491188, 0.000991038978099823, 0.009325098246335983, 0.017659157514572144, 0.025993213057518005, 0.034327272325754166, 0.042661331593990326, 0.050995390862226486, 0.059329450130462646, 0.06766350567340851, 0.07599756121635437, 0.08433162420988083, 0.09266567975282669, 0.10099974274635315, 0.10933379828929901, 0.11766785383224487, 0.12600190937519073, 0.1343359649181366, 0.14267003536224365, 0.15100409090518951, 0.15933814644813538, 0.16767220199108124, 0.1760062575340271, 0.18434031307697296, 0.19267436861991882, 0.20100843906402588, 0.20934249460697174, 0.2176765501499176, 0.22601060569286346, 0.23434466123580933, 0.24267873167991638]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 15.0, 9.0, 10.0, 15.0, 19.0, 19.0, 21.0, 32.0, 24.0, 31.0, 37.0, 24.0, 27.0, 41.0, 44.0, 52.0, 36.0, 44.0, 43.0, 31.0, 31.0, 31.0, 36.0, 39.0, 34.0, 46.0, 27.0, 27.0, 17.0, 26.0, 14.0, 21.0, 9.0, 7.0, 11.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07930302619934082, -0.07681325823068619, -0.07432348281145096, -0.07183371484279633, -0.0693439394235611, -0.06685417145490646, -0.06436440348625183, -0.0618746317923069, -0.05938486009836197, -0.05689508840441704, -0.05440531671047211, -0.051915548741817474, -0.04942577704787254, -0.04693600535392761, -0.04444623738527298, -0.04195646569132805, -0.03946669399738312, -0.03697692230343819, -0.034487150609493256, -0.03199738264083862, -0.029507610946893692, -0.02701783925294876, -0.02452806942164898, -0.022038299590349197, -0.019548527896404266, -0.017058756202459335, -0.014568986371159554, -0.012079215608537197, -0.00958944484591484, -0.007099674083292484, -0.004609903320670128, -0.002120133489370346, 0.00036963820457458496, 0.0028594089671969414, 0.005349179729819298, 0.007838950492441654, 0.01032872125506401, 0.012818492017686367, 0.015308262780308723, 0.017798032611608505, 0.020287804305553436, 0.022777575999498367, 0.02526734583079815, 0.02775711566209793, 0.030246887356042862, 0.03273665904998779, 0.035226427018642426, 0.03771619871258736, 0.04020597040653229, 0.04269574210047722, 0.04518551379442215, 0.04767528176307678, 0.05016505345702171, 0.052654825150966644, 0.05514459311962128, 0.05763436481356621, 0.06012413650751114, 0.06261390447616577, 0.065103679895401, 0.06759344786405563, 0.07008321583271027, 0.0725729912519455, 0.07506275922060013, 0.07755252718925476, 0.08004230260848999]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 7.0, 16.0, 42.0, 35.0, 64.0, 91.0, 177.0, 271.0, 575.0, 1046.0, 2191.0, 4829.0, 12037.0, 32383.0, 96335.0, 294787.0, 380861.0, 146169.0, 47390.0, 16841.0, 6649.0, 2822.0, 1337.0, 688.0, 357.0, 215.0, 109.0, 73.0, 49.0, 28.0, 24.0, 15.0, 8.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11279296875, -0.10848426818847656, -0.10417556762695312, -0.09986686706542969, -0.09555816650390625, -0.09124946594238281, -0.08694076538085938, -0.08263206481933594, -0.0783233642578125, -0.07401466369628906, -0.06970596313476562, -0.06539726257324219, -0.06108856201171875, -0.05677986145019531, -0.052471160888671875, -0.04816246032714844, -0.043853759765625, -0.03954505920410156, -0.035236358642578125, -0.030927658081054688, -0.02661895751953125, -0.022310256958007812, -0.018001556396484375, -0.013692855834960938, -0.0093841552734375, -0.0050754547119140625, -0.000766754150390625, 0.0035419464111328125, 0.00785064697265625, 0.012159347534179688, 0.016468048095703125, 0.020776748657226562, 0.02508544921875, 0.029394149780273438, 0.033702850341796875, 0.03801155090332031, 0.04232025146484375, 0.04662895202636719, 0.050937652587890625, 0.05524635314941406, 0.0595550537109375, 0.06386375427246094, 0.06817245483398438, 0.07248115539550781, 0.07678985595703125, 0.08109855651855469, 0.08540725708007812, 0.08971595764160156, 0.094024658203125, 0.09833335876464844, 0.10264205932617188, 0.10695075988769531, 0.11125946044921875, 0.11556816101074219, 0.11987686157226562, 0.12418556213378906, 0.1284942626953125, 0.13280296325683594, 0.13711166381835938, 0.1414203643798828, 0.14572906494140625, 0.1500377655029297, 0.15434646606445312, 0.15865516662597656, 0.1629638671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 4.0, 8.0, 10.0, 16.0, 14.0, 20.0, 25.0, 33.0, 32.0, 41.0, 46.0, 59.0, 64.0, 54.0, 75.0, 50.0, 62.0, 57.0, 56.0, 44.0, 38.0, 28.0, 32.0, 24.0, 23.0, 15.0, 20.0, 10.0, 14.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-0.17822265625, -0.17386817932128906, -0.16951370239257812, -0.1651592254638672, -0.16080474853515625, -0.1564502716064453, -0.15209579467773438, -0.14774131774902344, -0.1433868408203125, -0.13903236389160156, -0.13467788696289062, -0.1303234100341797, -0.12596893310546875, -0.12161445617675781, -0.11725997924804688, -0.11290550231933594, -0.108551025390625, -0.10419654846191406, -0.09984207153320312, -0.09548759460449219, -0.09113311767578125, -0.08677864074707031, -0.08242416381835938, -0.07806968688964844, -0.0737152099609375, -0.06936073303222656, -0.06500625610351562, -0.06065177917480469, -0.05629730224609375, -0.05194282531738281, -0.047588348388671875, -0.04323387145996094, -0.03887939453125, -0.03452491760253906, -0.030170440673828125, -0.025815963745117188, -0.02146148681640625, -0.017107009887695312, -0.012752532958984375, -0.008398056030273438, -0.0040435791015625, 0.0003108978271484375, 0.004665374755859375, 0.009019851684570312, 0.01337432861328125, 0.017728805541992188, 0.022083282470703125, 0.026437759399414062, 0.030792236328125, 0.03514671325683594, 0.039501190185546875, 0.04385566711425781, 0.04821014404296875, 0.05256462097167969, 0.056919097900390625, 0.06127357482910156, 0.0656280517578125, 0.06998252868652344, 0.07433700561523438, 0.07869148254394531, 0.08304595947265625, 0.08740043640136719, 0.09175491333007812, 0.09610939025878906, 0.1004638671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 9.0, 2.0, 7.0, 11.0, 14.0, 17.0, 17.0, 25.0, 25.0, 34.0, 54.0, 54.0, 67.0, 87.0, 114.0, 152.0, 286.0, 510.0, 1051.0, 2791.0, 10139.0, 53946.0, 430242.0, 474454.0, 58168.0, 10757.0, 2897.0, 1063.0, 540.0, 295.0, 187.0, 105.0, 93.0, 66.0, 54.0, 36.0, 39.0, 39.0, 22.0, 20.0, 14.0, 16.0, 5.0, 8.0, 7.0, 11.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.25048828125, -0.24333572387695312, -0.23618316650390625, -0.22903060913085938, -0.2218780517578125, -0.21472549438476562, -0.20757293701171875, -0.20042037963867188, -0.193267822265625, -0.18611526489257812, -0.17896270751953125, -0.17181015014648438, -0.1646575927734375, -0.15750503540039062, -0.15035247802734375, -0.14319992065429688, -0.13604736328125, -0.12889480590820312, -0.12174224853515625, -0.11458969116210938, -0.1074371337890625, -0.10028457641601562, -0.09313201904296875, -0.08597946166992188, -0.078826904296875, -0.07167434692382812, -0.06452178955078125, -0.057369232177734375, -0.0502166748046875, -0.043064117431640625, -0.03591156005859375, -0.028759002685546875, -0.0216064453125, -0.014453887939453125, -0.00730133056640625, -0.000148773193359375, 0.0070037841796875, 0.014156341552734375, 0.02130889892578125, 0.028461456298828125, 0.035614013671875, 0.042766571044921875, 0.04991912841796875, 0.057071685791015625, 0.0642242431640625, 0.07137680053710938, 0.07852935791015625, 0.08568191528320312, 0.09283447265625, 0.09998703002929688, 0.10713958740234375, 0.11429214477539062, 0.1214447021484375, 0.12859725952148438, 0.13574981689453125, 0.14290237426757812, 0.150054931640625, 0.15720748901367188, 0.16436004638671875, 0.17151260375976562, 0.1786651611328125, 0.18581771850585938, 0.19297027587890625, 0.20012283325195312, 0.207275390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 4.0, 14.0, 12.0, 15.0, 20.0, 22.0, 22.0, 23.0, 26.0, 45.0, 33.0, 52.0, 61.0, 51.0, 55.0, 46.0, 60.0, 57.0, 38.0, 49.0, 33.0, 37.0, 28.0, 25.0, 30.0, 27.0, 17.0, 23.0, 19.0, 11.0, 13.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5621910095214844, -0.5457687377929688, -0.5293464660644531, -0.5129241943359375, -0.4965019226074219, -0.48007965087890625, -0.4636573791503906, -0.447235107421875, -0.4308128356933594, -0.41439056396484375, -0.3979682922363281, -0.3815460205078125, -0.3651237487792969, -0.34870147705078125, -0.3322792053222656, -0.31585693359375, -0.2994346618652344, -0.28301239013671875, -0.2665901184082031, -0.2501678466796875, -0.23374557495117188, -0.21732330322265625, -0.20090103149414062, -0.184478759765625, -0.16805648803710938, -0.15163421630859375, -0.13521194458007812, -0.1187896728515625, -0.10236740112304688, -0.08594512939453125, -0.06952285766601562, -0.0531005859375, -0.036678314208984375, -0.02025604248046875, -0.003833770751953125, 0.0125885009765625, 0.029010772705078125, 0.04543304443359375, 0.061855316162109375, 0.078277587890625, 0.09469985961914062, 0.11112213134765625, 0.12754440307617188, 0.1439666748046875, 0.16038894653320312, 0.17681121826171875, 0.19323348999023438, 0.20965576171875, 0.22607803344726562, 0.24250030517578125, 0.2589225769042969, 0.2753448486328125, 0.2917671203613281, 0.30818939208984375, 0.3246116638183594, 0.341033935546875, 0.3574562072753906, 0.37387847900390625, 0.3903007507324219, 0.4067230224609375, 0.4231452941894531, 0.43956756591796875, 0.4559898376464844, 0.472412109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 6.0, 8.0, 7.0, 15.0, 24.0, 34.0, 44.0, 72.0, 126.0, 267.0, 615.0, 1608.0, 6094.0, 51659.0, 887314.0, 88952.0, 8331.0, 1966.0, 729.0, 297.0, 134.0, 72.0, 54.0, 41.0, 23.0, 14.0, 12.0, 11.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1829833984375, -0.1778411865234375, -0.172698974609375, -0.1675567626953125, -0.16241455078125, -0.1572723388671875, -0.152130126953125, -0.1469879150390625, -0.141845703125, -0.1367034912109375, -0.131561279296875, -0.1264190673828125, -0.12127685546875, -0.1161346435546875, -0.110992431640625, -0.1058502197265625, -0.1007080078125, -0.0955657958984375, -0.090423583984375, -0.0852813720703125, -0.08013916015625, -0.0749969482421875, -0.069854736328125, -0.0647125244140625, -0.0595703125, -0.0544281005859375, -0.049285888671875, -0.0441436767578125, -0.03900146484375, -0.0338592529296875, -0.028717041015625, -0.0235748291015625, -0.0184326171875, -0.0132904052734375, -0.008148193359375, -0.0030059814453125, 0.00213623046875, 0.0072784423828125, 0.012420654296875, 0.0175628662109375, 0.022705078125, 0.0278472900390625, 0.032989501953125, 0.0381317138671875, 0.04327392578125, 0.0484161376953125, 0.053558349609375, 0.0587005615234375, 0.0638427734375, 0.0689849853515625, 0.074127197265625, 0.0792694091796875, 0.08441162109375, 0.0895538330078125, 0.094696044921875, 0.0998382568359375, 0.10498046875, 0.1101226806640625, 0.115264892578125, 0.1204071044921875, 0.12554931640625, 0.1306915283203125, 0.135833740234375, 0.1409759521484375, 0.1461181640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 8.0, 14.0, 12.0, 18.0, 26.0, 34.0, 55.0, 79.0, 127.0, 149.0, 133.0, 103.0, 65.0, 41.0, 32.0, 14.0, 20.0, 11.0, 12.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.693601608276367e-05, -6.500538438558578e-05, -6.30747526884079e-05, -6.114412099123001e-05, -5.9213489294052124e-05, -5.728285759687424e-05, -5.535222589969635e-05, -5.342159420251846e-05, -5.1490962505340576e-05, -4.956033080816269e-05, -4.76296991109848e-05, -4.5699067413806915e-05, -4.376843571662903e-05, -4.183780401945114e-05, -3.9907172322273254e-05, -3.797654062509537e-05, -3.604590892791748e-05, -3.4115277230739594e-05, -3.2184645533561707e-05, -3.025401383638382e-05, -2.8323382139205933e-05, -2.6392750442028046e-05, -2.446211874485016e-05, -2.2531487047672272e-05, -2.0600855350494385e-05, -1.8670223653316498e-05, -1.673959195613861e-05, -1.4808960258960724e-05, -1.2878328561782837e-05, -1.094769686460495e-05, -9.017065167427063e-06, -7.086433470249176e-06, -5.155801773071289e-06, -3.225170075893402e-06, -1.2945383787155151e-06, 6.360933184623718e-07, 2.566725015640259e-06, 4.497356712818146e-06, 6.427988409996033e-06, 8.35862010717392e-06, 1.0289251804351807e-05, 1.2219883501529694e-05, 1.415051519870758e-05, 1.6081146895885468e-05, 1.8011778593063354e-05, 1.994241029024124e-05, 2.187304198741913e-05, 2.3803673684597015e-05, 2.5734305381774902e-05, 2.766493707895279e-05, 2.9595568776130676e-05, 3.152620047330856e-05, 3.345683217048645e-05, 3.538746386766434e-05, 3.7318095564842224e-05, 3.924872726202011e-05, 4.1179358959198e-05, 4.3109990656375885e-05, 4.504062235355377e-05, 4.697125405073166e-05, 4.8901885747909546e-05, 5.083251744508743e-05, 5.276314914226532e-05, 5.469378083944321e-05, 5.6624412536621094e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 5.0, 7.0, 7.0, 10.0, 27.0, 39.0, 50.0, 108.0, 187.0, 529.0, 1614.0, 6221.0, 46957.0, 814510.0, 162252.0, 11929.0, 2586.0, 786.0, 332.0, 146.0, 81.0, 49.0, 31.0, 29.0, 6.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14064979553222656, -0.13591384887695312, -0.1311779022216797, -0.12644195556640625, -0.12170600891113281, -0.11697006225585938, -0.11223411560058594, -0.1074981689453125, -0.10276222229003906, -0.09802627563476562, -0.09329032897949219, -0.08855438232421875, -0.08381843566894531, -0.07908248901367188, -0.07434654235839844, -0.069610595703125, -0.06487464904785156, -0.060138702392578125, -0.05540275573730469, -0.05066680908203125, -0.04593086242675781, -0.041194915771484375, -0.03645896911621094, -0.0317230224609375, -0.026987075805664062, -0.022251129150390625, -0.017515182495117188, -0.01277923583984375, -0.008043289184570312, -0.003307342529296875, 0.0014286041259765625, 0.00616455078125, 0.010900497436523438, 0.015636444091796875, 0.020372390747070312, 0.02510833740234375, 0.029844284057617188, 0.034580230712890625, 0.03931617736816406, 0.0440521240234375, 0.04878807067871094, 0.053524017333984375, 0.05825996398925781, 0.06299591064453125, 0.06773185729980469, 0.07246780395507812, 0.07720375061035156, 0.081939697265625, 0.08667564392089844, 0.09141159057617188, 0.09614753723144531, 0.10088348388671875, 0.10561943054199219, 0.11035537719726562, 0.11509132385253906, 0.1198272705078125, 0.12456321716308594, 0.12929916381835938, 0.1340351104736328, 0.13877105712890625, 0.1435070037841797, 0.14824295043945312, 0.15297889709472656, 0.15771484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 11.0, 21.0, 38.0, 88.0, 161.0, 232.0, 206.0, 103.0, 44.0, 28.0, 14.0, 11.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3432121276855469, -0.33437347412109375, -0.3255348205566406, -0.3166961669921875, -0.3078575134277344, -0.29901885986328125, -0.2901802062988281, -0.281341552734375, -0.2725028991699219, -0.26366424560546875, -0.2548255920410156, -0.2459869384765625, -0.23714828491210938, -0.22830963134765625, -0.21947097778320312, -0.21063232421875, -0.20179367065429688, -0.19295501708984375, -0.18411636352539062, -0.1752777099609375, -0.16643905639648438, -0.15760040283203125, -0.14876174926757812, -0.139923095703125, -0.13108444213867188, -0.12224578857421875, -0.11340713500976562, -0.1045684814453125, -0.09572982788085938, -0.08689117431640625, -0.07805252075195312, -0.0692138671875, -0.060375213623046875, -0.05153656005859375, -0.042697906494140625, -0.0338592529296875, -0.025020599365234375, -0.01618194580078125, -0.007343292236328125, 0.001495361328125, 0.010334014892578125, 0.01917266845703125, 0.028011322021484375, 0.0368499755859375, 0.045688629150390625, 0.05452728271484375, 0.06336593627929688, 0.07220458984375, 0.08104324340820312, 0.08988189697265625, 0.09872055053710938, 0.1075592041015625, 0.11639785766601562, 0.12523651123046875, 0.13407516479492188, 0.142913818359375, 0.15175247192382812, 0.16059112548828125, 0.16942977905273438, 0.1782684326171875, 0.18710708618164062, 0.19594573974609375, 0.20478439331054688, 0.213623046875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 5.0, 11.0, 7.0, 19.0, 48.0, 55.0, 79.0, 109.0, 139.0, 141.0, 142.0, 109.0, 47.0, 34.0, 23.0, 9.0, 16.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0867371559143066, -2.0298352241516113, -1.9729334115982056, -1.9160315990447998, -1.8591296672821045, -1.8022278547286987, -1.7453259229660034, -1.6884241104125977, -1.6315221786499023, -1.5746203660964966, -1.5177184343338013, -1.4608166217803955, -1.4039146900177002, -1.3470128774642944, -1.2901109457015991, -1.2332091331481934, -1.176307201385498, -1.1194053888320923, -1.062503457069397, -1.0056016445159912, -0.9486997127532959, -0.8917979001998901, -0.8348959684371948, -0.7779941558837891, -0.7210923433303833, -0.6641904711723328, -0.6072885990142822, -0.5503867268562317, -0.49348485469818115, -0.436583012342453, -0.37968114018440247, -0.32277926802635193, -0.265877366065979, -0.20897549390792847, -0.15207362174987793, -0.09517176449298859, -0.03826989233493805, 0.018631964921951294, 0.07553383708000183, 0.13243570923805237, 0.1893375813961029, 0.24623945355415344, 0.303141325712204, 0.36004316806793213, 0.41694504022598267, 0.4738469123840332, 0.5307487845420837, 0.5876506567001343, 0.6445525288581848, 0.7014544010162354, 0.7583562731742859, 0.8152581453323364, 0.872160017490387, 0.9290618896484375, 0.9859637022018433, 1.0428656339645386, 1.0997674465179443, 1.15666925907135, 1.2135711908340454, 1.2704730033874512, 1.3273749351501465, 1.3842767477035522, 1.4411786794662476, 1.4980804920196533, 1.5549824237823486]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 7.0, 11.0, 7.0, 17.0, 13.0, 17.0, 12.0, 25.0, 27.0, 25.0, 24.0, 36.0, 30.0, 41.0, 54.0, 35.0, 55.0, 64.0, 50.0, 48.0, 47.0, 43.0, 36.0, 33.0, 46.0, 26.0, 33.0, 24.0, 18.0, 18.0, 12.0, 15.0, 10.0, 4.0, 6.0, 2.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0074591636657715, -1.9423013925552368, -1.8771436214447021, -1.811985969543457, -1.7468281984329224, -1.6816704273223877, -1.6165127754211426, -1.551355004310608, -1.4861972332000732, -1.4210394620895386, -1.355881690979004, -1.2907240390777588, -1.2255662679672241, -1.1604084968566895, -1.0952508449554443, -1.0300930738449097, -0.964935302734375, -0.8997775316238403, -0.8346198201179504, -0.7694621086120605, -0.7043043375015259, -0.6391465663909912, -0.5739888548851013, -0.5088311433792114, -0.44367337226867676, -0.3785156309604645, -0.3133578896522522, -0.24820014834403992, -0.18304240703582764, -0.11788466572761536, -0.052726924419403076, 0.012430816888809204, 0.07758855819702148, 0.14274629950523376, 0.20790404081344604, 0.2730617821216583, 0.3382195234298706, 0.4033772647380829, 0.46853500604629517, 0.5336927175521851, 0.5988504886627197, 0.6640082597732544, 0.7291659712791443, 0.7943236827850342, 0.8594814538955688, 0.9246392250061035, 0.9897969365119934, 1.0549546480178833, 1.120112419128418, 1.1852701902389526, 1.2504279613494873, 1.3155856132507324, 1.380743384361267, 1.4459011554718018, 1.5110588073730469, 1.5762165784835815, 1.6413743495941162, 1.7065321207046509, 1.7716898918151855, 1.8368475437164307, 1.9020053148269653, 1.9671630859375, 2.032320737838745, 2.0974786281585693, 2.1626362800598145]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 7.0, 11.0, 14.0, 24.0, 23.0, 35.0, 60.0, 99.0, 122.0, 170.0, 246.0, 374.0, 605.0, 963.0, 1760.0, 3468.0, 9282.0, 49489.0, 4014737.0, 91139.0, 12308.0, 4203.0, 2075.0, 1086.0, 684.0, 444.0, 265.0, 190.0, 105.0, 87.0, 55.0, 50.0, 30.0, 13.0, 14.0, 9.0, 5.0, 5.0, 10.0, 1.0, 4.0, 3.0], "bins": [-0.2254638671875, -0.2199115753173828, -0.21435928344726562, -0.20880699157714844, -0.20325469970703125, -0.19770240783691406, -0.19215011596679688, -0.1865978240966797, -0.1810455322265625, -0.1754932403564453, -0.16994094848632812, -0.16438865661621094, -0.15883636474609375, -0.15328407287597656, -0.14773178100585938, -0.1421794891357422, -0.136627197265625, -0.1310749053955078, -0.12552261352539062, -0.11997032165527344, -0.11441802978515625, -0.10886573791503906, -0.10331344604492188, -0.09776115417480469, -0.0922088623046875, -0.08665657043457031, -0.08110427856445312, -0.07555198669433594, -0.06999969482421875, -0.06444740295410156, -0.058895111083984375, -0.05334281921386719, -0.04779052734375, -0.04223823547363281, -0.036685943603515625, -0.031133651733398438, -0.02558135986328125, -0.020029067993164062, -0.014476776123046875, -0.008924484252929688, -0.0033721923828125, 0.0021800994873046875, 0.007732391357421875, 0.013284683227539062, 0.01883697509765625, 0.024389266967773438, 0.029941558837890625, 0.03549385070800781, 0.041046142578125, 0.04659843444824219, 0.052150726318359375, 0.05770301818847656, 0.06325531005859375, 0.06880760192871094, 0.07435989379882812, 0.07991218566894531, 0.0854644775390625, 0.09101676940917969, 0.09656906127929688, 0.10212135314941406, 0.10767364501953125, 0.11322593688964844, 0.11877822875976562, 0.12433052062988281, 0.1298828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 8.0, 6.0, 16.0, 9.0, 18.0, 27.0, 27.0, 28.0, 39.0, 36.0, 40.0, 49.0, 58.0, 54.0, 70.0, 44.0, 53.0, 56.0, 50.0, 48.0, 46.0, 25.0, 30.0, 30.0, 21.0, 20.0, 16.0, 14.0, 11.0, 3.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.1556396484375, -0.15176105499267578, -0.14788246154785156, -0.14400386810302734, -0.14012527465820312, -0.1362466812133789, -0.1323680877685547, -0.12848949432373047, -0.12461090087890625, -0.12073230743408203, -0.11685371398925781, -0.1129751205444336, -0.10909652709960938, -0.10521793365478516, -0.10133934020996094, -0.09746074676513672, -0.0935821533203125, -0.08970355987548828, -0.08582496643066406, -0.08194637298583984, -0.07806777954101562, -0.0741891860961914, -0.07031059265136719, -0.06643199920654297, -0.06255340576171875, -0.05867481231689453, -0.05479621887207031, -0.050917625427246094, -0.047039031982421875, -0.043160438537597656, -0.03928184509277344, -0.03540325164794922, -0.031524658203125, -0.02764606475830078, -0.023767471313476562, -0.019888877868652344, -0.016010284423828125, -0.012131690979003906, -0.008253097534179688, -0.004374504089355469, -0.00049591064453125, 0.0033826828002929688, 0.0072612762451171875, 0.011139869689941406, 0.015018463134765625, 0.018897056579589844, 0.022775650024414062, 0.02665424346923828, 0.0305328369140625, 0.03441143035888672, 0.03829002380371094, 0.042168617248535156, 0.046047210693359375, 0.049925804138183594, 0.05380439758300781, 0.05768299102783203, 0.06156158447265625, 0.06544017791748047, 0.06931877136230469, 0.0731973648071289, 0.07707595825195312, 0.08095455169677734, 0.08483314514160156, 0.08871173858642578, 0.09259033203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 6.0, 9.0, 13.0, 14.0, 18.0, 28.0, 45.0, 57.0, 80.0, 104.0, 136.0, 229.0, 360.0, 644.0, 1120.0, 2456.0, 7450.0, 85443.0, 4066232.0, 21460.0, 4264.0, 1746.0, 854.0, 472.0, 307.0, 195.0, 138.0, 99.0, 80.0, 54.0, 43.0, 33.0, 27.0, 12.0, 8.0, 12.0, 13.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.29093170166015625, -0.2813262939453125, -0.27172088623046875, -0.262115478515625, -0.25251007080078125, -0.2429046630859375, -0.23329925537109375, -0.22369384765625, -0.21408843994140625, -0.2044830322265625, -0.19487762451171875, -0.185272216796875, -0.17566680908203125, -0.1660614013671875, -0.15645599365234375, -0.1468505859375, -0.13724517822265625, -0.1276397705078125, -0.11803436279296875, -0.108428955078125, -0.09882354736328125, -0.0892181396484375, -0.07961273193359375, -0.07000732421875, -0.06040191650390625, -0.0507965087890625, -0.04119110107421875, -0.031585693359375, -0.02198028564453125, -0.0123748779296875, -0.00276947021484375, 0.0068359375, 0.01644134521484375, 0.0260467529296875, 0.03565216064453125, 0.045257568359375, 0.05486297607421875, 0.0644683837890625, 0.07407379150390625, 0.08367919921875, 0.09328460693359375, 0.1028900146484375, 0.11249542236328125, 0.122100830078125, 0.13170623779296875, 0.1413116455078125, 0.15091705322265625, 0.1605224609375, 0.17012786865234375, 0.1797332763671875, 0.18933868408203125, 0.198944091796875, 0.20854949951171875, 0.2181549072265625, 0.22776031494140625, 0.23736572265625, 0.24697113037109375, 0.2565765380859375, 0.26618194580078125, 0.275787353515625, 0.28539276123046875, 0.2949981689453125, 0.30460357666015625, 0.314208984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 22.0, 128.0, 3610.0, 229.0, 43.0, 18.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21435546875, -0.2073535919189453, -0.20035171508789062, -0.19334983825683594, -0.18634796142578125, -0.17934608459472656, -0.17234420776367188, -0.1653423309326172, -0.1583404541015625, -0.1513385772705078, -0.14433670043945312, -0.13733482360839844, -0.13033294677734375, -0.12333106994628906, -0.11632919311523438, -0.10932731628417969, -0.102325439453125, -0.09532356262207031, -0.08832168579101562, -0.08131980895996094, -0.07431793212890625, -0.06731605529785156, -0.060314178466796875, -0.05331230163574219, -0.0463104248046875, -0.03930854797363281, -0.032306671142578125, -0.025304794311523438, -0.01830291748046875, -0.011301040649414062, -0.004299163818359375, 0.0027027130126953125, 0.00970458984375, 0.016706466674804688, 0.023708343505859375, 0.030710220336914062, 0.03771209716796875, 0.04471397399902344, 0.051715850830078125, 0.05871772766113281, 0.0657196044921875, 0.07272148132324219, 0.07972335815429688, 0.08672523498535156, 0.09372711181640625, 0.10072898864746094, 0.10773086547851562, 0.11473274230957031, 0.121734619140625, 0.1287364959716797, 0.13573837280273438, 0.14274024963378906, 0.14974212646484375, 0.15674400329589844, 0.16374588012695312, 0.1707477569580078, 0.1777496337890625, 0.1847515106201172, 0.19175338745117188, 0.19875526428222656, 0.20575714111328125, 0.21275901794433594, 0.21976089477539062, 0.2267627716064453, 0.2337646484375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 11.0, 23.0, 40.0, 58.0, 83.0, 121.0, 147.0, 184.0, 127.0, 79.0, 46.0, 31.0, 13.0, 10.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36494317650794983, -0.3513897657394409, -0.3378363847732544, -0.3242829740047455, -0.3107295632362366, -0.29717618227005005, -0.28362277150154114, -0.2700693607330322, -0.2565159797668457, -0.24296258389949799, -0.22940917313098907, -0.21585577726364136, -0.20230236649513245, -0.18874897062778473, -0.175195574760437, -0.1616421639919281, -0.1480887532234192, -0.13453535735607147, -0.12098194658756256, -0.10742855072021484, -0.09387514740228653, -0.08032174408435822, -0.0667683482170105, -0.053214944899082184, -0.03966154158115387, -0.026108140125870705, -0.01255473867058754, 0.000998660922050476, 0.01455206423997879, 0.028105467557907104, 0.04165886342525482, 0.055212266743183136, 0.06876569986343384, 0.08231910318136215, 0.09587250649929047, 0.10942590236663818, 0.1229793056845665, 0.1365327090024948, 0.15008610486984253, 0.16363951563835144, 0.17719291150569916, 0.19074630737304688, 0.2042997181415558, 0.2178531140089035, 0.23140650987625122, 0.24495992064476013, 0.25851333141326904, 0.27206671237945557, 0.2856201231479645, 0.2991735339164734, 0.3127269148826599, 0.3262803256511688, 0.33983373641967773, 0.35338711738586426, 0.36694052815437317, 0.3804939389228821, 0.3940473198890686, 0.4076007306575775, 0.42115411162376404, 0.43470752239227295, 0.44826093316078186, 0.46181434392929077, 0.4753677248954773, 0.4889211356639862, 0.5024745464324951]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 14.0, 21.0, 22.0, 31.0, 38.0, 36.0, 38.0, 37.0, 45.0, 55.0, 54.0, 66.0, 52.0, 46.0, 52.0, 59.0, 59.0, 43.0, 33.0, 43.0, 26.0, 23.0, 20.0, 19.0, 13.0, 7.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24484783411026, -0.23513230681419373, -0.22541677951812744, -0.21570125222206116, -0.20598572492599487, -0.1962701976299286, -0.1865546703338623, -0.17683914303779602, -0.16712361574172974, -0.15740808844566345, -0.14769256114959717, -0.13797703385353088, -0.1282615065574646, -0.11854597926139832, -0.10883045941591263, -0.09911493211984634, -0.08939941227436066, -0.07968388497829437, -0.06996835768222809, -0.0602528341114521, -0.05053730681538582, -0.040821779519319534, -0.03110625594854355, -0.021390728652477264, -0.01167520135641098, -0.0019596749916672707, 0.007755851373076439, 0.017471376806497574, 0.027186904102563858, 0.03690243139863014, 0.04661795496940613, 0.05633348226547241, 0.0660490095615387, 0.07576453685760498, 0.08548006415367126, 0.09519559144973755, 0.10491111874580383, 0.11462664604187012, 0.1243421658873558, 0.13405770063400269, 0.14377322793006897, 0.15348875522613525, 0.16320428252220154, 0.17291980981826782, 0.1826353371143341, 0.1923508644104004, 0.20206639170646667, 0.21178191900253296, 0.22149743139743805, 0.23121295869350433, 0.24092848598957062, 0.2506439983844757, 0.260359525680542, 0.2700750529766083, 0.27979058027267456, 0.28950610756874084, 0.29922163486480713, 0.3089371621608734, 0.3186526894569397, 0.328368216753006, 0.33808374404907227, 0.34779927134513855, 0.35751479864120483, 0.3672303259372711, 0.3769458532333374]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 13.0, 11.0, 19.0, 32.0, 27.0, 47.0, 85.0, 126.0, 244.0, 493.0, 1018.0, 2349.0, 6507.0, 22587.0, 104919.0, 523954.0, 310731.0, 54349.0, 13553.0, 4168.0, 1690.0, 732.0, 343.0, 214.0, 119.0, 78.0, 45.0, 31.0, 16.0, 16.0, 7.0, 10.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.260986328125, -0.2538948059082031, -0.24680328369140625, -0.23971176147460938, -0.2326202392578125, -0.22552871704101562, -0.21843719482421875, -0.21134567260742188, -0.204254150390625, -0.19716262817382812, -0.19007110595703125, -0.18297958374023438, -0.1758880615234375, -0.16879653930664062, -0.16170501708984375, -0.15461349487304688, -0.14752197265625, -0.14043045043945312, -0.13333892822265625, -0.12624740600585938, -0.1191558837890625, -0.11206436157226562, -0.10497283935546875, -0.09788131713867188, -0.090789794921875, -0.08369827270507812, -0.07660675048828125, -0.06951522827148438, -0.0624237060546875, -0.055332183837890625, -0.04824066162109375, -0.041149139404296875, -0.0340576171875, -0.026966094970703125, -0.01987457275390625, -0.012783050537109375, -0.0056915283203125, 0.001399993896484375, 0.00849151611328125, 0.015583038330078125, 0.022674560546875, 0.029766082763671875, 0.03685760498046875, 0.043949127197265625, 0.0510406494140625, 0.058132171630859375, 0.06522369384765625, 0.07231521606445312, 0.07940673828125, 0.08649826049804688, 0.09358978271484375, 0.10068130493164062, 0.1077728271484375, 0.11486434936523438, 0.12195587158203125, 0.12904739379882812, 0.136138916015625, 0.14323043823242188, 0.15032196044921875, 0.15741348266601562, 0.1645050048828125, 0.17159652709960938, 0.17868804931640625, 0.18577957153320312, 0.19287109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 13.0, 15.0, 12.0, 11.0, 20.0, 16.0, 35.0, 27.0, 33.0, 37.0, 51.0, 49.0, 36.0, 59.0, 51.0, 57.0, 54.0, 41.0, 48.0, 40.0, 43.0, 34.0, 30.0, 21.0, 27.0, 24.0, 21.0, 15.0, 12.0, 12.0, 8.0, 1.0, 15.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.147216796875, -0.1434640884399414, -0.1397113800048828, -0.13595867156982422, -0.13220596313476562, -0.12845325469970703, -0.12470054626464844, -0.12094783782958984, -0.11719512939453125, -0.11344242095947266, -0.10968971252441406, -0.10593700408935547, -0.10218429565429688, -0.09843158721923828, -0.09467887878417969, -0.0909261703491211, -0.0871734619140625, -0.0834207534790039, -0.07966804504394531, -0.07591533660888672, -0.07216262817382812, -0.06840991973876953, -0.06465721130371094, -0.060904502868652344, -0.05715179443359375, -0.053399085998535156, -0.04964637756347656, -0.04589366912841797, -0.042140960693359375, -0.03838825225830078, -0.03463554382324219, -0.030882835388183594, -0.027130126953125, -0.023377418518066406, -0.019624710083007812, -0.01587200164794922, -0.012119293212890625, -0.008366584777832031, -0.0046138763427734375, -0.0008611679077148438, 0.00289154052734375, 0.006644248962402344, 0.010396957397460938, 0.014149665832519531, 0.017902374267578125, 0.02165508270263672, 0.025407791137695312, 0.029160499572753906, 0.0329132080078125, 0.036665916442871094, 0.04041862487792969, 0.04417133331298828, 0.047924041748046875, 0.05167675018310547, 0.05542945861816406, 0.059182167053222656, 0.06293487548828125, 0.06668758392333984, 0.07044029235839844, 0.07419300079345703, 0.07794570922851562, 0.08169841766357422, 0.08545112609863281, 0.0892038345336914, 0.09295654296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 11.0, 11.0, 23.0, 31.0, 32.0, 42.0, 63.0, 97.0, 156.0, 257.0, 423.0, 940.0, 2405.0, 9137.0, 56664.0, 659879.0, 283628.0, 26044.0, 5401.0, 1654.0, 649.0, 358.0, 212.0, 130.0, 78.0, 48.0, 52.0, 32.0, 30.0, 14.0, 7.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25927734375, -0.2499542236328125, -0.240631103515625, -0.2313079833984375, -0.22198486328125, -0.2126617431640625, -0.203338623046875, -0.1940155029296875, -0.1846923828125, -0.1753692626953125, -0.166046142578125, -0.1567230224609375, -0.14739990234375, -0.1380767822265625, -0.128753662109375, -0.1194305419921875, -0.110107421875, -0.1007843017578125, -0.091461181640625, -0.0821380615234375, -0.07281494140625, -0.0634918212890625, -0.054168701171875, -0.0448455810546875, -0.0355224609375, -0.0261993408203125, -0.016876220703125, -0.0075531005859375, 0.00177001953125, 0.0110931396484375, 0.020416259765625, 0.0297393798828125, 0.0390625, 0.0483856201171875, 0.057708740234375, 0.0670318603515625, 0.07635498046875, 0.0856781005859375, 0.095001220703125, 0.1043243408203125, 0.1136474609375, 0.1229705810546875, 0.132293701171875, 0.1416168212890625, 0.15093994140625, 0.1602630615234375, 0.169586181640625, 0.1789093017578125, 0.188232421875, 0.1975555419921875, 0.206878662109375, 0.2162017822265625, 0.22552490234375, 0.2348480224609375, 0.244171142578125, 0.2534942626953125, 0.2628173828125, 0.2721405029296875, 0.281463623046875, 0.2907867431640625, 0.30010986328125, 0.3094329833984375, 0.318756103515625, 0.3280792236328125, 0.33740234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 10.0, 12.0, 7.0, 10.0, 15.0, 12.0, 19.0, 23.0, 29.0, 27.0, 31.0, 39.0, 44.0, 37.0, 47.0, 38.0, 47.0, 51.0, 51.0, 47.0, 59.0, 44.0, 55.0, 35.0, 39.0, 36.0, 32.0, 16.0, 16.0, 8.0, 16.0, 8.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4536552429199219, -0.43953704833984375, -0.4254188537597656, -0.4113006591796875, -0.3971824645996094, -0.38306427001953125, -0.3689460754394531, -0.354827880859375, -0.3407096862792969, -0.32659149169921875, -0.3124732971191406, -0.2983551025390625, -0.2842369079589844, -0.27011871337890625, -0.2560005187988281, -0.24188232421875, -0.22776412963867188, -0.21364593505859375, -0.19952774047851562, -0.1854095458984375, -0.17129135131835938, -0.15717315673828125, -0.14305496215820312, -0.128936767578125, -0.11481857299804688, -0.10070037841796875, -0.08658218383789062, -0.0724639892578125, -0.058345794677734375, -0.04422760009765625, -0.030109405517578125, -0.0159912109375, -0.001873016357421875, 0.01224517822265625, 0.026363372802734375, 0.0404815673828125, 0.054599761962890625, 0.06871795654296875, 0.08283615112304688, 0.096954345703125, 0.11107254028320312, 0.12519073486328125, 0.13930892944335938, 0.1534271240234375, 0.16754531860351562, 0.18166351318359375, 0.19578170776367188, 0.20989990234375, 0.22401809692382812, 0.23813629150390625, 0.2522544860839844, 0.2663726806640625, 0.2804908752441406, 0.29460906982421875, 0.3087272644042969, 0.322845458984375, 0.3369636535644531, 0.35108184814453125, 0.3652000427246094, 0.3793182373046875, 0.3934364318847656, 0.40755462646484375, 0.4216728210449219, 0.435791015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 3.0, 8.0, 12.0, 23.0, 36.0, 62.0, 75.0, 142.0, 276.0, 594.0, 1770.0, 7683.0, 83025.0, 876793.0, 68452.0, 6881.0, 1545.0, 540.0, 255.0, 133.0, 78.0, 54.0, 41.0, 15.0, 15.0, 10.0, 7.0, 3.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1175537109375, -0.11381816864013672, -0.11008262634277344, -0.10634708404541016, -0.10261154174804688, -0.0988759994506836, -0.09514045715332031, -0.09140491485595703, -0.08766937255859375, -0.08393383026123047, -0.08019828796386719, -0.0764627456665039, -0.07272720336914062, -0.06899166107177734, -0.06525611877441406, -0.06152057647705078, -0.0577850341796875, -0.05404949188232422, -0.05031394958496094, -0.046578407287597656, -0.042842864990234375, -0.039107322692871094, -0.03537178039550781, -0.03163623809814453, -0.02790069580078125, -0.02416515350341797, -0.020429611206054688, -0.016694068908691406, -0.012958526611328125, -0.009222984313964844, -0.0054874420166015625, -0.0017518997192382812, 0.001983642578125, 0.005719184875488281, 0.009454727172851562, 0.013190269470214844, 0.016925811767578125, 0.020661354064941406, 0.024396896362304688, 0.02813243865966797, 0.03186798095703125, 0.03560352325439453, 0.03933906555175781, 0.043074607849121094, 0.046810150146484375, 0.050545692443847656, 0.05428123474121094, 0.05801677703857422, 0.0617523193359375, 0.06548786163330078, 0.06922340393066406, 0.07295894622802734, 0.07669448852539062, 0.0804300308227539, 0.08416557312011719, 0.08790111541748047, 0.09163665771484375, 0.09537220001220703, 0.09910774230957031, 0.1028432846069336, 0.10657882690429688, 0.11031436920166016, 0.11404991149902344, 0.11778545379638672, 0.12152099609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 9.0, 9.0, 7.0, 16.0, 13.0, 20.0, 14.0, 29.0, 30.0, 43.0, 58.0, 72.0, 119.0, 94.0, 123.0, 86.0, 56.0, 62.0, 26.0, 28.0, 17.0, 11.0, 11.0, 8.0, 7.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.358457565307617e-05, -5.211867392063141e-05, -5.0652772188186646e-05, -4.918687045574188e-05, -4.772096872329712e-05, -4.6255066990852356e-05, -4.478916525840759e-05, -4.332326352596283e-05, -4.1857361793518066e-05, -4.03914600610733e-05, -3.892555832862854e-05, -3.745965659618378e-05, -3.5993754863739014e-05, -3.452785313129425e-05, -3.306195139884949e-05, -3.1596049666404724e-05, -3.013014793395996e-05, -2.8664246201515198e-05, -2.7198344469070435e-05, -2.573244273662567e-05, -2.4266541004180908e-05, -2.2800639271736145e-05, -2.1334737539291382e-05, -1.986883580684662e-05, -1.8402934074401855e-05, -1.6937032341957092e-05, -1.547113060951233e-05, -1.4005228877067566e-05, -1.2539327144622803e-05, -1.107342541217804e-05, -9.607523679733276e-06, -8.141621947288513e-06, -6.67572021484375e-06, -5.209818482398987e-06, -3.7439167499542236e-06, -2.2780150175094604e-06, -8.121132850646973e-07, 6.537884473800659e-07, 2.119690179824829e-06, 3.5855919122695923e-06, 5.0514936447143555e-06, 6.517395377159119e-06, 7.983297109603882e-06, 9.449198842048645e-06, 1.0915100574493408e-05, 1.2381002306938171e-05, 1.3846904039382935e-05, 1.5312805771827698e-05, 1.677870750427246e-05, 1.8244609236717224e-05, 1.9710510969161987e-05, 2.117641270160675e-05, 2.2642314434051514e-05, 2.4108216166496277e-05, 2.557411789894104e-05, 2.7040019631385803e-05, 2.8505921363830566e-05, 2.997182309627533e-05, 3.143772482872009e-05, 3.2903626561164856e-05, 3.436952829360962e-05, 3.583543002605438e-05, 3.7301331758499146e-05, 3.876723349094391e-05, 4.023313522338867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 1.0, 4.0, 9.0, 12.0, 20.0, 49.0, 92.0, 242.0, 928.0, 5940.0, 281365.0, 748002.0, 10119.0, 1195.0, 321.0, 121.0, 72.0, 28.0, 11.0, 11.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.271728515625, -0.2655668258666992, -0.25940513610839844, -0.25324344635009766, -0.24708175659179688, -0.2409200668334961, -0.2347583770751953, -0.22859668731689453, -0.22243499755859375, -0.21627330780029297, -0.2101116180419922, -0.2039499282836914, -0.19778823852539062, -0.19162654876708984, -0.18546485900878906, -0.17930316925048828, -0.1731414794921875, -0.16697978973388672, -0.16081809997558594, -0.15465641021728516, -0.14849472045898438, -0.1423330307006836, -0.1361713409423828, -0.13000965118408203, -0.12384796142578125, -0.11768627166748047, -0.11152458190917969, -0.1053628921508789, -0.09920120239257812, -0.09303951263427734, -0.08687782287597656, -0.08071613311767578, -0.074554443359375, -0.06839275360107422, -0.06223106384277344, -0.056069374084472656, -0.049907684326171875, -0.043745994567871094, -0.03758430480957031, -0.03142261505126953, -0.02526092529296875, -0.01909923553466797, -0.012937545776367188, -0.006775856018066406, -0.000614166259765625, 0.005547523498535156, 0.011709213256835938, 0.01787090301513672, 0.0240325927734375, 0.03019428253173828, 0.03635597229003906, 0.042517662048339844, 0.048679351806640625, 0.054841041564941406, 0.06100273132324219, 0.06716442108154297, 0.07332611083984375, 0.07948780059814453, 0.08564949035644531, 0.0918111801147461, 0.09797286987304688, 0.10413455963134766, 0.11029624938964844, 0.11645793914794922, 0.12261962890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 18.0, 18.0, 30.0, 54.0, 85.0, 127.0, 143.0, 144.0, 147.0, 85.0, 37.0, 23.0, 19.0, 13.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09143543243408203, -0.08661842346191406, -0.0818014144897461, -0.07698440551757812, -0.07216739654541016, -0.06735038757324219, -0.06253337860107422, -0.05771636962890625, -0.05289936065673828, -0.04808235168457031, -0.043265342712402344, -0.038448333740234375, -0.033631324768066406, -0.028814315795898438, -0.02399730682373047, -0.0191802978515625, -0.014363288879394531, -0.009546279907226562, -0.004729270935058594, 8.7738037109375e-05, 0.004904747009277344, 0.009721755981445312, 0.014538764953613281, 0.01935577392578125, 0.02417278289794922, 0.028989791870117188, 0.033806800842285156, 0.038623809814453125, 0.043440818786621094, 0.04825782775878906, 0.05307483673095703, 0.057891845703125, 0.06270885467529297, 0.06752586364746094, 0.0723428726196289, 0.07715988159179688, 0.08197689056396484, 0.08679389953613281, 0.09161090850830078, 0.09642791748046875, 0.10124492645263672, 0.10606193542480469, 0.11087894439697266, 0.11569595336914062, 0.1205129623413086, 0.12532997131347656, 0.13014698028564453, 0.1349639892578125, 0.13978099822998047, 0.14459800720214844, 0.1494150161743164, 0.15423202514648438, 0.15904903411865234, 0.1638660430908203, 0.16868305206298828, 0.17350006103515625, 0.17831707000732422, 0.1831340789794922, 0.18795108795166016, 0.19276809692382812, 0.1975851058959961, 0.20240211486816406, 0.20721912384033203, 0.2120361328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 9.0, 12.0, 72.0, 194.0, 342.0, 243.0, 92.0, 26.0, 14.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.448692321777344, -5.31413459777832, -5.179576873779297, -5.045019149780273, -4.91046142578125, -4.775903701782227, -4.641345977783203, -4.50678825378418, -4.372230529785156, -4.237672805786133, -4.103115081787109, -3.968557357788086, -3.8339996337890625, -3.699441909790039, -3.5648841857910156, -3.430326461791992, -3.295768976211548, -3.1612112522125244, -3.026653528213501, -2.8920958042144775, -2.757538080215454, -2.6229803562164307, -2.4884228706359863, -2.353865146636963, -2.2193074226379395, -2.084749698638916, -1.9501919746398926, -1.8156342506408691, -1.6810765266418457, -1.5465188026428223, -1.4119611978530884, -1.277403473854065, -1.142845630645752, -1.0082879066467285, -0.8737301826477051, -0.7391725182533264, -0.604614794254303, -0.47005707025527954, -0.3354994058609009, -0.20094168186187744, -0.066383957862854, 0.06817375123500824, 0.20273146033287048, 0.33728915452957153, 0.47184687852859497, 0.6064046025276184, 0.7409622669219971, 0.8755199909210205, 1.010077714920044, 1.1446354389190674, 1.2791931629180908, 1.4137508869171143, 1.5483086109161377, 1.6828663349151611, 1.817423939704895, 1.9519816637039185, 2.0865392684936523, 2.221096992492676, 2.355654716491699, 2.4902124404907227, 2.624770164489746, 2.7593278884887695, 2.893885612487793, 3.0284433364868164, 3.16300106048584]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 10.0, 13.0, 12.0, 22.0, 22.0, 23.0, 26.0, 28.0, 38.0, 47.0, 43.0, 50.0, 52.0, 56.0, 54.0, 72.0, 56.0, 58.0, 41.0, 39.0, 34.0, 37.0, 37.0, 23.0, 12.0, 11.0, 15.0, 9.0, 14.0, 11.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0071139335632324, -1.9408154487609863, -1.8745168447494507, -1.8082183599472046, -1.7419198751449585, -1.6756212711334229, -1.6093227863311768, -1.5430243015289307, -1.4767258167266846, -1.4104273319244385, -1.3441287279129028, -1.2778302431106567, -1.2115317583084106, -1.145233154296875, -1.078934669494629, -1.0126361846923828, -0.9463375806808472, -0.8800390362739563, -0.8137405514717102, -0.7474420070648193, -0.6811435222625732, -0.6148449778556824, -0.5485464334487915, -0.482247918844223, -0.41594940423965454, -0.34965088963508606, -0.2833523750305176, -0.2170538306236267, -0.15075531601905823, -0.08445680141448975, -0.018158257007598877, 0.048140257596969604, 0.11443877220153809, 0.18073728680610657, 0.24703581631183624, 0.3133343458175659, 0.3796328604221344, 0.4459313750267029, 0.5122299194335938, 0.5785284042358398, 0.6448269486427307, 0.7111254930496216, 0.7774239778518677, 0.8437225222587585, 0.9100210666656494, 0.9763195514678955, 1.0426180362701416, 1.1089166402816772, 1.1752151250839233, 1.2415136098861694, 1.307812213897705, 1.3741106986999512, 1.4404091835021973, 1.5067076683044434, 1.573006272315979, 1.639304757118225, 1.7056033611297607, 1.7719018459320068, 1.8382004499435425, 1.9044989347457886, 1.9707974195480347, 2.0370960235595703, 2.1033945083618164, 2.1696929931640625, 2.2359914779663086]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 16.0, 18.0, 28.0, 41.0, 42.0, 64.0, 82.0, 145.0, 239.0, 341.0, 539.0, 965.0, 1924.0, 4066.0, 9648.0, 31947.0, 394353.0, 3572750.0, 141243.0, 21139.0, 7595.0, 3271.0, 1590.0, 893.0, 458.0, 292.0, 158.0, 123.0, 62.0, 58.0, 34.0, 33.0, 23.0, 11.0, 10.0, 9.0, 17.0, 4.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17489242553710938, -0.16948699951171875, -0.16408157348632812, -0.1586761474609375, -0.15327072143554688, -0.14786529541015625, -0.14245986938476562, -0.137054443359375, -0.13164901733398438, -0.12624359130859375, -0.12083816528320312, -0.1154327392578125, -0.11002731323242188, -0.10462188720703125, -0.09921646118164062, -0.09381103515625, -0.08840560913085938, -0.08300018310546875, -0.07759475708007812, -0.0721893310546875, -0.06678390502929688, -0.06137847900390625, -0.055973052978515625, -0.050567626953125, -0.045162200927734375, -0.03975677490234375, -0.034351348876953125, -0.0289459228515625, -0.023540496826171875, -0.01813507080078125, -0.012729644775390625, -0.00732421875, -0.001918792724609375, 0.00348663330078125, 0.008892059326171875, 0.0142974853515625, 0.019702911376953125, 0.02510833740234375, 0.030513763427734375, 0.035919189453125, 0.041324615478515625, 0.04673004150390625, 0.052135467529296875, 0.0575408935546875, 0.06294631958007812, 0.06835174560546875, 0.07375717163085938, 0.07916259765625, 0.08456802368164062, 0.08997344970703125, 0.09537887573242188, 0.1007843017578125, 0.10618972778320312, 0.11159515380859375, 0.11700057983398438, 0.122406005859375, 0.12781143188476562, 0.13321685791015625, 0.13862228393554688, 0.1440277099609375, 0.14943313598632812, 0.15483856201171875, 0.16024398803710938, 0.1656494140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 12.0, 10.0, 12.0, 11.0, 17.0, 30.0, 29.0, 45.0, 42.0, 45.0, 56.0, 34.0, 58.0, 68.0, 61.0, 50.0, 42.0, 57.0, 52.0, 39.0, 40.0, 32.0, 26.0, 29.0, 19.0, 19.0, 12.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12646484375, -0.1226968765258789, -0.11892890930175781, -0.11516094207763672, -0.11139297485351562, -0.10762500762939453, -0.10385704040527344, -0.10008907318115234, -0.09632110595703125, -0.09255313873291016, -0.08878517150878906, -0.08501720428466797, -0.08124923706054688, -0.07748126983642578, -0.07371330261230469, -0.0699453353881836, -0.0661773681640625, -0.062409400939941406, -0.05864143371582031, -0.05487346649169922, -0.051105499267578125, -0.04733753204345703, -0.04356956481933594, -0.039801597595214844, -0.03603363037109375, -0.032265663146972656, -0.028497695922851562, -0.02472972869873047, -0.020961761474609375, -0.01719379425048828, -0.013425827026367188, -0.009657859802246094, -0.005889892578125, -0.0021219253540039062, 0.0016460418701171875, 0.005414009094238281, 0.009181976318359375, 0.012949943542480469, 0.016717910766601562, 0.020485877990722656, 0.02425384521484375, 0.028021812438964844, 0.03178977966308594, 0.03555774688720703, 0.039325714111328125, 0.04309368133544922, 0.04686164855957031, 0.050629615783691406, 0.0543975830078125, 0.058165550231933594, 0.06193351745605469, 0.06570148468017578, 0.06946945190429688, 0.07323741912841797, 0.07700538635253906, 0.08077335357666016, 0.08454132080078125, 0.08830928802490234, 0.09207725524902344, 0.09584522247314453, 0.09961318969726562, 0.10338115692138672, 0.10714912414550781, 0.1109170913696289, 0.11468505859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 2.0, 8.0, 13.0, 18.0, 40.0, 64.0, 121.0, 295.0, 1006.0, 6280.0, 111165.0, 4045129.0, 26463.0, 2677.0, 616.0, 199.0, 70.0, 30.0, 25.0, 17.0, 9.0, 6.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.455322265625, -0.44077301025390625, -0.4262237548828125, -0.41167449951171875, -0.397125244140625, -0.38257598876953125, -0.3680267333984375, -0.35347747802734375, -0.33892822265625, -0.32437896728515625, -0.3098297119140625, -0.29528045654296875, -0.280731201171875, -0.26618194580078125, -0.2516326904296875, -0.23708343505859375, -0.2225341796875, -0.20798492431640625, -0.1934356689453125, -0.17888641357421875, -0.164337158203125, -0.14978790283203125, -0.1352386474609375, -0.12068939208984375, -0.10614013671875, -0.09159088134765625, -0.0770416259765625, -0.06249237060546875, -0.047943115234375, -0.03339385986328125, -0.0188446044921875, -0.00429534912109375, 0.01025390625, 0.02480316162109375, 0.0393524169921875, 0.05390167236328125, 0.068450927734375, 0.08300018310546875, 0.0975494384765625, 0.11209869384765625, 0.12664794921875, 0.14119720458984375, 0.1557464599609375, 0.17029571533203125, 0.184844970703125, 0.19939422607421875, 0.2139434814453125, 0.22849273681640625, 0.2430419921875, 0.25759124755859375, 0.2721405029296875, 0.28668975830078125, 0.301239013671875, 0.31578826904296875, 0.3303375244140625, 0.34488677978515625, 0.35943603515625, 0.37398529052734375, 0.3885345458984375, 0.40308380126953125, 0.417633056640625, 0.43218231201171875, 0.4467315673828125, 0.46128082275390625, 0.475830078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 3.0, 4.0, 13.0, 12.0, 13.0, 29.0, 41.0, 101.0, 368.0, 1894.0, 1191.0, 211.0, 73.0, 42.0, 18.0, 17.0, 15.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3885650634765625, -0.377716064453125, -0.3668670654296875, -0.35601806640625, -0.3451690673828125, -0.334320068359375, -0.3234710693359375, -0.3126220703125, -0.3017730712890625, -0.290924072265625, -0.2800750732421875, -0.26922607421875, -0.2583770751953125, -0.247528076171875, -0.2366790771484375, -0.225830078125, -0.2149810791015625, -0.204132080078125, -0.1932830810546875, -0.18243408203125, -0.1715850830078125, -0.160736083984375, -0.1498870849609375, -0.1390380859375, -0.1281890869140625, -0.117340087890625, -0.1064910888671875, -0.09564208984375, -0.0847930908203125, -0.073944091796875, -0.0630950927734375, -0.05224609375, -0.0413970947265625, -0.030548095703125, -0.0196990966796875, -0.00885009765625, 0.0019989013671875, 0.012847900390625, 0.0236968994140625, 0.0345458984375, 0.0453948974609375, 0.056243896484375, 0.0670928955078125, 0.07794189453125, 0.0887908935546875, 0.099639892578125, 0.1104888916015625, 0.121337890625, 0.1321868896484375, 0.143035888671875, 0.1538848876953125, 0.16473388671875, 0.1755828857421875, 0.186431884765625, 0.1972808837890625, 0.2081298828125, 0.2189788818359375, 0.229827880859375, 0.2406768798828125, 0.25152587890625, 0.2623748779296875, 0.273223876953125, 0.2840728759765625, 0.294921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 12.0, 26.0, 83.0, 195.0, 343.0, 209.0, 83.0, 22.0, 13.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.519117832183838, -3.4436111450195312, -3.3681044578552246, -3.292597770690918, -3.2170910835266113, -3.1415841579437256, -3.066077470779419, -2.9905707836151123, -2.9150640964508057, -2.839557409286499, -2.7640507221221924, -2.6885440349578857, -2.613037109375, -2.5375304222106934, -2.4620237350463867, -2.38651704788208, -2.3110103607177734, -2.235503673553467, -2.15999698638916, -2.0844902992248535, -2.008983612060547, -1.9334768056869507, -1.8579699993133545, -1.7824633121490479, -1.7069566249847412, -1.6314499378204346, -1.555943250656128, -1.4804364442825317, -1.404929757118225, -1.3294230699539185, -1.2539162635803223, -1.1784095764160156, -1.1029026508331299, -1.0273959636688232, -0.9518892168998718, -0.8763824701309204, -0.8008757829666138, -0.7253690958023071, -0.6498623490333557, -0.5743556022644043, -0.49884891510009766, -0.42334219813346863, -0.3478354811668396, -0.27232876420021057, -0.19682204723358154, -0.12131533026695251, -0.045808613300323486, 0.02969813346862793, 0.10520482063293457, 0.1807115375995636, 0.2562182545661926, 0.33172497153282166, 0.4072316884994507, 0.4827384054660797, 0.5582451224327087, 0.6337518692016602, 0.7092585563659668, 0.7847652435302734, 0.8602719902992249, 0.9357787370681763, 1.011285424232483, 1.0867921113967896, 1.1622989177703857, 1.2378056049346924, 1.313312292098999]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 6.0, 7.0, 5.0, 10.0, 16.0, 11.0, 29.0, 32.0, 31.0, 25.0, 47.0, 57.0, 68.0, 68.0, 77.0, 73.0, 60.0, 57.0, 64.0, 51.0, 43.0, 36.0, 25.0, 28.0, 22.0, 15.0, 12.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.303004503250122, -1.2634862661361694, -1.2239681482315063, -1.1844499111175537, -1.1449317932128906, -1.105413556098938, -1.0658953189849854, -1.0263772010803223, -0.9868589639663696, -0.9473407864570618, -0.9078226089477539, -0.8683043718338013, -0.8287861943244934, -0.7892680168151855, -0.7497497797012329, -0.710231602191925, -0.6707134246826172, -0.6311952471733093, -0.5916770696640015, -0.5521588325500488, -0.512640655040741, -0.4731224775314331, -0.43360427021980286, -0.3940860629081726, -0.35456788539886475, -0.3150497078895569, -0.27553150057792664, -0.23601330816745758, -0.19649511575698853, -0.15697692334651947, -0.11745873093605042, -0.07794052362442017, -0.038422346115112305, 0.0010958462953567505, 0.040614038705825806, 0.08013223111629486, 0.11965042352676392, 0.15916861593723297, 0.19868680834770203, 0.23820501565933228, 0.27772319316864014, 0.317241370677948, 0.35675957798957825, 0.3962777853012085, 0.43579596281051636, 0.4753141403198242, 0.5148323774337769, 0.5543505549430847, 0.5938687324523926, 0.6333869099617004, 0.6729050874710083, 0.7124233245849609, 0.7519415020942688, 0.7914596796035767, 0.8309779167175293, 0.8704960942268372, 0.910014271736145, 0.9495324492454529, 0.9890506267547607, 1.0285688638687134, 1.068087100982666, 1.107605218887329, 1.1471234560012817, 1.1866416931152344, 1.2261598110198975]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 4.0, 7.0, 11.0, 16.0, 30.0, 36.0, 44.0, 96.0, 140.0, 228.0, 393.0, 665.0, 1098.0, 1944.0, 3664.0, 7096.0, 14437.0, 32246.0, 72979.0, 170191.0, 301194.0, 241664.0, 110778.0, 47277.0, 20969.0, 10000.0, 5097.0, 2618.0, 1454.0, 864.0, 462.0, 296.0, 189.0, 113.0, 70.0, 71.0, 31.0, 33.0, 18.0, 9.0, 11.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09943294525146484, -0.09657096862792969, -0.09370899200439453, -0.09084701538085938, -0.08798503875732422, -0.08512306213378906, -0.0822610855102539, -0.07939910888671875, -0.0765371322631836, -0.07367515563964844, -0.07081317901611328, -0.06795120239257812, -0.06508922576904297, -0.06222724914550781, -0.059365272521972656, -0.0565032958984375, -0.053641319274902344, -0.05077934265136719, -0.04791736602783203, -0.045055389404296875, -0.04219341278076172, -0.03933143615722656, -0.036469459533691406, -0.03360748291015625, -0.030745506286621094, -0.027883529663085938, -0.02502155303955078, -0.022159576416015625, -0.01929759979248047, -0.016435623168945312, -0.013573646545410156, -0.010711669921875, -0.007849693298339844, -0.0049877166748046875, -0.0021257400512695312, 0.000736236572265625, 0.0035982131958007812, 0.0064601898193359375, 0.009322166442871094, 0.01218414306640625, 0.015046119689941406, 0.017908096313476562, 0.02077007293701172, 0.023632049560546875, 0.02649402618408203, 0.029356002807617188, 0.032217979431152344, 0.0350799560546875, 0.037941932678222656, 0.04080390930175781, 0.04366588592529297, 0.046527862548828125, 0.04938983917236328, 0.05225181579589844, 0.055113792419433594, 0.05797576904296875, 0.060837745666503906, 0.06369972229003906, 0.06656169891357422, 0.06942367553710938, 0.07228565216064453, 0.07514762878417969, 0.07800960540771484, 0.08087158203125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 18.0, 17.0, 21.0, 15.0, 22.0, 27.0, 36.0, 49.0, 41.0, 52.0, 44.0, 52.0, 65.0, 56.0, 43.0, 66.0, 46.0, 37.0, 36.0, 51.0, 30.0, 26.0, 32.0, 22.0, 17.0, 13.0, 9.0, 4.0, 6.0, 8.0, 5.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12338829040527344, -0.11970138549804688, -0.11601448059082031, -0.11232757568359375, -0.10864067077636719, -0.10495376586914062, -0.10126686096191406, -0.0975799560546875, -0.09389305114746094, -0.09020614624023438, -0.08651924133300781, -0.08283233642578125, -0.07914543151855469, -0.07545852661132812, -0.07177162170410156, -0.068084716796875, -0.06439781188964844, -0.060710906982421875, -0.05702400207519531, -0.05333709716796875, -0.04965019226074219, -0.045963287353515625, -0.04227638244628906, -0.0385894775390625, -0.03490257263183594, -0.031215667724609375, -0.027528762817382812, -0.02384185791015625, -0.020154953002929688, -0.016468048095703125, -0.012781143188476562, -0.00909423828125, -0.0054073333740234375, -0.001720428466796875, 0.0019664764404296875, 0.00565338134765625, 0.009340286254882812, 0.013027191162109375, 0.016714096069335938, 0.0204010009765625, 0.024087905883789062, 0.027774810791015625, 0.03146171569824219, 0.03514862060546875, 0.03883552551269531, 0.042522430419921875, 0.04620933532714844, 0.049896240234375, 0.05358314514160156, 0.057270050048828125, 0.06095695495605469, 0.06464385986328125, 0.06833076477050781, 0.07201766967773438, 0.07570457458496094, 0.0793914794921875, 0.08307838439941406, 0.08676528930664062, 0.09045219421386719, 0.09413909912109375, 0.09782600402832031, 0.10151290893554688, 0.10519981384277344, 0.10888671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 31.0, 39.0, 73.0, 96.0, 215.0, 342.0, 706.0, 1490.0, 6621.0, 152694.0, 852601.0, 28297.0, 3040.0, 1062.0, 469.0, 285.0, 168.0, 90.0, 67.0, 34.0, 31.0, 17.0, 15.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.32210540771484375, -0.3107147216796875, -0.29932403564453125, -0.287933349609375, -0.27654266357421875, -0.2651519775390625, -0.25376129150390625, -0.24237060546875, -0.23097991943359375, -0.2195892333984375, -0.20819854736328125, -0.196807861328125, -0.18541717529296875, -0.1740264892578125, -0.16263580322265625, -0.1512451171875, -0.13985443115234375, -0.1284637451171875, -0.11707305908203125, -0.105682373046875, -0.09429168701171875, -0.0829010009765625, -0.07151031494140625, -0.06011962890625, -0.04872894287109375, -0.0373382568359375, -0.02594757080078125, -0.014556884765625, -0.00316619873046875, 0.0082244873046875, 0.01961517333984375, 0.031005859375, 0.04239654541015625, 0.0537872314453125, 0.06517791748046875, 0.076568603515625, 0.08795928955078125, 0.0993499755859375, 0.11074066162109375, 0.12213134765625, 0.13352203369140625, 0.1449127197265625, 0.15630340576171875, 0.167694091796875, 0.17908477783203125, 0.1904754638671875, 0.20186614990234375, 0.2132568359375, 0.22464752197265625, 0.2360382080078125, 0.24742889404296875, 0.258819580078125, 0.27021026611328125, 0.2816009521484375, 0.29299163818359375, 0.30438232421875, 0.31577301025390625, 0.3271636962890625, 0.33855438232421875, 0.349945068359375, 0.36133575439453125, 0.3727264404296875, 0.38411712646484375, 0.3955078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 2.0, 4.0, 14.0, 12.0, 23.0, 22.0, 19.0, 33.0, 31.0, 26.0, 31.0, 33.0, 35.0, 35.0, 34.0, 38.0, 40.0, 49.0, 45.0, 51.0, 36.0, 42.0, 46.0, 34.0, 42.0, 35.0, 30.0, 25.0, 23.0, 13.0, 22.0, 14.0, 17.0, 12.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.408447265625, -0.3973045349121094, -0.38616180419921875, -0.3750190734863281, -0.3638763427734375, -0.3527336120605469, -0.34159088134765625, -0.3304481506347656, -0.319305419921875, -0.3081626892089844, -0.29701995849609375, -0.2858772277832031, -0.2747344970703125, -0.2635917663574219, -0.25244903564453125, -0.24130630493164062, -0.23016357421875, -0.21902084350585938, -0.20787811279296875, -0.19673538208007812, -0.1855926513671875, -0.17444992065429688, -0.16330718994140625, -0.15216445922851562, -0.141021728515625, -0.12987899780273438, -0.11873626708984375, -0.10759353637695312, -0.0964508056640625, -0.08530807495117188, -0.07416534423828125, -0.06302261352539062, -0.0518798828125, -0.040737152099609375, -0.02959442138671875, -0.018451690673828125, -0.0073089599609375, 0.003833770751953125, 0.01497650146484375, 0.026119232177734375, 0.037261962890625, 0.048404693603515625, 0.05954742431640625, 0.07069015502929688, 0.0818328857421875, 0.09297561645507812, 0.10411834716796875, 0.11526107788085938, 0.12640380859375, 0.13754653930664062, 0.14868927001953125, 0.15983200073242188, 0.1709747314453125, 0.18211746215820312, 0.19326019287109375, 0.20440292358398438, 0.215545654296875, 0.22668838500976562, 0.23783111572265625, 0.24897384643554688, 0.2601165771484375, 0.2712593078613281, 0.28240203857421875, 0.2935447692871094, 0.3046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 9.0, 10.0, 10.0, 20.0, 38.0, 44.0, 111.0, 182.0, 476.0, 1395.0, 6219.0, 278479.0, 750242.0, 8615.0, 1649.0, 524.0, 252.0, 106.0, 60.0, 34.0, 26.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2130126953125, -0.20615768432617188, -0.19930267333984375, -0.19244766235351562, -0.1855926513671875, -0.17873764038085938, -0.17188262939453125, -0.16502761840820312, -0.158172607421875, -0.15131759643554688, -0.14446258544921875, -0.13760757446289062, -0.1307525634765625, -0.12389755249023438, -0.11704254150390625, -0.11018753051757812, -0.10333251953125, -0.09647750854492188, -0.08962249755859375, -0.08276748657226562, -0.0759124755859375, -0.06905746459960938, -0.06220245361328125, -0.055347442626953125, -0.048492431640625, -0.041637420654296875, -0.03478240966796875, -0.027927398681640625, -0.0210723876953125, -0.014217376708984375, -0.00736236572265625, -0.000507354736328125, 0.00634765625, 0.013202667236328125, 0.02005767822265625, 0.026912689208984375, 0.0337677001953125, 0.040622711181640625, 0.04747772216796875, 0.054332733154296875, 0.061187744140625, 0.06804275512695312, 0.07489776611328125, 0.08175277709960938, 0.0886077880859375, 0.09546279907226562, 0.10231781005859375, 0.10917282104492188, 0.11602783203125, 0.12288284301757812, 0.12973785400390625, 0.13659286499023438, 0.1434478759765625, 0.15030288696289062, 0.15715789794921875, 0.16401290893554688, 0.170867919921875, 0.17772293090820312, 0.18457794189453125, 0.19143295288085938, 0.1982879638671875, 0.20514297485351562, 0.21199798583984375, 0.21885299682617188, 0.2257080078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 7.0, 9.0, 13.0, 7.0, 14.0, 13.0, 22.0, 27.0, 45.0, 58.0, 81.0, 112.0, 135.0, 100.0, 77.0, 62.0, 48.0, 34.0, 26.0, 15.0, 15.0, 15.0, 10.0, 6.0, 6.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.0024518966674805e-05, -3.838539123535156e-05, -3.674626350402832e-05, -3.510713577270508e-05, -3.3468008041381836e-05, -3.1828880310058594e-05, -3.018975257873535e-05, -2.855062484741211e-05, -2.6911497116088867e-05, -2.5272369384765625e-05, -2.3633241653442383e-05, -2.199411392211914e-05, -2.03549861907959e-05, -1.8715858459472656e-05, -1.7076730728149414e-05, -1.5437602996826172e-05, -1.379847526550293e-05, -1.2159347534179688e-05, -1.0520219802856445e-05, -8.881092071533203e-06, -7.241964340209961e-06, -5.602836608886719e-06, -3.9637088775634766e-06, -2.3245811462402344e-06, -6.854534149169922e-07, 9.5367431640625e-07, 2.592802047729492e-06, 4.231929779052734e-06, 5.8710575103759766e-06, 7.510185241699219e-06, 9.149312973022461e-06, 1.0788440704345703e-05, 1.2427568435668945e-05, 1.4066696166992188e-05, 1.570582389831543e-05, 1.7344951629638672e-05, 1.8984079360961914e-05, 2.0623207092285156e-05, 2.22623348236084e-05, 2.390146255493164e-05, 2.5540590286254883e-05, 2.7179718017578125e-05, 2.8818845748901367e-05, 3.045797348022461e-05, 3.209710121154785e-05, 3.3736228942871094e-05, 3.5375356674194336e-05, 3.701448440551758e-05, 3.865361213684082e-05, 4.029273986816406e-05, 4.1931867599487305e-05, 4.357099533081055e-05, 4.521012306213379e-05, 4.684925079345703e-05, 4.8488378524780273e-05, 5.0127506256103516e-05, 5.176663398742676e-05, 5.340576171875e-05, 5.504488945007324e-05, 5.6684017181396484e-05, 5.8323144912719727e-05, 5.996227264404297e-05, 6.160140037536621e-05, 6.324052810668945e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 10.0, 4.0, 15.0, 18.0, 21.0, 39.0, 47.0, 65.0, 104.0, 170.0, 335.0, 627.0, 1488.0, 3738.0, 12848.0, 117029.0, 819553.0, 76319.0, 10476.0, 3071.0, 1246.0, 573.0, 270.0, 156.0, 99.0, 73.0, 33.0, 35.0, 17.0, 15.0, 13.0, 7.0, 7.0, 10.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1064453125, -0.10326099395751953, -0.10007667541503906, -0.0968923568725586, -0.09370803833007812, -0.09052371978759766, -0.08733940124511719, -0.08415508270263672, -0.08097076416015625, -0.07778644561767578, -0.07460212707519531, -0.07141780853271484, -0.06823348999023438, -0.0650491714477539, -0.06186485290527344, -0.05868053436279297, -0.0554962158203125, -0.05231189727783203, -0.04912757873535156, -0.045943260192871094, -0.042758941650390625, -0.039574623107910156, -0.03639030456542969, -0.03320598602294922, -0.03002166748046875, -0.02683734893798828, -0.023653030395507812, -0.020468711853027344, -0.017284393310546875, -0.014100074768066406, -0.010915756225585938, -0.007731437683105469, -0.004547119140625, -0.0013628005981445312, 0.0018215179443359375, 0.005005836486816406, 0.008190155029296875, 0.011374473571777344, 0.014558792114257812, 0.01774311065673828, 0.02092742919921875, 0.02411174774169922, 0.027296066284179688, 0.030480384826660156, 0.033664703369140625, 0.036849021911621094, 0.04003334045410156, 0.04321765899658203, 0.0464019775390625, 0.04958629608154297, 0.05277061462402344, 0.055954933166503906, 0.059139251708984375, 0.062323570251464844, 0.06550788879394531, 0.06869220733642578, 0.07187652587890625, 0.07506084442138672, 0.07824516296386719, 0.08142948150634766, 0.08461380004882812, 0.0877981185913086, 0.09098243713378906, 0.09416675567626953, 0.09735107421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 2.0, 0.0, 6.0, 5.0, 5.0, 13.0, 16.0, 19.0, 37.0, 40.0, 51.0, 62.0, 76.0, 113.0, 92.0, 92.0, 88.0, 71.0, 63.0, 30.0, 38.0, 22.0, 14.0, 10.0, 5.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08599853515625, -0.08277416229248047, -0.07954978942871094, -0.0763254165649414, -0.07310104370117188, -0.06987667083740234, -0.06665229797363281, -0.06342792510986328, -0.06020355224609375, -0.05697917938232422, -0.05375480651855469, -0.050530433654785156, -0.047306060791015625, -0.044081687927246094, -0.04085731506347656, -0.03763294219970703, -0.0344085693359375, -0.03118419647216797, -0.027959823608398438, -0.024735450744628906, -0.021511077880859375, -0.018286705017089844, -0.015062332153320312, -0.011837959289550781, -0.00861358642578125, -0.005389213562011719, -0.0021648406982421875, 0.0010595321655273438, 0.004283905029296875, 0.007508277893066406, 0.010732650756835938, 0.013957023620605469, 0.017181396484375, 0.02040576934814453, 0.023630142211914062, 0.026854515075683594, 0.030078887939453125, 0.033303260803222656, 0.03652763366699219, 0.03975200653076172, 0.04297637939453125, 0.04620075225830078, 0.04942512512207031, 0.052649497985839844, 0.055873870849609375, 0.059098243713378906, 0.06232261657714844, 0.06554698944091797, 0.0687713623046875, 0.07199573516845703, 0.07522010803222656, 0.0784444808959961, 0.08166885375976562, 0.08489322662353516, 0.08811759948730469, 0.09134197235107422, 0.09456634521484375, 0.09779071807861328, 0.10101509094238281, 0.10423946380615234, 0.10746383666992188, 0.1106882095336914, 0.11391258239746094, 0.11713695526123047, 0.120361328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 8.0, 11.0, 33.0, 63.0, 128.0, 219.0, 200.0, 173.0, 76.0, 45.0, 13.0, 6.0, 11.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.728104829788208, -1.6668163537979126, -1.6055278778076172, -1.5442395210266113, -1.482951045036316, -1.4216625690460205, -1.360374093055725, -1.2990856170654297, -1.2377972602844238, -1.1765087842941284, -1.115220308303833, -1.0539319515228271, -0.9926434755325317, -0.9313549995422363, -0.8700665235519409, -0.8087780475616455, -0.7474895715713501, -0.6862010955810547, -0.624912679195404, -0.5636242032051086, -0.502335786819458, -0.4410473108291626, -0.3797588348388672, -0.31847038865089417, -0.25718194246292114, -0.19589349627494812, -0.1346050351858139, -0.07331657409667969, -0.012028127908706665, 0.04926031827926636, 0.11054879426956177, 0.1718372404575348, 0.2331256866455078, 0.29441413283348083, 0.35570257902145386, 0.41699105501174927, 0.4782795011997223, 0.5395679473876953, 0.6008564233779907, 0.6621448993682861, 0.7234333157539368, 0.7847217917442322, 0.8460102081298828, 0.9072986841201782, 0.9685871601104736, 1.0298755168914795, 1.0911641120910645, 1.1524524688720703, 1.2137409448623657, 1.2750294208526611, 1.3363178968429565, 1.397606372833252, 1.4588947296142578, 1.5201832056045532, 1.5814716815948486, 1.642760157585144, 1.7040486335754395, 1.7653371095657349, 1.8266255855560303, 1.8879139423370361, 1.9492024183273315, 2.010490894317627, 2.071779251098633, 2.1330678462982178, 2.1943562030792236]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 14.0, 10.0, 21.0, 15.0, 19.0, 22.0, 25.0, 28.0, 40.0, 45.0, 52.0, 53.0, 58.0, 62.0, 69.0, 51.0, 63.0, 45.0, 37.0, 30.0, 36.0, 38.0, 23.0, 24.0, 21.0, 20.0, 15.0, 17.0, 14.0, 5.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.066498041152954, -2.0110204219818115, -1.955542802810669, -1.9000651836395264, -1.8445875644683838, -1.7891099452972412, -1.733632206916809, -1.6781545877456665, -1.622676968574524, -1.5671993494033813, -1.5117217302322388, -1.4562441110610962, -1.400766372680664, -1.3452887535095215, -1.289811134338379, -1.2343335151672363, -1.1788558959960938, -1.1233782768249512, -1.0679006576538086, -1.012423038482666, -0.9569453597068787, -0.9014677405357361, -0.8459900617599487, -0.7905124425888062, -0.7350348234176636, -0.679557204246521, -0.6240795850753784, -0.5686019062995911, -0.5131242871284485, -0.4576466679573059, -0.40216901898384094, -0.346691370010376, -0.29121363162994385, -0.23573599755764008, -0.1802583634853363, -0.12478072941303253, -0.06930309534072876, -0.013825476169586182, 0.041652172803878784, 0.09712982177734375, 0.15260744094848633, 0.2080850750207901, 0.26356270909309387, 0.31904035806655884, 0.3745179772377014, 0.429995596408844, 0.48547324538230896, 0.5409508943557739, 0.5964285135269165, 0.6519061326980591, 0.7073837518692017, 0.762861430644989, 0.8183390498161316, 0.8738166689872742, 0.9292943477630615, 0.9847719669342041, 1.0402495861053467, 1.0957272052764893, 1.1512048244476318, 1.2066824436187744, 1.262160062789917, 1.3176376819610596, 1.3731154203414917, 1.4285930395126343, 1.4840706586837769]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 14.0, 13.0, 19.0, 33.0, 32.0, 54.0, 63.0, 89.0, 114.0, 154.0, 246.0, 618.0, 5236.0, 4162781.0, 22934.0, 870.0, 300.0, 176.0, 105.0, 90.0, 64.0, 54.0, 43.0, 39.0, 19.0, 20.0, 13.0, 13.0, 9.0, 7.0, 8.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8193359375, -0.7956924438476562, -0.7720489501953125, -0.7484054565429688, -0.724761962890625, -0.7011184692382812, -0.6774749755859375, -0.6538314819335938, -0.63018798828125, -0.6065444946289062, -0.5829010009765625, -0.5592575073242188, -0.535614013671875, -0.5119705200195312, -0.4883270263671875, -0.46468353271484375, -0.4410400390625, -0.41739654541015625, -0.3937530517578125, -0.37010955810546875, -0.346466064453125, -0.32282257080078125, -0.2991790771484375, -0.27553558349609375, -0.25189208984375, -0.22824859619140625, -0.2046051025390625, -0.18096160888671875, -0.157318115234375, -0.13367462158203125, -0.1100311279296875, -0.08638763427734375, -0.062744140625, -0.03910064697265625, -0.0154571533203125, 0.00818634033203125, 0.031829833984375, 0.05547332763671875, 0.0791168212890625, 0.10276031494140625, 0.12640380859375, 0.15004730224609375, 0.1736907958984375, 0.19733428955078125, 0.220977783203125, 0.24462127685546875, 0.2682647705078125, 0.29190826416015625, 0.3155517578125, 0.33919525146484375, 0.3628387451171875, 0.38648223876953125, 0.410125732421875, 0.43376922607421875, 0.4574127197265625, 0.48105621337890625, 0.50469970703125, 0.5283432006835938, 0.5519866943359375, 0.5756301879882812, 0.599273681640625, 0.6229171752929688, 0.6465606689453125, 0.6702041625976562, 0.69384765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 8.0, 9.0, 19.0, 20.0, 22.0, 30.0, 43.0, 68.0, 68.0, 76.0, 84.0, 94.0, 85.0, 78.0, 63.0, 53.0, 54.0, 40.0, 25.0, 25.0, 19.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.23758316040039062, -0.23200225830078125, -0.22642135620117188, -0.2208404541015625, -0.21525955200195312, -0.20967864990234375, -0.20409774780273438, -0.198516845703125, -0.19293594360351562, -0.18735504150390625, -0.18177413940429688, -0.1761932373046875, -0.17061233520507812, -0.16503143310546875, -0.15945053100585938, -0.15386962890625, -0.14828872680664062, -0.14270782470703125, -0.13712692260742188, -0.1315460205078125, -0.12596511840820312, -0.12038421630859375, -0.11480331420898438, -0.109222412109375, -0.10364151000976562, -0.09806060791015625, -0.09247970581054688, -0.0868988037109375, -0.08131790161132812, -0.07573699951171875, -0.07015609741210938, -0.0645751953125, -0.058994293212890625, -0.05341339111328125, -0.047832489013671875, -0.0422515869140625, -0.036670684814453125, -0.03108978271484375, -0.025508880615234375, -0.019927978515625, -0.014347076416015625, -0.00876617431640625, -0.003185272216796875, 0.0023956298828125, 0.007976531982421875, 0.01355743408203125, 0.019138336181640625, 0.02471923828125, 0.030300140380859375, 0.03588104248046875, 0.041461944580078125, 0.0470428466796875, 0.052623748779296875, 0.05820465087890625, 0.06378555297851562, 0.069366455078125, 0.07494735717773438, 0.08052825927734375, 0.08610916137695312, 0.0916900634765625, 0.09727096557617188, 0.10285186767578125, 0.10843276977539062, 0.114013671875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 9.0, 14.0, 16.0, 28.0, 38.0, 91.0, 144.0, 309.0, 752.0, 2727.0, 15411.0, 371750.0, 3757211.0, 37793.0, 5735.0, 1335.0, 472.0, 204.0, 113.0, 37.0, 38.0, 22.0, 10.0, 10.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.2789344787597656, -0.27027130126953125, -0.2616081237792969, -0.2529449462890625, -0.24428176879882812, -0.23561859130859375, -0.22695541381835938, -0.218292236328125, -0.20962905883789062, -0.20096588134765625, -0.19230270385742188, -0.1836395263671875, -0.17497634887695312, -0.16631317138671875, -0.15764999389648438, -0.14898681640625, -0.14032363891601562, -0.13166046142578125, -0.12299728393554688, -0.1143341064453125, -0.10567092895507812, -0.09700775146484375, -0.08834457397460938, -0.079681396484375, -0.07101821899414062, -0.06235504150390625, -0.053691864013671875, -0.0450286865234375, -0.036365509033203125, -0.02770233154296875, -0.019039154052734375, -0.0103759765625, -0.001712799072265625, 0.00695037841796875, 0.015613555908203125, 0.0242767333984375, 0.032939910888671875, 0.04160308837890625, 0.050266265869140625, 0.058929443359375, 0.06759262084960938, 0.07625579833984375, 0.08491897583007812, 0.0935821533203125, 0.10224533081054688, 0.11090850830078125, 0.11957168579101562, 0.12823486328125, 0.13689804077148438, 0.14556121826171875, 0.15422439575195312, 0.1628875732421875, 0.17155075073242188, 0.18021392822265625, 0.18887710571289062, 0.197540283203125, 0.20620346069335938, 0.21486663818359375, 0.22352981567382812, 0.2321929931640625, 0.24085617065429688, 0.24951934814453125, 0.2581825256347656, 0.266845703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 9.0, 12.0, 11.0, 25.0, 51.0, 114.0, 436.0, 1818.0, 1183.0, 245.0, 79.0, 26.0, 15.0, 20.0, 12.0, 9.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300537109375, -0.29137420654296875, -0.2822113037109375, -0.27304840087890625, -0.263885498046875, -0.25472259521484375, -0.2455596923828125, -0.23639678955078125, -0.22723388671875, -0.21807098388671875, -0.2089080810546875, -0.19974517822265625, -0.190582275390625, -0.18141937255859375, -0.1722564697265625, -0.16309356689453125, -0.1539306640625, -0.14476776123046875, -0.1356048583984375, -0.12644195556640625, -0.117279052734375, -0.10811614990234375, -0.0989532470703125, -0.08979034423828125, -0.08062744140625, -0.07146453857421875, -0.0623016357421875, -0.05313873291015625, -0.043975830078125, -0.03481292724609375, -0.0256500244140625, -0.01648712158203125, -0.00732421875, 0.00183868408203125, 0.0110015869140625, 0.02016448974609375, 0.029327392578125, 0.03849029541015625, 0.0476531982421875, 0.05681610107421875, 0.06597900390625, 0.07514190673828125, 0.0843048095703125, 0.09346771240234375, 0.102630615234375, 0.11179351806640625, 0.1209564208984375, 0.13011932373046875, 0.1392822265625, 0.14844512939453125, 0.1576080322265625, 0.16677093505859375, 0.175933837890625, 0.18509674072265625, 0.1942596435546875, 0.20342254638671875, 0.21258544921875, 0.22174835205078125, 0.2309112548828125, 0.24007415771484375, 0.249237060546875, 0.25839996337890625, 0.2675628662109375, 0.27672576904296875, 0.285888671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 27.0, 40.0, 89.0, 151.0, 216.0, 196.0, 147.0, 62.0, 28.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7672268152236938, -0.7290539741516113, -0.6908811330795288, -0.6527082920074463, -0.6145354509353638, -0.5763626098632812, -0.5381898283958435, -0.500016987323761, -0.46184414625167847, -0.42367130517959595, -0.3854984641075134, -0.3473256528377533, -0.3091528117656708, -0.27097997069358826, -0.23280714452266693, -0.1946343183517456, -0.15646147727966309, -0.11828864365816116, -0.08011581003665924, -0.04194297641515732, -0.0037701427936553955, 0.034402698278427124, 0.07257552444934845, 0.11074835062026978, 0.1489211916923523, 0.18709403276443481, 0.22526685893535614, 0.26343968510627747, 0.30161252617836, 0.3397853672504425, 0.37795817852020264, 0.41613101959228516, 0.4543037414550781, 0.49247658252716064, 0.5306494235992432, 0.5688222646713257, 0.6069951057434082, 0.6451679468154907, 0.6833407282829285, 0.721513569355011, 0.7596864104270935, 0.797859251499176, 0.8360320925712585, 0.8742049336433411, 0.9123777151107788, 0.9505505561828613, 0.9887233972549438, 1.0268962383270264, 1.0650690793991089, 1.1032419204711914, 1.141414761543274, 1.1795876026153564, 1.217760443687439, 1.2559332847595215, 1.294106125831604, 1.3322789669036865, 1.3704516887664795, 1.408624529838562, 1.4467973709106445, 1.484970211982727, 1.5231430530548096, 1.561315894126892, 1.5994887351989746, 1.6376614570617676, 1.6758344173431396]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 9.0, 16.0, 13.0, 22.0, 19.0, 24.0, 19.0, 48.0, 42.0, 51.0, 55.0, 60.0, 46.0, 68.0, 64.0, 50.0, 63.0, 47.0, 50.0, 39.0, 39.0, 31.0, 22.0, 19.0, 22.0, 12.0, 6.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6847864985466003, -0.6613394618034363, -0.6378924250602722, -0.6144454479217529, -0.5909984111785889, -0.5675513744354248, -0.5441043376922607, -0.5206573009490967, -0.497210294008255, -0.47376325726509094, -0.45031625032424927, -0.4268692135810852, -0.40342217683792114, -0.37997516989707947, -0.3565281331539154, -0.33308112621307373, -0.30963408946990967, -0.2861870527267456, -0.26274004578590393, -0.23929300904273987, -0.215845987200737, -0.19239896535873413, -0.16895192861557007, -0.1455049067735672, -0.12205788493156433, -0.09861086308956146, -0.075163833796978, -0.05171680450439453, -0.028269782662391663, -0.004822760820388794, 0.01862427592277527, 0.04207129776477814, 0.06551837921142578, 0.08896540105342865, 0.11241243034601212, 0.13585945963859558, 0.15930648148059845, 0.18275350332260132, 0.20620054006576538, 0.22964756190776825, 0.2530945837497711, 0.2765416204929352, 0.29998862743377686, 0.3234356641769409, 0.346882700920105, 0.37032970786094666, 0.3937767446041107, 0.4172237515449524, 0.44067078828811646, 0.4641178250312805, 0.4875648319721222, 0.5110118389129639, 0.5344588756561279, 0.557905912399292, 0.581352949142456, 0.6047999858856201, 0.6282470226287842, 0.6516940593719482, 0.6751410961151123, 0.6985881328582764, 0.7220351099967957, 0.7454821467399597, 0.7689291834831238, 0.7923762202262878, 0.8158231973648071]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 13.0, 10.0, 14.0, 14.0, 34.0, 44.0, 74.0, 104.0, 130.0, 205.0, 335.0, 443.0, 735.0, 1181.0, 2089.0, 4275.0, 8979.0, 22648.0, 64458.0, 191831.0, 382698.0, 236689.0, 81884.0, 27672.0, 11006.0, 4817.0, 2528.0, 1276.0, 821.0, 516.0, 349.0, 199.0, 143.0, 102.0, 65.0, 56.0, 50.0, 25.0, 13.0, 6.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.11861324310302734, -0.11460685729980469, -0.11060047149658203, -0.10659408569335938, -0.10258769989013672, -0.09858131408691406, -0.0945749282836914, -0.09056854248046875, -0.0865621566772461, -0.08255577087402344, -0.07854938507080078, -0.07454299926757812, -0.07053661346435547, -0.06653022766113281, -0.06252384185791016, -0.0585174560546875, -0.054511070251464844, -0.05050468444824219, -0.04649829864501953, -0.042491912841796875, -0.03848552703857422, -0.03447914123535156, -0.030472755432128906, -0.02646636962890625, -0.022459983825683594, -0.018453598022460938, -0.014447212219238281, -0.010440826416015625, -0.006434440612792969, -0.0024280548095703125, 0.0015783309936523438, 0.005584716796875, 0.009591102600097656, 0.013597488403320312, 0.01760387420654297, 0.021610260009765625, 0.02561664581298828, 0.029623031616210938, 0.033629417419433594, 0.03763580322265625, 0.041642189025878906, 0.04564857482910156, 0.04965496063232422, 0.053661346435546875, 0.05766773223876953, 0.06167411804199219, 0.06568050384521484, 0.0696868896484375, 0.07369327545166016, 0.07769966125488281, 0.08170604705810547, 0.08571243286132812, 0.08971881866455078, 0.09372520446777344, 0.0977315902709961, 0.10173797607421875, 0.1057443618774414, 0.10975074768066406, 0.11375713348388672, 0.11776351928710938, 0.12176990509033203, 0.1257762908935547, 0.12978267669677734, 0.1337890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 14.0, 13.0, 14.0, 13.0, 21.0, 27.0, 16.0, 35.0, 38.0, 49.0, 56.0, 53.0, 55.0, 56.0, 61.0, 64.0, 59.0, 42.0, 38.0, 42.0, 39.0, 36.0, 31.0, 27.0, 15.0, 26.0, 10.0, 14.0, 10.0, 3.0, 8.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12298583984375, -0.11921977996826172, -0.11545372009277344, -0.11168766021728516, -0.10792160034179688, -0.1041555404663086, -0.10038948059082031, -0.09662342071533203, -0.09285736083984375, -0.08909130096435547, -0.08532524108886719, -0.0815591812133789, -0.07779312133789062, -0.07402706146240234, -0.07026100158691406, -0.06649494171142578, -0.0627288818359375, -0.05896282196044922, -0.05519676208496094, -0.051430702209472656, -0.047664642333984375, -0.043898582458496094, -0.04013252258300781, -0.03636646270751953, -0.03260040283203125, -0.02883434295654297, -0.025068283081054688, -0.021302223205566406, -0.017536163330078125, -0.013770103454589844, -0.010004043579101562, -0.006237983703613281, -0.002471923828125, 0.0012941360473632812, 0.0050601959228515625, 0.008826255798339844, 0.012592315673828125, 0.016358375549316406, 0.020124435424804688, 0.02389049530029297, 0.02765655517578125, 0.03142261505126953, 0.03518867492675781, 0.038954734802246094, 0.042720794677734375, 0.046486854553222656, 0.05025291442871094, 0.05401897430419922, 0.0577850341796875, 0.06155109405517578, 0.06531715393066406, 0.06908321380615234, 0.07284927368164062, 0.0766153335571289, 0.08038139343261719, 0.08414745330810547, 0.08791351318359375, 0.09167957305908203, 0.09544563293457031, 0.0992116928100586, 0.10297775268554688, 0.10674381256103516, 0.11050987243652344, 0.11427593231201172, 0.1180419921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 9.0, 12.0, 25.0, 53.0, 88.0, 189.0, 534.0, 1543.0, 12218.0, 745987.0, 279809.0, 6230.0, 1094.0, 395.0, 180.0, 79.0, 40.0, 22.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.501953125, -0.48668670654296875, -0.4714202880859375, -0.45615386962890625, -0.440887451171875, -0.42562103271484375, -0.4103546142578125, -0.39508819580078125, -0.37982177734375, -0.36455535888671875, -0.3492889404296875, -0.33402252197265625, -0.318756103515625, -0.30348968505859375, -0.2882232666015625, -0.27295684814453125, -0.2576904296875, -0.24242401123046875, -0.2271575927734375, -0.21189117431640625, -0.196624755859375, -0.18135833740234375, -0.1660919189453125, -0.15082550048828125, -0.13555908203125, -0.12029266357421875, -0.1050262451171875, -0.08975982666015625, -0.074493408203125, -0.05922698974609375, -0.0439605712890625, -0.02869415283203125, -0.013427734375, 0.00183868408203125, 0.0171051025390625, 0.03237152099609375, 0.047637939453125, 0.06290435791015625, 0.0781707763671875, 0.09343719482421875, 0.10870361328125, 0.12397003173828125, 0.1392364501953125, 0.15450286865234375, 0.169769287109375, 0.18503570556640625, 0.2003021240234375, 0.21556854248046875, 0.2308349609375, 0.24610137939453125, 0.2613677978515625, 0.27663421630859375, 0.291900634765625, 0.30716705322265625, 0.3224334716796875, 0.33769989013671875, 0.35296630859375, 0.36823272705078125, 0.3834991455078125, 0.39876556396484375, 0.414031982421875, 0.42929840087890625, 0.4445648193359375, 0.45983123779296875, 0.47509765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 7.0, 7.0, 11.0, 14.0, 16.0, 28.0, 28.0, 34.0, 33.0, 44.0, 46.0, 52.0, 45.0, 51.0, 50.0, 57.0, 52.0, 58.0, 44.0, 49.0, 43.0, 39.0, 25.0, 27.0, 23.0, 20.0, 24.0, 14.0, 15.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3258781433105469, -0.31362152099609375, -0.3013648986816406, -0.2891082763671875, -0.2768516540527344, -0.26459503173828125, -0.2523384094238281, -0.240081787109375, -0.22782516479492188, -0.21556854248046875, -0.20331192016601562, -0.1910552978515625, -0.17879867553710938, -0.16654205322265625, -0.15428543090820312, -0.14202880859375, -0.12977218627929688, -0.11751556396484375, -0.10525894165039062, -0.0930023193359375, -0.08074569702148438, -0.06848907470703125, -0.056232452392578125, -0.043975830078125, -0.031719207763671875, -0.01946258544921875, -0.007205963134765625, 0.0050506591796875, 0.017307281494140625, 0.02956390380859375, 0.041820526123046875, 0.0540771484375, 0.06633377075195312, 0.07859039306640625, 0.09084701538085938, 0.1031036376953125, 0.11536026000976562, 0.12761688232421875, 0.13987350463867188, 0.152130126953125, 0.16438674926757812, 0.17664337158203125, 0.18889999389648438, 0.2011566162109375, 0.21341323852539062, 0.22566986083984375, 0.23792648315429688, 0.25018310546875, 0.2624397277832031, 0.27469635009765625, 0.2869529724121094, 0.2992095947265625, 0.3114662170410156, 0.32372283935546875, 0.3359794616699219, 0.348236083984375, 0.3604927062988281, 0.37274932861328125, 0.3850059509277344, 0.3972625732421875, 0.4095191955566406, 0.42177581787109375, 0.4340324401855469, 0.4462890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 9.0, 10.0, 14.0, 19.0, 15.0, 32.0, 61.0, 118.0, 209.0, 568.0, 1444.0, 5924.0, 84547.0, 919813.0, 30148.0, 3730.0, 1055.0, 393.0, 193.0, 95.0, 56.0, 21.0, 20.0, 24.0, 4.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.1871929168701172, -0.18102645874023438, -0.17486000061035156, -0.16869354248046875, -0.16252708435058594, -0.15636062622070312, -0.1501941680908203, -0.1440277099609375, -0.1378612518310547, -0.13169479370117188, -0.12552833557128906, -0.11936187744140625, -0.11319541931152344, -0.10702896118164062, -0.10086250305175781, -0.094696044921875, -0.08852958679199219, -0.08236312866210938, -0.07619667053222656, -0.07003021240234375, -0.06386375427246094, -0.057697296142578125, -0.05153083801269531, -0.0453643798828125, -0.03919792175292969, -0.033031463623046875, -0.026865005493164062, -0.02069854736328125, -0.014532089233398438, -0.008365631103515625, -0.0021991729736328125, 0.00396728515625, 0.010133743286132812, 0.016300201416015625, 0.022466659545898438, 0.02863311767578125, 0.03479957580566406, 0.040966033935546875, 0.04713249206542969, 0.0532989501953125, 0.05946540832519531, 0.06563186645507812, 0.07179832458496094, 0.07796478271484375, 0.08413124084472656, 0.09029769897460938, 0.09646415710449219, 0.102630615234375, 0.10879707336425781, 0.11496353149414062, 0.12112998962402344, 0.12729644775390625, 0.13346290588378906, 0.13962936401367188, 0.1457958221435547, 0.1519622802734375, 0.1581287384033203, 0.16429519653320312, 0.17046165466308594, 0.17662811279296875, 0.18279457092285156, 0.18896102905273438, 0.1951274871826172, 0.2012939453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 12.0, 11.0, 9.0, 12.0, 17.0, 24.0, 27.0, 48.0, 63.0, 92.0, 113.0, 128.0, 107.0, 75.0, 55.0, 54.0, 19.0, 21.0, 18.0, 10.0, 12.0, 11.0, 8.0, 10.0, 7.0, 1.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.267692565917969e-05, -4.1171908378601074e-05, -3.966689109802246e-05, -3.816187381744385e-05, -3.6656856536865234e-05, -3.515183925628662e-05, -3.364682197570801e-05, -3.2141804695129395e-05, -3.063678741455078e-05, -2.9131770133972168e-05, -2.7626752853393555e-05, -2.612173557281494e-05, -2.4616718292236328e-05, -2.3111701011657715e-05, -2.16066837310791e-05, -2.0101666450500488e-05, -1.8596649169921875e-05, -1.7091631889343262e-05, -1.558661460876465e-05, -1.4081597328186035e-05, -1.2576580047607422e-05, -1.1071562767028809e-05, -9.566545486450195e-06, -8.061528205871582e-06, -6.556510925292969e-06, -5.0514936447143555e-06, -3.546476364135742e-06, -2.041459083557129e-06, -5.364418029785156e-07, 9.685754776000977e-07, 2.473592758178711e-06, 3.978610038757324e-06, 5.4836273193359375e-06, 6.988644599914551e-06, 8.493661880493164e-06, 9.998679161071777e-06, 1.150369644165039e-05, 1.3008713722229004e-05, 1.4513731002807617e-05, 1.601874828338623e-05, 1.7523765563964844e-05, 1.9028782844543457e-05, 2.053380012512207e-05, 2.2038817405700684e-05, 2.3543834686279297e-05, 2.504885196685791e-05, 2.6553869247436523e-05, 2.8058886528015137e-05, 2.956390380859375e-05, 3.106892108917236e-05, 3.2573938369750977e-05, 3.407895565032959e-05, 3.55839729309082e-05, 3.7088990211486816e-05, 3.859400749206543e-05, 4.009902477264404e-05, 4.1604042053222656e-05, 4.310905933380127e-05, 4.461407661437988e-05, 4.6119093894958496e-05, 4.762411117553711e-05, 4.912912845611572e-05, 5.0634145736694336e-05, 5.213916301727295e-05, 5.364418029785156e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 14.0, 13.0, 17.0, 22.0, 28.0, 55.0, 92.0, 168.0, 271.0, 508.0, 1148.0, 3082.0, 11838.0, 81626.0, 695092.0, 221694.0, 24401.0, 5216.0, 1719.0, 687.0, 318.0, 197.0, 109.0, 75.0, 46.0, 32.0, 26.0, 15.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1024169921875, -0.09937858581542969, -0.09634017944335938, -0.09330177307128906, -0.09026336669921875, -0.08722496032714844, -0.08418655395507812, -0.08114814758300781, -0.0781097412109375, -0.07507133483886719, -0.07203292846679688, -0.06899452209472656, -0.06595611572265625, -0.06291770935058594, -0.059879302978515625, -0.05684089660644531, -0.053802490234375, -0.05076408386230469, -0.047725677490234375, -0.04468727111816406, -0.04164886474609375, -0.03861045837402344, -0.035572052001953125, -0.03253364562988281, -0.0294952392578125, -0.026456832885742188, -0.023418426513671875, -0.020380020141601562, -0.01734161376953125, -0.014303207397460938, -0.011264801025390625, -0.008226394653320312, -0.00518798828125, -0.0021495819091796875, 0.000888824462890625, 0.0039272308349609375, 0.00696563720703125, 0.010004043579101562, 0.013042449951171875, 0.016080856323242188, 0.0191192626953125, 0.022157669067382812, 0.025196075439453125, 0.028234481811523438, 0.03127288818359375, 0.03431129455566406, 0.037349700927734375, 0.04038810729980469, 0.043426513671875, 0.04646492004394531, 0.049503326416015625, 0.05254173278808594, 0.05558013916015625, 0.05861854553222656, 0.061656951904296875, 0.06469535827636719, 0.0677337646484375, 0.07077217102050781, 0.07381057739257812, 0.07684898376464844, 0.07988739013671875, 0.08292579650878906, 0.08596420288085938, 0.08900260925292969, 0.092041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 9.0, 6.0, 13.0, 20.0, 17.0, 28.0, 44.0, 50.0, 83.0, 83.0, 107.0, 112.0, 104.0, 91.0, 78.0, 48.0, 36.0, 20.0, 17.0, 20.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1544189453125, -0.15040969848632812, -0.14640045166015625, -0.14239120483398438, -0.1383819580078125, -0.13437271118164062, -0.13036346435546875, -0.12635421752929688, -0.122344970703125, -0.11833572387695312, -0.11432647705078125, -0.11031723022460938, -0.1063079833984375, -0.10229873657226562, -0.09828948974609375, -0.09428024291992188, -0.09027099609375, -0.08626174926757812, -0.08225250244140625, -0.07824325561523438, -0.0742340087890625, -0.07022476196289062, -0.06621551513671875, -0.062206268310546875, -0.058197021484375, -0.054187774658203125, -0.05017852783203125, -0.046169281005859375, -0.0421600341796875, -0.038150787353515625, -0.03414154052734375, -0.030132293701171875, -0.026123046875, -0.022113800048828125, -0.01810455322265625, -0.014095306396484375, -0.0100860595703125, -0.006076812744140625, -0.00206756591796875, 0.001941680908203125, 0.005950927734375, 0.009960174560546875, 0.01396942138671875, 0.017978668212890625, 0.0219879150390625, 0.025997161865234375, 0.03000640869140625, 0.034015655517578125, 0.03802490234375, 0.042034149169921875, 0.04604339599609375, 0.050052642822265625, 0.0540618896484375, 0.058071136474609375, 0.06208038330078125, 0.06608963012695312, 0.070098876953125, 0.07410812377929688, 0.07811737060546875, 0.08212661743164062, 0.0861358642578125, 0.09014511108398438, 0.09415435791015625, 0.09816360473632812, 0.1021728515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 12.0, 42.0, 133.0, 327.0, 335.0, 103.0, 28.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.97115159034729, -3.8614532947540283, -3.7517549991607666, -3.642056465148926, -3.532358169555664, -3.4226598739624023, -3.3129615783691406, -3.203263282775879, -3.093564987182617, -2.9838666915893555, -2.8741683959960938, -2.764470100402832, -2.654771566390991, -2.5450732707977295, -2.4353749752044678, -2.325676679611206, -2.2159781455993652, -2.1062798500061035, -1.9965814352035522, -1.8868831396102905, -1.7771847248077393, -1.6674864292144775, -1.5577881336212158, -1.448089838027954, -1.3383914232254028, -1.2286931276321411, -1.1189947128295898, -1.0092964172363281, -0.8995980620384216, -0.7898997068405151, -0.6802014112472534, -0.5705030560493469, -0.46080493927001953, -0.35110658407211304, -0.24140825867652893, -0.13170993328094482, -0.02201157808303833, 0.08768677711486816, 0.19738507270812988, 0.3070834279060364, 0.41678178310394287, 0.5264801383018494, 0.6361784934997559, 0.7458767890930176, 0.8555751442909241, 0.9652734994888306, 1.0749717950820923, 1.1846702098846436, 1.2943685054779053, 1.404066801071167, 1.5137652158737183, 1.62346351146698, 1.7331619262695312, 1.842860221862793, 1.9525585174560547, 2.0622568130493164, 2.171955108642578, 2.28165340423584, 2.3913516998291016, 2.5010499954223633, 2.610748529434204, 2.720446825027466, 2.8301451206207275, 2.9398434162139893, 3.04954195022583]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 13.0, 12.0, 16.0, 19.0, 17.0, 27.0, 25.0, 32.0, 43.0, 36.0, 46.0, 62.0, 61.0, 79.0, 55.0, 70.0, 61.0, 40.0, 36.0, 45.0, 31.0, 46.0, 31.0, 21.0, 14.0, 14.0, 10.0, 7.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1596269607543945, -2.102816581726074, -2.046006202697754, -1.9891958236694336, -1.9323853254318237, -1.8755749464035034, -1.818764567375183, -1.7619541883468628, -1.705143690109253, -1.6483333110809326, -1.5915229320526123, -1.534712553024292, -1.4779020547866821, -1.4210916757583618, -1.3642812967300415, -1.3074709177017212, -1.2506605386734009, -1.1938501596450806, -1.1370397806167603, -1.0802292823791504, -1.02341890335083, -0.9666085243225098, -0.9097981452941895, -0.8529877662658691, -0.796177327632904, -0.7393669486045837, -0.6825565099716187, -0.6257461309432983, -0.568935751914978, -0.5121253132820129, -0.4553149342536926, -0.3985045254230499, -0.3416941165924072, -0.2848837077617645, -0.22807331383228302, -0.1712629199028015, -0.11445251107215881, -0.05764210224151611, -0.0008317232131958008, 0.0559786856174469, 0.1127890944480896, 0.1695995032787323, 0.2264098972082138, 0.2832202911376953, 0.340030699968338, 0.3968411087989807, 0.453651487827301, 0.5104619264602661, 0.5672723054885864, 0.6240826845169067, 0.6808931231498718, 0.7377035021781921, 0.7945139408111572, 0.8513243198394775, 0.9081346988677979, 0.9649450778961182, 1.0217554569244385, 1.0785658359527588, 1.135376214981079, 1.1921865940093994, 1.2489970922470093, 1.3058074712753296, 1.36261785030365, 1.4194282293319702, 1.47623872756958]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 19.0, 11.0, 12.0, 42.0, 41.0, 44.0, 71.0, 97.0, 161.0, 248.0, 389.0, 761.0, 1925.0, 5772.0, 31786.0, 670293.0, 3325494.0, 134805.0, 15242.0, 4037.0, 1514.0, 634.0, 287.0, 172.0, 120.0, 76.0, 56.0, 40.0, 30.0, 16.0, 19.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18359375, -0.17790603637695312, -0.17221832275390625, -0.16653060913085938, -0.1608428955078125, -0.15515518188476562, -0.14946746826171875, -0.14377975463867188, -0.138092041015625, -0.13240432739257812, -0.12671661376953125, -0.12102890014648438, -0.1153411865234375, -0.10965347290039062, -0.10396575927734375, -0.09827804565429688, -0.09259033203125, -0.08690261840820312, -0.08121490478515625, -0.07552719116210938, -0.0698394775390625, -0.06415176391601562, -0.05846405029296875, -0.052776336669921875, -0.047088623046875, -0.041400909423828125, -0.03571319580078125, -0.030025482177734375, -0.0243377685546875, -0.018650054931640625, -0.01296234130859375, -0.007274627685546875, -0.0015869140625, 0.004100799560546875, 0.00978851318359375, 0.015476226806640625, 0.0211639404296875, 0.026851654052734375, 0.03253936767578125, 0.038227081298828125, 0.043914794921875, 0.049602508544921875, 0.05529022216796875, 0.060977935791015625, 0.0666656494140625, 0.07235336303710938, 0.07804107666015625, 0.08372879028320312, 0.08941650390625, 0.09510421752929688, 0.10079193115234375, 0.10647964477539062, 0.1121673583984375, 0.11785507202148438, 0.12354278564453125, 0.12923049926757812, 0.134918212890625, 0.14060592651367188, 0.14629364013671875, 0.15198135375976562, 0.1576690673828125, 0.16335678100585938, 0.16904449462890625, 0.17473220825195312, 0.180419921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 12.0, 10.0, 20.0, 23.0, 37.0, 38.0, 58.0, 79.0, 92.0, 104.0, 103.0, 108.0, 70.0, 69.0, 44.0, 38.0, 28.0, 33.0, 17.0, 9.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2685546875, -0.26274871826171875, -0.2569427490234375, -0.25113677978515625, -0.245330810546875, -0.23952484130859375, -0.2337188720703125, -0.22791290283203125, -0.22210693359375, -0.21630096435546875, -0.2104949951171875, -0.20468902587890625, -0.198883056640625, -0.19307708740234375, -0.1872711181640625, -0.18146514892578125, -0.1756591796875, -0.16985321044921875, -0.1640472412109375, -0.15824127197265625, -0.152435302734375, -0.14662933349609375, -0.1408233642578125, -0.13501739501953125, -0.12921142578125, -0.12340545654296875, -0.1175994873046875, -0.11179351806640625, -0.105987548828125, -0.10018157958984375, -0.0943756103515625, -0.08856964111328125, -0.082763671875, -0.07695770263671875, -0.0711517333984375, -0.06534576416015625, -0.059539794921875, -0.05373382568359375, -0.0479278564453125, -0.04212188720703125, -0.03631591796875, -0.03050994873046875, -0.0247039794921875, -0.01889801025390625, -0.013092041015625, -0.00728607177734375, -0.0014801025390625, 0.00432586669921875, 0.0101318359375, 0.01593780517578125, 0.0217437744140625, 0.02754974365234375, 0.033355712890625, 0.03916168212890625, 0.0449676513671875, 0.05077362060546875, 0.05657958984375, 0.06238555908203125, 0.0681915283203125, 0.07399749755859375, 0.079803466796875, 0.08560943603515625, 0.0914154052734375, 0.09722137451171875, 0.10302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 13.0, 11.0, 19.0, 21.0, 27.0, 36.0, 76.0, 122.0, 189.0, 370.0, 894.0, 2475.0, 8909.0, 43807.0, 638513.0, 3361160.0, 109522.0, 19186.0, 5291.0, 1843.0, 788.0, 404.0, 219.0, 125.0, 74.0, 51.0, 33.0, 25.0, 17.0, 12.0, 7.0, 10.0, 6.0, 2.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.187744140625, -0.181915283203125, -0.17608642578125, -0.170257568359375, -0.1644287109375, -0.158599853515625, -0.15277099609375, -0.146942138671875, -0.14111328125, -0.135284423828125, -0.12945556640625, -0.123626708984375, -0.1177978515625, -0.111968994140625, -0.10614013671875, -0.100311279296875, -0.094482421875, -0.088653564453125, -0.08282470703125, -0.076995849609375, -0.0711669921875, -0.065338134765625, -0.05950927734375, -0.053680419921875, -0.0478515625, -0.042022705078125, -0.03619384765625, -0.030364990234375, -0.0245361328125, -0.018707275390625, -0.01287841796875, -0.007049560546875, -0.001220703125, 0.004608154296875, 0.01043701171875, 0.016265869140625, 0.0220947265625, 0.027923583984375, 0.03375244140625, 0.039581298828125, 0.04541015625, 0.051239013671875, 0.05706787109375, 0.062896728515625, 0.0687255859375, 0.074554443359375, 0.08038330078125, 0.086212158203125, 0.092041015625, 0.097869873046875, 0.10369873046875, 0.109527587890625, 0.1153564453125, 0.121185302734375, 0.12701416015625, 0.132843017578125, 0.138671875, 0.144500732421875, 0.15032958984375, 0.156158447265625, 0.1619873046875, 0.167816162109375, 0.17364501953125, 0.179473876953125, 0.185302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 10.0, 15.0, 16.0, 13.0, 33.0, 37.0, 61.0, 105.0, 230.0, 609.0, 1042.0, 912.0, 432.0, 192.0, 102.0, 58.0, 51.0, 41.0, 20.0, 19.0, 17.0, 13.0, 5.0, 9.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16594314575195312, -0.15927886962890625, -0.15261459350585938, -0.1459503173828125, -0.13928604125976562, -0.13262176513671875, -0.12595748901367188, -0.119293212890625, -0.11262893676757812, -0.10596466064453125, -0.09930038452148438, -0.0926361083984375, -0.08597183227539062, -0.07930755615234375, -0.07264328002929688, -0.06597900390625, -0.059314727783203125, -0.05265045166015625, -0.045986175537109375, -0.0393218994140625, -0.032657623291015625, -0.02599334716796875, -0.019329071044921875, -0.012664794921875, -0.006000518798828125, 0.00066375732421875, 0.007328033447265625, 0.0139923095703125, 0.020656585693359375, 0.02732086181640625, 0.033985137939453125, 0.0406494140625, 0.047313690185546875, 0.05397796630859375, 0.060642242431640625, 0.0673065185546875, 0.07397079467773438, 0.08063507080078125, 0.08729934692382812, 0.093963623046875, 0.10062789916992188, 0.10729217529296875, 0.11395645141601562, 0.1206207275390625, 0.12728500366210938, 0.13394927978515625, 0.14061355590820312, 0.14727783203125, 0.15394210815429688, 0.16060638427734375, 0.16727066040039062, 0.1739349365234375, 0.18059921264648438, 0.18726348876953125, 0.19392776489257812, 0.200592041015625, 0.20725631713867188, 0.21392059326171875, 0.22058486938476562, 0.2272491455078125, 0.23391342163085938, 0.24057769775390625, 0.24724197387695312, 0.25390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 18.0, 41.0, 94.0, 210.0, 268.0, 197.0, 91.0, 43.0, 13.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.014565944671631, -1.9520026445388794, -1.8894392251968384, -1.826875925064087, -1.764312505722046, -1.7017492055892944, -1.639185905456543, -1.576622486114502, -1.514059066772461, -1.4514957666397095, -1.3889323472976685, -1.326369047164917, -1.263805627822876, -1.2012423276901245, -1.138679027557373, -1.076115608215332, -1.0135523080825806, -0.9509889483451843, -0.8884255886077881, -0.8258622884750366, -0.7632988691329956, -0.7007355690002441, -0.6381722092628479, -0.5756088495254517, -0.5130454897880554, -0.4504821300506592, -0.38791877031326294, -0.3253554403781891, -0.26279208064079285, -0.2002287209033966, -0.13766539096832275, -0.07510203123092651, -0.012538790702819824, 0.05002456158399582, 0.11258791387081146, 0.1751512587070465, 0.23771461844444275, 0.300277978181839, 0.36284130811691284, 0.4254046678543091, 0.4879680275917053, 0.5505313873291016, 0.6130947470664978, 0.675658106803894, 0.7382214069366455, 0.8007848262786865, 0.863348126411438, 0.9259114861488342, 0.9884748458862305, 1.051038146018982, 1.113601565361023, 1.1761648654937744, 1.2387282848358154, 1.301291584968567, 1.3638548851013184, 1.4264183044433594, 1.4889817237854004, 1.5515450239181519, 1.6141084432601929, 1.6766717433929443, 1.7392351627349854, 1.8017984628677368, 1.8643617630004883, 1.9269251823425293, 1.9894884824752808]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 5.0, 4.0, 9.0, 8.0, 12.0, 16.0, 23.0, 24.0, 22.0, 46.0, 46.0, 47.0, 58.0, 67.0, 61.0, 74.0, 58.0, 63.0, 56.0, 56.0, 55.0, 44.0, 38.0, 24.0, 24.0, 23.0, 8.0, 15.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7212209105491638, -0.6860234141349792, -0.6508259177207947, -0.6156283617019653, -0.5804308652877808, -0.5452333688735962, -0.5100358724594116, -0.47483837604522705, -0.4396408498287201, -0.4044433534145355, -0.36924582719802856, -0.334048330783844, -0.2988508343696594, -0.26365330815315247, -0.2284558117389679, -0.19325830042362213, -0.15806078910827637, -0.1228632777929306, -0.08766577392816544, -0.05246827006340027, -0.017270758748054504, 0.01792675256729126, 0.05312424898147583, 0.0883217602968216, 0.12351927161216736, 0.15871678292751312, 0.1939142942428589, 0.22911179065704346, 0.264309287071228, 0.299506813287735, 0.33470430970191956, 0.3699018359184265, 0.40509939193725586, 0.44029688835144043, 0.4754944145679474, 0.5106918811798096, 0.5458894371986389, 0.5810869336128235, 0.6162844300270081, 0.6514819264411926, 0.686679482460022, 0.7218769788742065, 0.7570744752883911, 0.7922719717025757, 0.827469527721405, 0.8626670241355896, 0.8978645205497742, 0.9330620169639587, 0.9682595133781433, 1.0034570693969727, 1.0386545658111572, 1.0738520622253418, 1.1090495586395264, 1.144247055053711, 1.1794445514678955, 1.21464204788208, 1.2498395442962646, 1.2850370407104492, 1.3202345371246338, 1.3554320335388184, 1.390629529953003, 1.4258270263671875, 1.461024522781372, 1.4962221384048462, 1.5314196348190308]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 8.0, 13.0, 19.0, 31.0, 34.0, 43.0, 57.0, 91.0, 148.0, 269.0, 371.0, 512.0, 827.0, 1328.0, 2168.0, 3888.0, 6837.0, 12653.0, 24614.0, 49564.0, 100206.0, 182891.0, 243787.0, 194956.0, 109760.0, 55021.0, 26907.0, 13635.0, 7287.0, 4193.0, 2400.0, 1413.0, 925.0, 553.0, 388.0, 252.0, 154.0, 103.0, 64.0, 52.0, 39.0, 24.0, 14.0, 16.0, 11.0, 6.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.069091796875, -0.06690311431884766, -0.06471443176269531, -0.06252574920654297, -0.060337066650390625, -0.05814838409423828, -0.05595970153808594, -0.053771018981933594, -0.05158233642578125, -0.049393653869628906, -0.04720497131347656, -0.04501628875732422, -0.042827606201171875, -0.04063892364501953, -0.03845024108886719, -0.036261558532714844, -0.0340728759765625, -0.031884193420410156, -0.029695510864257812, -0.02750682830810547, -0.025318145751953125, -0.02312946319580078, -0.020940780639648438, -0.018752098083496094, -0.01656341552734375, -0.014374732971191406, -0.012186050415039062, -0.009997367858886719, -0.007808685302734375, -0.005620002746582031, -0.0034313201904296875, -0.0012426376342773438, 0.000946044921875, 0.0031347274780273438, 0.0053234100341796875, 0.007512092590332031, 0.009700775146484375, 0.011889457702636719, 0.014078140258789062, 0.016266822814941406, 0.01845550537109375, 0.020644187927246094, 0.022832870483398438, 0.02502155303955078, 0.027210235595703125, 0.02939891815185547, 0.03158760070800781, 0.033776283264160156, 0.0359649658203125, 0.038153648376464844, 0.04034233093261719, 0.04253101348876953, 0.044719696044921875, 0.04690837860107422, 0.04909706115722656, 0.051285743713378906, 0.05347442626953125, 0.055663108825683594, 0.05785179138183594, 0.06004047393798828, 0.062229156494140625, 0.06441783905029297, 0.06660652160644531, 0.06879520416259766, 0.07098388671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 19.0, 13.0, 13.0, 26.0, 23.0, 30.0, 35.0, 30.0, 43.0, 42.0, 50.0, 58.0, 67.0, 61.0, 48.0, 57.0, 68.0, 42.0, 48.0, 40.0, 20.0, 15.0, 27.0, 17.0, 14.0, 9.0, 25.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.115234375, -0.11187267303466797, -0.10851097106933594, -0.1051492691040039, -0.10178756713867188, -0.09842586517333984, -0.09506416320800781, -0.09170246124267578, -0.08834075927734375, -0.08497905731201172, -0.08161735534667969, -0.07825565338134766, -0.07489395141601562, -0.0715322494506836, -0.06817054748535156, -0.06480884552001953, -0.0614471435546875, -0.05808544158935547, -0.05472373962402344, -0.051362037658691406, -0.048000335693359375, -0.044638633728027344, -0.04127693176269531, -0.03791522979736328, -0.03455352783203125, -0.03119182586669922, -0.027830123901367188, -0.024468421936035156, -0.021106719970703125, -0.017745018005371094, -0.014383316040039062, -0.011021614074707031, -0.007659912109375, -0.004298210144042969, -0.0009365081787109375, 0.0024251937866210938, 0.005786895751953125, 0.009148597717285156, 0.012510299682617188, 0.01587200164794922, 0.01923370361328125, 0.02259540557861328, 0.025957107543945312, 0.029318809509277344, 0.032680511474609375, 0.036042213439941406, 0.03940391540527344, 0.04276561737060547, 0.0461273193359375, 0.04948902130126953, 0.05285072326660156, 0.056212425231933594, 0.059574127197265625, 0.06293582916259766, 0.06629753112792969, 0.06965923309326172, 0.07302093505859375, 0.07638263702392578, 0.07974433898925781, 0.08310604095458984, 0.08646774291992188, 0.0898294448852539, 0.09319114685058594, 0.09655284881591797, 0.09991455078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 4.0, 14.0, 24.0, 40.0, 31.0, 39.0, 64.0, 99.0, 107.0, 166.0, 221.0, 308.0, 507.0, 830.0, 1842.0, 7054.0, 75239.0, 860427.0, 89399.0, 7765.0, 1901.0, 843.0, 525.0, 295.0, 224.0, 162.0, 97.0, 90.0, 47.0, 51.0, 25.0, 28.0, 15.0, 15.0, 16.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.3304176330566406, -0.32025909423828125, -0.3101005554199219, -0.2999420166015625, -0.2897834777832031, -0.27962493896484375, -0.2694664001464844, -0.259307861328125, -0.24914932250976562, -0.23899078369140625, -0.22883224487304688, -0.2186737060546875, -0.20851516723632812, -0.19835662841796875, -0.18819808959960938, -0.17803955078125, -0.16788101196289062, -0.15772247314453125, -0.14756393432617188, -0.1374053955078125, -0.12724685668945312, -0.11708831787109375, -0.10692977905273438, -0.096771240234375, -0.08661270141601562, -0.07645416259765625, -0.06629562377929688, -0.0561370849609375, -0.045978546142578125, -0.03582000732421875, -0.025661468505859375, -0.0155029296875, -0.005344390869140625, 0.00481414794921875, 0.014972686767578125, 0.0251312255859375, 0.035289764404296875, 0.04544830322265625, 0.055606842041015625, 0.065765380859375, 0.07592391967773438, 0.08608245849609375, 0.09624099731445312, 0.1063995361328125, 0.11655807495117188, 0.12671661376953125, 0.13687515258789062, 0.14703369140625, 0.15719223022460938, 0.16735076904296875, 0.17750930786132812, 0.1876678466796875, 0.19782638549804688, 0.20798492431640625, 0.21814346313476562, 0.228302001953125, 0.23846054077148438, 0.24861907958984375, 0.2587776184082031, 0.2689361572265625, 0.2790946960449219, 0.28925323486328125, 0.2994117736816406, 0.3095703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 8.0, 15.0, 4.0, 10.0, 15.0, 18.0, 16.0, 18.0, 28.0, 31.0, 39.0, 59.0, 50.0, 41.0, 59.0, 60.0, 51.0, 67.0, 63.0, 47.0, 59.0, 44.0, 34.0, 39.0, 31.0, 24.0, 12.0, 12.0, 10.0, 10.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5546875, -0.5394172668457031, -0.5241470336914062, -0.5088768005371094, -0.4936065673828125, -0.4783363342285156, -0.46306610107421875, -0.4477958679199219, -0.432525634765625, -0.4172554016113281, -0.40198516845703125, -0.3867149353027344, -0.3714447021484375, -0.3561744689941406, -0.34090423583984375, -0.3256340026855469, -0.31036376953125, -0.2950935363769531, -0.27982330322265625, -0.2645530700683594, -0.2492828369140625, -0.23401260375976562, -0.21874237060546875, -0.20347213745117188, -0.188201904296875, -0.17293167114257812, -0.15766143798828125, -0.14239120483398438, -0.1271209716796875, -0.11185073852539062, -0.09658050537109375, -0.08131027221679688, -0.0660400390625, -0.050769805908203125, -0.03549957275390625, -0.020229339599609375, -0.0049591064453125, 0.010311126708984375, 0.02558135986328125, 0.040851593017578125, 0.056121826171875, 0.07139205932617188, 0.08666229248046875, 0.10193252563476562, 0.1172027587890625, 0.13247299194335938, 0.14774322509765625, 0.16301345825195312, 0.17828369140625, 0.19355392456054688, 0.20882415771484375, 0.22409439086914062, 0.2393646240234375, 0.2546348571777344, 0.26990509033203125, 0.2851753234863281, 0.300445556640625, 0.3157157897949219, 0.33098602294921875, 0.3462562561035156, 0.3615264892578125, 0.3767967224121094, 0.39206695556640625, 0.4073371887207031, 0.422607421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 14.0, 7.0, 16.0, 16.0, 21.0, 36.0, 50.0, 58.0, 100.0, 120.0, 238.0, 354.0, 665.0, 1125.0, 1997.0, 4113.0, 9325.0, 26780.0, 133848.0, 689891.0, 134382.0, 26984.0, 9317.0, 4257.0, 2038.0, 1066.0, 647.0, 396.0, 220.0, 145.0, 95.0, 58.0, 52.0, 36.0, 22.0, 18.0, 8.0, 10.0, 7.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0635986328125, -0.06157970428466797, -0.05956077575683594, -0.057541847229003906, -0.055522918701171875, -0.053503990173339844, -0.05148506164550781, -0.04946613311767578, -0.04744720458984375, -0.04542827606201172, -0.04340934753417969, -0.041390419006347656, -0.039371490478515625, -0.037352561950683594, -0.03533363342285156, -0.03331470489501953, -0.0312957763671875, -0.02927684783935547, -0.027257919311523438, -0.025238990783691406, -0.023220062255859375, -0.021201133728027344, -0.019182205200195312, -0.01716327667236328, -0.01514434814453125, -0.013125419616699219, -0.011106491088867188, -0.009087562561035156, -0.007068634033203125, -0.005049705505371094, -0.0030307769775390625, -0.0010118484497070312, 0.001007080078125, 0.0030260086059570312, 0.0050449371337890625, 0.007063865661621094, 0.009082794189453125, 0.011101722717285156, 0.013120651245117188, 0.015139579772949219, 0.01715850830078125, 0.01917743682861328, 0.021196365356445312, 0.023215293884277344, 0.025234222412109375, 0.027253150939941406, 0.029272079467773438, 0.03129100799560547, 0.0333099365234375, 0.03532886505126953, 0.03734779357910156, 0.039366722106933594, 0.041385650634765625, 0.043404579162597656, 0.04542350769042969, 0.04744243621826172, 0.04946136474609375, 0.05148029327392578, 0.05349922180175781, 0.055518150329589844, 0.057537078857421875, 0.059556007385253906, 0.06157493591308594, 0.06359386444091797, 0.06561279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 3.0, 10.0, 10.0, 21.0, 27.0, 37.0, 49.0, 46.0, 76.0, 112.0, 102.0, 107.0, 108.0, 73.0, 50.0, 36.0, 21.0, 29.0, 10.0, 16.0, 6.0, 8.0, 9.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6597251892089844e-05, -3.492087125778198e-05, -3.324449062347412e-05, -3.156810998916626e-05, -2.98917293548584e-05, -2.8215348720550537e-05, -2.6538968086242676e-05, -2.4862587451934814e-05, -2.3186206817626953e-05, -2.1509826183319092e-05, -1.983344554901123e-05, -1.815706491470337e-05, -1.6480684280395508e-05, -1.4804303646087646e-05, -1.3127923011779785e-05, -1.1451542377471924e-05, -9.775161743164062e-06, -8.098781108856201e-06, -6.42240047454834e-06, -4.7460198402404785e-06, -3.069639205932617e-06, -1.3932585716247559e-06, 2.8312206268310547e-07, 1.959502696990967e-06, 3.635883331298828e-06, 5.3122639656066895e-06, 6.988644599914551e-06, 8.665025234222412e-06, 1.0341405868530273e-05, 1.2017786502838135e-05, 1.3694167137145996e-05, 1.5370547771453857e-05, 1.704692840576172e-05, 1.872330904006958e-05, 2.039968967437744e-05, 2.2076070308685303e-05, 2.3752450942993164e-05, 2.5428831577301025e-05, 2.7105212211608887e-05, 2.8781592845916748e-05, 3.045797348022461e-05, 3.213435411453247e-05, 3.381073474884033e-05, 3.548711538314819e-05, 3.7163496017456055e-05, 3.8839876651763916e-05, 4.051625728607178e-05, 4.219263792037964e-05, 4.38690185546875e-05, 4.554539918899536e-05, 4.722177982330322e-05, 4.8898160457611084e-05, 5.0574541091918945e-05, 5.225092172622681e-05, 5.392730236053467e-05, 5.560368299484253e-05, 5.728006362915039e-05, 5.895644426345825e-05, 6.063282489776611e-05, 6.230920553207397e-05, 6.398558616638184e-05, 6.56619668006897e-05, 6.733834743499756e-05, 6.901472806930542e-05, 7.069110870361328e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 6.0, 10.0, 14.0, 16.0, 18.0, 32.0, 34.0, 55.0, 72.0, 121.0, 189.0, 248.0, 436.0, 703.0, 1449.0, 2748.0, 6026.0, 15561.0, 61828.0, 559409.0, 329060.0, 46565.0, 13170.0, 5299.0, 2424.0, 1216.0, 668.0, 363.0, 246.0, 156.0, 104.0, 85.0, 52.0, 28.0, 23.0, 14.0, 20.0, 14.0, 19.0, 4.0, 8.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0587158203125, -0.05675315856933594, -0.054790496826171875, -0.05282783508300781, -0.05086517333984375, -0.04890251159667969, -0.046939849853515625, -0.04497718811035156, -0.0430145263671875, -0.04105186462402344, -0.039089202880859375, -0.03712654113769531, -0.03516387939453125, -0.03320121765136719, -0.031238555908203125, -0.029275894165039062, -0.027313232421875, -0.025350570678710938, -0.023387908935546875, -0.021425247192382812, -0.01946258544921875, -0.017499923706054688, -0.015537261962890625, -0.013574600219726562, -0.0116119384765625, -0.009649276733398438, -0.007686614990234375, -0.0057239532470703125, -0.00376129150390625, -0.0017986297607421875, 0.000164031982421875, 0.0021266937255859375, 0.00408935546875, 0.0060520172119140625, 0.008014678955078125, 0.009977340698242188, 0.01194000244140625, 0.013902664184570312, 0.015865325927734375, 0.017827987670898438, 0.0197906494140625, 0.021753311157226562, 0.023715972900390625, 0.025678634643554688, 0.02764129638671875, 0.029603958129882812, 0.031566619873046875, 0.03352928161621094, 0.035491943359375, 0.03745460510253906, 0.039417266845703125, 0.04137992858886719, 0.04334259033203125, 0.04530525207519531, 0.047267913818359375, 0.04923057556152344, 0.0511932373046875, 0.05315589904785156, 0.055118560791015625, 0.05708122253417969, 0.05904388427734375, 0.06100654602050781, 0.06296920776367188, 0.06493186950683594, 0.06689453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 29.0, 29.0, 25.0, 60.0, 64.0, 68.0, 75.0, 72.0, 76.0, 77.0, 66.0, 52.0, 66.0, 37.0, 41.0, 24.0, 17.0, 10.0, 10.0, 13.0, 7.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059661865234375, -0.0573582649230957, -0.055054664611816406, -0.05275106430053711, -0.05044746398925781, -0.048143863677978516, -0.04584026336669922, -0.04353666305541992, -0.041233062744140625, -0.03892946243286133, -0.03662586212158203, -0.034322261810302734, -0.03201866149902344, -0.02971506118774414, -0.027411460876464844, -0.025107860565185547, -0.02280426025390625, -0.020500659942626953, -0.018197059631347656, -0.01589345932006836, -0.013589859008789062, -0.011286258697509766, -0.008982658386230469, -0.006679058074951172, -0.004375457763671875, -0.002071857452392578, 0.00023174285888671875, 0.0025353431701660156, 0.0048389434814453125, 0.007142543792724609, 0.009446144104003906, 0.011749744415283203, 0.0140533447265625, 0.016356945037841797, 0.018660545349121094, 0.02096414566040039, 0.023267745971679688, 0.025571346282958984, 0.02787494659423828, 0.030178546905517578, 0.032482147216796875, 0.03478574752807617, 0.03708934783935547, 0.039392948150634766, 0.04169654846191406, 0.04400014877319336, 0.046303749084472656, 0.04860734939575195, 0.05091094970703125, 0.05321455001831055, 0.055518150329589844, 0.05782175064086914, 0.06012535095214844, 0.062428951263427734, 0.06473255157470703, 0.06703615188598633, 0.06933975219726562, 0.07164335250854492, 0.07394695281982422, 0.07625055313110352, 0.07855415344238281, 0.08085775375366211, 0.0831613540649414, 0.0854649543762207, 0.0877685546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 9.0, 44.0, 153.0, 492.0, 237.0, 42.0, 16.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28227424621582, -5.1458940505981445, -5.009513854980469, -4.873133659362793, -4.736753463745117, -4.600373268127441, -4.463993072509766, -4.327612400054932, -4.191232204437256, -4.05485200881958, -3.9184718132019043, -3.7820916175842285, -3.6457111835479736, -3.509330987930298, -3.372950792312622, -3.2365705966949463, -3.1001904010772705, -2.9638102054595947, -2.827430009841919, -2.691049575805664, -2.5546693801879883, -2.4182891845703125, -2.2819089889526367, -2.145528793334961, -2.009148597717285, -1.8727684020996094, -1.736388087272644, -1.6000078916549683, -1.463627576828003, -1.3272473812103271, -1.1908671855926514, -1.0544869899749756, -0.9181063175201416, -0.781726062297821, -0.6453458070755005, -0.5089656114578247, -0.37258535623550415, -0.2362051010131836, -0.09982490539550781, 0.036555349826812744, 0.1729356050491333, 0.30931586027145386, 0.445696085691452, 0.5820763111114502, 0.7184565663337708, 0.8548368215560913, 0.9912170171737671, 1.1275973320007324, 1.2639775276184082, 1.400357723236084, 1.5367380380630493, 1.673118233680725, 1.8094985485076904, 1.9458787441253662, 2.082258939743042, 2.2186391353607178, 2.3550195693969727, 2.4913997650146484, 2.627779960632324, 2.76416015625, 2.900540590286255, 3.0369207859039307, 3.1733009815216064, 3.3096811771392822, 3.446061372756958]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 6.0, 4.0, 9.0, 12.0, 10.0, 24.0, 23.0, 21.0, 31.0, 21.0, 35.0, 46.0, 32.0, 51.0, 64.0, 76.0, 66.0, 56.0, 53.0, 39.0, 42.0, 39.0, 33.0, 31.0, 28.0, 19.0, 19.0, 16.0, 14.0, 19.0, 10.0, 8.0, 7.0, 5.0, 8.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3647549152374268, -1.3149229288101196, -1.2650909423828125, -1.2152589559555054, -1.1654269695281982, -1.1155951023101807, -1.0657631158828735, -1.0159311294555664, -0.9660991430282593, -0.9162671566009521, -0.866435170173645, -0.8166032433509827, -0.7667712569236755, -0.7169392704963684, -0.667107343673706, -0.6172753572463989, -0.5674433708190918, -0.5176113843917847, -0.4677794277667999, -0.4179474711418152, -0.36811548471450806, -0.3182834982872009, -0.2684515416622162, -0.21861958503723145, -0.16878759860992432, -0.11895562708377838, -0.06912365555763245, -0.01929168403148651, 0.030540287494659424, 0.08037225902080536, 0.1302042305469513, 0.18003618717193604, 0.2298680543899536, 0.27970004081726074, 0.3295319974422455, 0.3793639540672302, 0.42919594049453735, 0.4790279269218445, 0.5288598537445068, 0.578691840171814, 0.6285238265991211, 0.6783558130264282, 0.7281877994537354, 0.7780197262763977, 0.8278517127037048, 0.877683699131012, 0.9275156259536743, 0.9773476123809814, 1.0271795988082886, 1.0770115852355957, 1.1268435716629028, 1.17667555809021, 1.2265074253082275, 1.2763394117355347, 1.3261713981628418, 1.376003384590149, 1.425835371017456, 1.4756673574447632, 1.5254993438720703, 1.5753313302993774, 1.6251633167266846, 1.6749951839447021, 1.7248271703720093, 1.7746591567993164, 1.8244911432266235]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 19.0, 24.0, 45.0, 72.0, 118.0, 180.0, 320.0, 638.0, 1331.0, 3576.0, 12619.0, 70933.0, 761820.0, 2830092.0, 449841.0, 47231.0, 10051.0, 2975.0, 1092.0, 549.0, 279.0, 176.0, 102.0, 68.0, 42.0, 26.0, 18.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.140380859375, -0.13690567016601562, -0.13343048095703125, -0.12995529174804688, -0.1264801025390625, -0.12300491333007812, -0.11952972412109375, -0.11605453491210938, -0.112579345703125, -0.10910415649414062, -0.10562896728515625, -0.10215377807617188, -0.0986785888671875, -0.09520339965820312, -0.09172821044921875, -0.08825302124023438, -0.08477783203125, -0.08130264282226562, -0.07782745361328125, -0.07435226440429688, -0.0708770751953125, -0.06740188598632812, -0.06392669677734375, -0.060451507568359375, -0.056976318359375, -0.053501129150390625, -0.05002593994140625, -0.046550750732421875, -0.0430755615234375, -0.039600372314453125, -0.03612518310546875, -0.032649993896484375, -0.0291748046875, -0.025699615478515625, -0.02222442626953125, -0.018749237060546875, -0.0152740478515625, -0.011798858642578125, -0.00832366943359375, -0.004848480224609375, -0.001373291015625, 0.002101898193359375, 0.00557708740234375, 0.009052276611328125, 0.0125274658203125, 0.016002655029296875, 0.01947784423828125, 0.022953033447265625, 0.02642822265625, 0.029903411865234375, 0.03337860107421875, 0.036853790283203125, 0.0403289794921875, 0.043804168701171875, 0.04727935791015625, 0.050754547119140625, 0.054229736328125, 0.057704925537109375, 0.06118011474609375, 0.06465530395507812, 0.0681304931640625, 0.07160568237304688, 0.07508087158203125, 0.07855606079101562, 0.08203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 8.0, 10.0, 16.0, 17.0, 19.0, 23.0, 30.0, 30.0, 48.0, 47.0, 51.0, 53.0, 49.0, 57.0, 61.0, 68.0, 53.0, 54.0, 44.0, 55.0, 37.0, 24.0, 23.0, 20.0, 24.0, 19.0, 17.0, 9.0, 5.0, 8.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1279296875, -0.12450313568115234, -0.12107658386230469, -0.11765003204345703, -0.11422348022460938, -0.11079692840576172, -0.10737037658691406, -0.1039438247680664, -0.10051727294921875, -0.0970907211303711, -0.09366416931152344, -0.09023761749267578, -0.08681106567382812, -0.08338451385498047, -0.07995796203613281, -0.07653141021728516, -0.0731048583984375, -0.06967830657958984, -0.06625175476074219, -0.06282520294189453, -0.059398651123046875, -0.05597209930419922, -0.05254554748535156, -0.049118995666503906, -0.04569244384765625, -0.042265892028808594, -0.03883934020996094, -0.03541278839111328, -0.031986236572265625, -0.02855968475341797, -0.025133132934570312, -0.021706581115722656, -0.018280029296875, -0.014853477478027344, -0.011426925659179688, -0.008000373840332031, -0.004573822021484375, -0.0011472702026367188, 0.0022792816162109375, 0.005705833435058594, 0.00913238525390625, 0.012558937072753906, 0.015985488891601562, 0.01941204071044922, 0.022838592529296875, 0.02626514434814453, 0.029691696166992188, 0.033118247985839844, 0.0365447998046875, 0.039971351623535156, 0.04339790344238281, 0.04682445526123047, 0.050251007080078125, 0.05367755889892578, 0.05710411071777344, 0.060530662536621094, 0.06395721435546875, 0.0673837661743164, 0.07081031799316406, 0.07423686981201172, 0.07766342163085938, 0.08108997344970703, 0.08451652526855469, 0.08794307708740234, 0.09136962890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 19.0, 30.0, 42.0, 62.0, 116.0, 210.0, 491.0, 1380.0, 5966.0, 46306.0, 2637082.0, 1453441.0, 39236.0, 6631.0, 1760.0, 638.0, 333.0, 193.0, 105.0, 90.0, 51.0, 24.0, 19.0, 13.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18220138549804688, -0.17543792724609375, -0.16867446899414062, -0.1619110107421875, -0.15514755249023438, -0.14838409423828125, -0.14162063598632812, -0.134857177734375, -0.12809371948242188, -0.12133026123046875, -0.11456680297851562, -0.1078033447265625, -0.10103988647460938, -0.09427642822265625, -0.08751296997070312, -0.08074951171875, -0.07398605346679688, -0.06722259521484375, -0.060459136962890625, -0.0536956787109375, -0.046932220458984375, -0.04016876220703125, -0.033405303955078125, -0.026641845703125, -0.019878387451171875, -0.01311492919921875, -0.006351470947265625, 0.0004119873046875, 0.007175445556640625, 0.01393890380859375, 0.020702362060546875, 0.0274658203125, 0.034229278564453125, 0.04099273681640625, 0.047756195068359375, 0.0545196533203125, 0.061283111572265625, 0.06804656982421875, 0.07481002807617188, 0.081573486328125, 0.08833694458007812, 0.09510040283203125, 0.10186386108398438, 0.1086273193359375, 0.11539077758789062, 0.12215423583984375, 0.12891769409179688, 0.13568115234375, 0.14244461059570312, 0.14920806884765625, 0.15597152709960938, 0.1627349853515625, 0.16949844360351562, 0.17626190185546875, 0.18302536010742188, 0.189788818359375, 0.19655227661132812, 0.20331573486328125, 0.21007919311523438, 0.2168426513671875, 0.22360610961914062, 0.23036956787109375, 0.23713302612304688, 0.243896484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 17.0, 18.0, 41.0, 49.0, 89.0, 188.0, 493.0, 987.0, 1059.0, 549.0, 245.0, 107.0, 69.0, 45.0, 28.0, 15.0, 12.0, 8.0, 10.0, 8.0, 3.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1968994140625, -0.18987464904785156, -0.18284988403320312, -0.1758251190185547, -0.16880035400390625, -0.1617755889892578, -0.15475082397460938, -0.14772605895996094, -0.1407012939453125, -0.13367652893066406, -0.12665176391601562, -0.11962699890136719, -0.11260223388671875, -0.10557746887207031, -0.09855270385742188, -0.09152793884277344, -0.084503173828125, -0.07747840881347656, -0.07045364379882812, -0.06342887878417969, -0.05640411376953125, -0.04937934875488281, -0.042354583740234375, -0.03532981872558594, -0.0283050537109375, -0.021280288696289062, -0.014255523681640625, -0.0072307586669921875, -0.00020599365234375, 0.0068187713623046875, 0.013843536376953125, 0.020868301391601562, 0.02789306640625, 0.03491783142089844, 0.041942596435546875, 0.04896736145019531, 0.05599212646484375, 0.06301689147949219, 0.07004165649414062, 0.07706642150878906, 0.0840911865234375, 0.09111595153808594, 0.09814071655273438, 0.10516548156738281, 0.11219024658203125, 0.11921501159667969, 0.12623977661132812, 0.13326454162597656, 0.140289306640625, 0.14731407165527344, 0.15433883666992188, 0.1613636016845703, 0.16838836669921875, 0.1754131317138672, 0.18243789672851562, 0.18946266174316406, 0.1964874267578125, 0.20351219177246094, 0.21053695678710938, 0.2175617218017578, 0.22458648681640625, 0.2316112518310547, 0.23863601684570312, 0.24566078186035156, 0.252685546875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 18.0, 49.0, 148.0, 243.0, 263.0, 149.0, 58.0, 24.0, 10.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.006287097930908, -2.943056344985962, -2.8798258304595947, -2.8165950775146484, -2.7533645629882812, -2.690133810043335, -2.6269030570983887, -2.5636725425720215, -2.500441789627075, -2.437211036682129, -2.3739805221557617, -2.3107497692108154, -2.247519016265869, -2.184288501739502, -2.1210577487945557, -2.0578272342681885, -1.9945964813232422, -1.9313658475875854, -1.8681352138519287, -1.8049044609069824, -1.7416738271713257, -1.678443193435669, -1.6152124404907227, -1.551981806755066, -1.4887511730194092, -1.4255205392837524, -1.3622899055480957, -1.2990591526031494, -1.2358285188674927, -1.172597885131836, -1.1093671321868896, -1.046136498451233, -0.9829059839248657, -0.919675350189209, -0.8564446568489075, -0.793213963508606, -0.7299833297729492, -0.6667526960372925, -0.603522002696991, -0.5402913093566895, -0.4770606756210327, -0.4138300120830536, -0.35059934854507446, -0.28736868500709534, -0.2241380214691162, -0.16090735793113708, -0.09767669439315796, -0.03444603085517883, 0.028784632682800293, 0.09201529622077942, 0.15524595975875854, 0.21847662329673767, 0.2817072868347168, 0.3449379503726959, 0.40816861391067505, 0.4713992774486542, 0.5346299409866333, 0.59786057472229, 0.6610912680625916, 0.7243219614028931, 0.7875525951385498, 0.8507832288742065, 0.9140139222145081, 0.9772446155548096, 1.0404752492904663]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 12.0, 8.0, 14.0, 16.0, 18.0, 26.0, 22.0, 32.0, 35.0, 45.0, 52.0, 53.0, 38.0, 45.0, 55.0, 50.0, 57.0, 55.0, 38.0, 37.0, 48.0, 32.0, 29.0, 27.0, 21.0, 18.0, 26.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7946150898933411, -0.7675920724868774, -0.7405691146850586, -0.713546097278595, -0.6865230798721313, -0.6595000624656677, -0.6324770450592041, -0.6054540872573853, -0.5784310698509216, -0.551408052444458, -0.5243850946426392, -0.49736207723617554, -0.4703390598297119, -0.4433160424232483, -0.41629305481910706, -0.3892700672149658, -0.3622470498085022, -0.3352240324020386, -0.30820104479789734, -0.2811780571937561, -0.2541550397872925, -0.22713203728199005, -0.20010903477668762, -0.1730860322713852, -0.14606302976608276, -0.11904002726078033, -0.0920170247554779, -0.06499402225017548, -0.03797101974487305, -0.010948017239570618, 0.01607498526573181, 0.04309798777103424, 0.0701209306716919, 0.09714393317699432, 0.12416693568229675, 0.15118993818759918, 0.1782129406929016, 0.20523594319820404, 0.23225894570350647, 0.2592819333076477, 0.28630495071411133, 0.31332796812057495, 0.3403509557247162, 0.3673739433288574, 0.39439696073532104, 0.42141997814178467, 0.4484429657459259, 0.47546595335006714, 0.5024889707565308, 0.5295119881629944, 0.556535005569458, 0.5835579633712769, 0.6105809807777405, 0.6376039981842041, 0.664626955986023, 0.6916499733924866, 0.7186729907989502, 0.7456960082054138, 0.7727190256118774, 0.7997419834136963, 0.8267650008201599, 0.8537880182266235, 0.8808109760284424, 0.907833993434906, 0.9348570108413696]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 10.0, 7.0, 5.0, 11.0, 22.0, 27.0, 33.0, 62.0, 79.0, 115.0, 166.0, 236.0, 390.0, 629.0, 924.0, 1544.0, 2423.0, 4066.0, 6855.0, 11802.0, 20516.0, 35765.0, 61733.0, 103554.0, 163118.0, 202800.0, 168355.0, 109053.0, 64756.0, 37061.0, 21510.0, 12348.0, 7173.0, 4289.0, 2537.0, 1621.0, 1047.0, 620.0, 439.0, 297.0, 178.0, 133.0, 64.0, 63.0, 39.0, 15.0, 19.0, 16.0, 8.0, 13.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.06524658203125, -0.06330156326293945, -0.061356544494628906, -0.05941152572631836, -0.05746650695800781, -0.055521488189697266, -0.05357646942138672, -0.05163145065307617, -0.049686431884765625, -0.04774141311645508, -0.04579639434814453, -0.043851375579833984, -0.04190635681152344, -0.03996133804321289, -0.038016319274902344, -0.0360713005065918, -0.03412628173828125, -0.0321812629699707, -0.030236244201660156, -0.02829122543334961, -0.026346206665039062, -0.024401187896728516, -0.02245616912841797, -0.020511150360107422, -0.018566131591796875, -0.016621112823486328, -0.014676094055175781, -0.012731075286865234, -0.010786056518554688, -0.00884103775024414, -0.006896018981933594, -0.004951000213623047, -0.0030059814453125, -0.0010609626770019531, 0.0008840560913085938, 0.0028290748596191406, 0.0047740936279296875, 0.006719112396240234, 0.008664131164550781, 0.010609149932861328, 0.012554168701171875, 0.014499187469482422, 0.01644420623779297, 0.018389225006103516, 0.020334243774414062, 0.02227926254272461, 0.024224281311035156, 0.026169300079345703, 0.02811431884765625, 0.030059337615966797, 0.032004356384277344, 0.03394937515258789, 0.03589439392089844, 0.037839412689208984, 0.03978443145751953, 0.04172945022583008, 0.043674468994140625, 0.04561948776245117, 0.04756450653076172, 0.049509525299072266, 0.05145454406738281, 0.05339956283569336, 0.055344581604003906, 0.05728960037231445, 0.059234619140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 4.0, 13.0, 11.0, 17.0, 19.0, 28.0, 30.0, 36.0, 50.0, 34.0, 60.0, 42.0, 59.0, 68.0, 62.0, 55.0, 60.0, 64.0, 57.0, 35.0, 34.0, 25.0, 34.0, 24.0, 23.0, 10.0, 18.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1268310546875, -0.12324714660644531, -0.11966323852539062, -0.11607933044433594, -0.11249542236328125, -0.10891151428222656, -0.10532760620117188, -0.10174369812011719, -0.0981597900390625, -0.09457588195800781, -0.09099197387695312, -0.08740806579589844, -0.08382415771484375, -0.08024024963378906, -0.07665634155273438, -0.07307243347167969, -0.069488525390625, -0.06590461730957031, -0.062320709228515625, -0.05873680114746094, -0.05515289306640625, -0.05156898498535156, -0.047985076904296875, -0.04440116882324219, -0.0408172607421875, -0.03723335266113281, -0.033649444580078125, -0.030065536499023438, -0.02648162841796875, -0.022897720336914062, -0.019313812255859375, -0.015729904174804688, -0.01214599609375, -0.008562088012695312, -0.004978179931640625, -0.0013942718505859375, 0.00218963623046875, 0.0057735443115234375, 0.009357452392578125, 0.012941360473632812, 0.0165252685546875, 0.020109176635742188, 0.023693084716796875, 0.027276992797851562, 0.03086090087890625, 0.03444480895996094, 0.038028717041015625, 0.04161262512207031, 0.045196533203125, 0.04878044128417969, 0.052364349365234375, 0.05594825744628906, 0.05953216552734375, 0.06311607360839844, 0.06669998168945312, 0.07028388977050781, 0.0738677978515625, 0.07745170593261719, 0.08103561401367188, 0.08461952209472656, 0.08820343017578125, 0.09178733825683594, 0.09537124633789062, 0.09895515441894531, 0.1025390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 9.0, 16.0, 15.0, 21.0, 31.0, 54.0, 73.0, 94.0, 128.0, 175.0, 230.0, 384.0, 540.0, 1078.0, 2311.0, 9678.0, 104328.0, 812785.0, 101916.0, 9664.0, 2266.0, 1013.0, 542.0, 346.0, 216.0, 194.0, 111.0, 77.0, 60.0, 50.0, 46.0, 24.0, 21.0, 9.0, 12.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2614860534667969, -0.25197601318359375, -0.24246597290039062, -0.2329559326171875, -0.22344589233398438, -0.21393585205078125, -0.20442581176757812, -0.194915771484375, -0.18540573120117188, -0.17589569091796875, -0.16638565063476562, -0.1568756103515625, -0.14736557006835938, -0.13785552978515625, -0.12834548950195312, -0.11883544921875, -0.10932540893554688, -0.09981536865234375, -0.09030532836914062, -0.0807952880859375, -0.07128524780273438, -0.06177520751953125, -0.052265167236328125, -0.042755126953125, -0.033245086669921875, -0.02373504638671875, -0.014225006103515625, -0.0047149658203125, 0.004795074462890625, 0.01430511474609375, 0.023815155029296875, 0.0333251953125, 0.042835235595703125, 0.05234527587890625, 0.061855316162109375, 0.0713653564453125, 0.08087539672851562, 0.09038543701171875, 0.09989547729492188, 0.109405517578125, 0.11891555786132812, 0.12842559814453125, 0.13793563842773438, 0.1474456787109375, 0.15695571899414062, 0.16646575927734375, 0.17597579956054688, 0.18548583984375, 0.19499588012695312, 0.20450592041015625, 0.21401596069335938, 0.2235260009765625, 0.23303604125976562, 0.24254608154296875, 0.2520561218261719, 0.261566162109375, 0.2710762023925781, 0.28058624267578125, 0.2900962829589844, 0.2996063232421875, 0.3091163635253906, 0.31862640380859375, 0.3281364440917969, 0.337646484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 12.0, 11.0, 17.0, 21.0, 14.0, 21.0, 30.0, 29.0, 34.0, 47.0, 43.0, 43.0, 59.0, 55.0, 60.0, 57.0, 50.0, 60.0, 53.0, 35.0, 37.0, 38.0, 31.0, 21.0, 16.0, 21.0, 12.0, 12.0, 9.0, 8.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.281829833984375, -0.26947021484375, -0.257110595703125, -0.2447509765625, -0.232391357421875, -0.22003173828125, -0.207672119140625, -0.1953125, -0.182952880859375, -0.17059326171875, -0.158233642578125, -0.1458740234375, -0.133514404296875, -0.12115478515625, -0.108795166015625, -0.096435546875, -0.084075927734375, -0.07171630859375, -0.059356689453125, -0.0469970703125, -0.034637451171875, -0.02227783203125, -0.009918212890625, 0.00244140625, 0.014801025390625, 0.02716064453125, 0.039520263671875, 0.0518798828125, 0.064239501953125, 0.07659912109375, 0.088958740234375, 0.101318359375, 0.113677978515625, 0.12603759765625, 0.138397216796875, 0.1507568359375, 0.163116455078125, 0.17547607421875, 0.187835693359375, 0.2001953125, 0.212554931640625, 0.22491455078125, 0.237274169921875, 0.2496337890625, 0.261993408203125, 0.27435302734375, 0.286712646484375, 0.299072265625, 0.311431884765625, 0.32379150390625, 0.336151123046875, 0.3485107421875, 0.360870361328125, 0.37322998046875, 0.385589599609375, 0.39794921875, 0.410308837890625, 0.42266845703125, 0.435028076171875, 0.4473876953125, 0.459747314453125, 0.47210693359375, 0.484466552734375, 0.496826171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 8.0, 16.0, 16.0, 23.0, 27.0, 37.0, 51.0, 97.0, 123.0, 256.0, 453.0, 888.0, 1817.0, 4407.0, 13150.0, 53313.0, 318406.0, 559332.0, 70364.0, 16373.0, 5218.0, 1991.0, 906.0, 505.0, 287.0, 171.0, 101.0, 67.0, 36.0, 38.0, 22.0, 14.0, 15.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06888961791992188, -0.06667327880859375, -0.06445693969726562, -0.0622406005859375, -0.060024261474609375, -0.05780792236328125, -0.055591583251953125, -0.053375244140625, -0.051158905029296875, -0.04894256591796875, -0.046726226806640625, -0.0445098876953125, -0.042293548583984375, -0.04007720947265625, -0.037860870361328125, -0.03564453125, -0.033428192138671875, -0.03121185302734375, -0.028995513916015625, -0.0267791748046875, -0.024562835693359375, -0.02234649658203125, -0.020130157470703125, -0.017913818359375, -0.015697479248046875, -0.01348114013671875, -0.011264801025390625, -0.0090484619140625, -0.006832122802734375, -0.00461578369140625, -0.002399444580078125, -0.00018310546875, 0.002033233642578125, 0.00424957275390625, 0.006465911865234375, 0.0086822509765625, 0.010898590087890625, 0.01311492919921875, 0.015331268310546875, 0.017547607421875, 0.019763946533203125, 0.02198028564453125, 0.024196624755859375, 0.0264129638671875, 0.028629302978515625, 0.03084564208984375, 0.033061981201171875, 0.0352783203125, 0.037494659423828125, 0.03971099853515625, 0.041927337646484375, 0.0441436767578125, 0.046360015869140625, 0.04857635498046875, 0.050792694091796875, 0.053009033203125, 0.055225372314453125, 0.05744171142578125, 0.059658050537109375, 0.0618743896484375, 0.06409072875976562, 0.06630706787109375, 0.06852340698242188, 0.07073974609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 0.0, 2.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 6.0, 10.0, 10.0, 7.0, 14.0, 20.0, 30.0, 28.0, 26.0, 53.0, 69.0, 78.0, 95.0, 101.0, 83.0, 79.0, 62.0, 45.0, 26.0, 27.0, 16.0, 17.0, 16.0, 12.0, 3.0, 6.0, 8.0, 7.0, 7.0, 3.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.227327346801758e-05, -5.0661154091358185e-05, -4.904903471469879e-05, -4.74369153380394e-05, -4.5824795961380005e-05, -4.421267658472061e-05, -4.260055720806122e-05, -4.0988437831401825e-05, -3.937631845474243e-05, -3.776419907808304e-05, -3.6152079701423645e-05, -3.453996032476425e-05, -3.292784094810486e-05, -3.1315721571445465e-05, -2.9703602194786072e-05, -2.809148281812668e-05, -2.6479363441467285e-05, -2.4867244064807892e-05, -2.32551246881485e-05, -2.1643005311489105e-05, -2.0030885934829712e-05, -1.841876655817032e-05, -1.6806647181510925e-05, -1.5194527804851532e-05, -1.3582408428192139e-05, -1.1970289051532745e-05, -1.0358169674873352e-05, -8.746050298213959e-06, -7.1339309215545654e-06, -5.521811544895172e-06, -3.909692168235779e-06, -2.2975727915763855e-06, -6.854534149169922e-07, 9.266659617424011e-07, 2.5387853384017944e-06, 4.150904715061188e-06, 5.763024091720581e-06, 7.375143468379974e-06, 8.987262845039368e-06, 1.0599382221698761e-05, 1.2211501598358154e-05, 1.3823620975017548e-05, 1.543574035167694e-05, 1.7047859728336334e-05, 1.8659979104995728e-05, 2.027209848165512e-05, 2.1884217858314514e-05, 2.3496337234973907e-05, 2.51084566116333e-05, 2.6720575988292694e-05, 2.8332695364952087e-05, 2.994481474161148e-05, 3.1556934118270874e-05, 3.316905349493027e-05, 3.478117287158966e-05, 3.6393292248249054e-05, 3.800541162490845e-05, 3.961753100156784e-05, 4.1229650378227234e-05, 4.284176975488663e-05, 4.445388913154602e-05, 4.6066008508205414e-05, 4.767812788486481e-05, 4.92902472615242e-05, 5.0902366638183594e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 2.0, 7.0, 9.0, 7.0, 6.0, 14.0, 27.0, 34.0, 49.0, 72.0, 143.0, 223.0, 438.0, 764.0, 1438.0, 3576.0, 11125.0, 52283.0, 510219.0, 399832.0, 50749.0, 10896.0, 3473.0, 1470.0, 668.0, 416.0, 222.0, 134.0, 75.0, 50.0, 44.0, 24.0, 17.0, 12.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.083984375, -0.0816507339477539, -0.07931709289550781, -0.07698345184326172, -0.07464981079101562, -0.07231616973876953, -0.06998252868652344, -0.06764888763427734, -0.06531524658203125, -0.06298160552978516, -0.06064796447753906, -0.05831432342529297, -0.055980682373046875, -0.05364704132080078, -0.05131340026855469, -0.048979759216308594, -0.0466461181640625, -0.044312477111816406, -0.04197883605957031, -0.03964519500732422, -0.037311553955078125, -0.03497791290283203, -0.03264427185058594, -0.030310630798339844, -0.02797698974609375, -0.025643348693847656, -0.023309707641601562, -0.02097606658935547, -0.018642425537109375, -0.01630878448486328, -0.013975143432617188, -0.011641502380371094, -0.009307861328125, -0.006974220275878906, -0.0046405792236328125, -0.0023069381713867188, 2.6702880859375e-05, 0.0023603439331054688, 0.0046939849853515625, 0.007027626037597656, 0.00936126708984375, 0.011694908142089844, 0.014028549194335938, 0.01636219024658203, 0.018695831298828125, 0.02102947235107422, 0.023363113403320312, 0.025696754455566406, 0.0280303955078125, 0.030364036560058594, 0.03269767761230469, 0.03503131866455078, 0.037364959716796875, 0.03969860076904297, 0.04203224182128906, 0.044365882873535156, 0.04669952392578125, 0.049033164978027344, 0.05136680603027344, 0.05370044708251953, 0.056034088134765625, 0.05836772918701172, 0.06070137023925781, 0.0630350112915039, 0.06536865234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 8.0, 9.0, 10.0, 18.0, 27.0, 31.0, 49.0, 59.0, 71.0, 59.0, 83.0, 91.0, 97.0, 77.0, 70.0, 57.0, 34.0, 39.0, 24.0, 16.0, 15.0, 7.0, 11.0, 10.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08868408203125, -0.0861978530883789, -0.08371162414550781, -0.08122539520263672, -0.07873916625976562, -0.07625293731689453, -0.07376670837402344, -0.07128047943115234, -0.06879425048828125, -0.06630802154541016, -0.06382179260253906, -0.06133556365966797, -0.058849334716796875, -0.05636310577392578, -0.05387687683105469, -0.051390647888183594, -0.0489044189453125, -0.046418190002441406, -0.04393196105957031, -0.04144573211669922, -0.038959503173828125, -0.03647327423095703, -0.03398704528808594, -0.031500816345214844, -0.02901458740234375, -0.026528358459472656, -0.024042129516601562, -0.02155590057373047, -0.019069671630859375, -0.01658344268798828, -0.014097213745117188, -0.011610984802246094, -0.009124755859375, -0.006638526916503906, -0.0041522979736328125, -0.0016660690307617188, 0.000820159912109375, 0.0033063888549804688, 0.0057926177978515625, 0.008278846740722656, 0.01076507568359375, 0.013251304626464844, 0.015737533569335938, 0.01822376251220703, 0.020709991455078125, 0.02319622039794922, 0.025682449340820312, 0.028168678283691406, 0.0306549072265625, 0.033141136169433594, 0.03562736511230469, 0.03811359405517578, 0.040599822998046875, 0.04308605194091797, 0.04557228088378906, 0.048058509826660156, 0.05054473876953125, 0.053030967712402344, 0.05551719665527344, 0.05800342559814453, 0.060489654541015625, 0.06297588348388672, 0.06546211242675781, 0.0679483413696289, 0.0704345703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 16.0, 37.0, 59.0, 125.0, 194.0, 309.0, 128.0, 54.0, 32.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1691173315048218, -1.1052755117416382, -1.0414338111877441, -0.9775919914245605, -0.9137502908706665, -0.8499084711074829, -0.7860667109489441, -0.7222249507904053, -0.6583831906318665, -0.5945414304733276, -0.5306996703147888, -0.4668578803539276, -0.4030161201953888, -0.33917436003685, -0.27533257007598877, -0.21149080991744995, -0.14764904975891113, -0.08380728214979172, -0.019965514540672302, 0.04387626051902771, 0.10771802067756653, 0.17155978083610535, 0.23540157079696655, 0.29924333095550537, 0.3630850911140442, 0.426926851272583, 0.4907686114311218, 0.5546103715896606, 0.6184521913528442, 0.6822938919067383, 0.7461357116699219, 0.8099774718284607, 0.87381911277771, 0.9376608729362488, 1.0015026330947876, 1.0653444528579712, 1.1291861534118652, 1.1930279731750488, 1.2568697929382324, 1.3207114934921265, 1.3845531940460205, 1.448395013809204, 1.5122367143630981, 1.5760785341262817, 1.6399202346801758, 1.7037620544433594, 1.767603874206543, 1.831445574760437, 1.8952873945236206, 1.9591292142868042, 2.0229709148406982, 2.086812734603882, 2.1506545543670654, 2.21449613571167, 2.2783379554748535, 2.342179775238037, 2.4060215950012207, 2.4698634147644043, 2.533705234527588, 2.5975468158721924, 2.661388635635376, 2.7252304553985596, 2.789072275161743, 2.8529138565063477, 2.9167556762695312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 13.0, 18.0, 10.0, 16.0, 15.0, 21.0, 17.0, 27.0, 34.0, 26.0, 35.0, 30.0, 33.0, 60.0, 77.0, 68.0, 55.0, 41.0, 37.0, 41.0, 39.0, 32.0, 18.0, 21.0, 25.0, 23.0, 19.0, 14.0, 19.0, 13.0, 12.0, 5.0, 4.0, 10.0, 2.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.3760292530059814, -1.334822416305542, -1.2936155796051025, -1.2524088621139526, -1.2112020254135132, -1.1699951887130737, -1.1287884712219238, -1.0875816345214844, -1.046374797821045, -1.0051679611206055, -0.9639611840248108, -0.9227544069290161, -0.8815475702285767, -0.8403407335281372, -0.7991339564323425, -0.7579271793365479, -0.7167203426361084, -0.675513505935669, -0.6343067288398743, -0.5930999517440796, -0.5518931150436401, -0.5106862783432007, -0.469479501247406, -0.42827269434928894, -0.3870658874511719, -0.3458590805530548, -0.30465227365493774, -0.2634454667568207, -0.2222386598587036, -0.18103185296058655, -0.13982504606246948, -0.09861823916435242, -0.05741143226623535, -0.016204625368118286, 0.02500218152999878, 0.06620898842811584, 0.10741579532623291, 0.14862260222434998, 0.18982940912246704, 0.2310362160205841, 0.27224302291870117, 0.31344982981681824, 0.3546566367149353, 0.39586344361305237, 0.43707025051116943, 0.4782770574092865, 0.5194838643074036, 0.5606906414031982, 0.6018974781036377, 0.6431043148040771, 0.6843110918998718, 0.7255178689956665, 0.766724705696106, 0.8079315423965454, 0.8491383194923401, 0.8903450965881348, 0.9315519332885742, 0.9727587699890137, 1.0139656066894531, 1.055172324180603, 1.0963791608810425, 1.137585997581482, 1.1787927150726318, 1.2199995517730713, 1.2612063884735107]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 17.0, 21.0, 31.0, 52.0, 74.0, 96.0, 165.0, 239.0, 403.0, 748.0, 1827.0, 5343.0, 23953.0, 183521.0, 2011857.0, 1784221.0, 151240.0, 21146.0, 5549.0, 1922.0, 764.0, 383.0, 234.0, 153.0, 103.0, 68.0, 38.0, 29.0, 18.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.12451171875, -0.12095069885253906, -0.11738967895507812, -0.11382865905761719, -0.11026763916015625, -0.10670661926269531, -0.10314559936523438, -0.09958457946777344, -0.0960235595703125, -0.09246253967285156, -0.08890151977539062, -0.08534049987792969, -0.08177947998046875, -0.07821846008300781, -0.07465744018554688, -0.07109642028808594, -0.067535400390625, -0.06397438049316406, -0.060413360595703125, -0.05685234069824219, -0.05329132080078125, -0.04973030090332031, -0.046169281005859375, -0.04260826110839844, -0.0390472412109375, -0.03548622131347656, -0.031925201416015625, -0.028364181518554688, -0.02480316162109375, -0.021242141723632812, -0.017681121826171875, -0.014120101928710938, -0.01055908203125, -0.0069980621337890625, -0.003437042236328125, 0.0001239776611328125, 0.00368499755859375, 0.0072460174560546875, 0.010807037353515625, 0.014368057250976562, 0.0179290771484375, 0.021490097045898438, 0.025051116943359375, 0.028612136840820312, 0.03217315673828125, 0.03573417663574219, 0.039295196533203125, 0.04285621643066406, 0.046417236328125, 0.04997825622558594, 0.053539276123046875, 0.05710029602050781, 0.06066131591796875, 0.06422233581542969, 0.06778335571289062, 0.07134437561035156, 0.0749053955078125, 0.07846641540527344, 0.08202743530273438, 0.08558845520019531, 0.08914947509765625, 0.09271049499511719, 0.09627151489257812, 0.09983253479003906, 0.1033935546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 13.0, 15.0, 26.0, 29.0, 37.0, 46.0, 45.0, 65.0, 54.0, 54.0, 56.0, 68.0, 60.0, 70.0, 58.0, 48.0, 43.0, 39.0, 39.0, 24.0, 31.0, 21.0, 16.0, 13.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1368408203125, -0.13320446014404297, -0.12956809997558594, -0.1259317398071289, -0.12229537963867188, -0.11865901947021484, -0.11502265930175781, -0.11138629913330078, -0.10774993896484375, -0.10411357879638672, -0.10047721862792969, -0.09684085845947266, -0.09320449829101562, -0.0895681381225586, -0.08593177795410156, -0.08229541778564453, -0.0786590576171875, -0.07502269744873047, -0.07138633728027344, -0.0677499771118164, -0.06411361694335938, -0.060477256774902344, -0.05684089660644531, -0.05320453643798828, -0.04956817626953125, -0.04593181610107422, -0.04229545593261719, -0.038659095764160156, -0.035022735595703125, -0.031386375427246094, -0.027750015258789062, -0.02411365509033203, -0.020477294921875, -0.01684093475341797, -0.013204574584960938, -0.009568214416503906, -0.005931854248046875, -0.0022954940795898438, 0.0013408660888671875, 0.004977226257324219, 0.00861358642578125, 0.012249946594238281, 0.015886306762695312, 0.019522666931152344, 0.023159027099609375, 0.026795387268066406, 0.030431747436523438, 0.03406810760498047, 0.0377044677734375, 0.04134082794189453, 0.04497718811035156, 0.048613548278808594, 0.052249908447265625, 0.055886268615722656, 0.05952262878417969, 0.06315898895263672, 0.06679534912109375, 0.07043170928955078, 0.07406806945800781, 0.07770442962646484, 0.08134078979492188, 0.0849771499633789, 0.08861351013183594, 0.09224987030029297, 0.09588623046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 11.0, 14.0, 17.0, 33.0, 61.0, 67.0, 118.0, 201.0, 336.0, 660.0, 2262.0, 21291.0, 3799107.0, 360489.0, 6963.0, 1253.0, 468.0, 298.0, 218.0, 154.0, 97.0, 69.0, 29.0, 24.0, 21.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42431640625, -0.41246795654296875, -0.4006195068359375, -0.38877105712890625, -0.376922607421875, -0.36507415771484375, -0.3532257080078125, -0.34137725830078125, -0.32952880859375, -0.31768035888671875, -0.3058319091796875, -0.29398345947265625, -0.282135009765625, -0.27028656005859375, -0.2584381103515625, -0.24658966064453125, -0.2347412109375, -0.22289276123046875, -0.2110443115234375, -0.19919586181640625, -0.187347412109375, -0.17549896240234375, -0.1636505126953125, -0.15180206298828125, -0.13995361328125, -0.12810516357421875, -0.1162567138671875, -0.10440826416015625, -0.092559814453125, -0.08071136474609375, -0.0688629150390625, -0.05701446533203125, -0.045166015625, -0.03331756591796875, -0.0214691162109375, -0.00962066650390625, 0.002227783203125, 0.01407623291015625, 0.0259246826171875, 0.03777313232421875, 0.04962158203125, 0.06147003173828125, 0.0733184814453125, 0.08516693115234375, 0.097015380859375, 0.10886383056640625, 0.1207122802734375, 0.13256072998046875, 0.1444091796875, 0.15625762939453125, 0.1681060791015625, 0.17995452880859375, 0.191802978515625, 0.20365142822265625, 0.2154998779296875, 0.22734832763671875, 0.23919677734375, 0.25104522705078125, 0.2628936767578125, 0.27474212646484375, 0.286590576171875, 0.29843902587890625, 0.3102874755859375, 0.32213592529296875, 0.333984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 16.0, 22.0, 33.0, 53.0, 130.0, 325.0, 1118.0, 1382.0, 638.0, 186.0, 67.0, 46.0, 23.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1553955078125, -0.1451396942138672, -0.13488388061523438, -0.12462806701660156, -0.11437225341796875, -0.10411643981933594, -0.09386062622070312, -0.08360481262207031, -0.0733489990234375, -0.06309318542480469, -0.052837371826171875, -0.04258155822753906, -0.03232574462890625, -0.022069931030273438, -0.011814117431640625, -0.0015583038330078125, 0.008697509765625, 0.018953323364257812, 0.029209136962890625, 0.03946495056152344, 0.04972076416015625, 0.05997657775878906, 0.07023239135742188, 0.08048820495605469, 0.0907440185546875, 0.10099983215332031, 0.11125564575195312, 0.12151145935058594, 0.13176727294921875, 0.14202308654785156, 0.15227890014648438, 0.1625347137451172, 0.17279052734375, 0.1830463409423828, 0.19330215454101562, 0.20355796813964844, 0.21381378173828125, 0.22406959533691406, 0.23432540893554688, 0.2445812225341797, 0.2548370361328125, 0.2650928497314453, 0.2753486633300781, 0.28560447692871094, 0.29586029052734375, 0.30611610412597656, 0.3163719177246094, 0.3266277313232422, 0.336883544921875, 0.3471393585205078, 0.3573951721191406, 0.36765098571777344, 0.37790679931640625, 0.38816261291503906, 0.3984184265136719, 0.4086742401123047, 0.4189300537109375, 0.4291858673095703, 0.4394416809082031, 0.44969749450683594, 0.45995330810546875, 0.47020912170410156, 0.4804649353027344, 0.4907207489013672, 0.5009765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 21.0, 40.0, 58.0, 100.0, 192.0, 192.0, 155.0, 91.0, 50.0, 29.0, 18.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6926915645599365, -1.6430004835128784, -1.5933094024658203, -1.5436183214187622, -1.493927240371704, -1.444236159324646, -1.394545078277588, -1.3448539972305298, -1.2951629161834717, -1.2454718351364136, -1.1957807540893555, -1.1460896730422974, -1.0963985919952393, -1.0467075109481812, -0.997016429901123, -0.9473253488540649, -0.8976342678070068, -0.8479431867599487, -0.7982521057128906, -0.7485610246658325, -0.6988699436187744, -0.6491788625717163, -0.5994877815246582, -0.5497967004776001, -0.500105619430542, -0.4504145383834839, -0.4007234573364258, -0.3510323762893677, -0.30134129524230957, -0.25165021419525146, -0.20195913314819336, -0.15226805210113525, -0.1025770902633667, -0.052886009216308594, -0.0031949281692504883, 0.04649615287780762, 0.09618723392486572, 0.14587831497192383, 0.19556939601898193, 0.24526047706604004, 0.29495155811309814, 0.34464263916015625, 0.39433372020721436, 0.44402480125427246, 0.49371588230133057, 0.5434069633483887, 0.5930980443954468, 0.6427891254425049, 0.692480206489563, 0.7421712875366211, 0.7918623685836792, 0.8415534496307373, 0.8912445306777954, 0.9409356117248535, 0.9906266927719116, 1.0403177738189697, 1.0900088548660278, 1.139699935913086, 1.189391016960144, 1.2390820980072021, 1.2887731790542603, 1.3384642601013184, 1.3881553411483765, 1.4378464221954346, 1.4875375032424927]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 17.0, 22.0, 28.0, 34.0, 25.0, 27.0, 41.0, 50.0, 40.0, 51.0, 40.0, 51.0, 41.0, 46.0, 40.0, 54.0, 45.0, 40.0, 34.0, 42.0, 29.0, 28.0, 14.0, 29.0, 8.0, 15.0, 12.0, 13.0, 12.0, 5.0, 6.0, 3.0, 7.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0612034797668457, -1.0328896045684814, -1.0045758485794067, -0.9762619733810425, -0.9479480981826782, -0.9196342825889587, -0.8913204669952393, -0.863006591796875, -0.8346927165985107, -0.8063789010047913, -0.778065025806427, -0.7497512102127075, -0.7214373350143433, -0.6931235194206238, -0.6648097038269043, -0.63649582862854, -0.6081820130348206, -0.5798681974411011, -0.5515543222427368, -0.5232405066490173, -0.4949266314506531, -0.4666128158569336, -0.4382989704608917, -0.40998512506484985, -0.381671279668808, -0.3533574342727661, -0.32504358887672424, -0.2967297434806824, -0.2684159278869629, -0.24010206758975983, -0.21178823709487915, -0.18347439169883728, -0.15516048669815063, -0.12684664130210876, -0.09853280335664749, -0.07021896541118622, -0.04190512001514435, -0.013591274619102478, 0.014722555875778198, 0.04303640127182007, 0.07135024666786194, 0.09966409206390381, 0.12797793745994568, 0.15629176795482635, 0.18460561335086823, 0.2129194587469101, 0.24123328924179077, 0.26954713463783264, 0.2978609800338745, 0.3261748254299164, 0.35448867082595825, 0.38280248641967773, 0.411116361618042, 0.4394301772117615, 0.46774402260780334, 0.4960578680038452, 0.5243717432022095, 0.552685558795929, 0.5809994339942932, 0.6093132495880127, 0.637627124786377, 0.6659409403800964, 0.6942547559738159, 0.7225686311721802, 0.7508824467658997]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 11.0, 12.0, 22.0, 32.0, 51.0, 53.0, 114.0, 155.0, 238.0, 361.0, 533.0, 807.0, 1318.0, 2086.0, 3574.0, 6294.0, 11526.0, 21723.0, 42127.0, 82722.0, 150509.0, 226814.0, 214682.0, 132910.0, 71037.0, 36102.0, 18722.0, 10093.0, 5476.0, 3213.0, 1923.0, 1195.0, 669.0, 504.0, 287.0, 196.0, 148.0, 88.0, 60.0, 49.0, 27.0, 28.0, 20.0, 18.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07720947265625, -0.07478809356689453, -0.07236671447753906, -0.0699453353881836, -0.06752395629882812, -0.06510257720947266, -0.06268119812011719, -0.06025981903076172, -0.05783843994140625, -0.05541706085205078, -0.05299568176269531, -0.050574302673339844, -0.048152923583984375, -0.045731544494628906, -0.04331016540527344, -0.04088878631591797, -0.0384674072265625, -0.03604602813720703, -0.03362464904785156, -0.031203269958496094, -0.028781890869140625, -0.026360511779785156, -0.023939132690429688, -0.02151775360107422, -0.01909637451171875, -0.01667499542236328, -0.014253616333007812, -0.011832237243652344, -0.009410858154296875, -0.006989479064941406, -0.0045680999755859375, -0.0021467208862304688, 0.000274658203125, 0.0026960372924804688, 0.0051174163818359375, 0.007538795471191406, 0.009960174560546875, 0.012381553649902344, 0.014802932739257812, 0.01722431182861328, 0.01964569091796875, 0.02206707000732422, 0.024488449096679688, 0.026909828186035156, 0.029331207275390625, 0.031752586364746094, 0.03417396545410156, 0.03659534454345703, 0.0390167236328125, 0.04143810272216797, 0.04385948181152344, 0.046280860900878906, 0.048702239990234375, 0.051123619079589844, 0.05354499816894531, 0.05596637725830078, 0.05838775634765625, 0.06080913543701172, 0.06323051452636719, 0.06565189361572266, 0.06807327270507812, 0.0704946517944336, 0.07291603088378906, 0.07533740997314453, 0.0777587890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 29.0, 19.0, 24.0, 42.0, 47.0, 40.0, 44.0, 49.0, 57.0, 57.0, 67.0, 66.0, 57.0, 60.0, 53.0, 49.0, 35.0, 35.0, 32.0, 36.0, 23.0, 17.0, 16.0, 8.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1353759765625, -0.13173294067382812, -0.12808990478515625, -0.12444686889648438, -0.1208038330078125, -0.11716079711914062, -0.11351776123046875, -0.10987472534179688, -0.106231689453125, -0.10258865356445312, -0.09894561767578125, -0.09530258178710938, -0.0916595458984375, -0.08801651000976562, -0.08437347412109375, -0.08073043823242188, -0.07708740234375, -0.07344436645507812, -0.06980133056640625, -0.06615829467773438, -0.0625152587890625, -0.058872222900390625, -0.05522918701171875, -0.051586151123046875, -0.047943115234375, -0.044300079345703125, -0.04065704345703125, -0.037014007568359375, -0.0333709716796875, -0.029727935791015625, -0.02608489990234375, -0.022441864013671875, -0.018798828125, -0.015155792236328125, -0.01151275634765625, -0.007869720458984375, -0.0042266845703125, -0.000583648681640625, 0.00305938720703125, 0.006702423095703125, 0.010345458984375, 0.013988494873046875, 0.01763153076171875, 0.021274566650390625, 0.0249176025390625, 0.028560638427734375, 0.03220367431640625, 0.035846710205078125, 0.03948974609375, 0.043132781982421875, 0.04677581787109375, 0.050418853759765625, 0.0540618896484375, 0.057704925537109375, 0.06134796142578125, 0.06499099731445312, 0.068634033203125, 0.07227706909179688, 0.07592010498046875, 0.07956314086914062, 0.0832061767578125, 0.08684921264648438, 0.09049224853515625, 0.09413528442382812, 0.0977783203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 10.0, 9.0, 13.0, 12.0, 18.0, 35.0, 44.0, 69.0, 65.0, 100.0, 162.0, 237.0, 416.0, 1062.0, 2720.0, 9716.0, 45393.0, 256048.0, 610161.0, 96289.0, 18221.0, 4546.0, 1507.0, 652.0, 333.0, 198.0, 129.0, 77.0, 69.0, 49.0, 41.0, 24.0, 17.0, 17.0, 18.0, 12.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18626976013183594, -0.17966842651367188, -0.1730670928955078, -0.16646575927734375, -0.1598644256591797, -0.15326309204101562, -0.14666175842285156, -0.1400604248046875, -0.13345909118652344, -0.12685775756835938, -0.12025642395019531, -0.11365509033203125, -0.10705375671386719, -0.10045242309570312, -0.09385108947753906, -0.087249755859375, -0.08064842224121094, -0.07404708862304688, -0.06744575500488281, -0.06084442138671875, -0.05424308776855469, -0.047641754150390625, -0.04104042053222656, -0.0344390869140625, -0.027837753295898438, -0.021236419677734375, -0.014635086059570312, -0.00803375244140625, -0.0014324188232421875, 0.005168914794921875, 0.011770248413085938, 0.01837158203125, 0.024972915649414062, 0.031574249267578125, 0.03817558288574219, 0.04477691650390625, 0.05137825012207031, 0.057979583740234375, 0.06458091735839844, 0.0711822509765625, 0.07778358459472656, 0.08438491821289062, 0.09098625183105469, 0.09758758544921875, 0.10418891906738281, 0.11079025268554688, 0.11739158630371094, 0.123992919921875, 0.13059425354003906, 0.13719558715820312, 0.1437969207763672, 0.15039825439453125, 0.1569995880126953, 0.16360092163085938, 0.17020225524902344, 0.1768035888671875, 0.18340492248535156, 0.19000625610351562, 0.1966075897216797, 0.20320892333984375, 0.2098102569580078, 0.21641159057617188, 0.22301292419433594, 0.2296142578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 10.0, 8.0, 15.0, 9.0, 16.0, 13.0, 19.0, 24.0, 23.0, 41.0, 33.0, 42.0, 32.0, 42.0, 53.0, 45.0, 49.0, 58.0, 49.0, 43.0, 39.0, 47.0, 31.0, 40.0, 35.0, 24.0, 24.0, 25.0, 20.0, 12.0, 16.0, 6.0, 10.0, 10.0, 5.0, 4.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267578125, -0.2579994201660156, -0.24842071533203125, -0.23884201049804688, -0.2292633056640625, -0.21968460083007812, -0.21010589599609375, -0.20052719116210938, -0.190948486328125, -0.18136978149414062, -0.17179107666015625, -0.16221237182617188, -0.1526336669921875, -0.14305496215820312, -0.13347625732421875, -0.12389755249023438, -0.11431884765625, -0.10474014282226562, -0.09516143798828125, -0.08558273315429688, -0.0760040283203125, -0.06642532348632812, -0.05684661865234375, -0.047267913818359375, -0.037689208984375, -0.028110504150390625, -0.01853179931640625, -0.008953094482421875, 0.0006256103515625, 0.010204315185546875, 0.01978302001953125, 0.029361724853515625, 0.0389404296875, 0.048519134521484375, 0.05809783935546875, 0.06767654418945312, 0.0772552490234375, 0.08683395385742188, 0.09641265869140625, 0.10599136352539062, 0.115570068359375, 0.12514877319335938, 0.13472747802734375, 0.14430618286132812, 0.1538848876953125, 0.16346359252929688, 0.17304229736328125, 0.18262100219726562, 0.19219970703125, 0.20177841186523438, 0.21135711669921875, 0.22093582153320312, 0.2305145263671875, 0.24009323120117188, 0.24967193603515625, 0.2592506408691406, 0.268829345703125, 0.2784080505371094, 0.28798675537109375, 0.2975654602050781, 0.3071441650390625, 0.3167228698730469, 0.32630157470703125, 0.3358802795410156, 0.345458984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 3.0, 10.0, 7.0, 22.0, 21.0, 35.0, 44.0, 66.0, 74.0, 145.0, 225.0, 341.0, 585.0, 1078.0, 2042.0, 4062.0, 9630.0, 24833.0, 76381.0, 268753.0, 506857.0, 100031.0, 31355.0, 11690.0, 4920.0, 2410.0, 1103.0, 675.0, 368.0, 261.0, 160.0, 114.0, 78.0, 44.0, 30.0, 22.0, 18.0, 14.0, 13.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 6.0, 1.0], "bins": [-0.06805419921875, -0.06622028350830078, -0.06438636779785156, -0.06255245208740234, -0.060718536376953125, -0.058884620666503906, -0.05705070495605469, -0.05521678924560547, -0.05338287353515625, -0.05154895782470703, -0.04971504211425781, -0.047881126403808594, -0.046047210693359375, -0.044213294982910156, -0.04237937927246094, -0.04054546356201172, -0.0387115478515625, -0.03687763214111328, -0.03504371643066406, -0.033209800720214844, -0.031375885009765625, -0.029541969299316406, -0.027708053588867188, -0.02587413787841797, -0.02404022216796875, -0.02220630645751953, -0.020372390747070312, -0.018538475036621094, -0.016704559326171875, -0.014870643615722656, -0.013036727905273438, -0.011202812194824219, -0.009368896484375, -0.007534980773925781, -0.0057010650634765625, -0.0038671493530273438, -0.002033233642578125, -0.00019931793212890625, 0.0016345977783203125, 0.0034685134887695312, 0.00530242919921875, 0.007136344909667969, 0.008970260620117188, 0.010804176330566406, 0.012638092041015625, 0.014472007751464844, 0.016305923461914062, 0.01813983917236328, 0.0199737548828125, 0.02180767059326172, 0.023641586303710938, 0.025475502014160156, 0.027309417724609375, 0.029143333435058594, 0.030977249145507812, 0.03281116485595703, 0.03464508056640625, 0.03647899627685547, 0.03831291198730469, 0.040146827697753906, 0.041980743408203125, 0.043814659118652344, 0.04564857482910156, 0.04748249053955078, 0.04931640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 4.0, 7.0, 11.0, 11.0, 27.0, 42.0, 54.0, 74.0, 83.0, 96.0, 119.0, 98.0, 98.0, 70.0, 69.0, 41.0, 24.0, 16.0, 16.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.929304122924805e-05, -4.795379936695099e-05, -4.661455750465393e-05, -4.527531564235687e-05, -4.3936073780059814e-05, -4.2596831917762756e-05, -4.12575900554657e-05, -3.991834819316864e-05, -3.857910633087158e-05, -3.7239864468574524e-05, -3.5900622606277466e-05, -3.456138074398041e-05, -3.322213888168335e-05, -3.188289701938629e-05, -3.0543655157089233e-05, -2.9204413294792175e-05, -2.7865171432495117e-05, -2.652592957019806e-05, -2.5186687707901e-05, -2.3847445845603943e-05, -2.2508203983306885e-05, -2.1168962121009827e-05, -1.982972025871277e-05, -1.849047839641571e-05, -1.7151236534118652e-05, -1.5811994671821594e-05, -1.4472752809524536e-05, -1.3133510947227478e-05, -1.179426908493042e-05, -1.0455027222633362e-05, -9.115785360336304e-06, -7.776543498039246e-06, -6.4373016357421875e-06, -5.098059773445129e-06, -3.7588179111480713e-06, -2.419576048851013e-06, -1.080334186553955e-06, 2.5890767574310303e-07, 1.5981495380401611e-06, 2.9373914003372192e-06, 4.276633262634277e-06, 5.6158751249313354e-06, 6.9551169872283936e-06, 8.294358849525452e-06, 9.63360071182251e-06, 1.0972842574119568e-05, 1.2312084436416626e-05, 1.3651326298713684e-05, 1.4990568161010742e-05, 1.63298100233078e-05, 1.766905188560486e-05, 1.9008293747901917e-05, 2.0347535610198975e-05, 2.1686777472496033e-05, 2.302601933479309e-05, 2.436526119709015e-05, 2.5704503059387207e-05, 2.7043744921684265e-05, 2.8382986783981323e-05, 2.972222864627838e-05, 3.106147050857544e-05, 3.24007123708725e-05, 3.3739954233169556e-05, 3.5079196095466614e-05, 3.641843795776367e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 15.0, 12.0, 31.0, 44.0, 87.0, 161.0, 404.0, 1086.0, 3202.0, 12832.0, 69203.0, 606003.0, 298139.0, 44489.0, 8846.0, 2547.0, 776.0, 344.0, 139.0, 67.0, 42.0, 30.0, 13.0, 10.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07598876953125, -0.07305240631103516, -0.07011604309082031, -0.06717967987060547, -0.06424331665039062, -0.06130695343017578, -0.05837059020996094, -0.055434226989746094, -0.05249786376953125, -0.049561500549316406, -0.04662513732910156, -0.04368877410888672, -0.040752410888671875, -0.03781604766845703, -0.03487968444824219, -0.031943321228027344, -0.0290069580078125, -0.026070594787597656, -0.023134231567382812, -0.02019786834716797, -0.017261505126953125, -0.014325141906738281, -0.011388778686523438, -0.008452415466308594, -0.00551605224609375, -0.0025796890258789062, 0.0003566741943359375, 0.0032930374145507812, 0.006229400634765625, 0.009165763854980469, 0.012102127075195312, 0.015038490295410156, 0.017974853515625, 0.020911216735839844, 0.023847579956054688, 0.02678394317626953, 0.029720306396484375, 0.03265666961669922, 0.03559303283691406, 0.038529396057128906, 0.04146575927734375, 0.044402122497558594, 0.04733848571777344, 0.05027484893798828, 0.053211212158203125, 0.05614757537841797, 0.05908393859863281, 0.062020301818847656, 0.0649566650390625, 0.06789302825927734, 0.07082939147949219, 0.07376575469970703, 0.07670211791992188, 0.07963848114013672, 0.08257484436035156, 0.0855112075805664, 0.08844757080078125, 0.0913839340209961, 0.09432029724121094, 0.09725666046142578, 0.10019302368164062, 0.10312938690185547, 0.10606575012207031, 0.10900211334228516, 0.1119384765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 10.0, 14.0, 17.0, 21.0, 42.0, 46.0, 58.0, 53.0, 68.0, 74.0, 84.0, 83.0, 83.0, 89.0, 46.0, 53.0, 39.0, 35.0, 15.0, 21.0, 8.0, 14.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09307861328125, -0.09049606323242188, -0.08791351318359375, -0.08533096313476562, -0.0827484130859375, -0.08016586303710938, -0.07758331298828125, -0.07500076293945312, -0.072418212890625, -0.06983566284179688, -0.06725311279296875, -0.06467056274414062, -0.0620880126953125, -0.059505462646484375, -0.05692291259765625, -0.054340362548828125, -0.0517578125, -0.049175262451171875, -0.04659271240234375, -0.044010162353515625, -0.0414276123046875, -0.038845062255859375, -0.03626251220703125, -0.033679962158203125, -0.031097412109375, -0.028514862060546875, -0.02593231201171875, -0.023349761962890625, -0.0207672119140625, -0.018184661865234375, -0.01560211181640625, -0.013019561767578125, -0.01043701171875, -0.007854461669921875, -0.00527191162109375, -0.002689361572265625, -0.0001068115234375, 0.002475738525390625, 0.00505828857421875, 0.007640838623046875, 0.010223388671875, 0.012805938720703125, 0.01538848876953125, 0.017971038818359375, 0.0205535888671875, 0.023136138916015625, 0.02571868896484375, 0.028301239013671875, 0.0308837890625, 0.033466339111328125, 0.03604888916015625, 0.038631439208984375, 0.0412139892578125, 0.043796539306640625, 0.04637908935546875, 0.048961639404296875, 0.051544189453125, 0.054126739501953125, 0.05670928955078125, 0.059291839599609375, 0.0618743896484375, 0.06445693969726562, 0.06703948974609375, 0.06962203979492188, 0.07220458984375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 15.0, 35.0, 66.0, 94.0, 185.0, 275.0, 160.0, 60.0, 51.0, 21.0, 9.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5156450271606445, -2.453484296798706, -2.3913238048553467, -2.329163074493408, -2.267002582550049, -2.2048418521881104, -2.142681360244751, -2.0805206298828125, -2.018360137939453, -1.9561995267868042, -1.8940389156341553, -1.8318783044815063, -1.7697176933288574, -1.707556962966919, -1.6453964710235596, -1.583235740661621, -1.5210750102996826, -1.4589143991470337, -1.3967537879943848, -1.3345931768417358, -1.272432565689087, -1.2102718353271484, -1.148111343383789, -1.0859506130218506, -1.0237901210784912, -0.9616295099258423, -0.8994688987731934, -0.8373082876205444, -0.7751476168632507, -0.7129870057106018, -0.6508263945579529, -0.5886657238006592, -0.5265051126480103, -0.46434450149536133, -0.40218386054039, -0.3400232493877411, -0.2778626084327698, -0.21570199728012085, -0.15354138612747192, -0.09138074517250061, -0.029220134019851685, 0.03294048830866814, 0.09510111063718796, 0.15726172924041748, 0.2194223552942276, 0.2815829813480377, 0.34374359250068665, 0.40590423345565796, 0.4680648446083069, 0.5302254557609558, 0.5923860669136047, 0.6545467376708984, 0.7167073488235474, 0.7788679599761963, 0.8410285711288452, 0.9031891822814941, 0.9653497934341431, 1.027510404586792, 1.089671015739441, 1.1518316268920898, 1.2139922380447388, 1.2761528491973877, 1.3383135795593262, 1.400474190711975, 1.462634801864624]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 7.0, 7.0, 8.0, 9.0, 14.0, 10.0, 9.0, 20.0, 25.0, 24.0, 22.0, 29.0, 23.0, 32.0, 43.0, 41.0, 51.0, 65.0, 78.0, 70.0, 50.0, 48.0, 35.0, 36.0, 38.0, 26.0, 31.0, 23.0, 17.0, 18.0, 14.0, 17.0, 8.0, 9.0, 12.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0125527381896973, -0.9771116971969604, -0.9416706562042236, -0.9062296152114868, -0.87078857421875, -0.8353475332260132, -0.7999064922332764, -0.7644654512405396, -0.7290244102478027, -0.6935833692550659, -0.6581423282623291, -0.6227012872695923, -0.5872602462768555, -0.5518192052841187, -0.5163781642913818, -0.48093709349632263, -0.4454960227012634, -0.4100549817085266, -0.3746139407157898, -0.339172899723053, -0.30373185873031616, -0.26829081773757935, -0.23284974694252014, -0.19740870594978333, -0.1619676649570465, -0.1265266239643097, -0.09108557552099228, -0.055644527077674866, -0.02020348608493805, 0.015237554907798767, 0.05067861080169678, 0.0861196517944336, 0.12156069278717041, 0.15700173377990723, 0.19244277477264404, 0.22788383066654205, 0.2633248567581177, 0.2987658977508545, 0.3342069685459137, 0.3696480095386505, 0.40508905053138733, 0.44053009152412415, 0.47597113251686096, 0.5114122033119202, 0.546853244304657, 0.5822942852973938, 0.6177353262901306, 0.6531763672828674, 0.6886174082756042, 0.7240584492683411, 0.7594994902610779, 0.7949405312538147, 0.8303815722465515, 0.8658226132392883, 0.9012637138366699, 0.9367047548294067, 0.9721457958221436, 1.0075868368148804, 1.0430278778076172, 1.078468918800354, 1.1139099597930908, 1.1493510007858276, 1.1847920417785645, 1.2202330827713013, 1.255674123764038]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 8.0, 5.0, 10.0, 9.0, 19.0, 17.0, 27.0, 37.0, 45.0, 85.0, 97.0, 148.0, 215.0, 294.0, 414.0, 738.0, 1231.0, 2574.0, 6562.0, 23199.0, 124371.0, 929319.0, 2398549.0, 596089.0, 82412.0, 16962.0, 5549.0, 2237.0, 1108.0, 656.0, 383.0, 267.0, 173.0, 141.0, 69.0, 79.0, 58.0, 24.0, 28.0, 22.0, 19.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08584308624267578, -0.08281898498535156, -0.07979488372802734, -0.07677078247070312, -0.0737466812133789, -0.07072257995605469, -0.06769847869873047, -0.06467437744140625, -0.06165027618408203, -0.05862617492675781, -0.055602073669433594, -0.052577972412109375, -0.049553871154785156, -0.04652976989746094, -0.04350566864013672, -0.0404815673828125, -0.03745746612548828, -0.03443336486816406, -0.031409263610839844, -0.028385162353515625, -0.025361061096191406, -0.022336959838867188, -0.01931285858154297, -0.01628875732421875, -0.013264656066894531, -0.010240554809570312, -0.007216453552246094, -0.004192352294921875, -0.0011682510375976562, 0.0018558502197265625, 0.004879951477050781, 0.007904052734375, 0.010928153991699219, 0.013952255249023438, 0.016976356506347656, 0.020000457763671875, 0.023024559020996094, 0.026048660278320312, 0.02907276153564453, 0.03209686279296875, 0.03512096405029297, 0.03814506530761719, 0.041169166564941406, 0.044193267822265625, 0.047217369079589844, 0.05024147033691406, 0.05326557159423828, 0.0562896728515625, 0.05931377410888672, 0.06233787536621094, 0.06536197662353516, 0.06838607788085938, 0.0714101791381836, 0.07443428039550781, 0.07745838165283203, 0.08048248291015625, 0.08350658416748047, 0.08653068542480469, 0.0895547866821289, 0.09257888793945312, 0.09560298919677734, 0.09862709045410156, 0.10165119171142578, 0.10467529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 12.0, 12.0, 12.0, 13.0, 21.0, 32.0, 28.0, 37.0, 37.0, 38.0, 57.0, 45.0, 45.0, 65.0, 55.0, 46.0, 61.0, 59.0, 57.0, 48.0, 37.0, 37.0, 29.0, 22.0, 23.0, 14.0, 16.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1190185546875, -0.11565780639648438, -0.11229705810546875, -0.10893630981445312, -0.1055755615234375, -0.10221481323242188, -0.09885406494140625, -0.09549331665039062, -0.092132568359375, -0.08877182006835938, -0.08541107177734375, -0.08205032348632812, -0.0786895751953125, -0.07532882690429688, -0.07196807861328125, -0.06860733032226562, -0.06524658203125, -0.061885833740234375, -0.05852508544921875, -0.055164337158203125, -0.0518035888671875, -0.048442840576171875, -0.04508209228515625, -0.041721343994140625, -0.038360595703125, -0.034999847412109375, -0.03163909912109375, -0.028278350830078125, -0.0249176025390625, -0.021556854248046875, -0.01819610595703125, -0.014835357666015625, -0.011474609375, -0.008113861083984375, -0.00475311279296875, -0.001392364501953125, 0.0019683837890625, 0.005329132080078125, 0.00868988037109375, 0.012050628662109375, 0.015411376953125, 0.018772125244140625, 0.02213287353515625, 0.025493621826171875, 0.0288543701171875, 0.032215118408203125, 0.03557586669921875, 0.038936614990234375, 0.04229736328125, 0.045658111572265625, 0.04901885986328125, 0.052379608154296875, 0.0557403564453125, 0.059101104736328125, 0.06246185302734375, 0.06582260131835938, 0.069183349609375, 0.07254409790039062, 0.07590484619140625, 0.07926559448242188, 0.0826263427734375, 0.08598709106445312, 0.08934783935546875, 0.09270858764648438, 0.0960693359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 19.0, 55.0, 138.0, 377.0, 1928.0, 114556.0, 4070438.0, 5687.0, 723.0, 205.0, 75.0, 34.0, 8.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7591476440429688, -0.7355804443359375, -0.7120132446289062, -0.688446044921875, -0.6648788452148438, -0.6413116455078125, -0.6177444458007812, -0.59417724609375, -0.5706100463867188, -0.5470428466796875, -0.5234756469726562, -0.499908447265625, -0.47634124755859375, -0.4527740478515625, -0.42920684814453125, -0.4056396484375, -0.38207244873046875, -0.3585052490234375, -0.33493804931640625, -0.311370849609375, -0.28780364990234375, -0.2642364501953125, -0.24066925048828125, -0.21710205078125, -0.19353485107421875, -0.1699676513671875, -0.14640045166015625, -0.122833251953125, -0.09926605224609375, -0.0756988525390625, -0.05213165283203125, -0.028564453125, -0.00499725341796875, 0.0185699462890625, 0.04213714599609375, 0.065704345703125, 0.08927154541015625, 0.1128387451171875, 0.13640594482421875, 0.15997314453125, 0.18354034423828125, 0.2071075439453125, 0.23067474365234375, 0.254241943359375, 0.27780914306640625, 0.3013763427734375, 0.32494354248046875, 0.3485107421875, 0.37207794189453125, 0.3956451416015625, 0.41921234130859375, 0.442779541015625, 0.46634674072265625, 0.4899139404296875, 0.5134811401367188, 0.53704833984375, 0.5606155395507812, 0.5841827392578125, 0.6077499389648438, 0.631317138671875, 0.6548843383789062, 0.6784515380859375, 0.7020187377929688, 0.7255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 16.0, 14.0, 17.0, 36.0, 88.0, 189.0, 503.0, 1222.0, 1184.0, 430.0, 189.0, 86.0, 39.0, 31.0, 8.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.42578125, -0.4156208038330078, -0.4054603576660156, -0.39529991149902344, -0.38513946533203125, -0.37497901916503906, -0.3648185729980469, -0.3546581268310547, -0.3444976806640625, -0.3343372344970703, -0.3241767883300781, -0.31401634216308594, -0.30385589599609375, -0.29369544982910156, -0.2835350036621094, -0.2733745574951172, -0.263214111328125, -0.2530536651611328, -0.24289321899414062, -0.23273277282714844, -0.22257232666015625, -0.21241188049316406, -0.20225143432617188, -0.1920909881591797, -0.1819305419921875, -0.1717700958251953, -0.16160964965820312, -0.15144920349121094, -0.14128875732421875, -0.13112831115722656, -0.12096786499023438, -0.11080741882324219, -0.10064697265625, -0.09048652648925781, -0.08032608032226562, -0.07016563415527344, -0.06000518798828125, -0.04984474182128906, -0.039684295654296875, -0.029523849487304688, -0.0193634033203125, -0.009202957153320312, 0.000957489013671875, 0.011117935180664062, 0.02127838134765625, 0.03143882751464844, 0.041599273681640625, 0.05175971984863281, 0.061920166015625, 0.07208061218261719, 0.08224105834960938, 0.09240150451660156, 0.10256195068359375, 0.11272239685058594, 0.12288284301757812, 0.1330432891845703, 0.1432037353515625, 0.1533641815185547, 0.16352462768554688, 0.17368507385253906, 0.18384552001953125, 0.19400596618652344, 0.20416641235351562, 0.2143268585205078, 0.2244873046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 17.0, 41.0, 61.0, 141.0, 210.0, 197.0, 141.0, 94.0, 41.0, 26.0, 9.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.719484806060791, -2.6601996421813965, -2.600914239883423, -2.5416290760040283, -2.482343912124634, -2.42305850982666, -2.3637733459472656, -2.304488182067871, -2.2452027797698975, -2.185917615890503, -2.1266322135925293, -2.0673470497131348, -2.0080618858337402, -1.9487764835357666, -1.889491319656372, -1.830206036567688, -1.7709208726882935, -1.7116355895996094, -1.6523504257202148, -1.5930651426315308, -1.5337798595428467, -1.4744946956634521, -1.415209412574768, -1.355924129486084, -1.2966389656066895, -1.2373536825180054, -1.1780685186386108, -1.1187832355499268, -1.0594979524612427, -1.0002126693725586, -0.9409275054931641, -0.88164222240448, -0.8223570585250854, -0.7630718350410461, -0.7037865519523621, -0.6445013284683228, -0.5852160453796387, -0.5259308218955994, -0.46664559841156006, -0.40736034512519836, -0.34807509183883667, -0.288789838552475, -0.22950460016727448, -0.17021936178207397, -0.11093410849571228, -0.051648855209350586, 0.007636368274688721, 0.06692162156105042, 0.1262068748474121, 0.1854921281337738, 0.2447773665189743, 0.3040626049041748, 0.3633478581905365, 0.4226331114768982, 0.4819183349609375, 0.5412036180496216, 0.6004888415336609, 0.6597740650177002, 0.7190593481063843, 0.7783445715904236, 0.8376297950744629, 0.896915078163147, 0.9562003016471863, 1.0154855251312256, 1.0747708082199097]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 3.0, 8.0, 12.0, 13.0, 14.0, 11.0, 25.0, 27.0, 19.0, 22.0, 28.0, 31.0, 35.0, 41.0, 51.0, 50.0, 44.0, 40.0, 37.0, 51.0, 44.0, 48.0, 40.0, 40.0, 34.0, 32.0, 28.0, 17.0, 27.0, 21.0, 18.0, 11.0, 18.0, 12.0, 17.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.8045223355293274, -0.7798269391059875, -0.7551315426826477, -0.7304361462593079, -0.7057408094406128, -0.681045413017273, -0.6563500165939331, -0.6316546201705933, -0.6069592237472534, -0.5822638273239136, -0.5575684309005737, -0.5328730344772339, -0.508177638053894, -0.4834822714328766, -0.45878690481185913, -0.4340915083885193, -0.40939611196517944, -0.3847007155418396, -0.36000531911849976, -0.3353099524974823, -0.31061455607414246, -0.2859191596508026, -0.26122379302978516, -0.2365283966064453, -0.21183300018310547, -0.18713760375976562, -0.16244222223758698, -0.13774684071540833, -0.11305144429206848, -0.08835605531930923, -0.06366066634654999, -0.03896528482437134, -0.014269888401031494, 0.010425500571727753, 0.035120889544487, 0.059816278517246246, 0.0845116674900055, 0.10920705646276474, 0.133902445435524, 0.15859782695770264, 0.18329322338104248, 0.20798861980438232, 0.23268400132656097, 0.2573793828487396, 0.28207477927207947, 0.3067701756954193, 0.33146554231643677, 0.3561609387397766, 0.38085633516311646, 0.4055517315864563, 0.43024712800979614, 0.4549424946308136, 0.47963789105415344, 0.5043332576751709, 0.5290286540985107, 0.5537240505218506, 0.5784194469451904, 0.6031148433685303, 0.6278102397918701, 0.65250563621521, 0.6772010326385498, 0.7018963694572449, 0.7265917658805847, 0.7512871623039246, 0.7759825587272644]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 12.0, 13.0, 19.0, 25.0, 38.0, 46.0, 81.0, 123.0, 199.0, 260.0, 424.0, 704.0, 1169.0, 1981.0, 3435.0, 6015.0, 11214.0, 21115.0, 41993.0, 82110.0, 161936.0, 259839.0, 216985.0, 116299.0, 58546.0, 29579.0, 15322.0, 8101.0, 4532.0, 2474.0, 1510.0, 917.0, 531.0, 320.0, 207.0, 154.0, 95.0, 71.0, 39.0, 42.0, 28.0, 10.0, 12.0, 7.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06895160675048828, -0.06655311584472656, -0.06415462493896484, -0.061756134033203125, -0.059357643127441406, -0.05695915222167969, -0.05456066131591797, -0.05216217041015625, -0.04976367950439453, -0.04736518859863281, -0.044966697692871094, -0.042568206787109375, -0.040169715881347656, -0.03777122497558594, -0.03537273406982422, -0.0329742431640625, -0.03057575225830078, -0.028177261352539062, -0.025778770446777344, -0.023380279541015625, -0.020981788635253906, -0.018583297729492188, -0.01618480682373047, -0.01378631591796875, -0.011387825012207031, -0.008989334106445312, -0.006590843200683594, -0.004192352294921875, -0.0017938613891601562, 0.0006046295166015625, 0.0030031204223632812, 0.005401611328125, 0.007800102233886719, 0.010198593139648438, 0.012597084045410156, 0.014995574951171875, 0.017394065856933594, 0.019792556762695312, 0.02219104766845703, 0.02458953857421875, 0.02698802947998047, 0.029386520385742188, 0.031785011291503906, 0.034183502197265625, 0.036581993103027344, 0.03898048400878906, 0.04137897491455078, 0.0437774658203125, 0.04617595672607422, 0.04857444763183594, 0.050972938537597656, 0.053371429443359375, 0.055769920349121094, 0.05816841125488281, 0.06056690216064453, 0.06296539306640625, 0.06536388397216797, 0.06776237487792969, 0.0701608657836914, 0.07255935668945312, 0.07495784759521484, 0.07735633850097656, 0.07975482940673828, 0.0821533203125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 13.0, 8.0, 17.0, 13.0, 13.0, 29.0, 26.0, 30.0, 35.0, 32.0, 50.0, 50.0, 49.0, 33.0, 59.0, 47.0, 58.0, 65.0, 53.0, 45.0, 47.0, 41.0, 39.0, 29.0, 24.0, 12.0, 17.0, 22.0, 6.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1192626953125, -0.11587905883789062, -0.11249542236328125, -0.10911178588867188, -0.1057281494140625, -0.10234451293945312, -0.09896087646484375, -0.09557723999023438, -0.092193603515625, -0.08880996704101562, -0.08542633056640625, -0.08204269409179688, -0.0786590576171875, -0.07527542114257812, -0.07189178466796875, -0.06850814819335938, -0.06512451171875, -0.061740875244140625, -0.05835723876953125, -0.054973602294921875, -0.0515899658203125, -0.048206329345703125, -0.04482269287109375, -0.041439056396484375, -0.038055419921875, -0.034671783447265625, -0.03128814697265625, -0.027904510498046875, -0.0245208740234375, -0.021137237548828125, -0.01775360107421875, -0.014369964599609375, -0.010986328125, -0.007602691650390625, -0.00421905517578125, -0.000835418701171875, 0.0025482177734375, 0.005931854248046875, 0.00931549072265625, 0.012699127197265625, 0.016082763671875, 0.019466400146484375, 0.02285003662109375, 0.026233673095703125, 0.0296173095703125, 0.033000946044921875, 0.03638458251953125, 0.039768218994140625, 0.04315185546875, 0.046535491943359375, 0.04991912841796875, 0.053302764892578125, 0.0566864013671875, 0.060070037841796875, 0.06345367431640625, 0.06683731079101562, 0.070220947265625, 0.07360458374023438, 0.07698822021484375, 0.08037185668945312, 0.0837554931640625, 0.08713912963867188, 0.09052276611328125, 0.09390640258789062, 0.0972900390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 8.0, 3.0, 10.0, 3.0, 10.0, 14.0, 17.0, 21.0, 51.0, 41.0, 73.0, 91.0, 128.0, 193.0, 274.0, 511.0, 991.0, 2297.0, 7997.0, 44482.0, 615634.0, 329124.0, 35348.0, 6860.0, 2087.0, 823.0, 493.0, 271.0, 213.0, 147.0, 82.0, 70.0, 49.0, 34.0, 24.0, 18.0, 10.0, 13.0, 10.0, 8.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.271240234375, -0.26274871826171875, -0.2542572021484375, -0.24576568603515625, -0.237274169921875, -0.22878265380859375, -0.2202911376953125, -0.21179962158203125, -0.20330810546875, -0.19481658935546875, -0.1863250732421875, -0.17783355712890625, -0.169342041015625, -0.16085052490234375, -0.1523590087890625, -0.14386749267578125, -0.1353759765625, -0.12688446044921875, -0.1183929443359375, -0.10990142822265625, -0.101409912109375, -0.09291839599609375, -0.0844268798828125, -0.07593536376953125, -0.06744384765625, -0.05895233154296875, -0.0504608154296875, -0.04196929931640625, -0.033477783203125, -0.02498626708984375, -0.0164947509765625, -0.00800323486328125, 0.00048828125, 0.00897979736328125, 0.0174713134765625, 0.02596282958984375, 0.034454345703125, 0.04294586181640625, 0.0514373779296875, 0.05992889404296875, 0.06842041015625, 0.07691192626953125, 0.0854034423828125, 0.09389495849609375, 0.102386474609375, 0.11087799072265625, 0.1193695068359375, 0.12786102294921875, 0.1363525390625, 0.14484405517578125, 0.1533355712890625, 0.16182708740234375, 0.170318603515625, 0.17881011962890625, 0.1873016357421875, 0.19579315185546875, 0.20428466796875, 0.21277618408203125, 0.2212677001953125, 0.22975921630859375, 0.238250732421875, 0.24674224853515625, 0.2552337646484375, 0.26372528076171875, 0.272216796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 6.0, 12.0, 16.0, 25.0, 14.0, 34.0, 43.0, 52.0, 49.0, 58.0, 69.0, 72.0, 71.0, 84.0, 76.0, 59.0, 51.0, 41.0, 34.0, 30.0, 27.0, 15.0, 13.0, 14.0, 6.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5081634521484375, -0.491424560546875, -0.4746856689453125, -0.45794677734375, -0.4412078857421875, -0.424468994140625, -0.4077301025390625, -0.3909912109375, -0.3742523193359375, -0.357513427734375, -0.3407745361328125, -0.32403564453125, -0.3072967529296875, -0.290557861328125, -0.2738189697265625, -0.257080078125, -0.2403411865234375, -0.223602294921875, -0.2068634033203125, -0.19012451171875, -0.1733856201171875, -0.156646728515625, -0.1399078369140625, -0.1231689453125, -0.1064300537109375, -0.089691162109375, -0.0729522705078125, -0.05621337890625, -0.0394744873046875, -0.022735595703125, -0.0059967041015625, 0.0107421875, 0.0274810791015625, 0.044219970703125, 0.0609588623046875, 0.07769775390625, 0.0944366455078125, 0.111175537109375, 0.1279144287109375, 0.1446533203125, 0.1613922119140625, 0.178131103515625, 0.1948699951171875, 0.21160888671875, 0.2283477783203125, 0.245086669921875, 0.2618255615234375, 0.278564453125, 0.2953033447265625, 0.312042236328125, 0.3287811279296875, 0.34552001953125, 0.3622589111328125, 0.378997802734375, 0.3957366943359375, 0.4124755859375, 0.4292144775390625, 0.445953369140625, 0.4626922607421875, 0.47943115234375, 0.4961700439453125, 0.512908935546875, 0.5296478271484375, 0.54638671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 7.0, 9.0, 7.0, 16.0, 27.0, 39.0, 59.0, 92.0, 140.0, 292.0, 561.0, 1199.0, 2931.0, 7671.0, 25654.0, 124552.0, 741216.0, 108153.0, 23538.0, 7302.0, 2706.0, 1162.0, 562.0, 281.0, 163.0, 86.0, 47.0, 24.0, 18.0, 18.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08954811096191406, -0.08687210083007812, -0.08419609069824219, -0.08152008056640625, -0.07884407043457031, -0.07616806030273438, -0.07349205017089844, -0.0708160400390625, -0.06814002990722656, -0.06546401977539062, -0.06278800964355469, -0.06011199951171875, -0.05743598937988281, -0.054759979248046875, -0.05208396911621094, -0.049407958984375, -0.04673194885253906, -0.044055938720703125, -0.04137992858886719, -0.03870391845703125, -0.03602790832519531, -0.033351898193359375, -0.030675888061523438, -0.0279998779296875, -0.025323867797851562, -0.022647857666015625, -0.019971847534179688, -0.01729583740234375, -0.014619827270507812, -0.011943817138671875, -0.009267807006835938, -0.006591796875, -0.0039157867431640625, -0.001239776611328125, 0.0014362335205078125, 0.00411224365234375, 0.0067882537841796875, 0.009464263916015625, 0.012140274047851562, 0.0148162841796875, 0.017492294311523438, 0.020168304443359375, 0.022844314575195312, 0.02552032470703125, 0.028196334838867188, 0.030872344970703125, 0.03354835510253906, 0.036224365234375, 0.03890037536621094, 0.041576385498046875, 0.04425239562988281, 0.04692840576171875, 0.04960441589355469, 0.052280426025390625, 0.05495643615722656, 0.0576324462890625, 0.06030845642089844, 0.06298446655273438, 0.06566047668457031, 0.06833648681640625, 0.07101249694824219, 0.07368850708007812, 0.07636451721191406, 0.07904052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 5.0, 16.0, 7.0, 15.0, 16.0, 24.0, 29.0, 36.0, 67.0, 92.0, 118.0, 117.0, 122.0, 83.0, 58.0, 46.0, 28.0, 26.0, 24.0, 8.0, 9.0, 8.0, 9.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1961669921875e-05, -4.074070602655411e-05, -3.9519742131233215e-05, -3.829877823591232e-05, -3.707781434059143e-05, -3.585685044527054e-05, -3.4635886549949646e-05, -3.3414922654628754e-05, -3.219395875930786e-05, -3.097299486398697e-05, -2.9752030968666077e-05, -2.8531067073345184e-05, -2.7310103178024292e-05, -2.60891392827034e-05, -2.4868175387382507e-05, -2.3647211492061615e-05, -2.2426247596740723e-05, -2.120528370141983e-05, -1.9984319806098938e-05, -1.8763355910778046e-05, -1.7542392015457153e-05, -1.632142812013626e-05, -1.5100464224815369e-05, -1.3879500329494476e-05, -1.2658536434173584e-05, -1.1437572538852692e-05, -1.02166086435318e-05, -8.995644748210907e-06, -7.774680852890015e-06, -6.553716957569122e-06, -5.33275306224823e-06, -4.111789166927338e-06, -2.8908252716064453e-06, -1.669861376285553e-06, -4.4889748096466064e-07, 7.720664143562317e-07, 1.993030309677124e-06, 3.2139942049980164e-06, 4.434958100318909e-06, 5.655921995639801e-06, 6.876885890960693e-06, 8.097849786281586e-06, 9.318813681602478e-06, 1.053977757692337e-05, 1.1760741472244263e-05, 1.2981705367565155e-05, 1.4202669262886047e-05, 1.542363315820694e-05, 1.6644597053527832e-05, 1.7865560948848724e-05, 1.9086524844169617e-05, 2.030748873949051e-05, 2.15284526348114e-05, 2.2749416530132294e-05, 2.3970380425453186e-05, 2.519134432077408e-05, 2.641230821609497e-05, 2.7633272111415863e-05, 2.8854236006736755e-05, 3.0075199902057648e-05, 3.129616379737854e-05, 3.251712769269943e-05, 3.3738091588020325e-05, 3.495905548334122e-05, 3.618001937866211e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 15.0, 16.0, 23.0, 34.0, 68.0, 102.0, 202.0, 394.0, 915.0, 2607.0, 9587.0, 62196.0, 792126.0, 155123.0, 18554.0, 4177.0, 1288.0, 552.0, 234.0, 118.0, 71.0, 44.0, 39.0, 21.0, 17.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14550399780273438, -0.14183807373046875, -0.13817214965820312, -0.1345062255859375, -0.13084030151367188, -0.12717437744140625, -0.12350845336914062, -0.119842529296875, -0.11617660522460938, -0.11251068115234375, -0.10884475708007812, -0.1051788330078125, -0.10151290893554688, -0.09784698486328125, -0.09418106079101562, -0.09051513671875, -0.08684921264648438, -0.08318328857421875, -0.07951736450195312, -0.0758514404296875, -0.07218551635742188, -0.06851959228515625, -0.06485366821289062, -0.061187744140625, -0.057521820068359375, -0.05385589599609375, -0.050189971923828125, -0.0465240478515625, -0.042858123779296875, -0.03919219970703125, -0.035526275634765625, -0.0318603515625, -0.028194427490234375, -0.02452850341796875, -0.020862579345703125, -0.0171966552734375, -0.013530731201171875, -0.00986480712890625, -0.006198883056640625, -0.002532958984375, 0.001132965087890625, 0.00479888916015625, 0.008464813232421875, 0.0121307373046875, 0.015796661376953125, 0.01946258544921875, 0.023128509521484375, 0.02679443359375, 0.030460357666015625, 0.03412628173828125, 0.037792205810546875, 0.0414581298828125, 0.045124053955078125, 0.04878997802734375, 0.052455902099609375, 0.056121826171875, 0.059787750244140625, 0.06345367431640625, 0.06711959838867188, 0.0707855224609375, 0.07445144653320312, 0.07811737060546875, 0.08178329467773438, 0.08544921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 9.0, 2.0, 8.0, 6.0, 8.0, 9.0, 18.0, 20.0, 22.0, 31.0, 51.0, 57.0, 81.0, 106.0, 120.0, 103.0, 101.0, 53.0, 37.0, 40.0, 22.0, 22.0, 17.0, 22.0, 15.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.128173828125, -0.12515735626220703, -0.12214088439941406, -0.1191244125366211, -0.11610794067382812, -0.11309146881103516, -0.11007499694824219, -0.10705852508544922, -0.10404205322265625, -0.10102558135986328, -0.09800910949707031, -0.09499263763427734, -0.09197616577148438, -0.0889596939086914, -0.08594322204589844, -0.08292675018310547, -0.0799102783203125, -0.07689380645751953, -0.07387733459472656, -0.0708608627319336, -0.06784439086914062, -0.06482791900634766, -0.06181144714355469, -0.05879497528076172, -0.05577850341796875, -0.05276203155517578, -0.04974555969238281, -0.046729087829589844, -0.043712615966796875, -0.040696144104003906, -0.03767967224121094, -0.03466320037841797, -0.031646728515625, -0.02863025665283203, -0.025613784790039062, -0.022597312927246094, -0.019580841064453125, -0.016564369201660156, -0.013547897338867188, -0.010531425476074219, -0.00751495361328125, -0.004498481750488281, -0.0014820098876953125, 0.0015344619750976562, 0.004550933837890625, 0.007567405700683594, 0.010583877563476562, 0.013600349426269531, 0.0166168212890625, 0.01963329315185547, 0.022649765014648438, 0.025666236877441406, 0.028682708740234375, 0.031699180603027344, 0.03471565246582031, 0.03773212432861328, 0.04074859619140625, 0.04376506805419922, 0.04678153991699219, 0.049798011779785156, 0.052814483642578125, 0.055830955505371094, 0.05884742736816406, 0.06186389923095703, 0.06488037109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 19.0, 32.0, 52.0, 107.0, 148.0, 301.0, 117.0, 75.0, 45.0, 33.0, 17.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1613118648529053, -2.1052229404449463, -2.0491340160369873, -1.9930450916290283, -1.9369560480117798, -1.8808671236038208, -1.8247781991958618, -1.7686892747879028, -1.7126003503799438, -1.6565114259719849, -1.6004225015640259, -1.5443334579467773, -1.4882445335388184, -1.4321556091308594, -1.3760666847229004, -1.3199777603149414, -1.2638888359069824, -1.2077999114990234, -1.1517109870910645, -1.0956220626831055, -1.039533019065857, -0.983444094657898, -0.927355170249939, -0.87126624584198, -0.8151772022247314, -0.7590882778167725, -0.7029992938041687, -0.6469103693962097, -0.5908214449882507, -0.534732460975647, -0.478643536567688, -0.422554612159729, -0.36646568775177, -0.31037673354148865, -0.25428780913352966, -0.1981988549232483, -0.1421099156141281, -0.08602097630500793, -0.029932022094726562, 0.026156902313232422, 0.0822458565235138, 0.13833479583263397, 0.19442373514175415, 0.2505126893520355, 0.3066016435623169, 0.3626905679702759, 0.41877952218055725, 0.47486844658851624, 0.5309574007987976, 0.5870463252067566, 0.6431353092193604, 0.6992242336273193, 0.7553131580352783, 0.8114020824432373, 0.8674910664558411, 0.9235799908638, 0.9796689748764038, 1.0357578992843628, 1.0918468236923218, 1.1479358673095703, 1.2040247917175293, 1.2601137161254883, 1.3162026405334473, 1.3722915649414062, 1.4283804893493652]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 9.0, 14.0, 14.0, 10.0, 14.0, 17.0, 14.0, 23.0, 23.0, 29.0, 20.0, 30.0, 36.0, 43.0, 69.0, 103.0, 101.0, 72.0, 46.0, 42.0, 29.0, 29.0, 29.0, 19.0, 20.0, 14.0, 15.0, 18.0, 10.0, 10.0, 7.0, 4.0, 6.0, 7.0, 8.0, 2.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3526108264923096, -1.3089009523391724, -1.2651911973953247, -1.2214813232421875, -1.1777715682983398, -1.1340616941452026, -1.0903518199920654, -1.0466420650482178, -1.0029321908950806, -0.9592223763465881, -0.9155125617980957, -0.8718026876449585, -0.8280928730964661, -0.7843830585479736, -0.7406731843948364, -0.696963369846344, -0.6532535552978516, -0.6095437407493591, -0.5658339262008667, -0.5221240520477295, -0.47841423749923706, -0.43470442295074463, -0.3909945785999298, -0.347284734249115, -0.30357491970062256, -0.2598651051521301, -0.2161552608013153, -0.17244543135166168, -0.12873560190200806, -0.08502577245235443, -0.041315943002700806, 0.0023939013481140137, 0.046103835105895996, 0.08981366455554962, 0.13352349400520325, 0.17723332345485687, 0.2209431529045105, 0.26465296745300293, 0.30836281180381775, 0.35207265615463257, 0.395782470703125, 0.43949228525161743, 0.48320212960243225, 0.5269119739532471, 0.5706217885017395, 0.6143316030502319, 0.6580414772033691, 0.7017512917518616, 0.745461106300354, 0.7891709208488464, 0.8328807353973389, 0.8765906095504761, 0.9203004240989685, 0.9640102386474609, 1.0077201128005981, 1.0514299869537354, 1.095139741897583, 1.1388496160507202, 1.1825593709945679, 1.226269245147705, 1.2699790000915527, 1.31368887424469, 1.3573987483978271, 1.4011085033416748, 1.444818377494812]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 15.0, 14.0, 19.0, 23.0, 29.0, 43.0, 41.0, 53.0, 70.0, 109.0, 182.0, 299.0, 605.0, 1388.0, 4393.0, 25314.0, 392459.0, 3037558.0, 679716.0, 42491.0, 6054.0, 1780.0, 688.0, 286.0, 183.0, 92.0, 71.0, 54.0, 55.0, 41.0, 35.0, 33.0, 19.0, 17.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14861106872558594, -0.14341354370117188, -0.1382160186767578, -0.13301849365234375, -0.1278209686279297, -0.12262344360351562, -0.11742591857910156, -0.1122283935546875, -0.10703086853027344, -0.10183334350585938, -0.09663581848144531, -0.09143829345703125, -0.08624076843261719, -0.08104324340820312, -0.07584571838378906, -0.070648193359375, -0.06545066833496094, -0.060253143310546875, -0.05505561828613281, -0.04985809326171875, -0.04466056823730469, -0.039463043212890625, -0.03426551818847656, -0.0290679931640625, -0.023870468139648438, -0.018672943115234375, -0.013475418090820312, -0.00827789306640625, -0.0030803680419921875, 0.002117156982421875, 0.0073146820068359375, 0.01251220703125, 0.017709732055664062, 0.022907257080078125, 0.028104782104492188, 0.03330230712890625, 0.03849983215332031, 0.043697357177734375, 0.04889488220214844, 0.0540924072265625, 0.05928993225097656, 0.06448745727539062, 0.06968498229980469, 0.07488250732421875, 0.08008003234863281, 0.08527755737304688, 0.09047508239746094, 0.095672607421875, 0.10087013244628906, 0.10606765747070312, 0.11126518249511719, 0.11646270751953125, 0.12166023254394531, 0.12685775756835938, 0.13205528259277344, 0.1372528076171875, 0.14245033264160156, 0.14764785766601562, 0.1528453826904297, 0.15804290771484375, 0.1632404327392578, 0.16843795776367188, 0.17363548278808594, 0.1788330078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 8.0, 8.0, 4.0, 12.0, 14.0, 13.0, 22.0, 26.0, 24.0, 38.0, 37.0, 38.0, 47.0, 30.0, 59.0, 46.0, 42.0, 56.0, 39.0, 55.0, 60.0, 42.0, 35.0, 42.0, 40.0, 35.0, 19.0, 20.0, 20.0, 18.0, 11.0, 9.0, 6.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11773681640625, -0.11440181732177734, -0.11106681823730469, -0.10773181915283203, -0.10439682006835938, -0.10106182098388672, -0.09772682189941406, -0.0943918228149414, -0.09105682373046875, -0.0877218246459961, -0.08438682556152344, -0.08105182647705078, -0.07771682739257812, -0.07438182830810547, -0.07104682922363281, -0.06771183013916016, -0.0643768310546875, -0.061041831970214844, -0.05770683288574219, -0.05437183380126953, -0.051036834716796875, -0.04770183563232422, -0.04436683654785156, -0.041031837463378906, -0.03769683837890625, -0.034361839294433594, -0.031026840209960938, -0.02769184112548828, -0.024356842041015625, -0.02102184295654297, -0.017686843872070312, -0.014351844787597656, -0.011016845703125, -0.007681846618652344, -0.0043468475341796875, -0.0010118484497070312, 0.002323150634765625, 0.005658149719238281, 0.008993148803710938, 0.012328147888183594, 0.01566314697265625, 0.018998146057128906, 0.022333145141601562, 0.02566814422607422, 0.029003143310546875, 0.03233814239501953, 0.03567314147949219, 0.039008140563964844, 0.0423431396484375, 0.045678138732910156, 0.04901313781738281, 0.05234813690185547, 0.055683135986328125, 0.05901813507080078, 0.06235313415527344, 0.0656881332397461, 0.06902313232421875, 0.0723581314086914, 0.07569313049316406, 0.07902812957763672, 0.08236312866210938, 0.08569812774658203, 0.08903312683105469, 0.09236812591552734, 0.095703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 14.0, 24.0, 36.0, 67.0, 128.0, 255.0, 738.0, 2635.0, 32149.0, 3936723.0, 213263.0, 6369.0, 1098.0, 374.0, 188.0, 75.0, 45.0, 30.0, 15.0, 13.0, 2.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.49018096923828125, -0.4764556884765625, -0.46273040771484375, -0.449005126953125, -0.43527984619140625, -0.4215545654296875, -0.40782928466796875, -0.39410400390625, -0.38037872314453125, -0.3666534423828125, -0.35292816162109375, -0.339202880859375, -0.32547760009765625, -0.3117523193359375, -0.29802703857421875, -0.2843017578125, -0.27057647705078125, -0.2568511962890625, -0.24312591552734375, -0.229400634765625, -0.21567535400390625, -0.2019500732421875, -0.18822479248046875, -0.17449951171875, -0.16077423095703125, -0.1470489501953125, -0.13332366943359375, -0.119598388671875, -0.10587310791015625, -0.0921478271484375, -0.07842254638671875, -0.064697265625, -0.05097198486328125, -0.0372467041015625, -0.02352142333984375, -0.009796142578125, 0.00392913818359375, 0.0176544189453125, 0.03137969970703125, 0.04510498046875, 0.05883026123046875, 0.0725555419921875, 0.08628082275390625, 0.100006103515625, 0.11373138427734375, 0.1274566650390625, 0.14118194580078125, 0.1549072265625, 0.16863250732421875, 0.1823577880859375, 0.19608306884765625, 0.209808349609375, 0.22353363037109375, 0.2372589111328125, 0.25098419189453125, 0.26470947265625, 0.27843475341796875, 0.2921600341796875, 0.30588531494140625, 0.319610595703125, 0.33333587646484375, 0.3470611572265625, 0.36078643798828125, 0.37451171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 4.0, 19.0, 25.0, 30.0, 38.0, 69.0, 103.0, 178.0, 336.0, 640.0, 892.0, 728.0, 420.0, 248.0, 114.0, 79.0, 49.0, 24.0, 21.0, 14.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2020263671875, -0.19414329528808594, -0.18626022338867188, -0.1783771514892578, -0.17049407958984375, -0.1626110076904297, -0.15472793579101562, -0.14684486389160156, -0.1389617919921875, -0.13107872009277344, -0.12319564819335938, -0.11531257629394531, -0.10742950439453125, -0.09954643249511719, -0.09166336059570312, -0.08378028869628906, -0.075897216796875, -0.06801414489746094, -0.060131072998046875, -0.05224800109863281, -0.04436492919921875, -0.03648185729980469, -0.028598785400390625, -0.020715713500976562, -0.0128326416015625, -0.0049495697021484375, 0.002933502197265625, 0.010816574096679688, 0.01869964599609375, 0.026582717895507812, 0.034465789794921875, 0.04234886169433594, 0.05023193359375, 0.05811500549316406, 0.06599807739257812, 0.07388114929199219, 0.08176422119140625, 0.08964729309082031, 0.09753036499023438, 0.10541343688964844, 0.1132965087890625, 0.12117958068847656, 0.12906265258789062, 0.1369457244873047, 0.14482879638671875, 0.1527118682861328, 0.16059494018554688, 0.16847801208496094, 0.176361083984375, 0.18424415588378906, 0.19212722778320312, 0.2000102996826172, 0.20789337158203125, 0.2157764434814453, 0.22365951538085938, 0.23154258728027344, 0.2394256591796875, 0.24730873107910156, 0.2551918029785156, 0.2630748748779297, 0.27095794677734375, 0.2788410186767578, 0.2867240905761719, 0.29460716247558594, 0.302490234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 13.0, 34.0, 64.0, 223.0, 317.0, 208.0, 98.0, 18.0, 14.0, 8.0, 4.0, 2.0], "bins": [-5.664047718048096, -5.56368350982666, -5.463318824768066, -5.362954616546631, -5.262590408325195, -5.162225723266602, -5.061861515045166, -4.9614973068237305, -4.861132621765137, -4.760768413543701, -4.660403728485107, -4.560039520263672, -4.459675312042236, -4.359310626983643, -4.258946418762207, -4.158581733703613, -4.058217525482178, -3.957853078842163, -3.8574888706207275, -3.757124423980713, -3.6567599773406982, -3.5563955307006836, -3.456031322479248, -3.3556668758392334, -3.255302667617798, -3.154938220977783, -3.0545740127563477, -2.954209566116333, -2.8538451194763184, -2.753480911254883, -2.653116464614868, -2.5527520179748535, -2.4523873329162598, -2.352022886276245, -2.2516586780548096, -2.151294231414795, -2.0509297847747803, -1.9505654573440552, -1.85020112991333, -1.7498366832733154, -1.6494724750518799, -1.5491081476211548, -1.4487437009811401, -1.348379373550415, -1.2480149269104004, -1.1476505994796753, -1.0472862720489502, -0.9469218254089355, -0.8465573787689209, -0.746192991733551, -0.6458286046981812, -0.545464277267456, -0.4450998604297638, -0.3447355031967163, -0.24437111616134644, -0.14400672912597656, -0.04364234209060669, 0.05672203749418259, 0.15708641707897186, 0.25745078921318054, 0.3578151762485504, 0.4581795334815979, 0.5585439205169678, 0.6589083075523376, 0.7592726945877075]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 8.0, 9.0, 5.0, 8.0, 11.0, 13.0, 20.0, 32.0, 24.0, 23.0, 27.0, 41.0, 36.0, 40.0, 41.0, 58.0, 66.0, 58.0, 52.0, 60.0, 46.0, 53.0, 30.0, 40.0, 38.0, 22.0, 29.0, 22.0, 16.0, 16.0, 13.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8728641867637634, -0.8426277041435242, -0.8123912215232849, -0.7821547985076904, -0.7519183158874512, -0.7216818332672119, -0.6914453506469727, -0.6612088680267334, -0.6309723854064941, -0.6007359027862549, -0.5704994201660156, -0.5402629375457764, -0.5100265145301819, -0.4797900319099426, -0.44955354928970337, -0.4193170666694641, -0.38908064365386963, -0.35884416103363037, -0.3286077082157135, -0.29837122559547424, -0.2681347727775574, -0.23789829015731812, -0.20766180753707886, -0.1774253398180008, -0.14718887209892273, -0.11695240437984467, -0.086715929210186, -0.056479454040527344, -0.02624298632144928, 0.003993481397628784, 0.03422996401786804, 0.0644664317369461, 0.0947028398513794, 0.12493930757045746, 0.15517577528953552, 0.18541225790977478, 0.21564872562885284, 0.2458851933479309, 0.27612167596817017, 0.3063581585884094, 0.3365946114063263, 0.36683109402656555, 0.3970675468444824, 0.4273040294647217, 0.45754051208496094, 0.4877769649028778, 0.5180134773254395, 0.5482499003410339, 0.5784863829612732, 0.6087228655815125, 0.6389593482017517, 0.6691957712173462, 0.6994322538375854, 0.7296687364578247, 0.759905219078064, 0.7901417016983032, 0.8203781843185425, 0.8506146669387817, 0.880851149559021, 0.9110876321792603, 0.9413240551948547, 0.971560537815094, 1.0017969608306885, 1.0320334434509277, 1.062269926071167]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 8.0, 12.0, 13.0, 20.0, 34.0, 42.0, 72.0, 113.0, 180.0, 295.0, 442.0, 801.0, 1307.0, 2262.0, 3975.0, 7678.0, 15827.0, 35103.0, 83079.0, 219813.0, 369613.0, 180276.0, 69035.0, 29699.0, 13546.0, 6869.0, 3565.0, 1871.0, 1169.0, 667.0, 408.0, 279.0, 155.0, 119.0, 60.0, 53.0, 25.0, 19.0, 21.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12261962890625, -0.1187143325805664, -0.11480903625488281, -0.11090373992919922, -0.10699844360351562, -0.10309314727783203, -0.09918785095214844, -0.09528255462646484, -0.09137725830078125, -0.08747196197509766, -0.08356666564941406, -0.07966136932373047, -0.07575607299804688, -0.07185077667236328, -0.06794548034667969, -0.0640401840209961, -0.0601348876953125, -0.056229591369628906, -0.05232429504394531, -0.04841899871826172, -0.044513702392578125, -0.04060840606689453, -0.03670310974121094, -0.032797813415527344, -0.02889251708984375, -0.024987220764160156, -0.021081924438476562, -0.01717662811279297, -0.013271331787109375, -0.009366035461425781, -0.0054607391357421875, -0.0015554428100585938, 0.002349853515625, 0.006255149841308594, 0.010160446166992188, 0.014065742492675781, 0.017971038818359375, 0.02187633514404297, 0.025781631469726562, 0.029686927795410156, 0.03359222412109375, 0.037497520446777344, 0.04140281677246094, 0.04530811309814453, 0.049213409423828125, 0.05311870574951172, 0.05702400207519531, 0.060929298400878906, 0.0648345947265625, 0.0687398910522461, 0.07264518737792969, 0.07655048370361328, 0.08045578002929688, 0.08436107635498047, 0.08826637268066406, 0.09217166900634766, 0.09607696533203125, 0.09998226165771484, 0.10388755798339844, 0.10779285430908203, 0.11169815063476562, 0.11560344696044922, 0.11950874328613281, 0.1234140396118164, 0.1273193359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 16.0, 12.0, 10.0, 22.0, 21.0, 18.0, 27.0, 29.0, 38.0, 40.0, 53.0, 44.0, 47.0, 62.0, 24.0, 52.0, 38.0, 56.0, 51.0, 47.0, 37.0, 27.0, 29.0, 34.0, 22.0, 24.0, 19.0, 15.0, 19.0, 11.0, 12.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.11328125, -0.11006927490234375, -0.1068572998046875, -0.10364532470703125, -0.100433349609375, -0.09722137451171875, -0.0940093994140625, -0.09079742431640625, -0.08758544921875, -0.08437347412109375, -0.0811614990234375, -0.07794952392578125, -0.074737548828125, -0.07152557373046875, -0.0683135986328125, -0.06510162353515625, -0.0618896484375, -0.05867767333984375, -0.0554656982421875, -0.05225372314453125, -0.049041748046875, -0.04582977294921875, -0.0426177978515625, -0.03940582275390625, -0.03619384765625, -0.03298187255859375, -0.0297698974609375, -0.02655792236328125, -0.023345947265625, -0.02013397216796875, -0.0169219970703125, -0.01371002197265625, -0.010498046875, -0.00728607177734375, -0.0040740966796875, -0.00086212158203125, 0.002349853515625, 0.00556182861328125, 0.0087738037109375, 0.01198577880859375, 0.01519775390625, 0.01840972900390625, 0.0216217041015625, 0.02483367919921875, 0.028045654296875, 0.03125762939453125, 0.0344696044921875, 0.03768157958984375, 0.0408935546875, 0.04410552978515625, 0.0473175048828125, 0.05052947998046875, 0.053741455078125, 0.05695343017578125, 0.0601654052734375, 0.06337738037109375, 0.06658935546875, 0.06980133056640625, 0.0730133056640625, 0.07622528076171875, 0.079437255859375, 0.08264923095703125, 0.0858612060546875, 0.08907318115234375, 0.09228515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 16.0, 17.0, 17.0, 35.0, 40.0, 80.0, 102.0, 131.0, 290.0, 475.0, 943.0, 2185.0, 10887.0, 338912.0, 677141.0, 12686.0, 2350.0, 990.0, 469.0, 277.0, 177.0, 109.0, 68.0, 44.0, 26.0, 26.0, 15.0, 12.0, 11.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448974609375, -0.4345054626464844, -0.42003631591796875, -0.4055671691894531, -0.3910980224609375, -0.3766288757324219, -0.36215972900390625, -0.3476905822753906, -0.333221435546875, -0.3187522888183594, -0.30428314208984375, -0.2898139953613281, -0.2753448486328125, -0.2608757019042969, -0.24640655517578125, -0.23193740844726562, -0.21746826171875, -0.20299911499023438, -0.18852996826171875, -0.17406082153320312, -0.1595916748046875, -0.14512252807617188, -0.13065338134765625, -0.11618423461914062, -0.101715087890625, -0.08724594116210938, -0.07277679443359375, -0.058307647705078125, -0.0438385009765625, -0.029369354248046875, -0.01490020751953125, -0.000431060791015625, 0.0140380859375, 0.028507232666015625, 0.04297637939453125, 0.057445526123046875, 0.0719146728515625, 0.08638381958007812, 0.10085296630859375, 0.11532211303710938, 0.129791259765625, 0.14426040649414062, 0.15872955322265625, 0.17319869995117188, 0.1876678466796875, 0.20213699340820312, 0.21660614013671875, 0.23107528686523438, 0.24554443359375, 0.2600135803222656, 0.27448272705078125, 0.2889518737792969, 0.3034210205078125, 0.3178901672363281, 0.33235931396484375, 0.3468284606933594, 0.361297607421875, 0.3757667541503906, 0.39023590087890625, 0.4047050476074219, 0.4191741943359375, 0.4336433410644531, 0.44811248779296875, 0.4625816345214844, 0.47705078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 4.0, 5.0, 10.0, 18.0, 20.0, 22.0, 36.0, 40.0, 55.0, 57.0, 62.0, 86.0, 64.0, 79.0, 81.0, 62.0, 60.0, 47.0, 51.0, 27.0, 24.0, 17.0, 14.0, 15.0, 7.0, 3.0, 5.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5628204345703125, -0.547027587890625, -0.5312347412109375, -0.51544189453125, -0.4996490478515625, -0.483856201171875, -0.4680633544921875, -0.4522705078125, -0.4364776611328125, -0.420684814453125, -0.4048919677734375, -0.38909912109375, -0.3733062744140625, -0.357513427734375, -0.3417205810546875, -0.325927734375, -0.3101348876953125, -0.294342041015625, -0.2785491943359375, -0.26275634765625, -0.2469635009765625, -0.231170654296875, -0.2153778076171875, -0.1995849609375, -0.1837921142578125, -0.167999267578125, -0.1522064208984375, -0.13641357421875, -0.1206207275390625, -0.104827880859375, -0.0890350341796875, -0.0732421875, -0.0574493408203125, -0.041656494140625, -0.0258636474609375, -0.01007080078125, 0.0057220458984375, 0.021514892578125, 0.0373077392578125, 0.0531005859375, 0.0688934326171875, 0.084686279296875, 0.1004791259765625, 0.11627197265625, 0.1320648193359375, 0.147857666015625, 0.1636505126953125, 0.179443359375, 0.1952362060546875, 0.211029052734375, 0.2268218994140625, 0.24261474609375, 0.2584075927734375, 0.274200439453125, 0.2899932861328125, 0.3057861328125, 0.3215789794921875, 0.337371826171875, 0.3531646728515625, 0.36895751953125, 0.3847503662109375, 0.400543212890625, 0.4163360595703125, 0.43212890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 12.0, 20.0, 36.0, 60.0, 91.0, 147.0, 319.0, 710.0, 2046.0, 7701.0, 43152.0, 768306.0, 198129.0, 20833.0, 4462.0, 1366.0, 518.0, 227.0, 140.0, 76.0, 49.0, 24.0, 15.0, 14.0, 11.0, 14.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08660888671875, -0.08388614654541016, -0.08116340637207031, -0.07844066619873047, -0.07571792602539062, -0.07299518585205078, -0.07027244567871094, -0.0675497055053711, -0.06482696533203125, -0.062104225158691406, -0.05938148498535156, -0.05665874481201172, -0.053936004638671875, -0.05121326446533203, -0.04849052429199219, -0.045767784118652344, -0.0430450439453125, -0.040322303771972656, -0.03759956359863281, -0.03487682342529297, -0.032154083251953125, -0.02943134307861328, -0.026708602905273438, -0.023985862731933594, -0.02126312255859375, -0.018540382385253906, -0.015817642211914062, -0.013094902038574219, -0.010372161865234375, -0.007649421691894531, -0.0049266815185546875, -0.0022039413452148438, 0.000518798828125, 0.0032415390014648438, 0.0059642791748046875, 0.008687019348144531, 0.011409759521484375, 0.014132499694824219, 0.016855239868164062, 0.019577980041503906, 0.02230072021484375, 0.025023460388183594, 0.027746200561523438, 0.03046894073486328, 0.033191680908203125, 0.03591442108154297, 0.03863716125488281, 0.041359901428222656, 0.0440826416015625, 0.046805381774902344, 0.04952812194824219, 0.05225086212158203, 0.054973602294921875, 0.05769634246826172, 0.06041908264160156, 0.0631418228149414, 0.06586456298828125, 0.0685873031616211, 0.07131004333496094, 0.07403278350830078, 0.07675552368164062, 0.07947826385498047, 0.08220100402832031, 0.08492374420166016, 0.087646484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 8.0, 2.0, 3.0, 8.0, 11.0, 10.0, 16.0, 22.0, 16.0, 16.0, 30.0, 27.0, 39.0, 55.0, 71.0, 79.0, 86.0, 89.0, 80.0, 65.0, 46.0, 53.0, 33.0, 24.0, 23.0, 16.0, 21.0, 9.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9981136322021484e-05, -2.9012560844421387e-05, -2.804398536682129e-05, -2.707540988922119e-05, -2.6106834411621094e-05, -2.5138258934020996e-05, -2.41696834564209e-05, -2.32011079788208e-05, -2.2232532501220703e-05, -2.1263957023620605e-05, -2.0295381546020508e-05, -1.932680606842041e-05, -1.8358230590820312e-05, -1.7389655113220215e-05, -1.6421079635620117e-05, -1.545250415802002e-05, -1.4483928680419922e-05, -1.3515353202819824e-05, -1.2546777725219727e-05, -1.1578202247619629e-05, -1.0609626770019531e-05, -9.641051292419434e-06, -8.672475814819336e-06, -7.703900337219238e-06, -6.735324859619141e-06, -5.766749382019043e-06, -4.798173904418945e-06, -3.829598426818848e-06, -2.86102294921875e-06, -1.8924474716186523e-06, -9.238719940185547e-07, 4.470348358154297e-08, 1.0132789611816406e-06, 1.9818544387817383e-06, 2.950429916381836e-06, 3.919005393981934e-06, 4.887580871582031e-06, 5.856156349182129e-06, 6.8247318267822266e-06, 7.793307304382324e-06, 8.761882781982422e-06, 9.73045825958252e-06, 1.0699033737182617e-05, 1.1667609214782715e-05, 1.2636184692382812e-05, 1.360476016998291e-05, 1.4573335647583008e-05, 1.5541911125183105e-05, 1.6510486602783203e-05, 1.74790620803833e-05, 1.84476375579834e-05, 1.9416213035583496e-05, 2.0384788513183594e-05, 2.135336399078369e-05, 2.232193946838379e-05, 2.3290514945983887e-05, 2.4259090423583984e-05, 2.5227665901184082e-05, 2.619624137878418e-05, 2.7164816856384277e-05, 2.8133392333984375e-05, 2.9101967811584473e-05, 3.007054328918457e-05, 3.103911876678467e-05, 3.2007694244384766e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 15.0, 9.0, 25.0, 38.0, 44.0, 81.0, 131.0, 173.0, 367.0, 691.0, 1622.0, 4513.0, 17840.0, 122369.0, 790389.0, 89436.0, 14170.0, 3755.0, 1369.0, 642.0, 328.0, 173.0, 111.0, 70.0, 44.0, 40.0, 29.0, 22.0, 9.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06609535217285156, -0.06377029418945312, -0.06144523620605469, -0.05912017822265625, -0.05679512023925781, -0.054470062255859375, -0.05214500427246094, -0.0498199462890625, -0.04749488830566406, -0.045169830322265625, -0.04284477233886719, -0.04051971435546875, -0.03819465637207031, -0.035869598388671875, -0.03354454040527344, -0.031219482421875, -0.028894424438476562, -0.026569366455078125, -0.024244308471679688, -0.02191925048828125, -0.019594192504882812, -0.017269134521484375, -0.014944076538085938, -0.0126190185546875, -0.010293960571289062, -0.007968902587890625, -0.0056438446044921875, -0.00331878662109375, -0.0009937286376953125, 0.001331329345703125, 0.0036563873291015625, 0.0059814453125, 0.008306503295898438, 0.010631561279296875, 0.012956619262695312, 0.01528167724609375, 0.017606735229492188, 0.019931793212890625, 0.022256851196289062, 0.0245819091796875, 0.026906967163085938, 0.029232025146484375, 0.03155708312988281, 0.03388214111328125, 0.03620719909667969, 0.038532257080078125, 0.04085731506347656, 0.043182373046875, 0.04550743103027344, 0.047832489013671875, 0.05015754699707031, 0.05248260498046875, 0.05480766296386719, 0.057132720947265625, 0.05945777893066406, 0.0617828369140625, 0.06410789489746094, 0.06643295288085938, 0.06875801086425781, 0.07108306884765625, 0.07340812683105469, 0.07573318481445312, 0.07805824279785156, 0.08038330078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 8.0, 15.0, 14.0, 15.0, 29.0, 19.0, 40.0, 57.0, 84.0, 150.0, 127.0, 115.0, 87.0, 61.0, 54.0, 27.0, 32.0, 17.0, 7.0, 14.0, 7.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.062419891357421875, -0.05977630615234375, -0.057132720947265625, -0.0544891357421875, -0.051845550537109375, -0.04920196533203125, -0.046558380126953125, -0.043914794921875, -0.041271209716796875, -0.03862762451171875, -0.035984039306640625, -0.0333404541015625, -0.030696868896484375, -0.02805328369140625, -0.025409698486328125, -0.02276611328125, -0.020122528076171875, -0.01747894287109375, -0.014835357666015625, -0.0121917724609375, -0.009548187255859375, -0.00690460205078125, -0.004261016845703125, -0.001617431640625, 0.001026153564453125, 0.00366973876953125, 0.006313323974609375, 0.0089569091796875, 0.011600494384765625, 0.01424407958984375, 0.016887664794921875, 0.01953125, 0.022174835205078125, 0.02481842041015625, 0.027462005615234375, 0.0301055908203125, 0.032749176025390625, 0.03539276123046875, 0.038036346435546875, 0.040679931640625, 0.043323516845703125, 0.04596710205078125, 0.048610687255859375, 0.0512542724609375, 0.053897857666015625, 0.05654144287109375, 0.059185028076171875, 0.06182861328125, 0.06447219848632812, 0.06711578369140625, 0.06975936889648438, 0.0724029541015625, 0.07504653930664062, 0.07769012451171875, 0.08033370971679688, 0.082977294921875, 0.08562088012695312, 0.08826446533203125, 0.09090805053710938, 0.0935516357421875, 0.09619522094726562, 0.09883880615234375, 0.10148239135742188, 0.1041259765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 10.0, 15.0, 38.0, 113.0, 307.0, 385.0, 91.0, 30.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8249331712722778, -1.7238578796386719, -1.6227824687957764, -1.5217071771621704, -1.4206318855285645, -1.319556474685669, -1.218481183052063, -1.117405891418457, -1.0163304805755615, -0.9152551293373108, -0.8141798377037048, -0.7131044864654541, -0.6120291948318481, -0.5109538435935974, -0.4098784923553467, -0.3088032007217407, -0.20772790908813477, -0.10665258020162582, -0.005577251315116882, 0.09549808502197266, 0.196573406457901, 0.29764872789382935, 0.3987240791320801, 0.49979937076568604, 0.6008747220039368, 0.7019500732421875, 0.8030253648757935, 0.9041007161140442, 1.005176067352295, 1.1062513589859009, 1.2073266506195068, 1.3084020614624023, 1.4094774723052979, 1.5105527639389038, 1.6116281747817993, 1.7127034664154053, 1.8137787580490112, 1.9148540496826172, 2.0159294605255127, 2.117004871368408, 2.2180800437927246, 2.31915545463562, 2.4202306270599365, 2.521306037902832, 2.6223814487457275, 2.723456621170044, 2.8245320320129395, 2.925607204437256, 3.0266828536987305, 3.127758264541626, 3.2288334369659424, 3.329908847808838, 3.4309842586517334, 3.53205943107605, 3.6331348419189453, 3.7342100143432617, 3.8352854251861572, 3.9363608360290527, 4.037436008453369, 4.138511657714844, 4.23958683013916, 4.340662002563477, 4.441737174987793, 4.542812824249268, 4.643887996673584]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 8.0, 3.0, 9.0, 7.0, 13.0, 12.0, 12.0, 15.0, 15.0, 24.0, 16.0, 23.0, 34.0, 34.0, 38.0, 60.0, 87.0, 176.0, 75.0, 52.0, 39.0, 38.0, 27.0, 29.0, 25.0, 20.0, 18.0, 20.0, 13.0, 12.0, 7.0, 3.0, 8.0, 4.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3344430923461914, -1.2888784408569336, -1.2433139085769653, -1.1977492570877075, -1.1521847248077393, -1.1066200733184814, -1.0610554218292236, -1.0154907703399658, -0.9699262380599976, -0.9243616461753845, -0.8787970542907715, -0.8332324028015137, -0.7876678109169006, -0.7421032190322876, -0.6965385675430298, -0.6509739756584167, -0.6054093837738037, -0.5598447918891907, -0.5142802000045776, -0.4687155485153198, -0.4231509566307068, -0.37758636474609375, -0.3320217430591583, -0.2864571213722229, -0.24089252948760986, -0.19532792270183563, -0.1497633159160614, -0.10419870913028717, -0.05863410234451294, -0.013069495558738708, 0.03249511122703552, 0.07805973291397095, 0.12362432479858398, 0.16918893158435822, 0.21475353837013245, 0.26031816005706787, 0.3058827519416809, 0.35144734382629395, 0.39701196551322937, 0.4425765872001648, 0.48814117908477783, 0.5337057709693909, 0.5792703628540039, 0.6248350143432617, 0.6703996062278748, 0.7159641981124878, 0.7615288496017456, 0.8070934414863586, 0.8526580333709717, 0.8982226252555847, 0.9437872171401978, 0.9893518686294556, 1.0349164009094238, 1.0804810523986816, 1.1260457038879395, 1.1716103553771973, 1.2171748876571655, 1.2627395391464233, 1.3083040714263916, 1.3538687229156494, 1.3994333744049072, 1.4449979066848755, 1.4905625581741333, 1.5361270904541016, 1.5816917419433594]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 15.0, 17.0, 30.0, 42.0, 48.0, 67.0, 90.0, 121.0, 174.0, 308.0, 416.0, 593.0, 965.0, 1506.0, 2660.0, 5009.0, 10397.0, 26402.0, 82610.0, 289211.0, 883815.0, 1555223.0, 903211.0, 296483.0, 83515.0, 28229.0, 10936.0, 4981.0, 2793.0, 1554.0, 901.0, 626.0, 411.0, 264.0, 170.0, 144.0, 88.0, 75.0, 34.0, 33.0, 22.0, 22.0, 19.0, 16.0, 3.0, 3.0, 5.0, 0.0, 8.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0950927734375, -0.09216785430908203, -0.08924293518066406, -0.0863180160522461, -0.08339309692382812, -0.08046817779541016, -0.07754325866699219, -0.07461833953857422, -0.07169342041015625, -0.06876850128173828, -0.06584358215332031, -0.06291866302490234, -0.059993743896484375, -0.057068824768066406, -0.05414390563964844, -0.05121898651123047, -0.0482940673828125, -0.04536914825439453, -0.04244422912597656, -0.039519309997558594, -0.036594390869140625, -0.033669471740722656, -0.030744552612304688, -0.02781963348388672, -0.02489471435546875, -0.02196979522705078, -0.019044876098632812, -0.016119956970214844, -0.013195037841796875, -0.010270118713378906, -0.0073451995849609375, -0.004420280456542969, -0.001495361328125, 0.0014295578002929688, 0.0043544769287109375, 0.007279396057128906, 0.010204315185546875, 0.013129234313964844, 0.016054153442382812, 0.01897907257080078, 0.02190399169921875, 0.02482891082763672, 0.027753829956054688, 0.030678749084472656, 0.033603668212890625, 0.036528587341308594, 0.03945350646972656, 0.04237842559814453, 0.0453033447265625, 0.04822826385498047, 0.05115318298339844, 0.054078102111816406, 0.057003021240234375, 0.059927940368652344, 0.06285285949707031, 0.06577777862548828, 0.06870269775390625, 0.07162761688232422, 0.07455253601074219, 0.07747745513916016, 0.08040237426757812, 0.0833272933959961, 0.08625221252441406, 0.08917713165283203, 0.09210205078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 10.0, 12.0, 14.0, 19.0, 18.0, 30.0, 30.0, 36.0, 41.0, 45.0, 44.0, 48.0, 51.0, 50.0, 40.0, 55.0, 48.0, 49.0, 42.0, 41.0, 36.0, 37.0, 22.0, 32.0, 29.0, 14.0, 16.0, 18.0, 12.0, 10.0, 7.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0992431640625, -0.09629535675048828, -0.09334754943847656, -0.09039974212646484, -0.08745193481445312, -0.0845041275024414, -0.08155632019042969, -0.07860851287841797, -0.07566070556640625, -0.07271289825439453, -0.06976509094238281, -0.0668172836303711, -0.06386947631835938, -0.060921669006347656, -0.05797386169433594, -0.05502605438232422, -0.0520782470703125, -0.04913043975830078, -0.04618263244628906, -0.043234825134277344, -0.040287017822265625, -0.037339210510253906, -0.03439140319824219, -0.03144359588623047, -0.02849578857421875, -0.02554798126220703, -0.022600173950195312, -0.019652366638183594, -0.016704559326171875, -0.013756752014160156, -0.010808944702148438, -0.007861137390136719, -0.004913330078125, -0.0019655227661132812, 0.0009822845458984375, 0.003930091857910156, 0.006877899169921875, 0.009825706481933594, 0.012773513793945312, 0.01572132110595703, 0.01866912841796875, 0.02161693572998047, 0.024564743041992188, 0.027512550354003906, 0.030460357666015625, 0.033408164978027344, 0.03635597229003906, 0.03930377960205078, 0.0422515869140625, 0.04519939422607422, 0.04814720153808594, 0.051095008850097656, 0.054042816162109375, 0.056990623474121094, 0.05993843078613281, 0.06288623809814453, 0.06583404541015625, 0.06878185272216797, 0.07172966003417969, 0.0746774673461914, 0.07762527465820312, 0.08057308197021484, 0.08352088928222656, 0.08646869659423828, 0.08941650390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 5.0, 10.0, 10.0, 6.0, 18.0, 19.0, 29.0, 46.0, 70.0, 89.0, 142.0, 227.0, 377.0, 520.0, 1035.0, 2095.0, 7221.0, 93610.0, 3971736.0, 104698.0, 7754.0, 2140.0, 969.0, 505.0, 318.0, 183.0, 139.0, 88.0, 54.0, 48.0, 22.0, 32.0, 16.0, 11.0, 11.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.51611328125, -0.5015792846679688, -0.4870452880859375, -0.47251129150390625, -0.457977294921875, -0.44344329833984375, -0.4289093017578125, -0.41437530517578125, -0.39984130859375, -0.38530731201171875, -0.3707733154296875, -0.35623931884765625, -0.341705322265625, -0.32717132568359375, -0.3126373291015625, -0.29810333251953125, -0.2835693359375, -0.26903533935546875, -0.2545013427734375, -0.23996734619140625, -0.225433349609375, -0.21089935302734375, -0.1963653564453125, -0.18183135986328125, -0.16729736328125, -0.15276336669921875, -0.1382293701171875, -0.12369537353515625, -0.109161376953125, -0.09462738037109375, -0.0800933837890625, -0.06555938720703125, -0.051025390625, -0.03649139404296875, -0.0219573974609375, -0.00742340087890625, 0.007110595703125, 0.02164459228515625, 0.0361785888671875, 0.05071258544921875, 0.06524658203125, 0.07978057861328125, 0.0943145751953125, 0.10884857177734375, 0.123382568359375, 0.13791656494140625, 0.1524505615234375, 0.16698455810546875, 0.1815185546875, 0.19605255126953125, 0.2105865478515625, 0.22512054443359375, 0.239654541015625, 0.25418853759765625, 0.2687225341796875, 0.28325653076171875, 0.29779052734375, 0.31232452392578125, 0.3268585205078125, 0.34139251708984375, 0.355926513671875, 0.37046051025390625, 0.3849945068359375, 0.39952850341796875, 0.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 12.0, 5.0, 8.0, 6.0, 11.0, 18.0, 20.0, 35.0, 33.0, 56.0, 93.0, 120.0, 194.0, 252.0, 357.0, 479.0, 609.0, 467.0, 367.0, 246.0, 188.0, 134.0, 87.0, 74.0, 48.0, 37.0, 30.0, 28.0, 16.0, 11.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3062782287597656, -0.29785919189453125, -0.2894401550292969, -0.2810211181640625, -0.2726020812988281, -0.26418304443359375, -0.2557640075683594, -0.247344970703125, -0.23892593383789062, -0.23050689697265625, -0.22208786010742188, -0.2136688232421875, -0.20524978637695312, -0.19683074951171875, -0.18841171264648438, -0.17999267578125, -0.17157363891601562, -0.16315460205078125, -0.15473556518554688, -0.1463165283203125, -0.13789749145507812, -0.12947845458984375, -0.12105941772460938, -0.112640380859375, -0.10422134399414062, -0.09580230712890625, -0.08738327026367188, -0.0789642333984375, -0.07054519653320312, -0.06212615966796875, -0.053707122802734375, -0.0452880859375, -0.036869049072265625, -0.02845001220703125, -0.020030975341796875, -0.0116119384765625, -0.003192901611328125, 0.00522613525390625, 0.013645172119140625, 0.022064208984375, 0.030483245849609375, 0.03890228271484375, 0.047321319580078125, 0.0557403564453125, 0.06415939331054688, 0.07257843017578125, 0.08099746704101562, 0.08941650390625, 0.09783554077148438, 0.10625457763671875, 0.11467361450195312, 0.1230926513671875, 0.13151168823242188, 0.13993072509765625, 0.14834976196289062, 0.156768798828125, 0.16518783569335938, 0.17360687255859375, 0.18202590942382812, 0.1904449462890625, 0.19886398315429688, 0.20728302001953125, 0.21570205688476562, 0.22412109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 11.0, 8.0, 24.0, 61.0, 142.0, 240.0, 260.0, 139.0, 64.0, 25.0, 15.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.275860786437988, -6.118461608886719, -5.961061954498291, -5.8036627769470215, -5.646263122558594, -5.488863945007324, -5.3314642906188965, -5.174065113067627, -5.016665458679199, -4.85926628112793, -4.701866626739502, -4.544467449188232, -4.387067794799805, -4.229668617248535, -4.072268962860107, -3.914869785308838, -3.7574706077575684, -3.6000711917877197, -3.442671775817871, -3.2852723598480225, -3.127872943878174, -2.9704737663269043, -2.8130743503570557, -2.655674934387207, -2.4982755184173584, -2.3408761024475098, -2.183476686477661, -2.0260772705078125, -1.8686779737472534, -1.7112785577774048, -1.5538792610168457, -1.396479845046997, -1.2390809059143066, -1.081681489944458, -0.9242821335792542, -0.7668827772140503, -0.6094833612442017, -0.452083945274353, -0.29468458890914917, -0.1372852325439453, 0.02011418342590332, 0.17751356959342957, 0.3349129557609558, 0.49231234192848206, 0.6497117280960083, 0.8071111440658569, 0.9645105004310608, 1.1219098567962646, 1.2793092727661133, 1.436708688735962, 1.5941081047058105, 1.7515074014663696, 1.9089068174362183, 2.0663061141967773, 2.223705530166626, 2.3811049461364746, 2.5385043621063232, 2.695903778076172, 2.8533031940460205, 3.010702610015869, 3.1681017875671387, 3.3255014419555664, 3.482900619506836, 3.6403000354766846, 3.797699451446533]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 20.0, 21.0, 46.0, 45.0, 45.0, 51.0, 84.0, 99.0, 92.0, 85.0, 54.0, 68.0, 51.0, 58.0, 32.0, 33.0, 28.0, 20.0, 13.0, 10.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.195653200149536, -3.114492893218994, -3.033332586288452, -2.95217227935791, -2.871011734008789, -2.789851427078247, -2.708691120147705, -2.627530813217163, -2.546370506286621, -2.465210199356079, -2.384049892425537, -2.302889585494995, -2.221729278564453, -2.140568733215332, -2.05940842628479, -1.978248119354248, -1.897087812423706, -1.815927505493164, -1.734767198562622, -1.6536067724227905, -1.5724464654922485, -1.4912861585617065, -1.410125732421875, -1.328965425491333, -1.247805118560791, -1.166644811630249, -1.085484504699707, -1.0043240785598755, -0.9231637716293335, -0.8420034646987915, -0.7608430981636047, -0.679682731628418, -0.598522424697876, -0.517362117767334, -0.4362017512321472, -0.35504141449928284, -0.27388107776641846, -0.19272074103355408, -0.1115604043006897, -0.03040003776550293, 0.05076026916503906, 0.13192060589790344, 0.21308094263076782, 0.2942412793636322, 0.3754016160964966, 0.45656195282936096, 0.5377222895622253, 0.6188826560974121, 0.7000429630279541, 0.7812032699584961, 0.8623636364936829, 0.9435240030288696, 1.0246843099594116, 1.1058446168899536, 1.1870050430297852, 1.2681653499603271, 1.3493256568908691, 1.4304859638214111, 1.5116462707519531, 1.5928066968917847, 1.6739670038223267, 1.7551273107528687, 1.8362877368927002, 1.9174480438232422, 1.9986083507537842]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 6.0, 10.0, 9.0, 15.0, 15.0, 26.0, 34.0, 58.0, 65.0, 122.0, 233.0, 546.0, 1515.0, 4814.0, 19845.0, 143181.0, 784774.0, 74868.0, 12923.0, 3391.0, 1120.0, 451.0, 205.0, 124.0, 53.0, 41.0, 36.0, 24.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270263671875, -0.2610588073730469, -0.25185394287109375, -0.24264907836914062, -0.2334442138671875, -0.22423934936523438, -0.21503448486328125, -0.20582962036132812, -0.196624755859375, -0.18741989135742188, -0.17821502685546875, -0.16901016235351562, -0.1598052978515625, -0.15060043334960938, -0.14139556884765625, -0.13219070434570312, -0.12298583984375, -0.11378097534179688, -0.10457611083984375, -0.09537124633789062, -0.0861663818359375, -0.07696151733398438, -0.06775665283203125, -0.058551788330078125, -0.049346923828125, -0.040142059326171875, -0.03093719482421875, -0.021732330322265625, -0.0125274658203125, -0.003322601318359375, 0.00588226318359375, 0.015087127685546875, 0.0242919921875, 0.033496856689453125, 0.04270172119140625, 0.051906585693359375, 0.0611114501953125, 0.07031631469726562, 0.07952117919921875, 0.08872604370117188, 0.097930908203125, 0.10713577270507812, 0.11634063720703125, 0.12554550170898438, 0.1347503662109375, 0.14395523071289062, 0.15316009521484375, 0.16236495971679688, 0.17156982421875, 0.18077468872070312, 0.18997955322265625, 0.19918441772460938, 0.2083892822265625, 0.21759414672851562, 0.22679901123046875, 0.23600387573242188, 0.245208740234375, 0.2544136047363281, 0.26361846923828125, 0.2728233337402344, 0.2820281982421875, 0.2912330627441406, 0.30043792724609375, 0.3096427917480469, 0.31884765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 10.0, 22.0, 40.0, 56.0, 56.0, 96.0, 119.0, 98.0, 118.0, 107.0, 87.0, 69.0, 42.0, 28.0, 18.0, 11.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.3212776184082031, -0.31320953369140625, -0.3051414489746094, -0.2970733642578125, -0.2890052795410156, -0.28093719482421875, -0.2728691101074219, -0.264801025390625, -0.2567329406738281, -0.24866485595703125, -0.24059677124023438, -0.2325286865234375, -0.22446060180664062, -0.21639251708984375, -0.20832443237304688, -0.20025634765625, -0.19218826293945312, -0.18412017822265625, -0.17605209350585938, -0.1679840087890625, -0.15991592407226562, -0.15184783935546875, -0.14377975463867188, -0.135711669921875, -0.12764358520507812, -0.11957550048828125, -0.11150741577148438, -0.1034393310546875, -0.09537124633789062, -0.08730316162109375, -0.07923507690429688, -0.0711669921875, -0.06309890747070312, -0.05503082275390625, -0.046962738037109375, -0.0388946533203125, -0.030826568603515625, -0.02275848388671875, -0.014690399169921875, -0.006622314453125, 0.001445770263671875, 0.00951385498046875, 0.017581939697265625, 0.0256500244140625, 0.033718109130859375, 0.04178619384765625, 0.049854278564453125, 0.05792236328125, 0.06599044799804688, 0.07405853271484375, 0.08212661743164062, 0.0901947021484375, 0.09826278686523438, 0.10633087158203125, 0.11439895629882812, 0.122467041015625, 0.13053512573242188, 0.13860321044921875, 0.14667129516601562, 0.1547393798828125, 0.16280746459960938, 0.17087554931640625, 0.17894363403320312, 0.18701171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 10.0, 12.0, 12.0, 24.0, 26.0, 43.0, 42.0, 72.0, 151.0, 220.0, 395.0, 872.0, 2804.0, 17982.0, 854669.0, 158202.0, 9619.0, 1848.0, 700.0, 330.0, 169.0, 115.0, 75.0, 56.0, 29.0, 21.0, 16.0, 11.0, 13.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.36200714111328125, -0.3521881103515625, -0.34236907958984375, -0.332550048828125, -0.32273101806640625, -0.3129119873046875, -0.30309295654296875, -0.29327392578125, -0.28345489501953125, -0.2736358642578125, -0.26381683349609375, -0.253997802734375, -0.24417877197265625, -0.2343597412109375, -0.22454071044921875, -0.2147216796875, -0.20490264892578125, -0.1950836181640625, -0.18526458740234375, -0.175445556640625, -0.16562652587890625, -0.1558074951171875, -0.14598846435546875, -0.13616943359375, -0.12635040283203125, -0.1165313720703125, -0.10671234130859375, -0.096893310546875, -0.08707427978515625, -0.0772552490234375, -0.06743621826171875, -0.0576171875, -0.04779815673828125, -0.0379791259765625, -0.02816009521484375, -0.018341064453125, -0.00852203369140625, 0.0012969970703125, 0.01111602783203125, 0.02093505859375, 0.03075408935546875, 0.0405731201171875, 0.05039215087890625, 0.060211181640625, 0.07003021240234375, 0.0798492431640625, 0.08966827392578125, 0.0994873046875, 0.10930633544921875, 0.1191253662109375, 0.12894439697265625, 0.138763427734375, 0.14858245849609375, 0.1584014892578125, 0.16822052001953125, 0.17803955078125, 0.18785858154296875, 0.1976776123046875, 0.20749664306640625, 0.217315673828125, 0.22713470458984375, 0.2369537353515625, 0.24677276611328125, 0.256591796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 9.0, 9.0, 12.0, 10.0, 21.0, 21.0, 19.0, 33.0, 21.0, 32.0, 28.0, 37.0, 52.0, 66.0, 65.0, 73.0, 74.0, 75.0, 71.0, 34.0, 30.0, 34.0, 25.0, 20.0, 21.0, 21.0, 13.0, 12.0, 14.0, 8.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.52294921875, -0.5094566345214844, -0.49596405029296875, -0.4824714660644531, -0.4689788818359375, -0.4554862976074219, -0.44199371337890625, -0.4285011291503906, -0.415008544921875, -0.4015159606933594, -0.38802337646484375, -0.3745307922363281, -0.3610382080078125, -0.3475456237792969, -0.33405303955078125, -0.3205604553222656, -0.30706787109375, -0.2935752868652344, -0.28008270263671875, -0.2665901184082031, -0.2530975341796875, -0.23960494995117188, -0.22611236572265625, -0.21261978149414062, -0.199127197265625, -0.18563461303710938, -0.17214202880859375, -0.15864944458007812, -0.1451568603515625, -0.13166427612304688, -0.11817169189453125, -0.10467910766601562, -0.0911865234375, -0.07769393920898438, -0.06420135498046875, -0.050708770751953125, -0.0372161865234375, -0.023723602294921875, -0.01023101806640625, 0.003261566162109375, 0.016754150390625, 0.030246734619140625, 0.04373931884765625, 0.057231903076171875, 0.0707244873046875, 0.08421707153320312, 0.09770965576171875, 0.11120223999023438, 0.12469482421875, 0.13818740844726562, 0.15167999267578125, 0.16517257690429688, 0.1786651611328125, 0.19215774536132812, 0.20565032958984375, 0.21914291381835938, 0.232635498046875, 0.24612808227539062, 0.25962066650390625, 0.2731132507324219, 0.2866058349609375, 0.3000984191894531, 0.31359100341796875, 0.3270835876464844, 0.340576171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 2.0, 15.0, 11.0, 26.0, 34.0, 48.0, 83.0, 133.0, 249.0, 535.0, 1297.0, 4425.0, 28282.0, 953441.0, 50663.0, 6317.0, 1592.0, 631.0, 329.0, 165.0, 89.0, 57.0, 41.0, 21.0, 20.0, 15.0, 7.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0799560546875, -0.07750415802001953, -0.07505226135253906, -0.0726003646850586, -0.07014846801757812, -0.06769657135009766, -0.06524467468261719, -0.06279277801513672, -0.06034088134765625, -0.05788898468017578, -0.05543708801269531, -0.052985191345214844, -0.050533294677734375, -0.048081398010253906, -0.04562950134277344, -0.04317760467529297, -0.0407257080078125, -0.03827381134033203, -0.03582191467285156, -0.033370018005371094, -0.030918121337890625, -0.028466224670410156, -0.026014328002929688, -0.02356243133544922, -0.02111053466796875, -0.01865863800048828, -0.016206741333007812, -0.013754844665527344, -0.011302947998046875, -0.008851051330566406, -0.0063991546630859375, -0.003947257995605469, -0.001495361328125, 0.0009565353393554688, 0.0034084320068359375, 0.005860328674316406, 0.008312225341796875, 0.010764122009277344, 0.013216018676757812, 0.01566791534423828, 0.01811981201171875, 0.02057170867919922, 0.023023605346679688, 0.025475502014160156, 0.027927398681640625, 0.030379295349121094, 0.03283119201660156, 0.03528308868408203, 0.0377349853515625, 0.04018688201904297, 0.04263877868652344, 0.045090675354003906, 0.047542572021484375, 0.049994468688964844, 0.05244636535644531, 0.05489826202392578, 0.05735015869140625, 0.05980205535888672, 0.06225395202636719, 0.06470584869384766, 0.06715774536132812, 0.0696096420288086, 0.07206153869628906, 0.07451343536376953, 0.07696533203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 20.0, 18.0, 26.0, 20.0, 32.0, 44.0, 50.0, 72.0, 90.0, 84.0, 78.0, 92.0, 72.0, 60.0, 43.0, 31.0, 23.0, 20.0, 17.0, 14.0, 17.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.74913215637207e-05, -3.645382821559906e-05, -3.541633486747742e-05, -3.4378841519355774e-05, -3.334134817123413e-05, -3.230385482311249e-05, -3.1266361474990845e-05, -3.02288681268692e-05, -2.919137477874756e-05, -2.8153881430625916e-05, -2.7116388082504272e-05, -2.607889473438263e-05, -2.5041401386260986e-05, -2.4003908038139343e-05, -2.29664146900177e-05, -2.1928921341896057e-05, -2.0891427993774414e-05, -1.985393464565277e-05, -1.8816441297531128e-05, -1.7778947949409485e-05, -1.6741454601287842e-05, -1.57039612531662e-05, -1.4666467905044556e-05, -1.3628974556922913e-05, -1.259148120880127e-05, -1.1553987860679626e-05, -1.0516494512557983e-05, -9.47900116443634e-06, -8.441507816314697e-06, -7.404014468193054e-06, -6.366521120071411e-06, -5.329027771949768e-06, -4.291534423828125e-06, -3.254041075706482e-06, -2.216547727584839e-06, -1.1790543794631958e-06, -1.4156103134155273e-07, 8.959323167800903e-07, 1.9334256649017334e-06, 2.9709190130233765e-06, 4.0084123611450195e-06, 5.045905709266663e-06, 6.083399057388306e-06, 7.120892405509949e-06, 8.158385753631592e-06, 9.195879101753235e-06, 1.0233372449874878e-05, 1.1270865797996521e-05, 1.2308359146118164e-05, 1.3345852494239807e-05, 1.438334584236145e-05, 1.5420839190483093e-05, 1.6458332538604736e-05, 1.749582588672638e-05, 1.8533319234848022e-05, 1.9570812582969666e-05, 2.060830593109131e-05, 2.164579927921295e-05, 2.2683292627334595e-05, 2.3720785975456238e-05, 2.475827932357788e-05, 2.5795772671699524e-05, 2.6833266019821167e-05, 2.787075936794281e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 7.0, 13.0, 23.0, 23.0, 37.0, 53.0, 93.0, 190.0, 288.0, 537.0, 1086.0, 2521.0, 6830.0, 23331.0, 249926.0, 725359.0, 25677.0, 7322.0, 2723.0, 1156.0, 564.0, 318.0, 170.0, 98.0, 62.0, 32.0, 29.0, 22.0, 15.0, 12.0, 2.0, 10.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.03831624984741211, -0.03689861297607422, -0.03548097610473633, -0.03406333923339844, -0.03264570236206055, -0.031228065490722656, -0.029810428619384766, -0.028392791748046875, -0.026975154876708984, -0.025557518005371094, -0.024139881134033203, -0.022722244262695312, -0.021304607391357422, -0.01988697052001953, -0.01846933364868164, -0.01705169677734375, -0.01563405990600586, -0.014216423034667969, -0.012798786163330078, -0.011381149291992188, -0.009963512420654297, -0.008545875549316406, -0.007128238677978516, -0.005710601806640625, -0.004292964935302734, -0.0028753280639648438, -0.0014576911926269531, -4.00543212890625e-05, 0.0013775825500488281, 0.0027952194213867188, 0.004212856292724609, 0.0056304931640625, 0.007048130035400391, 0.008465766906738281, 0.009883403778076172, 0.011301040649414062, 0.012718677520751953, 0.014136314392089844, 0.015553951263427734, 0.016971588134765625, 0.018389225006103516, 0.019806861877441406, 0.021224498748779297, 0.022642135620117188, 0.024059772491455078, 0.02547740936279297, 0.02689504623413086, 0.02831268310546875, 0.02973031997680664, 0.03114795684814453, 0.03256559371948242, 0.03398323059082031, 0.0354008674621582, 0.036818504333496094, 0.038236141204833984, 0.039653778076171875, 0.041071414947509766, 0.042489051818847656, 0.04390668869018555, 0.04532432556152344, 0.04674196243286133, 0.04815959930419922, 0.04957723617553711, 0.050994873046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 7.0, 12.0, 21.0, 20.0, 24.0, 26.0, 30.0, 34.0, 46.0, 84.0, 116.0, 141.0, 98.0, 66.0, 54.0, 37.0, 25.0, 23.0, 19.0, 11.0, 14.0, 15.0, 5.0, 7.0, 7.0, 7.0, 4.0, 2.0, 3.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0382080078125, -0.03698539733886719, -0.035762786865234375, -0.03454017639160156, -0.03331756591796875, -0.03209495544433594, -0.030872344970703125, -0.029649734497070312, -0.0284271240234375, -0.027204513549804688, -0.025981903076171875, -0.024759292602539062, -0.02353668212890625, -0.022314071655273438, -0.021091461181640625, -0.019868850708007812, -0.018646240234375, -0.017423629760742188, -0.016201019287109375, -0.014978408813476562, -0.01375579833984375, -0.012533187866210938, -0.011310577392578125, -0.010087966918945312, -0.0088653564453125, -0.0076427459716796875, -0.006420135498046875, -0.0051975250244140625, -0.00397491455078125, -0.0027523040771484375, -0.001529693603515625, -0.0003070831298828125, 0.00091552734375, 0.0021381378173828125, 0.003360748291015625, 0.0045833587646484375, 0.00580596923828125, 0.0070285797119140625, 0.008251190185546875, 0.009473800659179688, 0.0106964111328125, 0.011919021606445312, 0.013141632080078125, 0.014364242553710938, 0.01558685302734375, 0.016809463500976562, 0.018032073974609375, 0.019254684448242188, 0.020477294921875, 0.021699905395507812, 0.022922515869140625, 0.024145126342773438, 0.02536773681640625, 0.026590347290039062, 0.027812957763671875, 0.029035568237304688, 0.0302581787109375, 0.03148078918457031, 0.032703399658203125, 0.03392601013183594, 0.03514862060546875, 0.03637123107910156, 0.037593841552734375, 0.03881645202636719, 0.0400390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 40.0, 86.0, 571.0, 194.0, 54.0, 25.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.972259521484375, -3.8644375801086426, -3.75661563873291, -3.6487936973571777, -3.5409717559814453, -3.433149814605713, -3.3253278732299805, -3.217505931854248, -3.1096839904785156, -3.001862049102783, -2.894040107727051, -2.7862181663513184, -2.678396224975586, -2.5705742835998535, -2.462752342224121, -2.3549304008483887, -2.2471084594726562, -2.139286518096924, -2.0314645767211914, -1.923642635345459, -1.8158206939697266, -1.7079987525939941, -1.6001768112182617, -1.4923548698425293, -1.3845326900482178, -1.2767107486724854, -1.168888807296753, -1.0610668659210205, -0.9532449245452881, -0.8454229235649109, -0.7376009821891785, -0.629779040813446, -0.5219571590423584, -0.414135217666626, -0.30631327629089355, -0.19849130511283875, -0.09066936373710632, 0.017152607440948486, 0.12497454881668091, 0.23279649019241333, 0.34061843156814575, 0.4484403729438782, 0.5562623143196106, 0.6640843152999878, 0.7719062566757202, 0.8797281980514526, 0.9875501394271851, 1.0953720808029175, 1.20319402217865, 1.3110159635543823, 1.4188379049301147, 1.5266598463058472, 1.6344817876815796, 1.7423038482666016, 1.850125789642334, 1.9579477310180664, 2.065769672393799, 2.1735916137695312, 2.2814135551452637, 2.389235496520996, 2.4970574378967285, 2.604879379272461, 2.7127013206481934, 2.820523262023926, 2.928345203399658]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 9.0, 17.0, 13.0, 18.0, 20.0, 13.0, 27.0, 19.0, 26.0, 24.0, 34.0, 129.0, 316.0, 74.0, 26.0, 34.0, 22.0, 17.0, 16.0, 16.0, 12.0, 17.0, 9.0, 8.0, 7.0, 7.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2284584045410156, -1.1880301237106323, -1.147601842880249, -1.1071734428405762, -1.0667451620101929, -1.0263168811798096, -0.9858886003494263, -0.9454602599143982, -0.9050319194793701, -0.8646036386489868, -0.8241752982139587, -0.7837470173835754, -0.7433186769485474, -0.7028903961181641, -0.6624621152877808, -0.6220337748527527, -0.5816054940223694, -0.5411772131919861, -0.500748872756958, -0.4603205919265747, -0.41989225149154663, -0.37946397066116333, -0.33903566002845764, -0.29860734939575195, -0.25817903876304626, -0.21775072813034058, -0.1773224174976349, -0.1368941217660904, -0.0964658111333847, -0.056037500500679016, -0.015609204769134521, 0.024819105863571167, 0.06524741649627686, 0.10567572712898254, 0.14610403776168823, 0.18653233349323273, 0.22696064412593842, 0.2673889398574829, 0.3078172504901886, 0.3482455611228943, 0.3886738717556, 0.42910218238830566, 0.46953049302101135, 0.509958803653717, 0.5503870844841003, 0.5908154249191284, 0.6312437057495117, 0.671671986579895, 0.7121003270149231, 0.7525286078453064, 0.7929569482803345, 0.8333852291107178, 0.8738135695457458, 0.9142418503761292, 0.9546701908111572, 0.9950984716415405, 1.0355267524719238, 1.0759550333023071, 1.1163833141326904, 1.1568117141723633, 1.1972399950027466, 1.2376682758331299, 1.2780965566635132, 1.3185248374938965, 1.3589532375335693]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 4.0, 8.0, 12.0, 14.0, 20.0, 16.0, 22.0, 24.0, 30.0, 38.0, 38.0, 85.0, 246.0, 95.0, 48.0, 49.0, 39.0, 37.0, 13.0, 21.0, 13.0, 20.0, 11.0, 13.0, 12.0, 3.0, 8.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10479736328125, -0.10167503356933594, -0.09855270385742188, -0.09543037414550781, -0.09230804443359375, -0.08918571472167969, -0.08606338500976562, -0.08294105529785156, -0.0798187255859375, -0.07669639587402344, -0.07357406616210938, -0.07045173645019531, -0.06732940673828125, -0.06420707702636719, -0.061084747314453125, -0.05796241760253906, -0.054840087890625, -0.05171775817871094, -0.048595428466796875, -0.04547309875488281, -0.04235076904296875, -0.03922843933105469, -0.036106109619140625, -0.03298377990722656, -0.0298614501953125, -0.026739120483398438, -0.023616790771484375, -0.020494461059570312, -0.01737213134765625, -0.014249801635742188, -0.011127471923828125, -0.008005142211914062, -0.0048828125, -0.0017604827880859375, 0.001361846923828125, 0.0044841766357421875, 0.00760650634765625, 0.010728836059570312, 0.013851165771484375, 0.016973495483398438, 0.0200958251953125, 0.023218154907226562, 0.026340484619140625, 0.029462814331054688, 0.03258514404296875, 0.03570747375488281, 0.038829803466796875, 0.04195213317871094, 0.045074462890625, 0.04819679260253906, 0.051319122314453125, 0.05444145202636719, 0.05756378173828125, 0.06068611145019531, 0.06380844116210938, 0.06693077087402344, 0.0700531005859375, 0.07317543029785156, 0.07629776000976562, 0.07942008972167969, 0.08254241943359375, 0.08566474914550781, 0.08878707885742188, 0.09190940856933594, 0.09503173828125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 2.0, 7.0, 7.0, 15.0, 18.0, 31.0, 52.0, 58.0, 127.0, 215.0, 585.0, 2083.0, 18128.0, 8355497.0, 9468.0, 1416.0, 363.0, 185.0, 109.0, 86.0, 47.0, 22.0, 16.0, 4.0, 6.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 7.0, 6.0], "bins": [-1.727432131767273, -1.6866792440414429, -1.6459263563156128, -1.6051735877990723, -1.5644207000732422, -1.523667812347412, -1.482914924621582, -1.442162036895752, -1.4014091491699219, -1.3606562614440918, -1.3199033737182617, -1.2791506052017212, -1.2383977174758911, -1.197644829750061, -1.156891942024231, -1.1161390542984009, -1.0753862857818604, -1.0346333980560303, -0.993880569934845, -0.9531276822090149, -0.9123748540878296, -0.8716219663619995, -0.8308690786361694, -0.7901161909103394, -0.749363362789154, -0.708610475063324, -0.6678576469421387, -0.6271047592163086, -0.5863518714904785, -0.5455990433692932, -0.5048461556434631, -0.46409329771995544, -0.423340380191803, -0.3825875222682953, -0.3418346643447876, -0.3010817766189575, -0.26032891869544983, -0.21957606077194214, -0.17882318794727325, -0.13807031512260437, -0.09731745719909668, -0.05656459182500839, -0.015811726450920105, 0.024941138923168182, 0.06569400429725647, 0.10644686222076416, 0.14719973504543304, 0.18795260787010193, 0.22870546579360962, 0.2694583237171173, 0.310211181640625, 0.3509640693664551, 0.39171692728996277, 0.43246978521347046, 0.47322267293930054, 0.5139755010604858, 0.5547283887863159, 0.595481276512146, 0.6362341046333313, 0.6769869923591614, 0.7177398204803467, 0.7584927082061768, 0.7992455959320068, 0.8399984836578369, 0.8807513117790222]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 6.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8476085662841797, -0.810314953327179, -0.7730213403701782, -0.7357277274131775, -0.6984341144561768, -0.6611405611038208, -0.6238469481468201, -0.5865533351898193, -0.5492597222328186, -0.5119661092758179, -0.47467249631881714, -0.4373789131641388, -0.40008530020713806, -0.36279168725013733, -0.325498104095459, -0.28820449113845825, -0.2509108781814575, -0.2136172652244568, -0.17632366716861725, -0.1390300691127777, -0.10173645615577698, -0.06444284319877625, -0.027149245142936707, 0.010144352912902832, 0.047437965869903564, 0.0847315713763237, 0.12202517688274384, 0.15931877493858337, 0.1966123878955841, 0.23390600085258484, 0.2711995840072632, 0.3084931969642639, 0.3457869291305542, 0.38308054208755493, 0.42037415504455566, 0.457667738199234, 0.49496135115623474, 0.5322549343109131, 0.5695485472679138, 0.6068421602249146, 0.6441357731819153, 0.681429386138916, 0.7187229990959167, 0.7560166120529175, 0.7933101654052734, 0.830603837966919, 0.8678973913192749, 0.9051910042762756, 0.9424846172332764, 0.9797782301902771, 1.0170718431472778, 1.0543653964996338, 1.0916590690612793, 1.1289526224136353, 1.1662462949752808, 1.2035398483276367, 1.2408335208892822, 1.2781270742416382, 1.3154207468032837, 1.3527143001556396, 1.3900079727172852, 1.4273015260696411, 1.4645951986312866, 1.5018887519836426, 1.5391823053359985]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 9.0, 3.0, 8.0, 6.0, 25.0, 29.0, 37.0, 71.0, 80.0, 117.0, 208.0, 352.0, 545.0, 932.0, 1781.0, 3639.0, 8081.0, 21462.0, 65313.0, 189003.0, 153837.0, 48876.0, 16877.0, 6587.0, 2838.0, 1500.0, 789.0, 445.0, 273.0, 188.0, 116.0, 83.0, 39.0, 37.0, 28.0, 19.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.9135055541992188, -0.8880462646484375, -0.8625869750976562, -0.837127685546875, -0.8116683959960938, -0.7862091064453125, -0.7607498168945312, -0.73529052734375, -0.7098312377929688, -0.6843719482421875, -0.6589126586914062, -0.633453369140625, -0.6079940795898438, -0.5825347900390625, -0.5570755004882812, -0.5316162109375, -0.5061569213867188, -0.4806976318359375, -0.45523834228515625, -0.429779052734375, -0.40431976318359375, -0.3788604736328125, -0.35340118408203125, -0.32794189453125, -0.30248260498046875, -0.2770233154296875, -0.25156402587890625, -0.226104736328125, -0.20064544677734375, -0.1751861572265625, -0.14972686767578125, -0.124267578125, -0.09880828857421875, -0.0733489990234375, -0.04788970947265625, -0.022430419921875, 0.00302886962890625, 0.0284881591796875, 0.05394744873046875, 0.07940673828125, 0.10486602783203125, 0.1303253173828125, 0.15578460693359375, 0.181243896484375, 0.20670318603515625, 0.2321624755859375, 0.25762176513671875, 0.2830810546875, 0.30854034423828125, 0.3339996337890625, 0.35945892333984375, 0.384918212890625, 0.41037750244140625, 0.4358367919921875, 0.46129608154296875, 0.48675537109375, 0.5122146606445312, 0.5376739501953125, 0.5631332397460938, 0.588592529296875, 0.6140518188476562, 0.6395111083984375, 0.6649703979492188, 0.6904296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 14.0, 26.0, 44.0, 57.0, 98.0, 148.0, 131.0, 130.0, 112.0, 63.0, 48.0, 39.0, 27.0, 26.0, 11.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3142223358154297, -0.3059349060058594, -0.29764747619628906, -0.28936004638671875, -0.28107261657714844, -0.2727851867675781, -0.2644977569580078, -0.2562103271484375, -0.2479228973388672, -0.23963546752929688, -0.23134803771972656, -0.22306060791015625, -0.21477317810058594, -0.20648574829101562, -0.1981983184814453, -0.189910888671875, -0.1816234588623047, -0.17333602905273438, -0.16504859924316406, -0.15676116943359375, -0.14847373962402344, -0.14018630981445312, -0.1318988800048828, -0.1236114501953125, -0.11532402038574219, -0.10703659057617188, -0.09874916076660156, -0.09046173095703125, -0.08217430114746094, -0.07388687133789062, -0.06559944152832031, -0.05731201171875, -0.04902458190917969, -0.040737152099609375, -0.03244972229003906, -0.02416229248046875, -0.015874862670898438, -0.007587432861328125, 0.0006999969482421875, 0.0089874267578125, 0.017274856567382812, 0.025562286376953125, 0.03384971618652344, 0.04213714599609375, 0.05042457580566406, 0.058712005615234375, 0.06699943542480469, 0.075286865234375, 0.08357429504394531, 0.09186172485351562, 0.10014915466308594, 0.10843658447265625, 0.11672401428222656, 0.12501144409179688, 0.1332988739013672, 0.1415863037109375, 0.1498737335205078, 0.15816116333007812, 0.16644859313964844, 0.17473602294921875, 0.18302345275878906, 0.19131088256835938, 0.1995983123779297, 0.2078857421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 16.0, 31.0, 49.0, 117.0, 110.0, 64.0, 43.0, 11.0, 6.0, 5.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6203757524490356, -1.5752099752426147, -1.5300440788269043, -1.4848783016204834, -1.439712405204773, -1.394546627998352, -1.3493807315826416, -1.3042149543762207, -1.2590491771697998, -1.213883399963379, -1.1687175035476685, -1.1235517263412476, -1.078385829925537, -1.0332200527191162, -0.9880542159080505, -0.9428883790969849, -0.8977224826812744, -0.8525566458702087, -0.8073908090591431, -0.7622250318527222, -0.7170591354370117, -0.6718933582305908, -0.6267275214195251, -0.5815616846084595, -0.5363958477973938, -0.4912300109863281, -0.44606417417526245, -0.40089836716651917, -0.3557325303554535, -0.3105666935443878, -0.26540088653564453, -0.22023504972457886, -0.17506933212280273, -0.12990349531173706, -0.08473767340183258, -0.0395718514919281, 0.005593985319137573, 0.05075982213020325, 0.09592562913894653, 0.1410914659500122, 0.18625730276107788, 0.23142313957214355, 0.27658897638320923, 0.3217547833919525, 0.3669206202030182, 0.41208645701408386, 0.45725226402282715, 0.5024181008338928, 0.5475839376449585, 0.5927497744560242, 0.6379156112670898, 0.6830813884735107, 0.7282472848892212, 0.7734130620956421, 0.8185788989067078, 0.8637447357177734, 0.9089105725288391, 0.9540764093399048, 0.9992422461509705, 1.0444080829620361, 1.089573860168457, 1.1347397565841675, 1.1799055337905884, 1.2250714302062988, 1.2702372074127197]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 15.0, 6.0, 21.0, 58.0, 117.0, 123.0, 55.0, 17.0, 13.0, 8.0, 1.0, 3.0, 2.0, 8.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1648681163787842, -1.1329078674316406, -1.100947618484497, -1.0689873695373535, -1.03702712059021, -1.0050668716430664, -0.9731065630912781, -0.9411463141441345, -0.909186065196991, -0.8772258162498474, -0.8452655673027039, -0.8133053183555603, -0.781345009803772, -0.7493847608566284, -0.7174245119094849, -0.6854642629623413, -0.6535040140151978, -0.6215437650680542, -0.5895835161209106, -0.5576232671737671, -0.5256630182266235, -0.4937027394771576, -0.46174246072769165, -0.4297822117805481, -0.39782196283340454, -0.365861713886261, -0.33390146493911743, -0.3019411861896515, -0.26998093724250793, -0.23802068829536438, -0.20606042444705963, -0.17410016059875488, -0.14213979244232178, -0.11017953604459763, -0.07821927964687347, -0.04625902324914932, -0.014298766851425171, 0.017661482095718384, 0.04962174594402313, 0.08158200979232788, 0.11354225873947144, 0.145502507686615, 0.17746277153491974, 0.2094230353832245, 0.24138328433036804, 0.2733435332775116, 0.30530381202697754, 0.3372640609741211, 0.36922430992126465, 0.4011845588684082, 0.43314480781555176, 0.4651050865650177, 0.49706533551216125, 0.5290255546569824, 0.5609858632087708, 0.5929461121559143, 0.6249063611030579, 0.6568666100502014, 0.688826858997345, 0.7207871079444885, 0.7527474164962769, 0.7847076654434204, 0.816667914390564, 0.8486281633377075, 0.8805884122848511]}, "eval/loss": 4.194759368896484, "eval/wer": 2.4282625942086473, "eval/runtime": 1143.8371, "eval/samples_per_second": 2.31, "eval/steps_per_second": 0.289, "train/train_runtime": 6364.0567, "train/train_samples_per_second": 4.484, "train/train_steps_per_second": 0.14, "train/total_flos": 0.0, "train/train_loss": 4.297821357913081, "_wandb": {"runtime": 7878}} \ No newline at end of file