diff --git "a/wandb/run-20220302_200036-31e4k99c/files/wandb-summary.json" "b/wandb/run-20220302_200036-31e4k99c/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_200036-31e4k99c/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.5291, "train/learning_rate": 0.00017759999999999998, "train/epoch": 1.0, "train/global_step": 297, "_runtime": 4796, "_timestamp": 1646256032, "_step": 297, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 32.0, 208.0, 492.0, 240.0, 41.0, 4.0, 1.0, 0.0, 1.0], "bins": [-272.8752136230469, -268.13763427734375, -263.4000549316406, -258.6624755859375, -253.92489624023438, -249.18731689453125, -244.44973754882812, -239.712158203125, -234.97457885742188, -230.23699951171875, -225.49942016601562, -220.7618408203125, -216.02426147460938, -211.28668212890625, -206.54910278320312, -201.8115234375, -197.07394409179688, -192.33636474609375, -187.59878540039062, -182.8612060546875, -178.12362670898438, -173.38604736328125, -168.64846801757812, -163.910888671875, -159.17330932617188, -154.43572998046875, -149.69815063476562, -144.9605712890625, -140.22299194335938, -135.48541259765625, -130.74783325195312, -126.01025390625, -121.2726821899414, -116.53510284423828, -111.79752349853516, -107.05994415283203, -102.3223648071289, -97.58478546142578, -92.84720611572266, -88.10962677001953, -83.3720474243164, -78.63446807861328, -73.89688873291016, -69.15930938720703, -64.4217300415039, -59.68415069580078, -54.946571350097656, -50.20899200439453, -45.471412658691406, -40.73383331298828, -35.996253967285156, -31.25867462158203, -26.521095275878906, -21.78351593017578, -17.045936584472656, -12.308357238769531, -7.570777893066406, -2.8331985473632812, 1.9043807983398438, 6.641960144042969, 11.379539489746094, 16.11711883544922, 20.854698181152344, 25.59227752685547, 30.329856872558594]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 18.0, 21.0, 25.0, 28.0, 32.0, 47.0, 44.0, 50.0, 56.0, 52.0, 60.0, 49.0, 59.0, 59.0, 57.0, 49.0, 52.0, 43.0, 39.0, 26.0, 24.0, 20.0, 13.0, 9.0, 10.0, 13.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-83.19218444824219, -81.14936828613281, -79.10655212402344, -77.06373596191406, -75.02091217041016, -72.97809600830078, -70.9352798461914, -68.89246368408203, -66.84964752197266, -64.80683135986328, -62.76401138305664, -60.721195220947266, -58.67837905883789, -56.63555908203125, -54.592742919921875, -52.5499267578125, -50.50710678100586, -48.464290618896484, -46.421470642089844, -44.37865447998047, -42.335838317871094, -40.29302215576172, -38.25020217895508, -36.2073860168457, -34.16456604003906, -32.12174987792969, -30.07893180847168, -28.036113739013672, -25.993297576904297, -23.95047950744629, -21.90766143798828, -19.864845275878906, -17.822025299072266, -15.779208183288574, -13.736391067504883, -11.693572998046875, -9.650755882263184, -7.607938766479492, -5.565120697021484, -3.522303581237793, -1.4794864654541016, 0.563330888748169, 2.6061482429504395, 4.648965835571289, 6.6917829513549805, 8.734600067138672, 10.77741813659668, 12.820235252380371, 14.863052368164062, 16.90587043762207, 18.948686599731445, 20.991504669189453, 23.034320831298828, 25.077138900756836, 27.119956970214844, 29.16277313232422, 31.205591201782227, 33.248409271240234, 35.29122543334961, 37.33404541015625, 39.376861572265625, 41.419677734375, 43.462493896484375, 45.505313873291016, 47.54813003540039]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 9.0, 15.0, 16.0, 23.0, 27.0, 39.0, 40.0, 35.0, 58.0, 64.0, 56.0, 63.0, 42.0, 76.0, 66.0, 58.0, 52.0, 56.0, 49.0, 28.0, 27.0, 23.0, 23.0, 14.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.677734375, -2.58111572265625, -2.4844970703125, -2.38787841796875, -2.291259765625, -2.19464111328125, -2.0980224609375, -2.00140380859375, -1.90478515625, -1.80816650390625, -1.7115478515625, -1.61492919921875, -1.518310546875, -1.42169189453125, -1.3250732421875, -1.22845458984375, -1.1318359375, -1.03521728515625, -0.9385986328125, -0.84197998046875, -0.745361328125, -0.64874267578125, -0.5521240234375, -0.45550537109375, -0.35888671875, -0.26226806640625, -0.1656494140625, -0.06903076171875, 0.027587890625, 0.12420654296875, 0.2208251953125, 0.31744384765625, 0.4140625, 0.51068115234375, 0.6072998046875, 0.70391845703125, 0.800537109375, 0.89715576171875, 0.9937744140625, 1.09039306640625, 1.18701171875, 1.28363037109375, 1.3802490234375, 1.47686767578125, 1.573486328125, 1.67010498046875, 1.7667236328125, 1.86334228515625, 1.9599609375, 2.05657958984375, 2.1531982421875, 2.24981689453125, 2.346435546875, 2.44305419921875, 2.5396728515625, 2.63629150390625, 2.73291015625, 2.82952880859375, 2.9261474609375, 3.02276611328125, 3.119384765625, 3.21600341796875, 3.3126220703125, 3.40924072265625, 3.505859375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 19.0, 12.0, 26.0, 46.0, 38.0, 51.0, 101.0, 185.0, 304.0, 489.0, 970.0, 2110.0, 5697.0, 21435.0, 140499.0, 2710044.0, 1216418.0, 74188.0, 14342.0, 4146.0, 1494.0, 696.0, 343.0, 188.0, 141.0, 85.0, 64.0, 43.0, 36.0, 13.0, 10.0, 14.0, 10.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8671875, -11.4825439453125, -11.097900390625, -10.7132568359375, -10.32861328125, -9.9439697265625, -9.559326171875, -9.1746826171875, -8.7900390625, -8.4053955078125, -8.020751953125, -7.6361083984375, -7.25146484375, -6.8668212890625, -6.482177734375, -6.0975341796875, -5.712890625, -5.3282470703125, -4.943603515625, -4.5589599609375, -4.17431640625, -3.7896728515625, -3.405029296875, -3.0203857421875, -2.6357421875, -2.2510986328125, -1.866455078125, -1.4818115234375, -1.09716796875, -0.7125244140625, -0.327880859375, 0.0567626953125, 0.44140625, 0.8260498046875, 1.210693359375, 1.5953369140625, 1.97998046875, 2.3646240234375, 2.749267578125, 3.1339111328125, 3.5185546875, 3.9031982421875, 4.287841796875, 4.6724853515625, 5.05712890625, 5.4417724609375, 5.826416015625, 6.2110595703125, 6.595703125, 6.9803466796875, 7.364990234375, 7.7496337890625, 8.13427734375, 8.5189208984375, 8.903564453125, 9.2882080078125, 9.6728515625, 10.0574951171875, 10.442138671875, 10.8267822265625, 11.21142578125, 11.5960693359375, 11.980712890625, 12.3653564453125, 12.75]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 10.0, 6.0, 16.0, 17.0, 39.0, 54.0, 63.0, 97.0, 138.0, 185.0, 271.0, 386.0, 515.0, 551.0, 461.0, 377.0, 260.0, 172.0, 150.0, 80.0, 60.0, 46.0, 29.0, 23.0, 18.0, 11.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.390625, -11.09283447265625, -10.7950439453125, -10.49725341796875, -10.199462890625, -9.90167236328125, -9.6038818359375, -9.30609130859375, -9.00830078125, -8.71051025390625, -8.4127197265625, -8.11492919921875, -7.817138671875, -7.51934814453125, -7.2215576171875, -6.92376708984375, -6.6259765625, -6.32818603515625, -6.0303955078125, -5.73260498046875, -5.434814453125, -5.13702392578125, -4.8392333984375, -4.54144287109375, -4.24365234375, -3.94586181640625, -3.6480712890625, -3.35028076171875, -3.052490234375, -2.75469970703125, -2.4569091796875, -2.15911865234375, -1.861328125, -1.56353759765625, -1.2657470703125, -0.96795654296875, -0.670166015625, -0.37237548828125, -0.0745849609375, 0.22320556640625, 0.52099609375, 0.81878662109375, 1.1165771484375, 1.41436767578125, 1.712158203125, 2.00994873046875, 2.3077392578125, 2.60552978515625, 2.9033203125, 3.20111083984375, 3.4989013671875, 3.79669189453125, 4.094482421875, 4.39227294921875, 4.6900634765625, 4.98785400390625, 5.28564453125, 5.58343505859375, 5.8812255859375, 6.17901611328125, 6.476806640625, 6.77459716796875, 7.0723876953125, 7.37017822265625, 7.66796875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 6.0, 13.0, 25.0, 25.0, 43.0, 71.0, 116.0, 199.0, 330.0, 509.0, 1161.0, 3186.0, 21597.0, 1087839.0, 3027962.0, 43350.0, 4717.0, 1457.0, 703.0, 341.0, 230.0, 119.0, 69.0, 66.0, 30.0, 19.0, 14.0, 11.0, 10.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.78125, -31.7607421875, -30.740234375, -29.7197265625, -28.69921875, -27.6787109375, -26.658203125, -25.6376953125, -24.6171875, -23.5966796875, -22.576171875, -21.5556640625, -20.53515625, -19.5146484375, -18.494140625, -17.4736328125, -16.453125, -15.4326171875, -14.412109375, -13.3916015625, -12.37109375, -11.3505859375, -10.330078125, -9.3095703125, -8.2890625, -7.2685546875, -6.248046875, -5.2275390625, -4.20703125, -3.1865234375, -2.166015625, -1.1455078125, -0.125, 0.8955078125, 1.916015625, 2.9365234375, 3.95703125, 4.9775390625, 5.998046875, 7.0185546875, 8.0390625, 9.0595703125, 10.080078125, 11.1005859375, 12.12109375, 13.1416015625, 14.162109375, 15.1826171875, 16.203125, 17.2236328125, 18.244140625, 19.2646484375, 20.28515625, 21.3056640625, 22.326171875, 23.3466796875, 24.3671875, 25.3876953125, 26.408203125, 27.4287109375, 28.44921875, 29.4697265625, 30.490234375, 31.5107421875, 32.53125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 28.0, 127.0, 301.0, 333.0, 141.0, 62.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-120.14483642578125, -117.35649108886719, -114.56815338134766, -111.77981567382812, -108.99147033691406, -106.203125, -103.41478729248047, -100.62644958496094, -97.83810424804688, -95.04975891113281, -92.26142120361328, -89.47308349609375, -86.68473815917969, -83.89639282226562, -81.1080551147461, -78.31971740722656, -75.5313720703125, -72.74302673339844, -69.9546890258789, -67.16635131835938, -64.37800598144531, -61.589664459228516, -58.80132293701172, -56.01298141479492, -53.224639892578125, -50.43629837036133, -47.64795684814453, -44.859615325927734, -42.07127380371094, -39.28293228149414, -36.494590759277344, -33.70624923706055, -30.91790008544922, -28.129558563232422, -25.341217041015625, -22.552875518798828, -19.76453399658203, -16.976192474365234, -14.187850952148438, -11.39950942993164, -8.611167907714844, -5.822826385498047, -3.03448486328125, -0.24614334106445312, 2.5421981811523438, 5.330539703369141, 8.118881225585938, 10.907222747802734, 13.695564270019531, 16.483905792236328, 19.272247314453125, 22.060588836669922, 24.84893035888672, 27.637271881103516, 30.425613403320312, 33.21395492553711, 36.002296447753906, 38.7906379699707, 41.5789794921875, 44.3673210144043, 47.155662536621094, 49.94400405883789, 52.73234558105469, 55.520687103271484, 58.30902862548828]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 9.0, 7.0, 17.0, 19.0, 19.0, 25.0, 25.0, 25.0, 37.0, 42.0, 25.0, 52.0, 49.0, 56.0, 47.0, 68.0, 43.0, 57.0, 42.0, 40.0, 35.0, 49.0, 41.0, 22.0, 29.0, 26.0, 20.0, 11.0, 19.0, 10.0, 8.0, 6.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.958919525146484, -38.758872985839844, -37.5588264465332, -36.35877990722656, -35.15873718261719, -33.95869064331055, -32.758644104003906, -31.558597564697266, -30.358551025390625, -29.158504486083984, -27.958457946777344, -26.758413314819336, -25.558366775512695, -24.358320236206055, -23.158275604248047, -21.958229064941406, -20.758182525634766, -19.558135986328125, -18.358089447021484, -17.158044815063477, -15.957998275756836, -14.757951736450195, -13.557906150817871, -12.357860565185547, -11.157814025878906, -9.957767486572266, -8.757721900939941, -7.557675838470459, -6.357629776000977, -5.157583713531494, -3.9575376510620117, -2.7574920654296875, -1.5574455261230469, -0.35739946365356445, 0.842646598815918, 2.0426926612854004, 3.242738723754883, 4.442784786224365, 5.642830848693848, 6.842876434326172, 8.042922973632812, 9.242969512939453, 10.443015098571777, 11.643060684204102, 12.843107223510742, 14.043153762817383, 15.243199348449707, 16.44324493408203, 17.643291473388672, 18.843338012695312, 20.043384552001953, 21.24342918395996, 22.4434757232666, 23.643522262573242, 24.84356689453125, 26.04361343383789, 27.24365997314453, 28.443706512451172, 29.643753051757812, 30.84379768371582, 32.043846130371094, 33.24388885498047, 34.44393539428711, 35.64398193359375, 36.84402847290039]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 11.0, 12.0, 18.0, 18.0, 33.0, 23.0, 30.0, 35.0, 39.0, 42.0, 51.0, 49.0, 46.0, 58.0, 48.0, 53.0, 55.0, 50.0, 44.0, 48.0, 36.0, 40.0, 24.0, 23.0, 25.0, 20.0, 16.0, 17.0, 8.0, 2.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4453125, -2.359375, -2.2734375, -2.1875, -2.1015625, -2.015625, -1.9296875, -1.84375, -1.7578125, -1.671875, -1.5859375, -1.5, -1.4140625, -1.328125, -1.2421875, -1.15625, -1.0703125, -0.984375, -0.8984375, -0.8125, -0.7265625, -0.640625, -0.5546875, -0.46875, -0.3828125, -0.296875, -0.2109375, -0.125, -0.0390625, 0.046875, 0.1328125, 0.21875, 0.3046875, 0.390625, 0.4765625, 0.5625, 0.6484375, 0.734375, 0.8203125, 0.90625, 0.9921875, 1.078125, 1.1640625, 1.25, 1.3359375, 1.421875, 1.5078125, 1.59375, 1.6796875, 1.765625, 1.8515625, 1.9375, 2.0234375, 2.109375, 2.1953125, 2.28125, 2.3671875, 2.453125, 2.5390625, 2.625, 2.7109375, 2.796875, 2.8828125, 2.96875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 8.0, 6.0, 14.0, 16.0, 22.0, 42.0, 42.0, 51.0, 71.0, 103.0, 142.0, 225.0, 322.0, 529.0, 884.0, 1431.0, 2400.0, 4305.0, 7995.0, 15463.0, 29674.0, 57031.0, 107705.0, 181675.0, 235497.0, 178967.0, 105655.0, 55694.0, 29226.0, 14976.0, 7870.0, 4261.0, 2333.0, 1410.0, 882.0, 502.0, 359.0, 235.0, 129.0, 115.0, 71.0, 50.0, 47.0, 27.0, 15.0, 20.0, 19.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.39013671875, -0.3773384094238281, -0.36454010009765625, -0.3517417907714844, -0.3389434814453125, -0.3261451721191406, -0.31334686279296875, -0.3005485534667969, -0.287750244140625, -0.2749519348144531, -0.26215362548828125, -0.24935531616210938, -0.2365570068359375, -0.22375869750976562, -0.21096038818359375, -0.19816207885742188, -0.18536376953125, -0.17256546020507812, -0.15976715087890625, -0.14696884155273438, -0.1341705322265625, -0.12137222290039062, -0.10857391357421875, -0.09577560424804688, -0.082977294921875, -0.07017898559570312, -0.05738067626953125, -0.044582366943359375, -0.0317840576171875, -0.018985748291015625, -0.00618743896484375, 0.006610870361328125, 0.0194091796875, 0.032207489013671875, 0.04500579833984375, 0.057804107666015625, 0.0706024169921875, 0.08340072631835938, 0.09619903564453125, 0.10899734497070312, 0.121795654296875, 0.13459396362304688, 0.14739227294921875, 0.16019058227539062, 0.1729888916015625, 0.18578720092773438, 0.19858551025390625, 0.21138381958007812, 0.22418212890625, 0.23698043823242188, 0.24977874755859375, 0.2625770568847656, 0.2753753662109375, 0.2881736755371094, 0.30097198486328125, 0.3137702941894531, 0.326568603515625, 0.3393669128417969, 0.35216522216796875, 0.3649635314941406, 0.3777618408203125, 0.3905601501464844, 0.40335845947265625, 0.4161567687988281, 0.428955078125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 8.0, 7.0, 11.0, 18.0, 16.0, 15.0, 34.0, 24.0, 31.0, 39.0, 29.0, 37.0, 40.0, 35.0, 36.0, 57.0, 48.0, 1066.0, 42.0, 40.0, 37.0, 35.0, 30.0, 33.0, 35.0, 36.0, 22.0, 25.0, 22.0, 17.0, 22.0, 13.0, 14.0, 6.0, 10.0, 11.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.568359375, -1.52252197265625, -1.4766845703125, -1.43084716796875, -1.385009765625, -1.33917236328125, -1.2933349609375, -1.24749755859375, -1.20166015625, -1.15582275390625, -1.1099853515625, -1.06414794921875, -1.018310546875, -0.97247314453125, -0.9266357421875, -0.88079833984375, -0.8349609375, -0.78912353515625, -0.7432861328125, -0.69744873046875, -0.651611328125, -0.60577392578125, -0.5599365234375, -0.51409912109375, -0.46826171875, -0.42242431640625, -0.3765869140625, -0.33074951171875, -0.284912109375, -0.23907470703125, -0.1932373046875, -0.14739990234375, -0.1015625, -0.05572509765625, -0.0098876953125, 0.03594970703125, 0.081787109375, 0.12762451171875, 0.1734619140625, 0.21929931640625, 0.26513671875, 0.31097412109375, 0.3568115234375, 0.40264892578125, 0.448486328125, 0.49432373046875, 0.5401611328125, 0.58599853515625, 0.6318359375, 0.67767333984375, 0.7235107421875, 0.76934814453125, 0.815185546875, 0.86102294921875, 0.9068603515625, 0.95269775390625, 0.99853515625, 1.04437255859375, 1.0902099609375, 1.13604736328125, 1.181884765625, 1.22772216796875, 1.2735595703125, 1.31939697265625, 1.365234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 13.0, 14.0, 30.0, 34.0, 45.0, 67.0, 97.0, 164.0, 244.0, 350.0, 571.0, 919.0, 1389.0, 2003.0, 3135.0, 5070.0, 7678.0, 11961.0, 18538.0, 29104.0, 45075.0, 69260.0, 100979.0, 137419.0, 1205524.0, 141713.0, 106626.0, 72900.0, 48477.0, 31430.0, 19933.0, 12925.0, 8342.0, 5217.0, 3542.0, 2277.0, 1372.0, 936.0, 609.0, 432.0, 250.0, 146.0, 105.0, 81.0, 46.0, 35.0, 17.0, 17.0, 5.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.160400390625, -0.1547870635986328, -0.14917373657226562, -0.14356040954589844, -0.13794708251953125, -0.13233375549316406, -0.12672042846679688, -0.12110710144042969, -0.1154937744140625, -0.10988044738769531, -0.10426712036132812, -0.09865379333496094, -0.09304046630859375, -0.08742713928222656, -0.08181381225585938, -0.07620048522949219, -0.070587158203125, -0.06497383117675781, -0.059360504150390625, -0.05374717712402344, -0.04813385009765625, -0.04252052307128906, -0.036907196044921875, -0.03129386901855469, -0.0256805419921875, -0.020067214965820312, -0.014453887939453125, -0.008840560913085938, -0.00322723388671875, 0.0023860931396484375, 0.007999420166015625, 0.013612747192382812, 0.01922607421875, 0.024839401245117188, 0.030452728271484375, 0.03606605529785156, 0.04167938232421875, 0.04729270935058594, 0.052906036376953125, 0.05851936340332031, 0.0641326904296875, 0.06974601745605469, 0.07535934448242188, 0.08097267150878906, 0.08658599853515625, 0.09219932556152344, 0.09781265258789062, 0.10342597961425781, 0.109039306640625, 0.11465263366699219, 0.12026596069335938, 0.12587928771972656, 0.13149261474609375, 0.13710594177246094, 0.14271926879882812, 0.1483325958251953, 0.1539459228515625, 0.1595592498779297, 0.16517257690429688, 0.17078590393066406, 0.17639923095703125, 0.18201255798339844, 0.18762588500976562, 0.1932392120361328, 0.1988525390625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 12.0, 12.0, 32.0, 54.0, 61.0, 81.0, 136.0, 148.0, 127.0, 95.0, 59.0, 31.0, 18.0, 18.0, 14.0, 16.0, 12.0, 6.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00228118896484375, -0.002206355333328247, -0.002131521701812744, -0.002056688070297241, -0.0019818544387817383, -0.0019070208072662354, -0.0018321871757507324, -0.0017573535442352295, -0.0016825199127197266, -0.0016076862812042236, -0.0015328526496887207, -0.0014580190181732178, -0.0013831853866577148, -0.001308351755142212, -0.001233518123626709, -0.001158684492111206, -0.0010838508605957031, -0.0010090172290802002, -0.0009341835975646973, -0.0008593499660491943, -0.0007845163345336914, -0.0007096827030181885, -0.0006348490715026855, -0.0005600154399871826, -0.0004851818084716797, -0.00041034817695617676, -0.00033551454544067383, -0.0002606809139251709, -0.00018584728240966797, -0.00011101365089416504, -3.618001937866211e-05, 3.865361213684082e-05, 0.00011348724365234375, 0.00018832087516784668, 0.0002631545066833496, 0.00033798813819885254, 0.00041282176971435547, 0.0004876554012298584, 0.0005624890327453613, 0.0006373226642608643, 0.0007121562957763672, 0.0007869899272918701, 0.000861823558807373, 0.000936657190322876, 0.001011490821838379, 0.0010863244533538818, 0.0011611580848693848, 0.0012359917163848877, 0.0013108253479003906, 0.0013856589794158936, 0.0014604926109313965, 0.0015353262424468994, 0.0016101598739624023, 0.0016849935054779053, 0.0017598271369934082, 0.0018346607685089111, 0.001909494400024414, 0.001984328031539917, 0.00205916166305542, 0.002133995294570923, 0.0022088289260864258, 0.0022836625576019287, 0.0023584961891174316, 0.0024333298206329346, 0.0025081634521484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 2.0, 7.0, 7.0, 6.0, 14.0, 13.0, 10.0, 16.0, 21.0, 25.0, 41.0, 38.0, 74.0, 146.0, 166.0, 328.0, 930.0, 82191.0, 961044.0, 2316.0, 451.0, 228.0, 129.0, 72.0, 57.0, 34.0, 44.0, 24.0, 23.0, 16.0, 19.0, 11.0, 5.0, 8.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.039276123046875, -0.03797483444213867, -0.036673545837402344, -0.035372257232666016, -0.03407096862792969, -0.03276968002319336, -0.03146839141845703, -0.030167102813720703, -0.028865814208984375, -0.027564525604248047, -0.02626323699951172, -0.02496194839477539, -0.023660659790039062, -0.022359371185302734, -0.021058082580566406, -0.019756793975830078, -0.01845550537109375, -0.017154216766357422, -0.015852928161621094, -0.014551639556884766, -0.013250350952148438, -0.01194906234741211, -0.010647773742675781, -0.009346485137939453, -0.008045196533203125, -0.006743907928466797, -0.005442619323730469, -0.004141330718994141, -0.0028400421142578125, -0.0015387535095214844, -0.00023746490478515625, 0.0010638236999511719, 0.0023651123046875, 0.003666400909423828, 0.004967689514160156, 0.006268978118896484, 0.0075702667236328125, 0.00887155532836914, 0.010172843933105469, 0.011474132537841797, 0.012775421142578125, 0.014076709747314453, 0.015377998352050781, 0.01667928695678711, 0.017980575561523438, 0.019281864166259766, 0.020583152770996094, 0.021884441375732422, 0.02318572998046875, 0.024487018585205078, 0.025788307189941406, 0.027089595794677734, 0.028390884399414062, 0.02969217300415039, 0.03099346160888672, 0.03229475021362305, 0.033596038818359375, 0.0348973274230957, 0.03619861602783203, 0.03749990463256836, 0.03880119323730469, 0.040102481842041016, 0.041403770446777344, 0.04270505905151367, 0.04400634765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 11.0, 538.0, 460.0, 5.0, 1.0, 1.0], "bins": [-0.030485354363918304, -0.029977165162563324, -0.029468975961208344, -0.028960786759853363, -0.028452597558498383, -0.02794441021978855, -0.02743622101843357, -0.02692803181707859, -0.02641984261572361, -0.02591165341436863, -0.02540346421301365, -0.02489527501165867, -0.024387087672948837, -0.023878898471593857, -0.023370709270238876, -0.022862520068883896, -0.022354330867528915, -0.021846141666173935, -0.021337952464818954, -0.020829763263463974, -0.020321574062108994, -0.019813386723399162, -0.019305197522044182, -0.0187970083206892, -0.01828881911933422, -0.01778062991797924, -0.01727244071662426, -0.01676425151526928, -0.016256064176559448, -0.015747874975204468, -0.015239685773849487, -0.014731496572494507, -0.014223309233784676, -0.013715120032429695, -0.013206930831074715, -0.012698742561042309, -0.012190553359687328, -0.011682364158332348, -0.011174175888299942, -0.010665986686944962, -0.010157797485589981, -0.009649608284235, -0.00914141908288002, -0.008633230812847614, -0.008125041611492634, -0.007616852410137653, -0.00710866367444396, -0.006600474938750267, -0.006092285271733999, -0.005584096536040306, -0.005075907334685326, -0.004567718133330345, -0.004059529397636652, -0.003551340429112315, -0.0030431514605879784, -0.0025349624920636415, -0.0020267735235393047, -0.001518584555014968, -0.001010395586490631, -0.0005022066179662943, 5.982350558042526e-06, 0.0005141713190823793, 0.0010223602876067162, 0.001530549256131053, 0.00203873822465539]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 6.0, 9.0, 14.0, 18.0, 27.0, 27.0, 41.0, 23.0, 36.0, 42.0, 47.0, 46.0, 49.0, 53.0, 63.0, 42.0, 53.0, 41.0, 58.0, 42.0, 44.0, 32.0, 32.0, 33.0, 28.0, 24.0, 9.0, 16.0, 15.0, 11.0, 8.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014300942420959473, -0.0013913484290242195, -0.0013526026159524918, -0.001313856802880764, -0.0012751109898090363, -0.0012363651767373085, -0.0011976193636655807, -0.001158873550593853, -0.0011201277375221252, -0.0010813819244503975, -0.0010426361113786697, -0.001003890298306942, -0.0009651444852352142, -0.0009263986721634865, -0.0008876528590917587, -0.000848907046020031, -0.0008101612329483032, -0.0007714154198765755, -0.0007326696068048477, -0.00069392379373312, -0.0006551779806613922, -0.0006164321675896645, -0.0005776863545179367, -0.000538940541446209, -0.0005001947283744812, -0.00046144891530275345, -0.0004227031022310257, -0.00038395728915929794, -0.0003452114760875702, -0.00030646566301584244, -0.0002677198499441147, -0.00022897403687238693, -0.00019022822380065918, -0.00015148241072893143, -0.00011273659765720367, -7.399078458547592e-05, -3.524497151374817e-05, 3.5008415579795837e-06, 4.2246654629707336e-05, 8.099246770143509e-05, 0.00011973828077316284, 0.0001584840938448906, 0.00019722990691661835, 0.0002359757199883461, 0.00027472153306007385, 0.0003134673461318016, 0.00035221315920352936, 0.0003909589722752571, 0.00042970478534698486, 0.0004684505984187126, 0.0005071964114904404, 0.0005459422245621681, 0.0005846880376338959, 0.0006234338507056236, 0.0006621796637773514, 0.0007009254768490791, 0.0007396712899208069, 0.0007784171029925346, 0.0008171629160642624, 0.0008559087291359901, 0.0008946545422077179, 0.0009334003552794456, 0.0009721461683511734, 0.0010108919814229012, 0.001049637794494629]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 11.0, 12.0, 18.0, 18.0, 33.0, 23.0, 30.0, 35.0, 40.0, 41.0, 51.0, 49.0, 46.0, 58.0, 48.0, 53.0, 55.0, 50.0, 44.0, 48.0, 36.0, 40.0, 24.0, 23.0, 25.0, 20.0, 16.0, 17.0, 8.0, 2.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4453125, -2.359375, -2.2734375, -2.1875, -2.1015625, -2.015625, -1.9296875, -1.84375, -1.7578125, -1.671875, -1.5859375, -1.5, -1.4140625, -1.328125, -1.2421875, -1.15625, -1.0703125, -0.984375, -0.8984375, -0.8125, -0.7265625, -0.640625, -0.5546875, -0.46875, -0.3828125, -0.296875, -0.2109375, -0.125, -0.0390625, 0.046875, 0.1328125, 0.21875, 0.3046875, 0.390625, 0.4765625, 0.5625, 0.6484375, 0.734375, 0.8203125, 0.90625, 0.9921875, 1.078125, 1.1640625, 1.25, 1.3359375, 1.421875, 1.5078125, 1.59375, 1.6796875, 1.765625, 1.8515625, 1.9375, 2.0234375, 2.109375, 2.1953125, 2.28125, 2.3671875, 2.453125, 2.5390625, 2.625, 2.7109375, 2.796875, 2.8828125, 2.96875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 2.0, 5.0, 7.0, 10.0, 8.0, 10.0, 14.0, 24.0, 31.0, 38.0, 68.0, 76.0, 134.0, 186.0, 273.0, 384.0, 563.0, 888.0, 1241.0, 1969.0, 3037.0, 5092.0, 8990.0, 17954.0, 44195.0, 135317.0, 378143.0, 290944.0, 93054.0, 32445.0, 14050.0, 7151.0, 4352.0, 2738.0, 1726.0, 1112.0, 748.0, 501.0, 323.0, 204.0, 158.0, 97.0, 77.0, 63.0, 45.0, 32.0, 31.0, 13.0, 13.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.3125, -6.1009521484375, -5.889404296875, -5.6778564453125, -5.46630859375, -5.2547607421875, -5.043212890625, -4.8316650390625, -4.6201171875, -4.4085693359375, -4.197021484375, -3.9854736328125, -3.77392578125, -3.5623779296875, -3.350830078125, -3.1392822265625, -2.927734375, -2.7161865234375, -2.504638671875, -2.2930908203125, -2.08154296875, -1.8699951171875, -1.658447265625, -1.4468994140625, -1.2353515625, -1.0238037109375, -0.812255859375, -0.6007080078125, -0.38916015625, -0.1776123046875, 0.033935546875, 0.2454833984375, 0.45703125, 0.6685791015625, 0.880126953125, 1.0916748046875, 1.30322265625, 1.5147705078125, 1.726318359375, 1.9378662109375, 2.1494140625, 2.3609619140625, 2.572509765625, 2.7840576171875, 2.99560546875, 3.2071533203125, 3.418701171875, 3.6302490234375, 3.841796875, 4.0533447265625, 4.264892578125, 4.4764404296875, 4.68798828125, 4.8995361328125, 5.111083984375, 5.3226318359375, 5.5341796875, 5.7457275390625, 5.957275390625, 6.1688232421875, 6.38037109375, 6.5919189453125, 6.803466796875, 7.0150146484375, 7.2265625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 4.0, 10.0, 8.0, 9.0, 12.0, 11.0, 11.0, 14.0, 13.0, 23.0, 15.0, 21.0, 30.0, 21.0, 30.0, 43.0, 44.0, 42.0, 56.0, 102.0, 162.0, 287.0, 1312.0, 192.0, 116.0, 87.0, 47.0, 34.0, 45.0, 30.0, 31.0, 26.0, 22.0, 26.0, 13.0, 19.0, 11.0, 14.0, 13.0, 13.0, 8.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.84375, -5.64349365234375, -5.4432373046875, -5.24298095703125, -5.042724609375, -4.84246826171875, -4.6422119140625, -4.44195556640625, -4.24169921875, -4.04144287109375, -3.8411865234375, -3.64093017578125, -3.440673828125, -3.24041748046875, -3.0401611328125, -2.83990478515625, -2.6396484375, -2.43939208984375, -2.2391357421875, -2.03887939453125, -1.838623046875, -1.63836669921875, -1.4381103515625, -1.23785400390625, -1.03759765625, -0.83734130859375, -0.6370849609375, -0.43682861328125, -0.236572265625, -0.03631591796875, 0.1639404296875, 0.36419677734375, 0.564453125, 0.76470947265625, 0.9649658203125, 1.16522216796875, 1.365478515625, 1.56573486328125, 1.7659912109375, 1.96624755859375, 2.16650390625, 2.36676025390625, 2.5670166015625, 2.76727294921875, 2.967529296875, 3.16778564453125, 3.3680419921875, 3.56829833984375, 3.7685546875, 3.96881103515625, 4.1690673828125, 4.36932373046875, 4.569580078125, 4.76983642578125, 4.9700927734375, 5.17034912109375, 5.37060546875, 5.57086181640625, 5.7711181640625, 5.97137451171875, 6.171630859375, 6.37188720703125, 6.5721435546875, 6.77239990234375, 6.97265625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 9.0, 8.0, 14.0, 16.0, 17.0, 23.0, 13.0, 17.0, 22.0, 25.0, 44.0, 34.0, 69.0, 112.0, 245.0, 702.0, 7309.0, 2143900.0, 986852.0, 4968.0, 591.0, 212.0, 138.0, 60.0, 44.0, 33.0, 32.0, 22.0, 16.0, 19.0, 16.0, 16.0, 22.0, 6.0, 9.0, 8.0, 11.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 6.0], "bins": [-28.765625, -27.96533203125, -27.1650390625, -26.36474609375, -25.564453125, -24.76416015625, -23.9638671875, -23.16357421875, -22.36328125, -21.56298828125, -20.7626953125, -19.96240234375, -19.162109375, -18.36181640625, -17.5615234375, -16.76123046875, -15.9609375, -15.16064453125, -14.3603515625, -13.56005859375, -12.759765625, -11.95947265625, -11.1591796875, -10.35888671875, -9.55859375, -8.75830078125, -7.9580078125, -7.15771484375, -6.357421875, -5.55712890625, -4.7568359375, -3.95654296875, -3.15625, -2.35595703125, -1.5556640625, -0.75537109375, 0.044921875, 0.84521484375, 1.6455078125, 2.44580078125, 3.24609375, 4.04638671875, 4.8466796875, 5.64697265625, 6.447265625, 7.24755859375, 8.0478515625, 8.84814453125, 9.6484375, 10.44873046875, 11.2490234375, 12.04931640625, 12.849609375, 13.64990234375, 14.4501953125, 15.25048828125, 16.05078125, 16.85107421875, 17.6513671875, 18.45166015625, 19.251953125, 20.05224609375, 20.8525390625, 21.65283203125, 22.453125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 134.0, 807.0, 69.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.606422424316406, -37.03171920776367, -33.4570198059082, -29.88231658935547, -26.307615280151367, -22.732913970947266, -19.15821075439453, -15.58350944519043, -12.008808135986328, -8.434106826782227, -4.859404563903809, -1.2847023010253906, 2.289999008178711, 5.8647003173828125, 9.439403533935547, 13.014104843139648, 16.58880615234375, 20.16350746154785, 23.738208770751953, 27.312911987304688, 30.88761329650879, 34.46231460571289, 38.037017822265625, 41.611717224121094, 45.18642044067383, 48.76112365722656, 52.33582305908203, 55.910526275634766, 59.4852294921875, 63.05992889404297, 66.63462829589844, 70.20933532714844, 73.78404235839844, 77.3587417602539, 80.9334487915039, 84.50814819335938, 88.08284759521484, 91.65754699707031, 95.23225402832031, 98.80695343017578, 102.38165283203125, 105.95635223388672, 109.53105926513672, 113.10575866699219, 116.68045806884766, 120.25515747070312, 123.82986450195312, 127.4045639038086, 130.97927856445312, 134.55398559570312, 138.12867736816406, 141.70338439941406, 145.27809143066406, 148.852783203125, 152.427490234375, 156.002197265625, 159.57688903808594, 163.15159606933594, 166.72628784179688, 170.30099487304688, 173.87570190429688, 177.4503936767578, 181.0251007080078, 184.5998077392578, 188.17449951171875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 10.0, 10.0, 12.0, 21.0, 18.0, 13.0, 39.0, 25.0, 27.0, 33.0, 27.0, 37.0, 42.0, 44.0, 48.0, 36.0, 32.0, 43.0, 46.0, 51.0, 38.0, 35.0, 32.0, 16.0, 32.0, 26.0, 22.0, 19.0, 28.0, 12.0, 21.0, 18.0, 15.0, 7.0, 7.0, 6.0, 4.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-23.8145694732666, -23.078014373779297, -22.341461181640625, -21.60490608215332, -20.868350982666016, -20.131797790527344, -19.39524269104004, -18.658687591552734, -17.922134399414062, -17.185579299926758, -16.449026107788086, -15.712471008300781, -14.975915908813477, -14.239361763000488, -13.5028076171875, -12.766252517700195, -12.02969741821289, -11.293143272399902, -10.556588172912598, -9.82003402709961, -9.083478927612305, -8.346924781799316, -7.610370635986328, -6.873816013336182, -6.137261390686035, -5.400706768035889, -4.664152145385742, -3.927597999572754, -3.1910433769226074, -2.454488754272461, -1.7179346084594727, -0.9813799858093262, -0.24482345581054688, 0.49173104763031006, 1.228285551071167, 1.9648399353027344, 2.701394557952881, 3.4379491806030273, 4.174503326416016, 4.911057949066162, 5.647612571716309, 6.384167194366455, 7.120721817016602, 7.85727596282959, 8.593830108642578, 9.330385208129883, 10.066939353942871, 10.80349349975586, 11.540048599243164, 12.276602745056152, 13.013157844543457, 13.749711990356445, 14.48626708984375, 15.222821235656738, 15.959375381469727, 16.69593048095703, 17.432483673095703, 18.169038772583008, 18.90559196472168, 19.642147064208984, 20.37870216369629, 21.115257263183594, 21.851810455322266, 22.58836555480957, 23.324920654296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 6.0, 13.0, 16.0, 19.0, 22.0, 22.0, 29.0, 30.0, 34.0, 41.0, 54.0, 54.0, 46.0, 54.0, 59.0, 41.0, 58.0, 53.0, 38.0, 46.0, 43.0, 39.0, 34.0, 29.0, 30.0, 21.0, 12.0, 15.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.91387939453125, -2.8199462890625, -2.72601318359375, -2.632080078125, -2.53814697265625, -2.4442138671875, -2.35028076171875, -2.25634765625, -2.16241455078125, -2.0684814453125, -1.97454833984375, -1.880615234375, -1.78668212890625, -1.6927490234375, -1.59881591796875, -1.5048828125, -1.41094970703125, -1.3170166015625, -1.22308349609375, -1.129150390625, -1.03521728515625, -0.9412841796875, -0.84735107421875, -0.75341796875, -0.65948486328125, -0.5655517578125, -0.47161865234375, -0.377685546875, -0.28375244140625, -0.1898193359375, -0.09588623046875, -0.001953125, 0.09197998046875, 0.1859130859375, 0.27984619140625, 0.373779296875, 0.46771240234375, 0.5616455078125, 0.65557861328125, 0.74951171875, 0.84344482421875, 0.9373779296875, 1.03131103515625, 1.125244140625, 1.21917724609375, 1.3131103515625, 1.40704345703125, 1.5009765625, 1.59490966796875, 1.6888427734375, 1.78277587890625, 1.876708984375, 1.97064208984375, 2.0645751953125, 2.15850830078125, 2.25244140625, 2.34637451171875, 2.4403076171875, 2.53424072265625, 2.628173828125, 2.72210693359375, 2.8160400390625, 2.90997314453125, 3.00390625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 15.0, 16.0, 22.0, 37.0, 59.0, 70.0, 119.0, 153.0, 230.0, 336.0, 516.0, 1094.0, 2519.0, 8697.0, 44155.0, 467351.0, 3195936.0, 418566.0, 41395.0, 8218.0, 2359.0, 944.0, 457.0, 299.0, 197.0, 135.0, 98.0, 61.0, 50.0, 32.0, 28.0, 26.0, 21.0, 11.0, 11.0, 7.0, 3.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.046875, -10.6844482421875, -10.322021484375, -9.9595947265625, -9.59716796875, -9.2347412109375, -8.872314453125, -8.5098876953125, -8.1474609375, -7.7850341796875, -7.422607421875, -7.0601806640625, -6.69775390625, -6.3353271484375, -5.972900390625, -5.6104736328125, -5.248046875, -4.8856201171875, -4.523193359375, -4.1607666015625, -3.79833984375, -3.4359130859375, -3.073486328125, -2.7110595703125, -2.3486328125, -1.9862060546875, -1.623779296875, -1.2613525390625, -0.89892578125, -0.5364990234375, -0.174072265625, 0.1883544921875, 0.55078125, 0.9132080078125, 1.275634765625, 1.6380615234375, 2.00048828125, 2.3629150390625, 2.725341796875, 3.0877685546875, 3.4501953125, 3.8126220703125, 4.175048828125, 4.5374755859375, 4.89990234375, 5.2623291015625, 5.624755859375, 5.9871826171875, 6.349609375, 6.7120361328125, 7.074462890625, 7.4368896484375, 7.79931640625, 8.1617431640625, 8.524169921875, 8.8865966796875, 9.2490234375, 9.6114501953125, 9.973876953125, 10.3363037109375, 10.69873046875, 11.0611572265625, 11.423583984375, 11.7860107421875, 12.1484375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 9.0, 11.0, 10.0, 31.0, 37.0, 57.0, 76.0, 89.0, 128.0, 208.0, 282.0, 389.0, 486.0, 531.0, 456.0, 391.0, 262.0, 179.0, 147.0, 80.0, 66.0, 39.0, 30.0, 25.0, 16.0, 8.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7265625, -9.426513671875, -9.12646484375, -8.826416015625, -8.5263671875, -8.226318359375, -7.92626953125, -7.626220703125, -7.326171875, -7.026123046875, -6.72607421875, -6.426025390625, -6.1259765625, -5.825927734375, -5.52587890625, -5.225830078125, -4.92578125, -4.625732421875, -4.32568359375, -4.025634765625, -3.7255859375, -3.425537109375, -3.12548828125, -2.825439453125, -2.525390625, -2.225341796875, -1.92529296875, -1.625244140625, -1.3251953125, -1.025146484375, -0.72509765625, -0.425048828125, -0.125, 0.175048828125, 0.47509765625, 0.775146484375, 1.0751953125, 1.375244140625, 1.67529296875, 1.975341796875, 2.275390625, 2.575439453125, 2.87548828125, 3.175537109375, 3.4755859375, 3.775634765625, 4.07568359375, 4.375732421875, 4.67578125, 4.975830078125, 5.27587890625, 5.575927734375, 5.8759765625, 6.176025390625, 6.47607421875, 6.776123046875, 7.076171875, 7.376220703125, 7.67626953125, 7.976318359375, 8.2763671875, 8.576416015625, 8.87646484375, 9.176513671875, 9.4765625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 11.0, 20.0, 21.0, 27.0, 45.0, 87.0, 150.0, 250.0, 479.0, 1013.0, 2619.0, 8860.0, 45050.0, 437731.0, 3009809.0, 614076.0, 58242.0, 10537.0, 2963.0, 1102.0, 561.0, 279.0, 152.0, 68.0, 51.0, 25.0, 15.0, 14.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.053466796875, -16.51318359375, -15.972900390625, -15.4326171875, -14.892333984375, -14.35205078125, -13.811767578125, -13.271484375, -12.731201171875, -12.19091796875, -11.650634765625, -11.1103515625, -10.570068359375, -10.02978515625, -9.489501953125, -8.94921875, -8.408935546875, -7.86865234375, -7.328369140625, -6.7880859375, -6.247802734375, -5.70751953125, -5.167236328125, -4.626953125, -4.086669921875, -3.54638671875, -3.006103515625, -2.4658203125, -1.925537109375, -1.38525390625, -0.844970703125, -0.3046875, 0.235595703125, 0.77587890625, 1.316162109375, 1.8564453125, 2.396728515625, 2.93701171875, 3.477294921875, 4.017578125, 4.557861328125, 5.09814453125, 5.638427734375, 6.1787109375, 6.718994140625, 7.25927734375, 7.799560546875, 8.33984375, 8.880126953125, 9.42041015625, 9.960693359375, 10.5009765625, 11.041259765625, 11.58154296875, 12.121826171875, 12.662109375, 13.202392578125, 13.74267578125, 14.282958984375, 14.8232421875, 15.363525390625, 15.90380859375, 16.444091796875, 16.984375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 43.0, 181.0, 365.0, 299.0, 98.0, 18.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.43085861206055, -40.977272033691406, -37.523685455322266, -34.070098876953125, -30.616514205932617, -27.162927627563477, -23.70934295654297, -20.255756378173828, -16.802169799804688, -13.348583221435547, -9.894997596740723, -6.441411972045898, -2.987825393676758, 0.4657611846923828, 3.9193458557128906, 7.372932434082031, 10.826519012451172, 14.280105590820312, 17.733692169189453, 21.18727684020996, 24.6408634185791, 28.094449996948242, 31.54803466796875, 35.00162124633789, 38.45520782470703, 41.90879440307617, 45.36238098144531, 48.81596374511719, 52.269554138183594, 55.72313690185547, 59.17672348022461, 62.63031005859375, 66.08389282226562, 69.5374755859375, 72.9910659790039, 76.44464874267578, 79.89823913574219, 83.35182189941406, 86.80540466308594, 90.25899505615234, 93.71258544921875, 97.16616821289062, 100.61975860595703, 104.0733413696289, 107.52693176269531, 110.98051452636719, 114.43409729003906, 117.88768768310547, 121.34127044677734, 124.79485321044922, 128.24844360351562, 131.7020263671875, 135.15560913085938, 138.6092071533203, 142.0627899169922, 145.51637268066406, 148.96995544433594, 152.4235382080078, 155.8771209716797, 159.33071899414062, 162.7843017578125, 166.23788452148438, 169.69146728515625, 173.14505004882812, 176.59864807128906]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 13.0, 6.0, 5.0, 6.0, 11.0, 17.0, 14.0, 24.0, 21.0, 26.0, 26.0, 32.0, 29.0, 42.0, 45.0, 33.0, 43.0, 36.0, 39.0, 28.0, 51.0, 44.0, 43.0, 45.0, 44.0, 27.0, 29.0, 28.0, 26.0, 27.0, 26.0, 17.0, 21.0, 15.0, 19.0, 11.0, 6.0, 6.0, 4.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.333749771118164, -25.468366622924805, -24.602985382080078, -23.73760223388672, -22.87221908569336, -22.0068359375, -21.14145278930664, -20.276071548461914, -19.410688400268555, -18.545305252075195, -17.67992401123047, -16.81454086303711, -15.94915771484375, -15.08377456665039, -14.218392372131348, -13.353010177612305, -12.487627029418945, -11.622243881225586, -10.756861686706543, -9.8914794921875, -9.02609634399414, -8.160713195800781, -7.295331001281738, -6.429948329925537, -5.564565658569336, -4.699182987213135, -3.8338003158569336, -2.9684176445007324, -2.1030349731445312, -1.23765230178833, -0.3722696304321289, 0.49311304092407227, 1.3584976196289062, 2.2238802909851074, 3.0892629623413086, 3.9546456336975098, 4.820028305053711, 5.685410976409912, 6.550793647766113, 7.4161763191223145, 8.281558990478516, 9.146942138671875, 10.012324333190918, 10.877706527709961, 11.74308967590332, 12.60847282409668, 13.473855018615723, 14.339237213134766, 15.204620361328125, 16.070003509521484, 16.935386657714844, 17.80076789855957, 18.66615104675293, 19.53153419494629, 20.396915435791016, 21.262298583984375, 22.127681732177734, 22.993064880371094, 23.858448028564453, 24.72382926940918, 25.58921241760254, 26.4545955657959, 27.319976806640625, 28.185359954833984, 29.050743103027344]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 10.0, 15.0, 21.0, 18.0, 17.0, 34.0, 29.0, 27.0, 17.0, 41.0, 40.0, 41.0, 45.0, 49.0, 38.0, 42.0, 42.0, 44.0, 44.0, 40.0, 41.0, 28.0, 25.0, 25.0, 22.0, 30.0, 25.0, 26.0, 20.0, 17.0, 17.0, 8.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.814453125, -2.735565185546875, -2.65667724609375, -2.577789306640625, -2.4989013671875, -2.420013427734375, -2.34112548828125, -2.262237548828125, -2.183349609375, -2.104461669921875, -2.02557373046875, -1.946685791015625, -1.8677978515625, -1.788909912109375, -1.71002197265625, -1.631134033203125, -1.55224609375, -1.473358154296875, -1.39447021484375, -1.315582275390625, -1.2366943359375, -1.157806396484375, -1.07891845703125, -1.000030517578125, -0.921142578125, -0.842254638671875, -0.76336669921875, -0.684478759765625, -0.6055908203125, -0.526702880859375, -0.44781494140625, -0.368927001953125, -0.2900390625, -0.211151123046875, -0.13226318359375, -0.053375244140625, 0.0255126953125, 0.104400634765625, 0.18328857421875, 0.262176513671875, 0.341064453125, 0.419952392578125, 0.49884033203125, 0.577728271484375, 0.6566162109375, 0.735504150390625, 0.81439208984375, 0.893280029296875, 0.97216796875, 1.051055908203125, 1.12994384765625, 1.208831787109375, 1.2877197265625, 1.366607666015625, 1.44549560546875, 1.524383544921875, 1.603271484375, 1.682159423828125, 1.76104736328125, 1.839935302734375, 1.9188232421875, 1.997711181640625, 2.07659912109375, 2.155487060546875, 2.234375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 2.0, 9.0, 17.0, 20.0, 27.0, 34.0, 49.0, 87.0, 108.0, 219.0, 328.0, 497.0, 849.0, 1446.0, 2564.0, 4425.0, 8127.0, 15402.0, 29431.0, 56819.0, 109027.0, 188255.0, 240770.0, 178025.0, 100909.0, 52380.0, 27038.0, 14047.0, 7531.0, 4173.0, 2346.0, 1391.0, 818.0, 500.0, 338.0, 178.0, 140.0, 83.0, 47.0, 42.0, 17.0, 12.0, 11.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.476806640625, -0.46254730224609375, -0.4482879638671875, -0.43402862548828125, -0.419769287109375, -0.40550994873046875, -0.3912506103515625, -0.37699127197265625, -0.36273193359375, -0.34847259521484375, -0.3342132568359375, -0.31995391845703125, -0.305694580078125, -0.29143524169921875, -0.2771759033203125, -0.26291656494140625, -0.2486572265625, -0.23439788818359375, -0.2201385498046875, -0.20587921142578125, -0.191619873046875, -0.17736053466796875, -0.1631011962890625, -0.14884185791015625, -0.13458251953125, -0.12032318115234375, -0.1060638427734375, -0.09180450439453125, -0.077545166015625, -0.06328582763671875, -0.0490264892578125, -0.03476715087890625, -0.0205078125, -0.00624847412109375, 0.0080108642578125, 0.02227020263671875, 0.036529541015625, 0.05078887939453125, 0.0650482177734375, 0.07930755615234375, 0.09356689453125, 0.10782623291015625, 0.1220855712890625, 0.13634490966796875, 0.150604248046875, 0.16486358642578125, 0.1791229248046875, 0.19338226318359375, 0.2076416015625, 0.22190093994140625, 0.2361602783203125, 0.25041961669921875, 0.264678955078125, 0.27893829345703125, 0.2931976318359375, 0.30745697021484375, 0.32171630859375, 0.33597564697265625, 0.3502349853515625, 0.36449432373046875, 0.378753662109375, 0.39301300048828125, 0.4072723388671875, 0.42153167724609375, 0.435791015625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 9.0, 5.0, 8.0, 6.0, 14.0, 8.0, 8.0, 6.0, 13.0, 14.0, 26.0, 18.0, 33.0, 26.0, 40.0, 34.0, 27.0, 39.0, 41.0, 33.0, 31.0, 36.0, 1065.0, 53.0, 38.0, 26.0, 37.0, 43.0, 32.0, 38.0, 25.0, 24.0, 18.0, 20.0, 22.0, 16.0, 18.0, 9.0, 5.0, 11.0, 8.0, 7.0, 5.0, 6.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.6396484375, -1.591278076171875, -1.54290771484375, -1.494537353515625, -1.4461669921875, -1.397796630859375, -1.34942626953125, -1.301055908203125, -1.252685546875, -1.204315185546875, -1.15594482421875, -1.107574462890625, -1.0592041015625, -1.010833740234375, -0.96246337890625, -0.914093017578125, -0.86572265625, -0.817352294921875, -0.76898193359375, -0.720611572265625, -0.6722412109375, -0.623870849609375, -0.57550048828125, -0.527130126953125, -0.478759765625, -0.430389404296875, -0.38201904296875, -0.333648681640625, -0.2852783203125, -0.236907958984375, -0.18853759765625, -0.140167236328125, -0.091796875, -0.043426513671875, 0.00494384765625, 0.053314208984375, 0.1016845703125, 0.150054931640625, 0.19842529296875, 0.246795654296875, 0.295166015625, 0.343536376953125, 0.39190673828125, 0.440277099609375, 0.4886474609375, 0.537017822265625, 0.58538818359375, 0.633758544921875, 0.68212890625, 0.730499267578125, 0.77886962890625, 0.827239990234375, 0.8756103515625, 0.923980712890625, 0.97235107421875, 1.020721435546875, 1.069091796875, 1.117462158203125, 1.16583251953125, 1.214202880859375, 1.2625732421875, 1.310943603515625, 1.35931396484375, 1.407684326171875, 1.4560546875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 12.0, 14.0, 27.0, 36.0, 56.0, 95.0, 162.0, 228.0, 353.0, 587.0, 865.0, 1320.0, 2133.0, 3634.0, 5748.0, 9476.0, 15573.0, 26160.0, 43855.0, 70881.0, 111229.0, 161393.0, 1223059.0, 150303.0, 103540.0, 65209.0, 39774.0, 23931.0, 14494.0, 8661.0, 5436.0, 3209.0, 2089.0, 1297.0, 804.0, 514.0, 355.0, 207.0, 129.0, 101.0, 66.0, 30.0, 16.0, 21.0, 18.0, 10.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.214111328125, -0.2068328857421875, -0.199554443359375, -0.1922760009765625, -0.18499755859375, -0.1777191162109375, -0.170440673828125, -0.1631622314453125, -0.1558837890625, -0.1486053466796875, -0.141326904296875, -0.1340484619140625, -0.12677001953125, -0.1194915771484375, -0.112213134765625, -0.1049346923828125, -0.09765625, -0.0903778076171875, -0.083099365234375, -0.0758209228515625, -0.06854248046875, -0.0612640380859375, -0.053985595703125, -0.0467071533203125, -0.0394287109375, -0.0321502685546875, -0.024871826171875, -0.0175933837890625, -0.01031494140625, -0.0030364990234375, 0.004241943359375, 0.0115203857421875, 0.018798828125, 0.0260772705078125, 0.033355712890625, 0.0406341552734375, 0.04791259765625, 0.0551910400390625, 0.062469482421875, 0.0697479248046875, 0.0770263671875, 0.0843048095703125, 0.091583251953125, 0.0988616943359375, 0.10614013671875, 0.1134185791015625, 0.120697021484375, 0.1279754638671875, 0.13525390625, 0.1425323486328125, 0.149810791015625, 0.1570892333984375, 0.16436767578125, 0.1716461181640625, 0.178924560546875, 0.1862030029296875, 0.1934814453125, 0.2007598876953125, 0.208038330078125, 0.2153167724609375, 0.22259521484375, 0.2298736572265625, 0.237152099609375, 0.2444305419921875, 0.251708984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 7.0, 9.0, 10.0, 28.0, 29.0, 41.0, 45.0, 46.0, 66.0, 82.0, 126.0, 107.0, 87.0, 59.0, 58.0, 44.0, 30.0, 40.0, 14.0, 11.0, 13.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008209228515625, -0.007926106452941895, -0.007642984390258789, -0.007359862327575684, -0.007076740264892578, -0.006793618202209473, -0.006510496139526367, -0.006227374076843262, -0.005944252014160156, -0.005661129951477051, -0.005378007888793945, -0.00509488582611084, -0.004811763763427734, -0.004528641700744629, -0.0042455196380615234, -0.003962397575378418, -0.0036792755126953125, -0.003396153450012207, -0.0031130313873291016, -0.002829909324645996, -0.0025467872619628906, -0.002263665199279785, -0.0019805431365966797, -0.0016974210739135742, -0.0014142990112304688, -0.0011311769485473633, -0.0008480548858642578, -0.0005649328231811523, -0.0002818107604980469, 1.3113021850585938e-06, 0.00028443336486816406, 0.0005675554275512695, 0.000850677490234375, 0.0011337995529174805, 0.001416921615600586, 0.0017000436782836914, 0.001983165740966797, 0.0022662878036499023, 0.002549409866333008, 0.0028325319290161133, 0.0031156539916992188, 0.0033987760543823242, 0.0036818981170654297, 0.003965020179748535, 0.004248142242431641, 0.004531264305114746, 0.0048143863677978516, 0.005097508430480957, 0.0053806304931640625, 0.005663752555847168, 0.0059468746185302734, 0.006229996681213379, 0.006513118743896484, 0.00679624080657959, 0.007079362869262695, 0.007362484931945801, 0.007645606994628906, 0.007928729057312012, 0.008211851119995117, 0.008494973182678223, 0.008778095245361328, 0.009061217308044434, 0.009344339370727539, 0.009627461433410645, 0.00991058349609375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 6.0, 7.0, 12.0, 26.0, 15.0, 30.0, 43.0, 55.0, 76.0, 112.0, 142.0, 196.0, 318.0, 928.0, 165053.0, 879136.0, 1261.0, 358.0, 191.0, 168.0, 105.0, 70.0, 59.0, 39.0, 35.0, 20.0, 15.0, 17.0, 12.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1343994140625, -0.1297779083251953, -0.12515640258789062, -0.12053489685058594, -0.11591339111328125, -0.11129188537597656, -0.10667037963867188, -0.10204887390136719, -0.0974273681640625, -0.09280586242675781, -0.08818435668945312, -0.08356285095214844, -0.07894134521484375, -0.07431983947753906, -0.06969833374023438, -0.06507682800292969, -0.060455322265625, -0.05583381652832031, -0.051212310791015625, -0.04659080505371094, -0.04196929931640625, -0.03734779357910156, -0.032726287841796875, -0.028104782104492188, -0.0234832763671875, -0.018861770629882812, -0.014240264892578125, -0.009618759155273438, -0.00499725341796875, -0.0003757476806640625, 0.004245758056640625, 0.008867263793945312, 0.01348876953125, 0.018110275268554688, 0.022731781005859375, 0.027353286743164062, 0.03197479248046875, 0.03659629821777344, 0.041217803955078125, 0.04583930969238281, 0.0504608154296875, 0.05508232116699219, 0.059703826904296875, 0.06432533264160156, 0.06894683837890625, 0.07356834411621094, 0.07818984985351562, 0.08281135559082031, 0.087432861328125, 0.09205436706542969, 0.09667587280273438, 0.10129737854003906, 0.10591888427734375, 0.11054039001464844, 0.11516189575195312, 0.11978340148925781, 0.1244049072265625, 0.1290264129638672, 0.13364791870117188, 0.13826942443847656, 0.14289093017578125, 0.14751243591308594, 0.15213394165039062, 0.1567554473876953, 0.161376953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 44.0, 974.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21586118638515472, -0.21063318848609924, -0.20540520548820496, -0.20017720758914948, -0.1949492245912552, -0.1897212266921997, -0.18449324369430542, -0.17926524579524994, -0.17403726279735565, -0.16880926489830017, -0.16358128190040588, -0.1583532840013504, -0.15312530100345612, -0.14789730310440063, -0.14266932010650635, -0.13744132220745087, -0.13221332430839539, -0.1269853264093399, -0.12175734341144562, -0.11652935296297073, -0.11130136251449585, -0.10607337206602097, -0.10084538161754608, -0.0956173837184906, -0.09038940072059631, -0.08516141027212143, -0.07993341982364655, -0.07470542937517166, -0.06947743892669678, -0.0642494484782219, -0.05902145430445671, -0.05379346385598183, -0.04856547713279724, -0.04333748668432236, -0.03810949623584747, -0.03288150578737259, -0.027653513476252556, -0.022425523027777672, -0.01719753071665764, -0.011969540268182755, -0.0067415498197078705, -0.0015135589055716991, 0.003714432008564472, 0.00894242338836193, 0.014170413836836815, 0.0193984042853117, 0.024626396596431732, 0.029854387044906616, 0.0350823774933815, 0.040310367941856384, 0.04553835839033127, 0.05076634883880615, 0.055994339287281036, 0.06122232973575592, 0.0664503276348114, 0.07167831063270569, 0.07690630853176117, 0.08213429898023605, 0.08736228942871094, 0.09259027987718582, 0.0978182703256607, 0.10304626077413559, 0.10827425122261047, 0.11350224912166595, 0.11873023211956024]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 3.0, 8.0, 16.0, 19.0, 17.0, 41.0, 47.0, 46.0, 52.0, 71.0, 71.0, 62.0, 95.0, 67.0, 68.0, 58.0, 72.0, 36.0, 36.0, 35.0, 25.0, 27.0, 12.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013050436973571777, -0.012714066542685032, -0.012377696111798286, -0.012041325680911541, -0.011704955250024796, -0.01136858481913805, -0.011032214388251305, -0.01069584395736456, -0.010359473526477814, -0.010023103095591068, -0.009686732664704323, -0.009350362233817577, -0.009013991802930832, -0.008677621372044086, -0.008341250941157341, -0.008004880510270596, -0.00766851007938385, -0.007332139648497105, -0.006995769217610359, -0.006659398786723614, -0.006323028355836868, -0.005986657924950123, -0.005650287494063377, -0.005313917063176632, -0.0049775466322898865, -0.004641176201403141, -0.004304805770516396, -0.00396843533962965, -0.0036320649087429047, -0.003295694477856159, -0.0029593240469694138, -0.0026229536160826683, -0.002286583185195923, -0.0019502127543091774, -0.001613842323422432, -0.0012774718925356865, -0.000941101461648941, -0.0006047310307621956, -0.00026836059987545013, 6.800983101129532e-05, 0.00040438026189804077, 0.0007407506927847862, 0.0010771211236715317, 0.0014134915545582771, 0.0017498619854450226, 0.002086232416331768, 0.0024226028472185135, 0.002758973278105259, 0.0030953437089920044, 0.00343171413987875, 0.0037680845707654953, 0.004104455001652241, 0.004440825432538986, 0.004777195863425732, 0.005113566294312477, 0.0054499367251992226, 0.005786307156085968, 0.0061226775869727135, 0.006459048017859459, 0.006795418448746204, 0.00713178887963295, 0.007468159310519695, 0.007804529741406441, 0.008140900172293186, 0.008477270603179932]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 10.0, 15.0, 21.0, 18.0, 16.0, 35.0, 27.0, 28.0, 18.0, 40.0, 40.0, 42.0, 45.0, 49.0, 37.0, 43.0, 42.0, 44.0, 44.0, 40.0, 41.0, 28.0, 24.0, 26.0, 22.0, 30.0, 25.0, 26.0, 20.0, 17.0, 17.0, 8.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.81640625, -2.73748779296875, -2.6585693359375, -2.57965087890625, -2.500732421875, -2.42181396484375, -2.3428955078125, -2.26397705078125, -2.18505859375, -2.10614013671875, -2.0272216796875, -1.94830322265625, -1.869384765625, -1.79046630859375, -1.7115478515625, -1.63262939453125, -1.5537109375, -1.47479248046875, -1.3958740234375, -1.31695556640625, -1.238037109375, -1.15911865234375, -1.0802001953125, -1.00128173828125, -0.92236328125, -0.84344482421875, -0.7645263671875, -0.68560791015625, -0.606689453125, -0.52777099609375, -0.4488525390625, -0.36993408203125, -0.291015625, -0.21209716796875, -0.1331787109375, -0.05426025390625, 0.024658203125, 0.10357666015625, 0.1824951171875, 0.26141357421875, 0.34033203125, 0.41925048828125, 0.4981689453125, 0.57708740234375, 0.656005859375, 0.73492431640625, 0.8138427734375, 0.89276123046875, 0.9716796875, 1.05059814453125, 1.1295166015625, 1.20843505859375, 1.287353515625, 1.36627197265625, 1.4451904296875, 1.52410888671875, 1.60302734375, 1.68194580078125, 1.7608642578125, 1.83978271484375, 1.918701171875, 1.99761962890625, 2.0765380859375, 2.15545654296875, 2.234375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 3.0, 6.0, 13.0, 13.0, 24.0, 31.0, 40.0, 59.0, 61.0, 118.0, 158.0, 231.0, 352.0, 509.0, 808.0, 1141.0, 1972.0, 3757.0, 7809.0, 17870.0, 44269.0, 107547.0, 219815.0, 290149.0, 194609.0, 90123.0, 36940.0, 15156.0, 6554.0, 3289.0, 1828.0, 1096.0, 721.0, 478.0, 311.0, 172.0, 140.0, 101.0, 84.0, 36.0, 54.0, 37.0, 24.0, 11.0, 10.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.822265625, -2.737762451171875, -2.65325927734375, -2.568756103515625, -2.4842529296875, -2.399749755859375, -2.31524658203125, -2.230743408203125, -2.146240234375, -2.061737060546875, -1.97723388671875, -1.892730712890625, -1.8082275390625, -1.723724365234375, -1.63922119140625, -1.554718017578125, -1.47021484375, -1.385711669921875, -1.30120849609375, -1.216705322265625, -1.1322021484375, -1.047698974609375, -0.96319580078125, -0.878692626953125, -0.794189453125, -0.709686279296875, -0.62518310546875, -0.540679931640625, -0.4561767578125, -0.371673583984375, -0.28717041015625, -0.202667236328125, -0.1181640625, -0.033660888671875, 0.05084228515625, 0.135345458984375, 0.2198486328125, 0.304351806640625, 0.38885498046875, 0.473358154296875, 0.557861328125, 0.642364501953125, 0.72686767578125, 0.811370849609375, 0.8958740234375, 0.980377197265625, 1.06488037109375, 1.149383544921875, 1.23388671875, 1.318389892578125, 1.40289306640625, 1.487396240234375, 1.5718994140625, 1.656402587890625, 1.74090576171875, 1.825408935546875, 1.909912109375, 1.994415283203125, 2.07891845703125, 2.163421630859375, 2.2479248046875, 2.332427978515625, 2.41693115234375, 2.501434326171875, 2.5859375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 6.0, 10.0, 19.0, 7.0, 11.0, 15.0, 22.0, 28.0, 29.0, 31.0, 22.0, 32.0, 41.0, 47.0, 49.0, 70.0, 105.0, 302.0, 1407.0, 235.0, 118.0, 65.0, 50.0, 38.0, 38.0, 33.0, 27.0, 30.0, 22.0, 19.0, 22.0, 15.0, 16.0, 12.0, 8.0, 11.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.984375, -8.6983642578125, -8.412353515625, -8.1263427734375, -7.84033203125, -7.5543212890625, -7.268310546875, -6.9822998046875, -6.6962890625, -6.4102783203125, -6.124267578125, -5.8382568359375, -5.55224609375, -5.2662353515625, -4.980224609375, -4.6942138671875, -4.408203125, -4.1221923828125, -3.836181640625, -3.5501708984375, -3.26416015625, -2.9781494140625, -2.692138671875, -2.4061279296875, -2.1201171875, -1.8341064453125, -1.548095703125, -1.2620849609375, -0.97607421875, -0.6900634765625, -0.404052734375, -0.1180419921875, 0.16796875, 0.4539794921875, 0.739990234375, 1.0260009765625, 1.31201171875, 1.5980224609375, 1.884033203125, 2.1700439453125, 2.4560546875, 2.7420654296875, 3.028076171875, 3.3140869140625, 3.60009765625, 3.8861083984375, 4.172119140625, 4.4581298828125, 4.744140625, 5.0301513671875, 5.316162109375, 5.6021728515625, 5.88818359375, 6.1741943359375, 6.460205078125, 6.7462158203125, 7.0322265625, 7.3182373046875, 7.604248046875, 7.8902587890625, 8.17626953125, 8.4622802734375, 8.748291015625, 9.0343017578125, 9.3203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 7.0, 3.0, 5.0, 8.0, 12.0, 6.0, 17.0, 10.0, 25.0, 19.0, 22.0, 27.0, 34.0, 39.0, 58.0, 83.0, 157.0, 290.0, 831.0, 6067.0, 459507.0, 2659838.0, 16071.0, 1573.0, 389.0, 161.0, 105.0, 69.0, 53.0, 37.0, 32.0, 22.0, 25.0, 20.0, 17.0, 13.0, 12.0, 10.0, 8.0, 7.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.375, -19.7607421875, -19.146484375, -18.5322265625, -17.91796875, -17.3037109375, -16.689453125, -16.0751953125, -15.4609375, -14.8466796875, -14.232421875, -13.6181640625, -13.00390625, -12.3896484375, -11.775390625, -11.1611328125, -10.546875, -9.9326171875, -9.318359375, -8.7041015625, -8.08984375, -7.4755859375, -6.861328125, -6.2470703125, -5.6328125, -5.0185546875, -4.404296875, -3.7900390625, -3.17578125, -2.5615234375, -1.947265625, -1.3330078125, -0.71875, -0.1044921875, 0.509765625, 1.1240234375, 1.73828125, 2.3525390625, 2.966796875, 3.5810546875, 4.1953125, 4.8095703125, 5.423828125, 6.0380859375, 6.65234375, 7.2666015625, 7.880859375, 8.4951171875, 9.109375, 9.7236328125, 10.337890625, 10.9521484375, 11.56640625, 12.1806640625, 12.794921875, 13.4091796875, 14.0234375, 14.6376953125, 15.251953125, 15.8662109375, 16.48046875, 17.0947265625, 17.708984375, 18.3232421875, 18.9375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 90.0, 671.0, 243.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.43699645996094, -61.82619094848633, -59.21538543701172, -56.60457992553711, -53.9937744140625, -51.382965087890625, -48.772159576416016, -46.161354064941406, -43.5505485534668, -40.93974304199219, -38.32893753051758, -35.71813201904297, -33.107322692871094, -30.496519088745117, -27.885711669921875, -25.274906158447266, -22.664100646972656, -20.053295135498047, -17.442489624023438, -14.831682205200195, -12.220876693725586, -9.610071182250977, -6.999264717102051, -4.388458251953125, -1.7776527404785156, 0.833153247833252, 3.4439592361450195, 6.054765224456787, 8.665571212768555, 11.276376724243164, 13.88718318939209, 16.497989654541016, 19.108787536621094, 21.719593048095703, 24.330398559570312, 26.941205978393555, 29.552011489868164, 32.162818908691406, 34.773624420166016, 37.384429931640625, 39.995235443115234, 42.606040954589844, 45.21684646606445, 47.82765197753906, 50.43846130371094, 53.04926300048828, 55.660072326660156, 58.270877838134766, 60.881683349609375, 63.492488861083984, 66.1032943725586, 68.71410369873047, 71.32490539550781, 73.93571472167969, 76.54651641845703, 79.1573257446289, 81.76812744140625, 84.37893676757812, 86.98973846435547, 89.60054779052734, 92.21134948730469, 94.82215881347656, 97.4329605102539, 100.04376983642578, 102.65457916259766]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 13.0, 11.0, 17.0, 15.0, 17.0, 22.0, 19.0, 26.0, 24.0, 32.0, 33.0, 52.0, 48.0, 34.0, 39.0, 48.0, 41.0, 39.0, 40.0, 47.0, 38.0, 53.0, 41.0, 32.0, 26.0, 40.0, 19.0, 19.0, 26.0, 15.0, 17.0, 14.0, 5.0, 13.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.764469146728516, -30.7552490234375, -29.746028900146484, -28.73680877685547, -27.727588653564453, -26.718368530273438, -25.70914649963379, -24.699926376342773, -23.690706253051758, -22.681486129760742, -21.672266006469727, -20.66304588317871, -19.653823852539062, -18.644603729248047, -17.63538360595703, -16.626163482666016, -15.616943359375, -14.607723236083984, -13.598503112792969, -12.589282035827637, -11.580061912536621, -10.570841789245605, -9.561620712280273, -8.552400588989258, -7.543180465698242, -6.533960342407227, -5.524739742279053, -4.515519142150879, -3.5062990188598633, -2.4970788955688477, -1.4878582954406738, -0.4786376953125, 0.5305862426757812, 1.539806604385376, 2.5490269660949707, 3.5582473278045654, 4.56746768951416, 5.576687812805176, 6.58590841293335, 7.595129013061523, 8.604349136352539, 9.613569259643555, 10.62278938293457, 11.632010459899902, 12.641230583190918, 13.650450706481934, 14.659671783447266, 15.668891906738281, 16.678112030029297, 17.687332153320312, 18.696552276611328, 19.705772399902344, 20.71499252319336, 21.724212646484375, 22.733434677124023, 23.74265480041504, 24.751874923706055, 25.76109504699707, 26.770315170288086, 27.7795352935791, 28.78875732421875, 29.797977447509766, 30.80719757080078, 31.816417694091797, 32.82563781738281]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 9.0, 7.0, 11.0, 14.0, 16.0, 21.0, 26.0, 28.0, 30.0, 27.0, 18.0, 39.0, 42.0, 42.0, 38.0, 44.0, 40.0, 44.0, 43.0, 50.0, 47.0, 46.0, 33.0, 28.0, 25.0, 29.0, 17.0, 41.0, 19.0, 31.0, 14.0, 15.0, 13.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-3.0625, -2.9788818359375, -2.895263671875, -2.8116455078125, -2.72802734375, -2.6444091796875, -2.560791015625, -2.4771728515625, -2.3935546875, -2.3099365234375, -2.226318359375, -2.1427001953125, -2.05908203125, -1.9754638671875, -1.891845703125, -1.8082275390625, -1.724609375, -1.6409912109375, -1.557373046875, -1.4737548828125, -1.39013671875, -1.3065185546875, -1.222900390625, -1.1392822265625, -1.0556640625, -0.9720458984375, -0.888427734375, -0.8048095703125, -0.72119140625, -0.6375732421875, -0.553955078125, -0.4703369140625, -0.38671875, -0.3031005859375, -0.219482421875, -0.1358642578125, -0.05224609375, 0.0313720703125, 0.114990234375, 0.1986083984375, 0.2822265625, 0.3658447265625, 0.449462890625, 0.5330810546875, 0.61669921875, 0.7003173828125, 0.783935546875, 0.8675537109375, 0.951171875, 1.0347900390625, 1.118408203125, 1.2020263671875, 1.28564453125, 1.3692626953125, 1.452880859375, 1.5364990234375, 1.6201171875, 1.7037353515625, 1.787353515625, 1.8709716796875, 1.95458984375, 2.0382080078125, 2.121826171875, 2.2054443359375, 2.2890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 7.0, 12.0, 17.0, 22.0, 28.0, 43.0, 53.0, 59.0, 86.0, 133.0, 167.0, 415.0, 958.0, 2855.0, 11308.0, 77685.0, 1180719.0, 2697220.0, 193353.0, 22032.0, 4551.0, 1345.0, 512.0, 239.0, 100.0, 82.0, 73.0, 54.0, 34.0, 38.0, 13.0, 10.0, 11.0, 15.0, 8.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-12.6953125, -12.344482421875, -11.99365234375, -11.642822265625, -11.2919921875, -10.941162109375, -10.59033203125, -10.239501953125, -9.888671875, -9.537841796875, -9.18701171875, -8.836181640625, -8.4853515625, -8.134521484375, -7.78369140625, -7.432861328125, -7.08203125, -6.731201171875, -6.38037109375, -6.029541015625, -5.6787109375, -5.327880859375, -4.97705078125, -4.626220703125, -4.275390625, -3.924560546875, -3.57373046875, -3.222900390625, -2.8720703125, -2.521240234375, -2.17041015625, -1.819580078125, -1.46875, -1.117919921875, -0.76708984375, -0.416259765625, -0.0654296875, 0.285400390625, 0.63623046875, 0.987060546875, 1.337890625, 1.688720703125, 2.03955078125, 2.390380859375, 2.7412109375, 3.092041015625, 3.44287109375, 3.793701171875, 4.14453125, 4.495361328125, 4.84619140625, 5.197021484375, 5.5478515625, 5.898681640625, 6.24951171875, 6.600341796875, 6.951171875, 7.302001953125, 7.65283203125, 8.003662109375, 8.3544921875, 8.705322265625, 9.05615234375, 9.406982421875, 9.7578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 1.0, 5.0, 8.0, 10.0, 19.0, 22.0, 24.0, 76.0, 98.0, 141.0, 232.0, 348.0, 502.0, 647.0, 611.0, 457.0, 305.0, 193.0, 130.0, 83.0, 54.0, 36.0, 24.0, 17.0, 14.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.0718994140625, -8.706298828125, -8.3406982421875, -7.97509765625, -7.6094970703125, -7.243896484375, -6.8782958984375, -6.5126953125, -6.1470947265625, -5.781494140625, -5.4158935546875, -5.05029296875, -4.6846923828125, -4.319091796875, -3.9534912109375, -3.587890625, -3.2222900390625, -2.856689453125, -2.4910888671875, -2.12548828125, -1.7598876953125, -1.394287109375, -1.0286865234375, -0.6630859375, -0.2974853515625, 0.068115234375, 0.4337158203125, 0.79931640625, 1.1649169921875, 1.530517578125, 1.8961181640625, 2.26171875, 2.6273193359375, 2.992919921875, 3.3585205078125, 3.72412109375, 4.0897216796875, 4.455322265625, 4.8209228515625, 5.1865234375, 5.5521240234375, 5.917724609375, 6.2833251953125, 6.64892578125, 7.0145263671875, 7.380126953125, 7.7457275390625, 8.111328125, 8.4769287109375, 8.842529296875, 9.2081298828125, 9.57373046875, 9.9393310546875, 10.304931640625, 10.6705322265625, 11.0361328125, 11.4017333984375, 11.767333984375, 12.1329345703125, 12.49853515625, 12.8641357421875, 13.229736328125, 13.5953369140625, 13.9609375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 16.0, 18.0, 21.0, 30.0, 43.0, 91.0, 146.0, 219.0, 396.0, 809.0, 1691.0, 4600.0, 15386.0, 74786.0, 538139.0, 2677140.0, 752878.0, 99325.0, 19182.0, 5318.0, 2046.0, 941.0, 452.0, 244.0, 148.0, 73.0, 49.0, 27.0, 33.0, 10.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.10791015625, -13.6611328125, -13.21435546875, -12.767578125, -12.32080078125, -11.8740234375, -11.42724609375, -10.98046875, -10.53369140625, -10.0869140625, -9.64013671875, -9.193359375, -8.74658203125, -8.2998046875, -7.85302734375, -7.40625, -6.95947265625, -6.5126953125, -6.06591796875, -5.619140625, -5.17236328125, -4.7255859375, -4.27880859375, -3.83203125, -3.38525390625, -2.9384765625, -2.49169921875, -2.044921875, -1.59814453125, -1.1513671875, -0.70458984375, -0.2578125, 0.18896484375, 0.6357421875, 1.08251953125, 1.529296875, 1.97607421875, 2.4228515625, 2.86962890625, 3.31640625, 3.76318359375, 4.2099609375, 4.65673828125, 5.103515625, 5.55029296875, 5.9970703125, 6.44384765625, 6.890625, 7.33740234375, 7.7841796875, 8.23095703125, 8.677734375, 9.12451171875, 9.5712890625, 10.01806640625, 10.46484375, 10.91162109375, 11.3583984375, 11.80517578125, 12.251953125, 12.69873046875, 13.1455078125, 13.59228515625, 14.0390625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 19.0, 80.0, 220.0, 347.0, 214.0, 96.0, 27.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.36392211914062, -169.86744689941406, -166.3709716796875, -162.87451171875, -159.37803649902344, -155.88156127929688, -152.3850860595703, -148.88861083984375, -145.3921356201172, -141.89566040039062, -138.39918518066406, -134.9027099609375, -131.40625, -127.90977478027344, -124.41329956054688, -120.91682434082031, -117.42036437988281, -113.92388916015625, -110.42742156982422, -106.93094635009766, -103.4344711303711, -99.93800354003906, -96.4415283203125, -92.94505310058594, -89.44857788085938, -85.95210266113281, -82.45563507080078, -78.95915985107422, -75.46268463134766, -71.96621704101562, -68.46974182128906, -64.9732666015625, -61.4767951965332, -57.980323791503906, -54.483848571777344, -50.98737716674805, -47.49090576171875, -43.99443054199219, -40.49795913696289, -37.001487731933594, -33.50501251220703, -30.0085391998291, -26.512067794799805, -23.015594482421875, -19.519123077392578, -16.02264976501465, -12.526176452636719, -9.029705047607422, -5.533233642578125, -2.0367610454559326, 1.4597115516662598, 4.956184387207031, 8.452656745910645, 11.949129104614258, 15.445602416992188, 18.942073822021484, 22.438547134399414, 25.935020446777344, 29.43149185180664, 32.92796325683594, 36.4244384765625, 39.9209098815918, 43.417381286621094, 46.913856506347656, 50.41032791137695]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 6.0, 6.0, 18.0, 5.0, 13.0, 19.0, 17.0, 19.0, 22.0, 34.0, 39.0, 44.0, 30.0, 33.0, 30.0, 34.0, 43.0, 40.0, 43.0, 36.0, 35.0, 34.0, 33.0, 45.0, 35.0, 25.0, 24.0, 35.0, 32.0, 28.0, 20.0, 22.0, 12.0, 8.0, 9.0, 12.0, 4.0, 7.0, 11.0, 7.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-28.353797912597656, -27.50921058654785, -26.66462516784668, -25.820037841796875, -24.975452423095703, -24.1308650970459, -23.286277770996094, -22.441692352294922, -21.59710693359375, -20.752519607543945, -19.907934188842773, -19.06334686279297, -18.218761444091797, -17.374174118041992, -16.529586791992188, -15.685001373291016, -14.840414047241211, -13.995827674865723, -13.151241302490234, -12.30665397644043, -11.462068557739258, -10.617481231689453, -9.772894859313965, -8.928308486938477, -8.083722114562988, -7.2391357421875, -6.394549369812012, -5.549962520599365, -4.705376148223877, -3.8607897758483887, -3.016202926635742, -2.171616554260254, -1.3270282745361328, -0.482441782951355, 0.36214470863342285, 1.2067313194274902, 2.0513176918029785, 2.895904064178467, 3.7404909133911133, 4.585077285766602, 5.42966365814209, 6.274250030517578, 7.118836402893066, 7.963423252105713, 8.80801010131836, 9.652595520019531, 10.497182846069336, 11.341769218444824, 12.186355590820312, 13.0309419631958, 13.875528335571289, 14.720115661621094, 15.564701080322266, 16.40928840637207, 17.253875732421875, 18.098461151123047, 18.94304656982422, 19.787633895874023, 20.632219314575195, 21.476806640625, 22.321392059326172, 23.165979385375977, 24.01056671142578, 24.855152130126953, 25.699739456176758]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 11.0, 7.0, 14.0, 21.0, 14.0, 19.0, 22.0, 22.0, 27.0, 26.0, 31.0, 31.0, 39.0, 29.0, 50.0, 44.0, 50.0, 48.0, 48.0, 47.0, 35.0, 39.0, 46.0, 31.0, 33.0, 21.0, 27.0, 31.0, 21.0, 14.0, 22.0, 15.0, 16.0, 12.0, 9.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.150390625, -3.061859130859375, -2.97332763671875, -2.884796142578125, -2.7962646484375, -2.707733154296875, -2.61920166015625, -2.530670166015625, -2.442138671875, -2.353607177734375, -2.26507568359375, -2.176544189453125, -2.0880126953125, -1.999481201171875, -1.91094970703125, -1.822418212890625, -1.73388671875, -1.645355224609375, -1.55682373046875, -1.468292236328125, -1.3797607421875, -1.291229248046875, -1.20269775390625, -1.114166259765625, -1.025634765625, -0.937103271484375, -0.84857177734375, -0.760040283203125, -0.6715087890625, -0.582977294921875, -0.49444580078125, -0.405914306640625, -0.3173828125, -0.228851318359375, -0.14031982421875, -0.051788330078125, 0.0367431640625, 0.125274658203125, 0.21380615234375, 0.302337646484375, 0.390869140625, 0.479400634765625, 0.56793212890625, 0.656463623046875, 0.7449951171875, 0.833526611328125, 0.92205810546875, 1.010589599609375, 1.09912109375, 1.187652587890625, 1.27618408203125, 1.364715576171875, 1.4532470703125, 1.541778564453125, 1.63031005859375, 1.718841552734375, 1.807373046875, 1.895904541015625, 1.98443603515625, 2.072967529296875, 2.1614990234375, 2.250030517578125, 2.33856201171875, 2.427093505859375, 2.515625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 14.0, 16.0, 31.0, 48.0, 85.0, 109.0, 187.0, 324.0, 566.0, 1021.0, 1942.0, 3781.0, 7615.0, 15220.0, 31329.0, 64549.0, 128676.0, 225041.0, 250993.0, 158028.0, 80630.0, 39455.0, 19245.0, 9687.0, 4720.0, 2344.0, 1275.0, 672.0, 367.0, 220.0, 140.0, 78.0, 53.0, 29.0, 22.0, 13.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51220703125, -0.4952239990234375, -0.478240966796875, -0.4612579345703125, -0.44427490234375, -0.4272918701171875, -0.410308837890625, -0.3933258056640625, -0.3763427734375, -0.3593597412109375, -0.342376708984375, -0.3253936767578125, -0.30841064453125, -0.2914276123046875, -0.274444580078125, -0.2574615478515625, -0.240478515625, -0.2234954833984375, -0.206512451171875, -0.1895294189453125, -0.17254638671875, -0.1555633544921875, -0.138580322265625, -0.1215972900390625, -0.1046142578125, -0.0876312255859375, -0.070648193359375, -0.0536651611328125, -0.03668212890625, -0.0196990966796875, -0.002716064453125, 0.0142669677734375, 0.03125, 0.0482330322265625, 0.065216064453125, 0.0821990966796875, 0.09918212890625, 0.1161651611328125, 0.133148193359375, 0.1501312255859375, 0.1671142578125, 0.1840972900390625, 0.201080322265625, 0.2180633544921875, 0.23504638671875, 0.2520294189453125, 0.269012451171875, 0.2859954833984375, 0.302978515625, 0.3199615478515625, 0.336944580078125, 0.3539276123046875, 0.37091064453125, 0.3878936767578125, 0.404876708984375, 0.4218597412109375, 0.4388427734375, 0.4558258056640625, 0.472808837890625, 0.4897918701171875, 0.50677490234375, 0.5237579345703125, 0.540740966796875, 0.5577239990234375, 0.57470703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 14.0, 15.0, 10.0, 14.0, 16.0, 18.0, 22.0, 26.0, 27.0, 20.0, 22.0, 36.0, 42.0, 32.0, 44.0, 40.0, 36.0, 33.0, 1070.0, 38.0, 40.0, 36.0, 38.0, 35.0, 29.0, 34.0, 26.0, 31.0, 23.0, 25.0, 19.0, 29.0, 6.0, 11.0, 13.0, 14.0, 10.0, 8.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.59417724609375, -1.5389404296875, -1.48370361328125, -1.428466796875, -1.37322998046875, -1.3179931640625, -1.26275634765625, -1.20751953125, -1.15228271484375, -1.0970458984375, -1.04180908203125, -0.986572265625, -0.93133544921875, -0.8760986328125, -0.82086181640625, -0.765625, -0.71038818359375, -0.6551513671875, -0.59991455078125, -0.544677734375, -0.48944091796875, -0.4342041015625, -0.37896728515625, -0.32373046875, -0.26849365234375, -0.2132568359375, -0.15802001953125, -0.102783203125, -0.04754638671875, 0.0076904296875, 0.06292724609375, 0.1181640625, 0.17340087890625, 0.2286376953125, 0.28387451171875, 0.339111328125, 0.39434814453125, 0.4495849609375, 0.50482177734375, 0.56005859375, 0.61529541015625, 0.6705322265625, 0.72576904296875, 0.781005859375, 0.83624267578125, 0.8914794921875, 0.94671630859375, 1.001953125, 1.05718994140625, 1.1124267578125, 1.16766357421875, 1.222900390625, 1.27813720703125, 1.3333740234375, 1.38861083984375, 1.44384765625, 1.49908447265625, 1.5543212890625, 1.60955810546875, 1.664794921875, 1.72003173828125, 1.7752685546875, 1.83050537109375, 1.8857421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 11.0, 12.0, 19.0, 25.0, 42.0, 45.0, 84.0, 150.0, 193.0, 325.0, 457.0, 718.0, 1263.0, 2017.0, 3322.0, 5396.0, 8957.0, 14755.0, 24603.0, 41080.0, 67326.0, 108254.0, 159109.0, 1226516.0, 157304.0, 106385.0, 66937.0, 40459.0, 24228.0, 14365.0, 8940.0, 5298.0, 3185.0, 2012.0, 1194.0, 821.0, 483.0, 272.0, 210.0, 126.0, 81.0, 64.0, 33.0, 19.0, 19.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23412513732910156, -0.22618484497070312, -0.2182445526123047, -0.21030426025390625, -0.2023639678955078, -0.19442367553710938, -0.18648338317871094, -0.1785430908203125, -0.17060279846191406, -0.16266250610351562, -0.1547222137451172, -0.14678192138671875, -0.1388416290283203, -0.13090133666992188, -0.12296104431152344, -0.115020751953125, -0.10708045959472656, -0.09914016723632812, -0.09119987487792969, -0.08325958251953125, -0.07531929016113281, -0.06737899780273438, -0.05943870544433594, -0.0514984130859375, -0.04355812072753906, -0.035617828369140625, -0.027677536010742188, -0.01973724365234375, -0.011796951293945312, -0.003856658935546875, 0.0040836334228515625, 0.01202392578125, 0.019964218139648438, 0.027904510498046875, 0.03584480285644531, 0.04378509521484375, 0.05172538757324219, 0.059665679931640625, 0.06760597229003906, 0.0755462646484375, 0.08348655700683594, 0.09142684936523438, 0.09936714172363281, 0.10730743408203125, 0.11524772644042969, 0.12318801879882812, 0.13112831115722656, 0.139068603515625, 0.14700889587402344, 0.15494918823242188, 0.1628894805908203, 0.17082977294921875, 0.1787700653076172, 0.18671035766601562, 0.19465065002441406, 0.2025909423828125, 0.21053123474121094, 0.21847152709960938, 0.2264118194580078, 0.23435211181640625, 0.2422924041748047, 0.2502326965332031, 0.25817298889160156, 0.26611328125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 8.0, 8.0, 14.0, 19.0, 15.0, 18.0, 18.0, 31.0, 40.0, 44.0, 57.0, 71.0, 90.0, 116.0, 95.0, 72.0, 47.0, 51.0, 36.0, 36.0, 26.0, 21.0, 15.0, 11.0, 11.0, 7.0, 5.0, 6.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01045989990234375, -0.010173201560974121, -0.009886503219604492, -0.009599804878234863, -0.009313106536865234, -0.009026408195495605, -0.008739709854125977, -0.008453011512756348, -0.008166313171386719, -0.00787961483001709, -0.007592916488647461, -0.007306218147277832, -0.007019519805908203, -0.006732821464538574, -0.006446123123168945, -0.006159424781799316, -0.0058727264404296875, -0.005586028099060059, -0.00529932975769043, -0.005012631416320801, -0.004725933074951172, -0.004439234733581543, -0.004152536392211914, -0.003865838050842285, -0.0035791397094726562, -0.0032924413681030273, -0.0030057430267333984, -0.0027190446853637695, -0.0024323463439941406, -0.0021456480026245117, -0.0018589496612548828, -0.001572251319885254, -0.001285552978515625, -0.000998854637145996, -0.0007121562957763672, -0.0004254579544067383, -0.00013875961303710938, 0.00014793872833251953, 0.00043463706970214844, 0.0007213354110717773, 0.0010080337524414062, 0.0012947320938110352, 0.001581430435180664, 0.001868128776550293, 0.002154827117919922, 0.0024415254592895508, 0.0027282238006591797, 0.0030149221420288086, 0.0033016204833984375, 0.0035883188247680664, 0.0038750171661376953, 0.004161715507507324, 0.004448413848876953, 0.004735112190246582, 0.005021810531616211, 0.00530850887298584, 0.005595207214355469, 0.005881905555725098, 0.0061686038970947266, 0.0064553022384643555, 0.006742000579833984, 0.007028698921203613, 0.007315397262573242, 0.007602095603942871, 0.0078887939453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 19.0, 13.0, 20.0, 30.0, 45.0, 65.0, 74.0, 83.0, 116.0, 177.0, 291.0, 713.0, 20439.0, 1020223.0, 4863.0, 499.0, 244.0, 159.0, 130.0, 82.0, 55.0, 42.0, 37.0, 40.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14846420288085938, -0.14373016357421875, -0.13899612426757812, -0.1342620849609375, -0.12952804565429688, -0.12479400634765625, -0.12005996704101562, -0.115325927734375, -0.11059188842773438, -0.10585784912109375, -0.10112380981445312, -0.0963897705078125, -0.09165573120117188, -0.08692169189453125, -0.08218765258789062, -0.07745361328125, -0.07271957397460938, -0.06798553466796875, -0.06325149536132812, -0.0585174560546875, -0.053783416748046875, -0.04904937744140625, -0.044315338134765625, -0.039581298828125, -0.034847259521484375, -0.03011322021484375, -0.025379180908203125, -0.0206451416015625, -0.015911102294921875, -0.01117706298828125, -0.006443023681640625, -0.001708984375, 0.003025054931640625, 0.00775909423828125, 0.012493133544921875, 0.0172271728515625, 0.021961212158203125, 0.02669525146484375, 0.031429290771484375, 0.036163330078125, 0.040897369384765625, 0.04563140869140625, 0.050365447998046875, 0.0550994873046875, 0.059833526611328125, 0.06456756591796875, 0.06930160522460938, 0.07403564453125, 0.07876968383789062, 0.08350372314453125, 0.08823776245117188, 0.0929718017578125, 0.09770584106445312, 0.10243988037109375, 0.10717391967773438, 0.111907958984375, 0.11664199829101562, 0.12137603759765625, 0.12611007690429688, 0.1308441162109375, 0.13557815551757812, 0.14031219482421875, 0.14504623413085938, 0.1497802734375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 915.0, 98.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14734181761741638, -0.14311569929122925, -0.13888958096504211, -0.13466346263885498, -0.13043734431266785, -0.1262112259864807, -0.12198510020971298, -0.11775898188352585, -0.11353286355733871, -0.10930674523115158, -0.10508062690496445, -0.10085450857877731, -0.09662838280200958, -0.09240226447582245, -0.08817614614963531, -0.08395002782344818, -0.07972390949726105, -0.07549779117107391, -0.07127167284488678, -0.06704555451869965, -0.06281943619251251, -0.05859331414103508, -0.05436719208955765, -0.050141073763370514, -0.04591495543718338, -0.041688837110996246, -0.03746271878480911, -0.03323659673333168, -0.029010478407144547, -0.024784360080957413, -0.02055823989212513, -0.016332119703292847, -0.012106016278266907, -0.007879897020757198, -0.00365377776324749, 0.0005723414942622185, 0.004798460751771927, 0.00902457907795906, 0.013250699266791344, 0.017476819455623627, 0.02170293778181076, 0.025929056107997894, 0.030155176296830177, 0.03438129648566246, 0.038607414811849594, 0.04283353313803673, 0.04705965518951416, 0.051285773515701294, 0.05551189184188843, 0.05973801016807556, 0.0639641284942627, 0.06819024682044983, 0.07241636514663696, 0.0766424834728241, 0.08086860924959183, 0.08509472757577896, 0.0893208459019661, 0.09354696422815323, 0.09777308255434036, 0.1019992008805275, 0.10622532665729523, 0.11045144498348236, 0.1146775633096695, 0.11890368163585663, 0.12312979996204376]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 6.0, 5.0, 8.0, 15.0, 25.0, 25.0, 28.0, 34.0, 40.0, 39.0, 37.0, 51.0, 48.0, 61.0, 72.0, 56.0, 61.0, 57.0, 61.0, 46.0, 40.0, 34.0, 34.0, 29.0, 26.0, 24.0, 14.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011496543884277344, -0.011163455434143543, -0.010830366984009743, -0.010497278533875942, -0.010164190083742142, -0.009831101633608341, -0.00949801318347454, -0.00916492473334074, -0.00883183628320694, -0.00849874783307314, -0.008165659382939339, -0.007832570932805538, -0.007499482482671738, -0.007166394032537937, -0.006833305582404137, -0.006500217132270336, -0.006167128682136536, -0.005834040232002735, -0.005500951781868935, -0.005167863331735134, -0.004834774881601334, -0.004501686431467533, -0.004168597981333733, -0.003835509531199932, -0.0035024210810661316, -0.003169332630932331, -0.0028362441807985306, -0.00250315573066473, -0.0021700672805309296, -0.001836978830397129, -0.0015038903802633286, -0.001170801930129528, -0.0008377134799957275, -0.000504625029861927, -0.00017153657972812653, 0.00016155187040567398, 0.0004946403205394745, 0.000827728770673275, 0.0011608172208070755, 0.001493905670940876, 0.0018269941210746765, 0.002160082571208477, 0.0024931710213422775, 0.002826259471476078, 0.0031593479216098785, 0.003492436371743679, 0.0038255248218774796, 0.00415861327201128, 0.004491701722145081, 0.004824790172278881, 0.005157878622412682, 0.005490967072546482, 0.005824055522680283, 0.006157143972814083, 0.006490232422947884, 0.006823320873081684, 0.007156409323215485, 0.007489497773349285, 0.007822586223483086, 0.008155674673616886, 0.008488763123750687, 0.008821851573884487, 0.009154940024018288, 0.009488028474152088, 0.009821116924285889]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 11.0, 7.0, 14.0, 21.0, 14.0, 19.0, 22.0, 22.0, 27.0, 26.0, 31.0, 31.0, 39.0, 29.0, 50.0, 44.0, 50.0, 48.0, 48.0, 47.0, 35.0, 39.0, 46.0, 31.0, 33.0, 21.0, 27.0, 31.0, 21.0, 14.0, 22.0, 15.0, 15.0, 13.0, 9.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.150390625, -3.061859130859375, -2.97332763671875, -2.884796142578125, -2.7962646484375, -2.707733154296875, -2.61920166015625, -2.530670166015625, -2.442138671875, -2.353607177734375, -2.26507568359375, -2.176544189453125, -2.0880126953125, -1.999481201171875, -1.91094970703125, -1.822418212890625, -1.73388671875, -1.645355224609375, -1.55682373046875, -1.468292236328125, -1.3797607421875, -1.291229248046875, -1.20269775390625, -1.114166259765625, -1.025634765625, -0.937103271484375, -0.84857177734375, -0.760040283203125, -0.6715087890625, -0.582977294921875, -0.49444580078125, -0.405914306640625, -0.3173828125, -0.228851318359375, -0.14031982421875, -0.051788330078125, 0.0367431640625, 0.125274658203125, 0.21380615234375, 0.302337646484375, 0.390869140625, 0.479400634765625, 0.56793212890625, 0.656463623046875, 0.7449951171875, 0.833526611328125, 0.92205810546875, 1.010589599609375, 1.09912109375, 1.187652587890625, 1.27618408203125, 1.364715576171875, 1.4532470703125, 1.541778564453125, 1.63031005859375, 1.718841552734375, 1.807373046875, 1.895904541015625, 1.98443603515625, 2.072967529296875, 2.1614990234375, 2.250030517578125, 2.33856201171875, 2.427093505859375, 2.515625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 12.0, 10.0, 13.0, 25.0, 39.0, 65.0, 58.0, 109.0, 195.0, 286.0, 427.0, 643.0, 1095.0, 1809.0, 2969.0, 5010.0, 9604.0, 22391.0, 70836.0, 258077.0, 441859.0, 156298.0, 43609.0, 15385.0, 7284.0, 4028.0, 2424.0, 1484.0, 903.0, 586.0, 380.0, 222.0, 138.0, 80.0, 53.0, 33.0, 38.0, 16.0, 19.0, 13.0, 9.0, 8.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.365234375, -3.241973876953125, -3.11871337890625, -2.995452880859375, -2.8721923828125, -2.748931884765625, -2.62567138671875, -2.502410888671875, -2.379150390625, -2.255889892578125, -2.13262939453125, -2.009368896484375, -1.8861083984375, -1.762847900390625, -1.63958740234375, -1.516326904296875, -1.39306640625, -1.269805908203125, -1.14654541015625, -1.023284912109375, -0.9000244140625, -0.776763916015625, -0.65350341796875, -0.530242919921875, -0.406982421875, -0.283721923828125, -0.16046142578125, -0.037200927734375, 0.0860595703125, 0.209320068359375, 0.33258056640625, 0.455841064453125, 0.5791015625, 0.702362060546875, 0.82562255859375, 0.948883056640625, 1.0721435546875, 1.195404052734375, 1.31866455078125, 1.441925048828125, 1.565185546875, 1.688446044921875, 1.81170654296875, 1.934967041015625, 2.0582275390625, 2.181488037109375, 2.30474853515625, 2.428009033203125, 2.55126953125, 2.674530029296875, 2.79779052734375, 2.921051025390625, 3.0443115234375, 3.167572021484375, 3.29083251953125, 3.414093017578125, 3.537353515625, 3.660614013671875, 3.78387451171875, 3.907135009765625, 4.0303955078125, 4.153656005859375, 4.27691650390625, 4.400177001953125, 4.5234375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 0.0, 6.0, 7.0, 9.0, 6.0, 14.0, 10.0, 16.0, 18.0, 25.0, 32.0, 29.0, 21.0, 42.0, 26.0, 34.0, 39.0, 50.0, 55.0, 90.0, 260.0, 1543.0, 199.0, 83.0, 60.0, 46.0, 41.0, 37.0, 34.0, 27.0, 41.0, 25.0, 26.0, 19.0, 16.0, 10.0, 22.0, 9.0, 8.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.7872314453125, -7.480712890625, -7.1741943359375, -6.86767578125, -6.5611572265625, -6.254638671875, -5.9481201171875, -5.6416015625, -5.3350830078125, -5.028564453125, -4.7220458984375, -4.41552734375, -4.1090087890625, -3.802490234375, -3.4959716796875, -3.189453125, -2.8829345703125, -2.576416015625, -2.2698974609375, -1.96337890625, -1.6568603515625, -1.350341796875, -1.0438232421875, -0.7373046875, -0.4307861328125, -0.124267578125, 0.1822509765625, 0.48876953125, 0.7952880859375, 1.101806640625, 1.4083251953125, 1.71484375, 2.0213623046875, 2.327880859375, 2.6343994140625, 2.94091796875, 3.2474365234375, 3.553955078125, 3.8604736328125, 4.1669921875, 4.4735107421875, 4.780029296875, 5.0865478515625, 5.39306640625, 5.6995849609375, 6.006103515625, 6.3126220703125, 6.619140625, 6.9256591796875, 7.232177734375, 7.5386962890625, 7.84521484375, 8.1517333984375, 8.458251953125, 8.7647705078125, 9.0712890625, 9.3778076171875, 9.684326171875, 9.9908447265625, 10.29736328125, 10.6038818359375, 10.910400390625, 11.2169189453125, 11.5234375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 7.0, 11.0, 13.0, 14.0, 21.0, 14.0, 27.0, 30.0, 49.0, 52.0, 76.0, 105.0, 223.0, 420.0, 1068.0, 4428.0, 35660.0, 2576694.0, 506261.0, 16334.0, 2613.0, 719.0, 292.0, 149.0, 98.0, 69.0, 55.0, 35.0, 36.0, 32.0, 20.0, 15.0, 16.0, 11.0, 12.0, 4.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.83251953125, -18.3212890625, -17.81005859375, -17.298828125, -16.78759765625, -16.2763671875, -15.76513671875, -15.25390625, -14.74267578125, -14.2314453125, -13.72021484375, -13.208984375, -12.69775390625, -12.1865234375, -11.67529296875, -11.1640625, -10.65283203125, -10.1416015625, -9.63037109375, -9.119140625, -8.60791015625, -8.0966796875, -7.58544921875, -7.07421875, -6.56298828125, -6.0517578125, -5.54052734375, -5.029296875, -4.51806640625, -4.0068359375, -3.49560546875, -2.984375, -2.47314453125, -1.9619140625, -1.45068359375, -0.939453125, -0.42822265625, 0.0830078125, 0.59423828125, 1.10546875, 1.61669921875, 2.1279296875, 2.63916015625, 3.150390625, 3.66162109375, 4.1728515625, 4.68408203125, 5.1953125, 5.70654296875, 6.2177734375, 6.72900390625, 7.240234375, 7.75146484375, 8.2626953125, 8.77392578125, 9.28515625, 9.79638671875, 10.3076171875, 10.81884765625, 11.330078125, 11.84130859375, 12.3525390625, 12.86376953125, 13.375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 25.0, 59.0, 221.0, 243.0, 221.0, 143.0, 70.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.67424774169922, -39.62382125854492, -38.573394775390625, -37.52296829223633, -36.47254180908203, -35.42211151123047, -34.37168502807617, -33.321258544921875, -32.27083206176758, -31.22040557861328, -30.169979095458984, -29.119550704956055, -28.069124221801758, -27.01869773864746, -25.96826934814453, -24.917842864990234, -23.867416381835938, -22.81698989868164, -21.766563415527344, -20.716135025024414, -19.665708541870117, -18.61528205871582, -17.56485366821289, -16.514427185058594, -15.464000701904297, -14.41357421875, -13.363146781921387, -12.312719345092773, -11.262292861938477, -10.21186637878418, -9.161438941955566, -8.111011505126953, -7.060581207275391, -6.0101542472839355, -4.9597272872924805, -3.9093003273010254, -2.8588733673095703, -1.8084464073181152, -0.7580194473266602, 0.2924075126647949, 1.34283447265625, 2.393261432647705, 3.44368839263916, 4.494115352630615, 5.54454231262207, 6.594969272613525, 7.6453962326049805, 8.695823669433594, 9.74625015258789, 10.796676635742188, 11.8471040725708, 12.897531509399414, 13.947957992553711, 14.998384475708008, 16.048812866210938, 17.099239349365234, 18.14966583251953, 19.200092315673828, 20.250518798828125, 21.300947189331055, 22.35137367248535, 23.40180015563965, 24.452228546142578, 25.502655029296875, 26.553081512451172]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 5.0, 3.0, 11.0, 8.0, 11.0, 11.0, 15.0, 24.0, 14.0, 24.0, 18.0, 27.0, 26.0, 33.0, 36.0, 37.0, 36.0, 37.0, 41.0, 37.0, 34.0, 47.0, 38.0, 32.0, 42.0, 34.0, 44.0, 29.0, 33.0, 24.0, 31.0, 23.0, 23.0, 20.0, 25.0, 14.0, 13.0, 6.0, 10.0, 4.0, 1.0, 7.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.69546890258789, -27.72551918029785, -26.75556755065918, -25.78561782836914, -24.81566619873047, -23.84571647644043, -22.875764846801758, -21.90581512451172, -20.935863494873047, -19.965913772583008, -18.995962142944336, -18.026012420654297, -17.056060791015625, -16.086111068725586, -15.116159439086914, -14.146209716796875, -13.17625904083252, -12.206308364868164, -11.236357688903809, -10.266407012939453, -9.296456336975098, -8.326505661010742, -7.356555461883545, -6.3866047859191895, -5.416654109954834, -4.4467034339904785, -3.476752758026123, -2.5068023204803467, -1.5368516445159912, -0.5669012069702148, 0.4030494689941406, 1.373000144958496, 2.3429508209228516, 3.312901496887207, 4.2828521728515625, 5.252802848815918, 6.222753524780273, 7.192703723907471, 8.162654876708984, 9.132604598999023, 10.102556228637695, 11.07250690460205, 12.042457580566406, 13.012408256530762, 13.982358932495117, 14.952308654785156, 15.922260284423828, 16.892210006713867, 17.862159729003906, 18.832109451293945, 19.802061080932617, 20.772010803222656, 21.741962432861328, 22.711912155151367, 23.68186378479004, 24.651813507080078, 25.62176513671875, 26.59171485900879, 27.56166648864746, 28.5316162109375, 29.501567840576172, 30.47151756286621, 31.441469192504883, 32.41141891479492, 33.381370544433594]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 13.0, 10.0, 14.0, 12.0, 19.0, 23.0, 15.0, 21.0, 21.0, 26.0, 25.0, 36.0, 41.0, 37.0, 43.0, 39.0, 42.0, 39.0, 68.0, 45.0, 52.0, 41.0, 39.0, 25.0, 35.0, 25.0, 23.0, 20.0, 29.0, 23.0, 14.0, 12.0, 19.0, 12.0, 11.0, 12.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.34375, -3.250732421875, -3.15771484375, -3.064697265625, -2.9716796875, -2.878662109375, -2.78564453125, -2.692626953125, -2.599609375, -2.506591796875, -2.41357421875, -2.320556640625, -2.2275390625, -2.134521484375, -2.04150390625, -1.948486328125, -1.85546875, -1.762451171875, -1.66943359375, -1.576416015625, -1.4833984375, -1.390380859375, -1.29736328125, -1.204345703125, -1.111328125, -1.018310546875, -0.92529296875, -0.832275390625, -0.7392578125, -0.646240234375, -0.55322265625, -0.460205078125, -0.3671875, -0.274169921875, -0.18115234375, -0.088134765625, 0.0048828125, 0.097900390625, 0.19091796875, 0.283935546875, 0.376953125, 0.469970703125, 0.56298828125, 0.656005859375, 0.7490234375, 0.842041015625, 0.93505859375, 1.028076171875, 1.12109375, 1.214111328125, 1.30712890625, 1.400146484375, 1.4931640625, 1.586181640625, 1.67919921875, 1.772216796875, 1.865234375, 1.958251953125, 2.05126953125, 2.144287109375, 2.2373046875, 2.330322265625, 2.42333984375, 2.516357421875, 2.609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 7.0, 14.0, 12.0, 21.0, 23.0, 29.0, 38.0, 54.0, 80.0, 124.0, 311.0, 862.0, 3286.0, 18306.0, 199800.0, 3075169.0, 838942.0, 48445.0, 6521.0, 1346.0, 401.0, 155.0, 81.0, 58.0, 30.0, 24.0, 27.0, 19.0, 14.0, 15.0, 11.0, 12.0, 5.0, 10.0, 4.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.8515625, -13.45263671875, -13.0537109375, -12.65478515625, -12.255859375, -11.85693359375, -11.4580078125, -11.05908203125, -10.66015625, -10.26123046875, -9.8623046875, -9.46337890625, -9.064453125, -8.66552734375, -8.2666015625, -7.86767578125, -7.46875, -7.06982421875, -6.6708984375, -6.27197265625, -5.873046875, -5.47412109375, -5.0751953125, -4.67626953125, -4.27734375, -3.87841796875, -3.4794921875, -3.08056640625, -2.681640625, -2.28271484375, -1.8837890625, -1.48486328125, -1.0859375, -0.68701171875, -0.2880859375, 0.11083984375, 0.509765625, 0.90869140625, 1.3076171875, 1.70654296875, 2.10546875, 2.50439453125, 2.9033203125, 3.30224609375, 3.701171875, 4.10009765625, 4.4990234375, 4.89794921875, 5.296875, 5.69580078125, 6.0947265625, 6.49365234375, 6.892578125, 7.29150390625, 7.6904296875, 8.08935546875, 8.48828125, 8.88720703125, 9.2861328125, 9.68505859375, 10.083984375, 10.48291015625, 10.8818359375, 11.28076171875, 11.6796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 8.0, 6.0, 13.0, 16.0, 20.0, 31.0, 49.0, 49.0, 63.0, 126.0, 126.0, 192.0, 214.0, 329.0, 422.0, 454.0, 442.0, 405.0, 307.0, 212.0, 161.0, 104.0, 77.0, 59.0, 43.0, 45.0, 23.0, 13.0, 7.0, 11.0, 9.0, 8.0, 5.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.9609375, -8.70257568359375, -8.4442138671875, -8.18585205078125, -7.927490234375, -7.66912841796875, -7.4107666015625, -7.15240478515625, -6.89404296875, -6.63568115234375, -6.3773193359375, -6.11895751953125, -5.860595703125, -5.60223388671875, -5.3438720703125, -5.08551025390625, -4.8271484375, -4.56878662109375, -4.3104248046875, -4.05206298828125, -3.793701171875, -3.53533935546875, -3.2769775390625, -3.01861572265625, -2.76025390625, -2.50189208984375, -2.2435302734375, -1.98516845703125, -1.726806640625, -1.46844482421875, -1.2100830078125, -0.95172119140625, -0.693359375, -0.43499755859375, -0.1766357421875, 0.08172607421875, 0.340087890625, 0.59844970703125, 0.8568115234375, 1.11517333984375, 1.37353515625, 1.63189697265625, 1.8902587890625, 2.14862060546875, 2.406982421875, 2.66534423828125, 2.9237060546875, 3.18206787109375, 3.4404296875, 3.69879150390625, 3.9571533203125, 4.21551513671875, 4.473876953125, 4.73223876953125, 4.9906005859375, 5.24896240234375, 5.50732421875, 5.76568603515625, 6.0240478515625, 6.28240966796875, 6.540771484375, 6.79913330078125, 7.0574951171875, 7.31585693359375, 7.57421875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 7.0, 19.0, 13.0, 23.0, 52.0, 77.0, 117.0, 184.0, 321.0, 730.0, 1806.0, 5567.0, 23808.0, 153242.0, 1539743.0, 2195451.0, 229954.0, 32154.0, 7113.0, 2142.0, 826.0, 373.0, 196.0, 109.0, 78.0, 49.0, 23.0, 25.0, 13.0, 13.0, 7.0, 11.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.4639892578125, -12.967041015625, -12.4700927734375, -11.97314453125, -11.4761962890625, -10.979248046875, -10.4822998046875, -9.9853515625, -9.4884033203125, -8.991455078125, -8.4945068359375, -7.99755859375, -7.5006103515625, -7.003662109375, -6.5067138671875, -6.009765625, -5.5128173828125, -5.015869140625, -4.5189208984375, -4.02197265625, -3.5250244140625, -3.028076171875, -2.5311279296875, -2.0341796875, -1.5372314453125, -1.040283203125, -0.5433349609375, -0.04638671875, 0.4505615234375, 0.947509765625, 1.4444580078125, 1.94140625, 2.4383544921875, 2.935302734375, 3.4322509765625, 3.92919921875, 4.4261474609375, 4.923095703125, 5.4200439453125, 5.9169921875, 6.4139404296875, 6.910888671875, 7.4078369140625, 7.90478515625, 8.4017333984375, 8.898681640625, 9.3956298828125, 9.892578125, 10.3895263671875, 10.886474609375, 11.3834228515625, 11.88037109375, 12.3773193359375, 12.874267578125, 13.3712158203125, 13.8681640625, 14.3651123046875, 14.862060546875, 15.3590087890625, 15.85595703125, 16.3529052734375, 16.849853515625, 17.3468017578125, 17.84375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 38.0, 102.0, 293.0, 304.0, 186.0, 72.0, 15.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.0171356201172, -221.99790954589844, -217.97866821289062, -213.95944213867188, -209.94020080566406, -205.9209747314453, -201.9017333984375, -197.88250732421875, -193.86326599121094, -189.8440399169922, -185.82479858398438, -181.80557250976562, -177.7863311767578, -173.76710510253906, -169.74786376953125, -165.7286376953125, -161.70941162109375, -157.690185546875, -153.6709442138672, -149.65171813964844, -145.63247680664062, -141.61325073242188, -137.59400939941406, -133.5747833251953, -129.5555419921875, -125.53630828857422, -121.51707458496094, -117.49784088134766, -113.47860717773438, -109.4593734741211, -105.44013977050781, -101.42091369628906, -97.40167999267578, -93.3824462890625, -89.36321258544922, -85.34397888183594, -81.32474517822266, -77.30551147460938, -73.28628540039062, -69.26704406738281, -65.24781799316406, -61.22858428955078, -57.2093505859375, -53.19011688232422, -49.17088317871094, -45.151649475097656, -41.13241958618164, -37.11318588256836, -33.09394836425781, -29.07471466064453, -25.05548095703125, -21.0362491607666, -17.01701545715332, -12.997781753540039, -8.97854995727539, -4.959316253662109, -0.9400844573974609, 3.079148769378662, 7.098381996154785, 11.11761474609375, 15.136848449707031, 19.156082153320312, 23.17531394958496, 27.194547653198242, 31.213781356811523]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 4.0, 7.0, 7.0, 9.0, 9.0, 10.0, 16.0, 12.0, 14.0, 15.0, 20.0, 23.0, 29.0, 22.0, 29.0, 37.0, 40.0, 39.0, 38.0, 46.0, 37.0, 38.0, 43.0, 25.0, 42.0, 37.0, 41.0, 32.0, 23.0, 34.0, 30.0, 29.0, 19.0, 18.0, 16.0, 13.0, 17.0, 8.0, 18.0, 13.0, 12.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.757465362548828, -23.924449920654297, -23.091434478759766, -22.258420944213867, -21.425405502319336, -20.592390060424805, -19.759376525878906, -18.926361083984375, -18.093345642089844, -17.260330200195312, -16.42731475830078, -15.594301223754883, -14.761285781860352, -13.92827033996582, -13.095255851745605, -12.26224136352539, -11.42922592163086, -10.596210479736328, -9.763195991516113, -8.930181503295898, -8.097166061401367, -7.264151096343994, -6.431136131286621, -5.598121166229248, -4.765106201171875, -3.932091236114502, -3.099076271057129, -2.266061305999756, -1.4330463409423828, -0.6000313758850098, 0.23298358917236328, 1.0659985542297363, 1.8990116119384766, 2.7320265769958496, 3.5650415420532227, 4.398056507110596, 5.231071472167969, 6.064086437225342, 6.897101402282715, 7.730116367340088, 8.563131332397461, 9.396146774291992, 10.229161262512207, 11.062175750732422, 11.895191192626953, 12.728206634521484, 13.5612211227417, 14.394235610961914, 15.227251052856445, 16.060266494750977, 16.893280029296875, 17.726295471191406, 18.559310913085938, 19.39232635498047, 20.225341796875, 21.0583553314209, 21.89137077331543, 22.72438621520996, 23.55739974975586, 24.39041519165039, 25.223430633544922, 26.056446075439453, 26.889461517333984, 27.722475051879883, 28.555490493774414]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 9.0, 18.0, 14.0, 16.0, 25.0, 17.0, 26.0, 31.0, 29.0, 34.0, 36.0, 42.0, 43.0, 51.0, 38.0, 55.0, 43.0, 67.0, 51.0, 53.0, 30.0, 34.0, 36.0, 35.0, 30.0, 21.0, 26.0, 19.0, 16.0, 13.0, 8.0, 8.0, 10.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.773223876953125, -3.66558837890625, -3.557952880859375, -3.4503173828125, -3.342681884765625, -3.23504638671875, -3.127410888671875, -3.019775390625, -2.912139892578125, -2.80450439453125, -2.696868896484375, -2.5892333984375, -2.481597900390625, -2.37396240234375, -2.266326904296875, -2.15869140625, -2.051055908203125, -1.94342041015625, -1.835784912109375, -1.7281494140625, -1.620513916015625, -1.51287841796875, -1.405242919921875, -1.297607421875, -1.189971923828125, -1.08233642578125, -0.974700927734375, -0.8670654296875, -0.759429931640625, -0.65179443359375, -0.544158935546875, -0.4365234375, -0.328887939453125, -0.22125244140625, -0.113616943359375, -0.0059814453125, 0.101654052734375, 0.20928955078125, 0.316925048828125, 0.424560546875, 0.532196044921875, 0.63983154296875, 0.747467041015625, 0.8551025390625, 0.962738037109375, 1.07037353515625, 1.178009033203125, 1.28564453125, 1.393280029296875, 1.50091552734375, 1.608551025390625, 1.7161865234375, 1.823822021484375, 1.93145751953125, 2.039093017578125, 2.146728515625, 2.254364013671875, 2.36199951171875, 2.469635009765625, 2.5772705078125, 2.684906005859375, 2.79254150390625, 2.900177001953125, 3.0078125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 7.0, 6.0, 13.0, 20.0, 29.0, 53.0, 62.0, 121.0, 189.0, 328.0, 620.0, 1083.0, 1974.0, 3619.0, 7232.0, 14102.0, 27304.0, 53943.0, 101212.0, 173428.0, 232777.0, 190461.0, 113878.0, 61363.0, 31200.0, 16148.0, 8177.0, 4172.0, 2163.0, 1208.0, 676.0, 387.0, 221.0, 134.0, 79.0, 52.0, 35.0, 23.0, 13.0, 14.0, 9.0, 8.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4580078125, -0.44141387939453125, -0.4248199462890625, -0.40822601318359375, -0.391632080078125, -0.37503814697265625, -0.3584442138671875, -0.34185028076171875, -0.32525634765625, -0.30866241455078125, -0.2920684814453125, -0.27547454833984375, -0.258880615234375, -0.24228668212890625, -0.2256927490234375, -0.20909881591796875, -0.1925048828125, -0.17591094970703125, -0.1593170166015625, -0.14272308349609375, -0.126129150390625, -0.10953521728515625, -0.0929412841796875, -0.07634735107421875, -0.05975341796875, -0.04315948486328125, -0.0265655517578125, -0.00997161865234375, 0.006622314453125, 0.02321624755859375, 0.0398101806640625, 0.05640411376953125, 0.072998046875, 0.08959197998046875, 0.1061859130859375, 0.12277984619140625, 0.139373779296875, 0.15596771240234375, 0.1725616455078125, 0.18915557861328125, 0.20574951171875, 0.22234344482421875, 0.2389373779296875, 0.25553131103515625, 0.272125244140625, 0.28871917724609375, 0.3053131103515625, 0.32190704345703125, 0.3385009765625, 0.35509490966796875, 0.3716888427734375, 0.38828277587890625, 0.404876708984375, 0.42147064208984375, 0.4380645751953125, 0.45465850830078125, 0.47125244140625, 0.48784637451171875, 0.5044403076171875, 0.5210342407226562, 0.537628173828125, 0.5542221069335938, 0.5708160400390625, 0.5874099731445312, 0.60400390625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 6.0, 7.0, 5.0, 4.0, 14.0, 8.0, 11.0, 19.0, 20.0, 19.0, 21.0, 16.0, 19.0, 25.0, 32.0, 30.0, 35.0, 41.0, 50.0, 34.0, 45.0, 1059.0, 46.0, 37.0, 43.0, 50.0, 30.0, 32.0, 41.0, 30.0, 24.0, 31.0, 22.0, 17.0, 11.0, 16.0, 15.0, 6.0, 8.0, 8.0, 6.0, 10.0, 5.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.7187042236328125, -1.660064697265625, -1.6014251708984375, -1.54278564453125, -1.4841461181640625, -1.425506591796875, -1.3668670654296875, -1.3082275390625, -1.2495880126953125, -1.190948486328125, -1.1323089599609375, -1.07366943359375, -1.0150299072265625, -0.956390380859375, -0.8977508544921875, -0.839111328125, -0.7804718017578125, -0.721832275390625, -0.6631927490234375, -0.60455322265625, -0.5459136962890625, -0.487274169921875, -0.4286346435546875, -0.3699951171875, -0.3113555908203125, -0.252716064453125, -0.1940765380859375, -0.13543701171875, -0.0767974853515625, -0.018157958984375, 0.0404815673828125, 0.09912109375, 0.1577606201171875, 0.216400146484375, 0.2750396728515625, 0.33367919921875, 0.3923187255859375, 0.450958251953125, 0.5095977783203125, 0.5682373046875, 0.6268768310546875, 0.685516357421875, 0.7441558837890625, 0.80279541015625, 0.8614349365234375, 0.920074462890625, 0.9787139892578125, 1.037353515625, 1.0959930419921875, 1.154632568359375, 1.2132720947265625, 1.27191162109375, 1.3305511474609375, 1.389190673828125, 1.4478302001953125, 1.5064697265625, 1.5651092529296875, 1.623748779296875, 1.6823883056640625, 1.74102783203125, 1.7996673583984375, 1.858306884765625, 1.9169464111328125, 1.9755859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 5.0, 15.0, 19.0, 32.0, 28.0, 72.0, 75.0, 144.0, 240.0, 379.0, 589.0, 841.0, 1354.0, 2170.0, 3510.0, 5453.0, 9087.0, 15261.0, 25753.0, 44040.0, 73730.0, 116746.0, 174532.0, 1223734.0, 148816.0, 99586.0, 60863.0, 36350.0, 21071.0, 12501.0, 7509.0, 4585.0, 2980.0, 1848.0, 1155.0, 759.0, 454.0, 310.0, 184.0, 124.0, 88.0, 46.0, 29.0, 26.0, 13.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26708984375, -0.2585601806640625, -0.250030517578125, -0.2415008544921875, -0.23297119140625, -0.2244415283203125, -0.215911865234375, -0.2073822021484375, -0.1988525390625, -0.1903228759765625, -0.181793212890625, -0.1732635498046875, -0.16473388671875, -0.1562042236328125, -0.147674560546875, -0.1391448974609375, -0.130615234375, -0.1220855712890625, -0.113555908203125, -0.1050262451171875, -0.09649658203125, -0.0879669189453125, -0.079437255859375, -0.0709075927734375, -0.0623779296875, -0.0538482666015625, -0.045318603515625, -0.0367889404296875, -0.02825927734375, -0.0197296142578125, -0.011199951171875, -0.0026702880859375, 0.005859375, 0.0143890380859375, 0.022918701171875, 0.0314483642578125, 0.03997802734375, 0.0485076904296875, 0.057037353515625, 0.0655670166015625, 0.0740966796875, 0.0826263427734375, 0.091156005859375, 0.0996856689453125, 0.10821533203125, 0.1167449951171875, 0.125274658203125, 0.1338043212890625, 0.142333984375, 0.1508636474609375, 0.159393310546875, 0.1679229736328125, 0.17645263671875, 0.1849822998046875, 0.193511962890625, 0.2020416259765625, 0.2105712890625, 0.2191009521484375, 0.227630615234375, 0.2361602783203125, 0.24468994140625, 0.2532196044921875, 0.261749267578125, 0.2702789306640625, 0.27880859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 5.0, 5.0, 1.0, 2.0, 8.0, 7.0, 6.0, 9.0, 11.0, 17.0, 16.0, 19.0, 13.0, 20.0, 31.0, 32.0, 26.0, 52.0, 60.0, 79.0, 89.0, 106.0, 69.0, 40.0, 41.0, 34.0, 26.0, 23.0, 29.0, 20.0, 16.0, 18.0, 14.0, 11.0, 11.0, 8.0, 7.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0091400146484375, -0.008888006210327148, -0.008635997772216797, -0.008383989334106445, -0.008131980895996094, -0.007879972457885742, -0.007627964019775391, -0.007375955581665039, -0.0071239471435546875, -0.006871938705444336, -0.006619930267333984, -0.006367921829223633, -0.006115913391113281, -0.00586390495300293, -0.005611896514892578, -0.0053598880767822266, -0.005107879638671875, -0.0048558712005615234, -0.004603862762451172, -0.00435185432434082, -0.004099845886230469, -0.003847837448120117, -0.0035958290100097656, -0.003343820571899414, -0.0030918121337890625, -0.002839803695678711, -0.0025877952575683594, -0.002335786819458008, -0.0020837783813476562, -0.0018317699432373047, -0.0015797615051269531, -0.0013277530670166016, -0.00107574462890625, -0.0008237361907958984, -0.0005717277526855469, -0.0003197193145751953, -6.771087646484375e-05, 0.0001842975616455078, 0.0004363059997558594, 0.0006883144378662109, 0.0009403228759765625, 0.001192331314086914, 0.0014443397521972656, 0.0016963481903076172, 0.0019483566284179688, 0.0022003650665283203, 0.002452373504638672, 0.0027043819427490234, 0.002956390380859375, 0.0032083988189697266, 0.003460407257080078, 0.0037124156951904297, 0.003964424133300781, 0.004216432571411133, 0.004468441009521484, 0.004720449447631836, 0.0049724578857421875, 0.005224466323852539, 0.005476474761962891, 0.005728483200073242, 0.005980491638183594, 0.006232500076293945, 0.006484508514404297, 0.0067365169525146484, 0.006988525390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 14.0, 14.0, 22.0, 16.0, 15.0, 31.0, 29.0, 41.0, 67.0, 68.0, 85.0, 98.0, 162.0, 184.0, 285.0, 628.0, 8702.0, 970005.0, 65461.0, 1295.0, 375.0, 229.0, 155.0, 109.0, 98.0, 80.0, 53.0, 48.0, 39.0, 39.0, 19.0, 19.0, 7.0, 9.0, 9.0, 7.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10772228240966797, -0.10368919372558594, -0.0996561050415039, -0.09562301635742188, -0.09158992767333984, -0.08755683898925781, -0.08352375030517578, -0.07949066162109375, -0.07545757293701172, -0.07142448425292969, -0.06739139556884766, -0.06335830688476562, -0.059325218200683594, -0.05529212951660156, -0.05125904083251953, -0.0472259521484375, -0.04319286346435547, -0.03915977478027344, -0.035126686096191406, -0.031093597412109375, -0.027060508728027344, -0.023027420043945312, -0.01899433135986328, -0.01496124267578125, -0.010928153991699219, -0.0068950653076171875, -0.0028619766235351562, 0.001171112060546875, 0.005204200744628906, 0.009237289428710938, 0.013270378112792969, 0.017303466796875, 0.02133655548095703, 0.025369644165039062, 0.029402732849121094, 0.033435821533203125, 0.037468910217285156, 0.04150199890136719, 0.04553508758544922, 0.04956817626953125, 0.05360126495361328, 0.05763435363769531, 0.061667442321777344, 0.06570053100585938, 0.0697336196899414, 0.07376670837402344, 0.07779979705810547, 0.0818328857421875, 0.08586597442626953, 0.08989906311035156, 0.0939321517944336, 0.09796524047851562, 0.10199832916259766, 0.10603141784667969, 0.11006450653076172, 0.11409759521484375, 0.11813068389892578, 0.12216377258300781, 0.12619686126708984, 0.13022994995117188, 0.1342630386352539, 0.13829612731933594, 0.14232921600341797, 0.1463623046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 34.0, 809.0, 169.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1530391275882721, -0.14990441501140594, -0.1467697024345398, -0.14363498985767365, -0.1405002772808075, -0.13736556470394135, -0.1342308521270752, -0.13109613955020905, -0.1279614269733429, -0.12482671439647675, -0.1216920018196106, -0.11855728924274445, -0.1154225766658783, -0.11228786408901215, -0.109153151512146, -0.10601843893527985, -0.1028837189078331, -0.09974900633096695, -0.0966142937541008, -0.09347958117723465, -0.0903448686003685, -0.08721015602350235, -0.0840754359960556, -0.08094072341918945, -0.0778060108423233, -0.07467129826545715, -0.071536585688591, -0.06840187311172485, -0.0652671605348587, -0.062132447957992554, -0.058997731655836105, -0.055863019078969955, -0.052728310227394104, -0.049593597650527954, -0.046458885073661804, -0.043324172496795654, -0.040189459919929504, -0.037054747343063354, -0.033920031040906906, -0.030785318464040756, -0.027650605887174606, -0.024515893310308456, -0.021381180733442307, -0.018246466293931007, -0.015111753717064857, -0.011977041140198708, -0.008842326700687408, -0.0057076141238212585, -0.0025729015469551086, 0.0005618114955723286, 0.0036965245380997658, 0.00683123804628849, 0.00996595062315464, 0.01310066320002079, 0.01623537763953209, 0.01937009021639824, 0.02250480279326439, 0.02563951537013054, 0.02877422794699669, 0.03190894424915314, 0.03504365682601929, 0.03817836940288544, 0.04131308197975159, 0.04444779455661774, 0.04758250713348389]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 7.0, 15.0, 8.0, 20.0, 29.0, 22.0, 29.0, 32.0, 48.0, 50.0, 56.0, 45.0, 52.0, 43.0, 45.0, 56.0, 48.0, 58.0, 41.0, 51.0, 41.0, 41.0, 24.0, 29.0, 24.0, 17.0, 12.0, 21.0, 11.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013088226318359375, -0.012706208974123001, -0.012324191629886627, -0.011942174285650253, -0.01156015694141388, -0.011178139597177505, -0.010796122252941132, -0.010414104908704758, -0.010032087564468384, -0.00965007022023201, -0.009268052875995636, -0.008886035531759262, -0.008504018187522888, -0.008122000843286514, -0.00773998349905014, -0.0073579661548137665, -0.006975948810577393, -0.006593931466341019, -0.006211914122104645, -0.005829896777868271, -0.005447879433631897, -0.005065862089395523, -0.004683844745159149, -0.004301827400922775, -0.003919810056686401, -0.0035377927124500275, -0.0031557753682136536, -0.0027737580239772797, -0.0023917406797409058, -0.002009723335504532, -0.001627705991268158, -0.001245688647031784, -0.0008636713027954102, -0.00048165395855903625, -9.963661432266235e-05, 0.00028238072991371155, 0.0006643980741500854, 0.0010464154183864594, 0.0014284327626228333, 0.0018104501068592072, 0.002192467451095581, 0.002574484795331955, 0.002956502139568329, 0.0033385194838047028, 0.0037205368280410767, 0.0041025541722774506, 0.0044845715165138245, 0.004866588860750198, 0.005248606204986572, 0.005630623549222946, 0.00601264089345932, 0.006394658237695694, 0.006776675581932068, 0.007158692926168442, 0.007540710270404816, 0.00792272761464119, 0.008304744958877563, 0.008686762303113937, 0.009068779647350311, 0.009450796991586685, 0.009832814335823059, 0.010214831680059433, 0.010596849024295807, 0.01097886636853218, 0.011360883712768555]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 9.0, 18.0, 14.0, 16.0, 25.0, 17.0, 26.0, 31.0, 29.0, 34.0, 36.0, 42.0, 43.0, 51.0, 38.0, 55.0, 43.0, 67.0, 51.0, 53.0, 30.0, 34.0, 36.0, 35.0, 31.0, 20.0, 26.0, 19.0, 16.0, 13.0, 8.0, 8.0, 10.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.773223876953125, -3.66558837890625, -3.557952880859375, -3.4503173828125, -3.342681884765625, -3.23504638671875, -3.127410888671875, -3.019775390625, -2.912139892578125, -2.80450439453125, -2.696868896484375, -2.5892333984375, -2.481597900390625, -2.37396240234375, -2.266326904296875, -2.15869140625, -2.051055908203125, -1.94342041015625, -1.835784912109375, -1.7281494140625, -1.620513916015625, -1.51287841796875, -1.405242919921875, -1.297607421875, -1.189971923828125, -1.08233642578125, -0.974700927734375, -0.8670654296875, -0.759429931640625, -0.65179443359375, -0.544158935546875, -0.4365234375, -0.328887939453125, -0.22125244140625, -0.113616943359375, -0.0059814453125, 0.101654052734375, 0.20928955078125, 0.316925048828125, 0.424560546875, 0.532196044921875, 0.63983154296875, 0.747467041015625, 0.8551025390625, 0.962738037109375, 1.07037353515625, 1.178009033203125, 1.28564453125, 1.393280029296875, 1.50091552734375, 1.608551025390625, 1.7161865234375, 1.823822021484375, 1.93145751953125, 2.039093017578125, 2.146728515625, 2.254364013671875, 2.36199951171875, 2.469635009765625, 2.5772705078125, 2.684906005859375, 2.79254150390625, 2.900177001953125, 3.0078125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 18.0, 38.0, 37.0, 42.0, 67.0, 96.0, 173.0, 204.0, 352.0, 635.0, 1100.0, 2250.0, 5073.0, 12518.0, 33915.0, 118664.0, 399620.0, 334746.0, 92111.0, 27570.0, 10341.0, 4366.0, 2011.0, 1058.0, 576.0, 304.0, 213.0, 151.0, 104.0, 62.0, 34.0, 30.0, 25.0, 15.0, 6.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1171875, -3.995758056640625, -3.87432861328125, -3.752899169921875, -3.6314697265625, -3.510040283203125, -3.38861083984375, -3.267181396484375, -3.145751953125, -3.024322509765625, -2.90289306640625, -2.781463623046875, -2.6600341796875, -2.538604736328125, -2.41717529296875, -2.295745849609375, -2.17431640625, -2.052886962890625, -1.93145751953125, -1.810028076171875, -1.6885986328125, -1.567169189453125, -1.44573974609375, -1.324310302734375, -1.202880859375, -1.081451416015625, -0.96002197265625, -0.838592529296875, -0.7171630859375, -0.595733642578125, -0.47430419921875, -0.352874755859375, -0.2314453125, -0.110015869140625, 0.01141357421875, 0.132843017578125, 0.2542724609375, 0.375701904296875, 0.49713134765625, 0.618560791015625, 0.739990234375, 0.861419677734375, 0.98284912109375, 1.104278564453125, 1.2257080078125, 1.347137451171875, 1.46856689453125, 1.589996337890625, 1.71142578125, 1.832855224609375, 1.95428466796875, 2.075714111328125, 2.1971435546875, 2.318572998046875, 2.44000244140625, 2.561431884765625, 2.682861328125, 2.804290771484375, 2.92572021484375, 3.047149658203125, 3.1685791015625, 3.290008544921875, 3.41143798828125, 3.532867431640625, 3.654296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 3.0, 15.0, 7.0, 17.0, 16.0, 19.0, 21.0, 25.0, 33.0, 34.0, 41.0, 45.0, 46.0, 37.0, 64.0, 140.0, 427.0, 1454.0, 132.0, 51.0, 50.0, 48.0, 39.0, 40.0, 34.0, 34.0, 26.0, 17.0, 23.0, 23.0, 11.0, 8.0, 10.0, 5.0, 13.0, 3.0, 5.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.5006103515625, -9.173095703125, -8.8455810546875, -8.51806640625, -8.1905517578125, -7.863037109375, -7.5355224609375, -7.2080078125, -6.8804931640625, -6.552978515625, -6.2254638671875, -5.89794921875, -5.5704345703125, -5.242919921875, -4.9154052734375, -4.587890625, -4.2603759765625, -3.932861328125, -3.6053466796875, -3.27783203125, -2.9503173828125, -2.622802734375, -2.2952880859375, -1.9677734375, -1.6402587890625, -1.312744140625, -0.9852294921875, -0.65771484375, -0.3302001953125, -0.002685546875, 0.3248291015625, 0.65234375, 0.9798583984375, 1.307373046875, 1.6348876953125, 1.96240234375, 2.2899169921875, 2.617431640625, 2.9449462890625, 3.2724609375, 3.5999755859375, 3.927490234375, 4.2550048828125, 4.58251953125, 4.9100341796875, 5.237548828125, 5.5650634765625, 5.892578125, 6.2200927734375, 6.547607421875, 6.8751220703125, 7.20263671875, 7.5301513671875, 7.857666015625, 8.1851806640625, 8.5126953125, 8.8402099609375, 9.167724609375, 9.4952392578125, 9.82275390625, 10.1502685546875, 10.477783203125, 10.8052978515625, 11.1328125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 2.0, 5.0, 4.0, 6.0, 11.0, 7.0, 6.0, 11.0, 13.0, 21.0, 26.0, 32.0, 23.0, 39.0, 62.0, 76.0, 137.0, 207.0, 337.0, 811.0, 2456.0, 14411.0, 259293.0, 2797555.0, 60917.0, 6415.0, 1446.0, 560.0, 258.0, 151.0, 106.0, 53.0, 49.0, 37.0, 23.0, 31.0, 20.0, 16.0, 12.0, 14.0, 7.0, 6.0, 4.0, 4.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.6484375, -13.197998046875, -12.74755859375, -12.297119140625, -11.8466796875, -11.396240234375, -10.94580078125, -10.495361328125, -10.044921875, -9.594482421875, -9.14404296875, -8.693603515625, -8.2431640625, -7.792724609375, -7.34228515625, -6.891845703125, -6.44140625, -5.990966796875, -5.54052734375, -5.090087890625, -4.6396484375, -4.189208984375, -3.73876953125, -3.288330078125, -2.837890625, -2.387451171875, -1.93701171875, -1.486572265625, -1.0361328125, -0.585693359375, -0.13525390625, 0.315185546875, 0.765625, 1.216064453125, 1.66650390625, 2.116943359375, 2.5673828125, 3.017822265625, 3.46826171875, 3.918701171875, 4.369140625, 4.819580078125, 5.27001953125, 5.720458984375, 6.1708984375, 6.621337890625, 7.07177734375, 7.522216796875, 7.97265625, 8.423095703125, 8.87353515625, 9.323974609375, 9.7744140625, 10.224853515625, 10.67529296875, 11.125732421875, 11.576171875, 12.026611328125, 12.47705078125, 12.927490234375, 13.3779296875, 13.828369140625, 14.27880859375, 14.729248046875, 15.1796875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 92.0, 436.0, 393.0, 79.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.15377807617188, -78.89427185058594, -76.63475799560547, -74.37525177001953, -72.11573791503906, -69.85623168945312, -67.59671783447266, -65.33721160888672, -63.07769775390625, -60.81818771362305, -58.558677673339844, -56.29916763305664, -54.03965759277344, -51.780147552490234, -49.52063751220703, -47.261131286621094, -45.00162124633789, -42.74211120605469, -40.482601165771484, -38.22309112548828, -35.96358108520508, -33.704071044921875, -31.444562911987305, -29.1850528717041, -26.9255428314209, -24.666032791137695, -22.406522750854492, -20.147014617919922, -17.88750457763672, -15.6279935836792, -13.368484497070312, -11.10897445678711, -8.849468231201172, -6.589958190917969, -4.330448627471924, -2.070939064025879, 0.18857097625732422, 2.4480810165405273, 4.707590103149414, 6.967100143432617, 9.22661018371582, 11.486120223999023, 13.745630264282227, 16.005138397216797, 18.2646484375, 20.524158477783203, 22.783668518066406, 25.04317855834961, 27.302688598632812, 29.562198638916016, 31.82170867919922, 34.08121871948242, 36.340728759765625, 38.60023880004883, 40.85974884033203, 43.11925506591797, 45.37876892089844, 47.63827896118164, 49.897789001464844, 52.15729904174805, 54.41680908203125, 56.67631912231445, 58.935829162597656, 61.195335388183594, 63.4548454284668]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 10.0, 8.0, 11.0, 12.0, 20.0, 20.0, 20.0, 20.0, 22.0, 26.0, 25.0, 27.0, 41.0, 32.0, 26.0, 41.0, 42.0, 33.0, 44.0, 47.0, 47.0, 53.0, 40.0, 27.0, 38.0, 41.0, 25.0, 26.0, 28.0, 19.0, 21.0, 17.0, 10.0, 16.0, 14.0, 8.0, 5.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-39.18626403808594, -38.09932327270508, -37.01238250732422, -35.92544174194336, -34.8385009765625, -33.75156021118164, -32.66461944580078, -31.577678680419922, -30.490737915039062, -29.403797149658203, -28.316856384277344, -27.229915618896484, -26.142974853515625, -25.056034088134766, -23.969093322753906, -22.882152557373047, -21.795211791992188, -20.708271026611328, -19.62133026123047, -18.53438949584961, -17.44744873046875, -16.36050796508789, -15.273567199707031, -14.186626434326172, -13.099685668945312, -12.012744903564453, -10.925804138183594, -9.838863372802734, -8.751922607421875, -7.664981842041016, -6.578041076660156, -5.491100311279297, -4.4041595458984375, -3.317218780517578, -2.2302780151367188, -1.1433372497558594, -0.056396484375, 1.0305442810058594, 2.1174850463867188, 3.204425811767578, 4.2913665771484375, 5.378307342529297, 6.465248107910156, 7.552188873291016, 8.639129638671875, 9.726070404052734, 10.813011169433594, 11.899951934814453, 12.986892700195312, 14.073833465576172, 15.160774230957031, 16.24771499633789, 17.33465576171875, 18.42159652709961, 19.50853729248047, 20.595478057861328, 21.682418823242188, 22.769359588623047, 23.856300354003906, 24.943241119384766, 26.030181884765625, 27.117122650146484, 28.204063415527344, 29.291004180908203, 30.377944946289062]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 8.0, 18.0, 20.0, 15.0, 23.0, 27.0, 18.0, 34.0, 25.0, 36.0, 34.0, 37.0, 43.0, 40.0, 51.0, 41.0, 54.0, 55.0, 45.0, 50.0, 47.0, 33.0, 30.0, 34.0, 25.0, 24.0, 24.0, 26.0, 13.0, 17.0, 11.0, 13.0, 5.0, 5.0, 5.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.700408935546875, -3.59222412109375, -3.484039306640625, -3.3758544921875, -3.267669677734375, -3.15948486328125, -3.051300048828125, -2.943115234375, -2.834930419921875, -2.72674560546875, -2.618560791015625, -2.5103759765625, -2.402191162109375, -2.29400634765625, -2.185821533203125, -2.07763671875, -1.969451904296875, -1.86126708984375, -1.753082275390625, -1.6448974609375, -1.536712646484375, -1.42852783203125, -1.320343017578125, -1.212158203125, -1.103973388671875, -0.99578857421875, -0.887603759765625, -0.7794189453125, -0.671234130859375, -0.56304931640625, -0.454864501953125, -0.3466796875, -0.238494873046875, -0.13031005859375, -0.022125244140625, 0.0860595703125, 0.194244384765625, 0.30242919921875, 0.410614013671875, 0.518798828125, 0.626983642578125, 0.73516845703125, 0.843353271484375, 0.9515380859375, 1.059722900390625, 1.16790771484375, 1.276092529296875, 1.38427734375, 1.492462158203125, 1.60064697265625, 1.708831787109375, 1.8170166015625, 1.925201416015625, 2.03338623046875, 2.141571044921875, 2.249755859375, 2.357940673828125, 2.46612548828125, 2.574310302734375, 2.6824951171875, 2.790679931640625, 2.89886474609375, 3.007049560546875, 3.115234375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 12.0, 11.0, 13.0, 24.0, 29.0, 52.0, 67.0, 113.0, 178.0, 342.0, 766.0, 1885.0, 5375.0, 18127.0, 81319.0, 568141.0, 2542198.0, 829272.0, 112520.0, 23405.0, 6571.0, 2168.0, 809.0, 390.0, 181.0, 102.0, 57.0, 38.0, 27.0, 18.0, 24.0, 12.0, 5.0, 7.0, 5.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.29241943359375, -8.0379638671875, -7.78350830078125, -7.529052734375, -7.27459716796875, -7.0201416015625, -6.76568603515625, -6.51123046875, -6.25677490234375, -6.0023193359375, -5.74786376953125, -5.493408203125, -5.23895263671875, -4.9844970703125, -4.73004150390625, -4.4755859375, -4.22113037109375, -3.9666748046875, -3.71221923828125, -3.457763671875, -3.20330810546875, -2.9488525390625, -2.69439697265625, -2.43994140625, -2.18548583984375, -1.9310302734375, -1.67657470703125, -1.422119140625, -1.16766357421875, -0.9132080078125, -0.65875244140625, -0.404296875, -0.14984130859375, 0.1046142578125, 0.35906982421875, 0.613525390625, 0.86798095703125, 1.1224365234375, 1.37689208984375, 1.63134765625, 1.88580322265625, 2.1402587890625, 2.39471435546875, 2.649169921875, 2.90362548828125, 3.1580810546875, 3.41253662109375, 3.6669921875, 3.92144775390625, 4.1759033203125, 4.43035888671875, 4.684814453125, 4.93927001953125, 5.1937255859375, 5.44818115234375, 5.70263671875, 5.95709228515625, 6.2115478515625, 6.46600341796875, 6.720458984375, 6.97491455078125, 7.2293701171875, 7.48382568359375, 7.73828125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 1.0, 6.0, 5.0, 6.0, 13.0, 19.0, 23.0, 19.0, 33.0, 42.0, 52.0, 61.0, 97.0, 137.0, 163.0, 248.0, 342.0, 453.0, 488.0, 448.0, 393.0, 289.0, 224.0, 127.0, 102.0, 76.0, 46.0, 42.0, 32.0, 22.0, 19.0, 11.0, 8.0, 3.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.421875, -9.1494140625, -8.876953125, -8.6044921875, -8.33203125, -8.0595703125, -7.787109375, -7.5146484375, -7.2421875, -6.9697265625, -6.697265625, -6.4248046875, -6.15234375, -5.8798828125, -5.607421875, -5.3349609375, -5.0625, -4.7900390625, -4.517578125, -4.2451171875, -3.97265625, -3.7001953125, -3.427734375, -3.1552734375, -2.8828125, -2.6103515625, -2.337890625, -2.0654296875, -1.79296875, -1.5205078125, -1.248046875, -0.9755859375, -0.703125, -0.4306640625, -0.158203125, 0.1142578125, 0.38671875, 0.6591796875, 0.931640625, 1.2041015625, 1.4765625, 1.7490234375, 2.021484375, 2.2939453125, 2.56640625, 2.8388671875, 3.111328125, 3.3837890625, 3.65625, 3.9287109375, 4.201171875, 4.4736328125, 4.74609375, 5.0185546875, 5.291015625, 5.5634765625, 5.8359375, 6.1083984375, 6.380859375, 6.6533203125, 6.92578125, 7.1982421875, 7.470703125, 7.7431640625, 8.015625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 9.0, 11.0, 16.0, 14.0, 29.0, 60.0, 91.0, 111.0, 191.0, 344.0, 584.0, 1128.0, 2362.0, 5261.0, 14202.0, 46823.0, 211341.0, 1209604.0, 2137251.0, 440988.0, 86425.0, 22942.0, 7789.0, 3263.0, 1562.0, 813.0, 428.0, 236.0, 136.0, 107.0, 59.0, 25.0, 26.0, 17.0, 12.0, 7.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.171875, -11.805419921875, -11.43896484375, -11.072509765625, -10.7060546875, -10.339599609375, -9.97314453125, -9.606689453125, -9.240234375, -8.873779296875, -8.50732421875, -8.140869140625, -7.7744140625, -7.407958984375, -7.04150390625, -6.675048828125, -6.30859375, -5.942138671875, -5.57568359375, -5.209228515625, -4.8427734375, -4.476318359375, -4.10986328125, -3.743408203125, -3.376953125, -3.010498046875, -2.64404296875, -2.277587890625, -1.9111328125, -1.544677734375, -1.17822265625, -0.811767578125, -0.4453125, -0.078857421875, 0.28759765625, 0.654052734375, 1.0205078125, 1.386962890625, 1.75341796875, 2.119873046875, 2.486328125, 2.852783203125, 3.21923828125, 3.585693359375, 3.9521484375, 4.318603515625, 4.68505859375, 5.051513671875, 5.41796875, 5.784423828125, 6.15087890625, 6.517333984375, 6.8837890625, 7.250244140625, 7.61669921875, 7.983154296875, 8.349609375, 8.716064453125, 9.08251953125, 9.448974609375, 9.8154296875, 10.181884765625, 10.54833984375, 10.914794921875, 11.28125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 19.0, 64.0, 138.0, 237.0, 266.0, 175.0, 73.0, 22.0, 13.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.69281005859375, -169.1873321533203, -165.68185424804688, -162.1763916015625, -158.67091369628906, -155.16543579101562, -151.6599578857422, -148.15447998046875, -144.6490020751953, -141.14352416992188, -137.63804626464844, -134.132568359375, -130.62710571289062, -127.12162780761719, -123.61614990234375, -120.11067199707031, -116.6052017211914, -113.09972381591797, -109.59425354003906, -106.08877563476562, -102.58329772949219, -99.07781982421875, -95.57234954833984, -92.0668716430664, -88.5614013671875, -85.05592346191406, -81.55045318603516, -78.04497528076172, -74.53949737548828, -71.03402709960938, -67.52854919433594, -64.0230712890625, -60.51759719848633, -57.012123107910156, -53.50664520263672, -50.00117111206055, -46.495697021484375, -42.99021911621094, -39.484745025634766, -35.979270935058594, -32.473793029785156, -28.96831703186035, -25.462841033935547, -21.957366943359375, -18.45189094543457, -14.946414947509766, -11.440940856933594, -7.935464859008789, -4.429988861083984, -0.9245133399963379, 2.5809621810913086, 6.086437225341797, 9.591913223266602, 13.097389221191406, 16.602863311767578, 20.108339309692383, 23.613815307617188, 27.119291305541992, 30.624767303466797, 34.13024139404297, 37.635719299316406, 41.14119338989258, 44.64666748046875, 48.15214538574219, 51.65761947631836]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 1.0, 8.0, 3.0, 4.0, 12.0, 11.0, 10.0, 19.0, 19.0, 16.0, 19.0, 27.0, 14.0, 22.0, 23.0, 28.0, 21.0, 25.0, 30.0, 25.0, 30.0, 38.0, 40.0, 40.0, 40.0, 33.0, 46.0, 29.0, 42.0, 26.0, 34.0, 20.0, 29.0, 31.0, 19.0, 23.0, 23.0, 18.0, 16.0, 12.0, 6.0, 6.0, 7.0, 10.0, 12.0, 8.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-26.002193450927734, -25.206300735473633, -24.41040802001953, -23.61451530456543, -22.818622589111328, -22.022727966308594, -21.226837158203125, -20.43094253540039, -19.63504981994629, -18.839157104492188, -18.043264389038086, -17.247371673583984, -16.451478958129883, -15.655585289001465, -14.859692573547363, -14.063798904418945, -13.26790714263916, -12.472014427185059, -11.676121711730957, -10.880228042602539, -10.084335327148438, -9.288442611694336, -8.492549896240234, -7.696656703948975, -6.900763988494873, -6.1048712730407715, -5.308978080749512, -4.51308536529541, -3.7171924114227295, -2.921299457550049, -2.1254067420959473, -1.3295135498046875, -0.5336208343505859, 0.26227205991744995, 1.0581649541854858, 1.854057788848877, 2.6499507427215576, 3.4458436965942383, 4.24173641204834, 5.0376296043396, 5.833522319793701, 6.629415035247803, 7.4253082275390625, 8.221200942993164, 9.017093658447266, 9.812986373901367, 10.608879089355469, 11.404772758483887, 12.200665473937988, 12.99655818939209, 13.792450904846191, 14.58834457397461, 15.384237289428711, 16.180130004882812, 16.976022720336914, 17.771915435791016, 18.567808151245117, 19.36370086669922, 20.15959358215332, 20.955486297607422, 21.751379013061523, 22.547271728515625, 23.34316635131836, 24.13905906677246, 24.934951782226562]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 8.0, 10.0, 8.0, 9.0, 12.0, 18.0, 22.0, 26.0, 20.0, 26.0, 34.0, 29.0, 38.0, 40.0, 39.0, 43.0, 48.0, 48.0, 49.0, 49.0, 52.0, 41.0, 58.0, 27.0, 27.0, 40.0, 30.0, 24.0, 25.0, 23.0, 19.0, 15.0, 10.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.87109375, -3.7589111328125, -3.646728515625, -3.5345458984375, -3.42236328125, -3.3101806640625, -3.197998046875, -3.0858154296875, -2.9736328125, -2.8614501953125, -2.749267578125, -2.6370849609375, -2.52490234375, -2.4127197265625, -2.300537109375, -2.1883544921875, -2.076171875, -1.9639892578125, -1.851806640625, -1.7396240234375, -1.62744140625, -1.5152587890625, -1.403076171875, -1.2908935546875, -1.1787109375, -1.0665283203125, -0.954345703125, -0.8421630859375, -0.72998046875, -0.6177978515625, -0.505615234375, -0.3934326171875, -0.28125, -0.1690673828125, -0.056884765625, 0.0552978515625, 0.16748046875, 0.2796630859375, 0.391845703125, 0.5040283203125, 0.6162109375, 0.7283935546875, 0.840576171875, 0.9527587890625, 1.06494140625, 1.1771240234375, 1.289306640625, 1.4014892578125, 1.513671875, 1.6258544921875, 1.738037109375, 1.8502197265625, 1.96240234375, 2.0745849609375, 2.186767578125, 2.2989501953125, 2.4111328125, 2.5233154296875, 2.635498046875, 2.7476806640625, 2.85986328125, 2.9720458984375, 3.084228515625, 3.1964111328125, 3.30859375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 15.0, 11.0, 19.0, 32.0, 42.0, 64.0, 115.0, 177.0, 282.0, 470.0, 737.0, 1375.0, 2259.0, 3965.0, 7050.0, 12266.0, 21702.0, 37622.0, 65142.0, 107675.0, 158843.0, 192413.0, 163119.0, 111514.0, 68401.0, 40253.0, 22793.0, 12801.0, 7332.0, 4176.0, 2432.0, 1366.0, 812.0, 488.0, 304.0, 184.0, 110.0, 63.0, 40.0, 33.0, 15.0, 10.0, 11.0, 5.0, 5.0, 5.0, 0.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.5185546875, -0.5035438537597656, -0.48853302001953125, -0.4735221862792969, -0.4585113525390625, -0.4435005187988281, -0.42848968505859375, -0.4134788513183594, -0.398468017578125, -0.3834571838378906, -0.36844635009765625, -0.3534355163574219, -0.3384246826171875, -0.3234138488769531, -0.30840301513671875, -0.2933921813964844, -0.27838134765625, -0.2633705139160156, -0.24835968017578125, -0.23334884643554688, -0.2183380126953125, -0.20332717895507812, -0.18831634521484375, -0.17330551147460938, -0.158294677734375, -0.14328384399414062, -0.12827301025390625, -0.11326217651367188, -0.0982513427734375, -0.08324050903320312, -0.06822967529296875, -0.053218841552734375, -0.0382080078125, -0.023197174072265625, -0.00818634033203125, 0.006824493408203125, 0.0218353271484375, 0.036846160888671875, 0.05185699462890625, 0.06686782836914062, 0.081878662109375, 0.09688949584960938, 0.11190032958984375, 0.12691116333007812, 0.1419219970703125, 0.15693283081054688, 0.17194366455078125, 0.18695449829101562, 0.20196533203125, 0.21697616577148438, 0.23198699951171875, 0.24699783325195312, 0.2620086669921875, 0.2770195007324219, 0.29203033447265625, 0.3070411682128906, 0.322052001953125, 0.3370628356933594, 0.35207366943359375, 0.3670845031738281, 0.3820953369140625, 0.3971061706542969, 0.41211700439453125, 0.4271278381347656, 0.442138671875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 7.0, 1.0, 5.0, 10.0, 5.0, 14.0, 22.0, 8.0, 26.0, 21.0, 25.0, 30.0, 17.0, 26.0, 26.0, 24.0, 41.0, 34.0, 39.0, 46.0, 42.0, 1047.0, 41.0, 32.0, 35.0, 35.0, 53.0, 34.0, 31.0, 33.0, 35.0, 28.0, 18.0, 20.0, 24.0, 19.0, 15.0, 14.0, 8.0, 8.0, 8.0, 9.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.950164794921875, -1.88470458984375, -1.819244384765625, -1.7537841796875, -1.688323974609375, -1.62286376953125, -1.557403564453125, -1.491943359375, -1.426483154296875, -1.36102294921875, -1.295562744140625, -1.2301025390625, -1.164642333984375, -1.09918212890625, -1.033721923828125, -0.96826171875, -0.902801513671875, -0.83734130859375, -0.771881103515625, -0.7064208984375, -0.640960693359375, -0.57550048828125, -0.510040283203125, -0.444580078125, -0.379119873046875, -0.31365966796875, -0.248199462890625, -0.1827392578125, -0.117279052734375, -0.05181884765625, 0.013641357421875, 0.0791015625, 0.144561767578125, 0.21002197265625, 0.275482177734375, 0.3409423828125, 0.406402587890625, 0.47186279296875, 0.537322998046875, 0.602783203125, 0.668243408203125, 0.73370361328125, 0.799163818359375, 0.8646240234375, 0.930084228515625, 0.99554443359375, 1.061004638671875, 1.12646484375, 1.191925048828125, 1.25738525390625, 1.322845458984375, 1.3883056640625, 1.453765869140625, 1.51922607421875, 1.584686279296875, 1.650146484375, 1.715606689453125, 1.78106689453125, 1.846527099609375, 1.9119873046875, 1.977447509765625, 2.04290771484375, 2.108367919921875, 2.173828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 12.0, 13.0, 21.0, 39.0, 42.0, 48.0, 106.0, 138.0, 221.0, 300.0, 445.0, 705.0, 1062.0, 1548.0, 2519.0, 4005.0, 6253.0, 9801.0, 15559.0, 25212.0, 41056.0, 64802.0, 98179.0, 139364.0, 1200802.0, 164308.0, 113327.0, 76461.0, 48953.0, 30737.0, 18894.0, 11689.0, 7322.0, 4758.0, 2861.0, 1896.0, 1161.0, 859.0, 561.0, 389.0, 234.0, 157.0, 100.0, 73.0, 45.0, 29.0, 19.0, 17.0, 14.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.26318359375, -0.254608154296875, -0.24603271484375, -0.237457275390625, -0.2288818359375, -0.220306396484375, -0.21173095703125, -0.203155517578125, -0.194580078125, -0.186004638671875, -0.17742919921875, -0.168853759765625, -0.1602783203125, -0.151702880859375, -0.14312744140625, -0.134552001953125, -0.1259765625, -0.117401123046875, -0.10882568359375, -0.100250244140625, -0.0916748046875, -0.083099365234375, -0.07452392578125, -0.065948486328125, -0.057373046875, -0.048797607421875, -0.04022216796875, -0.031646728515625, -0.0230712890625, -0.014495849609375, -0.00592041015625, 0.002655029296875, 0.01123046875, 0.019805908203125, 0.02838134765625, 0.036956787109375, 0.0455322265625, 0.054107666015625, 0.06268310546875, 0.071258544921875, 0.079833984375, 0.088409423828125, 0.09698486328125, 0.105560302734375, 0.1141357421875, 0.122711181640625, 0.13128662109375, 0.139862060546875, 0.1484375, 0.157012939453125, 0.16558837890625, 0.174163818359375, 0.1827392578125, 0.191314697265625, 0.19989013671875, 0.208465576171875, 0.217041015625, 0.225616455078125, 0.23419189453125, 0.242767333984375, 0.2513427734375, 0.259918212890625, 0.26849365234375, 0.277069091796875, 0.28564453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 5.0, 7.0, 5.0, 14.0, 12.0, 20.0, 21.0, 24.0, 41.0, 37.0, 55.0, 65.0, 78.0, 125.0, 120.0, 92.0, 62.0, 32.0, 41.0, 29.0, 12.0, 15.0, 20.0, 20.0, 9.0, 10.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0138702392578125, -0.013421177864074707, -0.012972116470336914, -0.012523055076599121, -0.012073993682861328, -0.011624932289123535, -0.011175870895385742, -0.01072680950164795, -0.010277748107910156, -0.009828686714172363, -0.00937962532043457, -0.008930563926696777, -0.008481502532958984, -0.008032441139221191, -0.0075833797454833984, -0.0071343183517456055, -0.0066852569580078125, -0.0062361955642700195, -0.0057871341705322266, -0.005338072776794434, -0.004889011383056641, -0.004439949989318848, -0.003990888595581055, -0.0035418272018432617, -0.0030927658081054688, -0.0026437044143676758, -0.002194643020629883, -0.0017455816268920898, -0.0012965202331542969, -0.0008474588394165039, -0.00039839744567871094, 5.066394805908203e-05, 0.000499725341796875, 0.000948786735534668, 0.001397848129272461, 0.001846909523010254, 0.002295970916748047, 0.00274503231048584, 0.003194093704223633, 0.0036431550979614258, 0.004092216491699219, 0.004541277885437012, 0.004990339279174805, 0.005439400672912598, 0.005888462066650391, 0.006337523460388184, 0.0067865848541259766, 0.0072356462478637695, 0.0076847076416015625, 0.008133769035339355, 0.008582830429077148, 0.009031891822814941, 0.009480953216552734, 0.009930014610290527, 0.01037907600402832, 0.010828137397766113, 0.011277198791503906, 0.0117262601852417, 0.012175321578979492, 0.012624382972717285, 0.013073444366455078, 0.013522505760192871, 0.013971567153930664, 0.014420628547668457, 0.01486968994140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 15.0, 25.0, 36.0, 40.0, 41.0, 54.0, 107.0, 136.0, 241.0, 342.0, 953.0, 52798.0, 989815.0, 2631.0, 465.0, 255.0, 147.0, 123.0, 89.0, 59.0, 46.0, 24.0, 25.0, 13.0, 10.0, 9.0, 3.0, 9.0, 5.0, 6.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2305908203125, -0.2236480712890625, -0.216705322265625, -0.2097625732421875, -0.20281982421875, -0.1958770751953125, -0.188934326171875, -0.1819915771484375, -0.175048828125, -0.1681060791015625, -0.161163330078125, -0.1542205810546875, -0.14727783203125, -0.1403350830078125, -0.133392333984375, -0.1264495849609375, -0.1195068359375, -0.1125640869140625, -0.105621337890625, -0.0986785888671875, -0.09173583984375, -0.0847930908203125, -0.077850341796875, -0.0709075927734375, -0.06396484375, -0.0570220947265625, -0.050079345703125, -0.0431365966796875, -0.03619384765625, -0.0292510986328125, -0.022308349609375, -0.0153656005859375, -0.0084228515625, -0.0014801025390625, 0.005462646484375, 0.0124053955078125, 0.01934814453125, 0.0262908935546875, 0.033233642578125, 0.0401763916015625, 0.047119140625, 0.0540618896484375, 0.061004638671875, 0.0679473876953125, 0.07489013671875, 0.0818328857421875, 0.088775634765625, 0.0957183837890625, 0.1026611328125, 0.1096038818359375, 0.116546630859375, 0.1234893798828125, 0.13043212890625, 0.1373748779296875, 0.144317626953125, 0.1512603759765625, 0.158203125, 0.1651458740234375, 0.172088623046875, 0.1790313720703125, 0.18597412109375, 0.1929168701171875, 0.199859619140625, 0.2068023681640625, 0.2137451171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 61.0, 938.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13172505795955658, -0.1265614628791809, -0.12139785289764404, -0.11623425036668777, -0.1110706478357315, -0.10590704530477524, -0.10074344277381897, -0.0955798402428627, -0.09041623771190643, -0.08525263518095016, -0.0800890326499939, -0.07492543011903763, -0.06976182758808136, -0.06459822505712509, -0.05943462252616882, -0.054271019995212555, -0.04910741746425629, -0.04394381493330002, -0.03878021240234375, -0.03361660987138748, -0.028453007340431213, -0.023289404809474945, -0.018125802278518677, -0.012962199747562408, -0.00779859721660614, -0.002634994685649872, 0.0025286078453063965, 0.007692210376262665, 0.012855812907218933, 0.0180194154381752, 0.02318301796913147, 0.028346620500087738, 0.033510223031044006, 0.038673825562000275, 0.04383742809295654, 0.04900103062391281, 0.05416463315486908, 0.05932823568582535, 0.06449183821678162, 0.06965544074773788, 0.07481904327869415, 0.07998264580965042, 0.08514624834060669, 0.09030985087156296, 0.09547345340251923, 0.1006370559334755, 0.10580065846443176, 0.11096426099538803, 0.1161278635263443, 0.12129146605730057, 0.12645506858825684, 0.1316186785697937, 0.13678227365016937, 0.14194586873054504, 0.1471094787120819, 0.15227308869361877, 0.15743668377399445, 0.16260027885437012, 0.16776388883590698, 0.17292749881744385, 0.17809109389781952, 0.1832546889781952, 0.18841829895973206, 0.19358190894126892, 0.1987455040216446]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 9.0, 7.0, 7.0, 11.0, 19.0, 18.0, 17.0, 30.0, 20.0, 19.0, 30.0, 41.0, 39.0, 24.0, 33.0, 36.0, 49.0, 43.0, 36.0, 37.0, 34.0, 39.0, 39.0, 36.0, 40.0, 40.0, 35.0, 28.0, 26.0, 26.0, 23.0, 14.0, 19.0, 11.0, 8.0, 14.0, 4.0, 8.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.013681352138519287, -0.01326003111898899, -0.012838710099458694, -0.012417389079928398, -0.011996068060398102, -0.011574747040867805, -0.01115342602133751, -0.010732105001807213, -0.010310783982276917, -0.00988946296274662, -0.009468141943216324, -0.009046820923686028, -0.008625499904155731, -0.008204178884625435, -0.0077828578650951385, -0.007361536845564842, -0.006940215826034546, -0.00651889480650425, -0.006097573786973953, -0.005676252767443657, -0.005254931747913361, -0.004833610728383064, -0.004412289708852768, -0.003990968689322472, -0.0035696476697921753, -0.003148326650261879, -0.0027270056307315826, -0.0023056846112012863, -0.00188436359167099, -0.0014630425721406937, -0.0010417215526103973, -0.000620400533080101, -0.0001990795135498047, 0.00022224150598049164, 0.000643562525510788, 0.0010648835450410843, 0.0014862045645713806, 0.001907525584101677, 0.0023288466036319733, 0.0027501676231622696, 0.003171488642692566, 0.0035928096622228622, 0.004014130681753159, 0.004435451701283455, 0.004856772720813751, 0.0052780937403440475, 0.005699414759874344, 0.00612073577940464, 0.0065420567989349365, 0.006963377818465233, 0.007384698837995529, 0.0078060198575258255, 0.008227340877056122, 0.008648661896586418, 0.009069982916116714, 0.00949130393564701, 0.009912624955177307, 0.010333945974707603, 0.0107552669942379, 0.011176588013768196, 0.011597909033298492, 0.012019230052828789, 0.012440551072359085, 0.012861872091889381, 0.013283193111419678]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 8.0, 10.0, 8.0, 9.0, 12.0, 18.0, 22.0, 26.0, 20.0, 26.0, 34.0, 29.0, 38.0, 40.0, 39.0, 43.0, 48.0, 47.0, 50.0, 49.0, 52.0, 41.0, 58.0, 27.0, 28.0, 39.0, 31.0, 23.0, 25.0, 23.0, 19.0, 15.0, 10.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.87109375, -3.7589111328125, -3.646728515625, -3.5345458984375, -3.42236328125, -3.3101806640625, -3.197998046875, -3.0858154296875, -2.9736328125, -2.8614501953125, -2.749267578125, -2.6370849609375, -2.52490234375, -2.4127197265625, -2.300537109375, -2.1883544921875, -2.076171875, -1.9639892578125, -1.851806640625, -1.7396240234375, -1.62744140625, -1.5152587890625, -1.403076171875, -1.2908935546875, -1.1787109375, -1.0665283203125, -0.954345703125, -0.8421630859375, -0.72998046875, -0.6177978515625, -0.505615234375, -0.3934326171875, -0.28125, -0.1690673828125, -0.056884765625, 0.0552978515625, 0.16748046875, 0.2796630859375, 0.391845703125, 0.5040283203125, 0.6162109375, 0.7283935546875, 0.840576171875, 0.9527587890625, 1.06494140625, 1.1771240234375, 1.289306640625, 1.4014892578125, 1.513671875, 1.6258544921875, 1.738037109375, 1.8502197265625, 1.96240234375, 2.0745849609375, 2.186767578125, 2.2989501953125, 2.4111328125, 2.5233154296875, 2.635498046875, 2.7476806640625, 2.85986328125, 2.9720458984375, 3.084228515625, 3.1964111328125, 3.30859375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 7.0, 8.0, 18.0, 18.0, 27.0, 60.0, 64.0, 119.0, 205.0, 306.0, 530.0, 872.0, 1493.0, 2766.0, 5366.0, 10296.0, 20662.0, 44237.0, 99140.0, 224895.0, 312577.0, 177966.0, 77201.0, 34678.0, 16769.0, 8425.0, 4375.0, 2373.0, 1273.0, 713.0, 436.0, 242.0, 153.0, 87.0, 71.0, 39.0, 29.0, 18.0, 14.0, 7.0, 8.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.86328125, -2.765716552734375, -2.66815185546875, -2.570587158203125, -2.4730224609375, -2.375457763671875, -2.27789306640625, -2.180328369140625, -2.082763671875, -1.985198974609375, -1.88763427734375, -1.790069580078125, -1.6925048828125, -1.594940185546875, -1.49737548828125, -1.399810791015625, -1.30224609375, -1.204681396484375, -1.10711669921875, -1.009552001953125, -0.9119873046875, -0.814422607421875, -0.71685791015625, -0.619293212890625, -0.521728515625, -0.424163818359375, -0.32659912109375, -0.229034423828125, -0.1314697265625, -0.033905029296875, 0.06365966796875, 0.161224365234375, 0.2587890625, 0.356353759765625, 0.45391845703125, 0.551483154296875, 0.6490478515625, 0.746612548828125, 0.84417724609375, 0.941741943359375, 1.039306640625, 1.136871337890625, 1.23443603515625, 1.332000732421875, 1.4295654296875, 1.527130126953125, 1.62469482421875, 1.722259521484375, 1.81982421875, 1.917388916015625, 2.01495361328125, 2.112518310546875, 2.2100830078125, 2.307647705078125, 2.40521240234375, 2.502777099609375, 2.600341796875, 2.697906494140625, 2.79547119140625, 2.893035888671875, 2.9906005859375, 3.088165283203125, 3.18572998046875, 3.283294677734375, 3.380859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 8.0, 10.0, 14.0, 14.0, 14.0, 17.0, 20.0, 19.0, 23.0, 36.0, 37.0, 43.0, 60.0, 77.0, 91.0, 140.0, 320.0, 1450.0, 169.0, 94.0, 63.0, 50.0, 40.0, 34.0, 42.0, 20.0, 27.0, 15.0, 20.0, 14.0, 20.0, 16.0, 4.0, 7.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.703125, -12.3079833984375, -11.912841796875, -11.5177001953125, -11.12255859375, -10.7274169921875, -10.332275390625, -9.9371337890625, -9.5419921875, -9.1468505859375, -8.751708984375, -8.3565673828125, -7.96142578125, -7.5662841796875, -7.171142578125, -6.7760009765625, -6.380859375, -5.9857177734375, -5.590576171875, -5.1954345703125, -4.80029296875, -4.4051513671875, -4.010009765625, -3.6148681640625, -3.2197265625, -2.8245849609375, -2.429443359375, -2.0343017578125, -1.63916015625, -1.2440185546875, -0.848876953125, -0.4537353515625, -0.05859375, 0.3365478515625, 0.731689453125, 1.1268310546875, 1.52197265625, 1.9171142578125, 2.312255859375, 2.7073974609375, 3.1025390625, 3.4976806640625, 3.892822265625, 4.2879638671875, 4.68310546875, 5.0782470703125, 5.473388671875, 5.8685302734375, 6.263671875, 6.6588134765625, 7.053955078125, 7.4490966796875, 7.84423828125, 8.2393798828125, 8.634521484375, 9.0296630859375, 9.4248046875, 9.8199462890625, 10.215087890625, 10.6102294921875, 11.00537109375, 11.4005126953125, 11.795654296875, 12.1907958984375, 12.5859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 4.0, 6.0, 4.0, 15.0, 15.0, 11.0, 20.0, 21.0, 27.0, 34.0, 51.0, 83.0, 95.0, 172.0, 375.0, 915.0, 3536.0, 41487.0, 2582836.0, 500186.0, 12493.0, 1925.0, 587.0, 271.0, 164.0, 108.0, 70.0, 39.0, 35.0, 24.0, 16.0, 23.0, 14.0, 15.0, 7.0, 7.0, 6.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.22705078125, -19.6103515625, -18.99365234375, -18.376953125, -17.76025390625, -17.1435546875, -16.52685546875, -15.91015625, -15.29345703125, -14.6767578125, -14.06005859375, -13.443359375, -12.82666015625, -12.2099609375, -11.59326171875, -10.9765625, -10.35986328125, -9.7431640625, -9.12646484375, -8.509765625, -7.89306640625, -7.2763671875, -6.65966796875, -6.04296875, -5.42626953125, -4.8095703125, -4.19287109375, -3.576171875, -2.95947265625, -2.3427734375, -1.72607421875, -1.109375, -0.49267578125, 0.1240234375, 0.74072265625, 1.357421875, 1.97412109375, 2.5908203125, 3.20751953125, 3.82421875, 4.44091796875, 5.0576171875, 5.67431640625, 6.291015625, 6.90771484375, 7.5244140625, 8.14111328125, 8.7578125, 9.37451171875, 9.9912109375, 10.60791015625, 11.224609375, 11.84130859375, 12.4580078125, 13.07470703125, 13.69140625, 14.30810546875, 14.9248046875, 15.54150390625, 16.158203125, 16.77490234375, 17.3916015625, 18.00830078125, 18.625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 17.0, 53.0, 184.0, 286.0, 275.0, 148.0, 34.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.094955444335938, -15.357843399047852, -13.620732307434082, -11.883620262145996, -10.146509170532227, -8.40939712524414, -6.672285079956055, -4.935173988342285, -3.198061943054199, -1.460950255393982, 0.27616143226623535, 2.013273239135742, 3.75038480758667, 5.487496376037598, 7.224608421325684, 8.961719512939453, 10.698831558227539, 12.435943603515625, 14.173054695129395, 15.91016674041748, 17.64727783203125, 19.384389877319336, 21.121501922607422, 22.858612060546875, 24.595726013183594, 26.33283805847168, 28.069950103759766, 29.80706024169922, 31.544172286987305, 33.28128433227539, 35.018394470214844, 36.75550842285156, 38.492618560791016, 40.22972869873047, 41.96684265136719, 43.70395278930664, 45.44106674194336, 47.17817687988281, 48.91529083251953, 50.652400970458984, 52.38951110839844, 54.12662124633789, 55.86373519897461, 57.60084533691406, 59.33795928955078, 61.075069427490234, 62.81217956542969, 64.5492935180664, 66.28640747070312, 68.02352142333984, 69.76062774658203, 71.49774169921875, 73.23485565185547, 74.97196960449219, 76.70907592773438, 78.4461898803711, 80.18329620361328, 81.92041015625, 83.65751647949219, 85.3946304321289, 87.13174438476562, 88.86885070800781, 90.60596466064453, 92.34307861328125, 94.08019256591797]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 8.0, 5.0, 11.0, 20.0, 20.0, 12.0, 29.0, 35.0, 32.0, 32.0, 34.0, 44.0, 52.0, 34.0, 45.0, 51.0, 45.0, 52.0, 51.0, 28.0, 39.0, 33.0, 28.0, 30.0, 39.0, 21.0, 32.0, 16.0, 24.0, 21.0, 13.0, 11.0, 11.0, 4.0, 2.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.736412048339844, -34.60384750366211, -33.471282958984375, -32.338722229003906, -31.206157684326172, -30.073593139648438, -28.941030502319336, -27.808467864990234, -26.6759033203125, -25.543338775634766, -24.410776138305664, -23.278213500976562, -22.145648956298828, -21.013084411621094, -19.880521774291992, -18.74795913696289, -17.615394592285156, -16.482830047607422, -15.35026741027832, -14.217703819274902, -13.085140228271484, -11.952576637268066, -10.820013046264648, -9.68744945526123, -8.554885864257812, -7.4223222732543945, -6.289758682250977, -5.157195091247559, -4.024631500244141, -2.8920679092407227, -1.7595043182373047, -0.6269407272338867, 0.5056190490722656, 1.6381826400756836, 2.7707462310791016, 3.9033098220825195, 5.0358734130859375, 6.1684370040893555, 7.301000595092773, 8.433564186096191, 9.56612777709961, 10.698691368103027, 11.831254959106445, 12.963818550109863, 14.096382141113281, 15.2289457321167, 16.361509323120117, 17.49407196044922, 18.626636505126953, 19.759201049804688, 20.89176368713379, 22.02432632446289, 23.156890869140625, 24.28945541381836, 25.42201805114746, 26.554580688476562, 27.687145233154297, 28.81970977783203, 29.952272415161133, 31.084835052490234, 32.21739959716797, 33.3499641418457, 34.48252868652344, 35.615089416503906, 36.74765396118164]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 8.0, 18.0, 21.0, 20.0, 17.0, 30.0, 23.0, 30.0, 28.0, 37.0, 46.0, 38.0, 41.0, 40.0, 41.0, 45.0, 56.0, 42.0, 57.0, 38.0, 36.0, 29.0, 34.0, 28.0, 34.0, 20.0, 26.0, 15.0, 18.0, 9.0, 19.0, 17.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.712371826171875, -3.59857177734375, -3.484771728515625, -3.3709716796875, -3.257171630859375, -3.14337158203125, -3.029571533203125, -2.915771484375, -2.801971435546875, -2.68817138671875, -2.574371337890625, -2.4605712890625, -2.346771240234375, -2.23297119140625, -2.119171142578125, -2.00537109375, -1.891571044921875, -1.77777099609375, -1.663970947265625, -1.5501708984375, -1.436370849609375, -1.32257080078125, -1.208770751953125, -1.094970703125, -0.981170654296875, -0.86737060546875, -0.753570556640625, -0.6397705078125, -0.525970458984375, -0.41217041015625, -0.298370361328125, -0.1845703125, -0.070770263671875, 0.04302978515625, 0.156829833984375, 0.2706298828125, 0.384429931640625, 0.49822998046875, 0.612030029296875, 0.725830078125, 0.839630126953125, 0.95343017578125, 1.067230224609375, 1.1810302734375, 1.294830322265625, 1.40863037109375, 1.522430419921875, 1.63623046875, 1.750030517578125, 1.86383056640625, 1.977630615234375, 2.0914306640625, 2.205230712890625, 2.31903076171875, 2.432830810546875, 2.546630859375, 2.660430908203125, 2.77423095703125, 2.888031005859375, 3.0018310546875, 3.115631103515625, 3.22943115234375, 3.343231201171875, 3.45703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 1.0, 10.0, 13.0, 13.0, 11.0, 27.0, 33.0, 34.0, 68.0, 82.0, 157.0, 348.0, 644.0, 1443.0, 4005.0, 11853.0, 44687.0, 226136.0, 1339292.0, 2025390.0, 433630.0, 77884.0, 19111.0, 5727.0, 2081.0, 807.0, 333.0, 182.0, 82.0, 40.0, 39.0, 29.0, 20.0, 20.0, 9.0, 7.0, 10.0, 3.0, 12.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.13824462890625, -6.9093017578125, -6.68035888671875, -6.451416015625, -6.22247314453125, -5.9935302734375, -5.76458740234375, -5.53564453125, -5.30670166015625, -5.0777587890625, -4.84881591796875, -4.619873046875, -4.39093017578125, -4.1619873046875, -3.93304443359375, -3.7041015625, -3.47515869140625, -3.2462158203125, -3.01727294921875, -2.788330078125, -2.55938720703125, -2.3304443359375, -2.10150146484375, -1.87255859375, -1.64361572265625, -1.4146728515625, -1.18572998046875, -0.956787109375, -0.72784423828125, -0.4989013671875, -0.26995849609375, -0.041015625, 0.18792724609375, 0.4168701171875, 0.64581298828125, 0.874755859375, 1.10369873046875, 1.3326416015625, 1.56158447265625, 1.79052734375, 2.01947021484375, 2.2484130859375, 2.47735595703125, 2.706298828125, 2.93524169921875, 3.1641845703125, 3.39312744140625, 3.6220703125, 3.85101318359375, 4.0799560546875, 4.30889892578125, 4.537841796875, 4.76678466796875, 4.9957275390625, 5.22467041015625, 5.45361328125, 5.68255615234375, 5.9114990234375, 6.14044189453125, 6.369384765625, 6.59832763671875, 6.8272705078125, 7.05621337890625, 7.28515625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 13.0, 17.0, 14.0, 32.0, 42.0, 78.0, 130.0, 201.0, 367.0, 543.0, 718.0, 672.0, 474.0, 286.0, 191.0, 115.0, 61.0, 36.0, 23.0, 14.0, 17.0, 9.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.71728515625, -13.2861328125, -12.85498046875, -12.423828125, -11.99267578125, -11.5615234375, -11.13037109375, -10.69921875, -10.26806640625, -9.8369140625, -9.40576171875, -8.974609375, -8.54345703125, -8.1123046875, -7.68115234375, -7.25, -6.81884765625, -6.3876953125, -5.95654296875, -5.525390625, -5.09423828125, -4.6630859375, -4.23193359375, -3.80078125, -3.36962890625, -2.9384765625, -2.50732421875, -2.076171875, -1.64501953125, -1.2138671875, -0.78271484375, -0.3515625, 0.07958984375, 0.5107421875, 0.94189453125, 1.373046875, 1.80419921875, 2.2353515625, 2.66650390625, 3.09765625, 3.52880859375, 3.9599609375, 4.39111328125, 4.822265625, 5.25341796875, 5.6845703125, 6.11572265625, 6.546875, 6.97802734375, 7.4091796875, 7.84033203125, 8.271484375, 8.70263671875, 9.1337890625, 9.56494140625, 9.99609375, 10.42724609375, 10.8583984375, 11.28955078125, 11.720703125, 12.15185546875, 12.5830078125, 13.01416015625, 13.4453125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 16.0, 26.0, 36.0, 60.0, 76.0, 142.0, 272.0, 603.0, 1368.0, 3828.0, 15200.0, 104619.0, 1220618.0, 2548210.0, 259737.0, 29647.0, 6199.0, 2070.0, 750.0, 355.0, 167.0, 111.0, 57.0, 38.0, 31.0, 14.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.90625, -16.3642578125, -15.822265625, -15.2802734375, -14.73828125, -14.1962890625, -13.654296875, -13.1123046875, -12.5703125, -12.0283203125, -11.486328125, -10.9443359375, -10.40234375, -9.8603515625, -9.318359375, -8.7763671875, -8.234375, -7.6923828125, -7.150390625, -6.6083984375, -6.06640625, -5.5244140625, -4.982421875, -4.4404296875, -3.8984375, -3.3564453125, -2.814453125, -2.2724609375, -1.73046875, -1.1884765625, -0.646484375, -0.1044921875, 0.4375, 0.9794921875, 1.521484375, 2.0634765625, 2.60546875, 3.1474609375, 3.689453125, 4.2314453125, 4.7734375, 5.3154296875, 5.857421875, 6.3994140625, 6.94140625, 7.4833984375, 8.025390625, 8.5673828125, 9.109375, 9.6513671875, 10.193359375, 10.7353515625, 11.27734375, 11.8193359375, 12.361328125, 12.9033203125, 13.4453125, 13.9873046875, 14.529296875, 15.0712890625, 15.61328125, 16.1552734375, 16.697265625, 17.2392578125, 17.78125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 34.0, 102.0, 212.0, 311.0, 216.0, 97.0, 30.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-222.94378662109375, -218.93153381347656, -214.9192657470703, -210.90701293945312, -206.89474487304688, -202.8824920654297, -198.8702392578125, -194.85797119140625, -190.84571838378906, -186.83346557617188, -182.82119750976562, -178.80894470214844, -174.7966766357422, -170.784423828125, -166.77215576171875, -162.75990295410156, -158.74765014648438, -154.7353973388672, -150.72312927246094, -146.71087646484375, -142.6986083984375, -138.6863555908203, -134.67410278320312, -130.66183471679688, -126.64956665039062, -122.6373062133789, -118.62504577636719, -114.61279296875, -110.60053253173828, -106.58827209472656, -102.57601165771484, -98.56375122070312, -94.55149841308594, -90.53923797607422, -86.5269775390625, -82.51472473144531, -78.5024642944336, -74.49020385742188, -70.47794342041016, -66.46568298339844, -62.453426361083984, -58.441165924072266, -54.42890930175781, -50.416648864746094, -46.404388427734375, -42.39213180541992, -38.3798713684082, -34.36761474609375, -30.35535430908203, -26.343095779418945, -22.33083724975586, -18.31857681274414, -14.306318283081055, -10.294059753417969, -6.28179931640625, -2.269540786743164, 1.7427177429199219, 5.754976749420166, 9.76723575592041, 13.779495239257812, 17.7917537689209, 21.804012298583984, 25.816272735595703, 29.82853126525879, 33.840789794921875]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 5.0, 13.0, 7.0, 5.0, 9.0, 14.0, 18.0, 10.0, 19.0, 29.0, 25.0, 23.0, 22.0, 28.0, 40.0, 43.0, 35.0, 49.0, 35.0, 39.0, 48.0, 33.0, 47.0, 36.0, 52.0, 36.0, 43.0, 28.0, 32.0, 33.0, 14.0, 32.0, 18.0, 11.0, 10.0, 15.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.356494903564453, -30.371456146240234, -29.386417388916016, -28.401378631591797, -27.416337966918945, -26.431299209594727, -25.446260452270508, -24.46122169494629, -23.47618293762207, -22.49114418029785, -21.506105422973633, -20.52106475830078, -19.536026000976562, -18.550987243652344, -17.565948486328125, -16.580909729003906, -15.595870018005371, -14.610831260681152, -13.625791549682617, -12.640752792358398, -11.65571403503418, -10.670675277709961, -9.685635566711426, -8.700596809387207, -7.71555757522583, -6.730518341064453, -5.745479583740234, -4.760440349578857, -3.7754013538360596, -2.7903623580932617, -1.8053231239318848, -0.820284366607666, 0.16475486755371094, 1.1497938632965088, 2.1348328590393066, 3.1198720932006836, 4.104910850524902, 5.089950084686279, 6.074989318847656, 7.060028076171875, 8.045066833496094, 9.030105590820312, 10.015145301818848, 11.000184059143066, 11.985222816467285, 12.97026252746582, 13.955301284790039, 14.940340042114258, 15.925379753112793, 16.910419464111328, 17.895458221435547, 18.880496978759766, 19.865535736083984, 20.850574493408203, 21.835613250732422, 22.82065200805664, 23.805692672729492, 24.79073143005371, 25.77577018737793, 26.76081085205078, 27.745849609375, 28.73088836669922, 29.715927124023438, 30.700965881347656, 31.686004638671875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 3.0, 2.0, 8.0, 12.0, 12.0, 16.0, 17.0, 20.0, 24.0, 29.0, 38.0, 30.0, 51.0, 29.0, 59.0, 28.0, 45.0, 34.0, 50.0, 49.0, 45.0, 37.0, 47.0, 38.0, 40.0, 34.0, 31.0, 26.0, 33.0, 23.0, 17.0, 16.0, 14.0, 12.0, 11.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.990692138671875, -3.87200927734375, -3.753326416015625, -3.6346435546875, -3.515960693359375, -3.39727783203125, -3.278594970703125, -3.159912109375, -3.041229248046875, -2.92254638671875, -2.803863525390625, -2.6851806640625, -2.566497802734375, -2.44781494140625, -2.329132080078125, -2.21044921875, -2.091766357421875, -1.97308349609375, -1.854400634765625, -1.7357177734375, -1.617034912109375, -1.49835205078125, -1.379669189453125, -1.260986328125, -1.142303466796875, -1.02362060546875, -0.904937744140625, -0.7862548828125, -0.667572021484375, -0.54888916015625, -0.430206298828125, -0.3115234375, -0.192840576171875, -0.07415771484375, 0.044525146484375, 0.1632080078125, 0.281890869140625, 0.40057373046875, 0.519256591796875, 0.637939453125, 0.756622314453125, 0.87530517578125, 0.993988037109375, 1.1126708984375, 1.231353759765625, 1.35003662109375, 1.468719482421875, 1.58740234375, 1.706085205078125, 1.82476806640625, 1.943450927734375, 2.0621337890625, 2.180816650390625, 2.29949951171875, 2.418182373046875, 2.536865234375, 2.655548095703125, 2.77423095703125, 2.892913818359375, 3.0115966796875, 3.130279541015625, 3.24896240234375, 3.367645263671875, 3.486328125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 16.0, 13.0, 30.0, 46.0, 77.0, 120.0, 173.0, 278.0, 459.0, 732.0, 1127.0, 1864.0, 2915.0, 5017.0, 8100.0, 13529.0, 22521.0, 37068.0, 59376.0, 90843.0, 129761.0, 163400.0, 159197.0, 123988.0, 86050.0, 55030.0, 34231.0, 20743.0, 12353.0, 7611.0, 4546.0, 2775.0, 1641.0, 1057.0, 661.0, 419.0, 284.0, 179.0, 104.0, 67.0, 37.0, 30.0, 32.0, 19.0, 7.0, 11.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.45361328125, -0.43845367431640625, -0.4232940673828125, -0.40813446044921875, -0.392974853515625, -0.37781524658203125, -0.3626556396484375, -0.34749603271484375, -0.33233642578125, -0.31717681884765625, -0.3020172119140625, -0.28685760498046875, -0.271697998046875, -0.25653839111328125, -0.2413787841796875, -0.22621917724609375, -0.2110595703125, -0.19589996337890625, -0.1807403564453125, -0.16558074951171875, -0.150421142578125, -0.13526153564453125, -0.1201019287109375, -0.10494232177734375, -0.08978271484375, -0.07462310791015625, -0.0594635009765625, -0.04430389404296875, -0.029144287109375, -0.01398468017578125, 0.0011749267578125, 0.01633453369140625, 0.031494140625, 0.04665374755859375, 0.0618133544921875, 0.07697296142578125, 0.092132568359375, 0.10729217529296875, 0.1224517822265625, 0.13761138916015625, 0.15277099609375, 0.16793060302734375, 0.1830902099609375, 0.19824981689453125, 0.213409423828125, 0.22856903076171875, 0.2437286376953125, 0.25888824462890625, 0.2740478515625, 0.28920745849609375, 0.3043670654296875, 0.31952667236328125, 0.334686279296875, 0.34984588623046875, 0.3650054931640625, 0.38016510009765625, 0.39532470703125, 0.41048431396484375, 0.4256439208984375, 0.44080352783203125, 0.455963134765625, 0.47112274169921875, 0.4862823486328125, 0.5014419555664062, 0.5166015625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 7.0, 3.0, 5.0, 8.0, 6.0, 11.0, 13.0, 13.0, 19.0, 18.0, 20.0, 29.0, 27.0, 30.0, 36.0, 27.0, 36.0, 34.0, 48.0, 40.0, 38.0, 1055.0, 36.0, 32.0, 42.0, 46.0, 35.0, 34.0, 26.0, 38.0, 25.0, 35.0, 12.0, 17.0, 32.0, 21.0, 15.0, 10.0, 9.0, 10.0, 15.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6640625, -2.587921142578125, -2.51177978515625, -2.435638427734375, -2.3594970703125, -2.283355712890625, -2.20721435546875, -2.131072998046875, -2.054931640625, -1.978790283203125, -1.90264892578125, -1.826507568359375, -1.7503662109375, -1.674224853515625, -1.59808349609375, -1.521942138671875, -1.44580078125, -1.369659423828125, -1.29351806640625, -1.217376708984375, -1.1412353515625, -1.065093994140625, -0.98895263671875, -0.912811279296875, -0.836669921875, -0.760528564453125, -0.68438720703125, -0.608245849609375, -0.5321044921875, -0.455963134765625, -0.37982177734375, -0.303680419921875, -0.2275390625, -0.151397705078125, -0.07525634765625, 0.000885009765625, 0.0770263671875, 0.153167724609375, 0.22930908203125, 0.305450439453125, 0.381591796875, 0.457733154296875, 0.53387451171875, 0.610015869140625, 0.6861572265625, 0.762298583984375, 0.83843994140625, 0.914581298828125, 0.99072265625, 1.066864013671875, 1.14300537109375, 1.219146728515625, 1.2952880859375, 1.371429443359375, 1.44757080078125, 1.523712158203125, 1.599853515625, 1.675994873046875, 1.75213623046875, 1.828277587890625, 1.9044189453125, 1.980560302734375, 2.05670166015625, 2.132843017578125, 2.208984375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 8.0, 5.0, 5.0, 6.0, 19.0, 22.0, 36.0, 60.0, 55.0, 100.0, 158.0, 235.0, 369.0, 553.0, 797.0, 1220.0, 1887.0, 2893.0, 4400.0, 6723.0, 10302.0, 15952.0, 24937.0, 38540.0, 58878.0, 87600.0, 125348.0, 977944.0, 373526.0, 120696.0, 84352.0, 56131.0, 36108.0, 23294.0, 15375.0, 9850.0, 6540.0, 4278.0, 2796.0, 1697.0, 1193.0, 746.0, 503.0, 348.0, 224.0, 136.0, 91.0, 69.0, 47.0, 25.0, 17.0, 16.0, 11.0, 6.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.271484375, -0.2624168395996094, -0.25334930419921875, -0.24428176879882812, -0.2352142333984375, -0.22614669799804688, -0.21707916259765625, -0.20801162719726562, -0.198944091796875, -0.18987655639648438, -0.18080902099609375, -0.17174148559570312, -0.1626739501953125, -0.15360641479492188, -0.14453887939453125, -0.13547134399414062, -0.12640380859375, -0.11733627319335938, -0.10826873779296875, -0.09920120239257812, -0.0901336669921875, -0.08106613159179688, -0.07199859619140625, -0.06293106079101562, -0.053863525390625, -0.044795989990234375, -0.03572845458984375, -0.026660919189453125, -0.0175933837890625, -0.008525848388671875, 0.00054168701171875, 0.009609222412109375, 0.0186767578125, 0.027744293212890625, 0.03681182861328125, 0.045879364013671875, 0.0549468994140625, 0.06401443481445312, 0.07308197021484375, 0.08214950561523438, 0.091217041015625, 0.10028457641601562, 0.10935211181640625, 0.11841964721679688, 0.1274871826171875, 0.13655471801757812, 0.14562225341796875, 0.15468978881835938, 0.16375732421875, 0.17282485961914062, 0.18189239501953125, 0.19095993041992188, 0.2000274658203125, 0.20909500122070312, 0.21816253662109375, 0.22723007202148438, 0.236297607421875, 0.24536514282226562, 0.25443267822265625, 0.2635002136230469, 0.2725677490234375, 0.2816352844238281, 0.29070281982421875, 0.2997703552246094, 0.308837890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 10.0, 6.0, 12.0, 12.0, 14.0, 14.0, 24.0, 18.0, 18.0, 29.0, 24.0, 36.0, 32.0, 39.0, 33.0, 60.0, 55.0, 83.0, 83.0, 55.0, 52.0, 30.0, 30.0, 30.0, 21.0, 32.0, 25.0, 17.0, 19.0, 8.0, 12.0, 14.0, 9.0, 3.0, 10.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01303863525390625, -0.012598514556884766, -0.012158393859863281, -0.011718273162841797, -0.011278152465820312, -0.010838031768798828, -0.010397911071777344, -0.00995779037475586, -0.009517669677734375, -0.00907754898071289, -0.008637428283691406, -0.008197307586669922, -0.0077571868896484375, -0.007317066192626953, -0.006876945495605469, -0.006436824798583984, -0.0059967041015625, -0.005556583404541016, -0.005116462707519531, -0.004676342010498047, -0.0042362213134765625, -0.003796100616455078, -0.0033559799194335938, -0.0029158592224121094, -0.002475738525390625, -0.0020356178283691406, -0.0015954971313476562, -0.0011553764343261719, -0.0007152557373046875, -0.0002751350402832031, 0.00016498565673828125, 0.0006051063537597656, 0.00104522705078125, 0.0014853477478027344, 0.0019254684448242188, 0.002365589141845703, 0.0028057098388671875, 0.003245830535888672, 0.0036859512329101562, 0.004126071929931641, 0.004566192626953125, 0.005006313323974609, 0.005446434020996094, 0.005886554718017578, 0.0063266754150390625, 0.006766796112060547, 0.007206916809082031, 0.007647037506103516, 0.008087158203125, 0.008527278900146484, 0.008967399597167969, 0.009407520294189453, 0.009847640991210938, 0.010287761688232422, 0.010727882385253906, 0.01116800308227539, 0.011608123779296875, 0.01204824447631836, 0.012488365173339844, 0.012928485870361328, 0.013368606567382812, 0.013808727264404297, 0.014248847961425781, 0.014688968658447266, 0.01512908935546875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 3.0, 17.0, 20.0, 26.0, 29.0, 42.0, 71.0, 84.0, 125.0, 145.0, 188.0, 301.0, 436.0, 1111.0, 52078.0, 983884.0, 7977.0, 693.0, 348.0, 249.0, 192.0, 106.0, 100.0, 78.0, 45.0, 46.0, 34.0, 16.0, 19.0, 11.0, 14.0, 12.0, 11.0, 4.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.2467041015625, -0.23929786682128906, -0.23189163208007812, -0.2244853973388672, -0.21707916259765625, -0.2096729278564453, -0.20226669311523438, -0.19486045837402344, -0.1874542236328125, -0.18004798889160156, -0.17264175415039062, -0.1652355194091797, -0.15782928466796875, -0.1504230499267578, -0.14301681518554688, -0.13561058044433594, -0.128204345703125, -0.12079811096191406, -0.11339187622070312, -0.10598564147949219, -0.09857940673828125, -0.09117317199707031, -0.08376693725585938, -0.07636070251464844, -0.0689544677734375, -0.06154823303222656, -0.054141998291015625, -0.04673576354980469, -0.03932952880859375, -0.03192329406738281, -0.024517059326171875, -0.017110824584960938, -0.00970458984375, -0.0022983551025390625, 0.005107879638671875, 0.012514114379882812, 0.01992034912109375, 0.027326583862304688, 0.034732818603515625, 0.04213905334472656, 0.0495452880859375, 0.05695152282714844, 0.06435775756835938, 0.07176399230957031, 0.07917022705078125, 0.08657646179199219, 0.09398269653320312, 0.10138893127441406, 0.108795166015625, 0.11620140075683594, 0.12360763549804688, 0.1310138702392578, 0.13842010498046875, 0.1458263397216797, 0.15323257446289062, 0.16063880920410156, 0.1680450439453125, 0.17545127868652344, 0.18285751342773438, 0.1902637481689453, 0.19766998291015625, 0.2050762176513672, 0.21248245239257812, 0.21988868713378906, 0.227294921875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 54.0, 379.0, 546.0, 23.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17351217567920685, -0.16958020627498627, -0.16564823687076569, -0.1617162525653839, -0.15778428316116333, -0.15385231375694275, -0.14992034435272217, -0.1459883749485016, -0.142056405544281, -0.13812443614006042, -0.13419246673583984, -0.13026048243045807, -0.1263285130262375, -0.1223965436220169, -0.11846457421779633, -0.11453260481357574, -0.11060062050819397, -0.10666865110397339, -0.10273667424917221, -0.09880470484495163, -0.09487272799015045, -0.09094075858592987, -0.08700878918170929, -0.08307681977748871, -0.07914484292268753, -0.07521287351846695, -0.07128089666366577, -0.06734892725944519, -0.06341695785522461, -0.05948498100042343, -0.05555301159620285, -0.05162103846669197, -0.047689057886600494, -0.043757084757089615, -0.039825111627578735, -0.035893142223358154, -0.031961169093847275, -0.028029195964336395, -0.024097224697470665, -0.020165253430604935, -0.016233280301094055, -0.01230130810290575, -0.008369335904717445, -0.0044373637065291405, -0.0005053915083408356, 0.003426581621170044, 0.007358552888035774, 0.011290524154901505, 0.015222497284412384, 0.019154470413923264, 0.023086441680788994, 0.027018412947654724, 0.030950386077165604, 0.03488235920667648, 0.038814328610897064, 0.042746301740407944, 0.04667827486991882, 0.0506102479994297, 0.05454222112894058, 0.05847419053316116, 0.06240616366267204, 0.06633813679218292, 0.0702701061964035, 0.07420207560062408, 0.07813405245542526]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 16.0, 12.0, 11.0, 19.0, 16.0, 22.0, 17.0, 32.0, 27.0, 38.0, 24.0, 34.0, 28.0, 24.0, 40.0, 33.0, 29.0, 57.0, 21.0, 44.0, 30.0, 37.0, 31.0, 41.0, 25.0, 23.0, 29.0, 35.0, 22.0, 23.0, 18.0, 19.0, 19.0, 12.0, 10.0, 9.0, 9.0, 14.0, 6.0, 8.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.020041584968566895, -0.019436698406934738, -0.018831809982657433, -0.018226921558380127, -0.01762203499674797, -0.017017148435115814, -0.01641226001083851, -0.015807371586561203, -0.015202485024929047, -0.014597597531974316, -0.013992710039019585, -0.013387822546064854, -0.012782935053110123, -0.012178047560155392, -0.01157316006720066, -0.01096827257424593, -0.010363385081291199, -0.009758497588336468, -0.009153610095381737, -0.008548722602427006, -0.007943835109472275, -0.007338947616517544, -0.006734060123562813, -0.006129172630608082, -0.005524285137653351, -0.00491939764469862, -0.004314510151743889, -0.003709622658789158, -0.003104735165834427, -0.002499847672879696, -0.001894960179924965, -0.001290072686970234, -0.0006851851940155029, -8.029770106077194e-05, 0.000524589791893959, 0.00112947728484869, 0.001734364777803421, 0.002339252270758152, 0.002944139763712883, 0.003549027256667614, 0.004153914749622345, 0.004758802242577076, 0.005363689735531807, 0.005968577228486538, 0.006573464721441269, 0.007178352214396, 0.007783239707350731, 0.008388127200305462, 0.008993014693260193, 0.009597902186214924, 0.010202789679169655, 0.010807677172124386, 0.011412564665079117, 0.012017452158033848, 0.012622339650988579, 0.01322722714394331, 0.01383211463689804, 0.014437002129852772, 0.015041889622807503, 0.01564677804708481, 0.016251664608716965, 0.01685655117034912, 0.017461439594626427, 0.018066328018903732, 0.01867121458053589]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 3.0, 2.0, 8.0, 11.0, 13.0, 16.0, 17.0, 20.0, 24.0, 29.0, 38.0, 30.0, 51.0, 29.0, 59.0, 28.0, 45.0, 35.0, 49.0, 49.0, 45.0, 38.0, 46.0, 39.0, 39.0, 34.0, 31.0, 26.0, 32.0, 24.0, 17.0, 16.0, 14.0, 12.0, 11.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.990692138671875, -3.87200927734375, -3.753326416015625, -3.6346435546875, -3.515960693359375, -3.39727783203125, -3.278594970703125, -3.159912109375, -3.041229248046875, -2.92254638671875, -2.803863525390625, -2.6851806640625, -2.566497802734375, -2.44781494140625, -2.329132080078125, -2.21044921875, -2.091766357421875, -1.97308349609375, -1.854400634765625, -1.7357177734375, -1.617034912109375, -1.49835205078125, -1.379669189453125, -1.260986328125, -1.142303466796875, -1.02362060546875, -0.904937744140625, -0.7862548828125, -0.667572021484375, -0.54888916015625, -0.430206298828125, -0.3115234375, -0.192840576171875, -0.07415771484375, 0.044525146484375, 0.1632080078125, 0.281890869140625, 0.40057373046875, 0.519256591796875, 0.637939453125, 0.756622314453125, 0.87530517578125, 0.993988037109375, 1.1126708984375, 1.231353759765625, 1.35003662109375, 1.468719482421875, 1.58740234375, 1.706085205078125, 1.82476806640625, 1.943450927734375, 2.0621337890625, 2.180816650390625, 2.29949951171875, 2.418182373046875, 2.536865234375, 2.655548095703125, 2.77423095703125, 2.892913818359375, 3.0115966796875, 3.130279541015625, 3.24896240234375, 3.367645263671875, 3.486328125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 4.0, 2.0, 2.0, 7.0, 9.0, 12.0, 20.0, 18.0, 35.0, 33.0, 70.0, 116.0, 216.0, 309.0, 559.0, 1004.0, 1774.0, 3213.0, 5946.0, 11908.0, 29521.0, 96961.0, 422286.0, 345591.0, 80525.0, 25385.0, 10731.0, 5502.0, 2897.0, 1635.0, 928.0, 537.0, 316.0, 167.0, 98.0, 62.0, 47.0, 36.0, 15.0, 17.0, 10.0, 4.0, 4.0, 10.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.23699951171875, -4.0599365234375, -3.88287353515625, -3.705810546875, -3.52874755859375, -3.3516845703125, -3.17462158203125, -2.99755859375, -2.82049560546875, -2.6434326171875, -2.46636962890625, -2.289306640625, -2.11224365234375, -1.9351806640625, -1.75811767578125, -1.5810546875, -1.40399169921875, -1.2269287109375, -1.04986572265625, -0.872802734375, -0.69573974609375, -0.5186767578125, -0.34161376953125, -0.16455078125, 0.01251220703125, 0.1895751953125, 0.36663818359375, 0.543701171875, 0.72076416015625, 0.8978271484375, 1.07489013671875, 1.251953125, 1.42901611328125, 1.6060791015625, 1.78314208984375, 1.960205078125, 2.13726806640625, 2.3143310546875, 2.49139404296875, 2.66845703125, 2.84552001953125, 3.0225830078125, 3.19964599609375, 3.376708984375, 3.55377197265625, 3.7308349609375, 3.90789794921875, 4.0849609375, 4.26202392578125, 4.4390869140625, 4.61614990234375, 4.793212890625, 4.97027587890625, 5.1473388671875, 5.32440185546875, 5.50146484375, 5.67852783203125, 5.8555908203125, 6.03265380859375, 6.209716796875, 6.38677978515625, 6.5638427734375, 6.74090576171875, 6.91796875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 4.0, 5.0, 10.0, 3.0, 10.0, 13.0, 15.0, 16.0, 18.0, 23.0, 23.0, 39.0, 36.0, 36.0, 52.0, 55.0, 77.0, 119.0, 345.0, 1506.0, 173.0, 82.0, 56.0, 47.0, 39.0, 42.0, 26.0, 30.0, 17.0, 22.0, 25.0, 13.0, 17.0, 13.0, 8.0, 9.0, 6.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.267333984375, -12.85498046875, -12.442626953125, -12.0302734375, -11.617919921875, -11.20556640625, -10.793212890625, -10.380859375, -9.968505859375, -9.55615234375, -9.143798828125, -8.7314453125, -8.319091796875, -7.90673828125, -7.494384765625, -7.08203125, -6.669677734375, -6.25732421875, -5.844970703125, -5.4326171875, -5.020263671875, -4.60791015625, -4.195556640625, -3.783203125, -3.370849609375, -2.95849609375, -2.546142578125, -2.1337890625, -1.721435546875, -1.30908203125, -0.896728515625, -0.484375, -0.072021484375, 0.34033203125, 0.752685546875, 1.1650390625, 1.577392578125, 1.98974609375, 2.402099609375, 2.814453125, 3.226806640625, 3.63916015625, 4.051513671875, 4.4638671875, 4.876220703125, 5.28857421875, 5.700927734375, 6.11328125, 6.525634765625, 6.93798828125, 7.350341796875, 7.7626953125, 8.175048828125, 8.58740234375, 8.999755859375, 9.412109375, 9.824462890625, 10.23681640625, 10.649169921875, 11.0615234375, 11.473876953125, 11.88623046875, 12.298583984375, 12.7109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 1.0, 3.0, 9.0, 11.0, 15.0, 15.0, 13.0, 28.0, 25.0, 34.0, 41.0, 62.0, 99.0, 172.0, 242.0, 453.0, 1574.0, 11774.0, 518526.0, 2583069.0, 25394.0, 2592.0, 630.0, 308.0, 177.0, 121.0, 70.0, 48.0, 34.0, 39.0, 24.0, 12.0, 25.0, 7.0, 9.0, 8.0, 10.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.796875, -21.049072265625, -20.30126953125, -19.553466796875, -18.8056640625, -18.057861328125, -17.31005859375, -16.562255859375, -15.814453125, -15.066650390625, -14.31884765625, -13.571044921875, -12.8232421875, -12.075439453125, -11.32763671875, -10.579833984375, -9.83203125, -9.084228515625, -8.33642578125, -7.588623046875, -6.8408203125, -6.093017578125, -5.34521484375, -4.597412109375, -3.849609375, -3.101806640625, -2.35400390625, -1.606201171875, -0.8583984375, -0.110595703125, 0.63720703125, 1.385009765625, 2.1328125, 2.880615234375, 3.62841796875, 4.376220703125, 5.1240234375, 5.871826171875, 6.61962890625, 7.367431640625, 8.115234375, 8.863037109375, 9.61083984375, 10.358642578125, 11.1064453125, 11.854248046875, 12.60205078125, 13.349853515625, 14.09765625, 14.845458984375, 15.59326171875, 16.341064453125, 17.0888671875, 17.836669921875, 18.58447265625, 19.332275390625, 20.080078125, 20.827880859375, 21.57568359375, 22.323486328125, 23.0712890625, 23.819091796875, 24.56689453125, 25.314697265625, 26.0625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 150.0, 546.0, 291.0, 24.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.98736572265625, -155.42532348632812, -151.86329650878906, -148.30125427246094, -144.73922729492188, -141.17718505859375, -137.61514282226562, -134.05311584472656, -130.49107360839844, -126.92903900146484, -123.36700439453125, -119.80496215820312, -116.24292755126953, -112.68089294433594, -109.11885833740234, -105.55682373046875, -101.99478912353516, -98.43275451660156, -94.87071990966797, -91.30868530273438, -87.74664306640625, -84.18460845947266, -80.62257385253906, -77.06053924560547, -73.49850463867188, -69.93647003173828, -66.37443542480469, -62.81239700317383, -59.25035858154297, -55.688323974609375, -52.12628936767578, -48.56425476074219, -45.00220489501953, -41.44017028808594, -37.87813186645508, -34.316097259521484, -30.754060745239258, -27.19202423095703, -23.629989624023438, -20.06795310974121, -16.505916595458984, -12.943880081176758, -9.381844520568848, -5.8198089599609375, -2.257772445678711, 1.3042640686035156, 4.866298675537109, 8.428335189819336, 11.990371704101562, 15.552408218383789, 19.114444732666016, 22.67647933959961, 26.238515853881836, 29.800552368164062, 33.362586975097656, 36.92462158203125, 40.48666000366211, 44.0486946105957, 47.61073303222656, 51.172767639160156, 54.73480224609375, 58.29684066772461, 61.8588752746582, 65.42091369628906, 68.98294830322266]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 5.0, 9.0, 13.0, 12.0, 14.0, 16.0, 14.0, 30.0, 27.0, 24.0, 34.0, 32.0, 31.0, 48.0, 33.0, 51.0, 37.0, 50.0, 44.0, 52.0, 48.0, 49.0, 37.0, 30.0, 41.0, 26.0, 29.0, 35.0, 26.0, 30.0, 12.0, 11.0, 15.0, 6.0, 3.0, 4.0, 8.0, 3.0, 3.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.27981185913086, -36.99015808105469, -35.700504302978516, -34.41084671020508, -33.121192932128906, -31.831539154052734, -30.541885375976562, -29.25223159790039, -27.962575912475586, -26.672922134399414, -25.38326644897461, -24.093612670898438, -22.803958892822266, -21.51430320739746, -20.22464942932129, -18.934993743896484, -17.645339965820312, -16.35568618774414, -15.066030502319336, -13.776376724243164, -12.486721992492676, -11.197067260742188, -9.907413482666016, -8.617758750915527, -7.328104019165039, -6.038449287414551, -4.748795032501221, -3.4591405391693115, -2.1694860458374023, -0.8798313140869141, 0.409822940826416, 1.699477195739746, 2.9891357421875, 4.278790473937988, 5.568444728851318, 6.858098983764648, 8.147753715515137, 9.437408447265625, 10.727062225341797, 12.016716957092285, 13.306371688842773, 14.596026420593262, 15.88568115234375, 17.175334930419922, 18.464988708496094, 19.7546443939209, 21.04429817199707, 22.333953857421875, 23.623607635498047, 24.91326141357422, 26.202917098999023, 27.492570877075195, 28.7822265625, 30.071880340576172, 31.361534118652344, 32.651187896728516, 33.94084167480469, 35.23049545288086, 36.52014923095703, 37.80980682373047, 39.09946060180664, 40.38911437988281, 41.678768157958984, 42.968421936035156, 44.258079528808594]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 4.0, 3.0, 5.0, 12.0, 9.0, 21.0, 21.0, 20.0, 34.0, 29.0, 32.0, 40.0, 46.0, 51.0, 44.0, 34.0, 45.0, 48.0, 50.0, 54.0, 45.0, 50.0, 42.0, 38.0, 29.0, 31.0, 34.0, 25.0, 19.0, 18.0, 19.0, 16.0, 11.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.472930908203125, -4.34039306640625, -4.207855224609375, -4.0753173828125, -3.942779541015625, -3.81024169921875, -3.677703857421875, -3.545166015625, -3.412628173828125, -3.28009033203125, -3.147552490234375, -3.0150146484375, -2.882476806640625, -2.74993896484375, -2.617401123046875, -2.48486328125, -2.352325439453125, -2.21978759765625, -2.087249755859375, -1.9547119140625, -1.822174072265625, -1.68963623046875, -1.557098388671875, -1.424560546875, -1.292022705078125, -1.15948486328125, -1.026947021484375, -0.8944091796875, -0.761871337890625, -0.62933349609375, -0.496795654296875, -0.3642578125, -0.231719970703125, -0.09918212890625, 0.033355712890625, 0.1658935546875, 0.298431396484375, 0.43096923828125, 0.563507080078125, 0.696044921875, 0.828582763671875, 0.96112060546875, 1.093658447265625, 1.2261962890625, 1.358734130859375, 1.49127197265625, 1.623809814453125, 1.75634765625, 1.888885498046875, 2.02142333984375, 2.153961181640625, 2.2864990234375, 2.419036865234375, 2.55157470703125, 2.684112548828125, 2.816650390625, 2.949188232421875, 3.08172607421875, 3.214263916015625, 3.3468017578125, 3.479339599609375, 3.61187744140625, 3.744415283203125, 3.876953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 14.0, 19.0, 21.0, 47.0, 55.0, 70.0, 116.0, 152.0, 235.0, 400.0, 617.0, 1108.0, 1800.0, 3199.0, 6392.0, 13116.0, 28933.0, 71982.0, 199370.0, 583041.0, 1313220.0, 1200145.0, 491128.0, 167409.0, 61794.0, 25496.0, 11599.0, 5566.0, 2979.0, 1645.0, 978.0, 604.0, 360.0, 210.0, 149.0, 103.0, 75.0, 50.0, 20.0, 21.0, 11.0, 11.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.09375, -4.951934814453125, -4.81011962890625, -4.668304443359375, -4.5264892578125, -4.384674072265625, -4.24285888671875, -4.101043701171875, -3.959228515625, -3.817413330078125, -3.67559814453125, -3.533782958984375, -3.3919677734375, -3.250152587890625, -3.10833740234375, -2.966522216796875, -2.82470703125, -2.682891845703125, -2.54107666015625, -2.399261474609375, -2.2574462890625, -2.115631103515625, -1.97381591796875, -1.832000732421875, -1.690185546875, -1.548370361328125, -1.40655517578125, -1.264739990234375, -1.1229248046875, -0.981109619140625, -0.83929443359375, -0.697479248046875, -0.5556640625, -0.413848876953125, -0.27203369140625, -0.130218505859375, 0.0115966796875, 0.153411865234375, 0.29522705078125, 0.437042236328125, 0.578857421875, 0.720672607421875, 0.86248779296875, 1.004302978515625, 1.1461181640625, 1.287933349609375, 1.42974853515625, 1.571563720703125, 1.71337890625, 1.855194091796875, 1.99700927734375, 2.138824462890625, 2.2806396484375, 2.422454833984375, 2.56427001953125, 2.706085205078125, 2.847900390625, 2.989715576171875, 3.13153076171875, 3.273345947265625, 3.4151611328125, 3.556976318359375, 3.69879150390625, 3.840606689453125, 3.982421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 1.0, 7.0, 8.0, 13.0, 11.0, 19.0, 24.0, 30.0, 37.0, 60.0, 64.0, 99.0, 145.0, 186.0, 306.0, 334.0, 482.0, 460.0, 429.0, 327.0, 282.0, 175.0, 154.0, 106.0, 96.0, 60.0, 52.0, 39.0, 21.0, 13.0, 10.0, 5.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.015625, -10.721435546875, -10.42724609375, -10.133056640625, -9.8388671875, -9.544677734375, -9.25048828125, -8.956298828125, -8.662109375, -8.367919921875, -8.07373046875, -7.779541015625, -7.4853515625, -7.191162109375, -6.89697265625, -6.602783203125, -6.30859375, -6.014404296875, -5.72021484375, -5.426025390625, -5.1318359375, -4.837646484375, -4.54345703125, -4.249267578125, -3.955078125, -3.660888671875, -3.36669921875, -3.072509765625, -2.7783203125, -2.484130859375, -2.18994140625, -1.895751953125, -1.6015625, -1.307373046875, -1.01318359375, -0.718994140625, -0.4248046875, -0.130615234375, 0.16357421875, 0.457763671875, 0.751953125, 1.046142578125, 1.34033203125, 1.634521484375, 1.9287109375, 2.222900390625, 2.51708984375, 2.811279296875, 3.10546875, 3.399658203125, 3.69384765625, 3.988037109375, 4.2822265625, 4.576416015625, 4.87060546875, 5.164794921875, 5.458984375, 5.753173828125, 6.04736328125, 6.341552734375, 6.6357421875, 6.929931640625, 7.22412109375, 7.518310546875, 7.8125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 5.0, 14.0, 15.0, 16.0, 15.0, 46.0, 64.0, 125.0, 192.0, 308.0, 660.0, 1270.0, 2531.0, 6031.0, 18098.0, 67356.0, 315387.0, 1541259.0, 1752836.0, 376725.0, 78225.0, 20682.0, 6984.0, 2715.0, 1247.0, 612.0, 299.0, 228.0, 106.0, 76.0, 40.0, 36.0, 23.0, 18.0, 9.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.5357666015625, -8.180908203125, -7.8260498046875, -7.47119140625, -7.1163330078125, -6.761474609375, -6.4066162109375, -6.0517578125, -5.6968994140625, -5.342041015625, -4.9871826171875, -4.63232421875, -4.2774658203125, -3.922607421875, -3.5677490234375, -3.212890625, -2.8580322265625, -2.503173828125, -2.1483154296875, -1.79345703125, -1.4385986328125, -1.083740234375, -0.7288818359375, -0.3740234375, -0.0191650390625, 0.335693359375, 0.6905517578125, 1.04541015625, 1.4002685546875, 1.755126953125, 2.1099853515625, 2.46484375, 2.8197021484375, 3.174560546875, 3.5294189453125, 3.88427734375, 4.2391357421875, 4.593994140625, 4.9488525390625, 5.3037109375, 5.6585693359375, 6.013427734375, 6.3682861328125, 6.72314453125, 7.0780029296875, 7.432861328125, 7.7877197265625, 8.142578125, 8.4974365234375, 8.852294921875, 9.2071533203125, 9.56201171875, 9.9168701171875, 10.271728515625, 10.6265869140625, 10.9814453125, 11.3363037109375, 11.691162109375, 12.0460205078125, 12.40087890625, 12.7557373046875, 13.110595703125, 13.4654541015625, 13.8203125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 16.0, 68.0, 180.0, 332.0, 265.0, 119.0, 24.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.86798095703125, -230.33230590820312, -225.79661560058594, -221.2609405517578, -216.7252655029297, -212.1895751953125, -207.65390014648438, -203.11822509765625, -198.58253479003906, -194.04685974121094, -189.51116943359375, -184.97549438476562, -180.4398193359375, -175.9041290283203, -171.3684539794922, -166.83277893066406, -162.29708862304688, -157.76141357421875, -153.22572326660156, -148.69004821777344, -144.1543731689453, -139.61868286132812, -135.0830078125, -130.54733276367188, -126.01165771484375, -121.4759750366211, -116.94029998779297, -112.40461730957031, -107.86893463134766, -103.333251953125, -98.79757690429688, -94.26189422607422, -89.72621154785156, -85.1905288696289, -80.65485382080078, -76.11917114257812, -71.58348846435547, -67.04780578613281, -62.51213073730469, -57.97644805908203, -53.440765380859375, -48.905086517333984, -44.36940383911133, -39.83372497558594, -35.29804229736328, -30.76236343383789, -26.2266845703125, -21.691003799438477, -17.155323028564453, -12.61964225769043, -8.083962440490723, -3.5482826232910156, 0.9873981475830078, 5.523078918457031, 10.058757781982422, 14.594438552856445, 19.13011932373047, 23.665800094604492, 28.201480865478516, 32.737159729003906, 37.27284240722656, 41.80852127075195, 46.344200134277344, 50.8798828125, 55.41556167602539]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 2.0, 6.0, 5.0, 4.0, 11.0, 11.0, 10.0, 12.0, 14.0, 19.0, 20.0, 17.0, 19.0, 24.0, 29.0, 32.0, 25.0, 28.0, 42.0, 33.0, 26.0, 32.0, 30.0, 48.0, 41.0, 48.0, 32.0, 30.0, 38.0, 27.0, 21.0, 31.0, 30.0, 20.0, 25.0, 19.0, 11.0, 12.0, 13.0, 15.0, 17.0, 18.0, 15.0, 3.0, 6.0, 6.0, 13.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-27.68250846862793, -26.85538101196289, -26.02825164794922, -25.201122283935547, -24.373994827270508, -23.54686737060547, -22.719738006591797, -21.892608642578125, -21.065481185913086, -20.238353729248047, -19.411224365234375, -18.584095001220703, -17.756967544555664, -16.929840087890625, -16.102710723876953, -15.275582313537598, -14.448453903198242, -13.621325492858887, -12.794197082519531, -11.967068672180176, -11.13994026184082, -10.312811851501465, -9.48568344116211, -8.658555030822754, -7.831426620483398, -7.004298210144043, -6.1771697998046875, -5.350041389465332, -4.522912979125977, -3.695784568786621, -2.8686561584472656, -2.04152774810791, -1.2143993377685547, -0.3872709274291992, 0.43985748291015625, 1.2669858932495117, 2.094114303588867, 2.9212427139282227, 3.748371124267578, 4.575499534606934, 5.402627944946289, 6.2297563552856445, 7.056884765625, 7.8840131759643555, 8.711141586303711, 9.538269996643066, 10.365398406982422, 11.192526817321777, 12.019655227661133, 12.846783638000488, 13.673912048339844, 14.5010404586792, 15.328168869018555, 16.155296325683594, 16.982425689697266, 17.809555053710938, 18.636682510375977, 19.463809967041016, 20.290939331054688, 21.11806869506836, 21.9451961517334, 22.772323608398438, 23.59945297241211, 24.42658233642578, 25.25370979309082]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 5.0, 12.0, 13.0, 11.0, 10.0, 22.0, 24.0, 18.0, 25.0, 26.0, 40.0, 37.0, 35.0, 42.0, 40.0, 50.0, 41.0, 44.0, 45.0, 49.0, 50.0, 46.0, 38.0, 43.0, 35.0, 26.0, 28.0, 27.0, 24.0, 13.0, 17.0, 16.0, 12.0, 7.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.93017578125, -3.8017578125, -3.67333984375, -3.544921875, -3.41650390625, -3.2880859375, -3.15966796875, -3.03125, -2.90283203125, -2.7744140625, -2.64599609375, -2.517578125, -2.38916015625, -2.2607421875, -2.13232421875, -2.00390625, -1.87548828125, -1.7470703125, -1.61865234375, -1.490234375, -1.36181640625, -1.2333984375, -1.10498046875, -0.9765625, -0.84814453125, -0.7197265625, -0.59130859375, -0.462890625, -0.33447265625, -0.2060546875, -0.07763671875, 0.05078125, 0.17919921875, 0.3076171875, 0.43603515625, 0.564453125, 0.69287109375, 0.8212890625, 0.94970703125, 1.078125, 1.20654296875, 1.3349609375, 1.46337890625, 1.591796875, 1.72021484375, 1.8486328125, 1.97705078125, 2.10546875, 2.23388671875, 2.3623046875, 2.49072265625, 2.619140625, 2.74755859375, 2.8759765625, 3.00439453125, 3.1328125, 3.26123046875, 3.3896484375, 3.51806640625, 3.646484375, 3.77490234375, 3.9033203125, 4.03173828125, 4.16015625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 12.0, 24.0, 38.0, 55.0, 88.0, 158.0, 235.0, 371.0, 679.0, 1164.0, 1899.0, 3308.0, 5848.0, 10249.0, 18242.0, 32284.0, 58922.0, 101150.0, 160055.0, 204432.0, 175718.0, 116654.0, 68767.0, 38539.0, 21671.0, 11909.0, 6712.0, 3766.0, 2261.0, 1307.0, 796.0, 482.0, 282.0, 172.0, 109.0, 65.0, 47.0, 19.0, 26.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.623687744140625, -0.60333251953125, -0.582977294921875, -0.5626220703125, -0.542266845703125, -0.52191162109375, -0.501556396484375, -0.481201171875, -0.460845947265625, -0.44049072265625, -0.420135498046875, -0.3997802734375, -0.379425048828125, -0.35906982421875, -0.338714599609375, -0.318359375, -0.298004150390625, -0.27764892578125, -0.257293701171875, -0.2369384765625, -0.216583251953125, -0.19622802734375, -0.175872802734375, -0.155517578125, -0.135162353515625, -0.11480712890625, -0.094451904296875, -0.0740966796875, -0.053741455078125, -0.03338623046875, -0.013031005859375, 0.00732421875, 0.027679443359375, 0.04803466796875, 0.068389892578125, 0.0887451171875, 0.109100341796875, 0.12945556640625, 0.149810791015625, 0.170166015625, 0.190521240234375, 0.21087646484375, 0.231231689453125, 0.2515869140625, 0.271942138671875, 0.29229736328125, 0.312652587890625, 0.3330078125, 0.353363037109375, 0.37371826171875, 0.394073486328125, 0.4144287109375, 0.434783935546875, 0.45513916015625, 0.475494384765625, 0.495849609375, 0.516204833984375, 0.53656005859375, 0.556915283203125, 0.5772705078125, 0.597625732421875, 0.61798095703125, 0.638336181640625, 0.65869140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 9.0, 6.0, 9.0, 15.0, 15.0, 14.0, 14.0, 13.0, 23.0, 32.0, 31.0, 40.0, 25.0, 46.0, 43.0, 42.0, 40.0, 43.0, 38.0, 1065.0, 31.0, 47.0, 30.0, 30.0, 33.0, 51.0, 30.0, 26.0, 28.0, 18.0, 16.0, 20.0, 13.0, 15.0, 16.0, 6.0, 8.0, 6.0, 10.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4375, -2.35711669921875, -2.2767333984375, -2.19635009765625, -2.115966796875, -2.03558349609375, -1.9552001953125, -1.87481689453125, -1.79443359375, -1.71405029296875, -1.6336669921875, -1.55328369140625, -1.472900390625, -1.39251708984375, -1.3121337890625, -1.23175048828125, -1.1513671875, -1.07098388671875, -0.9906005859375, -0.91021728515625, -0.829833984375, -0.74945068359375, -0.6690673828125, -0.58868408203125, -0.50830078125, -0.42791748046875, -0.3475341796875, -0.26715087890625, -0.186767578125, -0.10638427734375, -0.0260009765625, 0.05438232421875, 0.134765625, 0.21514892578125, 0.2955322265625, 0.37591552734375, 0.456298828125, 0.53668212890625, 0.6170654296875, 0.69744873046875, 0.77783203125, 0.85821533203125, 0.9385986328125, 1.01898193359375, 1.099365234375, 1.17974853515625, 1.2601318359375, 1.34051513671875, 1.4208984375, 1.50128173828125, 1.5816650390625, 1.66204833984375, 1.742431640625, 1.82281494140625, 1.9031982421875, 1.98358154296875, 2.06396484375, 2.14434814453125, 2.2247314453125, 2.30511474609375, 2.385498046875, 2.46588134765625, 2.5462646484375, 2.62664794921875, 2.70703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 16.0, 23.0, 31.0, 40.0, 88.0, 107.0, 133.0, 237.0, 342.0, 541.0, 818.0, 1220.0, 2018.0, 2935.0, 4646.0, 7069.0, 10953.0, 16762.0, 26959.0, 43398.0, 68646.0, 106013.0, 152190.0, 1210668.0, 150465.0, 105201.0, 68082.0, 42899.0, 26947.0, 16825.0, 10747.0, 7087.0, 4537.0, 3019.0, 1937.0, 1206.0, 788.0, 513.0, 354.0, 229.0, 143.0, 115.0, 59.0, 32.0, 25.0, 19.0, 15.0, 10.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.318603515625, -0.3081550598144531, -0.29770660400390625, -0.2872581481933594, -0.2768096923828125, -0.2663612365722656, -0.25591278076171875, -0.24546432495117188, -0.235015869140625, -0.22456741333007812, -0.21411895751953125, -0.20367050170898438, -0.1932220458984375, -0.18277359008789062, -0.17232513427734375, -0.16187667846679688, -0.15142822265625, -0.14097976684570312, -0.13053131103515625, -0.12008285522460938, -0.1096343994140625, -0.09918594360351562, -0.08873748779296875, -0.07828903198242188, -0.067840576171875, -0.057392120361328125, -0.04694366455078125, -0.036495208740234375, -0.0260467529296875, -0.015598297119140625, -0.00514984130859375, 0.005298614501953125, 0.0157470703125, 0.026195526123046875, 0.03664398193359375, 0.047092437744140625, 0.0575408935546875, 0.06798934936523438, 0.07843780517578125, 0.08888626098632812, 0.099334716796875, 0.10978317260742188, 0.12023162841796875, 0.13068008422851562, 0.1411285400390625, 0.15157699584960938, 0.16202545166015625, 0.17247390747070312, 0.18292236328125, 0.19337081909179688, 0.20381927490234375, 0.21426773071289062, 0.2247161865234375, 0.23516464233398438, 0.24561309814453125, 0.2560615539550781, 0.266510009765625, 0.2769584655761719, 0.28740692138671875, 0.2978553771972656, 0.3083038330078125, 0.3187522888183594, 0.32920074462890625, 0.3396492004394531, 0.35009765625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 4.0, 3.0, 7.0, 14.0, 7.0, 12.0, 20.0, 11.0, 15.0, 16.0, 17.0, 21.0, 28.0, 33.0, 40.0, 43.0, 48.0, 54.0, 64.0, 64.0, 62.0, 50.0, 36.0, 42.0, 38.0, 39.0, 27.0, 15.0, 23.0, 23.0, 19.0, 16.0, 15.0, 13.0, 10.0, 7.0, 6.0, 5.0, 4.0, 3.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.01137542724609375, -0.010986566543579102, -0.010597705841064453, -0.010208845138549805, -0.009819984436035156, -0.009431123733520508, -0.00904226303100586, -0.008653402328491211, -0.008264541625976562, -0.007875680923461914, -0.007486820220947266, -0.007097959518432617, -0.006709098815917969, -0.00632023811340332, -0.005931377410888672, -0.0055425167083740234, -0.005153656005859375, -0.0047647953033447266, -0.004375934600830078, -0.00398707389831543, -0.0035982131958007812, -0.003209352493286133, -0.0028204917907714844, -0.002431631088256836, -0.0020427703857421875, -0.001653909683227539, -0.0012650489807128906, -0.0008761882781982422, -0.00048732757568359375, -9.846687316894531e-05, 0.0002903938293457031, 0.0006792545318603516, 0.001068115234375, 0.0014569759368896484, 0.0018458366394042969, 0.0022346973419189453, 0.0026235580444335938, 0.003012418746948242, 0.0034012794494628906, 0.003790140151977539, 0.0041790008544921875, 0.004567861557006836, 0.004956722259521484, 0.005345582962036133, 0.005734443664550781, 0.00612330436706543, 0.006512165069580078, 0.0069010257720947266, 0.007289886474609375, 0.0076787471771240234, 0.008067607879638672, 0.00845646858215332, 0.008845329284667969, 0.009234189987182617, 0.009623050689697266, 0.010011911392211914, 0.010400772094726562, 0.010789632797241211, 0.01117849349975586, 0.011567354202270508, 0.011956214904785156, 0.012345075607299805, 0.012733936309814453, 0.013122797012329102, 0.01351165771484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 6.0, 4.0, 5.0, 5.0, 8.0, 16.0, 16.0, 28.0, 22.0, 38.0, 48.0, 49.0, 71.0, 124.0, 166.0, 245.0, 293.0, 521.0, 2312.0, 146329.0, 889387.0, 6799.0, 703.0, 407.0, 249.0, 200.0, 135.0, 86.0, 57.0, 48.0, 25.0, 35.0, 26.0, 12.0, 16.0, 18.0, 4.0, 8.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.2261962890625, -0.2195758819580078, -0.21295547485351562, -0.20633506774902344, -0.19971466064453125, -0.19309425354003906, -0.18647384643554688, -0.1798534393310547, -0.1732330322265625, -0.1666126251220703, -0.15999221801757812, -0.15337181091308594, -0.14675140380859375, -0.14013099670410156, -0.13351058959960938, -0.1268901824951172, -0.120269775390625, -0.11364936828613281, -0.10702896118164062, -0.10040855407714844, -0.09378814697265625, -0.08716773986816406, -0.08054733276367188, -0.07392692565917969, -0.0673065185546875, -0.06068611145019531, -0.054065704345703125, -0.04744529724121094, -0.04082489013671875, -0.03420448303222656, -0.027584075927734375, -0.020963668823242188, -0.01434326171875, -0.0077228546142578125, -0.001102447509765625, 0.0055179595947265625, 0.01213836669921875, 0.018758773803710938, 0.025379180908203125, 0.03199958801269531, 0.0386199951171875, 0.04524040222167969, 0.051860809326171875, 0.05848121643066406, 0.06510162353515625, 0.07172203063964844, 0.07834243774414062, 0.08496284484863281, 0.091583251953125, 0.09820365905761719, 0.10482406616210938, 0.11144447326660156, 0.11806488037109375, 0.12468528747558594, 0.13130569458007812, 0.1379261016845703, 0.1445465087890625, 0.1511669158935547, 0.15778732299804688, 0.16440773010253906, 0.17102813720703125, 0.17764854431152344, 0.18426895141601562, 0.1908893585205078, 0.197509765625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 53.0, 731.0, 217.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12403152137994766, -0.11883340030908585, -0.11363527923822403, -0.10843715816736221, -0.1032390370965004, -0.09804091602563858, -0.09284279495477676, -0.08764467388391495, -0.08244655281305313, -0.07724843174219131, -0.0720503106713295, -0.06685218960046768, -0.061654068529605865, -0.05645594745874405, -0.05125782638788223, -0.046059705317020416, -0.0408615842461586, -0.03566346317529678, -0.030465342104434967, -0.02526722103357315, -0.020069099962711334, -0.014870978891849518, -0.009672857820987701, -0.004474736750125885, 0.0007233843207359314, 0.005921505391597748, 0.011119626462459564, 0.01631774753332138, 0.021515868604183197, 0.026713989675045013, 0.03191211074590683, 0.037110231816768646, 0.042308345437049866, 0.04750646650791168, 0.0527045875787735, 0.057902708649635315, 0.06310082972049713, 0.06829895079135895, 0.07349707186222076, 0.07869519293308258, 0.0838933140039444, 0.08909143507480621, 0.09428955614566803, 0.09948767721652985, 0.10468579828739166, 0.10988391935825348, 0.1150820404291153, 0.12028016149997711, 0.12547828257083893, 0.13067640364170074, 0.13587452471256256, 0.14107264578342438, 0.1462707668542862, 0.151468887925148, 0.15666700899600983, 0.16186513006687164, 0.16706325113773346, 0.17226137220859528, 0.1774594932794571, 0.1826576143503189, 0.18785573542118073, 0.19305385649204254, 0.19825197756290436, 0.20345009863376617, 0.208648219704628]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 6.0, 10.0, 10.0, 10.0, 13.0, 15.0, 17.0, 28.0, 23.0, 29.0, 29.0, 21.0, 31.0, 29.0, 37.0, 45.0, 37.0, 38.0, 46.0, 39.0, 39.0, 39.0, 34.0, 34.0, 47.0, 33.0, 29.0, 30.0, 30.0, 28.0, 18.0, 17.0, 17.0, 11.0, 12.0, 16.0, 8.0, 7.0, 6.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018207669258117676, -0.017568517476320267, -0.01692936383187771, -0.01629021018743515, -0.01565105840563774, -0.015011905692517757, -0.014372752979397774, -0.01373360026627779, -0.013094447553157806, -0.012455294840037823, -0.011816142126917839, -0.011176989413797855, -0.010537836700677872, -0.009898683987557888, -0.009259531274437904, -0.00862037856131792, -0.007981225848197937, -0.007342073135077953, -0.00670292042195797, -0.006063767708837986, -0.005424614995718002, -0.004785462282598019, -0.004146309569478035, -0.0035071568563580513, -0.0028680041432380676, -0.002228851430118084, -0.0015896987169981003, -0.0009505460038781166, -0.00031139329075813293, 0.00032775942236185074, 0.0009669121354818344, 0.001606064848601818, 0.0022452175617218018, 0.0028843702748417854, 0.003523522987961769, 0.004162675701081753, 0.0048018284142017365, 0.00544098112732172, 0.006080133840441704, 0.0067192865535616875, 0.007358439266681671, 0.007997591979801655, 0.008636744692921638, 0.009275897406041622, 0.009915050119161606, 0.01055420283228159, 0.011193355545401573, 0.011832508258521557, 0.01247166097164154, 0.013110813684761524, 0.013749966397881508, 0.014389119111001492, 0.015028271824121475, 0.015667423605918884, 0.016306577250361443, 0.016945730894804, 0.01758488267660141, 0.01822403445839882, 0.018863188102841377, 0.019502341747283936, 0.020141493529081345, 0.020780645310878754, 0.021419798955321312, 0.02205895259976387, 0.02269810438156128]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 4.0, 6.0, 11.0, 13.0, 11.0, 10.0, 22.0, 24.0, 18.0, 25.0, 26.0, 40.0, 38.0, 34.0, 42.0, 41.0, 49.0, 41.0, 45.0, 44.0, 49.0, 50.0, 46.0, 38.0, 43.0, 35.0, 26.0, 28.0, 27.0, 24.0, 13.0, 17.0, 16.0, 12.0, 7.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.93017578125, -3.8017578125, -3.67333984375, -3.544921875, -3.41650390625, -3.2880859375, -3.15966796875, -3.03125, -2.90283203125, -2.7744140625, -2.64599609375, -2.517578125, -2.38916015625, -2.2607421875, -2.13232421875, -2.00390625, -1.87548828125, -1.7470703125, -1.61865234375, -1.490234375, -1.36181640625, -1.2333984375, -1.10498046875, -0.9765625, -0.84814453125, -0.7197265625, -0.59130859375, -0.462890625, -0.33447265625, -0.2060546875, -0.07763671875, 0.05078125, 0.17919921875, 0.3076171875, 0.43603515625, 0.564453125, 0.69287109375, 0.8212890625, 0.94970703125, 1.078125, 1.20654296875, 1.3349609375, 1.46337890625, 1.591796875, 1.72021484375, 1.8486328125, 1.97705078125, 2.10546875, 2.23388671875, 2.3623046875, 2.49072265625, 2.619140625, 2.74755859375, 2.8759765625, 3.00439453125, 3.1328125, 3.26123046875, 3.3896484375, 3.51806640625, 3.646484375, 3.77490234375, 3.9033203125, 4.03173828125, 4.16015625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 12.0, 21.0, 20.0, 37.0, 46.0, 80.0, 91.0, 90.0, 166.0, 208.0, 317.0, 476.0, 861.0, 1349.0, 2166.0, 3700.0, 6059.0, 10333.0, 18444.0, 39120.0, 102728.0, 298585.0, 343346.0, 125310.0, 45523.0, 20865.0, 11462.0, 6543.0, 4001.0, 2402.0, 1461.0, 931.0, 599.0, 373.0, 248.0, 178.0, 114.0, 72.0, 55.0, 43.0, 35.0, 12.0, 14.0, 15.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.171875, -4.0418701171875, -3.911865234375, -3.7818603515625, -3.65185546875, -3.5218505859375, -3.391845703125, -3.2618408203125, -3.1318359375, -3.0018310546875, -2.871826171875, -2.7418212890625, -2.61181640625, -2.4818115234375, -2.351806640625, -2.2218017578125, -2.091796875, -1.9617919921875, -1.831787109375, -1.7017822265625, -1.57177734375, -1.4417724609375, -1.311767578125, -1.1817626953125, -1.0517578125, -0.9217529296875, -0.791748046875, -0.6617431640625, -0.53173828125, -0.4017333984375, -0.271728515625, -0.1417236328125, -0.01171875, 0.1182861328125, 0.248291015625, 0.3782958984375, 0.50830078125, 0.6383056640625, 0.768310546875, 0.8983154296875, 1.0283203125, 1.1583251953125, 1.288330078125, 1.4183349609375, 1.54833984375, 1.6783447265625, 1.808349609375, 1.9383544921875, 2.068359375, 2.1983642578125, 2.328369140625, 2.4583740234375, 2.58837890625, 2.7183837890625, 2.848388671875, 2.9783935546875, 3.1083984375, 3.2384033203125, 3.368408203125, 3.4984130859375, 3.62841796875, 3.7584228515625, 3.888427734375, 4.0184326171875, 4.1484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 11.0, 8.0, 12.0, 14.0, 19.0, 19.0, 31.0, 27.0, 32.0, 41.0, 47.0, 61.0, 63.0, 110.0, 239.0, 1526.0, 257.0, 101.0, 69.0, 50.0, 47.0, 47.0, 31.0, 40.0, 30.0, 24.0, 14.0, 13.0, 13.0, 14.0, 13.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.234375, -17.74853515625, -17.2626953125, -16.77685546875, -16.291015625, -15.80517578125, -15.3193359375, -14.83349609375, -14.34765625, -13.86181640625, -13.3759765625, -12.89013671875, -12.404296875, -11.91845703125, -11.4326171875, -10.94677734375, -10.4609375, -9.97509765625, -9.4892578125, -9.00341796875, -8.517578125, -8.03173828125, -7.5458984375, -7.06005859375, -6.57421875, -6.08837890625, -5.6025390625, -5.11669921875, -4.630859375, -4.14501953125, -3.6591796875, -3.17333984375, -2.6875, -2.20166015625, -1.7158203125, -1.22998046875, -0.744140625, -0.25830078125, 0.2275390625, 0.71337890625, 1.19921875, 1.68505859375, 2.1708984375, 2.65673828125, 3.142578125, 3.62841796875, 4.1142578125, 4.60009765625, 5.0859375, 5.57177734375, 6.0576171875, 6.54345703125, 7.029296875, 7.51513671875, 8.0009765625, 8.48681640625, 8.97265625, 9.45849609375, 9.9443359375, 10.43017578125, 10.916015625, 11.40185546875, 11.8876953125, 12.37353515625, 12.859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 7.0, 6.0, 9.0, 17.0, 21.0, 25.0, 30.0, 52.0, 62.0, 106.0, 175.0, 259.0, 526.0, 2055.0, 56300.0, 3051405.0, 31826.0, 1630.0, 478.0, 247.0, 139.0, 81.0, 65.0, 63.0, 25.0, 21.0, 12.0, 11.0, 9.0, 6.0, 10.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.5625, -37.4091796875, -36.255859375, -35.1025390625, -33.94921875, -32.7958984375, -31.642578125, -30.4892578125, -29.3359375, -28.1826171875, -27.029296875, -25.8759765625, -24.72265625, -23.5693359375, -22.416015625, -21.2626953125, -20.109375, -18.9560546875, -17.802734375, -16.6494140625, -15.49609375, -14.3427734375, -13.189453125, -12.0361328125, -10.8828125, -9.7294921875, -8.576171875, -7.4228515625, -6.26953125, -5.1162109375, -3.962890625, -2.8095703125, -1.65625, -0.5029296875, 0.650390625, 1.8037109375, 2.95703125, 4.1103515625, 5.263671875, 6.4169921875, 7.5703125, 8.7236328125, 9.876953125, 11.0302734375, 12.18359375, 13.3369140625, 14.490234375, 15.6435546875, 16.796875, 17.9501953125, 19.103515625, 20.2568359375, 21.41015625, 22.5634765625, 23.716796875, 24.8701171875, 26.0234375, 27.1767578125, 28.330078125, 29.4833984375, 30.63671875, 31.7900390625, 32.943359375, 34.0966796875, 35.25]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 14.0, 33.0, 85.0, 191.0, 203.0, 225.0, 143.0, 62.0, 40.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.109067916870117, -17.74233627319336, -16.37560272216797, -15.008871078491211, -13.642139434814453, -12.275406837463379, -10.908674240112305, -9.541942596435547, -8.175209999084473, -6.808477878570557, -5.441745758056641, -4.075013160705566, -2.7082810401916504, -1.3415489196777344, 0.025183677673339844, 1.3919153213500977, 2.758647918701172, 4.125380039215088, 5.492112159729004, 6.858844757080078, 8.225576400756836, 9.59230899810791, 10.959041595458984, 12.325773239135742, 13.692505836486816, 15.05923843383789, 16.42597007751465, 17.792701721191406, 19.159435272216797, 20.526166915893555, 21.892898559570312, 23.259632110595703, 24.626361846923828, 25.993093490600586, 27.359827041625977, 28.726558685302734, 30.093290328979492, 31.46002197265625, 32.82675552368164, 34.19348907470703, 35.560218811035156, 36.92695236206055, 38.29368209838867, 39.66041564941406, 41.02714920043945, 42.39387893676758, 43.76061248779297, 45.127342224121094, 46.49407958984375, 47.86081314086914, 49.227542877197266, 50.594276428222656, 51.96100997924805, 53.32773971557617, 54.69447326660156, 56.06120300292969, 57.42793655395508, 58.79467010498047, 60.161399841308594, 61.528133392333984, 62.894866943359375, 64.2615966796875, 65.62832641601562, 66.99506378173828, 68.3617935180664]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 11.0, 3.0, 13.0, 18.0, 13.0, 21.0, 16.0, 24.0, 19.0, 15.0, 29.0, 24.0, 27.0, 35.0, 31.0, 37.0, 31.0, 41.0, 49.0, 37.0, 48.0, 36.0, 31.0, 32.0, 41.0, 36.0, 34.0, 30.0, 30.0, 28.0, 22.0, 16.0, 21.0, 16.0, 14.0, 19.0, 9.0, 10.0, 5.0, 7.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-33.74267578125, -32.720741271972656, -31.698808670043945, -30.676876068115234, -29.65494155883789, -28.63300895690918, -27.61107635498047, -26.589141845703125, -25.56720733642578, -24.54527473449707, -23.523340225219727, -22.501407623291016, -21.479473114013672, -20.45754051208496, -19.43560791015625, -18.413673400878906, -17.391740798950195, -16.369808197021484, -15.34787368774414, -14.32594108581543, -13.304006576538086, -12.282073974609375, -11.260140419006348, -10.23820686340332, -9.216273307800293, -8.194339752197266, -7.172406196594238, -6.150473117828369, -5.128539562225342, -4.1066060066223145, -3.0846729278564453, -2.062739372253418, -1.0408058166503906, -0.018872380256652832, 1.003061056137085, 2.024994373321533, 3.0469279289245605, 4.068861484527588, 5.090794563293457, 6.112728118896484, 7.134661674499512, 8.156595230102539, 9.178528785705566, 10.200462341308594, 11.222394943237305, 12.244329452514648, 13.26626205444336, 14.288195610046387, 15.310129165649414, 16.332061767578125, 17.35399627685547, 18.37592887878418, 19.397863388061523, 20.419795989990234, 21.441730499267578, 22.46366310119629, 23.485595703125, 24.50752830505371, 25.529462814331055, 26.551395416259766, 27.57332992553711, 28.59526252746582, 29.61719512939453, 30.639129638671875, 31.66106414794922]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 7.0, 8.0, 13.0, 9.0, 11.0, 8.0, 22.0, 22.0, 25.0, 26.0, 29.0, 34.0, 41.0, 29.0, 46.0, 41.0, 40.0, 47.0, 45.0, 53.0, 41.0, 48.0, 37.0, 41.0, 35.0, 36.0, 39.0, 35.0, 24.0, 19.0, 18.0, 12.0, 23.0, 8.0, 10.0, 6.0, 1.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.112060546875, -3.97802734375, -3.843994140625, -3.7099609375, -3.575927734375, -3.44189453125, -3.307861328125, -3.173828125, -3.039794921875, -2.90576171875, -2.771728515625, -2.6376953125, -2.503662109375, -2.36962890625, -2.235595703125, -2.1015625, -1.967529296875, -1.83349609375, -1.699462890625, -1.5654296875, -1.431396484375, -1.29736328125, -1.163330078125, -1.029296875, -0.895263671875, -0.76123046875, -0.627197265625, -0.4931640625, -0.359130859375, -0.22509765625, -0.091064453125, 0.04296875, 0.177001953125, 0.31103515625, 0.445068359375, 0.5791015625, 0.713134765625, 0.84716796875, 0.981201171875, 1.115234375, 1.249267578125, 1.38330078125, 1.517333984375, 1.6513671875, 1.785400390625, 1.91943359375, 2.053466796875, 2.1875, 2.321533203125, 2.45556640625, 2.589599609375, 2.7236328125, 2.857666015625, 2.99169921875, 3.125732421875, 3.259765625, 3.393798828125, 3.52783203125, 3.661865234375, 3.7958984375, 3.929931640625, 4.06396484375, 4.197998046875, 4.33203125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 13.0, 9.0, 14.0, 14.0, 16.0, 27.0, 25.0, 42.0, 35.0, 59.0, 86.0, 108.0, 224.0, 636.0, 2439.0, 12239.0, 163594.0, 2868391.0, 1092932.0, 45819.0, 5412.0, 1236.0, 370.0, 152.0, 98.0, 48.0, 35.0, 49.0, 34.0, 20.0, 21.0, 23.0, 17.0, 13.0, 9.0, 3.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.0953369140625, -14.620361328125, -14.1453857421875, -13.67041015625, -13.1954345703125, -12.720458984375, -12.2454833984375, -11.7705078125, -11.2955322265625, -10.820556640625, -10.3455810546875, -9.87060546875, -9.3956298828125, -8.920654296875, -8.4456787109375, -7.970703125, -7.4957275390625, -7.020751953125, -6.5457763671875, -6.07080078125, -5.5958251953125, -5.120849609375, -4.6458740234375, -4.1708984375, -3.6959228515625, -3.220947265625, -2.7459716796875, -2.27099609375, -1.7960205078125, -1.321044921875, -0.8460693359375, -0.37109375, 0.1038818359375, 0.578857421875, 1.0538330078125, 1.52880859375, 2.0037841796875, 2.478759765625, 2.9537353515625, 3.4287109375, 3.9036865234375, 4.378662109375, 4.8536376953125, 5.32861328125, 5.8035888671875, 6.278564453125, 6.7535400390625, 7.228515625, 7.7034912109375, 8.178466796875, 8.6534423828125, 9.12841796875, 9.6033935546875, 10.078369140625, 10.5533447265625, 11.0283203125, 11.5032958984375, 11.978271484375, 12.4532470703125, 12.92822265625, 13.4031982421875, 13.878173828125, 14.3531494140625, 14.828125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 11.0, 20.0, 31.0, 28.0, 34.0, 67.0, 97.0, 145.0, 224.0, 352.0, 412.0, 526.0, 606.0, 447.0, 349.0, 225.0, 154.0, 113.0, 79.0, 50.0, 35.0, 23.0, 19.0, 5.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.382080078125, -9.99853515625, -9.614990234375, -9.2314453125, -8.847900390625, -8.46435546875, -8.080810546875, -7.697265625, -7.313720703125, -6.93017578125, -6.546630859375, -6.1630859375, -5.779541015625, -5.39599609375, -5.012451171875, -4.62890625, -4.245361328125, -3.86181640625, -3.478271484375, -3.0947265625, -2.711181640625, -2.32763671875, -1.944091796875, -1.560546875, -1.177001953125, -0.79345703125, -0.409912109375, -0.0263671875, 0.357177734375, 0.74072265625, 1.124267578125, 1.5078125, 1.891357421875, 2.27490234375, 2.658447265625, 3.0419921875, 3.425537109375, 3.80908203125, 4.192626953125, 4.576171875, 4.959716796875, 5.34326171875, 5.726806640625, 6.1103515625, 6.493896484375, 6.87744140625, 7.260986328125, 7.64453125, 8.028076171875, 8.41162109375, 8.795166015625, 9.1787109375, 9.562255859375, 9.94580078125, 10.329345703125, 10.712890625, 11.096435546875, 11.47998046875, 11.863525390625, 12.2470703125, 12.630615234375, 13.01416015625, 13.397705078125, 13.78125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 11.0, 8.0, 26.0, 40.0, 48.0, 73.0, 127.0, 225.0, 442.0, 1767.0, 16100.0, 837509.0, 3268172.0, 64608.0, 3676.0, 762.0, 306.0, 128.0, 84.0, 52.0, 37.0, 27.0, 21.0, 12.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.46875, -37.434814453125, -36.40087890625, -35.366943359375, -34.3330078125, -33.299072265625, -32.26513671875, -31.231201171875, -30.197265625, -29.163330078125, -28.12939453125, -27.095458984375, -26.0615234375, -25.027587890625, -23.99365234375, -22.959716796875, -21.92578125, -20.891845703125, -19.85791015625, -18.823974609375, -17.7900390625, -16.756103515625, -15.72216796875, -14.688232421875, -13.654296875, -12.620361328125, -11.58642578125, -10.552490234375, -9.5185546875, -8.484619140625, -7.45068359375, -6.416748046875, -5.3828125, -4.348876953125, -3.31494140625, -2.281005859375, -1.2470703125, -0.213134765625, 0.82080078125, 1.854736328125, 2.888671875, 3.922607421875, 4.95654296875, 5.990478515625, 7.0244140625, 8.058349609375, 9.09228515625, 10.126220703125, 11.16015625, 12.194091796875, 13.22802734375, 14.261962890625, 15.2958984375, 16.329833984375, 17.36376953125, 18.397705078125, 19.431640625, 20.465576171875, 21.49951171875, 22.533447265625, 23.5673828125, 24.601318359375, 25.63525390625, 26.669189453125, 27.703125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 8.0, 6.0, 18.0, 28.0, 38.0, 64.0, 85.0, 93.0, 102.0, 97.0, 93.0, 99.0, 86.0, 63.0, 49.0, 29.0, 17.0, 15.0, 7.0, 4.0, 2.0, 3.0, 2.0], "bins": [-78.19986724853516, -76.66096496582031, -75.1220703125, -73.58316802978516, -72.04427337646484, -70.50537109375, -68.96647644042969, -67.42757415771484, -65.88867950439453, -64.34977722167969, -62.810882568359375, -61.2719841003418, -59.73308563232422, -58.19418716430664, -56.65528869628906, -55.11638641357422, -53.57748794555664, -52.03858947753906, -50.499691009521484, -48.960792541503906, -47.42189407348633, -45.88299560546875, -44.344093322753906, -42.805198669433594, -41.26629638671875, -39.72739791870117, -38.188499450683594, -36.649600982666016, -35.11070251464844, -33.57180404663086, -32.03290557861328, -30.49400520324707, -28.955106735229492, -27.416208267211914, -25.877309799194336, -24.338409423828125, -22.799510955810547, -21.26061248779297, -19.72171401977539, -18.182815551757812, -16.643917083740234, -15.105018615722656, -13.566120147705078, -12.027220726013184, -10.488322257995605, -8.949423789978027, -7.410524368286133, -5.871625900268555, -4.332727432250977, -2.7938287258148193, -1.254930019378662, 0.2839689254760742, 1.8228673934936523, 3.3617658615112305, 4.900665283203125, 6.439563751220703, 7.978462219238281, 9.51736068725586, 11.056259155273438, 12.595158576965332, 14.13405704498291, 15.672955513000488, 17.211854934692383, 18.75075340270996, 20.28965187072754]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 5.0, 11.0, 10.0, 14.0, 18.0, 15.0, 19.0, 27.0, 34.0, 20.0, 35.0, 47.0, 26.0, 52.0, 62.0, 56.0, 50.0, 46.0, 36.0, 42.0, 36.0, 39.0, 49.0, 40.0, 29.0, 29.0, 28.0, 13.0, 19.0, 16.0, 20.0, 11.0, 9.0, 8.0, 10.0, 1.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34918212890625, -31.29689598083496, -30.244611740112305, -29.192325592041016, -28.14004135131836, -27.08775520324707, -26.03546905517578, -24.983184814453125, -23.93090057373047, -22.87861442565918, -21.826330184936523, -20.774044036865234, -19.721759796142578, -18.66947364807129, -17.6171875, -16.564903259277344, -15.512617111206055, -14.460331916809082, -13.40804672241211, -12.35576057434082, -11.303476333618164, -10.251190185546875, -9.198904991149902, -8.14661979675293, -7.094334602355957, -6.042049407958984, -4.989764213562012, -3.937478542327881, -2.885193347930908, -1.8329081535339355, -0.7806224822998047, 0.27166271209716797, 1.3239479064941406, 2.3762331008911133, 3.428518533706665, 4.480803966522217, 5.5330891609191895, 6.585374355316162, 7.637660026550293, 8.689945220947266, 9.742230415344238, 10.794515609741211, 11.846800804138184, 12.899085998535156, 13.951372146606445, 15.003656387329102, 16.05594253540039, 17.108226776123047, 18.160512924194336, 19.212799072265625, 20.26508331298828, 21.31736946105957, 22.369653701782227, 23.421939849853516, 24.474224090576172, 25.52651023864746, 26.57879638671875, 27.63108253479004, 28.683366775512695, 29.735652923583984, 30.78793716430664, 31.84022331237793, 32.89250946044922, 33.944793701171875, 34.99707794189453]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 12.0, 10.0, 12.0, 11.0, 22.0, 22.0, 17.0, 19.0, 30.0, 41.0, 26.0, 49.0, 40.0, 35.0, 42.0, 57.0, 48.0, 38.0, 49.0, 35.0, 48.0, 45.0, 37.0, 41.0, 37.0, 28.0, 25.0, 25.0, 17.0, 21.0, 17.0, 5.0, 6.0, 9.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.25, -4.11309814453125, -3.9761962890625, -3.83929443359375, -3.702392578125, -3.56549072265625, -3.4285888671875, -3.29168701171875, -3.15478515625, -3.01788330078125, -2.8809814453125, -2.74407958984375, -2.607177734375, -2.47027587890625, -2.3333740234375, -2.19647216796875, -2.0595703125, -1.92266845703125, -1.7857666015625, -1.64886474609375, -1.511962890625, -1.37506103515625, -1.2381591796875, -1.10125732421875, -0.96435546875, -0.82745361328125, -0.6905517578125, -0.55364990234375, -0.416748046875, -0.27984619140625, -0.1429443359375, -0.00604248046875, 0.130859375, 0.26776123046875, 0.4046630859375, 0.54156494140625, 0.678466796875, 0.81536865234375, 0.9522705078125, 1.08917236328125, 1.22607421875, 1.36297607421875, 1.4998779296875, 1.63677978515625, 1.773681640625, 1.91058349609375, 2.0474853515625, 2.18438720703125, 2.3212890625, 2.45819091796875, 2.5950927734375, 2.73199462890625, 2.868896484375, 3.00579833984375, 3.1427001953125, 3.27960205078125, 3.41650390625, 3.55340576171875, 3.6903076171875, 3.82720947265625, 3.964111328125, 4.10101318359375, 4.2379150390625, 4.37481689453125, 4.51171875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 8.0, 9.0, 10.0, 16.0, 29.0, 50.0, 61.0, 115.0, 161.0, 211.0, 345.0, 509.0, 843.0, 1288.0, 1755.0, 2768.0, 4110.0, 6179.0, 9962.0, 15331.0, 23556.0, 36199.0, 54550.0, 80436.0, 111413.0, 140670.0, 148442.0, 125480.0, 93276.0, 65763.0, 43322.0, 28741.0, 18458.0, 11789.0, 7862.0, 5000.0, 3323.0, 2158.0, 1485.0, 951.0, 656.0, 406.0, 298.0, 173.0, 150.0, 68.0, 65.0, 39.0, 20.0, 20.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.489501953125, -0.4727516174316406, -0.45600128173828125, -0.4392509460449219, -0.4225006103515625, -0.4057502746582031, -0.38899993896484375, -0.3722496032714844, -0.355499267578125, -0.3387489318847656, -0.32199859619140625, -0.3052482604980469, -0.2884979248046875, -0.2717475891113281, -0.25499725341796875, -0.23824691772460938, -0.22149658203125, -0.20474624633789062, -0.18799591064453125, -0.17124557495117188, -0.1544952392578125, -0.13774490356445312, -0.12099456787109375, -0.10424423217773438, -0.087493896484375, -0.07074356079101562, -0.05399322509765625, -0.037242889404296875, -0.0204925537109375, -0.003742218017578125, 0.01300811767578125, 0.029758453369140625, 0.0465087890625, 0.06325912475585938, 0.08000946044921875, 0.09675979614257812, 0.1135101318359375, 0.13026046752929688, 0.14701080322265625, 0.16376113891601562, 0.180511474609375, 0.19726181030273438, 0.21401214599609375, 0.23076248168945312, 0.2475128173828125, 0.2642631530761719, 0.28101348876953125, 0.2977638244628906, 0.31451416015625, 0.3312644958496094, 0.34801483154296875, 0.3647651672363281, 0.3815155029296875, 0.3982658386230469, 0.41501617431640625, 0.4317665100097656, 0.448516845703125, 0.4652671813964844, 0.48201751708984375, 0.4987678527832031, 0.5155181884765625, 0.5322685241699219, 0.5490188598632812, 0.5657691955566406, 0.58251953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 10.0, 3.0, 11.0, 3.0, 11.0, 7.0, 21.0, 18.0, 19.0, 17.0, 32.0, 27.0, 52.0, 37.0, 35.0, 40.0, 36.0, 52.0, 48.0, 39.0, 1068.0, 56.0, 34.0, 41.0, 30.0, 38.0, 34.0, 34.0, 29.0, 23.0, 20.0, 21.0, 21.0, 17.0, 12.0, 9.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.91229248046875, -2.8187255859375, -2.72515869140625, -2.631591796875, -2.53802490234375, -2.4444580078125, -2.35089111328125, -2.25732421875, -2.16375732421875, -2.0701904296875, -1.97662353515625, -1.883056640625, -1.78948974609375, -1.6959228515625, -1.60235595703125, -1.5087890625, -1.41522216796875, -1.3216552734375, -1.22808837890625, -1.134521484375, -1.04095458984375, -0.9473876953125, -0.85382080078125, -0.76025390625, -0.66668701171875, -0.5731201171875, -0.47955322265625, -0.385986328125, -0.29241943359375, -0.1988525390625, -0.10528564453125, -0.01171875, 0.08184814453125, 0.1754150390625, 0.26898193359375, 0.362548828125, 0.45611572265625, 0.5496826171875, 0.64324951171875, 0.73681640625, 0.83038330078125, 0.9239501953125, 1.01751708984375, 1.111083984375, 1.20465087890625, 1.2982177734375, 1.39178466796875, 1.4853515625, 1.57891845703125, 1.6724853515625, 1.76605224609375, 1.859619140625, 1.95318603515625, 2.0467529296875, 2.14031982421875, 2.23388671875, 2.32745361328125, 2.4210205078125, 2.51458740234375, 2.608154296875, 2.70172119140625, 2.7952880859375, 2.88885498046875, 2.982421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 5.0, 5.0, 6.0, 12.0, 47.0, 51.0, 63.0, 114.0, 170.0, 256.0, 440.0, 692.0, 1051.0, 1660.0, 2648.0, 4122.0, 6504.0, 10795.0, 17387.0, 28413.0, 46870.0, 76339.0, 117885.0, 180077.0, 1204963.0, 143420.0, 96249.0, 60739.0, 37095.0, 22417.0, 13735.0, 8495.0, 5300.0, 3305.0, 2039.0, 1329.0, 856.0, 557.0, 344.0, 243.0, 130.0, 85.0, 76.0, 48.0, 33.0, 18.0, 18.0, 10.0, 6.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.373046875, -0.3614845275878906, -0.34992218017578125, -0.3383598327636719, -0.3267974853515625, -0.3152351379394531, -0.30367279052734375, -0.2921104431152344, -0.280548095703125, -0.2689857482910156, -0.25742340087890625, -0.24586105346679688, -0.2342987060546875, -0.22273635864257812, -0.21117401123046875, -0.19961166381835938, -0.18804931640625, -0.17648696899414062, -0.16492462158203125, -0.15336227416992188, -0.1417999267578125, -0.13023757934570312, -0.11867523193359375, -0.10711288452148438, -0.095550537109375, -0.08398818969726562, -0.07242584228515625, -0.060863494873046875, -0.0493011474609375, -0.037738800048828125, -0.02617645263671875, -0.014614105224609375, -0.0030517578125, 0.008510589599609375, 0.02007293701171875, 0.031635284423828125, 0.0431976318359375, 0.054759979248046875, 0.06632232666015625, 0.07788467407226562, 0.089447021484375, 0.10100936889648438, 0.11257171630859375, 0.12413406372070312, 0.1356964111328125, 0.14725875854492188, 0.15882110595703125, 0.17038345336914062, 0.18194580078125, 0.19350814819335938, 0.20507049560546875, 0.21663284301757812, 0.2281951904296875, 0.23975753784179688, 0.25131988525390625, 0.2628822326660156, 0.274444580078125, 0.2860069274902344, 0.29756927490234375, 0.3091316223144531, 0.3206939697265625, 0.3322563171386719, 0.34381866455078125, 0.3553810119628906, 0.366943359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 4.0, 7.0, 9.0, 8.0, 10.0, 16.0, 27.0, 35.0, 54.0, 65.0, 93.0, 106.0, 154.0, 106.0, 77.0, 59.0, 51.0, 35.0, 20.0, 17.0, 6.0, 8.0, 11.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0222930908203125, -0.021509170532226562, -0.020725250244140625, -0.019941329956054688, -0.01915740966796875, -0.018373489379882812, -0.017589569091796875, -0.016805648803710938, -0.016021728515625, -0.015237808227539062, -0.014453887939453125, -0.013669967651367188, -0.01288604736328125, -0.012102127075195312, -0.011318206787109375, -0.010534286499023438, -0.0097503662109375, -0.008966445922851562, -0.008182525634765625, -0.0073986053466796875, -0.00661468505859375, -0.0058307647705078125, -0.005046844482421875, -0.0042629241943359375, -0.00347900390625, -0.0026950836181640625, -0.001911163330078125, -0.0011272430419921875, -0.00034332275390625, 0.0004405975341796875, 0.001224517822265625, 0.0020084381103515625, 0.0027923583984375, 0.0035762786865234375, 0.004360198974609375, 0.0051441192626953125, 0.00592803955078125, 0.0067119598388671875, 0.007495880126953125, 0.008279800415039062, 0.009063720703125, 0.009847640991210938, 0.010631561279296875, 0.011415481567382812, 0.01219940185546875, 0.012983322143554688, 0.013767242431640625, 0.014551162719726562, 0.0153350830078125, 0.016119003295898438, 0.016902923583984375, 0.017686843872070312, 0.01847076416015625, 0.019254684448242188, 0.020038604736328125, 0.020822525024414062, 0.0216064453125, 0.022390365600585938, 0.023174285888671875, 0.023958206176757812, 0.02474212646484375, 0.025526046752929688, 0.026309967041015625, 0.027093887329101562, 0.0278778076171875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 9.0, 16.0, 16.0, 16.0, 42.0, 51.0, 112.0, 162.0, 312.0, 1072.0, 105326.0, 938804.0, 1756.0, 374.0, 173.0, 96.0, 66.0, 41.0, 32.0, 17.0, 14.0, 7.0, 10.0, 6.0, 2.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46875, -0.4553985595703125, -0.442047119140625, -0.4286956787109375, -0.41534423828125, -0.4019927978515625, -0.388641357421875, -0.3752899169921875, -0.3619384765625, -0.3485870361328125, -0.335235595703125, -0.3218841552734375, -0.30853271484375, -0.2951812744140625, -0.281829833984375, -0.2684783935546875, -0.255126953125, -0.2417755126953125, -0.228424072265625, -0.2150726318359375, -0.20172119140625, -0.1883697509765625, -0.175018310546875, -0.1616668701171875, -0.1483154296875, -0.1349639892578125, -0.121612548828125, -0.1082611083984375, -0.09490966796875, -0.0815582275390625, -0.068206787109375, -0.0548553466796875, -0.04150390625, -0.0281524658203125, -0.014801025390625, -0.0014495849609375, 0.01190185546875, 0.0252532958984375, 0.038604736328125, 0.0519561767578125, 0.0653076171875, 0.0786590576171875, 0.092010498046875, 0.1053619384765625, 0.11871337890625, 0.1320648193359375, 0.145416259765625, 0.1587677001953125, 0.172119140625, 0.1854705810546875, 0.198822021484375, 0.2121734619140625, 0.22552490234375, 0.2388763427734375, 0.252227783203125, 0.2655792236328125, 0.2789306640625, 0.2922821044921875, 0.305633544921875, 0.3189849853515625, 0.33233642578125, 0.3456878662109375, 0.359039306640625, 0.3723907470703125, 0.3857421875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 55.0, 772.0, 176.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16217412054538727, -0.15654630959033966, -0.15091849863529205, -0.14529068768024445, -0.13966286182403564, -0.13403505086898804, -0.12840723991394043, -0.12277942895889282, -0.11715161800384521, -0.11152380704879761, -0.10589599609375, -0.1002681776881218, -0.09464036673307419, -0.08901255577802658, -0.08338473737239838, -0.07775692641735077, -0.07212911546230316, -0.06650130450725555, -0.06087348982691765, -0.05524567514657974, -0.049617864191532135, -0.04399005323648453, -0.03836223855614662, -0.032734423875808716, -0.02710661292076111, -0.021478800103068352, -0.015850987285375595, -0.010223174467682838, -0.004595361649990082, 0.0010324511677026749, 0.0066602639853954315, 0.012288078665733337, 0.01791590452194214, 0.023543717339634895, 0.029171530157327652, 0.03479934483766556, 0.040427155792713165, 0.04605496674776077, 0.05168278142809868, 0.057310596108436584, 0.06293840706348419, 0.0685662180185318, 0.0741940289735794, 0.07982184737920761, 0.08544965833425522, 0.09107746928930283, 0.09670528769493103, 0.10233309864997864, 0.10796090960502625, 0.11358872056007385, 0.11921653151512146, 0.12484434992074966, 0.13047215342521667, 0.13609997928142548, 0.14172779023647308, 0.1473556011915207, 0.1529834121465683, 0.1586112231016159, 0.1642390340566635, 0.16986684501171112, 0.17549467086791992, 0.18112248182296753, 0.18675029277801514, 0.19237810373306274, 0.19800591468811035]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 9.0, 4.0, 12.0, 4.0, 13.0, 10.0, 19.0, 19.0, 18.0, 30.0, 30.0, 29.0, 34.0, 38.0, 24.0, 24.0, 37.0, 18.0, 39.0, 41.0, 29.0, 29.0, 31.0, 30.0, 35.0, 42.0, 44.0, 38.0, 31.0, 18.0, 21.0, 27.0, 28.0, 20.0, 22.0, 10.0, 11.0, 10.0, 6.0, 16.0, 13.0, 7.0, 7.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.020583808422088623, -0.019961532205343246, -0.01933925412595272, -0.018716976046562195, -0.018094699829816818, -0.01747242361307144, -0.016850145533680916, -0.01622786745429039, -0.015605591237545013, -0.014983314089477062, -0.014361036941409111, -0.01373875979334116, -0.013116482645273209, -0.012494205497205257, -0.011871928349137306, -0.011249651201069355, -0.010627374053001404, -0.010005096904933453, -0.009382819756865501, -0.00876054260879755, -0.008138265460729599, -0.007515988312661648, -0.006893711164593697, -0.006271434016525745, -0.005649156868457794, -0.005026879720389843, -0.004404602572321892, -0.0037823254242539406, -0.0031600482761859894, -0.002537771128118038, -0.001915493980050087, -0.0012932168319821358, -0.0006709396839141846, -4.866253584623337e-05, 0.0005736146122217178, 0.001195891760289669, 0.0018181689083576202, 0.0024404460564255714, 0.0030627232044935226, 0.003685000352561474, 0.004307277500629425, 0.004929554648697376, 0.0055518317967653275, 0.006174108944833279, 0.00679638609290123, 0.007418663240969181, 0.008040940389037132, 0.008663217537105083, 0.009285494685173035, 0.009907771833240986, 0.010530048981308937, 0.011152326129376888, 0.01177460327744484, 0.01239688042551279, 0.013019157573580742, 0.013641434721648693, 0.014263711869716644, 0.014885989017784595, 0.015508266165852547, 0.016130544245243073, 0.01675282046198845, 0.017375096678733826, 0.01799737475812435, 0.018619652837514877, 0.019241929054260254]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 12.0, 10.0, 12.0, 11.0, 22.0, 22.0, 17.0, 19.0, 29.0, 41.0, 27.0, 47.0, 41.0, 36.0, 41.0, 57.0, 48.0, 39.0, 48.0, 35.0, 48.0, 45.0, 37.0, 42.0, 37.0, 27.0, 26.0, 24.0, 18.0, 20.0, 17.0, 6.0, 6.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.25, -4.1131591796875, -3.976318359375, -3.8394775390625, -3.70263671875, -3.5657958984375, -3.428955078125, -3.2921142578125, -3.1552734375, -3.0184326171875, -2.881591796875, -2.7447509765625, -2.60791015625, -2.4710693359375, -2.334228515625, -2.1973876953125, -2.060546875, -1.9237060546875, -1.786865234375, -1.6500244140625, -1.51318359375, -1.3763427734375, -1.239501953125, -1.1026611328125, -0.9658203125, -0.8289794921875, -0.692138671875, -0.5552978515625, -0.41845703125, -0.2816162109375, -0.144775390625, -0.0079345703125, 0.12890625, 0.2657470703125, 0.402587890625, 0.5394287109375, 0.67626953125, 0.8131103515625, 0.949951171875, 1.0867919921875, 1.2236328125, 1.3604736328125, 1.497314453125, 1.6341552734375, 1.77099609375, 1.9078369140625, 2.044677734375, 2.1815185546875, 2.318359375, 2.4552001953125, 2.592041015625, 2.7288818359375, 2.86572265625, 3.0025634765625, 3.139404296875, 3.2762451171875, 3.4130859375, 3.5499267578125, 3.686767578125, 3.8236083984375, 3.96044921875, 4.0972900390625, 4.234130859375, 4.3709716796875, 4.5078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 8.0, 8.0, 9.0, 25.0, 27.0, 33.0, 81.0, 140.0, 206.0, 341.0, 688.0, 1252.0, 2202.0, 4221.0, 7552.0, 13529.0, 24202.0, 43590.0, 94214.0, 233912.0, 332663.0, 152248.0, 63574.0, 32219.0, 18458.0, 10451.0, 5817.0, 3148.0, 1668.0, 885.0, 481.0, 294.0, 146.0, 88.0, 69.0, 27.0, 31.0, 12.0, 10.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.125244140625, -3.02197265625, -2.918701171875, -2.8154296875, -2.712158203125, -2.60888671875, -2.505615234375, -2.40234375, -2.299072265625, -2.19580078125, -2.092529296875, -1.9892578125, -1.885986328125, -1.78271484375, -1.679443359375, -1.576171875, -1.472900390625, -1.36962890625, -1.266357421875, -1.1630859375, -1.059814453125, -0.95654296875, -0.853271484375, -0.75, -0.646728515625, -0.54345703125, -0.440185546875, -0.3369140625, -0.233642578125, -0.13037109375, -0.027099609375, 0.076171875, 0.179443359375, 0.28271484375, 0.385986328125, 0.4892578125, 0.592529296875, 0.69580078125, 0.799072265625, 0.90234375, 1.005615234375, 1.10888671875, 1.212158203125, 1.3154296875, 1.418701171875, 1.52197265625, 1.625244140625, 1.728515625, 1.831787109375, 1.93505859375, 2.038330078125, 2.1416015625, 2.244873046875, 2.34814453125, 2.451416015625, 2.5546875, 2.657958984375, 2.76123046875, 2.864501953125, 2.9677734375, 3.071044921875, 3.17431640625, 3.277587890625, 3.380859375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 7.0, 6.0, 9.0, 15.0, 18.0, 22.0, 21.0, 20.0, 16.0, 31.0, 27.0, 39.0, 34.0, 52.0, 59.0, 59.0, 118.0, 265.0, 1501.0, 200.0, 82.0, 83.0, 52.0, 33.0, 32.0, 34.0, 30.0, 31.0, 34.0, 21.0, 13.0, 15.0, 16.0, 9.0, 7.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.203125, -12.7373046875, -12.271484375, -11.8056640625, -11.33984375, -10.8740234375, -10.408203125, -9.9423828125, -9.4765625, -9.0107421875, -8.544921875, -8.0791015625, -7.61328125, -7.1474609375, -6.681640625, -6.2158203125, -5.75, -5.2841796875, -4.818359375, -4.3525390625, -3.88671875, -3.4208984375, -2.955078125, -2.4892578125, -2.0234375, -1.5576171875, -1.091796875, -0.6259765625, -0.16015625, 0.3056640625, 0.771484375, 1.2373046875, 1.703125, 2.1689453125, 2.634765625, 3.1005859375, 3.56640625, 4.0322265625, 4.498046875, 4.9638671875, 5.4296875, 5.8955078125, 6.361328125, 6.8271484375, 7.29296875, 7.7587890625, 8.224609375, 8.6904296875, 9.15625, 9.6220703125, 10.087890625, 10.5537109375, 11.01953125, 11.4853515625, 11.951171875, 12.4169921875, 12.8828125, 13.3486328125, 13.814453125, 14.2802734375, 14.74609375, 15.2119140625, 15.677734375, 16.1435546875, 16.609375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 6.0, 4.0, 14.0, 30.0, 28.0, 57.0, 69.0, 113.0, 164.0, 283.0, 592.0, 2881.0, 2121228.0, 1016304.0, 2531.0, 585.0, 321.0, 155.0, 94.0, 78.0, 45.0, 40.0, 23.0, 21.0, 10.0, 6.0, 12.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -42.15576171875, -40.5927734375, -39.02978515625, -37.466796875, -35.90380859375, -34.3408203125, -32.77783203125, -31.21484375, -29.65185546875, -28.0888671875, -26.52587890625, -24.962890625, -23.39990234375, -21.8369140625, -20.27392578125, -18.7109375, -17.14794921875, -15.5849609375, -14.02197265625, -12.458984375, -10.89599609375, -9.3330078125, -7.77001953125, -6.20703125, -4.64404296875, -3.0810546875, -1.51806640625, 0.044921875, 1.60791015625, 3.1708984375, 4.73388671875, 6.296875, 7.85986328125, 9.4228515625, 10.98583984375, 12.548828125, 14.11181640625, 15.6748046875, 17.23779296875, 18.80078125, 20.36376953125, 21.9267578125, 23.48974609375, 25.052734375, 26.61572265625, 28.1787109375, 29.74169921875, 31.3046875, 32.86767578125, 34.4306640625, 35.99365234375, 37.556640625, 39.11962890625, 40.6826171875, 42.24560546875, 43.80859375, 45.37158203125, 46.9345703125, 48.49755859375, 50.060546875, 51.62353515625, 53.1865234375, 54.74951171875, 56.3125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [427.0, 586.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.176066398620605, -0.4833803176879883, 7.209305763244629, 14.901991844177246, 22.594676971435547, 30.287364959716797, 37.98004913330078, 45.672733306884766, 53.365421295166016, 61.05810546875, 68.75079345703125, 76.4434814453125, 84.13616943359375, 91.828857421875, 99.52153778076172, 107.21421813964844, 114.90691375732422, 122.59960174560547, 130.2922821044922, 137.98497009277344, 145.6776580810547, 153.37034606933594, 161.0630340576172, 168.75570678710938, 176.44839477539062, 184.14108276367188, 191.83377075195312, 199.52645874023438, 207.21914672851562, 214.91183471679688, 222.60450744628906, 230.2971954345703, 237.98989868164062, 245.68258666992188, 253.37527465820312, 261.0679626464844, 268.7606506347656, 276.4533386230469, 284.1460266113281, 291.83868408203125, 299.5313720703125, 307.22406005859375, 314.916748046875, 322.60943603515625, 330.3021240234375, 337.99481201171875, 345.6875, 353.38018798828125, 361.0728759765625, 368.76556396484375, 376.458251953125, 384.15093994140625, 391.8436279296875, 399.53631591796875, 407.22900390625, 414.92169189453125, 422.6143798828125, 430.30706787109375, 437.999755859375, 445.69244384765625, 453.3851318359375, 461.07781982421875, 468.7705078125, 476.46319580078125, 484.1558532714844]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 7.0, 10.0, 12.0, 11.0, 12.0, 13.0, 16.0, 18.0, 25.0, 27.0, 33.0, 33.0, 26.0, 27.0, 37.0, 39.0, 32.0, 39.0, 42.0, 42.0, 39.0, 43.0, 21.0, 36.0, 28.0, 43.0, 37.0, 41.0, 23.0, 29.0, 26.0, 15.0, 24.0, 17.0, 13.0, 14.0, 11.0, 7.0, 8.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.046756744384766, -38.795963287353516, -37.545169830322266, -36.294376373291016, -35.0435791015625, -33.79278564453125, -32.5419921875, -31.29119873046875, -30.0404052734375, -28.78961181640625, -27.538818359375, -26.288022994995117, -25.037229537963867, -23.786436080932617, -22.535640716552734, -21.284847259521484, -20.034053802490234, -18.783260345458984, -17.532466888427734, -16.28167152404785, -15.030878067016602, -13.780084609985352, -12.529290199279785, -11.278495788574219, -10.027702331542969, -8.776908874511719, -7.526114463806152, -6.275320529937744, -5.024526596069336, -3.7737326622009277, -2.5229387283325195, -1.2721443176269531, -0.02135467529296875, 1.2294392585754395, 2.4802331924438477, 3.731027126312256, 4.981821060180664, 6.232614994049072, 7.4834089279174805, 8.734203338623047, 9.984996795654297, 11.235790252685547, 12.486584663391113, 13.73737907409668, 14.98817253112793, 16.23896598815918, 17.489761352539062, 18.740554809570312, 19.991348266601562, 21.242141723632812, 22.492935180664062, 23.743730545043945, 24.994524002075195, 26.245317459106445, 27.496112823486328, 28.746906280517578, 29.997699737548828, 31.248493194580078, 32.49928665161133, 33.75008010864258, 35.000877380371094, 36.251670837402344, 37.502464294433594, 38.753257751464844, 40.004051208496094]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 10.0, 19.0, 21.0, 19.0, 20.0, 22.0, 27.0, 30.0, 36.0, 39.0, 39.0, 37.0, 42.0, 47.0, 52.0, 39.0, 46.0, 37.0, 45.0, 47.0, 40.0, 29.0, 37.0, 31.0, 28.0, 21.0, 26.0, 23.0, 17.0, 9.0, 8.0, 8.0, 6.0, 3.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.09375, -3.95501708984375, -3.8162841796875, -3.67755126953125, -3.538818359375, -3.40008544921875, -3.2613525390625, -3.12261962890625, -2.98388671875, -2.84515380859375, -2.7064208984375, -2.56768798828125, -2.428955078125, -2.29022216796875, -2.1514892578125, -2.01275634765625, -1.8740234375, -1.73529052734375, -1.5965576171875, -1.45782470703125, -1.319091796875, -1.18035888671875, -1.0416259765625, -0.90289306640625, -0.76416015625, -0.62542724609375, -0.4866943359375, -0.34796142578125, -0.209228515625, -0.07049560546875, 0.0682373046875, 0.20697021484375, 0.345703125, 0.48443603515625, 0.6231689453125, 0.76190185546875, 0.900634765625, 1.03936767578125, 1.1781005859375, 1.31683349609375, 1.45556640625, 1.59429931640625, 1.7330322265625, 1.87176513671875, 2.010498046875, 2.14923095703125, 2.2879638671875, 2.42669677734375, 2.5654296875, 2.70416259765625, 2.8428955078125, 2.98162841796875, 3.120361328125, 3.25909423828125, 3.3978271484375, 3.53656005859375, 3.67529296875, 3.81402587890625, 3.9527587890625, 4.09149169921875, 4.230224609375, 4.36895751953125, 4.5076904296875, 4.64642333984375, 4.78515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 11.0, 18.0, 26.0, 34.0, 52.0, 78.0, 96.0, 161.0, 320.0, 499.0, 827.0, 1541.0, 2939.0, 6104.0, 15212.0, 43363.0, 142072.0, 483690.0, 1284316.0, 1394234.0, 567888.0, 168594.0, 50981.0, 17481.0, 6871.0, 3120.0, 1547.0, 855.0, 504.0, 307.0, 171.0, 118.0, 77.0, 51.0, 31.0, 20.0, 17.0, 16.0, 13.0, 6.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.89971923828125, -5.7213134765625, -5.54290771484375, -5.364501953125, -5.18609619140625, -5.0076904296875, -4.82928466796875, -4.65087890625, -4.47247314453125, -4.2940673828125, -4.11566162109375, -3.937255859375, -3.75885009765625, -3.5804443359375, -3.40203857421875, -3.2236328125, -3.04522705078125, -2.8668212890625, -2.68841552734375, -2.510009765625, -2.33160400390625, -2.1531982421875, -1.97479248046875, -1.79638671875, -1.61798095703125, -1.4395751953125, -1.26116943359375, -1.082763671875, -0.90435791015625, -0.7259521484375, -0.54754638671875, -0.369140625, -0.19073486328125, -0.0123291015625, 0.16607666015625, 0.344482421875, 0.52288818359375, 0.7012939453125, 0.87969970703125, 1.05810546875, 1.23651123046875, 1.4149169921875, 1.59332275390625, 1.771728515625, 1.95013427734375, 2.1285400390625, 2.30694580078125, 2.4853515625, 2.66375732421875, 2.8421630859375, 3.02056884765625, 3.198974609375, 3.37738037109375, 3.5557861328125, 3.73419189453125, 3.91259765625, 4.09100341796875, 4.2694091796875, 4.44781494140625, 4.626220703125, 4.80462646484375, 4.9830322265625, 5.16143798828125, 5.33984375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 1.0, 3.0, 8.0, 8.0, 15.0, 18.0, 19.0, 52.0, 75.0, 95.0, 170.0, 262.0, 359.0, 406.0, 563.0, 557.0, 458.0, 337.0, 222.0, 142.0, 105.0, 47.0, 44.0, 33.0, 21.0, 21.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.90625, -16.511962890625, -16.11767578125, -15.723388671875, -15.3291015625, -14.934814453125, -14.54052734375, -14.146240234375, -13.751953125, -13.357666015625, -12.96337890625, -12.569091796875, -12.1748046875, -11.780517578125, -11.38623046875, -10.991943359375, -10.59765625, -10.203369140625, -9.80908203125, -9.414794921875, -9.0205078125, -8.626220703125, -8.23193359375, -7.837646484375, -7.443359375, -7.049072265625, -6.65478515625, -6.260498046875, -5.8662109375, -5.471923828125, -5.07763671875, -4.683349609375, -4.2890625, -3.894775390625, -3.50048828125, -3.106201171875, -2.7119140625, -2.317626953125, -1.92333984375, -1.529052734375, -1.134765625, -0.740478515625, -0.34619140625, 0.048095703125, 0.4423828125, 0.836669921875, 1.23095703125, 1.625244140625, 2.01953125, 2.413818359375, 2.80810546875, 3.202392578125, 3.5966796875, 3.990966796875, 4.38525390625, 4.779541015625, 5.173828125, 5.568115234375, 5.96240234375, 6.356689453125, 6.7509765625, 7.145263671875, 7.53955078125, 7.933837890625, 8.328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 12.0, 22.0, 23.0, 39.0, 56.0, 99.0, 191.0, 392.0, 841.0, 2540.0, 13156.0, 170703.0, 2795884.0, 1146506.0, 54767.0, 6215.0, 1588.0, 600.0, 284.0, 144.0, 82.0, 48.0, 24.0, 21.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -13.9814453125, -13.275390625, -12.5693359375, -11.86328125, -11.1572265625, -10.451171875, -9.7451171875, -9.0390625, -8.3330078125, -7.626953125, -6.9208984375, -6.21484375, -5.5087890625, -4.802734375, -4.0966796875, -3.390625, -2.6845703125, -1.978515625, -1.2724609375, -0.56640625, 0.1396484375, 0.845703125, 1.5517578125, 2.2578125, 2.9638671875, 3.669921875, 4.3759765625, 5.08203125, 5.7880859375, 6.494140625, 7.2001953125, 7.90625, 8.6123046875, 9.318359375, 10.0244140625, 10.73046875, 11.4365234375, 12.142578125, 12.8486328125, 13.5546875, 14.2607421875, 14.966796875, 15.6728515625, 16.37890625, 17.0849609375, 17.791015625, 18.4970703125, 19.203125, 19.9091796875, 20.615234375, 21.3212890625, 22.02734375, 22.7333984375, 23.439453125, 24.1455078125, 24.8515625, 25.5576171875, 26.263671875, 26.9697265625, 27.67578125, 28.3818359375, 29.087890625, 29.7939453125, 30.5]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 20.0, 54.0, 90.0, 202.0, 204.0, 210.0, 129.0, 58.0, 28.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.40191650390625, -151.1575164794922, -147.91311645507812, -144.66871643066406, -141.42431640625, -138.17991638183594, -134.93551635742188, -131.6911163330078, -128.44671630859375, -125.20231628417969, -121.95791625976562, -118.71351623535156, -115.4691162109375, -112.22471618652344, -108.98031616210938, -105.73591613769531, -102.49152374267578, -99.24712371826172, -96.00272369384766, -92.7583236694336, -89.51392364501953, -86.26952362060547, -83.02513122558594, -79.78073120117188, -76.53633117675781, -73.29193115234375, -70.04753112792969, -66.80313110351562, -63.55873107910156, -60.3143310546875, -57.0699348449707, -53.82553482055664, -50.58113479614258, -47.336734771728516, -44.09233474731445, -40.847938537597656, -37.603538513183594, -34.35913848876953, -31.11473846435547, -27.870338439941406, -24.625938415527344, -21.38153839111328, -18.13713836669922, -14.892740249633789, -11.648340225219727, -8.403940200805664, -5.159542083740234, -1.9151420593261719, 1.3292579650878906, 4.573657512664795, 7.818057060241699, 11.062456130981445, 14.306856155395508, 17.55125617980957, 20.795654296875, 24.040054321289062, 27.284454345703125, 30.528854370117188, 33.77325439453125, 37.01765441894531, 40.262054443359375, 43.50645446777344, 46.750850677490234, 49.9952507019043, 53.23965072631836]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 9.0, 3.0, 10.0, 14.0, 19.0, 8.0, 16.0, 22.0, 21.0, 36.0, 35.0, 38.0, 30.0, 36.0, 34.0, 31.0, 48.0, 41.0, 35.0, 54.0, 43.0, 36.0, 33.0, 41.0, 43.0, 34.0, 35.0, 28.0, 17.0, 36.0, 14.0, 17.0, 22.0, 10.0, 10.0, 6.0, 4.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.089622497558594, -30.034391403198242, -28.97916030883789, -27.923927307128906, -26.868696212768555, -25.813465118408203, -24.75823402404785, -23.7030029296875, -22.647769927978516, -21.592538833618164, -20.537307739257812, -19.482074737548828, -18.426843643188477, -17.371612548828125, -16.316381454467773, -15.261150360107422, -14.20591926574707, -13.150688171386719, -12.09545612335205, -11.0402250289917, -9.984992980957031, -8.92976188659668, -7.874530792236328, -6.819299221038818, -5.764067649841309, -4.708836078643799, -3.653604745864868, -2.5983734130859375, -1.5431418418884277, -0.48791027069091797, 0.5673208236694336, 1.6225523948669434, 2.677783966064453, 3.733015537261963, 4.788247108459473, 5.843478202819824, 6.898709774017334, 7.953941345214844, 9.009172439575195, 10.064403533935547, 11.119635581970215, 12.174866676330566, 13.230098724365234, 14.285329818725586, 15.340560913085938, 16.395793914794922, 17.45102310180664, 18.506256103515625, 19.561487197875977, 20.616718292236328, 21.67194938659668, 22.72718048095703, 23.782413482666016, 24.837644577026367, 25.89287567138672, 26.94810676574707, 28.003337860107422, 29.058568954467773, 30.113800048828125, 31.16903305053711, 32.22426223754883, 33.27949523925781, 34.33472442626953, 35.389957427978516, 36.4451904296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 4.0, 4.0, 12.0, 5.0, 14.0, 17.0, 18.0, 27.0, 20.0, 29.0, 32.0, 29.0, 31.0, 40.0, 39.0, 45.0, 48.0, 34.0, 38.0, 55.0, 43.0, 45.0, 39.0, 34.0, 39.0, 32.0, 34.0, 34.0, 26.0, 17.0, 19.0, 11.0, 12.0, 19.0, 9.0, 6.0, 2.0, 8.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.908203125, -3.772247314453125, -3.63629150390625, -3.500335693359375, -3.3643798828125, -3.228424072265625, -3.09246826171875, -2.956512451171875, -2.820556640625, -2.684600830078125, -2.54864501953125, -2.412689208984375, -2.2767333984375, -2.140777587890625, -2.00482177734375, -1.868865966796875, -1.73291015625, -1.596954345703125, -1.46099853515625, -1.325042724609375, -1.1890869140625, -1.053131103515625, -0.91717529296875, -0.781219482421875, -0.645263671875, -0.509307861328125, -0.37335205078125, -0.237396240234375, -0.1014404296875, 0.034515380859375, 0.17047119140625, 0.306427001953125, 0.4423828125, 0.578338623046875, 0.71429443359375, 0.850250244140625, 0.9862060546875, 1.122161865234375, 1.25811767578125, 1.394073486328125, 1.530029296875, 1.665985107421875, 1.80194091796875, 1.937896728515625, 2.0738525390625, 2.209808349609375, 2.34576416015625, 2.481719970703125, 2.61767578125, 2.753631591796875, 2.88958740234375, 3.025543212890625, 3.1614990234375, 3.297454833984375, 3.43341064453125, 3.569366455078125, 3.705322265625, 3.841278076171875, 3.97723388671875, 4.113189697265625, 4.2491455078125, 4.385101318359375, 4.52105712890625, 4.657012939453125, 4.79296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 9.0, 11.0, 6.0, 22.0, 30.0, 46.0, 91.0, 112.0, 210.0, 341.0, 548.0, 897.0, 1456.0, 2481.0, 4157.0, 6907.0, 12259.0, 21374.0, 37066.0, 62979.0, 102846.0, 153025.0, 186872.0, 165440.0, 116008.0, 71975.0, 42661.0, 24301.0, 14141.0, 7983.0, 4976.0, 2875.0, 1697.0, 1050.0, 674.0, 390.0, 245.0, 147.0, 109.0, 53.0, 41.0, 18.0, 10.0, 6.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68896484375, -0.666473388671875, -0.64398193359375, -0.621490478515625, -0.5989990234375, -0.576507568359375, -0.55401611328125, -0.531524658203125, -0.509033203125, -0.486541748046875, -0.46405029296875, -0.441558837890625, -0.4190673828125, -0.396575927734375, -0.37408447265625, -0.351593017578125, -0.3291015625, -0.306610107421875, -0.28411865234375, -0.261627197265625, -0.2391357421875, -0.216644287109375, -0.19415283203125, -0.171661376953125, -0.149169921875, -0.126678466796875, -0.10418701171875, -0.081695556640625, -0.0592041015625, -0.036712646484375, -0.01422119140625, 0.008270263671875, 0.03076171875, 0.053253173828125, 0.07574462890625, 0.098236083984375, 0.1207275390625, 0.143218994140625, 0.16571044921875, 0.188201904296875, 0.210693359375, 0.233184814453125, 0.25567626953125, 0.278167724609375, 0.3006591796875, 0.323150634765625, 0.34564208984375, 0.368133544921875, 0.390625, 0.413116455078125, 0.43560791015625, 0.458099365234375, 0.4805908203125, 0.503082275390625, 0.52557373046875, 0.548065185546875, 0.570556640625, 0.593048095703125, 0.61553955078125, 0.638031005859375, 0.6605224609375, 0.683013916015625, 0.70550537109375, 0.727996826171875, 0.75048828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 9.0, 10.0, 8.0, 14.0, 15.0, 21.0, 15.0, 16.0, 24.0, 34.0, 34.0, 29.0, 28.0, 46.0, 38.0, 36.0, 39.0, 46.0, 1070.0, 39.0, 44.0, 36.0, 43.0, 34.0, 46.0, 36.0, 33.0, 21.0, 22.0, 21.0, 20.0, 19.0, 16.0, 16.0, 13.0, 11.0, 4.0, 3.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.510650634765625, -2.40997314453125, -2.309295654296875, -2.2086181640625, -2.107940673828125, -2.00726318359375, -1.906585693359375, -1.805908203125, -1.705230712890625, -1.60455322265625, -1.503875732421875, -1.4031982421875, -1.302520751953125, -1.20184326171875, -1.101165771484375, -1.00048828125, -0.899810791015625, -0.79913330078125, -0.698455810546875, -0.5977783203125, -0.497100830078125, -0.39642333984375, -0.295745849609375, -0.195068359375, -0.094390869140625, 0.00628662109375, 0.106964111328125, 0.2076416015625, 0.308319091796875, 0.40899658203125, 0.509674072265625, 0.6103515625, 0.711029052734375, 0.81170654296875, 0.912384033203125, 1.0130615234375, 1.113739013671875, 1.21441650390625, 1.315093994140625, 1.415771484375, 1.516448974609375, 1.61712646484375, 1.717803955078125, 1.8184814453125, 1.919158935546875, 2.01983642578125, 2.120513916015625, 2.22119140625, 2.321868896484375, 2.42254638671875, 2.523223876953125, 2.6239013671875, 2.724578857421875, 2.82525634765625, 2.925933837890625, 3.026611328125, 3.127288818359375, 3.22796630859375, 3.328643798828125, 3.4293212890625, 3.529998779296875, 3.63067626953125, 3.731353759765625, 3.83203125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 17.0, 6.0, 24.0, 22.0, 33.0, 75.0, 94.0, 156.0, 245.0, 384.0, 661.0, 1124.0, 1728.0, 2879.0, 4553.0, 7800.0, 12968.0, 21814.0, 37609.0, 63302.0, 101329.0, 149641.0, 1211148.0, 176875.0, 117278.0, 75097.0, 45093.0, 26336.0, 15462.0, 9182.0, 5529.0, 3216.0, 2107.0, 1238.0, 810.0, 456.0, 298.0, 204.0, 122.0, 83.0, 62.0, 31.0, 14.0, 14.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.440673828125, -0.4279632568359375, -0.415252685546875, -0.4025421142578125, -0.38983154296875, -0.3771209716796875, -0.364410400390625, -0.3516998291015625, -0.3389892578125, -0.3262786865234375, -0.313568115234375, -0.3008575439453125, -0.28814697265625, -0.2754364013671875, -0.262725830078125, -0.2500152587890625, -0.2373046875, -0.2245941162109375, -0.211883544921875, -0.1991729736328125, -0.18646240234375, -0.1737518310546875, -0.161041259765625, -0.1483306884765625, -0.1356201171875, -0.1229095458984375, -0.110198974609375, -0.0974884033203125, -0.08477783203125, -0.0720672607421875, -0.059356689453125, -0.0466461181640625, -0.033935546875, -0.0212249755859375, -0.008514404296875, 0.0041961669921875, 0.01690673828125, 0.0296173095703125, 0.042327880859375, 0.0550384521484375, 0.0677490234375, 0.0804595947265625, 0.093170166015625, 0.1058807373046875, 0.11859130859375, 0.1313018798828125, 0.144012451171875, 0.1567230224609375, 0.16943359375, 0.1821441650390625, 0.194854736328125, 0.2075653076171875, 0.22027587890625, 0.2329864501953125, 0.245697021484375, 0.2584075927734375, 0.2711181640625, 0.2838287353515625, 0.296539306640625, 0.3092498779296875, 0.32196044921875, 0.3346710205078125, 0.347381591796875, 0.3600921630859375, 0.372802734375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 7.0, 10.0, 17.0, 23.0, 24.0, 39.0, 34.0, 45.0, 46.0, 61.0, 58.0, 50.0, 74.0, 78.0, 55.0, 53.0, 44.0, 48.0, 44.0, 32.0, 33.0, 17.0, 24.0, 25.0, 15.0, 5.0, 5.0, 4.0, 4.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0194091796875, -0.018801212310791016, -0.01819324493408203, -0.017585277557373047, -0.016977310180664062, -0.016369342803955078, -0.015761375427246094, -0.01515340805053711, -0.014545440673828125, -0.01393747329711914, -0.013329505920410156, -0.012721538543701172, -0.012113571166992188, -0.011505603790283203, -0.010897636413574219, -0.010289669036865234, -0.00968170166015625, -0.009073734283447266, -0.008465766906738281, -0.007857799530029297, -0.0072498321533203125, -0.006641864776611328, -0.006033897399902344, -0.005425930023193359, -0.004817962646484375, -0.004209995269775391, -0.0036020278930664062, -0.002994060516357422, -0.0023860931396484375, -0.0017781257629394531, -0.0011701583862304688, -0.0005621910095214844, 4.57763671875e-05, 0.0006537437438964844, 0.0012617111206054688, 0.0018696784973144531, 0.0024776458740234375, 0.003085613250732422, 0.0036935806274414062, 0.004301548004150391, 0.004909515380859375, 0.005517482757568359, 0.006125450134277344, 0.006733417510986328, 0.0073413848876953125, 0.007949352264404297, 0.008557319641113281, 0.009165287017822266, 0.00977325439453125, 0.010381221771240234, 0.010989189147949219, 0.011597156524658203, 0.012205123901367188, 0.012813091278076172, 0.013421058654785156, 0.01402902603149414, 0.014636993408203125, 0.01524496078491211, 0.015852928161621094, 0.016460895538330078, 0.017068862915039062, 0.017676830291748047, 0.01828479766845703, 0.018892765045166016, 0.019500732421875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 5.0, 2.0, 19.0, 20.0, 25.0, 29.0, 36.0, 36.0, 55.0, 119.0, 158.0, 269.0, 528.0, 1267.0, 122106.0, 920240.0, 2089.0, 593.0, 320.0, 205.0, 121.0, 90.0, 57.0, 45.0, 28.0, 24.0, 15.0, 9.0, 5.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.333251953125, -0.3228797912597656, -0.31250762939453125, -0.3021354675292969, -0.2917633056640625, -0.2813911437988281, -0.27101898193359375, -0.2606468200683594, -0.250274658203125, -0.23990249633789062, -0.22953033447265625, -0.21915817260742188, -0.2087860107421875, -0.19841384887695312, -0.18804168701171875, -0.17766952514648438, -0.16729736328125, -0.15692520141601562, -0.14655303955078125, -0.13618087768554688, -0.1258087158203125, -0.11543655395507812, -0.10506439208984375, -0.09469223022460938, -0.084320068359375, -0.07394790649414062, -0.06357574462890625, -0.053203582763671875, -0.0428314208984375, -0.032459259033203125, -0.02208709716796875, -0.011714935302734375, -0.0013427734375, 0.009029388427734375, 0.01940155029296875, 0.029773712158203125, 0.0401458740234375, 0.050518035888671875, 0.06089019775390625, 0.07126235961914062, 0.081634521484375, 0.09200668334960938, 0.10237884521484375, 0.11275100708007812, 0.1231231689453125, 0.13349533081054688, 0.14386749267578125, 0.15423965454101562, 0.16461181640625, 0.17498397827148438, 0.18535614013671875, 0.19572830200195312, 0.2061004638671875, 0.21647262573242188, 0.22684478759765625, 0.23721694946289062, 0.247589111328125, 0.2579612731933594, 0.26833343505859375, 0.2787055969238281, 0.2890777587890625, 0.2994499206542969, 0.30982208251953125, 0.3201942443847656, 0.33056640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 16.0, 72.0, 627.0, 282.0, 15.0], "bins": [-0.255596786737442, -0.251468300819397, -0.24733978509902954, -0.2432112991809845, -0.23908279836177826, -0.23495429754257202, -0.23082581162452698, -0.22669731080532074, -0.2225688099861145, -0.21844030916690826, -0.21431180834770203, -0.21018332242965698, -0.20605482161045074, -0.2019263207912445, -0.19779783487319946, -0.19366933405399323, -0.189540833234787, -0.18541233241558075, -0.1812838315963745, -0.17715534567832947, -0.17302684485912323, -0.168898344039917, -0.16476985812187195, -0.1606413573026657, -0.15651285648345947, -0.15238435566425323, -0.148255854845047, -0.14412736892700195, -0.13999886810779572, -0.13587036728858948, -0.13174188137054443, -0.1276133805513382, -0.12348486483097076, -0.11935636401176453, -0.11522787064313889, -0.11109937727451324, -0.106970876455307, -0.10284237563610077, -0.09871388226747513, -0.09458538889884949, -0.09045688807964325, -0.08632838726043701, -0.08219989389181137, -0.07807140052318573, -0.07394289970397949, -0.06981439888477325, -0.06568590551614761, -0.061557408422231674, -0.057428911328315735, -0.053300414234399796, -0.049171917140483856, -0.04504342004656792, -0.04091492295265198, -0.03678642585873604, -0.0326579287648201, -0.02852943167090416, -0.02440093457698822, -0.02027243748307228, -0.01614394038915634, -0.012015443295240402, -0.007886946201324463, -0.0037584491074085236, 0.00037004798650741577, 0.004498545080423355, 0.00862704124301672]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 16.0, 10.0, 20.0, 20.0, 26.0, 33.0, 30.0, 24.0, 42.0, 34.0, 37.0, 32.0, 42.0, 37.0, 58.0, 45.0, 33.0, 28.0, 46.0, 45.0, 36.0, 39.0, 37.0, 32.0, 27.0, 25.0, 25.0, 17.0, 14.0, 21.0, 16.0, 14.0, 10.0, 3.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026240408420562744, -0.025387877598404884, -0.024535346776247025, -0.023682815954089165, -0.022830285131931305, -0.021977754309773445, -0.021125223487615585, -0.020272692665457726, -0.019420161843299866, -0.018567631021142006, -0.017715100198984146, -0.016862569376826286, -0.016010038554668427, -0.015157507732510567, -0.014304976910352707, -0.013452446088194847, -0.012599915266036987, -0.011747384443879128, -0.010894853621721268, -0.010042322799563408, -0.009189791977405548, -0.008337261155247688, -0.0074847303330898285, -0.006632199510931969, -0.005779668688774109, -0.004927137866616249, -0.004074607044458389, -0.0032220762223005295, -0.0023695454001426697, -0.0015170145779848099, -0.0006644837558269501, 0.00018804706633090973, 0.0010405778884887695, 0.0018931087106466293, 0.002745639532804489, 0.003598170354962349, 0.004450701177120209, 0.0053032319992780685, 0.006155762821435928, 0.007008293643593788, 0.007860824465751648, 0.008713355287909508, 0.009565886110067368, 0.010418416932225227, 0.011270947754383087, 0.012123478576540947, 0.012976009398698807, 0.013828540220856667, 0.014681071043014526, 0.015533601865172386, 0.016386132687330246, 0.017238663509488106, 0.018091194331645966, 0.018943725153803825, 0.019796255975961685, 0.020648786798119545, 0.021501317620277405, 0.022353848442435265, 0.023206379264593124, 0.024058910086750984, 0.024911440908908844, 0.025763971731066704, 0.026616502553224564, 0.027469033375382423, 0.028321564197540283]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 4.0, 3.0, 13.0, 5.0, 14.0, 17.0, 18.0, 27.0, 19.0, 29.0, 33.0, 29.0, 31.0, 40.0, 39.0, 43.0, 50.0, 34.0, 38.0, 55.0, 42.0, 46.0, 39.0, 34.0, 39.0, 32.0, 34.0, 34.0, 26.0, 17.0, 19.0, 11.0, 12.0, 19.0, 9.0, 6.0, 2.0, 8.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.91015625, -3.774169921875, -3.63818359375, -3.502197265625, -3.3662109375, -3.230224609375, -3.09423828125, -2.958251953125, -2.822265625, -2.686279296875, -2.55029296875, -2.414306640625, -2.2783203125, -2.142333984375, -2.00634765625, -1.870361328125, -1.734375, -1.598388671875, -1.46240234375, -1.326416015625, -1.1904296875, -1.054443359375, -0.91845703125, -0.782470703125, -0.646484375, -0.510498046875, -0.37451171875, -0.238525390625, -0.1025390625, 0.033447265625, 0.16943359375, 0.305419921875, 0.44140625, 0.577392578125, 0.71337890625, 0.849365234375, 0.9853515625, 1.121337890625, 1.25732421875, 1.393310546875, 1.529296875, 1.665283203125, 1.80126953125, 1.937255859375, 2.0732421875, 2.209228515625, 2.34521484375, 2.481201171875, 2.6171875, 2.753173828125, 2.88916015625, 3.025146484375, 3.1611328125, 3.297119140625, 3.43310546875, 3.569091796875, 3.705078125, 3.841064453125, 3.97705078125, 4.113037109375, 4.2490234375, 4.385009765625, 4.52099609375, 4.656982421875, 4.79296875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 13.0, 9.0, 13.0, 20.0, 28.0, 48.0, 53.0, 94.0, 111.0, 223.0, 308.0, 449.0, 781.0, 1292.0, 2235.0, 3930.0, 7748.0, 14883.0, 28741.0, 55935.0, 109372.0, 207210.0, 269167.0, 166648.0, 86297.0, 44566.0, 22726.0, 11610.0, 6121.0, 3314.0, 1821.0, 1055.0, 609.0, 366.0, 229.0, 151.0, 108.0, 70.0, 50.0, 41.0, 23.0, 28.0, 14.0, 13.0, 4.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.7890625, -3.6680908203125, -3.547119140625, -3.4261474609375, -3.30517578125, -3.1842041015625, -3.063232421875, -2.9422607421875, -2.8212890625, -2.7003173828125, -2.579345703125, -2.4583740234375, -2.33740234375, -2.2164306640625, -2.095458984375, -1.9744873046875, -1.853515625, -1.7325439453125, -1.611572265625, -1.4906005859375, -1.36962890625, -1.2486572265625, -1.127685546875, -1.0067138671875, -0.8857421875, -0.7647705078125, -0.643798828125, -0.5228271484375, -0.40185546875, -0.2808837890625, -0.159912109375, -0.0389404296875, 0.08203125, 0.2030029296875, 0.323974609375, 0.4449462890625, 0.56591796875, 0.6868896484375, 0.807861328125, 0.9288330078125, 1.0498046875, 1.1707763671875, 1.291748046875, 1.4127197265625, 1.53369140625, 1.6546630859375, 1.775634765625, 1.8966064453125, 2.017578125, 2.1385498046875, 2.259521484375, 2.3804931640625, 2.50146484375, 2.6224365234375, 2.743408203125, 2.8643798828125, 2.9853515625, 3.1063232421875, 3.227294921875, 3.3482666015625, 3.46923828125, 3.5902099609375, 3.711181640625, 3.8321533203125, 3.953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 4.0, 11.0, 8.0, 13.0, 18.0, 29.0, 20.0, 30.0, 33.0, 34.0, 51.0, 56.0, 80.0, 81.0, 144.0, 374.0, 1407.0, 198.0, 89.0, 59.0, 46.0, 38.0, 44.0, 33.0, 31.0, 22.0, 16.0, 16.0, 14.0, 9.0, 12.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.4033203125, -16.806640625, -16.2099609375, -15.61328125, -15.0166015625, -14.419921875, -13.8232421875, -13.2265625, -12.6298828125, -12.033203125, -11.4365234375, -10.83984375, -10.2431640625, -9.646484375, -9.0498046875, -8.453125, -7.8564453125, -7.259765625, -6.6630859375, -6.06640625, -5.4697265625, -4.873046875, -4.2763671875, -3.6796875, -3.0830078125, -2.486328125, -1.8896484375, -1.29296875, -0.6962890625, -0.099609375, 0.4970703125, 1.09375, 1.6904296875, 2.287109375, 2.8837890625, 3.48046875, 4.0771484375, 4.673828125, 5.2705078125, 5.8671875, 6.4638671875, 7.060546875, 7.6572265625, 8.25390625, 8.8505859375, 9.447265625, 10.0439453125, 10.640625, 11.2373046875, 11.833984375, 12.4306640625, 13.02734375, 13.6240234375, 14.220703125, 14.8173828125, 15.4140625, 16.0107421875, 16.607421875, 17.2041015625, 17.80078125, 18.3974609375, 18.994140625, 19.5908203125, 20.1875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 12.0, 20.0, 38.0, 39.0, 58.0, 120.0, 199.0, 305.0, 817.0, 16791.0, 3116965.0, 8764.0, 747.0, 350.0, 183.0, 116.0, 68.0, 45.0, 28.0, 12.0, 14.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.03125, -58.88525390625, -56.7392578125, -54.59326171875, -52.447265625, -50.30126953125, -48.1552734375, -46.00927734375, -43.86328125, -41.71728515625, -39.5712890625, -37.42529296875, -35.279296875, -33.13330078125, -30.9873046875, -28.84130859375, -26.6953125, -24.54931640625, -22.4033203125, -20.25732421875, -18.111328125, -15.96533203125, -13.8193359375, -11.67333984375, -9.52734375, -7.38134765625, -5.2353515625, -3.08935546875, -0.943359375, 1.20263671875, 3.3486328125, 5.49462890625, 7.640625, 9.78662109375, 11.9326171875, 14.07861328125, 16.224609375, 18.37060546875, 20.5166015625, 22.66259765625, 24.80859375, 26.95458984375, 29.1005859375, 31.24658203125, 33.392578125, 35.53857421875, 37.6845703125, 39.83056640625, 41.9765625, 44.12255859375, 46.2685546875, 48.41455078125, 50.560546875, 52.70654296875, 54.8525390625, 56.99853515625, 59.14453125, 61.29052734375, 63.4365234375, 65.58251953125, 67.728515625, 69.87451171875, 72.0205078125, 74.16650390625, 76.3125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [2.0, 517.0, 496.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.420413970947266, -9.360157012939453, -0.2999000549316406, 8.760356903076172, 17.820613861083984, 26.880870819091797, 35.94112777709961, 45.00138473510742, 54.061641693115234, 63.12189865112305, 72.18215942382812, 81.24241638183594, 90.30267333984375, 99.36293029785156, 108.42318725585938, 117.48344421386719, 126.543701171875, 135.6039581298828, 144.66421508789062, 153.72447204589844, 162.78472900390625, 171.84498596191406, 180.90524291992188, 189.9654998779297, 199.0257568359375, 208.0860137939453, 217.14627075195312, 226.20652770996094, 235.26678466796875, 244.32704162597656, 253.38729858398438, 262.44757080078125, 271.5078125, 280.56805419921875, 289.6283264160156, 298.6885986328125, 307.74884033203125, 316.80908203125, 325.8693542480469, 334.92962646484375, 343.9898681640625, 353.05010986328125, 362.1103820800781, 371.170654296875, 380.23089599609375, 389.2911376953125, 398.3514099121094, 407.41168212890625, 416.471923828125, 425.53216552734375, 434.5924377441406, 443.6527099609375, 452.71295166015625, 461.773193359375, 470.8334655761719, 479.89373779296875, 488.9539794921875, 498.01422119140625, 507.0744934082031, 516.134765625, 525.1950073242188, 534.2552490234375, 543.3155517578125, 552.3757934570312, 561.43603515625]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 4.0, 7.0, 7.0, 10.0, 16.0, 16.0, 18.0, 18.0, 19.0, 28.0, 28.0, 22.0, 35.0, 46.0, 47.0, 46.0, 42.0, 49.0, 38.0, 46.0, 35.0, 45.0, 42.0, 33.0, 30.0, 29.0, 39.0, 26.0, 25.0, 25.0, 29.0, 19.0, 10.0, 12.0, 13.0, 9.0, 9.0, 4.0, 5.0, 9.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.22984313964844, -40.94559097290039, -39.66133499145508, -38.37708282470703, -37.09282684326172, -35.80857467651367, -34.524322509765625, -33.24006652832031, -31.955814361572266, -30.671560287475586, -29.387306213378906, -28.10305404663086, -26.81879997253418, -25.5345458984375, -24.25029182434082, -22.96603775024414, -21.68178367614746, -20.39752960205078, -19.1132755279541, -17.829021453857422, -16.544769287109375, -15.260515213012695, -13.976261138916016, -12.692008018493652, -11.407753944396973, -10.123499870300293, -8.83924674987793, -7.55499267578125, -6.2707390785217285, -4.986485481262207, -3.7022314071655273, -2.417978286743164, -1.1337242126464844, 0.15052950382232666, 1.4347832202911377, 2.7190370559692383, 4.00329065322876, 5.287544250488281, 6.571798324584961, 7.856051445007324, 9.140305519104004, 10.424559593200684, 11.708812713623047, 12.993066787719727, 14.277320861816406, 15.56157398223877, 16.845829010009766, 18.130081176757812, 19.414335250854492, 20.698589324951172, 21.98284339904785, 23.26709747314453, 24.551349639892578, 25.835603713989258, 27.119857788085938, 28.404109954833984, 29.688365936279297, 30.972620010375977, 32.256874084472656, 33.5411262512207, 34.825382232666016, 36.10963439941406, 37.393890380859375, 38.67814254760742, 39.96239471435547]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 5.0, 4.0, 6.0, 10.0, 12.0, 16.0, 14.0, 14.0, 28.0, 24.0, 24.0, 28.0, 39.0, 35.0, 29.0, 30.0, 36.0, 53.0, 35.0, 40.0, 42.0, 44.0, 37.0, 34.0, 51.0, 35.0, 34.0, 35.0, 30.0, 24.0, 29.0, 24.0, 15.0, 13.0, 11.0, 12.0, 4.0, 7.0, 10.0, 3.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-4.109375, -3.96795654296875, -3.8265380859375, -3.68511962890625, -3.543701171875, -3.40228271484375, -3.2608642578125, -3.11944580078125, -2.97802734375, -2.83660888671875, -2.6951904296875, -2.55377197265625, -2.412353515625, -2.27093505859375, -2.1295166015625, -1.98809814453125, -1.8466796875, -1.70526123046875, -1.5638427734375, -1.42242431640625, -1.281005859375, -1.13958740234375, -0.9981689453125, -0.85675048828125, -0.71533203125, -0.57391357421875, -0.4324951171875, -0.29107666015625, -0.149658203125, -0.00823974609375, 0.1331787109375, 0.27459716796875, 0.416015625, 0.55743408203125, 0.6988525390625, 0.84027099609375, 0.981689453125, 1.12310791015625, 1.2645263671875, 1.40594482421875, 1.54736328125, 1.68878173828125, 1.8302001953125, 1.97161865234375, 2.113037109375, 2.25445556640625, 2.3958740234375, 2.53729248046875, 2.6787109375, 2.82012939453125, 2.9615478515625, 3.10296630859375, 3.244384765625, 3.38580322265625, 3.5272216796875, 3.66864013671875, 3.81005859375, 3.95147705078125, 4.0928955078125, 4.23431396484375, 4.375732421875, 4.51715087890625, 4.6585693359375, 4.79998779296875, 4.94140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 3.0, 3.0, 7.0, 12.0, 16.0, 13.0, 14.0, 26.0, 20.0, 31.0, 44.0, 77.0, 112.0, 208.0, 382.0, 1068.0, 4483.0, 36113.0, 602194.0, 2946071.0, 564121.0, 33467.0, 3980.0, 921.0, 351.0, 171.0, 112.0, 53.0, 40.0, 33.0, 12.0, 28.0, 11.0, 11.0, 12.0, 18.0, 4.0, 6.0, 7.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.203125, -12.75537109375, -12.3076171875, -11.85986328125, -11.412109375, -10.96435546875, -10.5166015625, -10.06884765625, -9.62109375, -9.17333984375, -8.7255859375, -8.27783203125, -7.830078125, -7.38232421875, -6.9345703125, -6.48681640625, -6.0390625, -5.59130859375, -5.1435546875, -4.69580078125, -4.248046875, -3.80029296875, -3.3525390625, -2.90478515625, -2.45703125, -2.00927734375, -1.5615234375, -1.11376953125, -0.666015625, -0.21826171875, 0.2294921875, 0.67724609375, 1.125, 1.57275390625, 2.0205078125, 2.46826171875, 2.916015625, 3.36376953125, 3.8115234375, 4.25927734375, 4.70703125, 5.15478515625, 5.6025390625, 6.05029296875, 6.498046875, 6.94580078125, 7.3935546875, 7.84130859375, 8.2890625, 8.73681640625, 9.1845703125, 9.63232421875, 10.080078125, 10.52783203125, 10.9755859375, 11.42333984375, 11.87109375, 12.31884765625, 12.7666015625, 13.21435546875, 13.662109375, 14.10986328125, 14.5576171875, 15.00537109375, 15.453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 8.0, 6.0, 6.0, 9.0, 17.0, 17.0, 28.0, 29.0, 42.0, 47.0, 86.0, 109.0, 160.0, 181.0, 276.0, 340.0, 388.0, 418.0, 417.0, 348.0, 279.0, 222.0, 161.0, 121.0, 92.0, 84.0, 54.0, 40.0, 29.0, 25.0, 11.0, 14.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.390625, -11.08843994140625, -10.7862548828125, -10.48406982421875, -10.181884765625, -9.87969970703125, -9.5775146484375, -9.27532958984375, -8.97314453125, -8.67095947265625, -8.3687744140625, -8.06658935546875, -7.764404296875, -7.46221923828125, -7.1600341796875, -6.85784912109375, -6.5556640625, -6.25347900390625, -5.9512939453125, -5.64910888671875, -5.346923828125, -5.04473876953125, -4.7425537109375, -4.44036865234375, -4.13818359375, -3.83599853515625, -3.5338134765625, -3.23162841796875, -2.929443359375, -2.62725830078125, -2.3250732421875, -2.02288818359375, -1.720703125, -1.41851806640625, -1.1163330078125, -0.81414794921875, -0.511962890625, -0.20977783203125, 0.0924072265625, 0.39459228515625, 0.69677734375, 0.99896240234375, 1.3011474609375, 1.60333251953125, 1.905517578125, 2.20770263671875, 2.5098876953125, 2.81207275390625, 3.1142578125, 3.41644287109375, 3.7186279296875, 4.02081298828125, 4.322998046875, 4.62518310546875, 4.9273681640625, 5.22955322265625, 5.53173828125, 5.83392333984375, 6.1361083984375, 6.43829345703125, 6.740478515625, 7.04266357421875, 7.3448486328125, 7.64703369140625, 7.94921875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 20.0, 31.0, 24.0, 55.0, 63.0, 79.0, 141.0, 202.0, 369.0, 831.0, 2928.0, 21662.0, 352088.0, 3119967.0, 653585.0, 35902.0, 4166.0, 1017.0, 454.0, 242.0, 151.0, 77.0, 63.0, 44.0, 29.0, 25.0, 20.0, 8.0, 10.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.26318359375, -16.5888671875, -15.91455078125, -15.240234375, -14.56591796875, -13.8916015625, -13.21728515625, -12.54296875, -11.86865234375, -11.1943359375, -10.52001953125, -9.845703125, -9.17138671875, -8.4970703125, -7.82275390625, -7.1484375, -6.47412109375, -5.7998046875, -5.12548828125, -4.451171875, -3.77685546875, -3.1025390625, -2.42822265625, -1.75390625, -1.07958984375, -0.4052734375, 0.26904296875, 0.943359375, 1.61767578125, 2.2919921875, 2.96630859375, 3.640625, 4.31494140625, 4.9892578125, 5.66357421875, 6.337890625, 7.01220703125, 7.6865234375, 8.36083984375, 9.03515625, 9.70947265625, 10.3837890625, 11.05810546875, 11.732421875, 12.40673828125, 13.0810546875, 13.75537109375, 14.4296875, 15.10400390625, 15.7783203125, 16.45263671875, 17.126953125, 17.80126953125, 18.4755859375, 19.14990234375, 19.82421875, 20.49853515625, 21.1728515625, 21.84716796875, 22.521484375, 23.19580078125, 23.8701171875, 24.54443359375, 25.21875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 23.0, 48.0, 91.0, 124.0, 146.0, 183.0, 149.0, 94.0, 71.0, 32.0, 21.0, 12.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.71366119384766, -92.24703979492188, -89.78041076660156, -87.31378936767578, -84.84716033935547, -82.38053894042969, -79.91390991210938, -77.4472885131836, -74.98065948486328, -72.5140380859375, -70.04740905761719, -67.5807876586914, -65.1141586303711, -62.64753341674805, -60.180908203125, -57.71428680419922, -55.24766159057617, -52.781036376953125, -50.31441116333008, -47.84778594970703, -45.381160736083984, -42.91453552246094, -40.447914123535156, -37.981285095214844, -35.51466369628906, -33.048038482666016, -30.58141326904297, -28.114788055419922, -25.648162841796875, -23.181537628173828, -20.714914321899414, -18.248289108276367, -15.781665802001953, -13.315040588378906, -10.84841537475586, -8.381791114807129, -5.915165901184082, -3.448540687561035, -0.9819164276123047, 1.4847087860107422, 3.951333999633789, 6.417959213256836, 8.884584426879883, 11.351208686828613, 13.81783390045166, 16.28445816040039, 18.751083374023438, 21.217708587646484, 23.68433380126953, 26.150959014892578, 28.617584228515625, 31.084209442138672, 33.55083465576172, 36.017459869384766, 38.48408508300781, 40.950706481933594, 43.417335510253906, 45.88396072387695, 48.3505859375, 50.81721115112305, 53.283836364746094, 55.75046157836914, 58.21708679199219, 60.68370819091797, 63.150333404541016]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 5.0, 10.0, 13.0, 7.0, 15.0, 21.0, 16.0, 19.0, 15.0, 16.0, 22.0, 29.0, 44.0, 31.0, 33.0, 34.0, 31.0, 39.0, 39.0, 34.0, 42.0, 38.0, 47.0, 29.0, 28.0, 38.0, 28.0, 30.0, 26.0, 27.0, 24.0, 21.0, 23.0, 24.0, 13.0, 16.0, 11.0, 13.0, 11.0, 10.0, 5.0, 3.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.55217933654785, -28.636825561523438, -27.721473693847656, -26.806119918823242, -25.89076805114746, -24.975414276123047, -24.060062408447266, -23.14470863342285, -22.229354858398438, -21.314001083374023, -20.398649215698242, -19.483295440673828, -18.567943572998047, -17.652589797973633, -16.73723602294922, -15.821884155273438, -14.906532287597656, -13.991179466247559, -13.075826644897461, -12.160472869873047, -11.245121002197266, -10.329767227172852, -9.414414405822754, -8.499061584472656, -7.583708763122559, -6.668355941772461, -5.753003120422363, -4.837649822235107, -3.9222970008850098, -3.006944179534912, -2.0915908813476562, -1.1762380599975586, -0.26088714599609375, 0.6544657945632935, 1.5698187351226807, 2.4851717948913574, 3.400524616241455, 4.315877437591553, 5.231230735778809, 6.146583557128906, 7.061936378479004, 7.977289199829102, 8.8926420211792, 9.807994842529297, 10.723348617553711, 11.638700485229492, 12.554054260253906, 13.469407081604004, 14.384759902954102, 15.3001127243042, 16.215465545654297, 17.13081932067871, 18.046171188354492, 18.961524963378906, 19.876876831054688, 20.7922306060791, 21.707584381103516, 22.62293815612793, 23.53829002380371, 24.453643798828125, 25.368995666503906, 26.28434944152832, 27.199703216552734, 28.115055084228516, 29.030406951904297]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 11.0, 6.0, 10.0, 9.0, 16.0, 19.0, 21.0, 27.0, 17.0, 21.0, 28.0, 42.0, 34.0, 40.0, 47.0, 39.0, 37.0, 50.0, 39.0, 42.0, 38.0, 38.0, 37.0, 43.0, 28.0, 28.0, 21.0, 36.0, 29.0, 22.0, 25.0, 19.0, 14.0, 10.0, 7.0, 6.0, 5.0, 6.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.125, -3.98553466796875, -3.8460693359375, -3.70660400390625, -3.567138671875, -3.42767333984375, -3.2882080078125, -3.14874267578125, -3.00927734375, -2.86981201171875, -2.7303466796875, -2.59088134765625, -2.451416015625, -2.31195068359375, -2.1724853515625, -2.03302001953125, -1.8935546875, -1.75408935546875, -1.6146240234375, -1.47515869140625, -1.335693359375, -1.19622802734375, -1.0567626953125, -0.91729736328125, -0.77783203125, -0.63836669921875, -0.4989013671875, -0.35943603515625, -0.219970703125, -0.08050537109375, 0.0589599609375, 0.19842529296875, 0.337890625, 0.47735595703125, 0.6168212890625, 0.75628662109375, 0.895751953125, 1.03521728515625, 1.1746826171875, 1.31414794921875, 1.45361328125, 1.59307861328125, 1.7325439453125, 1.87200927734375, 2.011474609375, 2.15093994140625, 2.2904052734375, 2.42987060546875, 2.5693359375, 2.70880126953125, 2.8482666015625, 2.98773193359375, 3.127197265625, 3.26666259765625, 3.4061279296875, 3.54559326171875, 3.68505859375, 3.82452392578125, 3.9639892578125, 4.10345458984375, 4.242919921875, 4.38238525390625, 4.5218505859375, 4.66131591796875, 4.80078125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 7.0, 11.0, 15.0, 18.0, 24.0, 41.0, 51.0, 72.0, 100.0, 158.0, 204.0, 357.0, 487.0, 670.0, 1055.0, 1540.0, 2284.0, 3547.0, 5399.0, 8173.0, 13047.0, 20389.0, 31798.0, 49742.0, 76778.0, 110215.0, 143828.0, 155242.0, 134861.0, 99298.0, 66878.0, 43853.0, 27950.0, 17758.0, 11383.0, 7131.0, 4626.0, 3145.0, 2093.0, 1343.0, 960.0, 643.0, 425.0, 298.0, 190.0, 146.0, 81.0, 75.0, 69.0, 29.0, 32.0, 23.0, 4.0, 8.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6337890625, -0.6135711669921875, -0.593353271484375, -0.5731353759765625, -0.55291748046875, -0.5326995849609375, -0.512481689453125, -0.4922637939453125, -0.4720458984375, -0.4518280029296875, -0.431610107421875, -0.4113922119140625, -0.39117431640625, -0.3709564208984375, -0.350738525390625, -0.3305206298828125, -0.310302734375, -0.2900848388671875, -0.269866943359375, -0.2496490478515625, -0.22943115234375, -0.2092132568359375, -0.188995361328125, -0.1687774658203125, -0.1485595703125, -0.1283416748046875, -0.108123779296875, -0.0879058837890625, -0.06768798828125, -0.0474700927734375, -0.027252197265625, -0.0070343017578125, 0.01318359375, 0.0334014892578125, 0.053619384765625, 0.0738372802734375, 0.09405517578125, 0.1142730712890625, 0.134490966796875, 0.1547088623046875, 0.1749267578125, 0.1951446533203125, 0.215362548828125, 0.2355804443359375, 0.25579833984375, 0.2760162353515625, 0.296234130859375, 0.3164520263671875, 0.336669921875, 0.3568878173828125, 0.377105712890625, 0.3973236083984375, 0.41754150390625, 0.4377593994140625, 0.457977294921875, 0.4781951904296875, 0.4984130859375, 0.5186309814453125, 0.538848876953125, 0.5590667724609375, 0.57928466796875, 0.5995025634765625, 0.619720458984375, 0.6399383544921875, 0.66015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 7.0, 6.0, 5.0, 5.0, 8.0, 13.0, 15.0, 13.0, 13.0, 15.0, 26.0, 25.0, 15.0, 26.0, 32.0, 32.0, 29.0, 41.0, 46.0, 38.0, 42.0, 30.0, 1060.0, 45.0, 31.0, 40.0, 47.0, 33.0, 37.0, 27.0, 27.0, 29.0, 23.0, 20.0, 19.0, 21.0, 21.0, 15.0, 7.0, 7.0, 6.0, 10.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.861328125, -2.766357421875, -2.67138671875, -2.576416015625, -2.4814453125, -2.386474609375, -2.29150390625, -2.196533203125, -2.1015625, -2.006591796875, -1.91162109375, -1.816650390625, -1.7216796875, -1.626708984375, -1.53173828125, -1.436767578125, -1.341796875, -1.246826171875, -1.15185546875, -1.056884765625, -0.9619140625, -0.866943359375, -0.77197265625, -0.677001953125, -0.58203125, -0.487060546875, -0.39208984375, -0.297119140625, -0.2021484375, -0.107177734375, -0.01220703125, 0.082763671875, 0.177734375, 0.272705078125, 0.36767578125, 0.462646484375, 0.5576171875, 0.652587890625, 0.74755859375, 0.842529296875, 0.9375, 1.032470703125, 1.12744140625, 1.222412109375, 1.3173828125, 1.412353515625, 1.50732421875, 1.602294921875, 1.697265625, 1.792236328125, 1.88720703125, 1.982177734375, 2.0771484375, 2.172119140625, 2.26708984375, 2.362060546875, 2.45703125, 2.552001953125, 2.64697265625, 2.741943359375, 2.8369140625, 2.931884765625, 3.02685546875, 3.121826171875, 3.216796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 9.0, 13.0, 19.0, 27.0, 42.0, 52.0, 94.0, 145.0, 195.0, 301.0, 534.0, 698.0, 1072.0, 1738.0, 2502.0, 3954.0, 6240.0, 9513.0, 14913.0, 24231.0, 38826.0, 61024.0, 93488.0, 134607.0, 1149179.0, 213386.0, 119118.0, 80493.0, 52001.0, 32791.0, 20176.0, 12605.0, 8192.0, 5220.0, 3335.0, 2239.0, 1395.0, 954.0, 619.0, 415.0, 257.0, 183.0, 101.0, 64.0, 57.0, 43.0, 25.0, 19.0, 11.0, 5.0, 6.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.345703125, -0.3337059020996094, -0.32170867919921875, -0.3097114562988281, -0.2977142333984375, -0.2857170104980469, -0.27371978759765625, -0.2617225646972656, -0.249725341796875, -0.23772811889648438, -0.22573089599609375, -0.21373367309570312, -0.2017364501953125, -0.18973922729492188, -0.17774200439453125, -0.16574478149414062, -0.15374755859375, -0.14175033569335938, -0.12975311279296875, -0.11775588989257812, -0.1057586669921875, -0.09376144409179688, -0.08176422119140625, -0.06976699829101562, -0.057769775390625, -0.045772552490234375, -0.03377532958984375, -0.021778106689453125, -0.0097808837890625, 0.002216339111328125, 0.01421356201171875, 0.026210784912109375, 0.0382080078125, 0.050205230712890625, 0.06220245361328125, 0.07419967651367188, 0.0861968994140625, 0.09819412231445312, 0.11019134521484375, 0.12218856811523438, 0.134185791015625, 0.14618301391601562, 0.15818023681640625, 0.17017745971679688, 0.1821746826171875, 0.19417190551757812, 0.20616912841796875, 0.21816635131835938, 0.23016357421875, 0.24216079711914062, 0.25415802001953125, 0.2661552429199219, 0.2781524658203125, 0.2901496887207031, 0.30214691162109375, 0.3141441345214844, 0.326141357421875, 0.3381385803222656, 0.35013580322265625, 0.3621330261230469, 0.3741302490234375, 0.3861274719238281, 0.39812469482421875, 0.4101219177246094, 0.422119140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 11.0, 15.0, 16.0, 30.0, 23.0, 32.0, 46.0, 66.0, 68.0, 80.0, 97.0, 99.0, 86.0, 75.0, 51.0, 48.0, 42.0, 29.0, 16.0, 13.0, 13.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031494140625, -0.030615806579589844, -0.029737472534179688, -0.02885913848876953, -0.027980804443359375, -0.02710247039794922, -0.026224136352539062, -0.025345802307128906, -0.02446746826171875, -0.023589134216308594, -0.022710800170898438, -0.02183246612548828, -0.020954132080078125, -0.02007579803466797, -0.019197463989257812, -0.018319129943847656, -0.0174407958984375, -0.016562461853027344, -0.015684127807617188, -0.014805793762207031, -0.013927459716796875, -0.013049125671386719, -0.012170791625976562, -0.011292457580566406, -0.01041412353515625, -0.009535789489746094, -0.008657455444335938, -0.007779121398925781, -0.006900787353515625, -0.006022453308105469, -0.0051441192626953125, -0.004265785217285156, -0.003387451171875, -0.0025091171264648438, -0.0016307830810546875, -0.0007524490356445312, 0.000125885009765625, 0.0010042190551757812, 0.0018825531005859375, 0.0027608871459960938, 0.00363922119140625, 0.004517555236816406, 0.0053958892822265625, 0.006274223327636719, 0.007152557373046875, 0.008030891418457031, 0.008909225463867188, 0.009787559509277344, 0.0106658935546875, 0.011544227600097656, 0.012422561645507812, 0.013300895690917969, 0.014179229736328125, 0.015057563781738281, 0.015935897827148438, 0.016814231872558594, 0.01769256591796875, 0.018570899963378906, 0.019449234008789062, 0.02032756805419922, 0.021205902099609375, 0.02208423614501953, 0.022962570190429688, 0.023840904235839844, 0.02471923828125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 14.0, 19.0, 16.0, 27.0, 61.0, 101.0, 124.0, 327.0, 794.0, 59426.0, 985601.0, 1197.0, 366.0, 184.0, 88.0, 57.0, 39.0, 29.0, 23.0, 12.0, 9.0, 0.0, 7.0, 2.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499755859375, -0.4819908142089844, -0.46422576904296875, -0.4464607238769531, -0.4286956787109375, -0.4109306335449219, -0.39316558837890625, -0.3754005432128906, -0.357635498046875, -0.3398704528808594, -0.32210540771484375, -0.3043403625488281, -0.2865753173828125, -0.2688102722167969, -0.25104522705078125, -0.23328018188476562, -0.21551513671875, -0.19775009155273438, -0.17998504638671875, -0.16222000122070312, -0.1444549560546875, -0.12668991088867188, -0.10892486572265625, -0.09115982055664062, -0.073394775390625, -0.055629730224609375, -0.03786468505859375, -0.020099639892578125, -0.0023345947265625, 0.015430450439453125, 0.03319549560546875, 0.050960540771484375, 0.0687255859375, 0.08649063110351562, 0.10425567626953125, 0.12202072143554688, 0.1397857666015625, 0.15755081176757812, 0.17531585693359375, 0.19308090209960938, 0.210845947265625, 0.22861099243164062, 0.24637603759765625, 0.2641410827636719, 0.2819061279296875, 0.2996711730957031, 0.31743621826171875, 0.3352012634277344, 0.35296630859375, 0.3707313537597656, 0.38849639892578125, 0.4062614440917969, 0.4240264892578125, 0.4417915344238281, 0.45955657958984375, 0.4773216247558594, 0.495086669921875, 0.5128517150878906, 0.5306167602539062, 0.5483818054199219, 0.5661468505859375, 0.5839118957519531, 0.6016769409179688, 0.6194419860839844, 0.63720703125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 17.0, 160.0, 802.0, 29.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24430254101753235, -0.23839910328388214, -0.23249565064907074, -0.22659221291542053, -0.22068876028060913, -0.21478532254695892, -0.20888188481330872, -0.20297843217849731, -0.1970749795436859, -0.1911715418100357, -0.1852680891752243, -0.1793646514415741, -0.1734611988067627, -0.1675577610731125, -0.16165432333946228, -0.15575087070465088, -0.14984743297100067, -0.14394399523735046, -0.13804054260253906, -0.13213710486888885, -0.12623365223407745, -0.12033021450042725, -0.11442676931619644, -0.10852332413196564, -0.10261987894773483, -0.09671643376350403, -0.09081298857927322, -0.08490954339504242, -0.07900610566139221, -0.07310265302658081, -0.0671992152929306, -0.0612957701086998, -0.05539233982563019, -0.049488894641399384, -0.04358544945716858, -0.03768200799822807, -0.03177856281399727, -0.025875117629766464, -0.019971676170825958, -0.014068230986595154, -0.00816478580236435, -0.0022613415494561195, 0.0036421027034521103, 0.009545546025037766, 0.01544899120926857, 0.021352436393499374, 0.02725587785243988, 0.033159323036670685, 0.03906276822090149, 0.044966213405132294, 0.0508696585893631, 0.056773100048303604, 0.06267654895782471, 0.06857998669147491, 0.07448343187570572, 0.08038687705993652, 0.08629032224416733, 0.09219376742839813, 0.09809721261262894, 0.10400065779685974, 0.10990409553050995, 0.11580754816532135, 0.12171098589897156, 0.12761443853378296, 0.13351787626743317]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 10.0, 7.0, 4.0, 10.0, 9.0, 13.0, 7.0, 14.0, 22.0, 17.0, 21.0, 21.0, 19.0, 24.0, 23.0, 35.0, 21.0, 29.0, 36.0, 29.0, 39.0, 33.0, 33.0, 36.0, 34.0, 28.0, 31.0, 33.0, 35.0, 36.0, 34.0, 30.0, 14.0, 28.0, 21.0, 21.0, 26.0, 14.0, 15.0, 11.0, 14.0, 12.0, 10.0, 8.0, 2.0, 8.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.022610485553741455, -0.02184230647981167, -0.02107412740588188, -0.020305948331952095, -0.01953776925802231, -0.01876959018409252, -0.018001411110162735, -0.01723323203623295, -0.01646505296230316, -0.015696873888373375, -0.014928694814443588, -0.014160515740513802, -0.013392336666584015, -0.012624157592654228, -0.011855978518724442, -0.011087799444794655, -0.010319620370864868, -0.009551441296935081, -0.008783262223005295, -0.008015083149075508, -0.0072469040751457214, -0.006478725001215935, -0.005710545927286148, -0.004942366853356361, -0.004174187779426575, -0.003406008705496788, -0.0026378296315670013, -0.0018696505576372147, -0.001101471483707428, -0.0003332924097776413, 0.0004348866641521454, 0.001203065738081932, 0.0019712448120117188, 0.0027394238859415054, 0.003507602959871292, 0.004275782033801079, 0.0050439611077308655, 0.005812140181660652, 0.006580319255590439, 0.0073484983295202255, 0.008116677403450012, 0.008884856477379799, 0.009653035551309586, 0.010421214625239372, 0.011189393699169159, 0.011957572773098946, 0.012725751847028732, 0.013493930920958519, 0.014262109994888306, 0.015030289068818092, 0.01579846814274788, 0.016566647216677666, 0.017334826290607452, 0.01810300536453724, 0.018871184438467026, 0.019639363512396812, 0.0204075425863266, 0.021175721660256386, 0.021943900734186172, 0.02271207980811596, 0.023480258882045746, 0.024248437955975533, 0.02501661702990532, 0.025784796103835106, 0.026552975177764893]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 11.0, 6.0, 10.0, 9.0, 16.0, 19.0, 20.0, 28.0, 17.0, 21.0, 28.0, 42.0, 34.0, 40.0, 47.0, 39.0, 37.0, 52.0, 37.0, 42.0, 38.0, 38.0, 37.0, 42.0, 29.0, 28.0, 21.0, 36.0, 29.0, 22.0, 25.0, 19.0, 14.0, 10.0, 7.0, 6.0, 5.0, 6.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.125, -3.98553466796875, -3.8460693359375, -3.70660400390625, -3.567138671875, -3.42767333984375, -3.2882080078125, -3.14874267578125, -3.00927734375, -2.86981201171875, -2.7303466796875, -2.59088134765625, -2.451416015625, -2.31195068359375, -2.1724853515625, -2.03302001953125, -1.8935546875, -1.75408935546875, -1.6146240234375, -1.47515869140625, -1.335693359375, -1.19622802734375, -1.0567626953125, -0.91729736328125, -0.77783203125, -0.63836669921875, -0.4989013671875, -0.35943603515625, -0.219970703125, -0.08050537109375, 0.0589599609375, 0.19842529296875, 0.337890625, 0.47735595703125, 0.6168212890625, 0.75628662109375, 0.895751953125, 1.03521728515625, 1.1746826171875, 1.31414794921875, 1.45361328125, 1.59307861328125, 1.7325439453125, 1.87200927734375, 2.011474609375, 2.15093994140625, 2.2904052734375, 2.42987060546875, 2.5693359375, 2.70880126953125, 2.8482666015625, 2.98773193359375, 3.127197265625, 3.26666259765625, 3.4061279296875, 3.54559326171875, 3.68505859375, 3.82452392578125, 3.9639892578125, 4.10345458984375, 4.242919921875, 4.38238525390625, 4.5218505859375, 4.66131591796875, 4.80078125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 1.0, 4.0, 10.0, 5.0, 6.0, 13.0, 14.0, 25.0, 23.0, 56.0, 75.0, 146.0, 290.0, 601.0, 1273.0, 2743.0, 5924.0, 12668.0, 26129.0, 55736.0, 116817.0, 236775.0, 292795.0, 154903.0, 74541.0, 35190.0, 16617.0, 8007.0, 3666.0, 1764.0, 840.0, 391.0, 214.0, 91.0, 80.0, 28.0, 26.0, 14.0, 12.0, 9.0, 6.0, 1.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.16796875, -4.02520751953125, -3.8824462890625, -3.73968505859375, -3.596923828125, -3.45416259765625, -3.3114013671875, -3.16864013671875, -3.02587890625, -2.88311767578125, -2.7403564453125, -2.59759521484375, -2.454833984375, -2.31207275390625, -2.1693115234375, -2.02655029296875, -1.8837890625, -1.74102783203125, -1.5982666015625, -1.45550537109375, -1.312744140625, -1.16998291015625, -1.0272216796875, -0.88446044921875, -0.74169921875, -0.59893798828125, -0.4561767578125, -0.31341552734375, -0.170654296875, -0.02789306640625, 0.1148681640625, 0.25762939453125, 0.400390625, 0.54315185546875, 0.6859130859375, 0.82867431640625, 0.971435546875, 1.11419677734375, 1.2569580078125, 1.39971923828125, 1.54248046875, 1.68524169921875, 1.8280029296875, 1.97076416015625, 2.113525390625, 2.25628662109375, 2.3990478515625, 2.54180908203125, 2.6845703125, 2.82733154296875, 2.9700927734375, 3.11285400390625, 3.255615234375, 3.39837646484375, 3.5411376953125, 3.68389892578125, 3.82666015625, 3.96942138671875, 4.1121826171875, 4.25494384765625, 4.397705078125, 4.54046630859375, 4.6832275390625, 4.82598876953125, 4.96875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 8.0, 3.0, 8.0, 8.0, 17.0, 12.0, 12.0, 10.0, 22.0, 17.0, 30.0, 32.0, 31.0, 35.0, 46.0, 48.0, 58.0, 86.0, 182.0, 1393.0, 342.0, 152.0, 76.0, 66.0, 51.0, 36.0, 38.0, 35.0, 33.0, 25.0, 28.0, 18.0, 24.0, 15.0, 11.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.375, -13.89306640625, -13.4111328125, -12.92919921875, -12.447265625, -11.96533203125, -11.4833984375, -11.00146484375, -10.51953125, -10.03759765625, -9.5556640625, -9.07373046875, -8.591796875, -8.10986328125, -7.6279296875, -7.14599609375, -6.6640625, -6.18212890625, -5.7001953125, -5.21826171875, -4.736328125, -4.25439453125, -3.7724609375, -3.29052734375, -2.80859375, -2.32666015625, -1.8447265625, -1.36279296875, -0.880859375, -0.39892578125, 0.0830078125, 0.56494140625, 1.046875, 1.52880859375, 2.0107421875, 2.49267578125, 2.974609375, 3.45654296875, 3.9384765625, 4.42041015625, 4.90234375, 5.38427734375, 5.8662109375, 6.34814453125, 6.830078125, 7.31201171875, 7.7939453125, 8.27587890625, 8.7578125, 9.23974609375, 9.7216796875, 10.20361328125, 10.685546875, 11.16748046875, 11.6494140625, 12.13134765625, 12.61328125, 13.09521484375, 13.5771484375, 14.05908203125, 14.541015625, 15.02294921875, 15.5048828125, 15.98681640625, 16.46875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 12.0, 14.0, 13.0, 25.0, 20.0, 21.0, 43.0, 35.0, 50.0, 65.0, 75.0, 92.0, 124.0, 181.0, 309.0, 390.0, 931.0, 5418.0, 575484.0, 2544596.0, 14943.0, 1291.0, 464.0, 288.0, 180.0, 124.0, 111.0, 69.0, 68.0, 49.0, 42.0, 40.0, 27.0, 25.0, 17.0, 13.0, 13.0, 12.0, 7.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -34.2783203125, -33.244140625, -32.2099609375, -31.17578125, -30.1416015625, -29.107421875, -28.0732421875, -27.0390625, -26.0048828125, -24.970703125, -23.9365234375, -22.90234375, -21.8681640625, -20.833984375, -19.7998046875, -18.765625, -17.7314453125, -16.697265625, -15.6630859375, -14.62890625, -13.5947265625, -12.560546875, -11.5263671875, -10.4921875, -9.4580078125, -8.423828125, -7.3896484375, -6.35546875, -5.3212890625, -4.287109375, -3.2529296875, -2.21875, -1.1845703125, -0.150390625, 0.8837890625, 1.91796875, 2.9521484375, 3.986328125, 5.0205078125, 6.0546875, 7.0888671875, 8.123046875, 9.1572265625, 10.19140625, 11.2255859375, 12.259765625, 13.2939453125, 14.328125, 15.3623046875, 16.396484375, 17.4306640625, 18.46484375, 19.4990234375, 20.533203125, 21.5673828125, 22.6015625, 23.6357421875, 24.669921875, 25.7041015625, 26.73828125, 27.7724609375, 28.806640625, 29.8408203125, 30.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 41.0, 69.0, 105.0, 152.0, 163.0, 191.0, 134.0, 79.0, 36.0, 19.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.75235366821289, -46.520484924316406, -45.28861618041992, -44.05674743652344, -42.82487869262695, -41.59300994873047, -40.361141204833984, -39.1292724609375, -37.89739990234375, -36.665531158447266, -35.43366241455078, -34.2017936706543, -32.96992492675781, -31.738056182861328, -30.50618553161621, -29.274316787719727, -28.042449951171875, -26.81058120727539, -25.578712463378906, -24.346843719482422, -23.114974975585938, -21.883106231689453, -20.651235580444336, -19.41936683654785, -18.187498092651367, -16.955629348754883, -15.723760604858398, -14.491890907287598, -13.260022163391113, -12.028153419494629, -10.796283721923828, -9.564414978027344, -8.332550048828125, -7.100681304931641, -5.868812084197998, -4.6369428634643555, -3.405074119567871, -2.1732053756713867, -0.9413361549377441, 0.29053306579589844, 1.5224018096923828, 2.7542707920074463, 3.9861397743225098, 5.218008995056152, 6.449877738952637, 7.681746482849121, 8.913616180419922, 10.145484924316406, 11.37735366821289, 12.609222412109375, 13.84109115600586, 15.07296085357666, 16.304828643798828, 17.536697387695312, 18.76856803894043, 20.000436782836914, 21.2323055267334, 22.464174270629883, 23.696043014526367, 24.92791175842285, 26.15978240966797, 27.391651153564453, 28.623519897460938, 29.855388641357422, 31.087257385253906]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 9.0, 3.0, 7.0, 8.0, 5.0, 18.0, 24.0, 31.0, 11.0, 20.0, 26.0, 37.0, 31.0, 29.0, 43.0, 27.0, 38.0, 52.0, 41.0, 43.0, 52.0, 43.0, 55.0, 44.0, 36.0, 39.0, 31.0, 24.0, 32.0, 25.0, 19.0, 17.0, 12.0, 14.0, 15.0, 9.0, 8.0, 9.0, 8.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.419464111328125, -44.99747085571289, -43.575477600097656, -42.15348815917969, -40.73149490356445, -39.30950164794922, -37.88751220703125, -36.465518951416016, -35.04352569580078, -33.62153244018555, -32.19953918457031, -30.777549743652344, -29.35555648803711, -27.933563232421875, -26.511571884155273, -25.089580535888672, -23.667587280273438, -22.245594024658203, -20.8236026763916, -19.401611328125, -17.979618072509766, -16.55762481689453, -15.13563346862793, -13.713641166687012, -12.291648864746094, -10.869656562805176, -9.447664260864258, -8.02567195892334, -6.603679656982422, -5.181687355041504, -3.759695053100586, -2.337702751159668, -0.9157066345214844, 0.5062856674194336, 1.9282779693603516, 3.3502702713012695, 4.7722625732421875, 6.1942548751831055, 7.616247177124023, 9.038239479064941, 10.46023178100586, 11.882224082946777, 13.304216384887695, 14.726208686828613, 16.14820098876953, 17.570194244384766, 18.992185592651367, 20.41417694091797, 21.836170196533203, 23.258163452148438, 24.68015480041504, 26.10214614868164, 27.524139404296875, 28.94613265991211, 30.36812400817871, 31.790115356445312, 33.21210861206055, 34.63410186767578, 36.05609130859375, 37.478084564208984, 38.90007781982422, 40.32207107543945, 41.74406433105469, 43.166053771972656, 44.58804702758789]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 2.0, 7.0, 7.0, 5.0, 10.0, 12.0, 14.0, 10.0, 18.0, 19.0, 19.0, 18.0, 22.0, 46.0, 25.0, 30.0, 44.0, 37.0, 41.0, 32.0, 41.0, 48.0, 43.0, 39.0, 34.0, 48.0, 33.0, 26.0, 30.0, 35.0, 29.0, 25.0, 27.0, 27.0, 17.0, 20.0, 11.0, 13.0, 7.0, 6.0, 4.0, 6.0, 9.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.04217529296875, -3.8929443359375, -3.74371337890625, -3.594482421875, -3.44525146484375, -3.2960205078125, -3.14678955078125, -2.99755859375, -2.84832763671875, -2.6990966796875, -2.54986572265625, -2.400634765625, -2.25140380859375, -2.1021728515625, -1.95294189453125, -1.8037109375, -1.65447998046875, -1.5052490234375, -1.35601806640625, -1.206787109375, -1.05755615234375, -0.9083251953125, -0.75909423828125, -0.60986328125, -0.46063232421875, -0.3114013671875, -0.16217041015625, -0.012939453125, 0.13629150390625, 0.2855224609375, 0.43475341796875, 0.583984375, 0.73321533203125, 0.8824462890625, 1.03167724609375, 1.180908203125, 1.33013916015625, 1.4793701171875, 1.62860107421875, 1.77783203125, 1.92706298828125, 2.0762939453125, 2.22552490234375, 2.374755859375, 2.52398681640625, 2.6732177734375, 2.82244873046875, 2.9716796875, 3.12091064453125, 3.2701416015625, 3.41937255859375, 3.568603515625, 3.71783447265625, 3.8670654296875, 4.01629638671875, 4.16552734375, 4.31475830078125, 4.4639892578125, 4.61322021484375, 4.762451171875, 4.91168212890625, 5.0609130859375, 5.21014404296875, 5.359375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 10.0, 4.0, 10.0, 15.0, 18.0, 23.0, 27.0, 25.0, 45.0, 41.0, 69.0, 121.0, 231.0, 455.0, 1277.0, 4565.0, 28336.0, 313541.0, 2259138.0, 1432515.0, 135264.0, 14280.0, 2702.0, 786.0, 315.0, 149.0, 78.0, 45.0, 36.0, 30.0, 17.0, 21.0, 12.0, 17.0, 9.0, 8.0, 11.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.3343505859375, -9.934326171875, -9.5343017578125, -9.13427734375, -8.7342529296875, -8.334228515625, -7.9342041015625, -7.5341796875, -7.1341552734375, -6.734130859375, -6.3341064453125, -5.93408203125, -5.5340576171875, -5.134033203125, -4.7340087890625, -4.333984375, -3.9339599609375, -3.533935546875, -3.1339111328125, -2.73388671875, -2.3338623046875, -1.933837890625, -1.5338134765625, -1.1337890625, -0.7337646484375, -0.333740234375, 0.0662841796875, 0.46630859375, 0.8663330078125, 1.266357421875, 1.6663818359375, 2.06640625, 2.4664306640625, 2.866455078125, 3.2664794921875, 3.66650390625, 4.0665283203125, 4.466552734375, 4.8665771484375, 5.2666015625, 5.6666259765625, 6.066650390625, 6.4666748046875, 6.86669921875, 7.2667236328125, 7.666748046875, 8.0667724609375, 8.466796875, 8.8668212890625, 9.266845703125, 9.6668701171875, 10.06689453125, 10.4669189453125, 10.866943359375, 11.2669677734375, 11.6669921875, 12.0670166015625, 12.467041015625, 12.8670654296875, 13.26708984375, 13.6671142578125, 14.067138671875, 14.4671630859375, 14.8671875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 7.0, 6.0, 14.0, 22.0, 23.0, 38.0, 52.0, 88.0, 141.0, 185.0, 290.0, 370.0, 481.0, 516.0, 509.0, 391.0, 291.0, 197.0, 155.0, 101.0, 66.0, 47.0, 29.0, 17.0, 14.0, 5.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.479736328125, -9.07666015625, -8.673583984375, -8.2705078125, -7.867431640625, -7.46435546875, -7.061279296875, -6.658203125, -6.255126953125, -5.85205078125, -5.448974609375, -5.0458984375, -4.642822265625, -4.23974609375, -3.836669921875, -3.43359375, -3.030517578125, -2.62744140625, -2.224365234375, -1.8212890625, -1.418212890625, -1.01513671875, -0.612060546875, -0.208984375, 0.194091796875, 0.59716796875, 1.000244140625, 1.4033203125, 1.806396484375, 2.20947265625, 2.612548828125, 3.015625, 3.418701171875, 3.82177734375, 4.224853515625, 4.6279296875, 5.031005859375, 5.43408203125, 5.837158203125, 6.240234375, 6.643310546875, 7.04638671875, 7.449462890625, 7.8525390625, 8.255615234375, 8.65869140625, 9.061767578125, 9.46484375, 9.867919921875, 10.27099609375, 10.674072265625, 11.0771484375, 11.480224609375, 11.88330078125, 12.286376953125, 12.689453125, 13.092529296875, 13.49560546875, 13.898681640625, 14.3017578125, 14.704833984375, 15.10791015625, 15.510986328125, 15.9140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 10.0, 11.0, 7.0, 17.0, 32.0, 48.0, 80.0, 109.0, 190.0, 291.0, 628.0, 2822.0, 169566.0, 3918728.0, 98183.0, 2293.0, 552.0, 257.0, 175.0, 105.0, 60.0, 34.0, 26.0, 21.0, 16.0, 7.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-52.125, -50.8037109375, -49.482421875, -48.1611328125, -46.83984375, -45.5185546875, -44.197265625, -42.8759765625, -41.5546875, -40.2333984375, -38.912109375, -37.5908203125, -36.26953125, -34.9482421875, -33.626953125, -32.3056640625, -30.984375, -29.6630859375, -28.341796875, -27.0205078125, -25.69921875, -24.3779296875, -23.056640625, -21.7353515625, -20.4140625, -19.0927734375, -17.771484375, -16.4501953125, -15.12890625, -13.8076171875, -12.486328125, -11.1650390625, -9.84375, -8.5224609375, -7.201171875, -5.8798828125, -4.55859375, -3.2373046875, -1.916015625, -0.5947265625, 0.7265625, 2.0478515625, 3.369140625, 4.6904296875, 6.01171875, 7.3330078125, 8.654296875, 9.9755859375, 11.296875, 12.6181640625, 13.939453125, 15.2607421875, 16.58203125, 17.9033203125, 19.224609375, 20.5458984375, 21.8671875, 23.1884765625, 24.509765625, 25.8310546875, 27.15234375, 28.4736328125, 29.794921875, 31.1162109375, 32.4375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 11.0, 92.0, 391.0, 404.0, 98.0, 16.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.0514678955078, -226.18728637695312, -219.32308959960938, -212.4589080810547, -205.59471130371094, -198.73052978515625, -191.8663330078125, -185.0021514892578, -178.13796997070312, -171.27378845214844, -164.4095916748047, -157.54541015625, -150.68121337890625, -143.81703186035156, -136.95285034179688, -130.08865356445312, -123.22445678710938, -116.36026763916016, -109.49607849121094, -102.63189697265625, -95.7677001953125, -88.90351867675781, -82.0393295288086, -75.17514038085938, -68.31095123291016, -61.44676208496094, -54.58257293701172, -47.718387603759766, -40.85419845581055, -33.99000930786133, -27.125823974609375, -20.261634826660156, -13.3974609375, -6.533272743225098, 0.3309154510498047, 7.195102691650391, 14.05929183959961, 20.923480987548828, 27.78766632080078, 34.65185546875, 41.51604461669922, 48.38023376464844, 55.244422912597656, 62.10860824584961, 68.97279357910156, 75.83699035644531, 82.701171875, 89.56536102294922, 96.42955017089844, 103.29373931884766, 110.15792846679688, 117.02210998535156, 123.88630676269531, 130.75048828125, 137.61468505859375, 144.47886657714844, 151.34304809570312, 158.2072296142578, 165.07142639160156, 171.93560791015625, 178.7998046875, 185.6639862060547, 192.52816772460938, 199.39236450195312, 206.25656127929688]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 10.0, 12.0, 14.0, 18.0, 17.0, 31.0, 29.0, 23.0, 32.0, 40.0, 50.0, 40.0, 45.0, 50.0, 40.0, 44.0, 52.0, 53.0, 40.0, 42.0, 46.0, 37.0, 38.0, 41.0, 33.0, 18.0, 19.0, 18.0, 18.0, 16.0, 7.0, 7.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.510833740234375, -38.17347717285156, -36.836124420166016, -35.4987678527832, -34.161415100097656, -32.824058532714844, -31.486703872680664, -30.149349212646484, -28.811994552612305, -27.474639892578125, -26.137285232543945, -24.799930572509766, -23.462574005126953, -22.125221252441406, -20.787864685058594, -19.450510025024414, -18.113155364990234, -16.775800704956055, -15.438446044921875, -14.101090431213379, -12.7637357711792, -11.42638111114502, -10.089025497436523, -8.751670837402344, -7.414316177368164, -6.076961517333984, -4.7396063804626465, -3.4022512435913086, -2.064896583557129, -0.7275419235229492, 0.6098136901855469, 1.9471683502197266, 3.2845230102539062, 4.621877670288086, 5.959232807159424, 7.296587944030762, 8.633942604064941, 9.971297264099121, 11.308652877807617, 12.646007537841797, 13.983362197875977, 15.320716857910156, 16.658071517944336, 17.995426177978516, 19.332782745361328, 20.670135498046875, 22.007492065429688, 23.344846725463867, 24.682201385498047, 26.019556045532227, 27.356910705566406, 28.69426727294922, 30.031620025634766, 31.368976593017578, 32.706329345703125, 34.04368591308594, 35.38104248046875, 36.71839904785156, 38.05575180053711, 39.39310836791992, 40.73046112060547, 42.06781768798828, 43.405174255371094, 44.74252700805664, 46.07987976074219]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 6.0, 7.0, 11.0, 12.0, 6.0, 8.0, 16.0, 18.0, 35.0, 27.0, 27.0, 26.0, 35.0, 36.0, 36.0, 34.0, 41.0, 45.0, 45.0, 36.0, 33.0, 45.0, 37.0, 33.0, 29.0, 37.0, 40.0, 23.0, 37.0, 30.0, 26.0, 24.0, 11.0, 17.0, 12.0, 10.0, 7.0, 10.0, 6.0, 7.0, 2.0, 4.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.85540771484375, -3.7069091796875, -3.55841064453125, -3.409912109375, -3.26141357421875, -3.1129150390625, -2.96441650390625, -2.81591796875, -2.66741943359375, -2.5189208984375, -2.37042236328125, -2.221923828125, -2.07342529296875, -1.9249267578125, -1.77642822265625, -1.6279296875, -1.47943115234375, -1.3309326171875, -1.18243408203125, -1.033935546875, -0.88543701171875, -0.7369384765625, -0.58843994140625, -0.43994140625, -0.29144287109375, -0.1429443359375, 0.00555419921875, 0.154052734375, 0.30255126953125, 0.4510498046875, 0.59954833984375, 0.748046875, 0.89654541015625, 1.0450439453125, 1.19354248046875, 1.342041015625, 1.49053955078125, 1.6390380859375, 1.78753662109375, 1.93603515625, 2.08453369140625, 2.2330322265625, 2.38153076171875, 2.530029296875, 2.67852783203125, 2.8270263671875, 2.97552490234375, 3.1240234375, 3.27252197265625, 3.4210205078125, 3.56951904296875, 3.718017578125, 3.86651611328125, 4.0150146484375, 4.16351318359375, 4.31201171875, 4.46051025390625, 4.6090087890625, 4.75750732421875, 4.906005859375, 5.05450439453125, 5.2030029296875, 5.35150146484375, 5.5]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 10.0, 14.0, 20.0, 27.0, 39.0, 66.0, 103.0, 146.0, 216.0, 281.0, 468.0, 554.0, 919.0, 1335.0, 2079.0, 2991.0, 4523.0, 6943.0, 10933.0, 16872.0, 27550.0, 44067.0, 70541.0, 107742.0, 149284.0, 168670.0, 145547.0, 104390.0, 67629.0, 41991.0, 25838.0, 16343.0, 10375.0, 6650.0, 4443.0, 2901.0, 1955.0, 1294.0, 923.0, 560.0, 447.0, 289.0, 183.0, 101.0, 100.0, 77.0, 48.0, 35.0, 20.0, 12.0, 6.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6689453125, -0.6462326049804688, -0.6235198974609375, -0.6008071899414062, -0.578094482421875, -0.5553817749023438, -0.5326690673828125, -0.5099563598632812, -0.48724365234375, -0.46453094482421875, -0.4418182373046875, -0.41910552978515625, -0.396392822265625, -0.37368011474609375, -0.3509674072265625, -0.32825469970703125, -0.3055419921875, -0.28282928466796875, -0.2601165771484375, -0.23740386962890625, -0.214691162109375, -0.19197845458984375, -0.1692657470703125, -0.14655303955078125, -0.12384033203125, -0.10112762451171875, -0.0784149169921875, -0.05570220947265625, -0.032989501953125, -0.01027679443359375, 0.0124359130859375, 0.03514862060546875, 0.057861328125, 0.08057403564453125, 0.1032867431640625, 0.12599945068359375, 0.148712158203125, 0.17142486572265625, 0.1941375732421875, 0.21685028076171875, 0.23956298828125, 0.26227569580078125, 0.2849884033203125, 0.30770111083984375, 0.330413818359375, 0.35312652587890625, 0.3758392333984375, 0.39855194091796875, 0.4212646484375, 0.44397735595703125, 0.4666900634765625, 0.48940277099609375, 0.512115478515625, 0.5348281860351562, 0.5575408935546875, 0.5802536010742188, 0.60296630859375, 0.6256790161132812, 0.6483917236328125, 0.6711044311523438, 0.693817138671875, 0.7165298461914062, 0.7392425537109375, 0.7619552612304688, 0.78466796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 0.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 3.0, 10.0, 11.0, 15.0, 8.0, 19.0, 16.0, 19.0, 21.0, 25.0, 34.0, 37.0, 44.0, 37.0, 43.0, 47.0, 39.0, 48.0, 1056.0, 43.0, 32.0, 46.0, 35.0, 39.0, 36.0, 30.0, 32.0, 24.0, 21.0, 24.0, 21.0, 13.0, 10.0, 14.0, 11.0, 11.0, 7.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.255859375, -3.147674560546875, -3.03948974609375, -2.931304931640625, -2.8231201171875, -2.714935302734375, -2.60675048828125, -2.498565673828125, -2.390380859375, -2.282196044921875, -2.17401123046875, -2.065826416015625, -1.9576416015625, -1.849456787109375, -1.74127197265625, -1.633087158203125, -1.52490234375, -1.416717529296875, -1.30853271484375, -1.200347900390625, -1.0921630859375, -0.983978271484375, -0.87579345703125, -0.767608642578125, -0.659423828125, -0.551239013671875, -0.44305419921875, -0.334869384765625, -0.2266845703125, -0.118499755859375, -0.01031494140625, 0.097869873046875, 0.2060546875, 0.314239501953125, 0.42242431640625, 0.530609130859375, 0.6387939453125, 0.746978759765625, 0.85516357421875, 0.963348388671875, 1.071533203125, 1.179718017578125, 1.28790283203125, 1.396087646484375, 1.5042724609375, 1.612457275390625, 1.72064208984375, 1.828826904296875, 1.93701171875, 2.045196533203125, 2.15338134765625, 2.261566162109375, 2.3697509765625, 2.477935791015625, 2.58612060546875, 2.694305419921875, 2.802490234375, 2.910675048828125, 3.01885986328125, 3.127044677734375, 3.2352294921875, 3.343414306640625, 3.45159912109375, 3.559783935546875, 3.66796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 13.0, 19.0, 27.0, 35.0, 31.0, 65.0, 104.0, 159.0, 219.0, 320.0, 555.0, 884.0, 1345.0, 2242.0, 3554.0, 5829.0, 9410.0, 15614.0, 26879.0, 45604.0, 76750.0, 121382.0, 206638.0, 1188650.0, 148250.0, 96384.0, 59097.0, 35065.0, 20316.0, 12214.0, 7236.0, 4521.0, 2916.0, 1675.0, 1152.0, 690.0, 460.0, 284.0, 191.0, 127.0, 72.0, 56.0, 34.0, 18.0, 13.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.424072265625, -0.4095726013183594, -0.39507293701171875, -0.3805732727050781, -0.3660736083984375, -0.3515739440917969, -0.33707427978515625, -0.3225746154785156, -0.308074951171875, -0.2935752868652344, -0.27907562255859375, -0.2645759582519531, -0.2500762939453125, -0.23557662963867188, -0.22107696533203125, -0.20657730102539062, -0.19207763671875, -0.17757797241210938, -0.16307830810546875, -0.14857864379882812, -0.1340789794921875, -0.11957931518554688, -0.10507965087890625, -0.09057998657226562, -0.076080322265625, -0.061580657958984375, -0.04708099365234375, -0.032581329345703125, -0.0180816650390625, -0.003582000732421875, 0.01091766357421875, 0.025417327880859375, 0.0399169921875, 0.054416656494140625, 0.06891632080078125, 0.08341598510742188, 0.0979156494140625, 0.11241531372070312, 0.12691497802734375, 0.14141464233398438, 0.155914306640625, 0.17041397094726562, 0.18491363525390625, 0.19941329956054688, 0.2139129638671875, 0.22841262817382812, 0.24291229248046875, 0.2574119567871094, 0.27191162109375, 0.2864112854003906, 0.30091094970703125, 0.3154106140136719, 0.3299102783203125, 0.3444099426269531, 0.35890960693359375, 0.3734092712402344, 0.387908935546875, 0.4024085998535156, 0.41690826416015625, 0.4314079284667969, 0.4459075927734375, 0.4604072570800781, 0.47490692138671875, 0.4894065856933594, 0.50390625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 14.0, 10.0, 18.0, 22.0, 12.0, 20.0, 32.0, 30.0, 53.0, 40.0, 54.0, 76.0, 75.0, 81.0, 75.0, 69.0, 51.0, 35.0, 52.0, 34.0, 20.0, 18.0, 22.0, 14.0, 12.0, 10.0, 12.0, 10.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038665771484375, -0.03754568099975586, -0.03642559051513672, -0.03530550003051758, -0.03418540954589844, -0.0330653190612793, -0.031945228576660156, -0.030825138092041016, -0.029705047607421875, -0.028584957122802734, -0.027464866638183594, -0.026344776153564453, -0.025224685668945312, -0.024104595184326172, -0.02298450469970703, -0.02186441421508789, -0.02074432373046875, -0.01962423324584961, -0.01850414276123047, -0.017384052276611328, -0.016263961791992188, -0.015143871307373047, -0.014023780822753906, -0.012903690338134766, -0.011783599853515625, -0.010663509368896484, -0.009543418884277344, -0.008423328399658203, -0.0073032379150390625, -0.006183147430419922, -0.005063056945800781, -0.003942966461181641, -0.0028228759765625, -0.0017027854919433594, -0.0005826950073242188, 0.0005373954772949219, 0.0016574859619140625, 0.002777576446533203, 0.0038976669311523438, 0.005017757415771484, 0.006137847900390625, 0.007257938385009766, 0.008378028869628906, 0.009498119354248047, 0.010618209838867188, 0.011738300323486328, 0.012858390808105469, 0.01397848129272461, 0.01509857177734375, 0.01621866226196289, 0.01733875274658203, 0.018458843231201172, 0.019578933715820312, 0.020699024200439453, 0.021819114685058594, 0.022939205169677734, 0.024059295654296875, 0.025179386138916016, 0.026299476623535156, 0.027419567108154297, 0.028539657592773438, 0.029659748077392578, 0.03077983856201172, 0.03189992904663086, 0.03302001953125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 10.0, 12.0, 12.0, 15.0, 17.0, 24.0, 26.0, 47.0, 62.0, 100.0, 133.0, 274.0, 602.0, 3095.0, 1037943.0, 4722.0, 645.0, 282.0, 143.0, 108.0, 67.0, 56.0, 33.0, 17.0, 25.0, 22.0, 12.0, 15.0, 7.0, 5.0, 8.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6208267211914062, -0.5990753173828125, -0.5773239135742188, -0.555572509765625, -0.5338211059570312, -0.5120697021484375, -0.49031829833984375, -0.46856689453125, -0.44681549072265625, -0.4250640869140625, -0.40331268310546875, -0.381561279296875, -0.35980987548828125, -0.3380584716796875, -0.31630706787109375, -0.2945556640625, -0.27280426025390625, -0.2510528564453125, -0.22930145263671875, -0.207550048828125, -0.18579864501953125, -0.1640472412109375, -0.14229583740234375, -0.12054443359375, -0.09879302978515625, -0.0770416259765625, -0.05529022216796875, -0.033538818359375, -0.01178741455078125, 0.0099639892578125, 0.03171539306640625, 0.053466796875, 0.07521820068359375, 0.0969696044921875, 0.11872100830078125, 0.140472412109375, 0.16222381591796875, 0.1839752197265625, 0.20572662353515625, 0.22747802734375, 0.24922943115234375, 0.2709808349609375, 0.29273223876953125, 0.314483642578125, 0.33623504638671875, 0.3579864501953125, 0.37973785400390625, 0.4014892578125, 0.42324066162109375, 0.4449920654296875, 0.46674346923828125, 0.488494873046875, 0.5102462768554688, 0.5319976806640625, 0.5537490844726562, 0.57550048828125, 0.5972518920898438, 0.6190032958984375, 0.6407546997070312, 0.662506103515625, 0.6842575073242188, 0.7060089111328125, 0.7277603149414062, 0.74951171875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 231.0, 783.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13723061978816986, -0.11794070154428482, -0.09865078330039978, -0.07936087250709534, -0.0600709542632103, -0.040781036019325256, -0.021491125226020813, -0.0022011995315551758, 0.017088711261749268, 0.03637862950563431, 0.05566854402422905, 0.07495845854282379, 0.09424837678670883, 0.11353829503059387, 0.13282820582389832, 0.15211813151836395, 0.1714080423116684, 0.19069795310497284, 0.20998787879943848, 0.22927778959274292, 0.24856770038604736, 0.2678576111793518, 0.28714752197265625, 0.3064374625682831, 0.3257273733615875, 0.34501728415489197, 0.3643071949481964, 0.38359713554382324, 0.4028870463371277, 0.42217695713043213, 0.4414668679237366, 0.460756778717041, 0.48004668951034546, 0.4993366003036499, 0.5186265110969543, 0.5379164218902588, 0.5572063326835632, 0.5764962434768677, 0.5957862138748169, 0.6150761246681213, 0.6343660354614258, 0.6536559462547302, 0.6729458570480347, 0.6922357678413391, 0.7115256786346436, 0.7308156490325928, 0.7501055002212524, 0.7693954706192017, 0.7886853218078613, 0.8079752326011658, 0.8272651433944702, 0.8465550541877747, 0.8658449649810791, 0.8851349353790283, 0.904424786567688, 0.9237147569656372, 0.9430046677589417, 0.9622945785522461, 0.9815844893455505, 1.000874400138855, 1.0201643705368042, 1.0394542217254639, 1.058744192123413, 1.0780340433120728, 1.097324013710022]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 9.0, 10.0, 8.0, 6.0, 11.0, 7.0, 13.0, 12.0, 27.0, 14.0, 32.0, 24.0, 32.0, 27.0, 32.0, 32.0, 31.0, 39.0, 43.0, 48.0, 41.0, 41.0, 36.0, 36.0, 52.0, 42.0, 20.0, 28.0, 34.0, 28.0, 26.0, 30.0, 18.0, 21.0, 22.0, 16.0, 12.0, 4.0, 12.0, 6.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.05590951442718506, -0.054350536316633224, -0.05279155820608139, -0.051232583820819855, -0.04967360571026802, -0.048114627599716187, -0.04655565321445465, -0.04499667510390282, -0.04343769699335098, -0.04187871888279915, -0.040319740772247314, -0.03876076638698578, -0.037201788276433945, -0.03564281016588211, -0.034083835780620575, -0.03252485767006874, -0.030965879559516907, -0.029406901448965073, -0.027847925201058388, -0.026288948953151703, -0.02472997084259987, -0.023170992732048035, -0.02161201648414135, -0.020053040236234665, -0.01849406212568283, -0.016935084015130997, -0.015376107767224312, -0.013817130587995052, -0.012258153408765793, -0.010699176229536533, -0.009140199050307274, -0.007581221871078014, -0.006022244691848755, -0.004463267512619495, -0.002904290333390236, -0.0013453131541609764, 0.00021366402506828308, 0.0017726412042975426, 0.003331618383526802, 0.0048905955627560616, 0.006449572741985321, 0.00800854992121458, 0.00956752710044384, 0.0111265042796731, 0.012685481458902359, 0.014244458638131618, 0.015803435817360878, 0.017362412065267563, 0.018921390175819397, 0.02048036828637123, 0.022039344534277916, 0.0235983207821846, 0.025157298892736435, 0.02671627700328827, 0.028275253251194954, 0.02983422949910164, 0.03139320760965347, 0.03295218572020531, 0.03451116383075714, 0.03607013821601868, 0.03762911632657051, 0.039188094437122345, 0.04074706882238388, 0.042306046932935715, 0.04386502504348755]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 6.0, 7.0, 11.0, 12.0, 7.0, 7.0, 16.0, 18.0, 35.0, 27.0, 27.0, 26.0, 35.0, 36.0, 36.0, 33.0, 42.0, 46.0, 43.0, 37.0, 34.0, 44.0, 37.0, 33.0, 29.0, 37.0, 40.0, 23.0, 37.0, 30.0, 26.0, 24.0, 11.0, 16.0, 13.0, 10.0, 7.0, 10.0, 6.0, 7.0, 2.0, 4.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.85540771484375, -3.7069091796875, -3.55841064453125, -3.409912109375, -3.26141357421875, -3.1129150390625, -2.96441650390625, -2.81591796875, -2.66741943359375, -2.5189208984375, -2.37042236328125, -2.221923828125, -2.07342529296875, -1.9249267578125, -1.77642822265625, -1.6279296875, -1.47943115234375, -1.3309326171875, -1.18243408203125, -1.033935546875, -0.88543701171875, -0.7369384765625, -0.58843994140625, -0.43994140625, -0.29144287109375, -0.1429443359375, 0.00555419921875, 0.154052734375, 0.30255126953125, 0.4510498046875, 0.59954833984375, 0.748046875, 0.89654541015625, 1.0450439453125, 1.19354248046875, 1.342041015625, 1.49053955078125, 1.6390380859375, 1.78753662109375, 1.93603515625, 2.08453369140625, 2.2330322265625, 2.38153076171875, 2.530029296875, 2.67852783203125, 2.8270263671875, 2.97552490234375, 3.1240234375, 3.27252197265625, 3.4210205078125, 3.56951904296875, 3.718017578125, 3.86651611328125, 4.0150146484375, 4.16351318359375, 4.31201171875, 4.46051025390625, 4.6090087890625, 4.75750732421875, 4.906005859375, 5.05450439453125, 5.2030029296875, 5.35150146484375, 5.5]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 18.0, 35.0, 52.0, 116.0, 195.0, 362.0, 701.0, 1533.0, 3210.0, 7008.0, 17992.0, 54705.0, 184808.0, 437453.0, 233318.0, 69326.0, 21991.0, 8517.0, 3747.0, 1727.0, 838.0, 419.0, 229.0, 88.0, 79.0, 27.0, 20.0, 14.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.64239501953125, -7.4215087890625, -7.20062255859375, -6.979736328125, -6.75885009765625, -6.5379638671875, -6.31707763671875, -6.09619140625, -5.87530517578125, -5.6544189453125, -5.43353271484375, -5.212646484375, -4.99176025390625, -4.7708740234375, -4.54998779296875, -4.3291015625, -4.10821533203125, -3.8873291015625, -3.66644287109375, -3.445556640625, -3.22467041015625, -3.0037841796875, -2.78289794921875, -2.56201171875, -2.34112548828125, -2.1202392578125, -1.89935302734375, -1.678466796875, -1.45758056640625, -1.2366943359375, -1.01580810546875, -0.794921875, -0.57403564453125, -0.3531494140625, -0.13226318359375, 0.088623046875, 0.30950927734375, 0.5303955078125, 0.75128173828125, 0.97216796875, 1.19305419921875, 1.4139404296875, 1.63482666015625, 1.855712890625, 2.07659912109375, 2.2974853515625, 2.51837158203125, 2.7392578125, 2.96014404296875, 3.1810302734375, 3.40191650390625, 3.622802734375, 3.84368896484375, 4.0645751953125, 4.28546142578125, 4.50634765625, 4.72723388671875, 4.9481201171875, 5.16900634765625, 5.389892578125, 5.61077880859375, 5.8316650390625, 6.05255126953125, 6.2734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 4.0, 5.0, 6.0, 5.0, 4.0, 9.0, 12.0, 11.0, 17.0, 23.0, 22.0, 24.0, 25.0, 35.0, 44.0, 37.0, 42.0, 52.0, 76.0, 169.0, 358.0, 1407.0, 188.0, 79.0, 64.0, 55.0, 36.0, 37.0, 25.0, 27.0, 22.0, 33.0, 17.0, 15.0, 12.0, 9.0, 10.0, 12.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.453857421875, -13.93896484375, -13.424072265625, -12.9091796875, -12.394287109375, -11.87939453125, -11.364501953125, -10.849609375, -10.334716796875, -9.81982421875, -9.304931640625, -8.7900390625, -8.275146484375, -7.76025390625, -7.245361328125, -6.73046875, -6.215576171875, -5.70068359375, -5.185791015625, -4.6708984375, -4.156005859375, -3.64111328125, -3.126220703125, -2.611328125, -2.096435546875, -1.58154296875, -1.066650390625, -0.5517578125, -0.036865234375, 0.47802734375, 0.992919921875, 1.5078125, 2.022705078125, 2.53759765625, 3.052490234375, 3.5673828125, 4.082275390625, 4.59716796875, 5.112060546875, 5.626953125, 6.141845703125, 6.65673828125, 7.171630859375, 7.6865234375, 8.201416015625, 8.71630859375, 9.231201171875, 9.74609375, 10.260986328125, 10.77587890625, 11.290771484375, 11.8056640625, 12.320556640625, 12.83544921875, 13.350341796875, 13.865234375, 14.380126953125, 14.89501953125, 15.409912109375, 15.9248046875, 16.439697265625, 16.95458984375, 17.469482421875, 17.984375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 12.0, 10.0, 9.0, 26.0, 31.0, 45.0, 76.0, 115.0, 149.0, 265.0, 432.0, 1228.0, 69266.0, 3066597.0, 5765.0, 698.0, 317.0, 243.0, 132.0, 101.0, 47.0, 34.0, 26.0, 21.0, 20.0, 5.0, 7.0, 6.0, 5.0, 7.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.3125, -74.2646484375, -72.216796875, -70.1689453125, -68.12109375, -66.0732421875, -64.025390625, -61.9775390625, -59.9296875, -57.8818359375, -55.833984375, -53.7861328125, -51.73828125, -49.6904296875, -47.642578125, -45.5947265625, -43.546875, -41.4990234375, -39.451171875, -37.4033203125, -35.35546875, -33.3076171875, -31.259765625, -29.2119140625, -27.1640625, -25.1162109375, -23.068359375, -21.0205078125, -18.97265625, -16.9248046875, -14.876953125, -12.8291015625, -10.78125, -8.7333984375, -6.685546875, -4.6376953125, -2.58984375, -0.5419921875, 1.505859375, 3.5537109375, 5.6015625, 7.6494140625, 9.697265625, 11.7451171875, 13.79296875, 15.8408203125, 17.888671875, 19.9365234375, 21.984375, 24.0322265625, 26.080078125, 28.1279296875, 30.17578125, 32.2236328125, 34.271484375, 36.3193359375, 38.3671875, 40.4150390625, 42.462890625, 44.5107421875, 46.55859375, 48.6064453125, 50.654296875, 52.7021484375, 54.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 78.0, 355.0, 434.0, 138.0, 10.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-195.0911407470703, -191.5563201904297, -188.02151489257812, -184.4866943359375, -180.95188903808594, -177.4170684814453, -173.88226318359375, -170.34744262695312, -166.81263732910156, -163.27781677246094, -159.74301147460938, -156.20819091796875, -152.6733856201172, -149.13856506347656, -145.603759765625, -142.06893920898438, -138.53411865234375, -134.99929809570312, -131.46449279785156, -127.92967987060547, -124.39486694335938, -120.86005401611328, -117.32524108886719, -113.79042053222656, -110.255615234375, -106.7208023071289, -103.18598937988281, -99.65117645263672, -96.11636352539062, -92.58155059814453, -89.04673767089844, -85.51191711425781, -81.97711181640625, -78.44229888916016, -74.90748596191406, -71.37267303466797, -67.83786010742188, -64.30304718017578, -60.76823043823242, -57.23341751098633, -53.6986083984375, -50.163795471191406, -46.62898254394531, -43.09416961669922, -39.559356689453125, -36.02454376220703, -32.48972702026367, -28.954914093017578, -25.42009925842285, -21.885286331176758, -18.35047149658203, -14.815658569335938, -11.280845642089844, -7.74603271484375, -4.211217880249023, -0.6764049530029297, 2.858407974243164, 6.393221378326416, 9.928034782409668, 13.462848663330078, 16.997661590576172, 20.532474517822266, 24.067289352416992, 27.602102279663086, 31.13691520690918]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 7.0, 8.0, 8.0, 13.0, 12.0, 9.0, 14.0, 12.0, 25.0, 24.0, 29.0, 33.0, 36.0, 34.0, 33.0, 36.0, 33.0, 24.0, 41.0, 42.0, 37.0, 34.0, 53.0, 40.0, 44.0, 30.0, 30.0, 35.0, 38.0, 18.0, 24.0, 27.0, 20.0, 16.0, 10.0, 13.0, 11.0, 6.0, 10.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-49.89497756958008, -48.5804328918457, -47.26588821411133, -45.95134353637695, -44.636802673339844, -43.32225799560547, -42.007713317871094, -40.69316864013672, -39.378623962402344, -38.06407928466797, -36.749534606933594, -35.43498992919922, -34.120445251464844, -32.805904388427734, -31.49135971069336, -30.176815032958984, -28.86227035522461, -27.547725677490234, -26.23318099975586, -24.918638229370117, -23.604093551635742, -22.289548873901367, -20.975006103515625, -19.66046142578125, -18.345916748046875, -17.0313720703125, -15.716828346252441, -14.402284622192383, -13.087739944458008, -11.773195266723633, -10.458651542663574, -9.144107818603516, -7.829566955566406, -6.5150227546691895, -5.200478553771973, -3.885934352874756, -2.571390151977539, -1.2568459510803223, 0.05769824981689453, 1.3722419738769531, 2.686786651611328, 4.001330852508545, 5.315875053405762, 6.6304192543029785, 7.944963455200195, 9.25950813293457, 10.574051856994629, 11.888595581054688, 13.203140258789062, 14.517684936523438, 15.832228660583496, 17.146772384643555, 18.46131706237793, 19.775861740112305, 21.090404510498047, 22.404949188232422, 23.719493865966797, 25.034038543701172, 26.348583221435547, 27.66312599182129, 28.977670669555664, 30.29221534729004, 31.60675811767578, 32.921302795410156, 34.23584747314453]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 7.0, 5.0, 11.0, 8.0, 11.0, 13.0, 15.0, 18.0, 18.0, 21.0, 21.0, 27.0, 35.0, 39.0, 29.0, 33.0, 43.0, 46.0, 41.0, 39.0, 28.0, 31.0, 53.0, 34.0, 31.0, 45.0, 44.0, 27.0, 26.0, 39.0, 31.0, 24.0, 18.0, 22.0, 13.0, 8.0, 8.0, 13.0, 3.0, 5.0, 3.0, 4.0, 5.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.4976806640625, -4.335205078125, -4.1727294921875, -4.01025390625, -3.8477783203125, -3.685302734375, -3.5228271484375, -3.3603515625, -3.1978759765625, -3.035400390625, -2.8729248046875, -2.71044921875, -2.5479736328125, -2.385498046875, -2.2230224609375, -2.060546875, -1.8980712890625, -1.735595703125, -1.5731201171875, -1.41064453125, -1.2481689453125, -1.085693359375, -0.9232177734375, -0.7607421875, -0.5982666015625, -0.435791015625, -0.2733154296875, -0.11083984375, 0.0516357421875, 0.214111328125, 0.3765869140625, 0.5390625, 0.7015380859375, 0.864013671875, 1.0264892578125, 1.18896484375, 1.3514404296875, 1.513916015625, 1.6763916015625, 1.8388671875, 2.0013427734375, 2.163818359375, 2.3262939453125, 2.48876953125, 2.6512451171875, 2.813720703125, 2.9761962890625, 3.138671875, 3.3011474609375, 3.463623046875, 3.6260986328125, 3.78857421875, 3.9510498046875, 4.113525390625, 4.2760009765625, 4.4384765625, 4.6009521484375, 4.763427734375, 4.9259033203125, 5.08837890625, 5.2508544921875, 5.413330078125, 5.5758056640625, 5.73828125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 10.0, 10.0, 14.0, 18.0, 23.0, 36.0, 41.0, 70.0, 82.0, 117.0, 192.0, 280.0, 463.0, 833.0, 1778.0, 4269.0, 13274.0, 54530.0, 266397.0, 1124656.0, 1806942.0, 723068.0, 151236.0, 31732.0, 8457.0, 2984.0, 1233.0, 623.0, 286.0, 205.0, 119.0, 78.0, 75.0, 36.0, 30.0, 21.0, 8.0, 9.0, 7.0, 9.0, 1.0, 5.0, 6.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.140625, -7.8807373046875, -7.620849609375, -7.3609619140625, -7.10107421875, -6.8411865234375, -6.581298828125, -6.3214111328125, -6.0615234375, -5.8016357421875, -5.541748046875, -5.2818603515625, -5.02197265625, -4.7620849609375, -4.502197265625, -4.2423095703125, -3.982421875, -3.7225341796875, -3.462646484375, -3.2027587890625, -2.94287109375, -2.6829833984375, -2.423095703125, -2.1632080078125, -1.9033203125, -1.6434326171875, -1.383544921875, -1.1236572265625, -0.86376953125, -0.6038818359375, -0.343994140625, -0.0841064453125, 0.17578125, 0.4356689453125, 0.695556640625, 0.9554443359375, 1.21533203125, 1.4752197265625, 1.735107421875, 1.9949951171875, 2.2548828125, 2.5147705078125, 2.774658203125, 3.0345458984375, 3.29443359375, 3.5543212890625, 3.814208984375, 4.0740966796875, 4.333984375, 4.5938720703125, 4.853759765625, 5.1136474609375, 5.37353515625, 5.6334228515625, 5.893310546875, 6.1531982421875, 6.4130859375, 6.6729736328125, 6.932861328125, 7.1927490234375, 7.45263671875, 7.7125244140625, 7.972412109375, 8.2322998046875, 8.4921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 2.0, 8.0, 7.0, 7.0, 8.0, 22.0, 25.0, 32.0, 54.0, 60.0, 95.0, 125.0, 194.0, 228.0, 307.0, 420.0, 475.0, 475.0, 386.0, 327.0, 217.0, 168.0, 124.0, 98.0, 54.0, 49.0, 39.0, 23.0, 13.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.125, -10.7760009765625, -10.427001953125, -10.0780029296875, -9.72900390625, -9.3800048828125, -9.031005859375, -8.6820068359375, -8.3330078125, -7.9840087890625, -7.635009765625, -7.2860107421875, -6.93701171875, -6.5880126953125, -6.239013671875, -5.8900146484375, -5.541015625, -5.1920166015625, -4.843017578125, -4.4940185546875, -4.14501953125, -3.7960205078125, -3.447021484375, -3.0980224609375, -2.7490234375, -2.4000244140625, -2.051025390625, -1.7020263671875, -1.35302734375, -1.0040283203125, -0.655029296875, -0.3060302734375, 0.04296875, 0.3919677734375, 0.740966796875, 1.0899658203125, 1.43896484375, 1.7879638671875, 2.136962890625, 2.4859619140625, 2.8349609375, 3.1839599609375, 3.532958984375, 3.8819580078125, 4.23095703125, 4.5799560546875, 4.928955078125, 5.2779541015625, 5.626953125, 5.9759521484375, 6.324951171875, 6.6739501953125, 7.02294921875, 7.3719482421875, 7.720947265625, 8.0699462890625, 8.4189453125, 8.7679443359375, 9.116943359375, 9.4659423828125, 9.81494140625, 10.1639404296875, 10.512939453125, 10.8619384765625, 11.2109375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 13.0, 20.0, 33.0, 54.0, 71.0, 94.0, 158.0, 205.0, 354.0, 705.0, 4814.0, 279867.0, 3783061.0, 120188.0, 2982.0, 659.0, 344.0, 202.0, 153.0, 75.0, 64.0, 50.0, 27.0, 21.0, 10.0, 10.0, 5.0, 12.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.90625, -36.73681640625, -35.5673828125, -34.39794921875, -33.228515625, -32.05908203125, -30.8896484375, -29.72021484375, -28.55078125, -27.38134765625, -26.2119140625, -25.04248046875, -23.873046875, -22.70361328125, -21.5341796875, -20.36474609375, -19.1953125, -18.02587890625, -16.8564453125, -15.68701171875, -14.517578125, -13.34814453125, -12.1787109375, -11.00927734375, -9.83984375, -8.67041015625, -7.5009765625, -6.33154296875, -5.162109375, -3.99267578125, -2.8232421875, -1.65380859375, -0.484375, 0.68505859375, 1.8544921875, 3.02392578125, 4.193359375, 5.36279296875, 6.5322265625, 7.70166015625, 8.87109375, 10.04052734375, 11.2099609375, 12.37939453125, 13.548828125, 14.71826171875, 15.8876953125, 17.05712890625, 18.2265625, 19.39599609375, 20.5654296875, 21.73486328125, 22.904296875, 24.07373046875, 25.2431640625, 26.41259765625, 27.58203125, 28.75146484375, 29.9208984375, 31.09033203125, 32.259765625, 33.42919921875, 34.5986328125, 35.76806640625, 36.9375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 11.0, 15.0, 25.0, 52.0, 61.0, 88.0, 98.0, 115.0, 131.0, 115.0, 86.0, 69.0, 54.0, 33.0, 27.0, 13.0, 11.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.04686737060547, -67.33910369873047, -65.63134002685547, -63.9235725402832, -62.2158088684082, -60.50804138183594, -58.80027770996094, -57.09251403808594, -55.38475036621094, -53.67698669433594, -51.96921920776367, -50.26145553588867, -48.55369186401367, -46.845924377441406, -45.138160705566406, -43.430397033691406, -41.72262954711914, -40.01486587524414, -38.307098388671875, -36.599334716796875, -34.891571044921875, -33.183807373046875, -31.47603988647461, -29.76827621459961, -28.060510635375977, -26.352745056152344, -24.644981384277344, -22.93721580505371, -21.229450225830078, -19.521686553955078, -17.813920974731445, -16.106155395507812, -14.398387908935547, -12.69062328338623, -10.982858657836914, -9.275093078613281, -7.567328453063965, -5.859563827514648, -4.151798248291016, -2.444033622741699, -0.7362689971923828, 0.9714958667755127, 2.679260730743408, 4.387025833129883, 6.094790458679199, 7.802555084228516, 9.510320663452148, 11.218085289001465, 12.925849914550781, 14.633614540100098, 16.341379165649414, 18.049144744873047, 19.756908416748047, 21.46467399597168, 23.172439575195312, 24.880203247070312, 26.587968826293945, 28.295734405517578, 30.003498077392578, 31.71126365661621, 33.419029235839844, 35.126792907714844, 36.834556579589844, 38.54232406616211, 40.25008773803711]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 12.0, 9.0, 7.0, 8.0, 11.0, 9.0, 11.0, 18.0, 18.0, 15.0, 18.0, 12.0, 24.0, 29.0, 30.0, 29.0, 33.0, 31.0, 45.0, 41.0, 35.0, 33.0, 46.0, 34.0, 32.0, 49.0, 29.0, 46.0, 30.0, 37.0, 26.0, 24.0, 19.0, 17.0, 25.0, 17.0, 13.0, 15.0, 12.0, 11.0, 9.0, 8.0, 13.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.984907150268555, -30.021028518676758, -29.057147979736328, -28.09326934814453, -27.129390716552734, -26.165512084960938, -25.20163345336914, -24.23775291442871, -23.273874282836914, -22.309995651245117, -21.346115112304688, -20.38223648071289, -19.418357849121094, -18.454479217529297, -17.4906005859375, -16.52672004699707, -15.562841415405273, -14.598962783813477, -13.635083198547363, -12.67120361328125, -11.707324981689453, -10.743446350097656, -9.779566764831543, -8.81568717956543, -7.851808547973633, -6.887929439544678, -5.924050331115723, -4.960171222686768, -3.9962921142578125, -3.0324130058288574, -2.0685338973999023, -1.1046547889709473, -0.140777587890625, 0.8231015205383301, 1.7869806289672852, 2.7508597373962402, 3.7147388458251953, 4.67861795425415, 5.6424970626831055, 6.6063761711120605, 7.570255279541016, 8.534133911132812, 9.498013496398926, 10.461893081665039, 11.425771713256836, 12.389650344848633, 13.353529930114746, 14.31740951538086, 15.281288146972656, 16.245166778564453, 17.20904541015625, 18.17292594909668, 19.136804580688477, 20.100683212280273, 21.064563751220703, 22.0284423828125, 22.992321014404297, 23.956199645996094, 24.92007827758789, 25.88395881652832, 26.847837448120117, 27.811716079711914, 28.775596618652344, 29.73947525024414, 30.703353881835938]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 3.0, 5.0, 5.0, 14.0, 16.0, 16.0, 10.0, 17.0, 26.0, 30.0, 26.0, 23.0, 32.0, 39.0, 36.0, 26.0, 30.0, 43.0, 41.0, 36.0, 56.0, 47.0, 44.0, 37.0, 44.0, 43.0, 24.0, 28.0, 31.0, 26.0, 18.0, 24.0, 15.0, 15.0, 16.0, 15.0, 14.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.86328125, -4.70135498046875, -4.5394287109375, -4.37750244140625, -4.215576171875, -4.05364990234375, -3.8917236328125, -3.72979736328125, -3.56787109375, -3.40594482421875, -3.2440185546875, -3.08209228515625, -2.920166015625, -2.75823974609375, -2.5963134765625, -2.43438720703125, -2.2724609375, -2.11053466796875, -1.9486083984375, -1.78668212890625, -1.624755859375, -1.46282958984375, -1.3009033203125, -1.13897705078125, -0.97705078125, -0.81512451171875, -0.6531982421875, -0.49127197265625, -0.329345703125, -0.16741943359375, -0.0054931640625, 0.15643310546875, 0.318359375, 0.48028564453125, 0.6422119140625, 0.80413818359375, 0.966064453125, 1.12799072265625, 1.2899169921875, 1.45184326171875, 1.61376953125, 1.77569580078125, 1.9376220703125, 2.09954833984375, 2.261474609375, 2.42340087890625, 2.5853271484375, 2.74725341796875, 2.9091796875, 3.07110595703125, 3.2330322265625, 3.39495849609375, 3.556884765625, 3.71881103515625, 3.8807373046875, 4.04266357421875, 4.20458984375, 4.36651611328125, 4.5284423828125, 4.69036865234375, 4.852294921875, 5.01422119140625, 5.1761474609375, 5.33807373046875, 5.5]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 15.0, 14.0, 26.0, 34.0, 51.0, 63.0, 99.0, 173.0, 218.0, 350.0, 434.0, 649.0, 963.0, 1476.0, 2335.0, 3468.0, 5357.0, 8422.0, 13303.0, 21229.0, 34896.0, 55987.0, 89701.0, 134395.0, 172743.0, 166305.0, 123035.0, 79828.0, 49793.0, 30579.0, 18809.0, 12057.0, 7461.0, 4856.0, 3205.0, 2045.0, 1304.0, 892.0, 597.0, 409.0, 306.0, 207.0, 133.0, 108.0, 66.0, 42.0, 21.0, 22.0, 15.0, 21.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.81640625, -0.7907943725585938, -0.7651824951171875, -0.7395706176757812, -0.713958740234375, -0.6883468627929688, -0.6627349853515625, -0.6371231079101562, -0.61151123046875, -0.5858993530273438, -0.5602874755859375, -0.5346755981445312, -0.509063720703125, -0.48345184326171875, -0.4578399658203125, -0.43222808837890625, -0.4066162109375, -0.38100433349609375, -0.3553924560546875, -0.32978057861328125, -0.304168701171875, -0.27855682373046875, -0.2529449462890625, -0.22733306884765625, -0.20172119140625, -0.17610931396484375, -0.1504974365234375, -0.12488555908203125, -0.099273681640625, -0.07366180419921875, -0.0480499267578125, -0.02243804931640625, 0.003173828125, 0.02878570556640625, 0.0543975830078125, 0.08000946044921875, 0.105621337890625, 0.13123321533203125, 0.1568450927734375, 0.18245697021484375, 0.20806884765625, 0.23368072509765625, 0.2592926025390625, 0.28490447998046875, 0.310516357421875, 0.33612823486328125, 0.3617401123046875, 0.38735198974609375, 0.4129638671875, 0.43857574462890625, 0.4641876220703125, 0.48979949951171875, 0.515411376953125, 0.5410232543945312, 0.5666351318359375, 0.5922470092773438, 0.61785888671875, 0.6434707641601562, 0.6690826416015625, 0.6946945190429688, 0.720306396484375, 0.7459182739257812, 0.7715301513671875, 0.7971420288085938, 0.82275390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 7.0, 13.0, 11.0, 9.0, 14.0, 15.0, 17.0, 29.0, 22.0, 26.0, 34.0, 37.0, 36.0, 38.0, 48.0, 36.0, 40.0, 39.0, 1071.0, 38.0, 46.0, 45.0, 37.0, 36.0, 36.0, 41.0, 32.0, 24.0, 25.0, 13.0, 16.0, 11.0, 17.0, 13.0, 11.0, 5.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.716796875, -3.593536376953125, -3.47027587890625, -3.347015380859375, -3.2237548828125, -3.100494384765625, -2.97723388671875, -2.853973388671875, -2.730712890625, -2.607452392578125, -2.48419189453125, -2.360931396484375, -2.2376708984375, -2.114410400390625, -1.99114990234375, -1.867889404296875, -1.74462890625, -1.621368408203125, -1.49810791015625, -1.374847412109375, -1.2515869140625, -1.128326416015625, -1.00506591796875, -0.881805419921875, -0.758544921875, -0.635284423828125, -0.51202392578125, -0.388763427734375, -0.2655029296875, -0.142242431640625, -0.01898193359375, 0.104278564453125, 0.2275390625, 0.350799560546875, 0.47406005859375, 0.597320556640625, 0.7205810546875, 0.843841552734375, 0.96710205078125, 1.090362548828125, 1.213623046875, 1.336883544921875, 1.46014404296875, 1.583404541015625, 1.7066650390625, 1.829925537109375, 1.95318603515625, 2.076446533203125, 2.19970703125, 2.322967529296875, 2.44622802734375, 2.569488525390625, 2.6927490234375, 2.816009521484375, 2.93927001953125, 3.062530517578125, 3.185791015625, 3.309051513671875, 3.43231201171875, 3.555572509765625, 3.6788330078125, 3.802093505859375, 3.92535400390625, 4.048614501953125, 4.171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 11.0, 11.0, 19.0, 32.0, 45.0, 81.0, 128.0, 264.0, 419.0, 766.0, 1374.0, 2527.0, 4509.0, 8535.0, 16028.0, 30720.0, 58982.0, 110681.0, 190157.0, 1272267.0, 179508.0, 103515.0, 54963.0, 28865.0, 15147.0, 7940.0, 4258.0, 2327.0, 1262.0, 746.0, 435.0, 254.0, 119.0, 82.0, 48.0, 37.0, 21.0, 19.0, 10.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71630859375, -0.6966552734375, -0.677001953125, -0.6573486328125, -0.6376953125, -0.6180419921875, -0.598388671875, -0.5787353515625, -0.55908203125, -0.5394287109375, -0.519775390625, -0.5001220703125, -0.48046875, -0.4608154296875, -0.441162109375, -0.4215087890625, -0.40185546875, -0.3822021484375, -0.362548828125, -0.3428955078125, -0.3232421875, -0.3035888671875, -0.283935546875, -0.2642822265625, -0.24462890625, -0.2249755859375, -0.205322265625, -0.1856689453125, -0.166015625, -0.1463623046875, -0.126708984375, -0.1070556640625, -0.08740234375, -0.0677490234375, -0.048095703125, -0.0284423828125, -0.0087890625, 0.0108642578125, 0.030517578125, 0.0501708984375, 0.06982421875, 0.0894775390625, 0.109130859375, 0.1287841796875, 0.1484375, 0.1680908203125, 0.187744140625, 0.2073974609375, 0.22705078125, 0.2467041015625, 0.266357421875, 0.2860107421875, 0.3056640625, 0.3253173828125, 0.344970703125, 0.3646240234375, 0.38427734375, 0.4039306640625, 0.423583984375, 0.4432373046875, 0.462890625, 0.4825439453125, 0.502197265625, 0.5218505859375, 0.54150390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 5.0, 2.0, 6.0, 8.0, 19.0, 20.0, 19.0, 28.0, 37.0, 30.0, 43.0, 45.0, 54.0, 51.0, 68.0, 60.0, 70.0, 53.0, 50.0, 42.0, 45.0, 31.0, 25.0, 34.0, 16.0, 29.0, 15.0, 16.0, 14.0, 7.0, 14.0, 4.0, 4.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0290679931640625, -0.028173208236694336, -0.027278423309326172, -0.026383638381958008, -0.025488853454589844, -0.02459406852722168, -0.023699283599853516, -0.02280449867248535, -0.021909713745117188, -0.021014928817749023, -0.02012014389038086, -0.019225358963012695, -0.01833057403564453, -0.017435789108276367, -0.016541004180908203, -0.01564621925354004, -0.014751434326171875, -0.013856649398803711, -0.012961864471435547, -0.012067079544067383, -0.011172294616699219, -0.010277509689331055, -0.00938272476196289, -0.008487939834594727, -0.0075931549072265625, -0.0066983699798583984, -0.005803585052490234, -0.00490880012512207, -0.004014015197753906, -0.003119230270385742, -0.002224445343017578, -0.001329660415649414, -0.00043487548828125, 0.00045990943908691406, 0.0013546943664550781, 0.002249479293823242, 0.0031442642211914062, 0.00403904914855957, 0.004933834075927734, 0.0058286190032958984, 0.0067234039306640625, 0.0076181888580322266, 0.00851297378540039, 0.009407758712768555, 0.010302543640136719, 0.011197328567504883, 0.012092113494873047, 0.012986898422241211, 0.013881683349609375, 0.014776468276977539, 0.015671253204345703, 0.016566038131713867, 0.01746082305908203, 0.018355607986450195, 0.01925039291381836, 0.020145177841186523, 0.021039962768554688, 0.02193474769592285, 0.022829532623291016, 0.02372431755065918, 0.024619102478027344, 0.025513887405395508, 0.026408672332763672, 0.027303457260131836, 0.0281982421875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 6.0, 6.0, 10.0, 13.0, 19.0, 20.0, 27.0, 37.0, 30.0, 49.0, 60.0, 77.0, 113.0, 168.0, 315.0, 636.0, 5277.0, 1032947.0, 7108.0, 635.0, 330.0, 195.0, 145.0, 74.0, 57.0, 46.0, 29.0, 28.0, 28.0, 8.0, 8.0, 6.0, 4.0, 5.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5517578125, -0.5342559814453125, -0.516754150390625, -0.4992523193359375, -0.48175048828125, -0.4642486572265625, -0.446746826171875, -0.4292449951171875, -0.4117431640625, -0.3942413330078125, -0.376739501953125, -0.3592376708984375, -0.34173583984375, -0.3242340087890625, -0.306732177734375, -0.2892303466796875, -0.271728515625, -0.2542266845703125, -0.236724853515625, -0.2192230224609375, -0.20172119140625, -0.1842193603515625, -0.166717529296875, -0.1492156982421875, -0.1317138671875, -0.1142120361328125, -0.096710205078125, -0.0792083740234375, -0.06170654296875, -0.0442047119140625, -0.026702880859375, -0.0092010498046875, 0.00830078125, 0.0258026123046875, 0.043304443359375, 0.0608062744140625, 0.07830810546875, 0.0958099365234375, 0.113311767578125, 0.1308135986328125, 0.1483154296875, 0.1658172607421875, 0.183319091796875, 0.2008209228515625, 0.21832275390625, 0.2358245849609375, 0.253326416015625, 0.2708282470703125, 0.288330078125, 0.3058319091796875, 0.323333740234375, 0.3408355712890625, 0.35833740234375, 0.3758392333984375, 0.393341064453125, 0.4108428955078125, 0.4283447265625, 0.4458465576171875, 0.463348388671875, 0.4808502197265625, 0.49835205078125, 0.5158538818359375, 0.533355712890625, 0.5508575439453125, 0.568359375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 36.0, 979.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11276122182607651, -0.0918130949139595, -0.0708649754524231, -0.04991684854030609, -0.028968721628189087, -0.008020594716072083, 0.012927524745464325, 0.03387565165758133, 0.054823778569698334, 0.07577190548181534, 0.09672002494335175, 0.11766815185546875, 0.13861627876758575, 0.15956440567970276, 0.18051251769065857, 0.20146065950393677, 0.22240877151489258, 0.24335689842700958, 0.2643050253391266, 0.2852531373500824, 0.3062012791633606, 0.3271493911743164, 0.3480975031852722, 0.3690456449985504, 0.3899937868118286, 0.4109418988227844, 0.4318900406360626, 0.45283815264701843, 0.47378629446029663, 0.49473440647125244, 0.5156825184822083, 0.5366306304931641, 0.5575787425041199, 0.5785268545150757, 0.5994749665260315, 0.6204231381416321, 0.6413712501525879, 0.6623193621635437, 0.6832674741744995, 0.7042156457901001, 0.7251637578010559, 0.7461118698120117, 0.7670599818229675, 0.7880081534385681, 0.8089562654495239, 0.8299043774604797, 0.8508524894714355, 0.8718006610870361, 0.8927487134933472, 0.913696825504303, 0.9346449375152588, 0.9555931091308594, 0.9765412211418152, 0.997489333152771, 1.0184375047683716, 1.0393855571746826, 1.0603337287902832, 1.0812819004058838, 1.1022299528121948, 1.1231781244277954, 1.1441261768341064, 1.165074348449707, 1.1860225200653076, 1.2069705724716187, 1.2279187440872192]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 4.0, 17.0, 13.0, 18.0, 22.0, 19.0, 14.0, 29.0, 34.0, 43.0, 26.0, 29.0, 39.0, 55.0, 31.0, 62.0, 46.0, 49.0, 35.0, 46.0, 51.0, 50.0, 33.0, 39.0, 37.0, 31.0, 20.0, 18.0, 16.0, 21.0, 15.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.06246870756149292, -0.06079918146133423, -0.05912965536117554, -0.057460129261016846, -0.055790603160858154, -0.05412107706069946, -0.05245155096054077, -0.05078202486038208, -0.04911249876022339, -0.0474429726600647, -0.045773446559906006, -0.044103920459747314, -0.04243439435958862, -0.04076486825942993, -0.03909534215927124, -0.03742581605911255, -0.03575628995895386, -0.034086763858795166, -0.032417237758636475, -0.030747711658477783, -0.029078185558319092, -0.0274086594581604, -0.02573913335800171, -0.024069607257843018, -0.022400081157684326, -0.020730555057525635, -0.019061028957366943, -0.017391502857208252, -0.01572197675704956, -0.01405245065689087, -0.012382924556732178, -0.010713398456573486, -0.009043872356414795, -0.0073743462562561035, -0.005704820156097412, -0.004035294055938721, -0.0023657679557800293, -0.0006962418556213379, 0.0009732842445373535, 0.002642810344696045, 0.004312336444854736, 0.005981862545013428, 0.007651388645172119, 0.00932091474533081, 0.010990440845489502, 0.012659966945648193, 0.014329493045806885, 0.015999019145965576, 0.017668545246124268, 0.01933807134628296, 0.02100759744644165, 0.022677123546600342, 0.024346649646759033, 0.026016175746917725, 0.027685701847076416, 0.029355227947235107, 0.0310247540473938, 0.03269428014755249, 0.03436380624771118, 0.03603333234786987, 0.037702858448028564, 0.039372384548187256, 0.04104191064834595, 0.04271143674850464, 0.04438096284866333]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 3.0, 5.0, 5.0, 14.0, 16.0, 16.0, 10.0, 17.0, 26.0, 30.0, 25.0, 24.0, 32.0, 39.0, 35.0, 26.0, 31.0, 41.0, 43.0, 33.0, 58.0, 47.0, 45.0, 37.0, 43.0, 44.0, 25.0, 26.0, 31.0, 27.0, 17.0, 26.0, 13.0, 16.0, 16.0, 15.0, 14.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8671875, -4.7052001953125, -4.543212890625, -4.3812255859375, -4.21923828125, -4.0572509765625, -3.895263671875, -3.7332763671875, -3.5712890625, -3.4093017578125, -3.247314453125, -3.0853271484375, -2.92333984375, -2.7613525390625, -2.599365234375, -2.4373779296875, -2.275390625, -2.1134033203125, -1.951416015625, -1.7894287109375, -1.62744140625, -1.4654541015625, -1.303466796875, -1.1414794921875, -0.9794921875, -0.8175048828125, -0.655517578125, -0.4935302734375, -0.33154296875, -0.1695556640625, -0.007568359375, 0.1544189453125, 0.31640625, 0.4783935546875, 0.640380859375, 0.8023681640625, 0.96435546875, 1.1263427734375, 1.288330078125, 1.4503173828125, 1.6123046875, 1.7742919921875, 1.936279296875, 2.0982666015625, 2.26025390625, 2.4222412109375, 2.584228515625, 2.7462158203125, 2.908203125, 3.0701904296875, 3.232177734375, 3.3941650390625, 3.55615234375, 3.7181396484375, 3.880126953125, 4.0421142578125, 4.2041015625, 4.3660888671875, 4.528076171875, 4.6900634765625, 4.85205078125, 5.0140380859375, 5.176025390625, 5.3380126953125, 5.5]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 10.0, 10.0, 15.0, 22.0, 27.0, 50.0, 67.0, 89.0, 150.0, 245.0, 416.0, 790.0, 1633.0, 3423.0, 8261.0, 21699.0, 60973.0, 168341.0, 386113.0, 251034.0, 91319.0, 32519.0, 11805.0, 4857.0, 2185.0, 1088.0, 561.0, 315.0, 183.0, 108.0, 82.0, 47.0, 36.0, 23.0, 20.0, 9.0, 9.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.54193115234375, -6.3533935546875, -6.16485595703125, -5.976318359375, -5.78778076171875, -5.5992431640625, -5.41070556640625, -5.22216796875, -5.03363037109375, -4.8450927734375, -4.65655517578125, -4.468017578125, -4.27947998046875, -4.0909423828125, -3.90240478515625, -3.7138671875, -3.52532958984375, -3.3367919921875, -3.14825439453125, -2.959716796875, -2.77117919921875, -2.5826416015625, -2.39410400390625, -2.20556640625, -2.01702880859375, -1.8284912109375, -1.63995361328125, -1.451416015625, -1.26287841796875, -1.0743408203125, -0.88580322265625, -0.697265625, -0.50872802734375, -0.3201904296875, -0.13165283203125, 0.056884765625, 0.24542236328125, 0.4339599609375, 0.62249755859375, 0.81103515625, 0.99957275390625, 1.1881103515625, 1.37664794921875, 1.565185546875, 1.75372314453125, 1.9422607421875, 2.13079833984375, 2.3193359375, 2.50787353515625, 2.6964111328125, 2.88494873046875, 3.073486328125, 3.26202392578125, 3.4505615234375, 3.63909912109375, 3.82763671875, 4.01617431640625, 4.2047119140625, 4.39324951171875, 4.581787109375, 4.77032470703125, 4.9588623046875, 5.14739990234375, 5.3359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 3.0, 7.0, 7.0, 5.0, 10.0, 15.0, 9.0, 18.0, 14.0, 16.0, 17.0, 26.0, 34.0, 32.0, 30.0, 48.0, 38.0, 56.0, 93.0, 142.0, 287.0, 1383.0, 205.0, 105.0, 77.0, 53.0, 49.0, 40.0, 44.0, 26.0, 17.0, 22.0, 23.0, 14.0, 9.0, 14.0, 10.0, 14.0, 9.0, 2.0, 8.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.078125, -15.579345703125, -15.08056640625, -14.581787109375, -14.0830078125, -13.584228515625, -13.08544921875, -12.586669921875, -12.087890625, -11.589111328125, -11.09033203125, -10.591552734375, -10.0927734375, -9.593994140625, -9.09521484375, -8.596435546875, -8.09765625, -7.598876953125, -7.10009765625, -6.601318359375, -6.1025390625, -5.603759765625, -5.10498046875, -4.606201171875, -4.107421875, -3.608642578125, -3.10986328125, -2.611083984375, -2.1123046875, -1.613525390625, -1.11474609375, -0.615966796875, -0.1171875, 0.381591796875, 0.88037109375, 1.379150390625, 1.8779296875, 2.376708984375, 2.87548828125, 3.374267578125, 3.873046875, 4.371826171875, 4.87060546875, 5.369384765625, 5.8681640625, 6.366943359375, 6.86572265625, 7.364501953125, 7.86328125, 8.362060546875, 8.86083984375, 9.359619140625, 9.8583984375, 10.357177734375, 10.85595703125, 11.354736328125, 11.853515625, 12.352294921875, 12.85107421875, 13.349853515625, 13.8486328125, 14.347412109375, 14.84619140625, 15.344970703125, 15.84375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 12.0, 22.0, 28.0, 56.0, 60.0, 86.0, 156.0, 303.0, 729.0, 2903.0, 826594.0, 2309712.0, 3438.0, 789.0, 342.0, 158.0, 120.0, 54.0, 49.0, 25.0, 26.0, 14.0, 3.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.3125, -78.9921875, -76.671875, -74.3515625, -72.03125, -69.7109375, -67.390625, -65.0703125, -62.75, -60.4296875, -58.109375, -55.7890625, -53.46875, -51.1484375, -48.828125, -46.5078125, -44.1875, -41.8671875, -39.546875, -37.2265625, -34.90625, -32.5859375, -30.265625, -27.9453125, -25.625, -23.3046875, -20.984375, -18.6640625, -16.34375, -14.0234375, -11.703125, -9.3828125, -7.0625, -4.7421875, -2.421875, -0.1015625, 2.21875, 4.5390625, 6.859375, 9.1796875, 11.5, 13.8203125, 16.140625, 18.4609375, 20.78125, 23.1015625, 25.421875, 27.7421875, 30.0625, 32.3828125, 34.703125, 37.0234375, 39.34375, 41.6640625, 43.984375, 46.3046875, 48.625, 50.9453125, 53.265625, 55.5859375, 57.90625, 60.2265625, 62.546875, 64.8671875, 67.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 21.0, 167.0, 407.0, 329.0, 80.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.73880386352539, -51.657752990722656, -48.57670593261719, -45.49565505981445, -42.41460418701172, -39.333553314208984, -36.25250244140625, -33.17145538330078, -30.090404510498047, -27.009353637695312, -23.92830467224121, -20.84725570678711, -17.766204833984375, -14.685154914855957, -11.604104995727539, -8.523056030273438, -5.442005157470703, -2.360955238342285, 0.7200946807861328, 3.801144599914551, 6.882194519042969, 9.963244438171387, 13.044294357299805, 16.125343322753906, 19.20639419555664, 22.287445068359375, 25.368494033813477, 28.449542999267578, 31.530593872070312, 34.61164474487305, 37.69269561767578, 40.77374267578125, 43.85479736328125, 46.935848236083984, 50.01689910888672, 53.09794616699219, 56.17899703979492, 59.260047912597656, 62.341094970703125, 65.42214965820312, 68.5031967163086, 71.58424377441406, 74.66529846191406, 77.74634552001953, 80.827392578125, 83.908447265625, 86.98949432373047, 90.07054138183594, 93.15159606933594, 96.2326431274414, 99.3136978149414, 102.39474487304688, 105.47579956054688, 108.55684661865234, 111.63789367675781, 114.71894836425781, 117.79999542236328, 120.88104248046875, 123.96209716796875, 127.04314422607422, 130.1241912841797, 133.2052459716797, 136.2863006591797, 139.36734008789062, 142.44839477539062]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 10.0, 12.0, 10.0, 18.0, 16.0, 14.0, 22.0, 24.0, 23.0, 30.0, 35.0, 46.0, 45.0, 37.0, 41.0, 53.0, 37.0, 46.0, 47.0, 41.0, 33.0, 45.0, 30.0, 27.0, 27.0, 23.0, 30.0, 26.0, 19.0, 17.0, 20.0, 15.0, 7.0, 10.0, 6.0, 9.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.62644958496094, -43.326961517333984, -42.027469635009766, -40.72798156738281, -39.428489685058594, -38.12900161743164, -36.82950973510742, -35.53002166748047, -34.23052978515625, -32.9310417175293, -31.631549835205078, -30.332059860229492, -29.032569885253906, -27.733081817626953, -26.433591842651367, -25.13410186767578, -23.834613800048828, -22.535123825073242, -21.235633850097656, -19.93614387512207, -18.636653900146484, -17.33716583251953, -16.037675857543945, -14.73818588256836, -13.438695907592773, -12.139205932617188, -10.839715957641602, -9.540226936340332, -8.240736961364746, -6.94124698638916, -5.641757488250732, -4.342267990112305, -3.0427780151367188, -1.743288278579712, -0.4437985420227051, 0.8556911945343018, 2.1551809310913086, 3.4546709060668945, 4.754160404205322, 6.05364990234375, 7.353139877319336, 8.652629852294922, 9.952119827270508, 11.251608848571777, 12.551098823547363, 13.85058879852295, 15.150077819824219, 16.449567794799805, 17.74905776977539, 19.048547744750977, 20.348037719726562, 21.64752769470215, 22.947017669677734, 24.246505737304688, 25.545995712280273, 26.84548568725586, 28.144975662231445, 29.44446563720703, 30.743955612182617, 32.0434455871582, 33.342933654785156, 34.642425537109375, 35.94191360473633, 37.24140167236328, 38.5408935546875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 3.0, 6.0, 4.0, 10.0, 11.0, 9.0, 21.0, 14.0, 22.0, 23.0, 26.0, 28.0, 29.0, 28.0, 37.0, 25.0, 33.0, 30.0, 39.0, 36.0, 29.0, 40.0, 53.0, 33.0, 48.0, 40.0, 36.0, 43.0, 28.0, 31.0, 23.0, 27.0, 17.0, 23.0, 20.0, 15.0, 15.0, 10.0, 7.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.47955322265625, -4.3145751953125, -4.14959716796875, -3.984619140625, -3.81964111328125, -3.6546630859375, -3.48968505859375, -3.32470703125, -3.15972900390625, -2.9947509765625, -2.82977294921875, -2.664794921875, -2.49981689453125, -2.3348388671875, -2.16986083984375, -2.0048828125, -1.83990478515625, -1.6749267578125, -1.50994873046875, -1.344970703125, -1.17999267578125, -1.0150146484375, -0.85003662109375, -0.68505859375, -0.52008056640625, -0.3551025390625, -0.19012451171875, -0.025146484375, 0.13983154296875, 0.3048095703125, 0.46978759765625, 0.634765625, 0.79974365234375, 0.9647216796875, 1.12969970703125, 1.294677734375, 1.45965576171875, 1.6246337890625, 1.78961181640625, 1.95458984375, 2.11956787109375, 2.2845458984375, 2.44952392578125, 2.614501953125, 2.77947998046875, 2.9444580078125, 3.10943603515625, 3.2744140625, 3.43939208984375, 3.6043701171875, 3.76934814453125, 3.934326171875, 4.09930419921875, 4.2642822265625, 4.42926025390625, 4.59423828125, 4.75921630859375, 4.9241943359375, 5.08917236328125, 5.254150390625, 5.41912841796875, 5.5841064453125, 5.74908447265625, 5.9140625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 3.0, 4.0, 5.0, 8.0, 15.0, 14.0, 22.0, 19.0, 26.0, 36.0, 55.0, 82.0, 104.0, 150.0, 228.0, 402.0, 921.0, 1933.0, 5270.0, 19464.0, 90284.0, 469297.0, 1644777.0, 1475487.0, 387756.0, 73968.0, 15981.0, 4580.0, 1589.0, 722.0, 395.0, 209.0, 122.0, 86.0, 47.0, 46.0, 25.0, 41.0, 15.0, 25.0, 13.0, 13.0, 13.0, 7.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7578125, -8.4747314453125, -8.191650390625, -7.9085693359375, -7.62548828125, -7.3424072265625, -7.059326171875, -6.7762451171875, -6.4931640625, -6.2100830078125, -5.927001953125, -5.6439208984375, -5.36083984375, -5.0777587890625, -4.794677734375, -4.5115966796875, -4.228515625, -3.9454345703125, -3.662353515625, -3.3792724609375, -3.09619140625, -2.8131103515625, -2.530029296875, -2.2469482421875, -1.9638671875, -1.6807861328125, -1.397705078125, -1.1146240234375, -0.83154296875, -0.5484619140625, -0.265380859375, 0.0177001953125, 0.30078125, 0.5838623046875, 0.866943359375, 1.1500244140625, 1.43310546875, 1.7161865234375, 1.999267578125, 2.2823486328125, 2.5654296875, 2.8485107421875, 3.131591796875, 3.4146728515625, 3.69775390625, 3.9808349609375, 4.263916015625, 4.5469970703125, 4.830078125, 5.1131591796875, 5.396240234375, 5.6793212890625, 5.96240234375, 6.2454833984375, 6.528564453125, 6.8116455078125, 7.0947265625, 7.3778076171875, 7.660888671875, 7.9439697265625, 8.22705078125, 8.5101318359375, 8.793212890625, 9.0762939453125, 9.359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 8.0, 15.0, 32.0, 15.0, 30.0, 26.0, 61.0, 50.0, 81.0, 101.0, 128.0, 158.0, 226.0, 243.0, 262.0, 335.0, 336.0, 328.0, 305.0, 285.0, 180.0, 175.0, 152.0, 105.0, 84.0, 56.0, 62.0, 42.0, 37.0, 31.0, 19.0, 15.0, 12.0, 9.0, 5.0, 6.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.0234375, -7.7628173828125, -7.502197265625, -7.2415771484375, -6.98095703125, -6.7203369140625, -6.459716796875, -6.1990966796875, -5.9384765625, -5.6778564453125, -5.417236328125, -5.1566162109375, -4.89599609375, -4.6353759765625, -4.374755859375, -4.1141357421875, -3.853515625, -3.5928955078125, -3.332275390625, -3.0716552734375, -2.81103515625, -2.5504150390625, -2.289794921875, -2.0291748046875, -1.7685546875, -1.5079345703125, -1.247314453125, -0.9866943359375, -0.72607421875, -0.4654541015625, -0.204833984375, 0.0557861328125, 0.31640625, 0.5770263671875, 0.837646484375, 1.0982666015625, 1.35888671875, 1.6195068359375, 1.880126953125, 2.1407470703125, 2.4013671875, 2.6619873046875, 2.922607421875, 3.1832275390625, 3.44384765625, 3.7044677734375, 3.965087890625, 4.2257080078125, 4.486328125, 4.7469482421875, 5.007568359375, 5.2681884765625, 5.52880859375, 5.7894287109375, 6.050048828125, 6.3106689453125, 6.5712890625, 6.8319091796875, 7.092529296875, 7.3531494140625, 7.61376953125, 7.8743896484375, 8.135009765625, 8.3956298828125, 8.65625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 7.0, 1.0, 0.0, 7.0, 8.0, 7.0, 8.0, 6.0, 7.0, 14.0, 20.0, 19.0, 36.0, 39.0, 64.0, 45.0, 69.0, 107.0, 148.0, 211.0, 266.0, 474.0, 2424.0, 98820.0, 3687365.0, 396325.0, 5898.0, 630.0, 355.0, 223.0, 171.0, 116.0, 87.0, 77.0, 55.0, 38.0, 27.0, 18.0, 26.0, 21.0, 11.0, 4.0, 12.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-40.3125, -39.14892578125, -37.9853515625, -36.82177734375, -35.658203125, -34.49462890625, -33.3310546875, -32.16748046875, -31.00390625, -29.84033203125, -28.6767578125, -27.51318359375, -26.349609375, -25.18603515625, -24.0224609375, -22.85888671875, -21.6953125, -20.53173828125, -19.3681640625, -18.20458984375, -17.041015625, -15.87744140625, -14.7138671875, -13.55029296875, -12.38671875, -11.22314453125, -10.0595703125, -8.89599609375, -7.732421875, -6.56884765625, -5.4052734375, -4.24169921875, -3.078125, -1.91455078125, -0.7509765625, 0.41259765625, 1.576171875, 2.73974609375, 3.9033203125, 5.06689453125, 6.23046875, 7.39404296875, 8.5576171875, 9.72119140625, 10.884765625, 12.04833984375, 13.2119140625, 14.37548828125, 15.5390625, 16.70263671875, 17.8662109375, 19.02978515625, 20.193359375, 21.35693359375, 22.5205078125, 23.68408203125, 24.84765625, 26.01123046875, 27.1748046875, 28.33837890625, 29.501953125, 30.66552734375, 31.8291015625, 32.99267578125, 34.15625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 12.0, 10.0, 38.0, 71.0, 147.0, 148.0, 185.0, 167.0, 106.0, 59.0, 41.0, 20.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.710391998291016, -42.2735481262207, -39.83670425415039, -37.39986038208008, -34.963016510009766, -32.52617263793945, -30.089326858520508, -27.652482986450195, -25.215639114379883, -22.77879524230957, -20.341951370239258, -17.905105590820312, -15.468262672424316, -13.031418800354004, -10.594573974609375, -8.157730102539062, -5.72088623046875, -3.2840421199798584, -0.8471980094909668, 1.589646339416504, 4.026490211486816, 6.463334083557129, 8.900178909301758, 11.33702278137207, 13.773866653442383, 16.210710525512695, 18.647554397583008, 21.084400177001953, 23.521244049072266, 25.958087921142578, 28.39493179321289, 30.831775665283203, 33.26861572265625, 35.70545959472656, 38.142303466796875, 40.57914733886719, 43.0159912109375, 45.45283508300781, 47.889678955078125, 50.32652282714844, 52.76336669921875, 55.20021057128906, 57.637054443359375, 60.07389831542969, 62.5107421875, 64.94758605957031, 67.38442993164062, 69.82127380371094, 72.25811767578125, 74.69496154785156, 77.13180541992188, 79.56864929199219, 82.0054931640625, 84.44233703613281, 86.87918090820312, 89.31602478027344, 91.75287628173828, 94.1897201538086, 96.6265640258789, 99.06340789794922, 101.50025177001953, 103.93709564208984, 106.37393951416016, 108.81078338623047, 111.24762725830078]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 2.0, 2.0, 7.0, 7.0, 12.0, 11.0, 16.0, 18.0, 18.0, 22.0, 26.0, 20.0, 23.0, 39.0, 41.0, 22.0, 41.0, 37.0, 24.0, 54.0, 46.0, 41.0, 36.0, 46.0, 28.0, 42.0, 35.0, 33.0, 32.0, 30.0, 32.0, 30.0, 19.0, 9.0, 15.0, 12.0, 13.0, 13.0, 7.0, 8.0, 6.0, 1.0, 13.0, 1.0, 2.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.08102798461914, -32.02484130859375, -30.96865463256836, -29.9124698638916, -28.85628318786621, -27.80009651184082, -26.743911743164062, -25.687725067138672, -24.63153839111328, -23.57535171508789, -22.5191650390625, -21.462980270385742, -20.40679359436035, -19.35060691833496, -18.294422149658203, -17.238235473632812, -16.182048797607422, -15.125862121582031, -14.069676399230957, -13.013490676879883, -11.957304000854492, -10.901117324829102, -9.844931602478027, -8.788745880126953, -7.7325592041015625, -6.67637300491333, -5.620186805725098, -4.564000606536865, -3.507814407348633, -2.4516282081604004, -1.395442008972168, -0.33925580978393555, 0.7169342041015625, 1.773120403289795, 2.8293066024780273, 3.8854928016662598, 4.941679000854492, 5.997865200042725, 7.054051399230957, 8.110237121582031, 9.166423797607422, 10.222610473632812, 11.278796195983887, 12.334981918334961, 13.391168594360352, 14.447355270385742, 15.503540992736816, 16.55972671508789, 17.61591339111328, 18.672100067138672, 19.728286743164062, 20.78447151184082, 21.84065818786621, 22.8968448638916, 23.95302963256836, 25.00921630859375, 26.06540298461914, 27.12158966064453, 28.177776336669922, 29.23396110534668, 30.29014778137207, 31.34633445739746, 32.40251922607422, 33.45870590209961, 34.514892578125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 10.0, 8.0, 14.0, 16.0, 15.0, 21.0, 38.0, 27.0, 22.0, 34.0, 29.0, 27.0, 37.0, 29.0, 52.0, 45.0, 49.0, 30.0, 43.0, 47.0, 36.0, 40.0, 38.0, 32.0, 38.0, 21.0, 22.0, 20.0, 21.0, 22.0, 19.0, 16.0, 18.0, 5.0, 10.0, 5.0, 6.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.14453125, -4.98516845703125, -4.8258056640625, -4.66644287109375, -4.507080078125, -4.34771728515625, -4.1883544921875, -4.02899169921875, -3.86962890625, -3.71026611328125, -3.5509033203125, -3.39154052734375, -3.232177734375, -3.07281494140625, -2.9134521484375, -2.75408935546875, -2.5947265625, -2.43536376953125, -2.2760009765625, -2.11663818359375, -1.957275390625, -1.79791259765625, -1.6385498046875, -1.47918701171875, -1.31982421875, -1.16046142578125, -1.0010986328125, -0.84173583984375, -0.682373046875, -0.52301025390625, -0.3636474609375, -0.20428466796875, -0.044921875, 0.11444091796875, 0.2738037109375, 0.43316650390625, 0.592529296875, 0.75189208984375, 0.9112548828125, 1.07061767578125, 1.22998046875, 1.38934326171875, 1.5487060546875, 1.70806884765625, 1.867431640625, 2.02679443359375, 2.1861572265625, 2.34552001953125, 2.5048828125, 2.66424560546875, 2.8236083984375, 2.98297119140625, 3.142333984375, 3.30169677734375, 3.4610595703125, 3.62042236328125, 3.77978515625, 3.93914794921875, 4.0985107421875, 4.25787353515625, 4.417236328125, 4.57659912109375, 4.7359619140625, 4.89532470703125, 5.0546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 0.0, 3.0, 12.0, 8.0, 16.0, 26.0, 37.0, 65.0, 101.0, 140.0, 199.0, 303.0, 452.0, 627.0, 1002.0, 1390.0, 2094.0, 3158.0, 4713.0, 7334.0, 11264.0, 17463.0, 27310.0, 43109.0, 66466.0, 98722.0, 136948.0, 162226.0, 146082.0, 108647.0, 73373.0, 48348.0, 30792.0, 19478.0, 12486.0, 8152.0, 5311.0, 3455.0, 2307.0, 1618.0, 1081.0, 706.0, 505.0, 362.0, 204.0, 141.0, 118.0, 73.0, 49.0, 27.0, 22.0, 16.0, 11.0, 7.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.7314453125, -0.7096939086914062, -0.6879425048828125, -0.6661911010742188, -0.644439697265625, -0.6226882934570312, -0.6009368896484375, -0.5791854858398438, -0.55743408203125, -0.5356826782226562, -0.5139312744140625, -0.49217987060546875, -0.470428466796875, -0.44867706298828125, -0.4269256591796875, -0.40517425537109375, -0.3834228515625, -0.36167144775390625, -0.3399200439453125, -0.31816864013671875, -0.296417236328125, -0.27466583251953125, -0.2529144287109375, -0.23116302490234375, -0.20941162109375, -0.18766021728515625, -0.1659088134765625, -0.14415740966796875, -0.122406005859375, -0.10065460205078125, -0.0789031982421875, -0.05715179443359375, -0.035400390625, -0.01364898681640625, 0.0081024169921875, 0.02985382080078125, 0.051605224609375, 0.07335662841796875, 0.0951080322265625, 0.11685943603515625, 0.13861083984375, 0.16036224365234375, 0.1821136474609375, 0.20386505126953125, 0.225616455078125, 0.24736785888671875, 0.2691192626953125, 0.29087066650390625, 0.3126220703125, 0.33437347412109375, 0.3561248779296875, 0.37787628173828125, 0.399627685546875, 0.42137908935546875, 0.4431304931640625, 0.46488189697265625, 0.48663330078125, 0.5083847045898438, 0.5301361083984375, 0.5518875122070312, 0.573638916015625, 0.5953903198242188, 0.6171417236328125, 0.6388931274414062, 0.66064453125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 5.0, 8.0, 13.0, 16.0, 12.0, 24.0, 13.0, 22.0, 16.0, 33.0, 21.0, 25.0, 34.0, 33.0, 31.0, 33.0, 36.0, 29.0, 33.0, 45.0, 1064.0, 36.0, 27.0, 44.0, 30.0, 35.0, 33.0, 35.0, 33.0, 30.0, 14.0, 17.0, 20.0, 15.0, 16.0, 8.0, 13.0, 12.0, 9.0, 11.0, 7.0, 8.0, 2.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.13671875, -3.036346435546875, -2.93597412109375, -2.835601806640625, -2.7352294921875, -2.634857177734375, -2.53448486328125, -2.434112548828125, -2.333740234375, -2.233367919921875, -2.13299560546875, -2.032623291015625, -1.9322509765625, -1.831878662109375, -1.73150634765625, -1.631134033203125, -1.53076171875, -1.430389404296875, -1.33001708984375, -1.229644775390625, -1.1292724609375, -1.028900146484375, -0.92852783203125, -0.828155517578125, -0.727783203125, -0.627410888671875, -0.52703857421875, -0.426666259765625, -0.3262939453125, -0.225921630859375, -0.12554931640625, -0.025177001953125, 0.0751953125, 0.175567626953125, 0.27593994140625, 0.376312255859375, 0.4766845703125, 0.577056884765625, 0.67742919921875, 0.777801513671875, 0.878173828125, 0.978546142578125, 1.07891845703125, 1.179290771484375, 1.2796630859375, 1.380035400390625, 1.48040771484375, 1.580780029296875, 1.68115234375, 1.781524658203125, 1.88189697265625, 1.982269287109375, 2.0826416015625, 2.183013916015625, 2.28338623046875, 2.383758544921875, 2.484130859375, 2.584503173828125, 2.68487548828125, 2.785247802734375, 2.8856201171875, 2.985992431640625, 3.08636474609375, 3.186737060546875, 3.287109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 11.0, 10.0, 17.0, 31.0, 28.0, 47.0, 83.0, 124.0, 201.0, 317.0, 436.0, 741.0, 1091.0, 1746.0, 2615.0, 4074.0, 6364.0, 9828.0, 15004.0, 23350.0, 35615.0, 54510.0, 80967.0, 113787.0, 182959.0, 1156918.0, 127048.0, 93837.0, 64233.0, 42295.0, 27663.0, 17959.0, 11602.0, 7440.0, 4949.0, 3284.0, 2072.0, 1393.0, 830.0, 559.0, 385.0, 246.0, 165.0, 108.0, 62.0, 35.0, 34.0, 21.0, 15.0, 9.0, 7.0, 4.0, 4.0, 2.0], "bins": [-0.448486328125, -0.4357452392578125, -0.423004150390625, -0.4102630615234375, -0.39752197265625, -0.3847808837890625, -0.372039794921875, -0.3592987060546875, -0.3465576171875, -0.3338165283203125, -0.321075439453125, -0.3083343505859375, -0.29559326171875, -0.2828521728515625, -0.270111083984375, -0.2573699951171875, -0.24462890625, -0.2318878173828125, -0.219146728515625, -0.2064056396484375, -0.19366455078125, -0.1809234619140625, -0.168182373046875, -0.1554412841796875, -0.1427001953125, -0.1299591064453125, -0.117218017578125, -0.1044769287109375, -0.09173583984375, -0.0789947509765625, -0.066253662109375, -0.0535125732421875, -0.040771484375, -0.0280303955078125, -0.015289306640625, -0.0025482177734375, 0.01019287109375, 0.0229339599609375, 0.035675048828125, 0.0484161376953125, 0.0611572265625, 0.0738983154296875, 0.086639404296875, 0.0993804931640625, 0.11212158203125, 0.1248626708984375, 0.137603759765625, 0.1503448486328125, 0.1630859375, 0.1758270263671875, 0.188568115234375, 0.2013092041015625, 0.21405029296875, 0.2267913818359375, 0.239532470703125, 0.2522735595703125, 0.2650146484375, 0.2777557373046875, 0.290496826171875, 0.3032379150390625, 0.31597900390625, 0.3287200927734375, 0.341461181640625, 0.3542022705078125, 0.366943359375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 12.0, 12.0, 15.0, 21.0, 30.0, 54.0, 65.0, 83.0, 90.0, 139.0, 91.0, 80.0, 63.0, 65.0, 45.0, 39.0, 19.0, 9.0, 13.0, 12.0, 7.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02984619140625, -0.02893662452697754, -0.028027057647705078, -0.027117490768432617, -0.026207923889160156, -0.025298357009887695, -0.024388790130615234, -0.023479223251342773, -0.022569656372070312, -0.02166008949279785, -0.02075052261352539, -0.01984095573425293, -0.01893138885498047, -0.018021821975708008, -0.017112255096435547, -0.016202688217163086, -0.015293121337890625, -0.014383554458618164, -0.013473987579345703, -0.012564420700073242, -0.011654853820800781, -0.01074528694152832, -0.00983572006225586, -0.008926153182983398, -0.008016586303710938, -0.0071070194244384766, -0.006197452545166016, -0.005287885665893555, -0.004378318786621094, -0.003468751907348633, -0.002559185028076172, -0.001649618148803711, -0.00074005126953125, 0.00016951560974121094, 0.0010790824890136719, 0.001988649368286133, 0.0028982162475585938, 0.0038077831268310547, 0.004717350006103516, 0.0056269168853759766, 0.0065364837646484375, 0.0074460506439208984, 0.00835561752319336, 0.00926518440246582, 0.010174751281738281, 0.011084318161010742, 0.011993885040283203, 0.012903451919555664, 0.013813018798828125, 0.014722585678100586, 0.015632152557373047, 0.016541719436645508, 0.01745128631591797, 0.01836085319519043, 0.01927042007446289, 0.02017998695373535, 0.021089553833007812, 0.021999120712280273, 0.022908687591552734, 0.023818254470825195, 0.024727821350097656, 0.025637388229370117, 0.026546955108642578, 0.02745652198791504, 0.0283660888671875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 10.0, 14.0, 18.0, 21.0, 28.0, 62.0, 81.0, 147.0, 232.0, 555.0, 18333.0, 1027104.0, 1123.0, 356.0, 154.0, 92.0, 68.0, 36.0, 30.0, 18.0, 10.0, 16.0, 10.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5288848876953125, -0.511383056640625, -0.4938812255859375, -0.47637939453125, -0.4588775634765625, -0.441375732421875, -0.4238739013671875, -0.4063720703125, -0.3888702392578125, -0.371368408203125, -0.3538665771484375, -0.33636474609375, -0.3188629150390625, -0.301361083984375, -0.2838592529296875, -0.266357421875, -0.2488555908203125, -0.231353759765625, -0.2138519287109375, -0.19635009765625, -0.1788482666015625, -0.161346435546875, -0.1438446044921875, -0.1263427734375, -0.1088409423828125, -0.091339111328125, -0.0738372802734375, -0.05633544921875, -0.0388336181640625, -0.021331787109375, -0.0038299560546875, 0.013671875, 0.0311737060546875, 0.048675537109375, 0.0661773681640625, 0.08367919921875, 0.1011810302734375, 0.118682861328125, 0.1361846923828125, 0.1536865234375, 0.1711883544921875, 0.188690185546875, 0.2061920166015625, 0.22369384765625, 0.2411956787109375, 0.258697509765625, 0.2761993408203125, 0.293701171875, 0.3112030029296875, 0.328704833984375, 0.3462066650390625, 0.36370849609375, 0.3812103271484375, 0.398712158203125, 0.4162139892578125, 0.4337158203125, 0.4512176513671875, 0.468719482421875, 0.4862213134765625, 0.50372314453125, 0.5212249755859375, 0.538726806640625, 0.5562286376953125, 0.57373046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 143.0, 851.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13320964574813843, -0.12697333097457886, -0.12073702365159988, -0.11450071632862091, -0.10826440900564194, -0.10202810168266296, -0.0957917869091034, -0.08955547958612442, -0.08331917226314545, -0.07708286494016647, -0.0708465501666069, -0.06461024284362793, -0.058373935520648956, -0.052137624472379684, -0.04590131342411041, -0.03966500610113144, -0.03342869132757187, -0.027192382141947746, -0.020956072956323624, -0.014719761908054352, -0.00848345272243023, -0.0022471435368061066, 0.003989167511463165, 0.010225474834442139, 0.01646178588271141, 0.022698095068335533, 0.028934404253959656, 0.03517071530222893, 0.0414070263504982, 0.04764333367347717, 0.053879644721746445, 0.06011595204472542, 0.06635226309299469, 0.07258857041597366, 0.07882488518953323, 0.08506119251251221, 0.09129749983549118, 0.09753380715847015, 0.10377012193202972, 0.1100064292550087, 0.11624273657798767, 0.12247904390096664, 0.12871535122394562, 0.1349516659975052, 0.14118798077106476, 0.14742428064346313, 0.1536605954170227, 0.15989691019058228, 0.16613322496414185, 0.17236953973770142, 0.1786058396100998, 0.18484215438365936, 0.19107846915721893, 0.1973147690296173, 0.20355108380317688, 0.20978739857673645, 0.21602369844913483, 0.2222600132226944, 0.22849631309509277, 0.23473262786865234, 0.24096894264221191, 0.2472052425146103, 0.25344157218933105, 0.25967785716056824, 0.2659141719341278]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 10.0, 8.0, 10.0, 19.0, 17.0, 15.0, 24.0, 30.0, 41.0, 33.0, 25.0, 35.0, 38.0, 44.0, 49.0, 33.0, 45.0, 32.0, 42.0, 45.0, 45.0, 33.0, 34.0, 37.0, 32.0, 27.0, 20.0, 15.0, 17.0, 18.0, 16.0, 13.0, 12.0, 13.0, 7.0, 9.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.026247084140777588, -0.02541860193014145, -0.02459011971950531, -0.02376163750886917, -0.022933155298233032, -0.022104673087596893, -0.021276190876960754, -0.020447708666324615, -0.019619226455688477, -0.018790744245052338, -0.0179622620344162, -0.01713377982378006, -0.01630529761314392, -0.015476815402507782, -0.014648333191871643, -0.013819850981235504, -0.012991368770599365, -0.012162886559963226, -0.011334404349327087, -0.010505922138690948, -0.00967743992805481, -0.00884895771741867, -0.008020475506782532, -0.007191993296146393, -0.006363511085510254, -0.005535028874874115, -0.004706546664237976, -0.003878064453601837, -0.0030495822429656982, -0.0022211000323295593, -0.0013926178216934204, -0.0005641356110572815, 0.0002643465995788574, 0.0010928288102149963, 0.0019213110208511353, 0.002749793231487274, 0.003578275442123413, 0.004406757652759552, 0.005235239863395691, 0.00606372207403183, 0.006892204284667969, 0.007720686495304108, 0.008549168705940247, 0.009377650916576385, 0.010206133127212524, 0.011034615337848663, 0.011863097548484802, 0.012691579759120941, 0.01352006196975708, 0.014348544180393219, 0.015177026391029358, 0.016005508601665497, 0.016833990812301636, 0.017662473022937775, 0.018490955233573914, 0.019319437444210052, 0.02014791965484619, 0.02097640186548233, 0.02180488407611847, 0.022633366286754608, 0.023461848497390747, 0.024290330708026886, 0.025118812918663025, 0.025947295129299164, 0.026775777339935303]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 10.0, 8.0, 14.0, 16.0, 15.0, 21.0, 37.0, 29.0, 21.0, 34.0, 29.0, 27.0, 37.0, 28.0, 53.0, 45.0, 49.0, 30.0, 43.0, 48.0, 34.0, 41.0, 39.0, 31.0, 38.0, 21.0, 22.0, 20.0, 21.0, 22.0, 18.0, 17.0, 18.0, 5.0, 10.0, 5.0, 6.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.14453125, -4.98516845703125, -4.8258056640625, -4.66644287109375, -4.507080078125, -4.34771728515625, -4.1883544921875, -4.02899169921875, -3.86962890625, -3.71026611328125, -3.5509033203125, -3.39154052734375, -3.232177734375, -3.07281494140625, -2.9134521484375, -2.75408935546875, -2.5947265625, -2.43536376953125, -2.2760009765625, -2.11663818359375, -1.957275390625, -1.79791259765625, -1.6385498046875, -1.47918701171875, -1.31982421875, -1.16046142578125, -1.0010986328125, -0.84173583984375, -0.682373046875, -0.52301025390625, -0.3636474609375, -0.20428466796875, -0.044921875, 0.11444091796875, 0.2738037109375, 0.43316650390625, 0.592529296875, 0.75189208984375, 0.9112548828125, 1.07061767578125, 1.22998046875, 1.38934326171875, 1.5487060546875, 1.70806884765625, 1.867431640625, 2.02679443359375, 2.1861572265625, 2.34552001953125, 2.5048828125, 2.66424560546875, 2.8236083984375, 2.98297119140625, 3.142333984375, 3.30169677734375, 3.4610595703125, 3.62042236328125, 3.77978515625, 3.93914794921875, 4.0985107421875, 4.25787353515625, 4.417236328125, 4.57659912109375, 4.7359619140625, 4.89532470703125, 5.0546875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 5.0, 5.0, 8.0, 12.0, 21.0, 30.0, 19.0, 39.0, 58.0, 84.0, 140.0, 248.0, 427.0, 692.0, 1357.0, 2244.0, 3888.0, 6784.0, 11970.0, 20995.0, 41175.0, 92329.0, 217934.0, 327716.0, 172828.0, 72374.0, 33395.0, 17749.0, 10085.0, 5820.0, 3435.0, 1938.0, 1075.0, 627.0, 388.0, 244.0, 148.0, 79.0, 47.0, 36.0, 28.0, 19.0, 9.0, 14.0, 12.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.6875, -4.53802490234375, -4.3885498046875, -4.23907470703125, -4.089599609375, -3.94012451171875, -3.7906494140625, -3.64117431640625, -3.49169921875, -3.34222412109375, -3.1927490234375, -3.04327392578125, -2.893798828125, -2.74432373046875, -2.5948486328125, -2.44537353515625, -2.2958984375, -2.14642333984375, -1.9969482421875, -1.84747314453125, -1.697998046875, -1.54852294921875, -1.3990478515625, -1.24957275390625, -1.10009765625, -0.95062255859375, -0.8011474609375, -0.65167236328125, -0.502197265625, -0.35272216796875, -0.2032470703125, -0.05377197265625, 0.095703125, 0.24517822265625, 0.3946533203125, 0.54412841796875, 0.693603515625, 0.84307861328125, 0.9925537109375, 1.14202880859375, 1.29150390625, 1.44097900390625, 1.5904541015625, 1.73992919921875, 1.889404296875, 2.03887939453125, 2.1883544921875, 2.33782958984375, 2.4873046875, 2.63677978515625, 2.7862548828125, 2.93572998046875, 3.085205078125, 3.23468017578125, 3.3841552734375, 3.53363037109375, 3.68310546875, 3.83258056640625, 3.9820556640625, 4.13153076171875, 4.281005859375, 4.43048095703125, 4.5799560546875, 4.72943115234375, 4.87890625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 12.0, 12.0, 14.0, 13.0, 19.0, 32.0, 27.0, 36.0, 23.0, 30.0, 38.0, 50.0, 64.0, 79.0, 119.0, 255.0, 1416.0, 218.0, 119.0, 74.0, 48.0, 46.0, 41.0, 28.0, 33.0, 39.0, 28.0, 20.0, 24.0, 12.0, 12.0, 16.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.125, -17.56591796875, -17.0068359375, -16.44775390625, -15.888671875, -15.32958984375, -14.7705078125, -14.21142578125, -13.65234375, -13.09326171875, -12.5341796875, -11.97509765625, -11.416015625, -10.85693359375, -10.2978515625, -9.73876953125, -9.1796875, -8.62060546875, -8.0615234375, -7.50244140625, -6.943359375, -6.38427734375, -5.8251953125, -5.26611328125, -4.70703125, -4.14794921875, -3.5888671875, -3.02978515625, -2.470703125, -1.91162109375, -1.3525390625, -0.79345703125, -0.234375, 0.32470703125, 0.8837890625, 1.44287109375, 2.001953125, 2.56103515625, 3.1201171875, 3.67919921875, 4.23828125, 4.79736328125, 5.3564453125, 5.91552734375, 6.474609375, 7.03369140625, 7.5927734375, 8.15185546875, 8.7109375, 9.27001953125, 9.8291015625, 10.38818359375, 10.947265625, 11.50634765625, 12.0654296875, 12.62451171875, 13.18359375, 13.74267578125, 14.3017578125, 14.86083984375, 15.419921875, 15.97900390625, 16.5380859375, 17.09716796875, 17.65625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 9.0, 5.0, 10.0, 15.0, 24.0, 32.0, 42.0, 38.0, 62.0, 70.0, 86.0, 112.0, 132.0, 177.0, 308.0, 571.0, 1810.0, 28399.0, 2916325.0, 190729.0, 4549.0, 811.0, 363.0, 253.0, 180.0, 136.0, 83.0, 84.0, 50.0, 50.0, 34.0, 28.0, 20.0, 21.0, 19.0, 11.0, 6.0, 8.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.96875, -39.6767578125, -38.384765625, -37.0927734375, -35.80078125, -34.5087890625, -33.216796875, -31.9248046875, -30.6328125, -29.3408203125, -28.048828125, -26.7568359375, -25.46484375, -24.1728515625, -22.880859375, -21.5888671875, -20.296875, -19.0048828125, -17.712890625, -16.4208984375, -15.12890625, -13.8369140625, -12.544921875, -11.2529296875, -9.9609375, -8.6689453125, -7.376953125, -6.0849609375, -4.79296875, -3.5009765625, -2.208984375, -0.9169921875, 0.375, 1.6669921875, 2.958984375, 4.2509765625, 5.54296875, 6.8349609375, 8.126953125, 9.4189453125, 10.7109375, 12.0029296875, 13.294921875, 14.5869140625, 15.87890625, 17.1708984375, 18.462890625, 19.7548828125, 21.046875, 22.3388671875, 23.630859375, 24.9228515625, 26.21484375, 27.5068359375, 28.798828125, 30.0908203125, 31.3828125, 32.6748046875, 33.966796875, 35.2587890625, 36.55078125, 37.8427734375, 39.134765625, 40.4267578125, 41.71875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 108.0, 850.0, 54.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.984949111938477, -19.899105072021484, -11.813262939453125, -3.727418899536133, 4.358423233032227, 12.444265365600586, 20.53011131286621, 28.61595344543457, 36.70179748535156, 44.78763961791992, 52.87348175048828, 60.959327697753906, 69.045166015625, 77.13101196289062, 85.21685791015625, 93.30270385742188, 101.38854217529297, 109.4743881225586, 117.56022644042969, 125.64607238769531, 133.73191833496094, 141.8177490234375, 149.90359497070312, 157.98944091796875, 166.07528686523438, 174.1611328125, 182.24697875976562, 190.33282470703125, 198.4186553955078, 206.50450134277344, 214.59034729003906, 222.6761932373047, 230.76202392578125, 238.84786987304688, 246.9337158203125, 255.01956176757812, 263.10540771484375, 271.19122314453125, 279.277099609375, 287.3629150390625, 295.4487609863281, 303.53460693359375, 311.6204528808594, 319.706298828125, 327.7921447753906, 335.87799072265625, 343.96380615234375, 352.0496520996094, 360.135498046875, 368.2213439941406, 376.30718994140625, 384.3930358886719, 392.4788818359375, 400.564697265625, 408.65057373046875, 416.73638916015625, 424.822265625, 432.9081115722656, 440.99395751953125, 449.0798034667969, 457.1656494140625, 465.25146484375, 473.33734130859375, 481.42315673828125, 489.5090026855469]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 5.0, 5.0, 13.0, 15.0, 8.0, 6.0, 19.0, 27.0, 19.0, 29.0, 27.0, 26.0, 35.0, 38.0, 30.0, 32.0, 48.0, 45.0, 40.0, 41.0, 47.0, 43.0, 44.0, 30.0, 33.0, 38.0, 28.0, 33.0, 24.0, 33.0, 26.0, 19.0, 11.0, 15.0, 15.0, 10.0, 8.0, 9.0, 7.0, 1.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.271949768066406, -43.83234786987305, -42.39274597167969, -40.953147888183594, -39.513545989990234, -38.073944091796875, -36.63434600830078, -35.19474411010742, -33.75514221191406, -32.3155403137207, -30.875940322875977, -29.43634033203125, -27.99673843383789, -26.55713653564453, -25.117536544799805, -23.677936553955078, -22.23833465576172, -20.79873275756836, -19.359132766723633, -17.919532775878906, -16.479930877685547, -15.040329933166504, -13.600728988647461, -12.161128044128418, -10.721527099609375, -9.281926155090332, -7.842325210571289, -6.402724266052246, -4.963123321533203, -3.52352237701416, -2.083921432495117, -0.6443204879760742, 0.7952804565429688, 2.2348814010620117, 3.6744823455810547, 5.114083290100098, 6.553684234619141, 7.993285179138184, 9.432886123657227, 10.87248706817627, 12.312088012695312, 13.751688957214355, 15.191289901733398, 16.630889892578125, 18.070491790771484, 19.510093688964844, 20.94969367980957, 22.389293670654297, 23.828895568847656, 25.268497467041016, 26.708097457885742, 28.14769744873047, 29.587299346923828, 31.026901245117188, 32.46649932861328, 33.90610122680664, 35.345703125, 36.78530502319336, 38.22490692138672, 39.66450500488281, 41.10410690307617, 42.54370880126953, 43.983306884765625, 45.422908782958984, 46.862510681152344]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 5.0, 7.0, 2.0, 7.0, 10.0, 13.0, 11.0, 10.0, 18.0, 20.0, 32.0, 25.0, 21.0, 36.0, 30.0, 32.0, 19.0, 39.0, 41.0, 42.0, 39.0, 42.0, 36.0, 38.0, 43.0, 27.0, 24.0, 42.0, 26.0, 28.0, 31.0, 26.0, 27.0, 25.0, 23.0, 24.0, 14.0, 9.0, 6.0, 8.0, 5.0, 11.0, 2.0, 2.0, 3.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.01953125, -4.85662841796875, -4.6937255859375, -4.53082275390625, -4.367919921875, -4.20501708984375, -4.0421142578125, -3.87921142578125, -3.71630859375, -3.55340576171875, -3.3905029296875, -3.22760009765625, -3.064697265625, -2.90179443359375, -2.7388916015625, -2.57598876953125, -2.4130859375, -2.25018310546875, -2.0872802734375, -1.92437744140625, -1.761474609375, -1.59857177734375, -1.4356689453125, -1.27276611328125, -1.10986328125, -0.94696044921875, -0.7840576171875, -0.62115478515625, -0.458251953125, -0.29534912109375, -0.1324462890625, 0.03045654296875, 0.193359375, 0.35626220703125, 0.5191650390625, 0.68206787109375, 0.844970703125, 1.00787353515625, 1.1707763671875, 1.33367919921875, 1.49658203125, 1.65948486328125, 1.8223876953125, 1.98529052734375, 2.148193359375, 2.31109619140625, 2.4739990234375, 2.63690185546875, 2.7998046875, 2.96270751953125, 3.1256103515625, 3.28851318359375, 3.451416015625, 3.61431884765625, 3.7772216796875, 3.94012451171875, 4.10302734375, 4.26593017578125, 4.4288330078125, 4.59173583984375, 4.754638671875, 4.91754150390625, 5.0804443359375, 5.24334716796875, 5.40625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 24.0, 25.0, 26.0, 34.0, 38.0, 63.0, 95.0, 131.0, 219.0, 351.0, 773.0, 2164.0, 7150.0, 35317.0, 235092.0, 1412589.0, 1984116.0, 436904.0, 62766.0, 11410.0, 2843.0, 904.0, 444.0, 248.0, 146.0, 99.0, 52.0, 46.0, 41.0, 29.0, 27.0, 14.0, 15.0, 16.0, 11.0, 5.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.7578125, -11.4031982421875, -11.048583984375, -10.6939697265625, -10.33935546875, -9.9847412109375, -9.630126953125, -9.2755126953125, -8.9208984375, -8.5662841796875, -8.211669921875, -7.8570556640625, -7.50244140625, -7.1478271484375, -6.793212890625, -6.4385986328125, -6.083984375, -5.7293701171875, -5.374755859375, -5.0201416015625, -4.66552734375, -4.3109130859375, -3.956298828125, -3.6016845703125, -3.2470703125, -2.8924560546875, -2.537841796875, -2.1832275390625, -1.82861328125, -1.4739990234375, -1.119384765625, -0.7647705078125, -0.41015625, -0.0555419921875, 0.299072265625, 0.6536865234375, 1.00830078125, 1.3629150390625, 1.717529296875, 2.0721435546875, 2.4267578125, 2.7813720703125, 3.135986328125, 3.4906005859375, 3.84521484375, 4.1998291015625, 4.554443359375, 4.9090576171875, 5.263671875, 5.6182861328125, 5.972900390625, 6.3275146484375, 6.68212890625, 7.0367431640625, 7.391357421875, 7.7459716796875, 8.1005859375, 8.4552001953125, 8.809814453125, 9.1644287109375, 9.51904296875, 9.8736572265625, 10.228271484375, 10.5828857421875, 10.9375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 10.0, 16.0, 15.0, 20.0, 34.0, 34.0, 65.0, 107.0, 137.0, 176.0, 235.0, 353.0, 453.0, 488.0, 461.0, 381.0, 287.0, 205.0, 152.0, 108.0, 95.0, 62.0, 50.0, 42.0, 18.0, 16.0, 18.0, 7.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.4287109375, -10.052734375, -9.6767578125, -9.30078125, -8.9248046875, -8.548828125, -8.1728515625, -7.796875, -7.4208984375, -7.044921875, -6.6689453125, -6.29296875, -5.9169921875, -5.541015625, -5.1650390625, -4.7890625, -4.4130859375, -4.037109375, -3.6611328125, -3.28515625, -2.9091796875, -2.533203125, -2.1572265625, -1.78125, -1.4052734375, -1.029296875, -0.6533203125, -0.27734375, 0.0986328125, 0.474609375, 0.8505859375, 1.2265625, 1.6025390625, 1.978515625, 2.3544921875, 2.73046875, 3.1064453125, 3.482421875, 3.8583984375, 4.234375, 4.6103515625, 4.986328125, 5.3623046875, 5.73828125, 6.1142578125, 6.490234375, 6.8662109375, 7.2421875, 7.6181640625, 7.994140625, 8.3701171875, 8.74609375, 9.1220703125, 9.498046875, 9.8740234375, 10.25, 10.6259765625, 11.001953125, 11.3779296875, 11.75390625, 12.1298828125, 12.505859375, 12.8818359375, 13.2578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 17.0, 16.0, 23.0, 43.0, 51.0, 78.0, 81.0, 139.0, 163.0, 293.0, 518.0, 2842.0, 528621.0, 3642724.0, 16765.0, 828.0, 363.0, 226.0, 144.0, 106.0, 72.0, 36.0, 34.0, 25.0, 11.0, 15.0, 9.0, 10.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.78125, -55.12158203125, -53.4619140625, -51.80224609375, -50.142578125, -48.48291015625, -46.8232421875, -45.16357421875, -43.50390625, -41.84423828125, -40.1845703125, -38.52490234375, -36.865234375, -35.20556640625, -33.5458984375, -31.88623046875, -30.2265625, -28.56689453125, -26.9072265625, -25.24755859375, -23.587890625, -21.92822265625, -20.2685546875, -18.60888671875, -16.94921875, -15.28955078125, -13.6298828125, -11.97021484375, -10.310546875, -8.65087890625, -6.9912109375, -5.33154296875, -3.671875, -2.01220703125, -0.3525390625, 1.30712890625, 2.966796875, 4.62646484375, 6.2861328125, 7.94580078125, 9.60546875, 11.26513671875, 12.9248046875, 14.58447265625, 16.244140625, 17.90380859375, 19.5634765625, 21.22314453125, 22.8828125, 24.54248046875, 26.2021484375, 27.86181640625, 29.521484375, 31.18115234375, 32.8408203125, 34.50048828125, 36.16015625, 37.81982421875, 39.4794921875, 41.13916015625, 42.798828125, 44.45849609375, 46.1181640625, 47.77783203125, 49.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 15.0, 66.0, 131.0, 249.0, 274.0, 176.0, 71.0, 24.0, 8.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.85260009765625, -65.97642517089844, -62.100250244140625, -58.22407531738281, -54.347900390625, -50.47172546386719, -46.595550537109375, -42.71937561035156, -38.84320068359375, -34.96702575683594, -31.090850830078125, -27.214675903320312, -23.3385009765625, -19.46232795715332, -15.586153030395508, -11.709978103637695, -7.833805084228516, -3.9576303958892822, -0.08145570755004883, 3.7947187423706055, 7.670893669128418, 11.547067642211914, 15.423242568969727, 19.29941749572754, 23.17559242248535, 27.051767349243164, 30.927942276000977, 34.804115295410156, 38.68029022216797, 42.55646514892578, 46.432640075683594, 50.308815002441406, 54.18498992919922, 58.06116485595703, 61.937339782714844, 65.81351470947266, 69.68968963623047, 73.56586456298828, 77.4420394897461, 81.3182144165039, 85.19438934326172, 89.07056427001953, 92.94673919677734, 96.82291412353516, 100.69908905029297, 104.57526397705078, 108.4514389038086, 112.3276138305664, 116.20378112792969, 120.0799560546875, 123.95613098144531, 127.83230590820312, 131.70848083496094, 135.58465576171875, 139.46083068847656, 143.33700561523438, 147.2131805419922, 151.08935546875, 154.9655303955078, 158.84170532226562, 162.71788024902344, 166.59405517578125, 170.47023010253906, 174.34640502929688, 178.2225799560547]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 8.0, 7.0, 4.0, 9.0, 4.0, 11.0, 21.0, 17.0, 16.0, 17.0, 28.0, 30.0, 27.0, 35.0, 29.0, 25.0, 45.0, 42.0, 24.0, 37.0, 25.0, 32.0, 35.0, 38.0, 35.0, 42.0, 31.0, 31.0, 32.0, 34.0, 19.0, 25.0, 25.0, 16.0, 19.0, 15.0, 15.0, 7.0, 10.0, 10.0, 16.0, 8.0, 8.0, 10.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.55019187927246, -27.543489456176758, -26.536787033081055, -25.53008460998535, -24.52338218688965, -23.516679763793945, -22.50997543334961, -21.503273010253906, -20.496570587158203, -19.4898681640625, -18.483165740966797, -17.476463317871094, -16.46976089477539, -15.463058471679688, -14.456355094909668, -13.449652671813965, -12.442951202392578, -11.436248779296875, -10.429546356201172, -9.422843933105469, -8.416141510009766, -7.409438610076904, -6.402735710144043, -5.39603328704834, -4.389330863952637, -3.3826284408569336, -2.3759257793426514, -1.3692231178283691, -0.362520694732666, 0.6441817283630371, 1.6508846282958984, 2.6575870513916016, 3.6642913818359375, 4.670993804931641, 5.677696228027344, 6.684399127960205, 7.691101551055908, 8.697803497314453, 9.704506874084473, 10.711209297180176, 11.717911720275879, 12.724614143371582, 13.731316566467285, 14.738019943237305, 15.744722366333008, 16.75142478942871, 17.758127212524414, 18.764829635620117, 19.77153205871582, 20.778234481811523, 21.784936904907227, 22.79163932800293, 23.798341751098633, 24.805044174194336, 25.811748504638672, 26.818450927734375, 27.825153350830078, 28.83185577392578, 29.838558197021484, 30.845260620117188, 31.85196304321289, 32.858665466308594, 33.8653678894043, 34.8720703125, 35.8787727355957]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 8.0, 6.0, 5.0, 4.0, 7.0, 7.0, 16.0, 10.0, 17.0, 19.0, 23.0, 22.0, 20.0, 32.0, 44.0, 38.0, 45.0, 35.0, 42.0, 54.0, 42.0, 44.0, 38.0, 40.0, 38.0, 33.0, 33.0, 35.0, 42.0, 23.0, 33.0, 28.0, 25.0, 12.0, 20.0, 17.0, 13.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.78515625, -5.611328125, -5.4375, -5.263671875, -5.08984375, -4.916015625, -4.7421875, -4.568359375, -4.39453125, -4.220703125, -4.046875, -3.873046875, -3.69921875, -3.525390625, -3.3515625, -3.177734375, -3.00390625, -2.830078125, -2.65625, -2.482421875, -2.30859375, -2.134765625, -1.9609375, -1.787109375, -1.61328125, -1.439453125, -1.265625, -1.091796875, -0.91796875, -0.744140625, -0.5703125, -0.396484375, -0.22265625, -0.048828125, 0.125, 0.298828125, 0.47265625, 0.646484375, 0.8203125, 0.994140625, 1.16796875, 1.341796875, 1.515625, 1.689453125, 1.86328125, 2.037109375, 2.2109375, 2.384765625, 2.55859375, 2.732421875, 2.90625, 3.080078125, 3.25390625, 3.427734375, 3.6015625, 3.775390625, 3.94921875, 4.123046875, 4.296875, 4.470703125, 4.64453125, 4.818359375, 4.9921875, 5.166015625, 5.33984375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 14.0, 17.0, 26.0, 38.0, 81.0, 100.0, 156.0, 207.0, 300.0, 450.0, 692.0, 1019.0, 1541.0, 2344.0, 3720.0, 5435.0, 8293.0, 12787.0, 19423.0, 29926.0, 45152.0, 67470.0, 96952.0, 129104.0, 149607.0, 138445.0, 107482.0, 76335.0, 52076.0, 34131.0, 22553.0, 14642.0, 9583.0, 6209.0, 4179.0, 2673.0, 1803.0, 1210.0, 827.0, 521.0, 348.0, 241.0, 140.0, 104.0, 55.0, 47.0, 39.0, 19.0, 18.0, 4.0, 10.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6394729614257812, -0.6192779541015625, -0.5990829467773438, -0.578887939453125, -0.5586929321289062, -0.5384979248046875, -0.5183029174804688, -0.49810791015625, -0.47791290283203125, -0.4577178955078125, -0.43752288818359375, -0.417327880859375, -0.39713287353515625, -0.3769378662109375, -0.35674285888671875, -0.3365478515625, -0.31635284423828125, -0.2961578369140625, -0.27596282958984375, -0.255767822265625, -0.23557281494140625, -0.2153778076171875, -0.19518280029296875, -0.17498779296875, -0.15479278564453125, -0.1345977783203125, -0.11440277099609375, -0.094207763671875, -0.07401275634765625, -0.0538177490234375, -0.03362274169921875, -0.013427734375, 0.00676727294921875, 0.0269622802734375, 0.04715728759765625, 0.067352294921875, 0.08754730224609375, 0.1077423095703125, 0.12793731689453125, 0.14813232421875, 0.16832733154296875, 0.1885223388671875, 0.20871734619140625, 0.228912353515625, 0.24910736083984375, 0.2693023681640625, 0.28949737548828125, 0.3096923828125, 0.32988739013671875, 0.3500823974609375, 0.37027740478515625, 0.390472412109375, 0.41066741943359375, 0.4308624267578125, 0.45105743408203125, 0.47125244140625, 0.49144744873046875, 0.5116424560546875, 0.5318374633789062, 0.552032470703125, 0.5722274780273438, 0.5924224853515625, 0.6126174926757812, 0.6328125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 12.0, 5.0, 4.0, 13.0, 14.0, 13.0, 18.0, 20.0, 22.0, 23.0, 27.0, 27.0, 30.0, 35.0, 39.0, 47.0, 32.0, 34.0, 29.0, 46.0, 1061.0, 54.0, 27.0, 46.0, 33.0, 34.0, 31.0, 24.0, 35.0, 29.0, 22.0, 18.0, 21.0, 14.0, 18.0, 15.0, 9.0, 9.0, 6.0, 6.0, 5.0, 9.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.69921875, -3.590606689453125, -3.48199462890625, -3.373382568359375, -3.2647705078125, -3.156158447265625, -3.04754638671875, -2.938934326171875, -2.830322265625, -2.721710205078125, -2.61309814453125, -2.504486083984375, -2.3958740234375, -2.287261962890625, -2.17864990234375, -2.070037841796875, -1.96142578125, -1.852813720703125, -1.74420166015625, -1.635589599609375, -1.5269775390625, -1.418365478515625, -1.30975341796875, -1.201141357421875, -1.092529296875, -0.983917236328125, -0.87530517578125, -0.766693115234375, -0.6580810546875, -0.549468994140625, -0.44085693359375, -0.332244873046875, -0.2236328125, -0.115020751953125, -0.00640869140625, 0.102203369140625, 0.2108154296875, 0.319427490234375, 0.42803955078125, 0.536651611328125, 0.645263671875, 0.753875732421875, 0.86248779296875, 0.971099853515625, 1.0797119140625, 1.188323974609375, 1.29693603515625, 1.405548095703125, 1.51416015625, 1.622772216796875, 1.73138427734375, 1.839996337890625, 1.9486083984375, 2.057220458984375, 2.16583251953125, 2.274444580078125, 2.383056640625, 2.491668701171875, 2.60028076171875, 2.708892822265625, 2.8175048828125, 2.926116943359375, 3.03472900390625, 3.143341064453125, 3.251953125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 7.0, 18.0, 21.0, 36.0, 64.0, 95.0, 118.0, 180.0, 257.0, 389.0, 554.0, 933.0, 1352.0, 2076.0, 3187.0, 5107.0, 8116.0, 12542.0, 20106.0, 31332.0, 48200.0, 72733.0, 104638.0, 137556.0, 1199167.0, 137082.0, 104820.0, 72300.0, 48024.0, 31155.0, 19636.0, 12524.0, 8002.0, 5199.0, 3270.0, 2145.0, 1420.0, 874.0, 629.0, 416.0, 266.0, 189.0, 110.0, 80.0, 51.0, 37.0, 25.0, 24.0, 17.0, 13.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.40234375, -0.3891487121582031, -0.37595367431640625, -0.3627586364746094, -0.3495635986328125, -0.3363685607910156, -0.32317352294921875, -0.3099784851074219, -0.296783447265625, -0.2835884094238281, -0.27039337158203125, -0.2571983337402344, -0.2440032958984375, -0.23080825805664062, -0.21761322021484375, -0.20441818237304688, -0.19122314453125, -0.17802810668945312, -0.16483306884765625, -0.15163803100585938, -0.1384429931640625, -0.12524795532226562, -0.11205291748046875, -0.09885787963867188, -0.085662841796875, -0.07246780395507812, -0.05927276611328125, -0.046077728271484375, -0.0328826904296875, -0.019687652587890625, -0.00649261474609375, 0.006702423095703125, 0.0198974609375, 0.033092498779296875, 0.04628753662109375, 0.059482574462890625, 0.0726776123046875, 0.08587265014648438, 0.09906768798828125, 0.11226272583007812, 0.125457763671875, 0.13865280151367188, 0.15184783935546875, 0.16504287719726562, 0.1782379150390625, 0.19143295288085938, 0.20462799072265625, 0.21782302856445312, 0.23101806640625, 0.24421310424804688, 0.25740814208984375, 0.2706031799316406, 0.2837982177734375, 0.2969932556152344, 0.31018829345703125, 0.3233833312988281, 0.336578369140625, 0.3497734069824219, 0.36296844482421875, 0.3761634826660156, 0.3893585205078125, 0.4025535583496094, 0.41574859619140625, 0.4289436340332031, 0.442138671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 8.0, 15.0, 20.0, 26.0, 23.0, 42.0, 41.0, 52.0, 75.0, 71.0, 81.0, 81.0, 90.0, 73.0, 42.0, 48.0, 40.0, 30.0, 14.0, 17.0, 11.0, 14.0, 8.0, 7.0, 9.0, 5.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0121612548828125, -0.011792302131652832, -0.011423349380493164, -0.011054396629333496, -0.010685443878173828, -0.01031649112701416, -0.009947538375854492, -0.009578585624694824, -0.009209632873535156, -0.008840680122375488, -0.00847172737121582, -0.008102774620056152, -0.007733821868896484, -0.007364869117736816, -0.0069959163665771484, -0.0066269636154174805, -0.0062580108642578125, -0.0058890581130981445, -0.0055201053619384766, -0.005151152610778809, -0.004782199859619141, -0.004413247108459473, -0.004044294357299805, -0.0036753416061401367, -0.0033063888549804688, -0.0029374361038208008, -0.002568483352661133, -0.002199530601501465, -0.0018305778503417969, -0.001461625099182129, -0.001092672348022461, -0.000723719596862793, -0.000354766845703125, 1.4185905456542969e-05, 0.00038313865661621094, 0.0007520914077758789, 0.0011210441589355469, 0.0014899969100952148, 0.0018589496612548828, 0.0022279024124145508, 0.0025968551635742188, 0.0029658079147338867, 0.0033347606658935547, 0.0037037134170532227, 0.004072666168212891, 0.004441618919372559, 0.0048105716705322266, 0.0051795244216918945, 0.0055484771728515625, 0.0059174299240112305, 0.0062863826751708984, 0.006655335426330566, 0.007024288177490234, 0.007393240928649902, 0.00776219367980957, 0.008131146430969238, 0.008500099182128906, 0.008869051933288574, 0.009238004684448242, 0.00960695743560791, 0.009975910186767578, 0.010344862937927246, 0.010713815689086914, 0.011082768440246582, 0.01145172119140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 5.0, 6.0, 7.0, 17.0, 18.0, 13.0, 24.0, 31.0, 37.0, 66.0, 74.0, 125.0, 225.0, 539.0, 16670.0, 1025309.0, 4354.0, 436.0, 188.0, 113.0, 72.0, 64.0, 41.0, 29.0, 20.0, 12.0, 11.0, 9.0, 6.0, 5.0, 4.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24658203125, -0.2387237548828125, -0.230865478515625, -0.2230072021484375, -0.21514892578125, -0.2072906494140625, -0.199432373046875, -0.1915740966796875, -0.1837158203125, -0.1758575439453125, -0.167999267578125, -0.1601409912109375, -0.15228271484375, -0.1444244384765625, -0.136566162109375, -0.1287078857421875, -0.120849609375, -0.1129913330078125, -0.105133056640625, -0.0972747802734375, -0.08941650390625, -0.0815582275390625, -0.073699951171875, -0.0658416748046875, -0.0579833984375, -0.0501251220703125, -0.042266845703125, -0.0344085693359375, -0.02655029296875, -0.0186920166015625, -0.010833740234375, -0.0029754638671875, 0.0048828125, 0.0127410888671875, 0.020599365234375, 0.0284576416015625, 0.03631591796875, 0.0441741943359375, 0.052032470703125, 0.0598907470703125, 0.0677490234375, 0.0756072998046875, 0.083465576171875, 0.0913238525390625, 0.09918212890625, 0.1070404052734375, 0.114898681640625, 0.1227569580078125, 0.130615234375, 0.1384735107421875, 0.146331787109375, 0.1541900634765625, 0.16204833984375, 0.1699066162109375, 0.177764892578125, 0.1856231689453125, 0.1934814453125, 0.2013397216796875, 0.209197998046875, 0.2170562744140625, 0.22491455078125, 0.2327728271484375, 0.240631103515625, 0.2484893798828125, 0.25634765625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 74.0, 904.0, 32.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11567068845033646, -0.11130581051111221, -0.10694093257188797, -0.10257605463266373, -0.09821117669343948, -0.09384629875421524, -0.0894814133644104, -0.08511653542518616, -0.08075165748596191, -0.07638677954673767, -0.07202190160751343, -0.06765702366828918, -0.06329214572906494, -0.0589272677898407, -0.05456238612532616, -0.05019750818610191, -0.04583263397216797, -0.041467756032943726, -0.03710287809371948, -0.03273800015449524, -0.028373120352625847, -0.024008242413401604, -0.01964336261153221, -0.015278484672307968, -0.010913606733083725, -0.0065487283281981945, -0.002183849923312664, 0.0021810289472341537, 0.006545906886458397, 0.01091078482568264, 0.015275664627552032, 0.019640542566776276, 0.024005427956581116, 0.02837030589580536, 0.0327351838350296, 0.037100061774253845, 0.04146493971347809, 0.04582981765270233, 0.05019469931721687, 0.054559577256441116, 0.05892445519566536, 0.0632893368601799, 0.06765421479940414, 0.07201909273862839, 0.07638397067785263, 0.08074884861707687, 0.08511372655630112, 0.08947860449552536, 0.0938434824347496, 0.09820836037397385, 0.10257323831319809, 0.10693811625242233, 0.11130299419164658, 0.11566787213087082, 0.12003275752067566, 0.1243976354598999, 0.12876251339912415, 0.1331273913383484, 0.13749226927757263, 0.14185714721679688, 0.14622202515602112, 0.15058690309524536, 0.1549517810344696, 0.15931665897369385, 0.1636815369129181]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 1.0, 10.0, 11.0, 14.0, 19.0, 20.0, 14.0, 28.0, 22.0, 35.0, 32.0, 40.0, 38.0, 33.0, 32.0, 39.0, 39.0, 42.0, 51.0, 43.0, 32.0, 43.0, 45.0, 30.0, 29.0, 27.0, 35.0, 30.0, 28.0, 24.0, 15.0, 20.0, 14.0, 8.0, 9.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01267462968826294, -0.01226948481053114, -0.01186433993279934, -0.01145919505506754, -0.01105405017733574, -0.010648905299603939, -0.010243760421872139, -0.009838615544140339, -0.009433470666408539, -0.009028325788676739, -0.008623180910944939, -0.008218036033213139, -0.007812891155481339, -0.007407746277749538, -0.007002601400017738, -0.006597456522285938, -0.006192311644554138, -0.005787166766822338, -0.005382021889090538, -0.004976877011358738, -0.004571732133626938, -0.004166587255895138, -0.0037614423781633377, -0.0033562975004315376, -0.0029511526226997375, -0.0025460077449679375, -0.0021408628672361374, -0.0017357179895043373, -0.0013305731117725372, -0.0009254282340407372, -0.0005202833563089371, -0.000115138478577137, 0.0002900063991546631, 0.0006951512768864632, 0.0011002961546182632, 0.0015054410323500633, 0.0019105859100818634, 0.0023157307878136635, 0.0027208756655454636, 0.0031260205432772636, 0.0035311654210090637, 0.003936310298740864, 0.004341455176472664, 0.004746600054204464, 0.005151744931936264, 0.005556889809668064, 0.005962034687399864, 0.006367179565131664, 0.006772324442863464, 0.0071774693205952644, 0.0075826141983270645, 0.007987759076058865, 0.008392903953790665, 0.008798048831522465, 0.009203193709254265, 0.009608338586986065, 0.010013483464717865, 0.010418628342449665, 0.010823773220181465, 0.011228918097913265, 0.011634062975645065, 0.012039207853376865, 0.012444352731108665, 0.012849497608840466, 0.013254642486572266]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 8.0, 6.0, 5.0, 4.0, 7.0, 7.0, 16.0, 10.0, 17.0, 19.0, 23.0, 22.0, 20.0, 33.0, 43.0, 38.0, 45.0, 35.0, 42.0, 55.0, 41.0, 44.0, 38.0, 40.0, 38.0, 33.0, 33.0, 35.0, 42.0, 23.0, 33.0, 28.0, 25.0, 12.0, 20.0, 17.0, 13.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.78515625, -5.611328125, -5.4375, -5.263671875, -5.08984375, -4.916015625, -4.7421875, -4.568359375, -4.39453125, -4.220703125, -4.046875, -3.873046875, -3.69921875, -3.525390625, -3.3515625, -3.177734375, -3.00390625, -2.830078125, -2.65625, -2.482421875, -2.30859375, -2.134765625, -1.9609375, -1.787109375, -1.61328125, -1.439453125, -1.265625, -1.091796875, -0.91796875, -0.744140625, -0.5703125, -0.396484375, -0.22265625, -0.048828125, 0.125, 0.298828125, 0.47265625, 0.646484375, 0.8203125, 0.994140625, 1.16796875, 1.341796875, 1.515625, 1.689453125, 1.86328125, 2.037109375, 2.2109375, 2.384765625, 2.55859375, 2.732421875, 2.90625, 3.080078125, 3.25390625, 3.427734375, 3.6015625, 3.775390625, 3.94921875, 4.123046875, 4.296875, 4.470703125, 4.64453125, 4.818359375, 4.9921875, 5.166015625, 5.33984375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 13.0, 8.0, 9.0, 19.0, 25.0, 21.0, 42.0, 62.0, 79.0, 112.0, 189.0, 314.0, 534.0, 991.0, 1870.0, 3768.0, 7414.0, 14865.0, 29664.0, 62644.0, 132314.0, 278981.0, 268093.0, 128014.0, 60310.0, 28742.0, 14302.0, 7177.0, 3631.0, 1897.0, 949.0, 570.0, 372.0, 174.0, 111.0, 64.0, 41.0, 48.0, 22.0, 21.0, 27.0, 7.0, 7.0, 10.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.9375, -5.76275634765625, -5.5880126953125, -5.41326904296875, -5.238525390625, -5.06378173828125, -4.8890380859375, -4.71429443359375, -4.53955078125, -4.36480712890625, -4.1900634765625, -4.01531982421875, -3.840576171875, -3.66583251953125, -3.4910888671875, -3.31634521484375, -3.1416015625, -2.96685791015625, -2.7921142578125, -2.61737060546875, -2.442626953125, -2.26788330078125, -2.0931396484375, -1.91839599609375, -1.74365234375, -1.56890869140625, -1.3941650390625, -1.21942138671875, -1.044677734375, -0.86993408203125, -0.6951904296875, -0.52044677734375, -0.345703125, -0.17095947265625, 0.0037841796875, 0.17852783203125, 0.353271484375, 0.52801513671875, 0.7027587890625, 0.87750244140625, 1.05224609375, 1.22698974609375, 1.4017333984375, 1.57647705078125, 1.751220703125, 1.92596435546875, 2.1007080078125, 2.27545166015625, 2.4501953125, 2.62493896484375, 2.7996826171875, 2.97442626953125, 3.149169921875, 3.32391357421875, 3.4986572265625, 3.67340087890625, 3.84814453125, 4.02288818359375, 4.1976318359375, 4.37237548828125, 4.547119140625, 4.72186279296875, 4.8966064453125, 5.07135009765625, 5.24609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 16.0, 7.0, 10.0, 7.0, 16.0, 14.0, 20.0, 13.0, 20.0, 24.0, 37.0, 31.0, 42.0, 33.0, 61.0, 58.0, 84.0, 146.0, 244.0, 1377.0, 207.0, 107.0, 68.0, 38.0, 40.0, 33.0, 37.0, 32.0, 25.0, 28.0, 19.0, 20.0, 19.0, 19.0, 19.0, 14.0, 11.0, 5.0, 10.0, 2.0, 5.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-15.140625, -14.6846923828125, -14.228759765625, -13.7728271484375, -13.31689453125, -12.8609619140625, -12.405029296875, -11.9490966796875, -11.4931640625, -11.0372314453125, -10.581298828125, -10.1253662109375, -9.66943359375, -9.2135009765625, -8.757568359375, -8.3016357421875, -7.845703125, -7.3897705078125, -6.933837890625, -6.4779052734375, -6.02197265625, -5.5660400390625, -5.110107421875, -4.6541748046875, -4.1982421875, -3.7423095703125, -3.286376953125, -2.8304443359375, -2.37451171875, -1.9185791015625, -1.462646484375, -1.0067138671875, -0.55078125, -0.0948486328125, 0.361083984375, 0.8170166015625, 1.27294921875, 1.7288818359375, 2.184814453125, 2.6407470703125, 3.0966796875, 3.5526123046875, 4.008544921875, 4.4644775390625, 4.92041015625, 5.3763427734375, 5.832275390625, 6.2882080078125, 6.744140625, 7.2000732421875, 7.656005859375, 8.1119384765625, 8.56787109375, 9.0238037109375, 9.479736328125, 9.9356689453125, 10.3916015625, 10.8475341796875, 11.303466796875, 11.7593994140625, 12.21533203125, 12.6712646484375, 13.127197265625, 13.5831298828125, 14.0390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 7.0, 5.0, 10.0, 7.0, 11.0, 26.0, 23.0, 28.0, 47.0, 61.0, 95.0, 149.0, 227.0, 368.0, 778.0, 2877.0, 524046.0, 2610162.0, 4671.0, 929.0, 435.0, 239.0, 130.0, 98.0, 64.0, 50.0, 35.0, 29.0, 12.0, 22.0, 9.0, 12.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.21875, -54.28662109375, -52.3544921875, -50.42236328125, -48.490234375, -46.55810546875, -44.6259765625, -42.69384765625, -40.76171875, -38.82958984375, -36.8974609375, -34.96533203125, -33.033203125, -31.10107421875, -29.1689453125, -27.23681640625, -25.3046875, -23.37255859375, -21.4404296875, -19.50830078125, -17.576171875, -15.64404296875, -13.7119140625, -11.77978515625, -9.84765625, -7.91552734375, -5.9833984375, -4.05126953125, -2.119140625, -0.18701171875, 1.7451171875, 3.67724609375, 5.609375, 7.54150390625, 9.4736328125, 11.40576171875, 13.337890625, 15.27001953125, 17.2021484375, 19.13427734375, 21.06640625, 22.99853515625, 24.9306640625, 26.86279296875, 28.794921875, 30.72705078125, 32.6591796875, 34.59130859375, 36.5234375, 38.45556640625, 40.3876953125, 42.31982421875, 44.251953125, 46.18408203125, 48.1162109375, 50.04833984375, 51.98046875, 53.91259765625, 55.8447265625, 57.77685546875, 59.708984375, 61.64111328125, 63.5732421875, 65.50537109375, 67.4375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 19.0, 144.0, 401.0, 337.0, 97.0, 13.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.084705352783203, -25.799070358276367, -22.51343536376953, -19.227800369262695, -15.94216537475586, -12.656530380249023, -9.370895385742188, -6.085260391235352, -2.7996253967285156, 0.4860095977783203, 3.7716445922851562, 7.057279586791992, 10.342914581298828, 13.628549575805664, 16.9141845703125, 20.199819564819336, 23.485454559326172, 26.771089553833008, 30.056724548339844, 33.34236145019531, 36.627994537353516, 39.91362762451172, 43.19926452636719, 46.484901428222656, 49.77053451538086, 53.05616760253906, 56.34180450439453, 59.62744140625, 62.9130744934082, 66.1987075805664, 69.48434448242188, 72.76998138427734, 76.05561828613281, 79.34125518798828, 82.62689208984375, 85.91252136230469, 89.19815826416016, 92.48379516601562, 95.76942443847656, 99.05506134033203, 102.3406982421875, 105.62633514404297, 108.91197204589844, 112.19760131835938, 115.48323822021484, 118.76887512207031, 122.05450439453125, 125.34014129638672, 128.6257781982422, 131.91140747070312, 135.19705200195312, 138.48268127441406, 141.768310546875, 145.053955078125, 148.33958435058594, 151.62522888183594, 154.91085815429688, 158.1964874267578, 161.4821319580078, 164.76776123046875, 168.05340576171875, 171.3390350341797, 174.62466430664062, 177.91030883789062, 181.19593811035156]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 4.0, 9.0, 12.0, 22.0, 16.0, 27.0, 22.0, 29.0, 42.0, 28.0, 48.0, 42.0, 45.0, 34.0, 64.0, 56.0, 57.0, 40.0, 46.0, 40.0, 49.0, 44.0, 35.0, 39.0, 20.0, 27.0, 22.0, 18.0, 16.0, 18.0, 4.0, 8.0, 3.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.01214599609375, -59.292633056640625, -57.5731201171875, -55.853607177734375, -54.13409423828125, -52.414581298828125, -50.695064544677734, -48.97555160522461, -47.256038665771484, -45.53652572631836, -43.817012786865234, -42.09749984741211, -40.37798309326172, -38.658470153808594, -36.93895721435547, -35.219444274902344, -33.49993133544922, -31.780418395996094, -30.06090545654297, -28.34139060974121, -26.621877670288086, -24.90236473083496, -23.182849884033203, -21.463336944580078, -19.743824005126953, -18.024311065673828, -16.304798126220703, -14.585283279418945, -12.86577033996582, -11.146257400512695, -9.426743507385254, -7.7072296142578125, -5.9877166748046875, -4.268203258514404, -2.548689842224121, -0.8291764259338379, 0.8903369903564453, 2.6098499298095703, 4.329363822937012, 6.048877716064453, 7.768390655517578, 9.487903594970703, 11.207417488098145, 12.926931381225586, 14.646444320678711, 16.365957260131836, 18.085472106933594, 19.80498504638672, 21.524497985839844, 23.24401092529297, 24.963523864746094, 26.68303871154785, 28.402551651000977, 30.1220645904541, 31.84157943725586, 33.561092376708984, 35.28060531616211, 37.000118255615234, 38.71963119506836, 40.439144134521484, 42.158660888671875, 43.878173828125, 45.597686767578125, 47.31719970703125, 49.036712646484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 7.0, 11.0, 7.0, 3.0, 19.0, 17.0, 26.0, 19.0, 23.0, 25.0, 26.0, 29.0, 39.0, 36.0, 39.0, 36.0, 54.0, 43.0, 29.0, 45.0, 32.0, 42.0, 38.0, 38.0, 35.0, 37.0, 28.0, 26.0, 28.0, 20.0, 22.0, 18.0, 19.0, 17.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.01171875, -5.8330078125, -5.654296875, -5.4755859375, -5.296875, -5.1181640625, -4.939453125, -4.7607421875, -4.58203125, -4.4033203125, -4.224609375, -4.0458984375, -3.8671875, -3.6884765625, -3.509765625, -3.3310546875, -3.15234375, -2.9736328125, -2.794921875, -2.6162109375, -2.4375, -2.2587890625, -2.080078125, -1.9013671875, -1.72265625, -1.5439453125, -1.365234375, -1.1865234375, -1.0078125, -0.8291015625, -0.650390625, -0.4716796875, -0.29296875, -0.1142578125, 0.064453125, 0.2431640625, 0.421875, 0.6005859375, 0.779296875, 0.9580078125, 1.13671875, 1.3154296875, 1.494140625, 1.6728515625, 1.8515625, 2.0302734375, 2.208984375, 2.3876953125, 2.56640625, 2.7451171875, 2.923828125, 3.1025390625, 3.28125, 3.4599609375, 3.638671875, 3.8173828125, 3.99609375, 4.1748046875, 4.353515625, 4.5322265625, 4.7109375, 4.8896484375, 5.068359375, 5.2470703125, 5.42578125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 8.0, 6.0, 8.0, 5.0, 9.0, 13.0, 27.0, 21.0, 37.0, 30.0, 43.0, 70.0, 110.0, 152.0, 322.0, 834.0, 3219.0, 16967.0, 140964.0, 1325218.0, 2305168.0, 355547.0, 37459.0, 5638.0, 1352.0, 447.0, 196.0, 96.0, 74.0, 56.0, 29.0, 35.0, 26.0, 25.0, 11.0, 9.0, 10.0, 8.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.015625, -14.5765380859375, -14.137451171875, -13.6983642578125, -13.25927734375, -12.8201904296875, -12.381103515625, -11.9420166015625, -11.5029296875, -11.0638427734375, -10.624755859375, -10.1856689453125, -9.74658203125, -9.3074951171875, -8.868408203125, -8.4293212890625, -7.990234375, -7.5511474609375, -7.112060546875, -6.6729736328125, -6.23388671875, -5.7947998046875, -5.355712890625, -4.9166259765625, -4.4775390625, -4.0384521484375, -3.599365234375, -3.1602783203125, -2.72119140625, -2.2821044921875, -1.843017578125, -1.4039306640625, -0.96484375, -0.5257568359375, -0.086669921875, 0.3524169921875, 0.79150390625, 1.2305908203125, 1.669677734375, 2.1087646484375, 2.5478515625, 2.9869384765625, 3.426025390625, 3.8651123046875, 4.30419921875, 4.7432861328125, 5.182373046875, 5.6214599609375, 6.060546875, 6.4996337890625, 6.938720703125, 7.3778076171875, 7.81689453125, 8.2559814453125, 8.695068359375, 9.1341552734375, 9.5732421875, 10.0123291015625, 10.451416015625, 10.8905029296875, 11.32958984375, 11.7686767578125, 12.207763671875, 12.6468505859375, 13.0859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 5.0, 6.0, 8.0, 17.0, 12.0, 21.0, 29.0, 40.0, 67.0, 72.0, 91.0, 159.0, 190.0, 305.0, 339.0, 435.0, 422.0, 416.0, 318.0, 257.0, 215.0, 173.0, 135.0, 67.0, 58.0, 55.0, 32.0, 35.0, 25.0, 17.0, 9.0, 18.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.212646484375, -9.87841796875, -9.544189453125, -9.2099609375, -8.875732421875, -8.54150390625, -8.207275390625, -7.873046875, -7.538818359375, -7.20458984375, -6.870361328125, -6.5361328125, -6.201904296875, -5.86767578125, -5.533447265625, -5.19921875, -4.864990234375, -4.53076171875, -4.196533203125, -3.8623046875, -3.528076171875, -3.19384765625, -2.859619140625, -2.525390625, -2.191162109375, -1.85693359375, -1.522705078125, -1.1884765625, -0.854248046875, -0.52001953125, -0.185791015625, 0.1484375, 0.482666015625, 0.81689453125, 1.151123046875, 1.4853515625, 1.819580078125, 2.15380859375, 2.488037109375, 2.822265625, 3.156494140625, 3.49072265625, 3.824951171875, 4.1591796875, 4.493408203125, 4.82763671875, 5.161865234375, 5.49609375, 5.830322265625, 6.16455078125, 6.498779296875, 6.8330078125, 7.167236328125, 7.50146484375, 7.835693359375, 8.169921875, 8.504150390625, 8.83837890625, 9.172607421875, 9.5068359375, 9.841064453125, 10.17529296875, 10.509521484375, 10.84375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 18.0, 11.0, 9.0, 24.0, 29.0, 39.0, 53.0, 61.0, 79.0, 96.0, 156.0, 262.0, 352.0, 798.0, 11382.0, 2610473.0, 1561130.0, 7444.0, 760.0, 378.0, 213.0, 138.0, 89.0, 85.0, 49.0, 33.0, 20.0, 25.0, 16.0, 15.0, 8.0, 9.0, 1.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.6943359375, -51.044921875, -49.3955078125, -47.74609375, -46.0966796875, -44.447265625, -42.7978515625, -41.1484375, -39.4990234375, -37.849609375, -36.2001953125, -34.55078125, -32.9013671875, -31.251953125, -29.6025390625, -27.953125, -26.3037109375, -24.654296875, -23.0048828125, -21.35546875, -19.7060546875, -18.056640625, -16.4072265625, -14.7578125, -13.1083984375, -11.458984375, -9.8095703125, -8.16015625, -6.5107421875, -4.861328125, -3.2119140625, -1.5625, 0.0869140625, 1.736328125, 3.3857421875, 5.03515625, 6.6845703125, 8.333984375, 9.9833984375, 11.6328125, 13.2822265625, 14.931640625, 16.5810546875, 18.23046875, 19.8798828125, 21.529296875, 23.1787109375, 24.828125, 26.4775390625, 28.126953125, 29.7763671875, 31.42578125, 33.0751953125, 34.724609375, 36.3740234375, 38.0234375, 39.6728515625, 41.322265625, 42.9716796875, 44.62109375, 46.2705078125, 47.919921875, 49.5693359375, 51.21875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 8.0, 14.0, 28.0, 50.0, 89.0, 109.0, 162.0, 152.0, 148.0, 104.0, 85.0, 27.0, 25.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.05976104736328, -80.81766510009766, -78.57556915283203, -76.3334732055664, -74.09137725830078, -71.84928131103516, -69.60718536376953, -67.3650894165039, -65.12299346923828, -62.880897521972656, -60.63880157470703, -58.396705627441406, -56.15460968017578, -53.912513732910156, -51.67041778564453, -49.428321838378906, -47.18622970581055, -44.94413375854492, -42.7020378112793, -40.45994186401367, -38.21784591674805, -35.97574996948242, -33.73365783691406, -31.491559982299805, -29.24946403503418, -27.007368087768555, -24.76527214050293, -22.523178100585938, -20.281082153320312, -18.038986206054688, -15.796890258789062, -13.554794311523438, -11.312698364257812, -9.070602416992188, -6.828506946563721, -4.586411476135254, -2.344315528869629, -0.1022195816040039, 2.1398754119873047, 4.38197135925293, 6.624067306518555, 8.86616325378418, 11.108259201049805, 13.350354194641113, 15.592450141906738, 17.834545135498047, 20.076641082763672, 22.318737030029297, 24.560832977294922, 26.802928924560547, 29.045024871826172, 31.287120819091797, 33.52921676635742, 35.77131271362305, 38.013404846191406, 40.25550079345703, 42.497596740722656, 44.73969268798828, 46.981788635253906, 49.22388458251953, 51.465980529785156, 53.70807647705078, 55.950172424316406, 58.19226837158203, 60.434364318847656]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 7.0, 7.0, 6.0, 15.0, 14.0, 17.0, 14.0, 17.0, 23.0, 23.0, 24.0, 20.0, 30.0, 27.0, 35.0, 37.0, 38.0, 35.0, 39.0, 44.0, 42.0, 52.0, 41.0, 36.0, 26.0, 33.0, 40.0, 36.0, 31.0, 30.0, 28.0, 25.0, 11.0, 19.0, 12.0, 10.0, 14.0, 6.0, 12.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.778419494628906, -34.61531066894531, -33.45220184326172, -32.28909683227539, -31.125988006591797, -29.962879180908203, -28.799772262573242, -27.63666534423828, -26.473556518554688, -25.310447692871094, -24.147340774536133, -22.984233856201172, -21.821125030517578, -20.658016204833984, -19.494909286499023, -18.331802368164062, -17.16869354248047, -16.005584716796875, -14.842477798461914, -13.679369926452637, -12.51626205444336, -11.353154182434082, -10.190046310424805, -9.026938438415527, -7.86383056640625, -6.700722694396973, -5.537614822387695, -4.374506950378418, -3.2113990783691406, -2.0482912063598633, -0.8851833343505859, 0.2779245376586914, 1.4410362243652344, 2.6041440963745117, 3.767251968383789, 4.930359840393066, 6.093467712402344, 7.256575584411621, 8.419683456420898, 9.582791328430176, 10.745899200439453, 11.90900707244873, 13.072114944458008, 14.235222816467285, 15.398330688476562, 16.561439514160156, 17.724546432495117, 18.887653350830078, 20.050762176513672, 21.213871002197266, 22.376977920532227, 23.540084838867188, 24.70319366455078, 25.866302490234375, 27.029409408569336, 28.192516326904297, 29.35562515258789, 30.518733978271484, 31.681840896606445, 32.844947814941406, 34.008056640625, 35.171165466308594, 36.33427429199219, 37.497379302978516, 38.66048812866211]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 13.0, 8.0, 8.0, 17.0, 15.0, 17.0, 18.0, 28.0, 24.0, 31.0, 27.0, 35.0, 32.0, 30.0, 37.0, 42.0, 42.0, 43.0, 44.0, 47.0, 44.0, 43.0, 51.0, 30.0, 35.0, 31.0, 34.0, 29.0, 16.0, 20.0, 16.0, 16.0, 12.0, 20.0, 8.0, 8.0, 9.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.0, -5.81842041015625, -5.6368408203125, -5.45526123046875, -5.273681640625, -5.09210205078125, -4.9105224609375, -4.72894287109375, -4.54736328125, -4.36578369140625, -4.1842041015625, -4.00262451171875, -3.821044921875, -3.63946533203125, -3.4578857421875, -3.27630615234375, -3.0947265625, -2.91314697265625, -2.7315673828125, -2.54998779296875, -2.368408203125, -2.18682861328125, -2.0052490234375, -1.82366943359375, -1.64208984375, -1.46051025390625, -1.2789306640625, -1.09735107421875, -0.915771484375, -0.73419189453125, -0.5526123046875, -0.37103271484375, -0.189453125, -0.00787353515625, 0.1737060546875, 0.35528564453125, 0.536865234375, 0.71844482421875, 0.9000244140625, 1.08160400390625, 1.26318359375, 1.44476318359375, 1.6263427734375, 1.80792236328125, 1.989501953125, 2.17108154296875, 2.3526611328125, 2.53424072265625, 2.7158203125, 2.89739990234375, 3.0789794921875, 3.26055908203125, 3.442138671875, 3.62371826171875, 3.8052978515625, 3.98687744140625, 4.16845703125, 4.35003662109375, 4.5316162109375, 4.71319580078125, 4.894775390625, 5.07635498046875, 5.2579345703125, 5.43951416015625, 5.62109375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 13.0, 3.0, 17.0, 24.0, 41.0, 54.0, 78.0, 101.0, 179.0, 239.0, 369.0, 622.0, 920.0, 1453.0, 2311.0, 3548.0, 5636.0, 9011.0, 14617.0, 24047.0, 38928.0, 62749.0, 99223.0, 145618.0, 176494.0, 157548.0, 112791.0, 73523.0, 45427.0, 27396.0, 16970.0, 10615.0, 6506.0, 4150.0, 2586.0, 1652.0, 1100.0, 688.0, 440.0, 285.0, 201.0, 118.0, 88.0, 46.0, 43.0, 27.0, 22.0, 12.0, 9.0, 5.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.84033203125, -0.8145980834960938, -0.7888641357421875, -0.7631301879882812, -0.737396240234375, -0.7116622924804688, -0.6859283447265625, -0.6601943969726562, -0.63446044921875, -0.6087265014648438, -0.5829925537109375, -0.5572586059570312, -0.531524658203125, -0.5057907104492188, -0.4800567626953125, -0.45432281494140625, -0.4285888671875, -0.40285491943359375, -0.3771209716796875, -0.35138702392578125, -0.325653076171875, -0.29991912841796875, -0.2741851806640625, -0.24845123291015625, -0.22271728515625, -0.19698333740234375, -0.1712493896484375, -0.14551544189453125, -0.119781494140625, -0.09404754638671875, -0.0683135986328125, -0.04257965087890625, -0.016845703125, 0.00888824462890625, 0.0346221923828125, 0.06035614013671875, 0.086090087890625, 0.11182403564453125, 0.1375579833984375, 0.16329193115234375, 0.18902587890625, 0.21475982666015625, 0.2404937744140625, 0.26622772216796875, 0.291961669921875, 0.31769561767578125, 0.3434295654296875, 0.36916351318359375, 0.3948974609375, 0.42063140869140625, 0.4463653564453125, 0.47209930419921875, 0.497833251953125, 0.5235671997070312, 0.5493011474609375, 0.5750350952148438, 0.60076904296875, 0.6265029907226562, 0.6522369384765625, 0.6779708862304688, 0.703704833984375, 0.7294387817382812, 0.7551727294921875, 0.7809066772460938, 0.806640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 5.0, 4.0, 5.0, 5.0, 17.0, 14.0, 24.0, 19.0, 27.0, 31.0, 38.0, 27.0, 38.0, 34.0, 36.0, 40.0, 57.0, 41.0, 1073.0, 44.0, 41.0, 51.0, 57.0, 39.0, 38.0, 28.0, 36.0, 27.0, 25.0, 19.0, 18.0, 18.0, 12.0, 10.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8046875, -3.6650390625, -3.525390625, -3.3857421875, -3.24609375, -3.1064453125, -2.966796875, -2.8271484375, -2.6875, -2.5478515625, -2.408203125, -2.2685546875, -2.12890625, -1.9892578125, -1.849609375, -1.7099609375, -1.5703125, -1.4306640625, -1.291015625, -1.1513671875, -1.01171875, -0.8720703125, -0.732421875, -0.5927734375, -0.453125, -0.3134765625, -0.173828125, -0.0341796875, 0.10546875, 0.2451171875, 0.384765625, 0.5244140625, 0.6640625, 0.8037109375, 0.943359375, 1.0830078125, 1.22265625, 1.3623046875, 1.501953125, 1.6416015625, 1.78125, 1.9208984375, 2.060546875, 2.2001953125, 2.33984375, 2.4794921875, 2.619140625, 2.7587890625, 2.8984375, 3.0380859375, 3.177734375, 3.3173828125, 3.45703125, 3.5966796875, 3.736328125, 3.8759765625, 4.015625, 4.1552734375, 4.294921875, 4.4345703125, 4.57421875, 4.7138671875, 4.853515625, 4.9931640625, 5.1328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 10.0, 17.0, 21.0, 34.0, 65.0, 78.0, 152.0, 242.0, 426.0, 758.0, 1320.0, 2253.0, 4140.0, 7411.0, 13145.0, 24487.0, 43953.0, 77236.0, 127077.0, 209526.0, 1214765.0, 150628.0, 95029.0, 55185.0, 30661.0, 16920.0, 9472.0, 5168.0, 2945.0, 1712.0, 975.0, 540.0, 311.0, 192.0, 104.0, 70.0, 40.0, 21.0, 18.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6475677490234375, -0.628631591796875, -0.6096954345703125, -0.59075927734375, -0.5718231201171875, -0.552886962890625, -0.5339508056640625, -0.5150146484375, -0.4960784912109375, -0.477142333984375, -0.4582061767578125, -0.43927001953125, -0.4203338623046875, -0.401397705078125, -0.3824615478515625, -0.363525390625, -0.3445892333984375, -0.325653076171875, -0.3067169189453125, -0.28778076171875, -0.2688446044921875, -0.249908447265625, -0.2309722900390625, -0.2120361328125, -0.1930999755859375, -0.174163818359375, -0.1552276611328125, -0.13629150390625, -0.1173553466796875, -0.098419189453125, -0.0794830322265625, -0.060546875, -0.0416107177734375, -0.022674560546875, -0.0037384033203125, 0.01519775390625, 0.0341339111328125, 0.053070068359375, 0.0720062255859375, 0.0909423828125, 0.1098785400390625, 0.128814697265625, 0.1477508544921875, 0.16668701171875, 0.1856231689453125, 0.204559326171875, 0.2234954833984375, 0.242431640625, 0.2613677978515625, 0.280303955078125, 0.2992401123046875, 0.31817626953125, 0.3371124267578125, 0.356048583984375, 0.3749847412109375, 0.3939208984375, 0.4128570556640625, 0.431793212890625, 0.4507293701171875, 0.46966552734375, 0.4886016845703125, 0.507537841796875, 0.5264739990234375, 0.54541015625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 3.0, 4.0, 9.0, 11.0, 7.0, 7.0, 12.0, 9.0, 20.0, 23.0, 22.0, 39.0, 45.0, 44.0, 53.0, 66.0, 80.0, 127.0, 67.0, 66.0, 42.0, 39.0, 38.0, 24.0, 21.0, 25.0, 13.0, 9.0, 13.0, 11.0, 5.0, 5.0, 5.0, 8.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0256805419921875, -0.024831295013427734, -0.02398204803466797, -0.023132801055908203, -0.022283554077148438, -0.021434307098388672, -0.020585060119628906, -0.01973581314086914, -0.018886566162109375, -0.01803731918334961, -0.017188072204589844, -0.016338825225830078, -0.015489578247070312, -0.014640331268310547, -0.013791084289550781, -0.012941837310791016, -0.01209259033203125, -0.011243343353271484, -0.010394096374511719, -0.009544849395751953, -0.008695602416992188, -0.007846355438232422, -0.006997108459472656, -0.006147861480712891, -0.005298614501953125, -0.004449367523193359, -0.0036001205444335938, -0.002750873565673828, -0.0019016265869140625, -0.0010523796081542969, -0.00020313262939453125, 0.0006461143493652344, 0.001495361328125, 0.0023446083068847656, 0.0031938552856445312, 0.004043102264404297, 0.0048923492431640625, 0.005741596221923828, 0.006590843200683594, 0.007440090179443359, 0.008289337158203125, 0.00913858413696289, 0.009987831115722656, 0.010837078094482422, 0.011686325073242188, 0.012535572052001953, 0.013384819030761719, 0.014234066009521484, 0.01508331298828125, 0.015932559967041016, 0.01678180694580078, 0.017631053924560547, 0.018480300903320312, 0.019329547882080078, 0.020178794860839844, 0.02102804183959961, 0.021877288818359375, 0.02272653579711914, 0.023575782775878906, 0.024425029754638672, 0.025274276733398438, 0.026123523712158203, 0.02697277069091797, 0.027822017669677734, 0.0286712646484375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 7.0, 7.0, 4.0, 9.0, 15.0, 12.0, 22.0, 31.0, 32.0, 47.0, 60.0, 86.0, 122.0, 206.0, 473.0, 1750.0, 1014879.0, 29119.0, 761.0, 322.0, 148.0, 110.0, 78.0, 52.0, 49.0, 26.0, 23.0, 22.0, 9.0, 8.0, 12.0, 11.0, 4.0, 4.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5859375, -0.5685806274414062, -0.5512237548828125, -0.5338668823242188, -0.516510009765625, -0.49915313720703125, -0.4817962646484375, -0.46443939208984375, -0.44708251953125, -0.42972564697265625, -0.4123687744140625, -0.39501190185546875, -0.377655029296875, -0.36029815673828125, -0.3429412841796875, -0.32558441162109375, -0.3082275390625, -0.29087066650390625, -0.2735137939453125, -0.25615692138671875, -0.238800048828125, -0.22144317626953125, -0.2040863037109375, -0.18672943115234375, -0.16937255859375, -0.15201568603515625, -0.1346588134765625, -0.11730194091796875, -0.099945068359375, -0.08258819580078125, -0.0652313232421875, -0.04787445068359375, -0.030517578125, -0.01316070556640625, 0.0041961669921875, 0.02155303955078125, 0.038909912109375, 0.05626678466796875, 0.0736236572265625, 0.09098052978515625, 0.10833740234375, 0.12569427490234375, 0.1430511474609375, 0.16040802001953125, 0.177764892578125, 0.19512176513671875, 0.2124786376953125, 0.22983551025390625, 0.2471923828125, 0.26454925537109375, 0.2819061279296875, 0.29926300048828125, 0.316619873046875, 0.33397674560546875, 0.3513336181640625, 0.36869049072265625, 0.38604736328125, 0.40340423583984375, 0.4207611083984375, 0.43811798095703125, 0.455474853515625, 0.47283172607421875, 0.4901885986328125, 0.5075454711914062, 0.52490234375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 21.0, 991.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05284806340932846, -0.03107510134577751, -0.009302139282226562, 0.012470819056034088, 0.034243784844875336, 0.05601675063371658, 0.07778970152139664, 0.09956266731023788, 0.12133563309907913, 0.14310859143733978, 0.16488155722618103, 0.18665450811386108, 0.20842748880386353, 0.23020043969154358, 0.25197339057922363, 0.2737463712692261, 0.29551932215690613, 0.3172922730445862, 0.3390652537345886, 0.3608382046222687, 0.38261115550994873, 0.40438413619995117, 0.4261570870876312, 0.4479300379753113, 0.4697030186653137, 0.4914759695529938, 0.5132489204406738, 0.5350219011306763, 0.5567948818206787, 0.5785678625106812, 0.6003407835960388, 0.6221137642860413, 0.6438866853713989, 0.6656596660614014, 0.687432587146759, 0.7092055678367615, 0.7309785485267639, 0.7527514696121216, 0.774524450302124, 0.7962974309921265, 0.8180704116821289, 0.8398433923721313, 0.861616313457489, 0.8833892941474915, 0.9051622748374939, 0.9269351959228516, 0.948708176612854, 0.9704811573028564, 0.9922540783882141, 1.0140269994735718, 1.0357999801635742, 1.0575729608535767, 1.079345941543579, 1.1011189222335815, 1.122891902923584, 1.1446647644042969, 1.1664377450942993, 1.1882107257843018, 1.2099837064743042, 1.2317566871643066, 1.2535295486450195, 1.275302529335022, 1.2970755100250244, 1.3188484907150269, 1.3406214714050293]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 8.0, 11.0, 14.0, 19.0, 21.0, 20.0, 28.0, 33.0, 38.0, 45.0, 39.0, 45.0, 47.0, 49.0, 59.0, 46.0, 54.0, 45.0, 53.0, 55.0, 42.0, 44.0, 32.0, 25.0, 31.0, 23.0, 24.0, 14.0, 10.0, 7.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.06615883111953735, -0.06458798050880432, -0.06301712989807129, -0.06144627556204796, -0.059875424951314926, -0.058304574340581894, -0.05673372000455856, -0.05516286939382553, -0.0535920187830925, -0.05202116817235947, -0.050450317561626434, -0.048879463225603104, -0.04730861261487007, -0.04573776200413704, -0.04416690766811371, -0.042596057057380676, -0.041025206446647644, -0.03945435583591461, -0.03788350522518158, -0.03631265088915825, -0.03474180027842522, -0.033170949667692184, -0.031600095331668854, -0.03002924472093582, -0.02845839411020279, -0.026887543499469757, -0.025316691026091576, -0.023745838552713394, -0.022174987941980362, -0.02060413733124733, -0.019033284857869148, -0.017462432384490967, -0.015891581773757935, -0.014320730231702328, -0.012749878689646721, -0.011179027147591114, -0.009608175605535507, -0.0080373240634799, -0.0064664725214242935, -0.004895620979368687, -0.00332476943731308, -0.001753917895257473, -0.00018306635320186615, 0.0013877851888537407, 0.0029586367309093475, 0.004529488272964954, 0.006100339815020561, 0.007671191357076168, 0.009242042899131775, 0.010812894441187382, 0.012383745983242989, 0.013954597525298595, 0.015525449067354202, 0.017096299678087234, 0.018667152151465416, 0.020238004624843597, 0.02180885523557663, 0.023379705846309662, 0.024950558319687843, 0.026521410793066025, 0.028092261403799057, 0.02966311201453209, 0.03123396448791027, 0.03280481696128845, 0.034375667572021484]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 13.0, 8.0, 8.0, 17.0, 15.0, 16.0, 19.0, 27.0, 25.0, 31.0, 26.0, 36.0, 32.0, 29.0, 38.0, 42.0, 42.0, 43.0, 44.0, 47.0, 44.0, 43.0, 51.0, 32.0, 32.0, 32.0, 34.0, 30.0, 15.0, 20.0, 16.0, 16.0, 13.0, 19.0, 8.0, 9.0, 8.0, 6.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.00390625, -5.82220458984375, -5.6405029296875, -5.45880126953125, -5.277099609375, -5.09539794921875, -4.9136962890625, -4.73199462890625, -4.55029296875, -4.36859130859375, -4.1868896484375, -4.00518798828125, -3.823486328125, -3.64178466796875, -3.4600830078125, -3.27838134765625, -3.0966796875, -2.91497802734375, -2.7332763671875, -2.55157470703125, -2.369873046875, -2.18817138671875, -2.0064697265625, -1.82476806640625, -1.64306640625, -1.46136474609375, -1.2796630859375, -1.09796142578125, -0.916259765625, -0.73455810546875, -0.5528564453125, -0.37115478515625, -0.189453125, -0.00775146484375, 0.1739501953125, 0.35565185546875, 0.537353515625, 0.71905517578125, 0.9007568359375, 1.08245849609375, 1.26416015625, 1.44586181640625, 1.6275634765625, 1.80926513671875, 1.990966796875, 2.17266845703125, 2.3543701171875, 2.53607177734375, 2.7177734375, 2.89947509765625, 3.0811767578125, 3.26287841796875, 3.444580078125, 3.62628173828125, 3.8079833984375, 3.98968505859375, 4.17138671875, 4.35308837890625, 4.5347900390625, 4.71649169921875, 4.898193359375, 5.07989501953125, 5.2615966796875, 5.44329833984375, 5.625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 11.0, 6.0, 11.0, 8.0, 15.0, 27.0, 27.0, 39.0, 42.0, 59.0, 113.0, 115.0, 189.0, 401.0, 869.0, 2828.0, 11146.0, 47039.0, 224684.0, 578951.0, 139591.0, 31123.0, 7544.0, 2045.0, 686.0, 334.0, 178.0, 125.0, 84.0, 68.0, 43.0, 29.0, 29.0, 21.0, 18.0, 11.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.796875, -11.4432373046875, -11.089599609375, -10.7359619140625, -10.38232421875, -10.0286865234375, -9.675048828125, -9.3214111328125, -8.9677734375, -8.6141357421875, -8.260498046875, -7.9068603515625, -7.55322265625, -7.1995849609375, -6.845947265625, -6.4923095703125, -6.138671875, -5.7850341796875, -5.431396484375, -5.0777587890625, -4.72412109375, -4.3704833984375, -4.016845703125, -3.6632080078125, -3.3095703125, -2.9559326171875, -2.602294921875, -2.2486572265625, -1.89501953125, -1.5413818359375, -1.187744140625, -0.8341064453125, -0.48046875, -0.1268310546875, 0.226806640625, 0.5804443359375, 0.93408203125, 1.2877197265625, 1.641357421875, 1.9949951171875, 2.3486328125, 2.7022705078125, 3.055908203125, 3.4095458984375, 3.76318359375, 4.1168212890625, 4.470458984375, 4.8240966796875, 5.177734375, 5.5313720703125, 5.885009765625, 6.2386474609375, 6.59228515625, 6.9459228515625, 7.299560546875, 7.6531982421875, 8.0068359375, 8.3604736328125, 8.714111328125, 9.0677490234375, 9.42138671875, 9.7750244140625, 10.128662109375, 10.4822998046875, 10.8359375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 10.0, 14.0, 10.0, 21.0, 18.0, 16.0, 24.0, 24.0, 34.0, 26.0, 37.0, 35.0, 50.0, 70.0, 86.0, 173.0, 272.0, 1363.0, 165.0, 107.0, 73.0, 66.0, 42.0, 47.0, 35.0, 37.0, 26.0, 24.0, 21.0, 14.0, 14.0, 13.0, 9.0, 11.0, 11.0, 8.0, 2.0, 7.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.875, -17.301513671875, -16.72802734375, -16.154541015625, -15.5810546875, -15.007568359375, -14.43408203125, -13.860595703125, -13.287109375, -12.713623046875, -12.14013671875, -11.566650390625, -10.9931640625, -10.419677734375, -9.84619140625, -9.272705078125, -8.69921875, -8.125732421875, -7.55224609375, -6.978759765625, -6.4052734375, -5.831787109375, -5.25830078125, -4.684814453125, -4.111328125, -3.537841796875, -2.96435546875, -2.390869140625, -1.8173828125, -1.243896484375, -0.67041015625, -0.096923828125, 0.4765625, 1.050048828125, 1.62353515625, 2.197021484375, 2.7705078125, 3.343994140625, 3.91748046875, 4.490966796875, 5.064453125, 5.637939453125, 6.21142578125, 6.784912109375, 7.3583984375, 7.931884765625, 8.50537109375, 9.078857421875, 9.65234375, 10.225830078125, 10.79931640625, 11.372802734375, 11.9462890625, 12.519775390625, 13.09326171875, 13.666748046875, 14.240234375, 14.813720703125, 15.38720703125, 15.960693359375, 16.5341796875, 17.107666015625, 17.68115234375, 18.254638671875, 18.828125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 13.0, 15.0, 29.0, 24.0, 45.0, 66.0, 96.0, 140.0, 309.0, 782.0, 8218.0, 3118575.0, 15686.0, 902.0, 280.0, 175.0, 120.0, 69.0, 54.0, 36.0, 29.0, 13.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.875, -91.7705078125, -88.666015625, -85.5615234375, -82.45703125, -79.3525390625, -76.248046875, -73.1435546875, -70.0390625, -66.9345703125, -63.830078125, -60.7255859375, -57.62109375, -54.5166015625, -51.412109375, -48.3076171875, -45.203125, -42.0986328125, -38.994140625, -35.8896484375, -32.78515625, -29.6806640625, -26.576171875, -23.4716796875, -20.3671875, -17.2626953125, -14.158203125, -11.0537109375, -7.94921875, -4.8447265625, -1.740234375, 1.3642578125, 4.46875, 7.5732421875, 10.677734375, 13.7822265625, 16.88671875, 19.9912109375, 23.095703125, 26.2001953125, 29.3046875, 32.4091796875, 35.513671875, 38.6181640625, 41.72265625, 44.8271484375, 47.931640625, 51.0361328125, 54.140625, 57.2451171875, 60.349609375, 63.4541015625, 66.55859375, 69.6630859375, 72.767578125, 75.8720703125, 78.9765625, 82.0810546875, 85.185546875, 88.2900390625, 91.39453125, 94.4990234375, 97.603515625, 100.7080078125, 103.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 51.0, 181.0, 347.0, 281.0, 120.0, 24.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.45763397216797, -29.720035552978516, -26.982439041137695, -24.244842529296875, -21.507244110107422, -18.76964569091797, -16.03204917907715, -13.294452667236328, -10.556854248046875, -7.819256782531738, -5.081659317016602, -2.344061851501465, 0.3935356140136719, 3.1311330795288086, 5.868730545043945, 8.606327056884766, 11.343925476074219, 14.081522941589355, 16.819120407104492, 19.556716918945312, 22.294315338134766, 25.03191375732422, 27.76951026916504, 30.50710678100586, 33.24470520019531, 35.982303619384766, 38.71990203857422, 41.457496643066406, 44.19509506225586, 46.93269348144531, 49.6702880859375, 52.40788650512695, 55.145477294921875, 57.88307571411133, 60.62067413330078, 63.35826873779297, 66.09587097167969, 68.83346557617188, 71.57106018066406, 74.30865478515625, 77.04625701904297, 79.78385162353516, 82.52145385742188, 85.25904846191406, 87.99664306640625, 90.73424530029297, 93.47183990478516, 96.20944213867188, 98.94703674316406, 101.68463134765625, 104.42223358154297, 107.15982818603516, 109.89743041992188, 112.63502502441406, 115.37261962890625, 118.11021423339844, 120.84781646728516, 123.58541107177734, 126.32301330566406, 129.06060791015625, 131.79820251464844, 134.53579711914062, 137.27340698242188, 140.01100158691406, 142.74859619140625]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 1.0, 9.0, 8.0, 8.0, 15.0, 20.0, 12.0, 19.0, 33.0, 20.0, 40.0, 19.0, 50.0, 32.0, 40.0, 41.0, 54.0, 42.0, 49.0, 47.0, 46.0, 39.0, 45.0, 27.0, 33.0, 40.0, 27.0, 23.0, 20.0, 25.0, 23.0, 15.0, 10.0, 15.0, 11.0, 6.0, 12.0, 4.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.99579620361328, -60.05271911621094, -58.109642028808594, -56.16656494140625, -54.223487854003906, -52.28041076660156, -50.33732986450195, -48.39425277709961, -46.451175689697266, -44.50809860229492, -42.56502151489258, -40.621944427490234, -38.678863525390625, -36.73578643798828, -34.79270935058594, -32.849632263183594, -30.90655517578125, -28.963478088378906, -27.020401000976562, -25.077322006225586, -23.134244918823242, -21.1911678314209, -19.248088836669922, -17.305011749267578, -15.361934661865234, -13.41885757446289, -11.47577953338623, -9.53270149230957, -7.589624404907227, -5.646547317504883, -3.7034692764282227, -1.7603912353515625, 0.18268203735351562, 2.1257596015930176, 4.0688371658325195, 6.0119147300720215, 7.954992294311523, 9.898069381713867, 11.841147422790527, 13.784225463867188, 15.727302551269531, 17.670379638671875, 19.61345672607422, 21.556535720825195, 23.49961280822754, 25.442689895629883, 27.38576889038086, 29.328845977783203, 31.271923065185547, 33.21500015258789, 35.158077239990234, 37.10115432739258, 39.04423522949219, 40.98731231689453, 42.930389404296875, 44.87346649169922, 46.81654357910156, 48.759620666503906, 50.70269775390625, 52.645774841308594, 54.58885192871094, 56.53192901611328, 58.47500991821289, 60.418087005615234, 62.36116409301758]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 6.0, 13.0, 11.0, 9.0, 13.0, 18.0, 17.0, 18.0, 19.0, 33.0, 19.0, 27.0, 43.0, 37.0, 38.0, 34.0, 41.0, 43.0, 50.0, 39.0, 50.0, 27.0, 41.0, 24.0, 48.0, 43.0, 34.0, 37.0, 24.0, 22.0, 20.0, 14.0, 17.0, 13.0, 10.0, 10.0, 4.0, 10.0, 4.0, 4.0, 8.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.20703125, -6.00738525390625, -5.8077392578125, -5.60809326171875, -5.408447265625, -5.20880126953125, -5.0091552734375, -4.80950927734375, -4.60986328125, -4.41021728515625, -4.2105712890625, -4.01092529296875, -3.811279296875, -3.61163330078125, -3.4119873046875, -3.21234130859375, -3.0126953125, -2.81304931640625, -2.6134033203125, -2.41375732421875, -2.214111328125, -2.01446533203125, -1.8148193359375, -1.61517333984375, -1.41552734375, -1.21588134765625, -1.0162353515625, -0.81658935546875, -0.616943359375, -0.41729736328125, -0.2176513671875, -0.01800537109375, 0.181640625, 0.38128662109375, 0.5809326171875, 0.78057861328125, 0.980224609375, 1.17987060546875, 1.3795166015625, 1.57916259765625, 1.77880859375, 1.97845458984375, 2.1781005859375, 2.37774658203125, 2.577392578125, 2.77703857421875, 2.9766845703125, 3.17633056640625, 3.3759765625, 3.57562255859375, 3.7752685546875, 3.97491455078125, 4.174560546875, 4.37420654296875, 4.5738525390625, 4.77349853515625, 4.97314453125, 5.17279052734375, 5.3724365234375, 5.57208251953125, 5.771728515625, 5.97137451171875, 6.1710205078125, 6.37066650390625, 6.5703125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 14.0, 9.0, 18.0, 24.0, 30.0, 34.0, 42.0, 51.0, 97.0, 143.0, 219.0, 361.0, 637.0, 1371.0, 3045.0, 7837.0, 21177.0, 61987.0, 186739.0, 534516.0, 1145860.0, 1240564.0, 637886.0, 232741.0, 76755.0, 25760.0, 9434.0, 3609.0, 1512.0, 703.0, 355.0, 258.0, 139.0, 89.0, 66.0, 48.0, 41.0, 32.0, 20.0, 22.0, 8.0, 9.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.93707275390625, -6.7139892578125, -6.49090576171875, -6.267822265625, -6.04473876953125, -5.8216552734375, -5.59857177734375, -5.37548828125, -5.15240478515625, -4.9293212890625, -4.70623779296875, -4.483154296875, -4.26007080078125, -4.0369873046875, -3.81390380859375, -3.5908203125, -3.36773681640625, -3.1446533203125, -2.92156982421875, -2.698486328125, -2.47540283203125, -2.2523193359375, -2.02923583984375, -1.80615234375, -1.58306884765625, -1.3599853515625, -1.13690185546875, -0.913818359375, -0.69073486328125, -0.4676513671875, -0.24456787109375, -0.021484375, 0.20159912109375, 0.4246826171875, 0.64776611328125, 0.870849609375, 1.09393310546875, 1.3170166015625, 1.54010009765625, 1.76318359375, 1.98626708984375, 2.2093505859375, 2.43243408203125, 2.655517578125, 2.87860107421875, 3.1016845703125, 3.32476806640625, 3.5478515625, 3.77093505859375, 3.9940185546875, 4.21710205078125, 4.440185546875, 4.66326904296875, 4.8863525390625, 5.10943603515625, 5.33251953125, 5.55560302734375, 5.7786865234375, 6.00177001953125, 6.224853515625, 6.44793701171875, 6.6710205078125, 6.89410400390625, 7.1171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 5.0, 12.0, 15.0, 31.0, 39.0, 42.0, 53.0, 77.0, 104.0, 122.0, 188.0, 213.0, 311.0, 346.0, 419.0, 411.0, 386.0, 300.0, 253.0, 183.0, 141.0, 95.0, 80.0, 51.0, 50.0, 33.0, 25.0, 14.0, 23.0, 7.0, 9.0, 6.0, 3.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.4422607421875, -12.087646484375, -11.7330322265625, -11.37841796875, -11.0238037109375, -10.669189453125, -10.3145751953125, -9.9599609375, -9.6053466796875, -9.250732421875, -8.8961181640625, -8.54150390625, -8.1868896484375, -7.832275390625, -7.4776611328125, -7.123046875, -6.7684326171875, -6.413818359375, -6.0592041015625, -5.70458984375, -5.3499755859375, -4.995361328125, -4.6407470703125, -4.2861328125, -3.9315185546875, -3.576904296875, -3.2222900390625, -2.86767578125, -2.5130615234375, -2.158447265625, -1.8038330078125, -1.44921875, -1.0946044921875, -0.739990234375, -0.3853759765625, -0.03076171875, 0.3238525390625, 0.678466796875, 1.0330810546875, 1.3876953125, 1.7423095703125, 2.096923828125, 2.4515380859375, 2.80615234375, 3.1607666015625, 3.515380859375, 3.8699951171875, 4.224609375, 4.5792236328125, 4.933837890625, 5.2884521484375, 5.64306640625, 5.9976806640625, 6.352294921875, 6.7069091796875, 7.0615234375, 7.4161376953125, 7.770751953125, 8.1253662109375, 8.47998046875, 8.8345947265625, 9.189208984375, 9.5438232421875, 9.8984375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 9.0, 13.0, 21.0, 12.0, 41.0, 36.0, 56.0, 71.0, 119.0, 194.0, 327.0, 591.0, 1308.0, 6878.0, 364313.0, 3719018.0, 95396.0, 3544.0, 967.0, 506.0, 289.0, 183.0, 109.0, 86.0, 61.0, 40.0, 25.0, 22.0, 11.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.375, -35.04541015625, -33.7158203125, -32.38623046875, -31.056640625, -29.72705078125, -28.3974609375, -27.06787109375, -25.73828125, -24.40869140625, -23.0791015625, -21.74951171875, -20.419921875, -19.09033203125, -17.7607421875, -16.43115234375, -15.1015625, -13.77197265625, -12.4423828125, -11.11279296875, -9.783203125, -8.45361328125, -7.1240234375, -5.79443359375, -4.46484375, -3.13525390625, -1.8056640625, -0.47607421875, 0.853515625, 2.18310546875, 3.5126953125, 4.84228515625, 6.171875, 7.50146484375, 8.8310546875, 10.16064453125, 11.490234375, 12.81982421875, 14.1494140625, 15.47900390625, 16.80859375, 18.13818359375, 19.4677734375, 20.79736328125, 22.126953125, 23.45654296875, 24.7861328125, 26.11572265625, 27.4453125, 28.77490234375, 30.1044921875, 31.43408203125, 32.763671875, 34.09326171875, 35.4228515625, 36.75244140625, 38.08203125, 39.41162109375, 40.7412109375, 42.07080078125, 43.400390625, 44.72998046875, 46.0595703125, 47.38916015625, 48.71875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 28.0, 64.0, 161.0, 229.0, 246.0, 176.0, 76.0, 24.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.14224243164062, -139.3675994873047, -135.5929718017578, -131.81832885742188, -128.04368591308594, -124.26905059814453, -120.49441528320312, -116.71977233886719, -112.94513702392578, -109.17050170898438, -105.39585876464844, -101.62122344970703, -97.84658813476562, -94.07194519042969, -90.29730987548828, -86.52267456054688, -82.74803161621094, -78.97339630126953, -75.1987533569336, -71.42411804199219, -67.64947509765625, -63.874839782714844, -60.10020446777344, -56.325565338134766, -52.550926208496094, -48.77628707885742, -45.00164794921875, -41.227012634277344, -37.45237350463867, -33.677734375, -29.90309715270996, -26.128459930419922, -22.35381317138672, -18.579174041748047, -14.804536819458008, -11.029898643493652, -7.255260467529297, -3.480621337890625, 0.29401588439941406, 4.068653106689453, 7.843292236328125, 11.61793041229248, 15.392568588256836, 19.167205810546875, 22.941844940185547, 26.71648406982422, 30.491121292114258, 34.2657585144043, 38.04039764404297, 41.81503677368164, 45.58967590332031, 49.36431121826172, 53.13895034790039, 56.91358947753906, 60.68822479248047, 64.46286010742188, 68.23750305175781, 72.01213836669922, 75.78678131103516, 79.56141662597656, 83.3360595703125, 87.1106948852539, 90.88533020019531, 94.65997314453125, 98.43460845947266]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 5.0, 5.0, 1.0, 6.0, 12.0, 3.0, 9.0, 9.0, 20.0, 16.0, 25.0, 22.0, 24.0, 25.0, 23.0, 23.0, 31.0, 26.0, 41.0, 38.0, 33.0, 38.0, 55.0, 32.0, 29.0, 37.0, 29.0, 34.0, 42.0, 30.0, 33.0, 29.0, 16.0, 21.0, 17.0, 27.0, 21.0, 16.0, 24.0, 13.0, 7.0, 14.0, 8.0, 7.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-35.62378692626953, -34.5118293762207, -33.399871826171875, -32.28791427612305, -31.17595672607422, -30.06399917602539, -28.952041625976562, -27.840084075927734, -26.728126525878906, -25.616168975830078, -24.50421142578125, -23.392253875732422, -22.280296325683594, -21.168338775634766, -20.056381225585938, -18.94442367553711, -17.83246421813965, -16.72050666809082, -15.608549118041992, -14.496591567993164, -13.384634017944336, -12.272676467895508, -11.160717964172363, -10.048760414123535, -8.936802864074707, -7.824845314025879, -6.712887763977051, -5.6009297370910645, -4.488972187042236, -3.377014636993408, -2.265056610107422, -1.1530990600585938, -0.041141510009765625, 1.070816159248352, 2.1827738285064697, 3.294731616973877, 4.406689167022705, 5.518646717071533, 6.6306047439575195, 7.742562294006348, 8.854519844055176, 9.966477394104004, 11.078434944152832, 12.190393447875977, 13.302350997924805, 14.414308547973633, 15.526266098022461, 16.63822364807129, 17.750181198120117, 18.862138748168945, 19.974096298217773, 21.0860538482666, 22.19801139831543, 23.309968948364258, 24.42192840576172, 25.533885955810547, 26.645843505859375, 27.757801055908203, 28.86975860595703, 29.98171615600586, 31.093673706054688, 32.205631256103516, 33.317588806152344, 34.42954635620117, 35.54150390625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 3.0, 6.0, 8.0, 11.0, 16.0, 20.0, 14.0, 34.0, 26.0, 30.0, 36.0, 36.0, 29.0, 50.0, 40.0, 40.0, 33.0, 35.0, 43.0, 42.0, 47.0, 40.0, 39.0, 34.0, 33.0, 30.0, 31.0, 29.0, 24.0, 26.0, 24.0, 17.0, 13.0, 10.0, 6.0, 7.0, 5.0, 4.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.51953125, -6.32391357421875, -6.1282958984375, -5.93267822265625, -5.737060546875, -5.54144287109375, -5.3458251953125, -5.15020751953125, -4.95458984375, -4.75897216796875, -4.5633544921875, -4.36773681640625, -4.172119140625, -3.97650146484375, -3.7808837890625, -3.58526611328125, -3.3896484375, -3.19403076171875, -2.9984130859375, -2.80279541015625, -2.607177734375, -2.41156005859375, -2.2159423828125, -2.02032470703125, -1.82470703125, -1.62908935546875, -1.4334716796875, -1.23785400390625, -1.042236328125, -0.84661865234375, -0.6510009765625, -0.45538330078125, -0.259765625, -0.06414794921875, 0.1314697265625, 0.32708740234375, 0.522705078125, 0.71832275390625, 0.9139404296875, 1.10955810546875, 1.30517578125, 1.50079345703125, 1.6964111328125, 1.89202880859375, 2.087646484375, 2.28326416015625, 2.4788818359375, 2.67449951171875, 2.8701171875, 3.06573486328125, 3.2613525390625, 3.45697021484375, 3.652587890625, 3.84820556640625, 4.0438232421875, 4.23944091796875, 4.43505859375, 4.63067626953125, 4.8262939453125, 5.02191162109375, 5.217529296875, 5.41314697265625, 5.6087646484375, 5.80438232421875, 6.0]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 4.0, 9.0, 12.0, 13.0, 27.0, 40.0, 69.0, 82.0, 108.0, 189.0, 275.0, 391.0, 571.0, 801.0, 1230.0, 1773.0, 2622.0, 3738.0, 5622.0, 8186.0, 12013.0, 18296.0, 27356.0, 41023.0, 60246.0, 84446.0, 111608.0, 134231.0, 136670.0, 115003.0, 87894.0, 63067.0, 42924.0, 28928.0, 19267.0, 12804.0, 8675.0, 5809.0, 3920.0, 2694.0, 1883.0, 1292.0, 882.0, 595.0, 397.0, 274.0, 209.0, 130.0, 90.0, 69.0, 49.0, 20.0, 22.0, 2.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.63671875, -0.61553955078125, -0.5943603515625, -0.57318115234375, -0.552001953125, -0.53082275390625, -0.5096435546875, -0.48846435546875, -0.46728515625, -0.44610595703125, -0.4249267578125, -0.40374755859375, -0.382568359375, -0.36138916015625, -0.3402099609375, -0.31903076171875, -0.2978515625, -0.27667236328125, -0.2554931640625, -0.23431396484375, -0.213134765625, -0.19195556640625, -0.1707763671875, -0.14959716796875, -0.12841796875, -0.10723876953125, -0.0860595703125, -0.06488037109375, -0.043701171875, -0.02252197265625, -0.0013427734375, 0.01983642578125, 0.041015625, 0.06219482421875, 0.0833740234375, 0.10455322265625, 0.125732421875, 0.14691162109375, 0.1680908203125, 0.18927001953125, 0.21044921875, 0.23162841796875, 0.2528076171875, 0.27398681640625, 0.295166015625, 0.31634521484375, 0.3375244140625, 0.35870361328125, 0.3798828125, 0.40106201171875, 0.4222412109375, 0.44342041015625, 0.464599609375, 0.48577880859375, 0.5069580078125, 0.52813720703125, 0.54931640625, 0.57049560546875, 0.5916748046875, 0.61285400390625, 0.634033203125, 0.65521240234375, 0.6763916015625, 0.69757080078125, 0.71875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 9.0, 11.0, 8.0, 16.0, 23.0, 30.0, 22.0, 29.0, 37.0, 28.0, 47.0, 44.0, 28.0, 40.0, 48.0, 1070.0, 53.0, 51.0, 43.0, 45.0, 38.0, 36.0, 41.0, 28.0, 32.0, 27.0, 24.0, 22.0, 13.0, 17.0, 10.0, 10.0, 10.0, 7.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.59765625, -5.44146728515625, -5.2852783203125, -5.12908935546875, -4.972900390625, -4.81671142578125, -4.6605224609375, -4.50433349609375, -4.34814453125, -4.19195556640625, -4.0357666015625, -3.87957763671875, -3.723388671875, -3.56719970703125, -3.4110107421875, -3.25482177734375, -3.0986328125, -2.94244384765625, -2.7862548828125, -2.63006591796875, -2.473876953125, -2.31768798828125, -2.1614990234375, -2.00531005859375, -1.84912109375, -1.69293212890625, -1.5367431640625, -1.38055419921875, -1.224365234375, -1.06817626953125, -0.9119873046875, -0.75579833984375, -0.599609375, -0.44342041015625, -0.2872314453125, -0.13104248046875, 0.025146484375, 0.18133544921875, 0.3375244140625, 0.49371337890625, 0.64990234375, 0.80609130859375, 0.9622802734375, 1.11846923828125, 1.274658203125, 1.43084716796875, 1.5870361328125, 1.74322509765625, 1.8994140625, 2.05560302734375, 2.2117919921875, 2.36798095703125, 2.524169921875, 2.68035888671875, 2.8365478515625, 2.99273681640625, 3.14892578125, 3.30511474609375, 3.4613037109375, 3.61749267578125, 3.773681640625, 3.92987060546875, 4.0860595703125, 4.24224853515625, 4.3984375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 15.0, 13.0, 28.0, 30.0, 53.0, 66.0, 114.0, 172.0, 283.0, 395.0, 751.0, 1054.0, 1726.0, 2850.0, 4682.0, 7700.0, 12658.0, 20928.0, 33698.0, 52572.0, 80754.0, 116277.0, 175381.0, 1182060.0, 134186.0, 96376.0, 64439.0, 41162.0, 25922.0, 15617.0, 9747.0, 5828.0, 3657.0, 2228.0, 1403.0, 896.0, 534.0, 330.0, 185.0, 134.0, 66.0, 62.0, 40.0, 22.0, 14.0, 8.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.611328125, -0.5949058532714844, -0.5784835815429688, -0.5620613098144531, -0.5456390380859375, -0.5292167663574219, -0.5127944946289062, -0.4963722229003906, -0.479949951171875, -0.4635276794433594, -0.44710540771484375, -0.4306831359863281, -0.4142608642578125, -0.3978385925292969, -0.38141632080078125, -0.3649940490722656, -0.34857177734375, -0.3321495056152344, -0.31572723388671875, -0.2993049621582031, -0.2828826904296875, -0.2664604187011719, -0.25003814697265625, -0.23361587524414062, -0.217193603515625, -0.20077133178710938, -0.18434906005859375, -0.16792678833007812, -0.1515045166015625, -0.13508224487304688, -0.11865997314453125, -0.10223770141601562, -0.0858154296875, -0.06939315795898438, -0.05297088623046875, -0.036548614501953125, -0.0201263427734375, -0.003704071044921875, 0.01271820068359375, 0.029140472412109375, 0.045562744140625, 0.061985015869140625, 0.07840728759765625, 0.09482955932617188, 0.1112518310546875, 0.12767410278320312, 0.14409637451171875, 0.16051864624023438, 0.17694091796875, 0.19336318969726562, 0.20978546142578125, 0.22620773315429688, 0.2426300048828125, 0.2590522766113281, 0.27547454833984375, 0.2918968200683594, 0.308319091796875, 0.3247413635253906, 0.34116363525390625, 0.3575859069824219, 0.3740081787109375, 0.3904304504394531, 0.40685272216796875, 0.4232749938964844, 0.439697265625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 4.0, 6.0, 5.0, 13.0, 13.0, 10.0, 16.0, 13.0, 24.0, 27.0, 20.0, 40.0, 40.0, 52.0, 67.0, 59.0, 73.0, 64.0, 80.0, 48.0, 45.0, 34.0, 22.0, 35.0, 27.0, 16.0, 23.0, 11.0, 21.0, 12.0, 9.0, 8.0, 8.0, 8.0, 8.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01561737060546875, -0.015056967735290527, -0.014496564865112305, -0.013936161994934082, -0.01337575912475586, -0.012815356254577637, -0.012254953384399414, -0.011694550514221191, -0.011134147644042969, -0.010573744773864746, -0.010013341903686523, -0.0094529390335083, -0.008892536163330078, -0.008332133293151855, -0.007771730422973633, -0.00721132755279541, -0.0066509246826171875, -0.006090521812438965, -0.005530118942260742, -0.0049697160720825195, -0.004409313201904297, -0.0038489103317260742, -0.0032885074615478516, -0.002728104591369629, -0.0021677017211914062, -0.0016072988510131836, -0.001046895980834961, -0.0004864931106567383, 7.390975952148438e-05, 0.000634312629699707, 0.0011947154998779297, 0.0017551183700561523, 0.002315521240234375, 0.0028759241104125977, 0.0034363269805908203, 0.003996729850769043, 0.004557132720947266, 0.005117535591125488, 0.005677938461303711, 0.006238341331481934, 0.006798744201660156, 0.007359147071838379, 0.007919549942016602, 0.008479952812194824, 0.009040355682373047, 0.00960075855255127, 0.010161161422729492, 0.010721564292907715, 0.011281967163085938, 0.01184237003326416, 0.012402772903442383, 0.012963175773620605, 0.013523578643798828, 0.01408398151397705, 0.014644384384155273, 0.015204787254333496, 0.01576519012451172, 0.01632559299468994, 0.016885995864868164, 0.017446398735046387, 0.01800680160522461, 0.018567204475402832, 0.019127607345581055, 0.019688010215759277, 0.0202484130859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 8.0, 14.0, 11.0, 13.0, 24.0, 26.0, 34.0, 44.0, 54.0, 71.0, 82.0, 112.0, 174.0, 307.0, 663.0, 11323.0, 1027789.0, 6237.0, 565.0, 315.0, 165.0, 119.0, 84.0, 63.0, 43.0, 37.0, 25.0, 29.0, 19.0, 15.0, 15.0, 6.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0], "bins": [-0.421630859375, -0.410369873046875, -0.39910888671875, -0.387847900390625, -0.3765869140625, -0.365325927734375, -0.35406494140625, -0.342803955078125, -0.33154296875, -0.320281982421875, -0.30902099609375, -0.297760009765625, -0.2864990234375, -0.275238037109375, -0.26397705078125, -0.252716064453125, -0.241455078125, -0.230194091796875, -0.21893310546875, -0.207672119140625, -0.1964111328125, -0.185150146484375, -0.17388916015625, -0.162628173828125, -0.1513671875, -0.140106201171875, -0.12884521484375, -0.117584228515625, -0.1063232421875, -0.095062255859375, -0.08380126953125, -0.072540283203125, -0.061279296875, -0.050018310546875, -0.03875732421875, -0.027496337890625, -0.0162353515625, -0.004974365234375, 0.00628662109375, 0.017547607421875, 0.02880859375, 0.040069580078125, 0.05133056640625, 0.062591552734375, 0.0738525390625, 0.085113525390625, 0.09637451171875, 0.107635498046875, 0.118896484375, 0.130157470703125, 0.14141845703125, 0.152679443359375, 0.1639404296875, 0.175201416015625, 0.18646240234375, 0.197723388671875, 0.208984375, 0.220245361328125, 0.23150634765625, 0.242767333984375, 0.2540283203125, 0.265289306640625, 0.27655029296875, 0.287811279296875, 0.299072265625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 11.0, 991.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08656884729862213, -0.07344507426023483, -0.06032129377126694, -0.04719752073287964, -0.03407374396920204, -0.020949967205524445, -0.007826194167137146, 0.0052975863218307495, 0.018421359360218048, 0.031545136123895645, 0.04466891288757324, 0.05779268592596054, 0.07091645896434784, 0.08404023945331573, 0.09716401249170303, 0.11028779298067093, 0.12341156601905823, 0.13653534650802612, 0.14965911209583282, 0.16278289258480072, 0.17590667307376862, 0.18903043866157532, 0.2021542191505432, 0.2152779996395111, 0.228401780128479, 0.2415255606174469, 0.2546493411064148, 0.2677730917930603, 0.2808968722820282, 0.2940206527709961, 0.307144433259964, 0.3202682137489319, 0.3333919942378998, 0.3465157747268677, 0.35963955521583557, 0.37276333570480347, 0.385887086391449, 0.39901086688041687, 0.41213464736938477, 0.42525842785835266, 0.43838220834732056, 0.45150598883628845, 0.46462976932525635, 0.47775352001190186, 0.49087730050086975, 0.5040010809898376, 0.5171248912811279, 0.5302486419677734, 0.543372392654419, 0.5564961433410645, 0.5696199536323547, 0.5827437043190002, 0.5958675146102905, 0.608991265296936, 0.6221150159835815, 0.6352388262748718, 0.6483626365661621, 0.6614863872528076, 0.6746101975440979, 0.6877339482307434, 0.7008577585220337, 0.7139815092086792, 0.7271052598953247, 0.740229070186615, 0.7533528208732605]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 8.0, 13.0, 21.0, 28.0, 22.0, 32.0, 42.0, 43.0, 52.0, 58.0, 48.0, 61.0, 59.0, 50.0, 49.0, 56.0, 43.0, 51.0, 43.0, 28.0, 36.0, 31.0, 31.0, 15.0, 13.0, 11.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03833037614822388, -0.037341926246881485, -0.03635347634553909, -0.0353650227189064, -0.03437657281756401, -0.03338812291622162, -0.03239966928958893, -0.031411219388246536, -0.030422769486904144, -0.029434319585561752, -0.02844586782157421, -0.02745741605758667, -0.026468966156244278, -0.025480516254901886, -0.024492064490914345, -0.023503612726926804, -0.02251516282558441, -0.02152671292424202, -0.02053826116025448, -0.019549809396266937, -0.018561359494924545, -0.017572909593582153, -0.016584457829594612, -0.015596006996929646, -0.014607556164264679, -0.013619105331599712, -0.012630654498934746, -0.01164220366626978, -0.010653752833604813, -0.009665302000939846, -0.00867685116827488, -0.007688400335609913, -0.006699949502944946, -0.00571149867027998, -0.004723047837615013, -0.0037345970049500465, -0.00274614617228508, -0.0017576953396201134, -0.0007692445069551468, 0.0002192063257098198, 0.0012076571583747864, 0.002196107991039753, 0.0031845588237047195, 0.004173009656369686, 0.005161460489034653, 0.006149911321699619, 0.007138362154364586, 0.008126812987029552, 0.009115263819694519, 0.010103714652359486, 0.011092165485024452, 0.012080616317689419, 0.013069067150354385, 0.014057517983019352, 0.015045968815684319, 0.01603442057967186, 0.01702287048101425, 0.018011320382356644, 0.018999772146344185, 0.019988223910331726, 0.020976673811674118, 0.02196512371301651, 0.02295357547700405, 0.023942027240991592, 0.024930477142333984]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 11.0, 16.0, 20.0, 14.0, 34.0, 25.0, 31.0, 35.0, 37.0, 28.0, 49.0, 42.0, 40.0, 33.0, 33.0, 44.0, 43.0, 47.0, 39.0, 39.0, 33.0, 35.0, 30.0, 31.0, 29.0, 24.0, 26.0, 23.0, 18.0, 13.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.5234375, -6.3277587890625, -6.132080078125, -5.9364013671875, -5.74072265625, -5.5450439453125, -5.349365234375, -5.1536865234375, -4.9580078125, -4.7623291015625, -4.566650390625, -4.3709716796875, -4.17529296875, -3.9796142578125, -3.783935546875, -3.5882568359375, -3.392578125, -3.1968994140625, -3.001220703125, -2.8055419921875, -2.60986328125, -2.4141845703125, -2.218505859375, -2.0228271484375, -1.8271484375, -1.6314697265625, -1.435791015625, -1.2401123046875, -1.04443359375, -0.8487548828125, -0.653076171875, -0.4573974609375, -0.26171875, -0.0660400390625, 0.129638671875, 0.3253173828125, 0.52099609375, 0.7166748046875, 0.912353515625, 1.1080322265625, 1.3037109375, 1.4993896484375, 1.695068359375, 1.8907470703125, 2.08642578125, 2.2821044921875, 2.477783203125, 2.6734619140625, 2.869140625, 3.0648193359375, 3.260498046875, 3.4561767578125, 3.65185546875, 3.8475341796875, 4.043212890625, 4.2388916015625, 4.4345703125, 4.6302490234375, 4.825927734375, 5.0216064453125, 5.21728515625, 5.4129638671875, 5.608642578125, 5.8043212890625, 6.0]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 15.0, 13.0, 23.0, 42.0, 63.0, 88.0, 145.0, 286.0, 525.0, 961.0, 1651.0, 3260.0, 6111.0, 11118.0, 20697.0, 39857.0, 84387.0, 199238.0, 320034.0, 194535.0, 82340.0, 39026.0, 20386.0, 10873.0, 5768.0, 3213.0, 1668.0, 941.0, 505.0, 299.0, 172.0, 105.0, 55.0, 40.0, 19.0, 21.0, 11.0, 14.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.78515625, -6.58251953125, -6.3798828125, -6.17724609375, -5.974609375, -5.77197265625, -5.5693359375, -5.36669921875, -5.1640625, -4.96142578125, -4.7587890625, -4.55615234375, -4.353515625, -4.15087890625, -3.9482421875, -3.74560546875, -3.54296875, -3.34033203125, -3.1376953125, -2.93505859375, -2.732421875, -2.52978515625, -2.3271484375, -2.12451171875, -1.921875, -1.71923828125, -1.5166015625, -1.31396484375, -1.111328125, -0.90869140625, -0.7060546875, -0.50341796875, -0.30078125, -0.09814453125, 0.1044921875, 0.30712890625, 0.509765625, 0.71240234375, 0.9150390625, 1.11767578125, 1.3203125, 1.52294921875, 1.7255859375, 1.92822265625, 2.130859375, 2.33349609375, 2.5361328125, 2.73876953125, 2.94140625, 3.14404296875, 3.3466796875, 3.54931640625, 3.751953125, 3.95458984375, 4.1572265625, 4.35986328125, 4.5625, 4.76513671875, 4.9677734375, 5.17041015625, 5.373046875, 5.57568359375, 5.7783203125, 5.98095703125, 6.18359375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 9.0, 9.0, 17.0, 12.0, 22.0, 13.0, 27.0, 33.0, 38.0, 41.0, 51.0, 44.0, 57.0, 111.0, 173.0, 1452.0, 359.0, 151.0, 76.0, 69.0, 34.0, 54.0, 27.0, 31.0, 27.0, 22.0, 20.0, 18.0, 12.0, 7.0, 4.0, 4.0, 9.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.428466796875, -16.66943359375, -15.910400390625, -15.1513671875, -14.392333984375, -13.63330078125, -12.874267578125, -12.115234375, -11.356201171875, -10.59716796875, -9.838134765625, -9.0791015625, -8.320068359375, -7.56103515625, -6.802001953125, -6.04296875, -5.283935546875, -4.52490234375, -3.765869140625, -3.0068359375, -2.247802734375, -1.48876953125, -0.729736328125, 0.029296875, 0.788330078125, 1.54736328125, 2.306396484375, 3.0654296875, 3.824462890625, 4.58349609375, 5.342529296875, 6.1015625, 6.860595703125, 7.61962890625, 8.378662109375, 9.1376953125, 9.896728515625, 10.65576171875, 11.414794921875, 12.173828125, 12.932861328125, 13.69189453125, 14.450927734375, 15.2099609375, 15.968994140625, 16.72802734375, 17.487060546875, 18.24609375, 19.005126953125, 19.76416015625, 20.523193359375, 21.2822265625, 22.041259765625, 22.80029296875, 23.559326171875, 24.318359375, 25.077392578125, 25.83642578125, 26.595458984375, 27.3544921875, 28.113525390625, 28.87255859375, 29.631591796875, 30.390625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 13.0, 12.0, 12.0, 26.0, 28.0, 48.0, 73.0, 96.0, 151.0, 229.0, 396.0, 974.0, 8720.0, 1234248.0, 1887589.0, 10809.0, 1028.0, 404.0, 280.0, 147.0, 111.0, 80.0, 51.0, 40.0, 25.0, 18.0, 19.0, 12.0, 9.0, 11.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.1875, -45.71435546875, -44.2412109375, -42.76806640625, -41.294921875, -39.82177734375, -38.3486328125, -36.87548828125, -35.40234375, -33.92919921875, -32.4560546875, -30.98291015625, -29.509765625, -28.03662109375, -26.5634765625, -25.09033203125, -23.6171875, -22.14404296875, -20.6708984375, -19.19775390625, -17.724609375, -16.25146484375, -14.7783203125, -13.30517578125, -11.83203125, -10.35888671875, -8.8857421875, -7.41259765625, -5.939453125, -4.46630859375, -2.9931640625, -1.52001953125, -0.046875, 1.42626953125, 2.8994140625, 4.37255859375, 5.845703125, 7.31884765625, 8.7919921875, 10.26513671875, 11.73828125, 13.21142578125, 14.6845703125, 16.15771484375, 17.630859375, 19.10400390625, 20.5771484375, 22.05029296875, 23.5234375, 24.99658203125, 26.4697265625, 27.94287109375, 29.416015625, 30.88916015625, 32.3623046875, 33.83544921875, 35.30859375, 36.78173828125, 38.2548828125, 39.72802734375, 41.201171875, 42.67431640625, 44.1474609375, 45.62060546875, 47.09375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [117.0, 825.0, 76.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.943163871765137, -3.9436283111572266, 5.055907249450684, 14.05544376373291, 23.054977416992188, 32.05451202392578, 41.05405044555664, 50.053585052490234, 59.05311965942383, 68.05265808105469, 77.05219268798828, 86.05172729492188, 95.05126190185547, 104.05079650878906, 113.05033874511719, 122.04986572265625, 131.04940795898438, 140.0489501953125, 149.04847717285156, 158.0480194091797, 167.04754638671875, 176.04708862304688, 185.046630859375, 194.04615783691406, 203.04568481445312, 212.04522705078125, 221.0447540283203, 230.04429626464844, 239.0438232421875, 248.04336547851562, 257.04290771484375, 266.04241943359375, 275.0419616699219, 284.04150390625, 293.0410461425781, 302.0405578613281, 311.04010009765625, 320.0396423339844, 329.0391845703125, 338.0386962890625, 347.0382385253906, 356.03778076171875, 365.0373229980469, 374.0368347167969, 383.036376953125, 392.0359191894531, 401.03546142578125, 410.03497314453125, 419.0345458984375, 428.0340881347656, 437.03363037109375, 446.03314208984375, 455.0326843261719, 464.0322265625, 473.0317687988281, 482.03131103515625, 491.03082275390625, 500.0303649902344, 509.0299072265625, 518.0294189453125, 527.0289916992188, 536.0285034179688, 545.0280151367188, 554.027587890625, 563.027099609375]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 9.0, 6.0, 10.0, 16.0, 15.0, 28.0, 22.0, 24.0, 22.0, 29.0, 39.0, 28.0, 33.0, 34.0, 41.0, 39.0, 46.0, 42.0, 44.0, 50.0, 37.0, 39.0, 32.0, 32.0, 33.0, 34.0, 26.0, 22.0, 17.0, 23.0, 16.0, 15.0, 18.0, 14.0, 12.0, 12.0, 6.0, 5.0, 6.0, 9.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.73203659057617, -51.995750427246094, -50.25946044921875, -48.52317428588867, -46.786888122558594, -45.05059814453125, -43.31431198120117, -41.578025817871094, -39.84173583984375, -38.10544967651367, -36.36915969848633, -34.63287353515625, -32.896583557128906, -31.160297393798828, -29.42401123046875, -27.68772315979004, -25.951435089111328, -24.215147018432617, -22.478858947753906, -20.742572784423828, -19.006284713745117, -17.269996643066406, -15.533709526062012, -13.797422409057617, -12.061134338378906, -10.324846267700195, -8.5885591506958, -6.852271556854248, -5.115983963012695, -3.3796958923339844, -1.6434087753295898, 0.09287834167480469, 1.8291702270507812, 3.565457820892334, 5.301745414733887, 7.0380330085754395, 8.774320602416992, 10.510608673095703, 12.246895790100098, 13.983182907104492, 15.719470977783203, 17.455759048461914, 19.192047119140625, 20.928333282470703, 22.664621353149414, 24.400909423828125, 26.137195587158203, 27.873483657836914, 29.609771728515625, 31.346059799194336, 33.08234786987305, 34.818634033203125, 36.55492401123047, 38.29121017456055, 40.027496337890625, 41.76378631591797, 43.50007247924805, 45.236358642578125, 46.97264862060547, 48.70893478393555, 50.445220947265625, 52.18151092529297, 53.91779708862305, 55.654083251953125, 57.39037322998047]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 18.0, 11.0, 10.0, 17.0, 18.0, 20.0, 27.0, 28.0, 36.0, 28.0, 43.0, 38.0, 40.0, 30.0, 37.0, 44.0, 39.0, 39.0, 41.0, 32.0, 40.0, 42.0, 31.0, 35.0, 28.0, 29.0, 19.0, 20.0, 19.0, 26.0, 17.0, 10.0, 16.0, 9.0, 7.0, 9.0, 4.0, 6.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-6.3515625, -6.15716552734375, -5.9627685546875, -5.76837158203125, -5.573974609375, -5.37957763671875, -5.1851806640625, -4.99078369140625, -4.79638671875, -4.60198974609375, -4.4075927734375, -4.21319580078125, -4.018798828125, -3.82440185546875, -3.6300048828125, -3.43560791015625, -3.2412109375, -3.04681396484375, -2.8524169921875, -2.65802001953125, -2.463623046875, -2.26922607421875, -2.0748291015625, -1.88043212890625, -1.68603515625, -1.49163818359375, -1.2972412109375, -1.10284423828125, -0.908447265625, -0.71405029296875, -0.5196533203125, -0.32525634765625, -0.130859375, 0.06353759765625, 0.2579345703125, 0.45233154296875, 0.646728515625, 0.84112548828125, 1.0355224609375, 1.22991943359375, 1.42431640625, 1.61871337890625, 1.8131103515625, 2.00750732421875, 2.201904296875, 2.39630126953125, 2.5906982421875, 2.78509521484375, 2.9794921875, 3.17388916015625, 3.3682861328125, 3.56268310546875, 3.757080078125, 3.95147705078125, 4.1458740234375, 4.34027099609375, 4.53466796875, 4.72906494140625, 4.9234619140625, 5.11785888671875, 5.312255859375, 5.50665283203125, 5.7010498046875, 5.89544677734375, 6.08984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 8.0, 7.0, 9.0, 20.0, 12.0, 21.0, 21.0, 29.0, 30.0, 59.0, 91.0, 168.0, 366.0, 915.0, 3072.0, 13985.0, 83005.0, 568183.0, 2215719.0, 1106301.0, 168220.0, 26234.0, 5288.0, 1412.0, 492.0, 227.0, 104.0, 59.0, 34.0, 30.0, 19.0, 23.0, 19.0, 15.0, 13.0, 9.0, 11.0, 5.0, 7.0, 4.0, 3.0, 7.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.8255615234375, -11.440185546875, -11.0548095703125, -10.66943359375, -10.2840576171875, -9.898681640625, -9.5133056640625, -9.1279296875, -8.7425537109375, -8.357177734375, -7.9718017578125, -7.58642578125, -7.2010498046875, -6.815673828125, -6.4302978515625, -6.044921875, -5.6595458984375, -5.274169921875, -4.8887939453125, -4.50341796875, -4.1180419921875, -3.732666015625, -3.3472900390625, -2.9619140625, -2.5765380859375, -2.191162109375, -1.8057861328125, -1.42041015625, -1.0350341796875, -0.649658203125, -0.2642822265625, 0.12109375, 0.5064697265625, 0.891845703125, 1.2772216796875, 1.66259765625, 2.0479736328125, 2.433349609375, 2.8187255859375, 3.2041015625, 3.5894775390625, 3.974853515625, 4.3602294921875, 4.74560546875, 5.1309814453125, 5.516357421875, 5.9017333984375, 6.287109375, 6.6724853515625, 7.057861328125, 7.4432373046875, 7.82861328125, 8.2139892578125, 8.599365234375, 8.9847412109375, 9.3701171875, 9.7554931640625, 10.140869140625, 10.5262451171875, 10.91162109375, 11.2969970703125, 11.682373046875, 12.0677490234375, 12.453125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 0.0, 2.0, 3.0, 5.0, 13.0, 8.0, 6.0, 21.0, 22.0, 34.0, 34.0, 37.0, 52.0, 77.0, 102.0, 108.0, 158.0, 204.0, 265.0, 315.0, 357.0, 404.0, 354.0, 312.0, 278.0, 208.0, 149.0, 137.0, 101.0, 63.0, 59.0, 42.0, 31.0, 30.0, 27.0, 20.0, 10.0, 3.0, 5.0, 8.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.3101806640625, -8.018798828125, -7.7274169921875, -7.43603515625, -7.1446533203125, -6.853271484375, -6.5618896484375, -6.2705078125, -5.9791259765625, -5.687744140625, -5.3963623046875, -5.10498046875, -4.8135986328125, -4.522216796875, -4.2308349609375, -3.939453125, -3.6480712890625, -3.356689453125, -3.0653076171875, -2.77392578125, -2.4825439453125, -2.191162109375, -1.8997802734375, -1.6083984375, -1.3170166015625, -1.025634765625, -0.7342529296875, -0.44287109375, -0.1514892578125, 0.139892578125, 0.4312744140625, 0.72265625, 1.0140380859375, 1.305419921875, 1.5968017578125, 1.88818359375, 2.1795654296875, 2.470947265625, 2.7623291015625, 3.0537109375, 3.3450927734375, 3.636474609375, 3.9278564453125, 4.21923828125, 4.5106201171875, 4.802001953125, 5.0933837890625, 5.384765625, 5.6761474609375, 5.967529296875, 6.2589111328125, 6.55029296875, 6.8416748046875, 7.133056640625, 7.4244384765625, 7.7158203125, 8.0072021484375, 8.298583984375, 8.5899658203125, 8.88134765625, 9.1727294921875, 9.464111328125, 9.7554931640625, 10.046875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 12.0, 19.0, 23.0, 34.0, 45.0, 56.0, 66.0, 97.0, 131.0, 195.0, 256.0, 418.0, 932.0, 4918.0, 77169.0, 2333270.0, 1715316.0, 55251.0, 3887.0, 807.0, 382.0, 267.0, 166.0, 125.0, 104.0, 84.0, 62.0, 44.0, 27.0, 21.0, 23.0, 16.0, 9.0, 5.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.937744140625, -34.93798828125, -33.938232421875, -32.9384765625, -31.938720703125, -30.93896484375, -29.939208984375, -28.939453125, -27.939697265625, -26.93994140625, -25.940185546875, -24.9404296875, -23.940673828125, -22.94091796875, -21.941162109375, -20.94140625, -19.941650390625, -18.94189453125, -17.942138671875, -16.9423828125, -15.942626953125, -14.94287109375, -13.943115234375, -12.943359375, -11.943603515625, -10.94384765625, -9.944091796875, -8.9443359375, -7.944580078125, -6.94482421875, -5.945068359375, -4.9453125, -3.945556640625, -2.94580078125, -1.946044921875, -0.9462890625, 0.053466796875, 1.05322265625, 2.052978515625, 3.052734375, 4.052490234375, 5.05224609375, 6.052001953125, 7.0517578125, 8.051513671875, 9.05126953125, 10.051025390625, 11.05078125, 12.050537109375, 13.05029296875, 14.050048828125, 15.0498046875, 16.049560546875, 17.04931640625, 18.049072265625, 19.048828125, 20.048583984375, 21.04833984375, 22.048095703125, 23.0478515625, 24.047607421875, 25.04736328125, 26.047119140625, 27.046875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 22.0, 196.0, 448.0, 296.0, 49.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.59033203125, -212.85984802246094, -206.1293487548828, -199.39886474609375, -192.66836547851562, -185.93788146972656, -179.2073974609375, -172.47689819335938, -165.74639892578125, -159.0159149169922, -152.28541564941406, -145.554931640625, -138.82443237304688, -132.0939483642578, -125.36345672607422, -118.63296508789062, -111.90248107910156, -105.17198944091797, -98.44149780273438, -91.71101379394531, -84.98051452636719, -78.25003051757812, -71.51953887939453, -64.78904724121094, -58.058555603027344, -51.32806396484375, -44.597572326660156, -37.86708450317383, -31.136592864990234, -24.40610122680664, -17.675613403320312, -10.945121765136719, -4.2146148681640625, 2.515875816345215, 9.246366500854492, 15.976856231689453, 22.707347869873047, 29.43783950805664, 36.16832733154297, 42.89881896972656, 49.629310607910156, 56.35980224609375, 63.090293884277344, 69.82078552246094, 76.55126953125, 83.28176879882812, 90.01225280761719, 96.74274444580078, 103.47323608398438, 110.20372772216797, 116.93421936035156, 123.66470336914062, 130.39520263671875, 137.1256866455078, 143.85617065429688, 150.586669921875, 157.31716918945312, 164.0476531982422, 170.7781524658203, 177.50863647460938, 184.2391357421875, 190.96961975097656, 197.70010375976562, 204.43060302734375, 211.1610870361328]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 7.0, 3.0, 13.0, 11.0, 10.0, 25.0, 15.0, 22.0, 16.0, 18.0, 26.0, 29.0, 35.0, 30.0, 36.0, 49.0, 40.0, 43.0, 35.0, 43.0, 36.0, 30.0, 29.0, 35.0, 36.0, 41.0, 46.0, 39.0, 21.0, 26.0, 19.0, 28.0, 22.0, 17.0, 18.0, 9.0, 6.0, 10.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-35.08148956298828, -33.992820739746094, -32.904151916503906, -31.81548500061035, -30.726818084716797, -29.63814926147461, -28.549480438232422, -27.460813522338867, -26.372146606445312, -25.283477783203125, -24.19481086730957, -23.106142044067383, -22.017475128173828, -20.92880630493164, -19.840137481689453, -18.7514705657959, -17.66280174255371, -16.574132919311523, -15.485466003417969, -14.396797180175781, -13.308130264282227, -12.219461441040039, -11.130793571472168, -10.042125701904297, -8.953457832336426, -7.864789962768555, -6.776122093200684, -5.687453746795654, -4.598785877227783, -3.510118007659912, -2.421449661254883, -1.3327817916870117, -0.24411392211914062, 0.84455406665802, 1.9332220554351807, 3.021890163421631, 4.110558032989502, 5.199225902557373, 6.287894248962402, 7.376562118530273, 8.465229988098145, 9.553897857666016, 10.642565727233887, 11.731233596801758, 12.819902420043945, 13.9085693359375, 14.997238159179688, 16.085906982421875, 17.17457389831543, 18.263242721557617, 19.351909637451172, 20.44057846069336, 21.529245376586914, 22.6179141998291, 23.706581115722656, 24.795249938964844, 25.88391876220703, 26.97258758544922, 28.061254501342773, 29.14992332458496, 30.238590240478516, 31.327259063720703, 32.41592788696289, 33.50459289550781, 34.59326171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 25.0, 13.0, 11.0, 21.0, 14.0, 26.0, 26.0, 22.0, 19.0, 47.0, 31.0, 30.0, 33.0, 47.0, 39.0, 31.0, 44.0, 53.0, 37.0, 46.0, 40.0, 33.0, 34.0, 30.0, 30.0, 28.0, 21.0, 18.0, 18.0, 21.0, 14.0, 13.0, 20.0, 9.0, 10.0, 3.0, 6.0, 4.0, 9.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.45703125, -6.2664794921875, -6.075927734375, -5.8853759765625, -5.69482421875, -5.5042724609375, -5.313720703125, -5.1231689453125, -4.9326171875, -4.7420654296875, -4.551513671875, -4.3609619140625, -4.17041015625, -3.9798583984375, -3.789306640625, -3.5987548828125, -3.408203125, -3.2176513671875, -3.027099609375, -2.8365478515625, -2.64599609375, -2.4554443359375, -2.264892578125, -2.0743408203125, -1.8837890625, -1.6932373046875, -1.502685546875, -1.3121337890625, -1.12158203125, -0.9310302734375, -0.740478515625, -0.5499267578125, -0.359375, -0.1688232421875, 0.021728515625, 0.2122802734375, 0.40283203125, 0.5933837890625, 0.783935546875, 0.9744873046875, 1.1650390625, 1.3555908203125, 1.546142578125, 1.7366943359375, 1.92724609375, 2.1177978515625, 2.308349609375, 2.4989013671875, 2.689453125, 2.8800048828125, 3.070556640625, 3.2611083984375, 3.45166015625, 3.6422119140625, 3.832763671875, 4.0233154296875, 4.2138671875, 4.4044189453125, 4.594970703125, 4.7855224609375, 4.97607421875, 5.1666259765625, 5.357177734375, 5.5477294921875, 5.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 15.0, 17.0, 24.0, 45.0, 60.0, 114.0, 166.0, 218.0, 352.0, 545.0, 841.0, 1181.0, 1817.0, 2808.0, 4172.0, 6139.0, 9230.0, 14070.0, 21483.0, 32464.0, 49304.0, 72841.0, 103788.0, 137073.0, 150790.0, 132778.0, 99880.0, 69216.0, 46506.0, 30704.0, 20140.0, 13417.0, 8944.0, 5871.0, 3968.0, 2489.0, 1732.0, 1126.0, 792.0, 441.0, 330.0, 216.0, 155.0, 80.0, 69.0, 48.0, 29.0, 21.0, 14.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.7177734375, -0.6949386596679688, -0.6721038818359375, -0.6492691040039062, -0.626434326171875, -0.6035995483398438, -0.5807647705078125, -0.5579299926757812, -0.53509521484375, -0.5122604370117188, -0.4894256591796875, -0.46659088134765625, -0.443756103515625, -0.42092132568359375, -0.3980865478515625, -0.37525177001953125, -0.3524169921875, -0.32958221435546875, -0.3067474365234375, -0.28391265869140625, -0.261077880859375, -0.23824310302734375, -0.2154083251953125, -0.19257354736328125, -0.16973876953125, -0.14690399169921875, -0.1240692138671875, -0.10123443603515625, -0.078399658203125, -0.05556488037109375, -0.0327301025390625, -0.00989532470703125, 0.012939453125, 0.03577423095703125, 0.0586090087890625, 0.08144378662109375, 0.104278564453125, 0.12711334228515625, 0.1499481201171875, 0.17278289794921875, 0.19561767578125, 0.21845245361328125, 0.2412872314453125, 0.26412200927734375, 0.286956787109375, 0.30979156494140625, 0.3326263427734375, 0.35546112060546875, 0.3782958984375, 0.40113067626953125, 0.4239654541015625, 0.44680023193359375, 0.469635009765625, 0.49246978759765625, 0.5153045654296875, 0.5381393432617188, 0.56097412109375, 0.5838088989257812, 0.6066436767578125, 0.6294784545898438, 0.652313232421875, 0.6751480102539062, 0.6979827880859375, 0.7208175659179688, 0.74365234375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 3.0, 5.0, 9.0, 10.0, 4.0, 16.0, 17.0, 24.0, 19.0, 22.0, 27.0, 26.0, 42.0, 44.0, 40.0, 42.0, 49.0, 46.0, 51.0, 1088.0, 47.0, 56.0, 37.0, 47.0, 23.0, 28.0, 33.0, 33.0, 24.0, 20.0, 25.0, 14.0, 16.0, 3.0, 8.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76983642578125, -4.6217041015625, -4.47357177734375, -4.325439453125, -4.17730712890625, -4.0291748046875, -3.88104248046875, -3.73291015625, -3.58477783203125, -3.4366455078125, -3.28851318359375, -3.140380859375, -2.99224853515625, -2.8441162109375, -2.69598388671875, -2.5478515625, -2.39971923828125, -2.2515869140625, -2.10345458984375, -1.955322265625, -1.80718994140625, -1.6590576171875, -1.51092529296875, -1.36279296875, -1.21466064453125, -1.0665283203125, -0.91839599609375, -0.770263671875, -0.62213134765625, -0.4739990234375, -0.32586669921875, -0.177734375, -0.02960205078125, 0.1185302734375, 0.26666259765625, 0.414794921875, 0.56292724609375, 0.7110595703125, 0.85919189453125, 1.00732421875, 1.15545654296875, 1.3035888671875, 1.45172119140625, 1.599853515625, 1.74798583984375, 1.8961181640625, 2.04425048828125, 2.1923828125, 2.34051513671875, 2.4886474609375, 2.63677978515625, 2.784912109375, 2.93304443359375, 3.0811767578125, 3.22930908203125, 3.37744140625, 3.52557373046875, 3.6737060546875, 3.82183837890625, 3.969970703125, 4.11810302734375, 4.2662353515625, 4.41436767578125, 4.5625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 15.0, 17.0, 28.0, 40.0, 66.0, 76.0, 117.0, 203.0, 373.0, 517.0, 838.0, 1446.0, 2378.0, 4080.0, 6723.0, 11375.0, 19488.0, 33038.0, 54983.0, 87873.0, 131004.0, 424500.0, 957678.0, 131831.0, 89594.0, 56198.0, 33639.0, 19938.0, 11695.0, 7136.0, 4064.0, 2421.0, 1434.0, 864.0, 524.0, 343.0, 208.0, 128.0, 82.0, 60.0, 47.0, 17.0, 11.0, 10.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.59521484375, -0.5777206420898438, -0.5602264404296875, -0.5427322387695312, -0.525238037109375, -0.5077438354492188, -0.4902496337890625, -0.47275543212890625, -0.45526123046875, -0.43776702880859375, -0.4202728271484375, -0.40277862548828125, -0.385284423828125, -0.36779022216796875, -0.3502960205078125, -0.33280181884765625, -0.3153076171875, -0.29781341552734375, -0.2803192138671875, -0.26282501220703125, -0.245330810546875, -0.22783660888671875, -0.2103424072265625, -0.19284820556640625, -0.17535400390625, -0.15785980224609375, -0.1403656005859375, -0.12287139892578125, -0.105377197265625, -0.08788299560546875, -0.0703887939453125, -0.05289459228515625, -0.035400390625, -0.01790618896484375, -0.0004119873046875, 0.01708221435546875, 0.034576416015625, 0.05207061767578125, 0.0695648193359375, 0.08705902099609375, 0.10455322265625, 0.12204742431640625, 0.1395416259765625, 0.15703582763671875, 0.174530029296875, 0.19202423095703125, 0.2095184326171875, 0.22701263427734375, 0.2445068359375, 0.26200103759765625, 0.2794952392578125, 0.29698944091796875, 0.314483642578125, 0.33197784423828125, 0.3494720458984375, 0.36696624755859375, 0.38446044921875, 0.40195465087890625, 0.4194488525390625, 0.43694305419921875, 0.454437255859375, 0.47193145751953125, 0.4894256591796875, 0.5069198608398438, 0.5244140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 2.0, 4.0, 8.0, 12.0, 15.0, 15.0, 17.0, 23.0, 18.0, 19.0, 30.0, 41.0, 23.0, 38.0, 46.0, 73.0, 77.0, 71.0, 72.0, 48.0, 53.0, 33.0, 29.0, 32.0, 23.0, 23.0, 20.0, 13.0, 15.0, 16.0, 10.0, 11.0, 9.0, 6.0, 9.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0120086669921875, -0.011686563491821289, -0.011364459991455078, -0.011042356491088867, -0.010720252990722656, -0.010398149490356445, -0.010076045989990234, -0.009753942489624023, -0.009431838989257812, -0.009109735488891602, -0.00878763198852539, -0.00846552848815918, -0.008143424987792969, -0.007821321487426758, -0.007499217987060547, -0.007177114486694336, -0.006855010986328125, -0.006532907485961914, -0.006210803985595703, -0.005888700485229492, -0.005566596984863281, -0.00524449348449707, -0.004922389984130859, -0.0046002864837646484, -0.0042781829833984375, -0.0039560794830322266, -0.0036339759826660156, -0.0033118724822998047, -0.0029897689819335938, -0.002667665481567383, -0.002345561981201172, -0.002023458480834961, -0.00170135498046875, -0.001379251480102539, -0.0010571479797363281, -0.0007350444793701172, -0.00041294097900390625, -9.083747863769531e-05, 0.00023126602172851562, 0.0005533695220947266, 0.0008754730224609375, 0.0011975765228271484, 0.0015196800231933594, 0.0018417835235595703, 0.0021638870239257812, 0.002485990524291992, 0.002808094024658203, 0.003130197525024414, 0.003452301025390625, 0.003774404525756836, 0.004096508026123047, 0.004418611526489258, 0.004740715026855469, 0.00506281852722168, 0.005384922027587891, 0.0057070255279541016, 0.0060291290283203125, 0.0063512325286865234, 0.006673336029052734, 0.006995439529418945, 0.007317543029785156, 0.007639646530151367, 0.007961750030517578, 0.008283853530883789, 0.00860595703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 5.0, 9.0, 10.0, 14.0, 17.0, 16.0, 25.0, 31.0, 45.0, 52.0, 85.0, 88.0, 170.0, 269.0, 510.0, 4242.0, 1028796.0, 12550.0, 666.0, 291.0, 181.0, 127.0, 82.0, 50.0, 39.0, 42.0, 22.0, 32.0, 20.0, 8.0, 10.0, 6.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20263671875, -0.19501876831054688, -0.18740081787109375, -0.17978286743164062, -0.1721649169921875, -0.16454696655273438, -0.15692901611328125, -0.14931106567382812, -0.141693115234375, -0.13407516479492188, -0.12645721435546875, -0.11883926391601562, -0.1112213134765625, -0.10360336303710938, -0.09598541259765625, -0.08836746215820312, -0.08074951171875, -0.07313156127929688, -0.06551361083984375, -0.057895660400390625, -0.0502777099609375, -0.042659759521484375, -0.03504180908203125, -0.027423858642578125, -0.019805908203125, -0.012187957763671875, -0.00457000732421875, 0.003047943115234375, 0.0106658935546875, 0.018283843994140625, 0.02590179443359375, 0.033519744873046875, 0.0411376953125, 0.048755645751953125, 0.05637359619140625, 0.06399154663085938, 0.0716094970703125, 0.07922744750976562, 0.08684539794921875, 0.09446334838867188, 0.102081298828125, 0.10969924926757812, 0.11731719970703125, 0.12493515014648438, 0.1325531005859375, 0.14017105102539062, 0.14778900146484375, 0.15540695190429688, 0.16302490234375, 0.17064285278320312, 0.17826080322265625, 0.18587875366210938, 0.1934967041015625, 0.20111465454101562, 0.20873260498046875, 0.21635055541992188, 0.223968505859375, 0.23158645629882812, 0.23920440673828125, 0.24682235717773438, 0.2544403076171875, 0.2620582580566406, 0.26967620849609375, 0.2772941589355469, 0.284912109375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 153.0, 865.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09518353641033173, -0.08733966946601868, -0.07949580997228622, -0.07165194302797318, -0.06380808353424072, -0.05596421658992767, -0.048120349645614624, -0.04027648642659187, -0.03243262320756912, -0.02458875998854637, -0.01674489490687847, -0.008901029825210571, -0.0010571666061878204, 0.00678669661283493, 0.01463056355714798, 0.02247442677617073, 0.03031828999519348, 0.03816215321421623, 0.04600601643323898, 0.05384988337755203, 0.06169374659657478, 0.06953760981559753, 0.07738147675991058, 0.08522534370422363, 0.09306920319795609, 0.10091307014226913, 0.10875692963600159, 0.11660079658031464, 0.12444466352462769, 0.13228851556777954, 0.14013239741325378, 0.14797624945640564, 0.1558201014995575, 0.16366396844387054, 0.1715078353881836, 0.17935168743133545, 0.1871955543756485, 0.19503942131996155, 0.2028832882642746, 0.21072715520858765, 0.2185710072517395, 0.22641487419605255, 0.2342587411403656, 0.24210259318351746, 0.2499464601278305, 0.25779032707214355, 0.2656341791152954, 0.27347806096076965, 0.2813219428062439, 0.28916579484939575, 0.29700967669487, 0.30485352873802185, 0.3126974105834961, 0.32054126262664795, 0.3283851146697998, 0.33622899651527405, 0.3440728485584259, 0.35191670060157776, 0.359760582447052, 0.36760443449020386, 0.3754483163356781, 0.38329216837882996, 0.3911360502243042, 0.39897990226745605, 0.4068237543106079]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 15.0, 9.0, 17.0, 16.0, 26.0, 20.0, 31.0, 51.0, 39.0, 41.0, 44.0, 69.0, 55.0, 60.0, 60.0, 65.0, 35.0, 60.0, 62.0, 41.0, 38.0, 26.0, 28.0, 21.0, 14.0, 22.0, 13.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019495010375976562, -0.01893671602010727, -0.018378421664237976, -0.017820127308368683, -0.01726183295249939, -0.016703538596630096, -0.016145244240760803, -0.01558694988489151, -0.015028655529022217, -0.014470361173152924, -0.01391206681728363, -0.013353772461414337, -0.012795478105545044, -0.01223718374967575, -0.011678889393806458, -0.011120595037937164, -0.010562300682067871, -0.010004006326198578, -0.009445711970329285, -0.008887417614459991, -0.008329123258590698, -0.007770828902721405, -0.007212534546852112, -0.006654240190982819, -0.006095945835113525, -0.005537651479244232, -0.004979357123374939, -0.004421062767505646, -0.0038627684116363525, -0.0033044740557670593, -0.002746179699897766, -0.002187885344028473, -0.0016295909881591797, -0.0010712966322898865, -0.0005130022764205933, 4.529207944869995e-05, 0.0006035864353179932, 0.0011618807911872864, 0.0017201751470565796, 0.002278469502925873, 0.002836763858795166, 0.0033950582146644592, 0.0039533525705337524, 0.004511646926403046, 0.005069941282272339, 0.005628235638141632, 0.006186529994010925, 0.0067448243498802185, 0.007303118705749512, 0.007861413061618805, 0.008419707417488098, 0.008978001773357391, 0.009536296129226685, 0.010094590485095978, 0.010652884840965271, 0.011211179196834564, 0.011769473552703857, 0.01232776790857315, 0.012886062264442444, 0.013444356620311737, 0.01400265097618103, 0.014560945332050323, 0.015119239687919617, 0.01567753404378891, 0.016235828399658203]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 25.0, 13.0, 11.0, 21.0, 14.0, 25.0, 27.0, 22.0, 19.0, 48.0, 30.0, 30.0, 33.0, 47.0, 39.0, 31.0, 44.0, 53.0, 37.0, 46.0, 40.0, 33.0, 34.0, 30.0, 30.0, 28.0, 21.0, 18.0, 18.0, 21.0, 14.0, 13.0, 20.0, 9.0, 10.0, 3.0, 6.0, 4.0, 9.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.45703125, -6.2664794921875, -6.075927734375, -5.8853759765625, -5.69482421875, -5.5042724609375, -5.313720703125, -5.1231689453125, -4.9326171875, -4.7420654296875, -4.551513671875, -4.3609619140625, -4.17041015625, -3.9798583984375, -3.789306640625, -3.5987548828125, -3.408203125, -3.2176513671875, -3.027099609375, -2.8365478515625, -2.64599609375, -2.4554443359375, -2.264892578125, -2.0743408203125, -1.8837890625, -1.6932373046875, -1.502685546875, -1.3121337890625, -1.12158203125, -0.9310302734375, -0.740478515625, -0.5499267578125, -0.359375, -0.1688232421875, 0.021728515625, 0.2122802734375, 0.40283203125, 0.5933837890625, 0.783935546875, 0.9744873046875, 1.1650390625, 1.3555908203125, 1.546142578125, 1.7366943359375, 1.92724609375, 2.1177978515625, 2.308349609375, 2.4989013671875, 2.689453125, 2.8800048828125, 3.070556640625, 3.2611083984375, 3.45166015625, 3.6422119140625, 3.832763671875, 4.0233154296875, 4.2138671875, 4.4044189453125, 4.594970703125, 4.7855224609375, 4.97607421875, 5.1666259765625, 5.357177734375, 5.5477294921875, 5.73828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 18.0, 23.0, 24.0, 28.0, 31.0, 34.0, 69.0, 74.0, 103.0, 156.0, 203.0, 359.0, 673.0, 1693.0, 4465.0, 12782.0, 42175.0, 197723.0, 562156.0, 169808.0, 37061.0, 11640.0, 3910.0, 1562.0, 679.0, 323.0, 203.0, 123.0, 113.0, 70.0, 67.0, 32.0, 26.0, 27.0, 17.0, 17.0, 21.0, 16.0, 7.0, 5.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.953125, -11.5958251953125, -11.238525390625, -10.8812255859375, -10.52392578125, -10.1666259765625, -9.809326171875, -9.4520263671875, -9.0947265625, -8.7374267578125, -8.380126953125, -8.0228271484375, -7.66552734375, -7.3082275390625, -6.950927734375, -6.5936279296875, -6.236328125, -5.8790283203125, -5.521728515625, -5.1644287109375, -4.80712890625, -4.4498291015625, -4.092529296875, -3.7352294921875, -3.3779296875, -3.0206298828125, -2.663330078125, -2.3060302734375, -1.94873046875, -1.5914306640625, -1.234130859375, -0.8768310546875, -0.51953125, -0.1622314453125, 0.195068359375, 0.5523681640625, 0.90966796875, 1.2669677734375, 1.624267578125, 1.9815673828125, 2.3388671875, 2.6961669921875, 3.053466796875, 3.4107666015625, 3.76806640625, 4.1253662109375, 4.482666015625, 4.8399658203125, 5.197265625, 5.5545654296875, 5.911865234375, 6.2691650390625, 6.62646484375, 6.9837646484375, 7.341064453125, 7.6983642578125, 8.0556640625, 8.4129638671875, 8.770263671875, 9.1275634765625, 9.48486328125, 9.8421630859375, 10.199462890625, 10.5567626953125, 10.9140625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 16.0, 14.0, 17.0, 19.0, 22.0, 26.0, 28.0, 29.0, 29.0, 45.0, 48.0, 51.0, 59.0, 118.0, 253.0, 1444.0, 269.0, 124.0, 56.0, 52.0, 46.0, 36.0, 36.0, 32.0, 27.0, 28.0, 24.0, 19.0, 8.0, 13.0, 8.0, 9.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.5, -20.860595703125, -20.22119140625, -19.581787109375, -18.9423828125, -18.302978515625, -17.66357421875, -17.024169921875, -16.384765625, -15.745361328125, -15.10595703125, -14.466552734375, -13.8271484375, -13.187744140625, -12.54833984375, -11.908935546875, -11.26953125, -10.630126953125, -9.99072265625, -9.351318359375, -8.7119140625, -8.072509765625, -7.43310546875, -6.793701171875, -6.154296875, -5.514892578125, -4.87548828125, -4.236083984375, -3.5966796875, -2.957275390625, -2.31787109375, -1.678466796875, -1.0390625, -0.399658203125, 0.23974609375, 0.879150390625, 1.5185546875, 2.157958984375, 2.79736328125, 3.436767578125, 4.076171875, 4.715576171875, 5.35498046875, 5.994384765625, 6.6337890625, 7.273193359375, 7.91259765625, 8.552001953125, 9.19140625, 9.830810546875, 10.47021484375, 11.109619140625, 11.7490234375, 12.388427734375, 13.02783203125, 13.667236328125, 14.306640625, 14.946044921875, 15.58544921875, 16.224853515625, 16.8642578125, 17.503662109375, 18.14306640625, 18.782470703125, 19.421875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 11.0, 15.0, 16.0, 19.0, 22.0, 25.0, 40.0, 58.0, 53.0, 95.0, 139.0, 230.0, 423.0, 1332.0, 12472.0, 1972207.0, 1146177.0, 9972.0, 1169.0, 422.0, 241.0, 134.0, 79.0, 69.0, 44.0, 49.0, 29.0, 31.0, 20.0, 18.0, 18.0, 15.0, 12.0, 8.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.4375, -41.02099609375, -39.6044921875, -38.18798828125, -36.771484375, -35.35498046875, -33.9384765625, -32.52197265625, -31.10546875, -29.68896484375, -28.2724609375, -26.85595703125, -25.439453125, -24.02294921875, -22.6064453125, -21.18994140625, -19.7734375, -18.35693359375, -16.9404296875, -15.52392578125, -14.107421875, -12.69091796875, -11.2744140625, -9.85791015625, -8.44140625, -7.02490234375, -5.6083984375, -4.19189453125, -2.775390625, -1.35888671875, 0.0576171875, 1.47412109375, 2.890625, 4.30712890625, 5.7236328125, 7.14013671875, 8.556640625, 9.97314453125, 11.3896484375, 12.80615234375, 14.22265625, 15.63916015625, 17.0556640625, 18.47216796875, 19.888671875, 21.30517578125, 22.7216796875, 24.13818359375, 25.5546875, 26.97119140625, 28.3876953125, 29.80419921875, 31.220703125, 32.63720703125, 34.0537109375, 35.47021484375, 36.88671875, 38.30322265625, 39.7197265625, 41.13623046875, 42.552734375, 43.96923828125, 45.3857421875, 46.80224609375, 48.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [14.0, 203.0, 575.0, 192.0, 33.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.258474349975586, -7.544036388397217, -2.8295984268188477, 1.8848400115966797, 6.599277496337891, 11.313714981079102, 16.028154373168945, 20.742589950561523, 25.457029342651367, 30.171466827392578, 34.88590621948242, 39.600341796875, 44.314781188964844, 49.02922058105469, 53.74365997314453, 58.458091735839844, 63.17253112792969, 67.88697052001953, 72.60140991210938, 77.31584167480469, 82.03028106689453, 86.74472045898438, 91.45915985107422, 96.17359924316406, 100.8880386352539, 105.60247802734375, 110.3169174194336, 115.03135681152344, 119.74578857421875, 124.4602279663086, 129.17466735839844, 133.88909912109375, 138.60353088378906, 143.31796264648438, 148.03240966796875, 152.74684143066406, 157.46128845214844, 162.17572021484375, 166.89016723632812, 171.60459899902344, 176.31903076171875, 181.03346252441406, 185.74790954589844, 190.46234130859375, 195.17678833007812, 199.89122009277344, 204.60565185546875, 209.32009887695312, 214.0345458984375, 218.7489776611328, 223.4634246826172, 228.1778564453125, 232.89230346679688, 237.6067352294922, 242.3211669921875, 247.03561401367188, 251.7500457763672, 256.4644775390625, 261.1789245605469, 265.89337158203125, 270.6077880859375, 275.3222351074219, 280.03668212890625, 284.7510986328125, 289.4655456542969]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 10.0, 6.0, 18.0, 17.0, 20.0, 17.0, 24.0, 33.0, 18.0, 33.0, 35.0, 31.0, 41.0, 44.0, 37.0, 37.0, 42.0, 40.0, 41.0, 33.0, 39.0, 34.0, 26.0, 37.0, 24.0, 31.0, 33.0, 30.0, 29.0, 25.0, 16.0, 17.0, 13.0, 14.0, 10.0, 5.0, 9.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.386573791503906, -50.8758430480957, -49.3651123046875, -47.85438537597656, -46.34365463256836, -44.832923889160156, -43.32219696044922, -41.811466217041016, -40.30073547363281, -38.79000473022461, -37.279273986816406, -35.76854705810547, -34.257816314697266, -32.74708557128906, -31.236356735229492, -29.725627899169922, -28.21489715576172, -26.704166412353516, -25.193437576293945, -23.682708740234375, -22.171977996826172, -20.66124725341797, -19.1505184173584, -17.639789581298828, -16.129058837890625, -14.618329048156738, -13.107599258422852, -11.596869468688965, -10.086139678955078, -8.575409889221191, -7.064680099487305, -5.553950309753418, -4.043224334716797, -2.53249454498291, -1.0217647552490234, 0.4889650344848633, 1.99969482421875, 3.5104246139526367, 5.021154403686523, 6.53188419342041, 8.042613983154297, 9.553343772888184, 11.06407356262207, 12.574803352355957, 14.085533142089844, 15.59626293182373, 17.106992721557617, 18.617721557617188, 20.12845230102539, 21.639183044433594, 23.149911880493164, 24.660640716552734, 26.171371459960938, 27.68210220336914, 29.19283103942871, 30.70355987548828, 32.214290618896484, 33.72502136230469, 35.235748291015625, 36.74647903442383, 38.25720977783203, 39.767940521240234, 41.27867126464844, 42.789398193359375, 44.30012893676758]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 6.0, 3.0, 15.0, 10.0, 11.0, 13.0, 16.0, 25.0, 21.0, 23.0, 33.0, 34.0, 24.0, 32.0, 33.0, 38.0, 36.0, 44.0, 41.0, 45.0, 41.0, 37.0, 34.0, 47.0, 42.0, 32.0, 30.0, 25.0, 35.0, 27.0, 18.0, 16.0, 20.0, 19.0, 12.0, 7.0, 6.0, 8.0, 12.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.20208740234375, -5.9940185546875, -5.78594970703125, -5.577880859375, -5.36981201171875, -5.1617431640625, -4.95367431640625, -4.74560546875, -4.53753662109375, -4.3294677734375, -4.12139892578125, -3.913330078125, -3.70526123046875, -3.4971923828125, -3.28912353515625, -3.0810546875, -2.87298583984375, -2.6649169921875, -2.45684814453125, -2.248779296875, -2.04071044921875, -1.8326416015625, -1.62457275390625, -1.41650390625, -1.20843505859375, -1.0003662109375, -0.79229736328125, -0.584228515625, -0.37615966796875, -0.1680908203125, 0.03997802734375, 0.248046875, 0.45611572265625, 0.6641845703125, 0.87225341796875, 1.080322265625, 1.28839111328125, 1.4964599609375, 1.70452880859375, 1.91259765625, 2.12066650390625, 2.3287353515625, 2.53680419921875, 2.744873046875, 2.95294189453125, 3.1610107421875, 3.36907958984375, 3.5771484375, 3.78521728515625, 3.9932861328125, 4.20135498046875, 4.409423828125, 4.61749267578125, 4.8255615234375, 5.03363037109375, 5.24169921875, 5.44976806640625, 5.6578369140625, 5.86590576171875, 6.073974609375, 6.28204345703125, 6.4901123046875, 6.69818115234375, 6.90625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 0.0, 7.0, 4.0, 3.0, 8.0, 7.0, 8.0, 15.0, 18.0, 13.0, 18.0, 28.0, 37.0, 47.0, 67.0, 132.0, 270.0, 707.0, 2263.0, 8754.0, 43308.0, 258156.0, 1363427.0, 1936906.0, 482649.0, 77406.0, 14707.0, 3468.0, 981.0, 365.0, 170.0, 96.0, 55.0, 40.0, 36.0, 19.0, 8.0, 14.0, 17.0, 12.0, 8.0, 5.0, 5.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.484375, -12.1080322265625, -11.731689453125, -11.3553466796875, -10.97900390625, -10.6026611328125, -10.226318359375, -9.8499755859375, -9.4736328125, -9.0972900390625, -8.720947265625, -8.3446044921875, -7.96826171875, -7.5919189453125, -7.215576171875, -6.8392333984375, -6.462890625, -6.0865478515625, -5.710205078125, -5.3338623046875, -4.95751953125, -4.5811767578125, -4.204833984375, -3.8284912109375, -3.4521484375, -3.0758056640625, -2.699462890625, -2.3231201171875, -1.94677734375, -1.5704345703125, -1.194091796875, -0.8177490234375, -0.44140625, -0.0650634765625, 0.311279296875, 0.6876220703125, 1.06396484375, 1.4403076171875, 1.816650390625, 2.1929931640625, 2.5693359375, 2.9456787109375, 3.322021484375, 3.6983642578125, 4.07470703125, 4.4510498046875, 4.827392578125, 5.2037353515625, 5.580078125, 5.9564208984375, 6.332763671875, 6.7091064453125, 7.08544921875, 7.4617919921875, 7.838134765625, 8.2144775390625, 8.5908203125, 8.9671630859375, 9.343505859375, 9.7198486328125, 10.09619140625, 10.4725341796875, 10.848876953125, 11.2252197265625, 11.6015625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 7.0, 10.0, 12.0, 14.0, 31.0, 30.0, 33.0, 65.0, 67.0, 80.0, 115.0, 171.0, 222.0, 273.0, 337.0, 391.0, 401.0, 432.0, 359.0, 256.0, 183.0, 135.0, 113.0, 85.0, 62.0, 40.0, 39.0, 26.0, 9.0, 23.0, 13.0, 8.0, 7.0, 2.0, 8.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.8831787109375, -9.547607421875, -9.2120361328125, -8.87646484375, -8.5408935546875, -8.205322265625, -7.8697509765625, -7.5341796875, -7.1986083984375, -6.863037109375, -6.5274658203125, -6.19189453125, -5.8563232421875, -5.520751953125, -5.1851806640625, -4.849609375, -4.5140380859375, -4.178466796875, -3.8428955078125, -3.50732421875, -3.1717529296875, -2.836181640625, -2.5006103515625, -2.1650390625, -1.8294677734375, -1.493896484375, -1.1583251953125, -0.82275390625, -0.4871826171875, -0.151611328125, 0.1839599609375, 0.51953125, 0.8551025390625, 1.190673828125, 1.5262451171875, 1.86181640625, 2.1973876953125, 2.532958984375, 2.8685302734375, 3.2041015625, 3.5396728515625, 3.875244140625, 4.2108154296875, 4.54638671875, 4.8819580078125, 5.217529296875, 5.5531005859375, 5.888671875, 6.2242431640625, 6.559814453125, 6.8953857421875, 7.23095703125, 7.5665283203125, 7.902099609375, 8.2376708984375, 8.5732421875, 8.9088134765625, 9.244384765625, 9.5799560546875, 9.91552734375, 10.2510986328125, 10.586669921875, 10.9222412109375, 11.2578125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 11.0, 8.0, 14.0, 26.0, 26.0, 30.0, 49.0, 59.0, 79.0, 100.0, 139.0, 243.0, 347.0, 560.0, 1266.0, 4628.0, 31289.0, 395907.0, 3098244.0, 607835.0, 44020.0, 6021.0, 1492.0, 647.0, 360.0, 250.0, 144.0, 126.0, 96.0, 51.0, 55.0, 46.0, 33.0, 17.0, 15.0, 11.0, 8.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-24.359375, -23.587890625, -22.81640625, -22.044921875, -21.2734375, -20.501953125, -19.73046875, -18.958984375, -18.1875, -17.416015625, -16.64453125, -15.873046875, -15.1015625, -14.330078125, -13.55859375, -12.787109375, -12.015625, -11.244140625, -10.47265625, -9.701171875, -8.9296875, -8.158203125, -7.38671875, -6.615234375, -5.84375, -5.072265625, -4.30078125, -3.529296875, -2.7578125, -1.986328125, -1.21484375, -0.443359375, 0.328125, 1.099609375, 1.87109375, 2.642578125, 3.4140625, 4.185546875, 4.95703125, 5.728515625, 6.5, 7.271484375, 8.04296875, 8.814453125, 9.5859375, 10.357421875, 11.12890625, 11.900390625, 12.671875, 13.443359375, 14.21484375, 14.986328125, 15.7578125, 16.529296875, 17.30078125, 18.072265625, 18.84375, 19.615234375, 20.38671875, 21.158203125, 21.9296875, 22.701171875, 23.47265625, 24.244140625, 25.015625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 12.0, 24.0, 48.0, 81.0, 123.0, 134.0, 134.0, 142.0, 125.0, 86.0, 50.0, 26.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.61207580566406, -74.57588195800781, -72.5396957397461, -70.50350189208984, -68.46731567382812, -66.43112182617188, -64.39492797851562, -62.358741760253906, -60.322547912597656, -58.28635787963867, -56.25016784667969, -54.21397399902344, -52.17778396606445, -50.14159393310547, -48.105403900146484, -46.0692138671875, -44.033023834228516, -41.99683380126953, -39.96064376831055, -37.92445373535156, -35.88825988769531, -33.85206985473633, -31.815879821777344, -29.77968978881836, -27.743497848510742, -25.707307815551758, -23.67111587524414, -21.634925842285156, -19.598735809326172, -17.562543869018555, -15.52635383605957, -13.49016284942627, -11.453975677490234, -9.417784690856934, -7.381594181060791, -5.345403671264648, -3.3092126846313477, -1.2730216979980469, 0.7631683349609375, 2.7993593215942383, 4.835550308227539, 6.87174129486084, 8.90793228149414, 10.944122314453125, 12.980313301086426, 15.016504287719727, 17.05269432067871, 19.088886260986328, 21.125076293945312, 23.161266326904297, 25.197458267211914, 27.2336483001709, 29.269840240478516, 31.3060302734375, 33.342220306396484, 35.37841033935547, 37.41460418701172, 39.4507942199707, 41.48698425292969, 43.52317810058594, 45.55936813354492, 47.595558166503906, 49.63174819946289, 51.667938232421875, 53.70412826538086]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 10.0, 4.0, 3.0, 3.0, 12.0, 5.0, 9.0, 18.0, 20.0, 24.0, 27.0, 32.0, 23.0, 29.0, 42.0, 32.0, 38.0, 48.0, 40.0, 52.0, 36.0, 61.0, 43.0, 42.0, 52.0, 42.0, 27.0, 32.0, 32.0, 26.0, 22.0, 17.0, 18.0, 14.0, 17.0, 11.0, 13.0, 12.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-47.48520278930664, -46.13641357421875, -44.787620544433594, -43.43882751464844, -42.09003829956055, -40.741249084472656, -39.3924560546875, -38.043663024902344, -36.69487380981445, -35.34608459472656, -33.997291564941406, -32.64849853515625, -31.29970932006836, -29.950918197631836, -28.602127075195312, -27.25333595275879, -25.904544830322266, -24.555753707885742, -23.20696258544922, -21.858171463012695, -20.509380340576172, -19.16058921813965, -17.811798095703125, -16.4630069732666, -15.114215850830078, -13.765424728393555, -12.416633605957031, -11.067842483520508, -9.719051361083984, -8.370260238647461, -7.0214691162109375, -5.672677993774414, -4.323883056640625, -2.9750919342041016, -1.6263008117675781, -0.2775096893310547, 1.0712814331054688, 2.420072555541992, 3.7688636779785156, 5.117654800415039, 6.4664459228515625, 7.815237045288086, 9.16402816772461, 10.512819290161133, 11.861610412597656, 13.21040153503418, 14.559192657470703, 15.907983779907227, 17.25677490234375, 18.605566024780273, 19.954357147216797, 21.30314826965332, 22.651939392089844, 24.000730514526367, 25.34952163696289, 26.698312759399414, 28.047103881835938, 29.39589500427246, 30.744686126708984, 32.093475341796875, 33.44226837158203, 34.79106140136719, 36.13985061645508, 37.48863983154297, 38.837432861328125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 6.0, 6.0, 11.0, 8.0, 11.0, 13.0, 12.0, 17.0, 16.0, 33.0, 23.0, 28.0, 30.0, 29.0, 29.0, 32.0, 41.0, 34.0, 40.0, 49.0, 41.0, 38.0, 38.0, 38.0, 35.0, 26.0, 32.0, 40.0, 34.0, 20.0, 25.0, 26.0, 18.0, 20.0, 17.0, 9.0, 13.0, 13.0, 7.0, 8.0, 7.0, 6.0, 4.0, 0.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.88671875, -5.6824951171875, -5.478271484375, -5.2740478515625, -5.06982421875, -4.8656005859375, -4.661376953125, -4.4571533203125, -4.2529296875, -4.0487060546875, -3.844482421875, -3.6402587890625, -3.43603515625, -3.2318115234375, -3.027587890625, -2.8233642578125, -2.619140625, -2.4149169921875, -2.210693359375, -2.0064697265625, -1.80224609375, -1.5980224609375, -1.393798828125, -1.1895751953125, -0.9853515625, -0.7811279296875, -0.576904296875, -0.3726806640625, -0.16845703125, 0.0357666015625, 0.239990234375, 0.4442138671875, 0.6484375, 0.8526611328125, 1.056884765625, 1.2611083984375, 1.46533203125, 1.6695556640625, 1.873779296875, 2.0780029296875, 2.2822265625, 2.4864501953125, 2.690673828125, 2.8948974609375, 3.09912109375, 3.3033447265625, 3.507568359375, 3.7117919921875, 3.916015625, 4.1202392578125, 4.324462890625, 4.5286865234375, 4.73291015625, 4.9371337890625, 5.141357421875, 5.3455810546875, 5.5498046875, 5.7540283203125, 5.958251953125, 6.1624755859375, 6.36669921875, 6.5709228515625, 6.775146484375, 6.9793701171875, 7.18359375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 10.0, 18.0, 20.0, 41.0, 59.0, 97.0, 157.0, 239.0, 336.0, 587.0, 913.0, 1484.0, 2244.0, 3569.0, 5782.0, 9419.0, 14786.0, 23659.0, 37595.0, 58168.0, 87554.0, 124296.0, 155491.0, 155375.0, 122578.0, 86556.0, 57791.0, 36968.0, 23464.0, 14617.0, 9259.0, 5712.0, 3628.0, 2305.0, 1331.0, 945.0, 542.0, 331.0, 241.0, 120.0, 91.0, 66.0, 34.0, 31.0, 16.0, 12.0, 3.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7131881713867188, -0.6885833740234375, -0.6639785766601562, -0.639373779296875, -0.6147689819335938, -0.5901641845703125, -0.5655593872070312, -0.54095458984375, -0.5163497924804688, -0.4917449951171875, -0.46714019775390625, -0.442535400390625, -0.41793060302734375, -0.3933258056640625, -0.36872100830078125, -0.3441162109375, -0.31951141357421875, -0.2949066162109375, -0.27030181884765625, -0.245697021484375, -0.22109222412109375, -0.1964874267578125, -0.17188262939453125, -0.14727783203125, -0.12267303466796875, -0.0980682373046875, -0.07346343994140625, -0.048858642578125, -0.02425384521484375, 0.0003509521484375, 0.02495574951171875, 0.049560546875, 0.07416534423828125, 0.0987701416015625, 0.12337493896484375, 0.147979736328125, 0.17258453369140625, 0.1971893310546875, 0.22179412841796875, 0.24639892578125, 0.27100372314453125, 0.2956085205078125, 0.32021331787109375, 0.344818115234375, 0.36942291259765625, 0.3940277099609375, 0.41863250732421875, 0.4432373046875, 0.46784210205078125, 0.4924468994140625, 0.5170516967773438, 0.541656494140625, 0.5662612915039062, 0.5908660888671875, 0.6154708862304688, 0.64007568359375, 0.6646804809570312, 0.6892852783203125, 0.7138900756835938, 0.738494873046875, 0.7630996704101562, 0.7877044677734375, 0.8123092651367188, 0.8369140625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 12.0, 12.0, 12.0, 11.0, 15.0, 17.0, 13.0, 16.0, 24.0, 28.0, 33.0, 22.0, 43.0, 36.0, 52.0, 39.0, 44.0, 44.0, 1063.0, 35.0, 38.0, 31.0, 49.0, 27.0, 31.0, 31.0, 35.0, 25.0, 32.0, 18.0, 21.0, 22.0, 12.0, 18.0, 6.0, 10.0, 8.0, 7.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.70703125, -4.56219482421875, -4.4173583984375, -4.27252197265625, -4.127685546875, -3.98284912109375, -3.8380126953125, -3.69317626953125, -3.54833984375, -3.40350341796875, -3.2586669921875, -3.11383056640625, -2.968994140625, -2.82415771484375, -2.6793212890625, -2.53448486328125, -2.3896484375, -2.24481201171875, -2.0999755859375, -1.95513916015625, -1.810302734375, -1.66546630859375, -1.5206298828125, -1.37579345703125, -1.23095703125, -1.08612060546875, -0.9412841796875, -0.79644775390625, -0.651611328125, -0.50677490234375, -0.3619384765625, -0.21710205078125, -0.072265625, 0.07257080078125, 0.2174072265625, 0.36224365234375, 0.507080078125, 0.65191650390625, 0.7967529296875, 0.94158935546875, 1.08642578125, 1.23126220703125, 1.3760986328125, 1.52093505859375, 1.665771484375, 1.81060791015625, 1.9554443359375, 2.10028076171875, 2.2451171875, 2.38995361328125, 2.5347900390625, 2.67962646484375, 2.824462890625, 2.96929931640625, 3.1141357421875, 3.25897216796875, 3.40380859375, 3.54864501953125, 3.6934814453125, 3.83831787109375, 3.983154296875, 4.12799072265625, 4.2728271484375, 4.41766357421875, 4.5625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 10.0, 11.0, 13.0, 34.0, 41.0, 52.0, 96.0, 139.0, 212.0, 292.0, 463.0, 711.0, 991.0, 1731.0, 2577.0, 3938.0, 6224.0, 9622.0, 15243.0, 23582.0, 35791.0, 54172.0, 79040.0, 109199.0, 139143.0, 1191127.0, 126779.0, 96189.0, 68230.0, 46423.0, 30116.0, 19737.0, 12619.0, 8038.0, 5200.0, 3232.0, 2108.0, 1349.0, 850.0, 622.0, 386.0, 260.0, 167.0, 124.0, 81.0, 57.0, 37.0, 23.0, 29.0, 7.0, 8.0, 5.0, 0.0, 3.0, 4.0, 2.0], "bins": [-0.533203125, -0.5171890258789062, -0.5011749267578125, -0.48516082763671875, -0.469146728515625, -0.45313262939453125, -0.4371185302734375, -0.42110443115234375, -0.40509033203125, -0.38907623291015625, -0.3730621337890625, -0.35704803466796875, -0.341033935546875, -0.32501983642578125, -0.3090057373046875, -0.29299163818359375, -0.2769775390625, -0.26096343994140625, -0.2449493408203125, -0.22893524169921875, -0.212921142578125, -0.19690704345703125, -0.1808929443359375, -0.16487884521484375, -0.14886474609375, -0.13285064697265625, -0.1168365478515625, -0.10082244873046875, -0.084808349609375, -0.06879425048828125, -0.0527801513671875, -0.03676605224609375, -0.020751953125, -0.00473785400390625, 0.0112762451171875, 0.02729034423828125, 0.043304443359375, 0.05931854248046875, 0.0753326416015625, 0.09134674072265625, 0.10736083984375, 0.12337493896484375, 0.1393890380859375, 0.15540313720703125, 0.171417236328125, 0.18743133544921875, 0.2034454345703125, 0.21945953369140625, 0.2354736328125, 0.25148773193359375, 0.2675018310546875, 0.28351593017578125, 0.299530029296875, 0.31554412841796875, 0.3315582275390625, 0.34757232666015625, 0.36358642578125, 0.37960052490234375, 0.3956146240234375, 0.41162872314453125, 0.427642822265625, 0.44365692138671875, 0.4596710205078125, 0.47568511962890625, 0.49169921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 8.0, 10.0, 10.0, 10.0, 14.0, 10.0, 15.0, 28.0, 24.0, 24.0, 34.0, 51.0, 47.0, 68.0, 86.0, 102.0, 85.0, 79.0, 51.0, 26.0, 35.0, 36.0, 20.0, 16.0, 17.0, 9.0, 12.0, 11.0, 9.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0109100341796875, -0.010610103607177734, -0.010310173034667969, -0.010010242462158203, -0.009710311889648438, -0.009410381317138672, -0.009110450744628906, -0.00881052017211914, -0.008510589599609375, -0.00821065902709961, -0.007910728454589844, -0.007610797882080078, -0.0073108673095703125, -0.007010936737060547, -0.006711006164550781, -0.006411075592041016, -0.00611114501953125, -0.005811214447021484, -0.005511283874511719, -0.005211353302001953, -0.0049114227294921875, -0.004611492156982422, -0.004311561584472656, -0.004011631011962891, -0.003711700439453125, -0.0034117698669433594, -0.0031118392944335938, -0.002811908721923828, -0.0025119781494140625, -0.002212047576904297, -0.0019121170043945312, -0.0016121864318847656, -0.001312255859375, -0.0010123252868652344, -0.0007123947143554688, -0.0004124641418457031, -0.0001125335693359375, 0.00018739700317382812, 0.00048732757568359375, 0.0007872581481933594, 0.001087188720703125, 0.0013871192932128906, 0.0016870498657226562, 0.001986980438232422, 0.0022869110107421875, 0.002586841583251953, 0.0028867721557617188, 0.0031867027282714844, 0.00348663330078125, 0.0037865638732910156, 0.004086494445800781, 0.004386425018310547, 0.0046863555908203125, 0.004986286163330078, 0.005286216735839844, 0.005586147308349609, 0.005886077880859375, 0.006186008453369141, 0.006485939025878906, 0.006785869598388672, 0.0070858001708984375, 0.007385730743408203, 0.007685661315917969, 0.007985591888427734, 0.0082855224609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 5.0, 4.0, 6.0, 9.0, 12.0, 13.0, 17.0, 20.0, 19.0, 33.0, 48.0, 65.0, 94.0, 139.0, 200.0, 456.0, 1834.0, 725911.0, 317146.0, 1423.0, 384.0, 219.0, 133.0, 81.0, 65.0, 49.0, 38.0, 28.0, 15.0, 11.0, 15.0, 15.0, 7.0, 6.0, 10.0, 3.0, 6.0, 4.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1739501953125, -0.16772842407226562, -0.16150665283203125, -0.15528488159179688, -0.1490631103515625, -0.14284133911132812, -0.13661956787109375, -0.13039779663085938, -0.124176025390625, -0.11795425415039062, -0.11173248291015625, -0.10551071166992188, -0.0992889404296875, -0.09306716918945312, -0.08684539794921875, -0.08062362670898438, -0.07440185546875, -0.06818008422851562, -0.06195831298828125, -0.055736541748046875, -0.0495147705078125, -0.043292999267578125, -0.03707122802734375, -0.030849456787109375, -0.024627685546875, -0.018405914306640625, -0.01218414306640625, -0.005962371826171875, 0.0002593994140625, 0.006481170654296875, 0.01270294189453125, 0.018924713134765625, 0.025146484375, 0.031368255615234375, 0.03759002685546875, 0.043811798095703125, 0.0500335693359375, 0.056255340576171875, 0.06247711181640625, 0.06869888305664062, 0.074920654296875, 0.08114242553710938, 0.08736419677734375, 0.09358596801757812, 0.0998077392578125, 0.10602951049804688, 0.11225128173828125, 0.11847305297851562, 0.12469482421875, 0.13091659545898438, 0.13713836669921875, 0.14336013793945312, 0.1495819091796875, 0.15580368041992188, 0.16202545166015625, 0.16824722290039062, 0.174468994140625, 0.18069076538085938, 0.18691253662109375, 0.19313430786132812, 0.1993560791015625, 0.20557785034179688, 0.21179962158203125, 0.21802139282226562, 0.2242431640625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 19.0, 926.0, 69.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07837981730699539, -0.07418414950370789, -0.06998848170042038, -0.06579281389713287, -0.06159714609384537, -0.05740147829055786, -0.05320580676198006, -0.04901013895869255, -0.044814471155405045, -0.04061880335211754, -0.03642313554883003, -0.03222746402025223, -0.02803179807960987, -0.023836130276322365, -0.01964046061038971, -0.015444792807102203, -0.011249125003814697, -0.007053456734865904, -0.0028577884659171104, 0.0013378802686929703, 0.005533548071980476, 0.009729215875267982, 0.013924885541200638, 0.018120553344488144, 0.02231622114777565, 0.026511888951063156, 0.030707556754350662, 0.03490322828292847, 0.03909889608621597, 0.04329456388950348, 0.047490231692790985, 0.05168589949607849, 0.0558815598487854, 0.060077227652072906, 0.06427289545536041, 0.06846856325864792, 0.07266423106193542, 0.07685989886522293, 0.08105556666851044, 0.08525124192237854, 0.08944690227508545, 0.09364257007837296, 0.09783823788166046, 0.10203390568494797, 0.10622957348823547, 0.11042524129152298, 0.11462090909481049, 0.11881658434867859, 0.1230122521519661, 0.1272079199552536, 0.1314035952091217, 0.1355992555618286, 0.13979493081569672, 0.14399059116840363, 0.14818626642227173, 0.15238192677497864, 0.15657760202884674, 0.16077327728271484, 0.16496893763542175, 0.16916461288928986, 0.17336027324199677, 0.17755594849586487, 0.18175160884857178, 0.18594728410243988, 0.1901429444551468]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 8.0, 14.0, 18.0, 12.0, 25.0, 23.0, 32.0, 31.0, 39.0, 64.0, 50.0, 66.0, 45.0, 63.0, 54.0, 50.0, 52.0, 45.0, 41.0, 41.0, 36.0, 31.0, 23.0, 31.0, 27.0, 11.0, 18.0, 16.0, 10.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0095747709274292, -0.009224273264408112, -0.008873775601387024, -0.008523277938365936, -0.008172780275344849, -0.007822282612323761, -0.007471784949302673, -0.007121287286281586, -0.006770789623260498, -0.00642029196023941, -0.006069794297218323, -0.005719296634197235, -0.0053687989711761475, -0.00501830130815506, -0.004667803645133972, -0.0043173059821128845, -0.003966808319091797, -0.0036163106560707092, -0.0032658129930496216, -0.002915315330028534, -0.0025648176670074463, -0.0022143200039863586, -0.001863822340965271, -0.0015133246779441833, -0.0011628270149230957, -0.0008123293519020081, -0.0004618316888809204, -0.00011133402585983276, 0.00023916363716125488, 0.0005896613001823425, 0.0009401589632034302, 0.0012906566262245178, 0.0016411542892456055, 0.001991651952266693, 0.0023421496152877808, 0.0026926472783088684, 0.003043144941329956, 0.0033936426043510437, 0.0037441402673721313, 0.004094637930393219, 0.004445135593414307, 0.004795633256435394, 0.005146130919456482, 0.00549662858247757, 0.005847126245498657, 0.006197623908519745, 0.0065481215715408325, 0.00689861923456192, 0.007249116897583008, 0.0075996145606040955, 0.007950112223625183, 0.00830060988664627, 0.008651107549667358, 0.009001605212688446, 0.009352102875709534, 0.009702600538730621, 0.010053098201751709, 0.010403595864772797, 0.010754093527793884, 0.011104591190814972, 0.01145508885383606, 0.011805586516857147, 0.012156084179878235, 0.012506581842899323, 0.01285707950592041]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 6.0, 6.0, 11.0, 8.0, 11.0, 13.0, 12.0, 17.0, 16.0, 33.0, 23.0, 28.0, 30.0, 29.0, 29.0, 32.0, 41.0, 34.0, 39.0, 50.0, 41.0, 38.0, 38.0, 38.0, 35.0, 26.0, 32.0, 40.0, 34.0, 20.0, 25.0, 26.0, 18.0, 20.0, 17.0, 9.0, 13.0, 13.0, 7.0, 8.0, 7.0, 6.0, 4.0, 0.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.88671875, -5.6824951171875, -5.478271484375, -5.2740478515625, -5.06982421875, -4.8656005859375, -4.661376953125, -4.4571533203125, -4.2529296875, -4.0487060546875, -3.844482421875, -3.6402587890625, -3.43603515625, -3.2318115234375, -3.027587890625, -2.8233642578125, -2.619140625, -2.4149169921875, -2.210693359375, -2.0064697265625, -1.80224609375, -1.5980224609375, -1.393798828125, -1.1895751953125, -0.9853515625, -0.7811279296875, -0.576904296875, -0.3726806640625, -0.16845703125, 0.0357666015625, 0.239990234375, 0.4442138671875, 0.6484375, 0.8526611328125, 1.056884765625, 1.2611083984375, 1.46533203125, 1.6695556640625, 1.873779296875, 2.0780029296875, 2.2822265625, 2.4864501953125, 2.690673828125, 2.8948974609375, 3.09912109375, 3.3033447265625, 3.507568359375, 3.7117919921875, 3.916015625, 4.1202392578125, 4.324462890625, 4.5286865234375, 4.73291015625, 4.9371337890625, 5.141357421875, 5.3455810546875, 5.5498046875, 5.7540283203125, 5.958251953125, 6.1624755859375, 6.36669921875, 6.5709228515625, 6.775146484375, 6.9793701171875, 7.18359375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 4.0, 9.0, 7.0, 6.0, 9.0, 10.0, 21.0, 27.0, 22.0, 32.0, 54.0, 51.0, 62.0, 97.0, 134.0, 149.0, 200.0, 257.0, 346.0, 599.0, 1127.0, 2551.0, 7353.0, 22009.0, 85231.0, 686308.0, 188341.0, 34709.0, 11049.0, 3823.0, 1514.0, 787.0, 424.0, 296.0, 216.0, 136.0, 139.0, 94.0, 76.0, 67.0, 40.0, 29.0, 43.0, 23.0, 12.0, 16.0, 13.0, 13.0, 5.0, 7.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.21875, -13.72314453125, -13.2275390625, -12.73193359375, -12.236328125, -11.74072265625, -11.2451171875, -10.74951171875, -10.25390625, -9.75830078125, -9.2626953125, -8.76708984375, -8.271484375, -7.77587890625, -7.2802734375, -6.78466796875, -6.2890625, -5.79345703125, -5.2978515625, -4.80224609375, -4.306640625, -3.81103515625, -3.3154296875, -2.81982421875, -2.32421875, -1.82861328125, -1.3330078125, -0.83740234375, -0.341796875, 0.15380859375, 0.6494140625, 1.14501953125, 1.640625, 2.13623046875, 2.6318359375, 3.12744140625, 3.623046875, 4.11865234375, 4.6142578125, 5.10986328125, 5.60546875, 6.10107421875, 6.5966796875, 7.09228515625, 7.587890625, 8.08349609375, 8.5791015625, 9.07470703125, 9.5703125, 10.06591796875, 10.5615234375, 11.05712890625, 11.552734375, 12.04833984375, 12.5439453125, 13.03955078125, 13.53515625, 14.03076171875, 14.5263671875, 15.02197265625, 15.517578125, 16.01318359375, 16.5087890625, 17.00439453125, 17.5]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 7.0, 8.0, 4.0, 5.0, 8.0, 10.0, 12.0, 19.0, 19.0, 25.0, 32.0, 20.0, 25.0, 36.0, 40.0, 31.0, 40.0, 59.0, 79.0, 195.0, 1462.0, 313.0, 118.0, 79.0, 53.0, 51.0, 51.0, 35.0, 45.0, 26.0, 19.0, 26.0, 21.0, 18.0, 9.0, 9.0, 12.0, 3.0, 10.0, 4.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0], "bins": [-24.9375, -24.295166015625, -23.65283203125, -23.010498046875, -22.3681640625, -21.725830078125, -21.08349609375, -20.441162109375, -19.798828125, -19.156494140625, -18.51416015625, -17.871826171875, -17.2294921875, -16.587158203125, -15.94482421875, -15.302490234375, -14.66015625, -14.017822265625, -13.37548828125, -12.733154296875, -12.0908203125, -11.448486328125, -10.80615234375, -10.163818359375, -9.521484375, -8.879150390625, -8.23681640625, -7.594482421875, -6.9521484375, -6.309814453125, -5.66748046875, -5.025146484375, -4.3828125, -3.740478515625, -3.09814453125, -2.455810546875, -1.8134765625, -1.171142578125, -0.52880859375, 0.113525390625, 0.755859375, 1.398193359375, 2.04052734375, 2.682861328125, 3.3251953125, 3.967529296875, 4.60986328125, 5.252197265625, 5.89453125, 6.536865234375, 7.17919921875, 7.821533203125, 8.4638671875, 9.106201171875, 9.74853515625, 10.390869140625, 11.033203125, 11.675537109375, 12.31787109375, 12.960205078125, 13.6025390625, 14.244873046875, 14.88720703125, 15.529541015625, 16.171875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 7.0, 4.0, 9.0, 11.0, 8.0, 12.0, 17.0, 12.0, 24.0, 31.0, 26.0, 41.0, 65.0, 70.0, 110.0, 161.0, 299.0, 692.0, 2622.0, 41013.0, 3006496.0, 88260.0, 3859.0, 851.0, 350.0, 171.0, 101.0, 75.0, 55.0, 46.0, 49.0, 29.0, 23.0, 24.0, 15.0, 14.0, 17.0, 10.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.59375, -43.87939453125, -42.1650390625, -40.45068359375, -38.736328125, -37.02197265625, -35.3076171875, -33.59326171875, -31.87890625, -30.16455078125, -28.4501953125, -26.73583984375, -25.021484375, -23.30712890625, -21.5927734375, -19.87841796875, -18.1640625, -16.44970703125, -14.7353515625, -13.02099609375, -11.306640625, -9.59228515625, -7.8779296875, -6.16357421875, -4.44921875, -2.73486328125, -1.0205078125, 0.69384765625, 2.408203125, 4.12255859375, 5.8369140625, 7.55126953125, 9.265625, 10.97998046875, 12.6943359375, 14.40869140625, 16.123046875, 17.83740234375, 19.5517578125, 21.26611328125, 22.98046875, 24.69482421875, 26.4091796875, 28.12353515625, 29.837890625, 31.55224609375, 33.2666015625, 34.98095703125, 36.6953125, 38.40966796875, 40.1240234375, 41.83837890625, 43.552734375, 45.26708984375, 46.9814453125, 48.69580078125, 50.41015625, 52.12451171875, 53.8388671875, 55.55322265625, 57.267578125, 58.98193359375, 60.6962890625, 62.41064453125, 64.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [7.0, 81.0, 356.0, 417.0, 137.0, 18.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.232892990112305, -9.023740768432617, -4.814587593078613, -0.6054344177246094, 3.603717803955078, 7.812870025634766, 12.022024154663086, 16.231176376342773, 20.44032859802246, 24.64948081970215, 28.85863494873047, 33.067787170410156, 37.276939392089844, 41.48609161376953, 45.69524383544922, 49.904396057128906, 54.113548278808594, 58.32270050048828, 62.53185272216797, 66.74100494384766, 70.95015716552734, 75.15930938720703, 79.36846923828125, 83.57762145996094, 87.78677368164062, 91.99592590332031, 96.205078125, 100.41423034667969, 104.62338256835938, 108.83253479003906, 113.04168701171875, 117.25083923339844, 121.46000671386719, 125.66915893554688, 129.87831115722656, 134.08746337890625, 138.29661560058594, 142.50576782226562, 146.7149200439453, 150.924072265625, 155.1332244873047, 159.34237670898438, 163.55152893066406, 167.76068115234375, 171.96983337402344, 176.17898559570312, 180.3881378173828, 184.5972900390625, 188.80645751953125, 193.01560974121094, 197.22476196289062, 201.4339141845703, 205.64306640625, 209.8522186279297, 214.06137084960938, 218.27052307128906, 222.47967529296875, 226.68882751464844, 230.89797973632812, 235.1071319580078, 239.3162841796875, 243.5254364013672, 247.73458862304688, 251.94374084472656, 256.15289306640625]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 9.0, 4.0, 8.0, 7.0, 7.0, 10.0, 17.0, 16.0, 23.0, 16.0, 24.0, 24.0, 30.0, 27.0, 28.0, 34.0, 35.0, 38.0, 32.0, 40.0, 36.0, 38.0, 41.0, 36.0, 41.0, 30.0, 30.0, 36.0, 26.0, 34.0, 20.0, 29.0, 16.0, 26.0, 18.0, 20.0, 27.0, 15.0, 13.0, 10.0, 10.0, 8.0, 3.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.96725082397461, -46.43487548828125, -44.902503967285156, -43.3701286315918, -41.83775329589844, -40.30537796020508, -38.77300262451172, -37.240631103515625, -35.708255767822266, -34.175880432128906, -32.64350891113281, -31.111133575439453, -29.578758239746094, -28.046382904052734, -26.514009475708008, -24.98163604736328, -23.449260711669922, -21.916885375976562, -20.384511947631836, -18.85213851928711, -17.31976318359375, -15.787388801574707, -14.255014419555664, -12.722640037536621, -11.190265655517578, -9.657891273498535, -8.125516891479492, -6.593142509460449, -5.060768127441406, -3.5283937454223633, -1.9960193634033203, -0.46364498138427734, 1.0687255859375, 2.601099967956543, 4.133474349975586, 5.665848731994629, 7.198223114013672, 8.730597496032715, 10.262971878051758, 11.7953462600708, 13.327720642089844, 14.860095024108887, 16.39246940612793, 17.924842834472656, 19.457218170166016, 20.989593505859375, 22.5219669342041, 24.054340362548828, 25.586715698242188, 27.119091033935547, 28.651464462280273, 30.183837890625, 31.71621322631836, 33.24858856201172, 34.78096008300781, 36.31333541870117, 37.84571075439453, 39.37808609008789, 40.91046142578125, 42.442832946777344, 43.9752082824707, 45.50758361816406, 47.039955139160156, 48.572330474853516, 50.104705810546875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 4.0, 7.0, 9.0, 11.0, 11.0, 15.0, 12.0, 18.0, 18.0, 27.0, 30.0, 18.0, 44.0, 39.0, 37.0, 39.0, 41.0, 34.0, 38.0, 49.0, 42.0, 43.0, 34.0, 42.0, 31.0, 33.0, 35.0, 23.0, 27.0, 28.0, 31.0, 17.0, 10.0, 24.0, 8.0, 9.0, 6.0, 8.0, 9.0, 9.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.6640625, -6.43975830078125, -6.2154541015625, -5.99114990234375, -5.766845703125, -5.54254150390625, -5.3182373046875, -5.09393310546875, -4.86962890625, -4.64532470703125, -4.4210205078125, -4.19671630859375, -3.972412109375, -3.74810791015625, -3.5238037109375, -3.29949951171875, -3.0751953125, -2.85089111328125, -2.6265869140625, -2.40228271484375, -2.177978515625, -1.95367431640625, -1.7293701171875, -1.50506591796875, -1.28076171875, -1.05645751953125, -0.8321533203125, -0.60784912109375, -0.383544921875, -0.15924072265625, 0.0650634765625, 0.28936767578125, 0.513671875, 0.73797607421875, 0.9622802734375, 1.18658447265625, 1.410888671875, 1.63519287109375, 1.8594970703125, 2.08380126953125, 2.30810546875, 2.53240966796875, 2.7567138671875, 2.98101806640625, 3.205322265625, 3.42962646484375, 3.6539306640625, 3.87823486328125, 4.1025390625, 4.32684326171875, 4.5511474609375, 4.77545166015625, 4.999755859375, 5.22406005859375, 5.4483642578125, 5.67266845703125, 5.89697265625, 6.12127685546875, 6.3455810546875, 6.56988525390625, 6.794189453125, 7.01849365234375, 7.2427978515625, 7.46710205078125, 7.69140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 7.0, 19.0, 14.0, 17.0, 20.0, 22.0, 28.0, 53.0, 73.0, 109.0, 168.0, 304.0, 579.0, 1382.0, 3603.0, 10775.0, 38377.0, 163390.0, 725926.0, 1874473.0, 1052404.0, 244571.0, 55213.0, 14540.0, 4744.0, 1716.0, 710.0, 396.0, 166.0, 149.0, 69.0, 69.0, 32.0, 27.0, 27.0, 23.0, 14.0, 14.0, 6.0, 8.0, 7.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.53125, -10.1983642578125, -9.865478515625, -9.5325927734375, -9.19970703125, -8.8668212890625, -8.533935546875, -8.2010498046875, -7.8681640625, -7.5352783203125, -7.202392578125, -6.8695068359375, -6.53662109375, -6.2037353515625, -5.870849609375, -5.5379638671875, -5.205078125, -4.8721923828125, -4.539306640625, -4.2064208984375, -3.87353515625, -3.5406494140625, -3.207763671875, -2.8748779296875, -2.5419921875, -2.2091064453125, -1.876220703125, -1.5433349609375, -1.21044921875, -0.8775634765625, -0.544677734375, -0.2117919921875, 0.12109375, 0.4539794921875, 0.786865234375, 1.1197509765625, 1.45263671875, 1.7855224609375, 2.118408203125, 2.4512939453125, 2.7841796875, 3.1170654296875, 3.449951171875, 3.7828369140625, 4.11572265625, 4.4486083984375, 4.781494140625, 5.1143798828125, 5.447265625, 5.7801513671875, 6.113037109375, 6.4459228515625, 6.77880859375, 7.1116943359375, 7.444580078125, 7.7774658203125, 8.1103515625, 8.4432373046875, 8.776123046875, 9.1090087890625, 9.44189453125, 9.7747802734375, 10.107666015625, 10.4405517578125, 10.7734375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 4.0, 7.0, 14.0, 15.0, 23.0, 29.0, 32.0, 58.0, 72.0, 104.0, 144.0, 189.0, 281.0, 384.0, 490.0, 480.0, 480.0, 334.0, 259.0, 199.0, 130.0, 87.0, 58.0, 50.0, 37.0, 25.0, 22.0, 13.0, 14.0, 12.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.4605712890625, -12.061767578125, -11.6629638671875, -11.26416015625, -10.8653564453125, -10.466552734375, -10.0677490234375, -9.6689453125, -9.2701416015625, -8.871337890625, -8.4725341796875, -8.07373046875, -7.6749267578125, -7.276123046875, -6.8773193359375, -6.478515625, -6.0797119140625, -5.680908203125, -5.2821044921875, -4.88330078125, -4.4844970703125, -4.085693359375, -3.6868896484375, -3.2880859375, -2.8892822265625, -2.490478515625, -2.0916748046875, -1.69287109375, -1.2940673828125, -0.895263671875, -0.4964599609375, -0.09765625, 0.3011474609375, 0.699951171875, 1.0987548828125, 1.49755859375, 1.8963623046875, 2.295166015625, 2.6939697265625, 3.0927734375, 3.4915771484375, 3.890380859375, 4.2891845703125, 4.68798828125, 5.0867919921875, 5.485595703125, 5.8843994140625, 6.283203125, 6.6820068359375, 7.080810546875, 7.4796142578125, 7.87841796875, 8.2772216796875, 8.676025390625, 9.0748291015625, 9.4736328125, 9.8724365234375, 10.271240234375, 10.6700439453125, 11.06884765625, 11.4676513671875, 11.866455078125, 12.2652587890625, 12.6640625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 10.0, 19.0, 13.0, 22.0, 18.0, 39.0, 58.0, 80.0, 113.0, 171.0, 307.0, 594.0, 1398.0, 4944.0, 42323.0, 969154.0, 3019405.0, 140610.0, 10939.0, 2137.0, 816.0, 372.0, 250.0, 155.0, 95.0, 76.0, 40.0, 29.0, 21.0, 19.0, 13.0, 7.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.125, -29.1279296875, -28.130859375, -27.1337890625, -26.13671875, -25.1396484375, -24.142578125, -23.1455078125, -22.1484375, -21.1513671875, -20.154296875, -19.1572265625, -18.16015625, -17.1630859375, -16.166015625, -15.1689453125, -14.171875, -13.1748046875, -12.177734375, -11.1806640625, -10.18359375, -9.1865234375, -8.189453125, -7.1923828125, -6.1953125, -5.1982421875, -4.201171875, -3.2041015625, -2.20703125, -1.2099609375, -0.212890625, 0.7841796875, 1.78125, 2.7783203125, 3.775390625, 4.7724609375, 5.76953125, 6.7666015625, 7.763671875, 8.7607421875, 9.7578125, 10.7548828125, 11.751953125, 12.7490234375, 13.74609375, 14.7431640625, 15.740234375, 16.7373046875, 17.734375, 18.7314453125, 19.728515625, 20.7255859375, 21.72265625, 22.7197265625, 23.716796875, 24.7138671875, 25.7109375, 26.7080078125, 27.705078125, 28.7021484375, 29.69921875, 30.6962890625, 31.693359375, 32.6904296875, 33.6875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 31.0, 132.0, 335.0, 358.0, 138.0, 14.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.94461059570312, -162.89486694335938, -156.84510803222656, -150.7953643798828, -144.74560546875, -138.69586181640625, -132.6461181640625, -126.59635925292969, -120.5466079711914, -114.49685668945312, -108.44710540771484, -102.39735412597656, -96.34761047363281, -90.2978515625, -84.24810791015625, -78.19835662841797, -72.14860534667969, -66.0988540649414, -60.049102783203125, -53.99935531616211, -47.94960403442383, -41.89985275268555, -35.85010528564453, -29.80035400390625, -23.75060272216797, -17.700851440429688, -11.651102066040039, -5.601352691650391, 0.4483985900878906, 6.498149871826172, 12.547897338867188, 18.59764862060547, 24.647384643554688, 30.69713592529297, 36.74688720703125, 42.796634674072266, 48.84638595581055, 54.89613723754883, 60.945884704589844, 66.99563598632812, 73.0453872680664, 79.09513854980469, 85.14488983154297, 91.19464111328125, 97.244384765625, 103.29414367675781, 109.34388732910156, 115.39363861083984, 121.44338989257812, 127.4931411743164, 133.5428924560547, 139.59263610839844, 145.64239501953125, 151.692138671875, 157.74188232421875, 163.79164123535156, 169.84140014648438, 175.89114379882812, 181.94090270996094, 187.9906463623047, 194.0404052734375, 200.09014892578125, 206.139892578125, 212.1896514892578, 218.23939514160156]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 9.0, 12.0, 12.0, 12.0, 20.0, 20.0, 11.0, 22.0, 23.0, 32.0, 34.0, 37.0, 31.0, 46.0, 37.0, 32.0, 40.0, 47.0, 33.0, 48.0, 38.0, 28.0, 29.0, 33.0, 41.0, 37.0, 35.0, 14.0, 21.0, 21.0, 27.0, 17.0, 10.0, 16.0, 15.0, 13.0, 10.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.40069580078125, -36.1751708984375, -34.94964599609375, -33.724117279052734, -32.498592376708984, -31.273067474365234, -30.04754066467285, -28.82201385498047, -27.59648895263672, -26.37096405029297, -25.145437240600586, -23.919910430908203, -22.694385528564453, -21.468860626220703, -20.24333381652832, -19.017807006835938, -17.792282104492188, -16.566757202148438, -15.341230392456055, -14.115704536437988, -12.890178680419922, -11.664652824401855, -10.439126968383789, -9.213601112365723, -7.988075256347656, -6.76254940032959, -5.537023544311523, -4.311497688293457, -3.0859718322753906, -1.8604459762573242, -0.6349201202392578, 0.5906057357788086, 1.8161354064941406, 3.041661262512207, 4.267187118530273, 5.49271297454834, 6.718238830566406, 7.943764686584473, 9.169290542602539, 10.394816398620605, 11.620342254638672, 12.845868110656738, 14.071393966674805, 15.296919822692871, 16.522445678710938, 17.747970581054688, 18.97349739074707, 20.199024200439453, 21.424549102783203, 22.650074005126953, 23.875600814819336, 25.10112762451172, 26.32665252685547, 27.55217742919922, 28.7777042388916, 30.003231048583984, 31.228755950927734, 32.454280853271484, 33.6798095703125, 34.90533447265625, 36.130859375, 37.35638427734375, 38.5819091796875, 39.807437896728516, 41.032962799072266]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 10.0, 5.0, 11.0, 10.0, 13.0, 26.0, 22.0, 20.0, 28.0, 21.0, 32.0, 44.0, 35.0, 36.0, 37.0, 56.0, 48.0, 47.0, 48.0, 47.0, 37.0, 46.0, 45.0, 37.0, 32.0, 31.0, 22.0, 19.0, 21.0, 21.0, 18.0, 13.0, 16.0, 10.0, 9.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.006591796875, -6.76318359375, -6.519775390625, -6.2763671875, -6.032958984375, -5.78955078125, -5.546142578125, -5.302734375, -5.059326171875, -4.81591796875, -4.572509765625, -4.3291015625, -4.085693359375, -3.84228515625, -3.598876953125, -3.35546875, -3.112060546875, -2.86865234375, -2.625244140625, -2.3818359375, -2.138427734375, -1.89501953125, -1.651611328125, -1.408203125, -1.164794921875, -0.92138671875, -0.677978515625, -0.4345703125, -0.191162109375, 0.05224609375, 0.295654296875, 0.5390625, 0.782470703125, 1.02587890625, 1.269287109375, 1.5126953125, 1.756103515625, 1.99951171875, 2.242919921875, 2.486328125, 2.729736328125, 2.97314453125, 3.216552734375, 3.4599609375, 3.703369140625, 3.94677734375, 4.190185546875, 4.43359375, 4.677001953125, 4.92041015625, 5.163818359375, 5.4072265625, 5.650634765625, 5.89404296875, 6.137451171875, 6.380859375, 6.624267578125, 6.86767578125, 7.111083984375, 7.3544921875, 7.597900390625, 7.84130859375, 8.084716796875, 8.328125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 17.0, 16.0, 30.0, 39.0, 54.0, 93.0, 142.0, 206.0, 287.0, 446.0, 575.0, 925.0, 1405.0, 2110.0, 3034.0, 4723.0, 7320.0, 10912.0, 16870.0, 25890.0, 39162.0, 59454.0, 86754.0, 118581.0, 144067.0, 143976.0, 118776.0, 87437.0, 59737.0, 39730.0, 26043.0, 17293.0, 11091.0, 7257.0, 4662.0, 3038.0, 2075.0, 1340.0, 979.0, 602.0, 414.0, 311.0, 220.0, 131.0, 109.0, 68.0, 39.0, 41.0, 28.0, 11.0, 11.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7402877807617188, -0.7164154052734375, -0.6925430297851562, -0.668670654296875, -0.6447982788085938, -0.6209259033203125, -0.5970535278320312, -0.57318115234375, -0.5493087768554688, -0.5254364013671875, -0.5015640258789062, -0.477691650390625, -0.45381927490234375, -0.4299468994140625, -0.40607452392578125, -0.3822021484375, -0.35832977294921875, -0.3344573974609375, -0.31058502197265625, -0.286712646484375, -0.26284027099609375, -0.2389678955078125, -0.21509552001953125, -0.19122314453125, -0.16735076904296875, -0.1434783935546875, -0.11960601806640625, -0.095733642578125, -0.07186126708984375, -0.0479888916015625, -0.02411651611328125, -0.000244140625, 0.02362823486328125, 0.0475006103515625, 0.07137298583984375, 0.095245361328125, 0.11911773681640625, 0.1429901123046875, 0.16686248779296875, 0.19073486328125, 0.21460723876953125, 0.2384796142578125, 0.26235198974609375, 0.286224365234375, 0.31009674072265625, 0.3339691162109375, 0.35784149169921875, 0.3817138671875, 0.40558624267578125, 0.4294586181640625, 0.45333099365234375, 0.477203369140625, 0.5010757446289062, 0.5249481201171875, 0.5488204956054688, 0.57269287109375, 0.5965652465820312, 0.6204376220703125, 0.6443099975585938, 0.668182373046875, 0.6920547485351562, 0.7159271240234375, 0.7397994995117188, 0.763671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 3.0, 9.0, 12.0, 6.0, 4.0, 9.0, 9.0, 24.0, 20.0, 17.0, 32.0, 35.0, 35.0, 35.0, 39.0, 38.0, 49.0, 36.0, 1076.0, 44.0, 46.0, 44.0, 38.0, 34.0, 50.0, 29.0, 27.0, 23.0, 27.0, 22.0, 23.0, 24.0, 19.0, 23.0, 13.0, 12.0, 9.0, 1.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.47174072265625, -4.3223876953125, -4.17303466796875, -4.023681640625, -3.87432861328125, -3.7249755859375, -3.57562255859375, -3.42626953125, -3.27691650390625, -3.1275634765625, -2.97821044921875, -2.828857421875, -2.67950439453125, -2.5301513671875, -2.38079833984375, -2.2314453125, -2.08209228515625, -1.9327392578125, -1.78338623046875, -1.634033203125, -1.48468017578125, -1.3353271484375, -1.18597412109375, -1.03662109375, -0.88726806640625, -0.7379150390625, -0.58856201171875, -0.439208984375, -0.28985595703125, -0.1405029296875, 0.00885009765625, 0.158203125, 0.30755615234375, 0.4569091796875, 0.60626220703125, 0.755615234375, 0.90496826171875, 1.0543212890625, 1.20367431640625, 1.35302734375, 1.50238037109375, 1.6517333984375, 1.80108642578125, 1.950439453125, 2.09979248046875, 2.2491455078125, 2.39849853515625, 2.5478515625, 2.69720458984375, 2.8465576171875, 2.99591064453125, 3.145263671875, 3.29461669921875, 3.4439697265625, 3.59332275390625, 3.74267578125, 3.89202880859375, 4.0413818359375, 4.19073486328125, 4.340087890625, 4.48944091796875, 4.6387939453125, 4.78814697265625, 4.9375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 2.0, 5.0, 9.0, 29.0, 16.0, 45.0, 83.0, 96.0, 167.0, 239.0, 385.0, 593.0, 940.0, 1454.0, 2237.0, 3452.0, 5451.0, 8836.0, 13881.0, 21530.0, 32749.0, 49931.0, 73228.0, 103316.0, 133520.0, 1195844.0, 132567.0, 102911.0, 72987.0, 49552.0, 32658.0, 21217.0, 13477.0, 8647.0, 5498.0, 3545.0, 2237.0, 1358.0, 872.0, 548.0, 387.0, 220.0, 150.0, 77.0, 59.0, 40.0, 24.0, 18.0, 20.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5086288452148438, -0.4913787841796875, -0.47412872314453125, -0.456878662109375, -0.43962860107421875, -0.4223785400390625, -0.40512847900390625, -0.38787841796875, -0.37062835693359375, -0.3533782958984375, -0.33612823486328125, -0.318878173828125, -0.30162811279296875, -0.2843780517578125, -0.26712799072265625, -0.2498779296875, -0.23262786865234375, -0.2153778076171875, -0.19812774658203125, -0.180877685546875, -0.16362762451171875, -0.1463775634765625, -0.12912750244140625, -0.11187744140625, -0.09462738037109375, -0.0773773193359375, -0.06012725830078125, -0.042877197265625, -0.02562713623046875, -0.0083770751953125, 0.00887298583984375, 0.026123046875, 0.04337310791015625, 0.0606231689453125, 0.07787322998046875, 0.095123291015625, 0.11237335205078125, 0.1296234130859375, 0.14687347412109375, 0.16412353515625, 0.18137359619140625, 0.1986236572265625, 0.21587371826171875, 0.233123779296875, 0.25037384033203125, 0.2676239013671875, 0.28487396240234375, 0.3021240234375, 0.31937408447265625, 0.3366241455078125, 0.35387420654296875, 0.371124267578125, 0.38837432861328125, 0.4056243896484375, 0.42287445068359375, 0.44012451171875, 0.45737457275390625, 0.4746246337890625, 0.49187469482421875, 0.509124755859375, 0.5263748168945312, 0.5436248779296875, 0.5608749389648438, 0.578125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 4.0, 6.0, 20.0, 18.0, 21.0, 17.0, 41.0, 49.0, 65.0, 127.0, 165.0, 142.0, 76.0, 63.0, 35.0, 30.0, 18.0, 23.0, 17.0, 9.0, 7.0, 1.0, 4.0, 2.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01270294189453125, -0.0122758150100708, -0.011848688125610352, -0.011421561241149902, -0.010994434356689453, -0.010567307472229004, -0.010140180587768555, -0.009713053703308105, -0.009285926818847656, -0.008858799934387207, -0.008431673049926758, -0.008004546165466309, -0.007577419281005859, -0.00715029239654541, -0.006723165512084961, -0.006296038627624512, -0.0058689117431640625, -0.005441784858703613, -0.005014657974243164, -0.004587531089782715, -0.004160404205322266, -0.0037332773208618164, -0.003306150436401367, -0.002879023551940918, -0.0024518966674804688, -0.0020247697830200195, -0.0015976428985595703, -0.001170516014099121, -0.0007433891296386719, -0.00031626224517822266, 0.00011086463928222656, 0.0005379915237426758, 0.000965118408203125, 0.0013922452926635742, 0.0018193721771240234, 0.0022464990615844727, 0.002673625946044922, 0.003100752830505371, 0.0035278797149658203, 0.0039550065994262695, 0.004382133483886719, 0.004809260368347168, 0.005236387252807617, 0.005663514137268066, 0.006090641021728516, 0.006517767906188965, 0.006944894790649414, 0.007372021675109863, 0.0077991485595703125, 0.008226275444030762, 0.008653402328491211, 0.00908052921295166, 0.00950765609741211, 0.009934782981872559, 0.010361909866333008, 0.010789036750793457, 0.011216163635253906, 0.011643290519714355, 0.012070417404174805, 0.012497544288635254, 0.012924671173095703, 0.013351798057556152, 0.013778924942016602, 0.01420605182647705, 0.0146331787109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 1.0, 10.0, 11.0, 16.0, 27.0, 23.0, 39.0, 71.0, 107.0, 203.0, 473.0, 6216.0, 1038265.0, 2149.0, 428.0, 170.0, 91.0, 67.0, 40.0, 37.0, 23.0, 14.0, 10.0, 6.0, 13.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3037109375, -0.29488372802734375, -0.2860565185546875, -0.27722930908203125, -0.268402099609375, -0.25957489013671875, -0.2507476806640625, -0.24192047119140625, -0.23309326171875, -0.22426605224609375, -0.2154388427734375, -0.20661163330078125, -0.197784423828125, -0.18895721435546875, -0.1801300048828125, -0.17130279541015625, -0.1624755859375, -0.15364837646484375, -0.1448211669921875, -0.13599395751953125, -0.127166748046875, -0.11833953857421875, -0.1095123291015625, -0.10068511962890625, -0.09185791015625, -0.08303070068359375, -0.0742034912109375, -0.06537628173828125, -0.056549072265625, -0.04772186279296875, -0.0388946533203125, -0.03006744384765625, -0.021240234375, -0.01241302490234375, -0.0035858154296875, 0.00524139404296875, 0.014068603515625, 0.02289581298828125, 0.0317230224609375, 0.04055023193359375, 0.04937744140625, 0.05820465087890625, 0.0670318603515625, 0.07585906982421875, 0.084686279296875, 0.09351348876953125, 0.1023406982421875, 0.11116790771484375, 0.1199951171875, 0.12882232666015625, 0.1376495361328125, 0.14647674560546875, 0.155303955078125, 0.16413116455078125, 0.1729583740234375, 0.18178558349609375, 0.19061279296875, 0.19944000244140625, 0.2082672119140625, 0.21709442138671875, 0.225921630859375, 0.23474884033203125, 0.2435760498046875, 0.25240325927734375, 0.26123046875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 968.0, 37.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11654668301343918, -0.11141981184482574, -0.10629294812679291, -0.10116607695817947, -0.09603920578956604, -0.0909123346209526, -0.08578546345233917, -0.08065859973430634, -0.0755317285656929, -0.07040485739707947, -0.06527799367904663, -0.0601511225104332, -0.05502425134181976, -0.04989738017320633, -0.044770512729883194, -0.03964364528656006, -0.034516774117946625, -0.02938990481197834, -0.024263035506010056, -0.01913616620004177, -0.014009296894073486, -0.008882427588105202, -0.003755558282136917, 0.0013713091611862183, 0.006498180329799652, 0.011625049635767937, 0.01675191894173622, 0.021878788247704506, 0.02700565755367279, 0.032132528722286224, 0.03725939616560936, 0.042386263608932495, 0.047513142228126526, 0.05264001339673996, 0.057766880840063095, 0.06289374828338623, 0.06802061945199966, 0.0731474906206131, 0.07827435433864594, 0.08340122550725937, 0.0885280966758728, 0.09365496784448624, 0.09878183901309967, 0.10390870273113251, 0.10903557389974594, 0.11416244506835938, 0.11928930878639221, 0.12441617995500565, 0.12954305112361908, 0.13466991484165192, 0.13979679346084595, 0.14492365717887878, 0.15005052089691162, 0.15517739951610565, 0.1603042632341385, 0.16543114185333252, 0.17055800557136536, 0.1756848692893982, 0.18081174790859222, 0.18593861162662506, 0.1910654902458191, 0.19619235396385193, 0.20131921768188477, 0.2064460813999176, 0.21157296001911163]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 10.0, 3.0, 16.0, 20.0, 21.0, 21.0, 31.0, 41.0, 44.0, 47.0, 62.0, 47.0, 45.0, 44.0, 57.0, 72.0, 46.0, 58.0, 54.0, 39.0, 34.0, 41.0, 24.0, 24.0, 18.0, 16.0, 14.0, 5.0, 5.0, 6.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010081470012664795, -0.00971247348934412, -0.009343476966023445, -0.00897448044270277, -0.008605483919382095, -0.00823648739606142, -0.007867490872740746, -0.007498494349420071, -0.007129497826099396, -0.006760501302778721, -0.006391504779458046, -0.006022508256137371, -0.005653511732816696, -0.005284515209496021, -0.004915518686175346, -0.0045465221628546715, -0.004177525639533997, -0.0038085291162133217, -0.003439532592892647, -0.003070536069571972, -0.002701539546251297, -0.002332543022930622, -0.001963546499609947, -0.0015945499762892723, -0.0012255534529685974, -0.0008565569296479225, -0.0004875604063272476, -0.00011856388300657272, 0.00025043264031410217, 0.0006194291636347771, 0.000988425686955452, 0.0013574222102761269, 0.0017264187335968018, 0.0020954152569174767, 0.0024644117802381516, 0.0028334083035588264, 0.0032024048268795013, 0.0035714013502001762, 0.003940397873520851, 0.004309394396841526, 0.004678390920162201, 0.005047387443482876, 0.005416383966803551, 0.005785380490124226, 0.0061543770134449005, 0.006523373536765575, 0.00689237006008625, 0.007261366583406925, 0.0076303631067276, 0.007999359630048275, 0.00836835615336895, 0.008737352676689625, 0.0091063492000103, 0.009475345723330975, 0.00984434224665165, 0.010213338769972324, 0.010582335293293, 0.010951331816613674, 0.011320328339934349, 0.011689324863255024, 0.012058321386575699, 0.012427317909896374, 0.012796314433217049, 0.013165310956537724, 0.013534307479858398]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 10.0, 5.0, 11.0, 10.0, 13.0, 26.0, 22.0, 20.0, 28.0, 21.0, 32.0, 44.0, 35.0, 36.0, 37.0, 56.0, 48.0, 47.0, 48.0, 47.0, 37.0, 46.0, 45.0, 37.0, 33.0, 30.0, 22.0, 19.0, 21.0, 21.0, 18.0, 13.0, 16.0, 10.0, 9.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.006591796875, -6.76318359375, -6.519775390625, -6.2763671875, -6.032958984375, -5.78955078125, -5.546142578125, -5.302734375, -5.059326171875, -4.81591796875, -4.572509765625, -4.3291015625, -4.085693359375, -3.84228515625, -3.598876953125, -3.35546875, -3.112060546875, -2.86865234375, -2.625244140625, -2.3818359375, -2.138427734375, -1.89501953125, -1.651611328125, -1.408203125, -1.164794921875, -0.92138671875, -0.677978515625, -0.4345703125, -0.191162109375, 0.05224609375, 0.295654296875, 0.5390625, 0.782470703125, 1.02587890625, 1.269287109375, 1.5126953125, 1.756103515625, 1.99951171875, 2.242919921875, 2.486328125, 2.729736328125, 2.97314453125, 3.216552734375, 3.4599609375, 3.703369140625, 3.94677734375, 4.190185546875, 4.43359375, 4.677001953125, 4.92041015625, 5.163818359375, 5.4072265625, 5.650634765625, 5.89404296875, 6.137451171875, 6.380859375, 6.624267578125, 6.86767578125, 7.111083984375, 7.3544921875, 7.597900390625, 7.84130859375, 8.084716796875, 8.328125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 17.0, 19.0, 25.0, 37.0, 57.0, 78.0, 98.0, 161.0, 253.0, 398.0, 669.0, 1135.0, 2040.0, 4037.0, 8320.0, 18574.0, 42975.0, 99290.0, 234972.0, 348306.0, 161247.0, 69430.0, 30214.0, 13134.0, 6209.0, 2937.0, 1563.0, 853.0, 530.0, 326.0, 195.0, 131.0, 90.0, 61.0, 50.0, 25.0, 26.0, 17.0, 11.0, 12.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.99609375, -7.70306396484375, -7.4100341796875, -7.11700439453125, -6.823974609375, -6.53094482421875, -6.2379150390625, -5.94488525390625, -5.65185546875, -5.35882568359375, -5.0657958984375, -4.77276611328125, -4.479736328125, -4.18670654296875, -3.8936767578125, -3.60064697265625, -3.3076171875, -3.01458740234375, -2.7215576171875, -2.42852783203125, -2.135498046875, -1.84246826171875, -1.5494384765625, -1.25640869140625, -0.96337890625, -0.67034912109375, -0.3773193359375, -0.08428955078125, 0.208740234375, 0.50177001953125, 0.7947998046875, 1.08782958984375, 1.380859375, 1.67388916015625, 1.9669189453125, 2.25994873046875, 2.552978515625, 2.84600830078125, 3.1390380859375, 3.43206787109375, 3.72509765625, 4.01812744140625, 4.3111572265625, 4.60418701171875, 4.897216796875, 5.19024658203125, 5.4832763671875, 5.77630615234375, 6.0693359375, 6.36236572265625, 6.6553955078125, 6.94842529296875, 7.241455078125, 7.53448486328125, 7.8275146484375, 8.12054443359375, 8.41357421875, 8.70660400390625, 8.9996337890625, 9.29266357421875, 9.585693359375, 9.87872314453125, 10.1717529296875, 10.46478271484375, 10.7578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 6.0, 12.0, 6.0, 6.0, 13.0, 15.0, 13.0, 8.0, 20.0, 27.0, 28.0, 28.0, 36.0, 29.0, 37.0, 59.0, 69.0, 66.0, 118.0, 182.0, 1294.0, 274.0, 149.0, 99.0, 64.0, 44.0, 41.0, 43.0, 30.0, 30.0, 17.0, 31.0, 21.0, 15.0, 15.0, 16.0, 17.0, 10.0, 7.0, 10.0, 5.0, 6.0, 4.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.234375, -16.677978515625, -16.12158203125, -15.565185546875, -15.0087890625, -14.452392578125, -13.89599609375, -13.339599609375, -12.783203125, -12.226806640625, -11.67041015625, -11.114013671875, -10.5576171875, -10.001220703125, -9.44482421875, -8.888427734375, -8.33203125, -7.775634765625, -7.21923828125, -6.662841796875, -6.1064453125, -5.550048828125, -4.99365234375, -4.437255859375, -3.880859375, -3.324462890625, -2.76806640625, -2.211669921875, -1.6552734375, -1.098876953125, -0.54248046875, 0.013916015625, 0.5703125, 1.126708984375, 1.68310546875, 2.239501953125, 2.7958984375, 3.352294921875, 3.90869140625, 4.465087890625, 5.021484375, 5.577880859375, 6.13427734375, 6.690673828125, 7.2470703125, 7.803466796875, 8.35986328125, 8.916259765625, 9.47265625, 10.029052734375, 10.58544921875, 11.141845703125, 11.6982421875, 12.254638671875, 12.81103515625, 13.367431640625, 13.923828125, 14.480224609375, 15.03662109375, 15.593017578125, 16.1494140625, 16.705810546875, 17.26220703125, 17.818603515625, 18.375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 5.0, 9.0, 5.0, 5.0, 1.0, 9.0, 17.0, 19.0, 39.0, 45.0, 64.0, 85.0, 162.0, 209.0, 336.0, 714.0, 2705.0, 43063.0, 2574312.0, 507741.0, 13328.0, 1421.0, 548.0, 286.0, 198.0, 108.0, 77.0, 63.0, 41.0, 21.0, 31.0, 8.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.53125, -41.1943359375, -39.857421875, -38.5205078125, -37.18359375, -35.8466796875, -34.509765625, -33.1728515625, -31.8359375, -30.4990234375, -29.162109375, -27.8251953125, -26.48828125, -25.1513671875, -23.814453125, -22.4775390625, -21.140625, -19.8037109375, -18.466796875, -17.1298828125, -15.79296875, -14.4560546875, -13.119140625, -11.7822265625, -10.4453125, -9.1083984375, -7.771484375, -6.4345703125, -5.09765625, -3.7607421875, -2.423828125, -1.0869140625, 0.25, 1.5869140625, 2.923828125, 4.2607421875, 5.59765625, 6.9345703125, 8.271484375, 9.6083984375, 10.9453125, 12.2822265625, 13.619140625, 14.9560546875, 16.29296875, 17.6298828125, 18.966796875, 20.3037109375, 21.640625, 22.9775390625, 24.314453125, 25.6513671875, 26.98828125, 28.3251953125, 29.662109375, 30.9990234375, 32.3359375, 33.6728515625, 35.009765625, 36.3466796875, 37.68359375, 39.0205078125, 40.357421875, 41.6943359375, 43.03125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [4.0, 47.0, 322.0, 459.0, 167.0, 15.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.130380630493164, -11.101810455322266, -6.073239326477051, -1.044668197631836, 3.9839019775390625, 9.012472152709961, 14.041044235229492, 19.069612503051758, 24.09818458557129, 29.126754760742188, 34.15532684326172, 39.18389892578125, 44.212467193603516, 49.24103546142578, 54.26960754394531, 59.298179626464844, 64.32675170898438, 69.3553237915039, 74.38389587402344, 79.41246032714844, 84.44103240966797, 89.4696044921875, 94.49817657470703, 99.52674865722656, 104.55531311035156, 109.5838851928711, 114.61245727539062, 119.64102172851562, 124.66959381103516, 129.6981658935547, 134.72674560546875, 139.75531005859375, 144.7838897705078, 149.8124542236328, 154.84103393554688, 159.86959838867188, 164.89817810058594, 169.92674255371094, 174.955322265625, 179.98388671875, 185.012451171875, 190.041015625, 195.06959533691406, 200.09815979003906, 205.12673950195312, 210.15530395507812, 215.18386840820312, 220.2124481201172, 225.24102783203125, 230.26959228515625, 235.2981719970703, 240.3267364501953, 245.35531616210938, 250.38388061523438, 255.41244506835938, 260.4410095214844, 265.4695739746094, 270.4981384277344, 275.5267028808594, 280.5552978515625, 285.5838623046875, 290.6124267578125, 295.6409912109375, 300.6695556640625, 305.6981506347656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 6.0, 7.0, 4.0, 17.0, 18.0, 16.0, 22.0, 21.0, 16.0, 17.0, 26.0, 25.0, 22.0, 29.0, 37.0, 32.0, 41.0, 54.0, 37.0, 39.0, 51.0, 44.0, 33.0, 46.0, 31.0, 34.0, 35.0, 23.0, 27.0, 19.0, 22.0, 16.0, 19.0, 18.0, 20.0, 9.0, 10.0, 12.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.337684631347656, -45.98408508300781, -44.630489349365234, -43.27688980102539, -41.92329406738281, -40.56969451904297, -39.216094970703125, -37.86249542236328, -36.5088996887207, -35.15530014038086, -33.80170440673828, -32.44810485839844, -31.094507217407227, -29.740909576416016, -28.387310028076172, -27.03371238708496, -25.68011474609375, -24.32651710510254, -22.972919464111328, -21.619319915771484, -20.265722274780273, -18.912124633789062, -17.55852508544922, -16.204927444458008, -14.851329803466797, -13.497732162475586, -12.144133567810059, -10.790534973144531, -9.43693733215332, -8.08333969116211, -6.729741096496582, -5.376142501831055, -4.022544860839844, -2.6689467430114746, -1.3153486251831055, 0.03824949264526367, 1.3918476104736328, 2.745445728302002, 4.099043846130371, 5.452642440795898, 6.806240081787109, 8.15983772277832, 9.513436317443848, 10.867034912109375, 12.220632553100586, 13.574230194091797, 14.927828788757324, 16.28142738342285, 17.635025024414062, 18.988622665405273, 20.342220306396484, 21.695819854736328, 23.04941749572754, 24.40301513671875, 25.756614685058594, 27.110212326049805, 28.463809967041016, 29.817407608032227, 31.171005249023438, 32.52460479736328, 33.878204345703125, 35.2318000793457, 36.58539962768555, 37.938995361328125, 39.29259490966797]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 6.0, 7.0, 1.0, 7.0, 9.0, 10.0, 10.0, 9.0, 10.0, 21.0, 21.0, 17.0, 23.0, 12.0, 33.0, 29.0, 34.0, 33.0, 39.0, 35.0, 33.0, 52.0, 43.0, 41.0, 39.0, 41.0, 35.0, 33.0, 35.0, 33.0, 29.0, 28.0, 26.0, 19.0, 17.0, 21.0, 23.0, 20.0, 13.0, 17.0, 5.0, 8.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.9140625, -6.69317626953125, -6.4722900390625, -6.25140380859375, -6.030517578125, -5.80963134765625, -5.5887451171875, -5.36785888671875, -5.14697265625, -4.92608642578125, -4.7052001953125, -4.48431396484375, -4.263427734375, -4.04254150390625, -3.8216552734375, -3.60076904296875, -3.3798828125, -3.15899658203125, -2.9381103515625, -2.71722412109375, -2.496337890625, -2.27545166015625, -2.0545654296875, -1.83367919921875, -1.61279296875, -1.39190673828125, -1.1710205078125, -0.95013427734375, -0.729248046875, -0.50836181640625, -0.2874755859375, -0.06658935546875, 0.154296875, 0.37518310546875, 0.5960693359375, 0.81695556640625, 1.037841796875, 1.25872802734375, 1.4796142578125, 1.70050048828125, 1.92138671875, 2.14227294921875, 2.3631591796875, 2.58404541015625, 2.804931640625, 3.02581787109375, 3.2467041015625, 3.46759033203125, 3.6884765625, 3.90936279296875, 4.1302490234375, 4.35113525390625, 4.572021484375, 4.79290771484375, 5.0137939453125, 5.23468017578125, 5.45556640625, 5.67645263671875, 5.8973388671875, 6.11822509765625, 6.339111328125, 6.55999755859375, 6.7808837890625, 7.00177001953125, 7.22265625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 11.0, 12.0, 10.0, 28.0, 29.0, 50.0, 66.0, 93.0, 138.0, 232.0, 379.0, 631.0, 1166.0, 2361.0, 5043.0, 11858.0, 29863.0, 84292.0, 253912.0, 748805.0, 1484890.0, 1014405.0, 366068.0, 119555.0, 41387.0, 15868.0, 6548.0, 3033.0, 1499.0, 810.0, 442.0, 267.0, 187.0, 107.0, 70.0, 38.0, 40.0, 21.0, 16.0, 18.0, 14.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.078125, -7.822998046875, -7.56787109375, -7.312744140625, -7.0576171875, -6.802490234375, -6.54736328125, -6.292236328125, -6.037109375, -5.781982421875, -5.52685546875, -5.271728515625, -5.0166015625, -4.761474609375, -4.50634765625, -4.251220703125, -3.99609375, -3.740966796875, -3.48583984375, -3.230712890625, -2.9755859375, -2.720458984375, -2.46533203125, -2.210205078125, -1.955078125, -1.699951171875, -1.44482421875, -1.189697265625, -0.9345703125, -0.679443359375, -0.42431640625, -0.169189453125, 0.0859375, 0.341064453125, 0.59619140625, 0.851318359375, 1.1064453125, 1.361572265625, 1.61669921875, 1.871826171875, 2.126953125, 2.382080078125, 2.63720703125, 2.892333984375, 3.1474609375, 3.402587890625, 3.65771484375, 3.912841796875, 4.16796875, 4.423095703125, 4.67822265625, 4.933349609375, 5.1884765625, 5.443603515625, 5.69873046875, 5.953857421875, 6.208984375, 6.464111328125, 6.71923828125, 6.974365234375, 7.2294921875, 7.484619140625, 7.73974609375, 7.994873046875, 8.25]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 16.0, 17.0, 19.0, 16.0, 19.0, 40.0, 44.0, 72.0, 92.0, 132.0, 169.0, 204.0, 299.0, 440.0, 458.0, 446.0, 454.0, 326.0, 221.0, 145.0, 112.0, 71.0, 75.0, 41.0, 36.0, 21.0, 23.0, 13.0, 7.0, 13.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.125, -11.767578125, -11.41015625, -11.052734375, -10.6953125, -10.337890625, -9.98046875, -9.623046875, -9.265625, -8.908203125, -8.55078125, -8.193359375, -7.8359375, -7.478515625, -7.12109375, -6.763671875, -6.40625, -6.048828125, -5.69140625, -5.333984375, -4.9765625, -4.619140625, -4.26171875, -3.904296875, -3.546875, -3.189453125, -2.83203125, -2.474609375, -2.1171875, -1.759765625, -1.40234375, -1.044921875, -0.6875, -0.330078125, 0.02734375, 0.384765625, 0.7421875, 1.099609375, 1.45703125, 1.814453125, 2.171875, 2.529296875, 2.88671875, 3.244140625, 3.6015625, 3.958984375, 4.31640625, 4.673828125, 5.03125, 5.388671875, 5.74609375, 6.103515625, 6.4609375, 6.818359375, 7.17578125, 7.533203125, 7.890625, 8.248046875, 8.60546875, 8.962890625, 9.3203125, 9.677734375, 10.03515625, 10.392578125, 10.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 10.0, 20.0, 19.0, 47.0, 52.0, 76.0, 108.0, 181.0, 307.0, 514.0, 1178.0, 2468.0, 6599.0, 20034.0, 71956.0, 339234.0, 1917139.0, 1497872.0, 254024.0, 56424.0, 16075.0, 5439.0, 2172.0, 972.0, 503.0, 299.0, 168.0, 99.0, 88.0, 63.0, 41.0, 23.0, 18.0, 11.0, 11.0, 3.0, 3.0, 0.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.453125, -13.969970703125, -13.48681640625, -13.003662109375, -12.5205078125, -12.037353515625, -11.55419921875, -11.071044921875, -10.587890625, -10.104736328125, -9.62158203125, -9.138427734375, -8.6552734375, -8.172119140625, -7.68896484375, -7.205810546875, -6.72265625, -6.239501953125, -5.75634765625, -5.273193359375, -4.7900390625, -4.306884765625, -3.82373046875, -3.340576171875, -2.857421875, -2.374267578125, -1.89111328125, -1.407958984375, -0.9248046875, -0.441650390625, 0.04150390625, 0.524658203125, 1.0078125, 1.490966796875, 1.97412109375, 2.457275390625, 2.9404296875, 3.423583984375, 3.90673828125, 4.389892578125, 4.873046875, 5.356201171875, 5.83935546875, 6.322509765625, 6.8056640625, 7.288818359375, 7.77197265625, 8.255126953125, 8.73828125, 9.221435546875, 9.70458984375, 10.187744140625, 10.6708984375, 11.154052734375, 11.63720703125, 12.120361328125, 12.603515625, 13.086669921875, 13.56982421875, 14.052978515625, 14.5361328125, 15.019287109375, 15.50244140625, 15.985595703125, 16.46875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 10.0, 36.0, 222.0, 414.0, 268.0, 56.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.86776733398438, -220.66490173339844, -214.4620361328125, -208.25917053222656, -202.05630493164062, -195.8534393310547, -189.65057373046875, -183.44769287109375, -177.24484252929688, -171.04197692871094, -164.839111328125, -158.63624572753906, -152.43338012695312, -146.2305145263672, -140.02764892578125, -133.82476806640625, -127.62190246582031, -121.41903686523438, -115.21617126464844, -109.0133056640625, -102.81044006347656, -96.60757446289062, -90.40470123291016, -84.20183563232422, -77.99897003173828, -71.79610443115234, -65.5932388305664, -59.3903694152832, -53.187503814697266, -46.98463821411133, -40.781768798828125, -34.57890319824219, -28.376052856445312, -22.173187255859375, -15.970319747924805, -9.767452239990234, -3.564586639404297, 2.6382789611816406, 8.841148376464844, 15.044013977050781, 21.24687957763672, 27.449745178222656, 33.652610778808594, 39.8554801940918, 46.058345794677734, 52.26121139526367, 58.464080810546875, 64.66694641113281, 70.86981201171875, 77.07267761230469, 83.27554321289062, 89.47840881347656, 95.6812744140625, 101.88414001464844, 108.0870132446289, 114.28987884521484, 120.49274444580078, 126.69561004638672, 132.8984832763672, 139.10134887695312, 145.30421447753906, 151.507080078125, 157.70994567871094, 163.91281127929688, 170.1156768798828]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 7.0, 4.0, 7.0, 12.0, 4.0, 11.0, 17.0, 17.0, 15.0, 22.0, 16.0, 19.0, 20.0, 38.0, 26.0, 34.0, 22.0, 37.0, 45.0, 33.0, 35.0, 32.0, 55.0, 48.0, 39.0, 35.0, 39.0, 30.0, 37.0, 27.0, 20.0, 21.0, 18.0, 14.0, 17.0, 21.0, 13.0, 14.0, 13.0, 8.0, 8.0, 11.0, 4.0, 10.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.07764434814453, -30.92927360534668, -29.780902862548828, -28.632532119750977, -27.484161376953125, -26.33578872680664, -25.18741798400879, -24.039047241210938, -22.890676498413086, -21.742305755615234, -20.593935012817383, -19.44556427001953, -18.297191619873047, -17.148822784423828, -16.000450134277344, -14.852079391479492, -13.70370864868164, -12.555337905883789, -11.406967163085938, -10.25859546661377, -9.110224723815918, -7.961853981018066, -6.813482761383057, -5.665111541748047, -4.516740798950195, -3.3683698177337646, -2.219998836517334, -1.0716278553009033, 0.07674312591552734, 1.225113868713379, 2.3734850883483887, 3.5218563079833984, 4.670230865478516, 5.818601608276367, 6.966972827911377, 8.115344047546387, 9.263714790344238, 10.41208553314209, 11.560457229614258, 12.70882797241211, 13.857198715209961, 15.005569458007812, 16.153940200805664, 17.302310943603516, 18.45068359375, 19.59905242919922, 20.747425079345703, 21.895795822143555, 23.044166564941406, 24.192537307739258, 25.34090805053711, 26.48927879333496, 27.637649536132812, 28.786022186279297, 29.93439292907715, 31.082763671875, 32.23113250732422, 33.3795051574707, 34.52787399291992, 35.676246643066406, 36.824615478515625, 37.97298812866211, 39.12135696411133, 40.26972961425781, 41.4181022644043]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 3.0, 8.0, 8.0, 9.0, 12.0, 7.0, 14.0, 19.0, 21.0, 16.0, 11.0, 20.0, 32.0, 17.0, 46.0, 27.0, 39.0, 21.0, 32.0, 37.0, 47.0, 35.0, 51.0, 42.0, 38.0, 43.0, 34.0, 33.0, 41.0, 26.0, 21.0, 26.0, 25.0, 20.0, 17.0, 16.0, 13.0, 8.0, 13.0, 8.0, 11.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.58984375, -6.3702392578125, -6.150634765625, -5.9310302734375, -5.71142578125, -5.4918212890625, -5.272216796875, -5.0526123046875, -4.8330078125, -4.6134033203125, -4.393798828125, -4.1741943359375, -3.95458984375, -3.7349853515625, -3.515380859375, -3.2957763671875, -3.076171875, -2.8565673828125, -2.636962890625, -2.4173583984375, -2.19775390625, -1.9781494140625, -1.758544921875, -1.5389404296875, -1.3193359375, -1.0997314453125, -0.880126953125, -0.6605224609375, -0.44091796875, -0.2213134765625, -0.001708984375, 0.2178955078125, 0.4375, 0.6571044921875, 0.876708984375, 1.0963134765625, 1.31591796875, 1.5355224609375, 1.755126953125, 1.9747314453125, 2.1943359375, 2.4139404296875, 2.633544921875, 2.8531494140625, 3.07275390625, 3.2923583984375, 3.511962890625, 3.7315673828125, 3.951171875, 4.1707763671875, 4.390380859375, 4.6099853515625, 4.82958984375, 5.0491943359375, 5.268798828125, 5.4884033203125, 5.7080078125, 5.9276123046875, 6.147216796875, 6.3668212890625, 6.58642578125, 6.8060302734375, 7.025634765625, 7.2452392578125, 7.46484375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 7.0, 11.0, 15.0, 31.0, 35.0, 55.0, 107.0, 166.0, 250.0, 392.0, 562.0, 1043.0, 1686.0, 2584.0, 4224.0, 6785.0, 10826.0, 17050.0, 26764.0, 42380.0, 66633.0, 100843.0, 141448.0, 168233.0, 149232.0, 108687.0, 72361.0, 46605.0, 29703.0, 18639.0, 11692.0, 7403.0, 4580.0, 2839.0, 1757.0, 1078.0, 714.0, 438.0, 277.0, 150.0, 81.0, 50.0, 43.0, 31.0, 15.0, 20.0, 13.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9716796875, -0.9418716430664062, -0.9120635986328125, -0.8822555541992188, -0.852447509765625, -0.8226394653320312, -0.7928314208984375, -0.7630233764648438, -0.73321533203125, -0.7034072875976562, -0.6735992431640625, -0.6437911987304688, -0.613983154296875, -0.5841751098632812, -0.5543670654296875, -0.5245590209960938, -0.4947509765625, -0.46494293212890625, -0.4351348876953125, -0.40532684326171875, -0.375518798828125, -0.34571075439453125, -0.3159027099609375, -0.28609466552734375, -0.25628662109375, -0.22647857666015625, -0.1966705322265625, -0.16686248779296875, -0.137054443359375, -0.10724639892578125, -0.0774383544921875, -0.04763031005859375, -0.017822265625, 0.01198577880859375, 0.0417938232421875, 0.07160186767578125, 0.101409912109375, 0.13121795654296875, 0.1610260009765625, 0.19083404541015625, 0.22064208984375, 0.25045013427734375, 0.2802581787109375, 0.31006622314453125, 0.339874267578125, 0.36968231201171875, 0.3994903564453125, 0.42929840087890625, 0.4591064453125, 0.48891448974609375, 0.5187225341796875, 0.5485305786132812, 0.578338623046875, 0.6081466674804688, 0.6379547119140625, 0.6677627563476562, 0.69757080078125, 0.7273788452148438, 0.7571868896484375, 0.7869949340820312, 0.816802978515625, 0.8466110229492188, 0.8764190673828125, 0.9062271118164062, 0.93603515625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 11.0, 10.0, 13.0, 11.0, 18.0, 16.0, 24.0, 28.0, 31.0, 19.0, 34.0, 38.0, 28.0, 36.0, 29.0, 36.0, 48.0, 1065.0, 34.0, 49.0, 40.0, 39.0, 29.0, 38.0, 28.0, 27.0, 31.0, 32.0, 12.0, 21.0, 18.0, 12.0, 16.0, 19.0, 10.0, 12.0, 5.0, 11.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0546875, -4.9056396484375, -4.756591796875, -4.6075439453125, -4.45849609375, -4.3094482421875, -4.160400390625, -4.0113525390625, -3.8623046875, -3.7132568359375, -3.564208984375, -3.4151611328125, -3.26611328125, -3.1170654296875, -2.968017578125, -2.8189697265625, -2.669921875, -2.5208740234375, -2.371826171875, -2.2227783203125, -2.07373046875, -1.9246826171875, -1.775634765625, -1.6265869140625, -1.4775390625, -1.3284912109375, -1.179443359375, -1.0303955078125, -0.88134765625, -0.7322998046875, -0.583251953125, -0.4342041015625, -0.28515625, -0.1361083984375, 0.012939453125, 0.1619873046875, 0.31103515625, 0.4600830078125, 0.609130859375, 0.7581787109375, 0.9072265625, 1.0562744140625, 1.205322265625, 1.3543701171875, 1.50341796875, 1.6524658203125, 1.801513671875, 1.9505615234375, 2.099609375, 2.2486572265625, 2.397705078125, 2.5467529296875, 2.69580078125, 2.8448486328125, 2.993896484375, 3.1429443359375, 3.2919921875, 3.4410400390625, 3.590087890625, 3.7391357421875, 3.88818359375, 4.0372314453125, 4.186279296875, 4.3353271484375, 4.484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 13.0, 29.0, 25.0, 62.0, 100.0, 134.0, 206.0, 390.0, 593.0, 909.0, 1470.0, 2217.0, 3710.0, 6072.0, 9382.0, 15040.0, 23703.0, 36821.0, 56293.0, 83106.0, 113300.0, 146818.0, 1186704.0, 125551.0, 95243.0, 66662.0, 44779.0, 28759.0, 18280.0, 11381.0, 7239.0, 4466.0, 2836.0, 1762.0, 1137.0, 678.0, 413.0, 309.0, 164.0, 135.0, 82.0, 37.0, 37.0, 23.0, 17.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 1.0], "bins": [-0.63330078125, -0.6147918701171875, -0.596282958984375, -0.5777740478515625, -0.55926513671875, -0.5407562255859375, -0.522247314453125, -0.5037384033203125, -0.4852294921875, -0.4667205810546875, -0.448211669921875, -0.4297027587890625, -0.41119384765625, -0.3926849365234375, -0.374176025390625, -0.3556671142578125, -0.337158203125, -0.3186492919921875, -0.300140380859375, -0.2816314697265625, -0.26312255859375, -0.2446136474609375, -0.226104736328125, -0.2075958251953125, -0.1890869140625, -0.1705780029296875, -0.152069091796875, -0.1335601806640625, -0.11505126953125, -0.0965423583984375, -0.078033447265625, -0.0595245361328125, -0.041015625, -0.0225067138671875, -0.003997802734375, 0.0145111083984375, 0.03302001953125, 0.0515289306640625, 0.070037841796875, 0.0885467529296875, 0.1070556640625, 0.1255645751953125, 0.144073486328125, 0.1625823974609375, 0.18109130859375, 0.1996002197265625, 0.218109130859375, 0.2366180419921875, 0.255126953125, 0.2736358642578125, 0.292144775390625, 0.3106536865234375, 0.32916259765625, 0.3476715087890625, 0.366180419921875, 0.3846893310546875, 0.4031982421875, 0.4217071533203125, 0.440216064453125, 0.4587249755859375, 0.47723388671875, 0.4957427978515625, 0.514251708984375, 0.5327606201171875, 0.55126953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 4.0, 5.0, 9.0, 12.0, 12.0, 17.0, 32.0, 18.0, 22.0, 34.0, 52.0, 65.0, 122.0, 132.0, 119.0, 79.0, 52.0, 39.0, 30.0, 25.0, 35.0, 18.0, 10.0, 7.0, 11.0, 6.0, 6.0, 2.0, 0.0, 6.0, 1.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015716552734375, -0.015249848365783691, -0.014783143997192383, -0.014316439628601074, -0.013849735260009766, -0.013383030891418457, -0.012916326522827148, -0.01244962215423584, -0.011982917785644531, -0.011516213417053223, -0.011049509048461914, -0.010582804679870605, -0.010116100311279297, -0.009649395942687988, -0.00918269157409668, -0.008715987205505371, -0.008249282836914062, -0.007782578468322754, -0.007315874099731445, -0.006849169731140137, -0.006382465362548828, -0.0059157609939575195, -0.005449056625366211, -0.004982352256774902, -0.004515647888183594, -0.004048943519592285, -0.0035822391510009766, -0.003115534782409668, -0.0026488304138183594, -0.0021821260452270508, -0.0017154216766357422, -0.0012487173080444336, -0.000782012939453125, -0.0003153085708618164, 0.0001513957977294922, 0.0006181001663208008, 0.0010848045349121094, 0.001551508903503418, 0.0020182132720947266, 0.002484917640686035, 0.0029516220092773438, 0.0034183263778686523, 0.003885030746459961, 0.0043517351150512695, 0.004818439483642578, 0.005285143852233887, 0.005751848220825195, 0.006218552589416504, 0.0066852569580078125, 0.007151961326599121, 0.00761866569519043, 0.008085370063781738, 0.008552074432373047, 0.009018778800964355, 0.009485483169555664, 0.009952187538146973, 0.010418891906738281, 0.01088559627532959, 0.011352300643920898, 0.011819005012512207, 0.012285709381103516, 0.012752413749694824, 0.013219118118286133, 0.013685822486877441, 0.01415252685546875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 16.0, 12.0, 16.0, 17.0, 37.0, 52.0, 63.0, 100.0, 156.0, 271.0, 699.0, 15788.0, 1023506.0, 6503.0, 583.0, 239.0, 129.0, 92.0, 53.0, 47.0, 38.0, 27.0, 21.0, 16.0, 5.0, 6.0, 5.0, 5.0, 4.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.26775360107421875, -0.2586517333984375, -0.24954986572265625, -0.240447998046875, -0.23134613037109375, -0.2222442626953125, -0.21314239501953125, -0.20404052734375, -0.19493865966796875, -0.1858367919921875, -0.17673492431640625, -0.167633056640625, -0.15853118896484375, -0.1494293212890625, -0.14032745361328125, -0.1312255859375, -0.12212371826171875, -0.1130218505859375, -0.10391998291015625, -0.094818115234375, -0.08571624755859375, -0.0766143798828125, -0.06751251220703125, -0.05841064453125, -0.04930877685546875, -0.0402069091796875, -0.03110504150390625, -0.022003173828125, -0.01290130615234375, -0.0037994384765625, 0.00530242919921875, 0.014404296875, 0.02350616455078125, 0.0326080322265625, 0.04170989990234375, 0.050811767578125, 0.05991363525390625, 0.0690155029296875, 0.07811737060546875, 0.08721923828125, 0.09632110595703125, 0.1054229736328125, 0.11452484130859375, 0.123626708984375, 0.13272857666015625, 0.1418304443359375, 0.15093231201171875, 0.1600341796875, 0.16913604736328125, 0.1782379150390625, 0.18733978271484375, 0.196441650390625, 0.20554351806640625, 0.2146453857421875, 0.22374725341796875, 0.23284912109375, 0.24195098876953125, 0.2510528564453125, 0.26015472412109375, 0.269256591796875, 0.27835845947265625, 0.2874603271484375, 0.29656219482421875, 0.3056640625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 42.0, 971.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05599676072597504, -0.04718736559152603, -0.038377970457077026, -0.029568571597337723, -0.020759176462888718, -0.011949781328439713, -0.003140382468700409, 0.005669012665748596, 0.014478407800197601, 0.023287802934646606, 0.03209719806909561, 0.040906596928834915, 0.04971599206328392, 0.058525387197732925, 0.06733478605747223, 0.07614418119192123, 0.08495357632637024, 0.09376297146081924, 0.10257236659526825, 0.11138176918029785, 0.12019115686416626, 0.12900055944919586, 0.13780996203422546, 0.14661934971809387, 0.15542873740196228, 0.16423813998699188, 0.1730475276708603, 0.1818569302558899, 0.1906663179397583, 0.1994757205247879, 0.2082851231098175, 0.2170945107936859, 0.22590389847755432, 0.23471330106258392, 0.24352268874645233, 0.25233209133148193, 0.26114147901535034, 0.26995086669921875, 0.27876028418540955, 0.28756967186927795, 0.29637905955314636, 0.30518844723701477, 0.31399786472320557, 0.322807252407074, 0.3316166400909424, 0.3404260277748108, 0.3492354452610016, 0.35804483294487, 0.3668542504310608, 0.3756636381149292, 0.38447305560112, 0.3932824432849884, 0.4020918309688568, 0.4109012186527252, 0.419710636138916, 0.4285200238227844, 0.43732941150665283, 0.44613879919052124, 0.45494821667671204, 0.46375760436058044, 0.47256699204444885, 0.48137637972831726, 0.49018579721450806, 0.49899518489837646, 0.5078045725822449]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 6.0, 22.0, 13.0, 30.0, 27.0, 30.0, 48.0, 49.0, 55.0, 59.0, 75.0, 66.0, 81.0, 56.0, 60.0, 41.0, 42.0, 46.0, 33.0, 40.0, 32.0, 18.0, 18.0, 15.0, 12.0, 6.0, 9.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.024235308170318604, -0.023661397397518158, -0.023087484762072563, -0.02251357212662697, -0.021939661353826523, -0.021365750581026077, -0.020791837945580482, -0.020217925310134888, -0.019644014537334442, -0.019070103764533997, -0.018496191129088402, -0.017922278493642807, -0.01734836772084236, -0.016774456948041916, -0.01620054431259632, -0.015626631677150726, -0.01505272090435028, -0.01447880920022726, -0.01390489749610424, -0.01333098579198122, -0.0127570740878582, -0.01218316238373518, -0.01160925067961216, -0.01103533897548914, -0.01046142727136612, -0.0098875155672431, -0.009313603863120079, -0.008739692158997059, -0.008165780454874039, -0.0075918687507510185, -0.007017957046627998, -0.006444045342504978, -0.005870133638381958, -0.005296221934258938, -0.004722310230135918, -0.0041483985260128975, -0.0035744868218898773, -0.003000575117766857, -0.002426663413643837, -0.0018527517095208168, -0.0012788400053977966, -0.0007049283012747765, -0.0001310165971517563, 0.0004428951069712639, 0.001016806811094284, 0.0015907185152173042, 0.0021646302193403244, 0.0027385419234633446, 0.0033124536275863647, 0.003886365331709385, 0.004460277035832405, 0.005034188739955425, 0.0056081004440784454, 0.006182012148201466, 0.006755923852324486, 0.007329835556447506, 0.007903747260570526, 0.008477658964693546, 0.009051570668816566, 0.009625482372939587, 0.010199394077062607, 0.010773305781185627, 0.011347217485308647, 0.011921129189431667, 0.012495040893554688]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 4.0, 7.0, 8.0, 9.0, 12.0, 7.0, 14.0, 19.0, 21.0, 16.0, 11.0, 20.0, 32.0, 17.0, 46.0, 29.0, 38.0, 20.0, 32.0, 37.0, 47.0, 35.0, 51.0, 43.0, 39.0, 42.0, 33.0, 35.0, 42.0, 23.0, 21.0, 26.0, 25.0, 21.0, 16.0, 16.0, 13.0, 8.0, 13.0, 8.0, 11.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-6.58984375, -6.37017822265625, -6.1505126953125, -5.93084716796875, -5.711181640625, -5.49151611328125, -5.2718505859375, -5.05218505859375, -4.83251953125, -4.61285400390625, -4.3931884765625, -4.17352294921875, -3.953857421875, -3.73419189453125, -3.5145263671875, -3.29486083984375, -3.0751953125, -2.85552978515625, -2.6358642578125, -2.41619873046875, -2.196533203125, -1.97686767578125, -1.7572021484375, -1.53753662109375, -1.31787109375, -1.09820556640625, -0.8785400390625, -0.65887451171875, -0.439208984375, -0.21954345703125, 0.0001220703125, 0.21978759765625, 0.439453125, 0.65911865234375, 0.8787841796875, 1.09844970703125, 1.318115234375, 1.53778076171875, 1.7574462890625, 1.97711181640625, 2.19677734375, 2.41644287109375, 2.6361083984375, 2.85577392578125, 3.075439453125, 3.29510498046875, 3.5147705078125, 3.73443603515625, 3.9541015625, 4.17376708984375, 4.3934326171875, 4.61309814453125, 4.832763671875, 5.05242919921875, 5.2720947265625, 5.49176025390625, 5.71142578125, 5.93109130859375, 6.1507568359375, 6.37042236328125, 6.590087890625, 6.80975341796875, 7.0294189453125, 7.24908447265625, 7.46875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 9.0, 8.0, 18.0, 22.0, 17.0, 28.0, 34.0, 48.0, 51.0, 79.0, 90.0, 125.0, 191.0, 246.0, 409.0, 627.0, 1041.0, 2108.0, 4154.0, 9013.0, 19941.0, 46068.0, 111410.0, 289978.0, 331480.0, 132555.0, 54260.0, 23392.0, 10522.0, 4871.0, 2368.0, 1239.0, 699.0, 435.0, 261.0, 184.0, 127.0, 106.0, 74.0, 63.0, 34.0, 38.0, 27.0, 23.0, 19.0, 11.0, 15.0, 9.0, 8.0, 5.0, 7.0, 0.0, 3.0, 2.0, 1.0], "bins": [-10.5078125, -10.1903076171875, -9.872802734375, -9.5552978515625, -9.23779296875, -8.9202880859375, -8.602783203125, -8.2852783203125, -7.9677734375, -7.6502685546875, -7.332763671875, -7.0152587890625, -6.69775390625, -6.3802490234375, -6.062744140625, -5.7452392578125, -5.427734375, -5.1102294921875, -4.792724609375, -4.4752197265625, -4.15771484375, -3.8402099609375, -3.522705078125, -3.2052001953125, -2.8876953125, -2.5701904296875, -2.252685546875, -1.9351806640625, -1.61767578125, -1.3001708984375, -0.982666015625, -0.6651611328125, -0.34765625, -0.0301513671875, 0.287353515625, 0.6048583984375, 0.92236328125, 1.2398681640625, 1.557373046875, 1.8748779296875, 2.1923828125, 2.5098876953125, 2.827392578125, 3.1448974609375, 3.46240234375, 3.7799072265625, 4.097412109375, 4.4149169921875, 4.732421875, 5.0499267578125, 5.367431640625, 5.6849365234375, 6.00244140625, 6.3199462890625, 6.637451171875, 6.9549560546875, 7.2724609375, 7.5899658203125, 7.907470703125, 8.2249755859375, 8.54248046875, 8.8599853515625, 9.177490234375, 9.4949951171875, 9.8125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 0.0, 3.0, 2.0, 11.0, 14.0, 7.0, 11.0, 17.0, 13.0, 16.0, 27.0, 26.0, 20.0, 31.0, 27.0, 39.0, 29.0, 51.0, 58.0, 68.0, 114.0, 201.0, 1279.0, 220.0, 146.0, 117.0, 81.0, 59.0, 51.0, 46.0, 32.0, 29.0, 25.0, 21.0, 25.0, 18.0, 15.0, 14.0, 9.0, 14.0, 17.0, 8.0, 11.0, 5.0, 3.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.546875, -15.02734375, -14.5078125, -13.98828125, -13.46875, -12.94921875, -12.4296875, -11.91015625, -11.390625, -10.87109375, -10.3515625, -9.83203125, -9.3125, -8.79296875, -8.2734375, -7.75390625, -7.234375, -6.71484375, -6.1953125, -5.67578125, -5.15625, -4.63671875, -4.1171875, -3.59765625, -3.078125, -2.55859375, -2.0390625, -1.51953125, -1.0, -0.48046875, 0.0390625, 0.55859375, 1.078125, 1.59765625, 2.1171875, 2.63671875, 3.15625, 3.67578125, 4.1953125, 4.71484375, 5.234375, 5.75390625, 6.2734375, 6.79296875, 7.3125, 7.83203125, 8.3515625, 8.87109375, 9.390625, 9.91015625, 10.4296875, 10.94921875, 11.46875, 11.98828125, 12.5078125, 13.02734375, 13.546875, 14.06640625, 14.5859375, 15.10546875, 15.625, 16.14453125, 16.6640625, 17.18359375, 17.703125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 7.0, 15.0, 18.0, 26.0, 34.0, 63.0, 57.0, 96.0, 143.0, 210.0, 363.0, 649.0, 2226.0, 24402.0, 2365728.0, 736158.0, 12333.0, 1595.0, 595.0, 336.0, 217.0, 119.0, 111.0, 47.0, 40.0, 25.0, 19.0, 13.0, 10.0, 5.0, 5.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.65625, -37.21875, -35.78125, -34.34375, -32.90625, -31.46875, -30.03125, -28.59375, -27.15625, -25.71875, -24.28125, -22.84375, -21.40625, -19.96875, -18.53125, -17.09375, -15.65625, -14.21875, -12.78125, -11.34375, -9.90625, -8.46875, -7.03125, -5.59375, -4.15625, -2.71875, -1.28125, 0.15625, 1.59375, 3.03125, 4.46875, 5.90625, 7.34375, 8.78125, 10.21875, 11.65625, 13.09375, 14.53125, 15.96875, 17.40625, 18.84375, 20.28125, 21.71875, 23.15625, 24.59375, 26.03125, 27.46875, 28.90625, 30.34375, 31.78125, 33.21875, 34.65625, 36.09375, 37.53125, 38.96875, 40.40625, 41.84375, 43.28125, 44.71875, 46.15625, 47.59375, 49.03125, 50.46875, 51.90625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 549.0, 459.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.22972106933594, -176.56564331054688, -163.90158081054688, -151.2375030517578, -138.57342529296875, -125.90934753417969, -113.24527740478516, -100.58120727539062, -87.91712951660156, -75.2530517578125, -62.58898162841797, -49.92490768432617, -37.260833740234375, -24.596759796142578, -11.932685852050781, 0.73138427734375, 13.395462036132812, 26.05953598022461, 38.723609924316406, 51.3876838684082, 64.0517578125, 76.71583557128906, 89.3799057006836, 102.04397583007812, 114.70805358886719, 127.37213134765625, 140.03619384765625, 152.7002716064453, 165.36434936523438, 178.02842712402344, 190.6925048828125, 203.3565673828125, 216.0206298828125, 228.68470764160156, 241.34878540039062, 254.01284790039062, 266.67694091796875, 279.34100341796875, 292.00506591796875, 304.66912841796875, 317.3332214355469, 329.9972839355469, 342.661376953125, 355.325439453125, 367.989501953125, 380.6535949707031, 393.3176574707031, 405.98175048828125, 418.64581298828125, 431.30987548828125, 443.9739685058594, 456.6380310058594, 469.3021240234375, 481.9661865234375, 494.6302490234375, 507.2943115234375, 519.9583740234375, 532.6224365234375, 545.2864990234375, 557.9506225585938, 570.6146850585938, 583.2787475585938, 595.9428100585938, 608.6068725585938, 621.27099609375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 8.0, 9.0, 7.0, 7.0, 7.0, 14.0, 19.0, 21.0, 38.0, 24.0, 33.0, 34.0, 39.0, 25.0, 41.0, 34.0, 42.0, 39.0, 40.0, 41.0, 59.0, 54.0, 43.0, 37.0, 38.0, 38.0, 26.0, 18.0, 17.0, 17.0, 34.0, 22.0, 19.0, 6.0, 11.0, 9.0, 9.0, 7.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.2830924987793, -49.833824157714844, -48.38455581665039, -46.93528366088867, -45.48601531982422, -44.036746978759766, -42.58747863769531, -41.138206481933594, -39.68893814086914, -38.23966979980469, -36.790401458740234, -35.341129302978516, -33.89186096191406, -32.44259262084961, -30.993324279785156, -29.54405403137207, -28.094785690307617, -26.645517349243164, -25.196247100830078, -23.746978759765625, -22.29770851135254, -20.848440170288086, -19.399169921875, -17.949901580810547, -16.500633239746094, -15.051363945007324, -13.602094650268555, -12.152826309204102, -10.703556060791016, -9.254287719726562, -7.805018424987793, -6.355749130249023, -4.9064788818359375, -3.457209587097168, -2.0079405307769775, -0.5586714744567871, 0.8905978202819824, 2.339867115020752, 3.7891359329223633, 5.238405227661133, 6.687674522399902, 8.136943817138672, 9.586213111877441, 11.035482406616211, 12.484750747680664, 13.93402099609375, 15.383289337158203, 16.832557678222656, 18.281827926635742, 19.731096267700195, 21.18036651611328, 22.629634857177734, 24.07890510559082, 25.528173446655273, 26.97744369506836, 28.426712036132812, 29.875980377197266, 31.32524871826172, 32.77451705932617, 34.22378921508789, 35.673057556152344, 37.1223258972168, 38.57159423828125, 40.02086639404297, 41.47013473510742]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 10.0, 13.0, 3.0, 13.0, 18.0, 16.0, 15.0, 29.0, 30.0, 34.0, 28.0, 28.0, 27.0, 31.0, 44.0, 35.0, 26.0, 48.0, 46.0, 43.0, 48.0, 30.0, 45.0, 32.0, 40.0, 30.0, 31.0, 17.0, 24.0, 19.0, 18.0, 22.0, 11.0, 12.0, 14.0, 10.0, 12.0, 4.0, 8.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.65625, -7.42279052734375, -7.1893310546875, -6.95587158203125, -6.722412109375, -6.48895263671875, -6.2554931640625, -6.02203369140625, -5.78857421875, -5.55511474609375, -5.3216552734375, -5.08819580078125, -4.854736328125, -4.62127685546875, -4.3878173828125, -4.15435791015625, -3.9208984375, -3.68743896484375, -3.4539794921875, -3.22052001953125, -2.987060546875, -2.75360107421875, -2.5201416015625, -2.28668212890625, -2.05322265625, -1.81976318359375, -1.5863037109375, -1.35284423828125, -1.119384765625, -0.88592529296875, -0.6524658203125, -0.41900634765625, -0.185546875, 0.04791259765625, 0.2813720703125, 0.51483154296875, 0.748291015625, 0.98175048828125, 1.2152099609375, 1.44866943359375, 1.68212890625, 1.91558837890625, 2.1490478515625, 2.38250732421875, 2.615966796875, 2.84942626953125, 3.0828857421875, 3.31634521484375, 3.5498046875, 3.78326416015625, 4.0167236328125, 4.25018310546875, 4.483642578125, 4.71710205078125, 4.9505615234375, 5.18402099609375, 5.41748046875, 5.65093994140625, 5.8843994140625, 6.11785888671875, 6.351318359375, 6.58477783203125, 6.8182373046875, 7.05169677734375, 7.28515625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 7.0, 15.0, 16.0, 19.0, 18.0, 28.0, 29.0, 43.0, 57.0, 77.0, 97.0, 142.0, 200.0, 227.0, 372.0, 887.0, 40020.0, 4097938.0, 51608.0, 1021.0, 400.0, 260.0, 206.0, 142.0, 98.0, 76.0, 53.0, 43.0, 37.0, 20.0, 20.0, 22.0, 12.0, 11.0, 11.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-67.625, -65.4794921875, -63.333984375, -61.1884765625, -59.04296875, -56.8974609375, -54.751953125, -52.6064453125, -50.4609375, -48.3154296875, -46.169921875, -44.0244140625, -41.87890625, -39.7333984375, -37.587890625, -35.4423828125, -33.296875, -31.1513671875, -29.005859375, -26.8603515625, -24.71484375, -22.5693359375, -20.423828125, -18.2783203125, -16.1328125, -13.9873046875, -11.841796875, -9.6962890625, -7.55078125, -5.4052734375, -3.259765625, -1.1142578125, 1.03125, 3.1767578125, 5.322265625, 7.4677734375, 9.61328125, 11.7587890625, 13.904296875, 16.0498046875, 18.1953125, 20.3408203125, 22.486328125, 24.6318359375, 26.77734375, 28.9228515625, 31.068359375, 33.2138671875, 35.359375, 37.5048828125, 39.650390625, 41.7958984375, 43.94140625, 46.0869140625, 48.232421875, 50.3779296875, 52.5234375, 54.6689453125, 56.814453125, 58.9599609375, 61.10546875, 63.2509765625, 65.396484375, 67.5419921875, 69.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 8.0, 5.0, 22.0, 20.0, 40.0, 38.0, 60.0, 100.0, 134.0, 167.0, 245.0, 379.0, 525.0, 627.0, 530.0, 356.0, 275.0, 157.0, 107.0, 62.0, 62.0, 32.0, 29.0, 23.0, 19.0, 12.0, 5.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.75, -16.3031005859375, -15.856201171875, -15.4093017578125, -14.96240234375, -14.5155029296875, -14.068603515625, -13.6217041015625, -13.1748046875, -12.7279052734375, -12.281005859375, -11.8341064453125, -11.38720703125, -10.9403076171875, -10.493408203125, -10.0465087890625, -9.599609375, -9.1527099609375, -8.705810546875, -8.2589111328125, -7.81201171875, -7.3651123046875, -6.918212890625, -6.4713134765625, -6.0244140625, -5.5775146484375, -5.130615234375, -4.6837158203125, -4.23681640625, -3.7899169921875, -3.343017578125, -2.8961181640625, -2.44921875, -2.0023193359375, -1.555419921875, -1.1085205078125, -0.66162109375, -0.2147216796875, 0.232177734375, 0.6790771484375, 1.1259765625, 1.5728759765625, 2.019775390625, 2.4666748046875, 2.91357421875, 3.3604736328125, 3.807373046875, 4.2542724609375, 4.701171875, 5.1480712890625, 5.594970703125, 6.0418701171875, 6.48876953125, 6.9356689453125, 7.382568359375, 7.8294677734375, 8.2763671875, 8.7232666015625, 9.170166015625, 9.6170654296875, 10.06396484375, 10.5108642578125, 10.957763671875, 11.4046630859375, 11.8515625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 3.0, 5.0, 9.0, 6.0, 8.0, 14.0, 17.0, 17.0, 34.0, 37.0, 57.0, 86.0, 130.0, 251.0, 656.0, 2465.0, 17050.0, 259236.0, 3572259.0, 317994.0, 19821.0, 2651.0, 720.0, 252.0, 143.0, 101.0, 52.0, 40.0, 40.0, 30.0, 21.0, 15.0, 13.0, 12.0, 6.0, 6.0, 5.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-40.8125, -39.72509765625, -38.6376953125, -37.55029296875, -36.462890625, -35.37548828125, -34.2880859375, -33.20068359375, -32.11328125, -31.02587890625, -29.9384765625, -28.85107421875, -27.763671875, -26.67626953125, -25.5888671875, -24.50146484375, -23.4140625, -22.32666015625, -21.2392578125, -20.15185546875, -19.064453125, -17.97705078125, -16.8896484375, -15.80224609375, -14.71484375, -13.62744140625, -12.5400390625, -11.45263671875, -10.365234375, -9.27783203125, -8.1904296875, -7.10302734375, -6.015625, -4.92822265625, -3.8408203125, -2.75341796875, -1.666015625, -0.57861328125, 0.5087890625, 1.59619140625, 2.68359375, 3.77099609375, 4.8583984375, 5.94580078125, 7.033203125, 8.12060546875, 9.2080078125, 10.29541015625, 11.3828125, 12.47021484375, 13.5576171875, 14.64501953125, 15.732421875, 16.81982421875, 17.9072265625, 18.99462890625, 20.08203125, 21.16943359375, 22.2568359375, 23.34423828125, 24.431640625, 25.51904296875, 26.6064453125, 27.69384765625, 28.78125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 246.0, 630.0, 120.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.51507568359375, -143.5267333984375, -133.53839111328125, -123.55004119873047, -113.56169891357422, -103.57335662841797, -93.58500671386719, -83.59666442871094, -73.60832214355469, -63.61997985839844, -53.63163375854492, -43.643287658691406, -33.654945373535156, -23.666603088378906, -13.67825698852539, -3.689910888671875, 6.298431396484375, 16.286775588989258, 26.27511978149414, 36.263465881347656, 46.251808166503906, 56.240150451660156, 66.22850036621094, 76.21684265136719, 86.20518493652344, 96.19352722167969, 106.18186950683594, 116.17021942138672, 126.15856170654297, 136.14691162109375, 146.13525390625, 156.12359619140625, 166.11190795898438, 176.10025024414062, 186.08859252929688, 196.07693481445312, 206.06527709960938, 216.05361938476562, 226.04197692871094, 236.0303192138672, 246.01866149902344, 256.00701904296875, 265.995361328125, 275.98370361328125, 285.9720458984375, 295.96038818359375, 305.94873046875, 315.93707275390625, 325.9254150390625, 335.91375732421875, 345.902099609375, 355.89044189453125, 365.8787841796875, 375.86712646484375, 385.85546875, 395.84381103515625, 405.8321533203125, 415.82049560546875, 425.808837890625, 435.79718017578125, 445.7855224609375, 455.77386474609375, 465.76220703125, 475.75054931640625, 485.7389221191406]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 15.0, 11.0, 19.0, 14.0, 23.0, 31.0, 25.0, 37.0, 33.0, 26.0, 33.0, 22.0, 43.0, 32.0, 34.0, 56.0, 48.0, 35.0, 34.0, 43.0, 32.0, 33.0, 40.0, 34.0, 30.0, 27.0, 24.0, 18.0, 22.0, 19.0, 13.0, 11.0, 8.0, 7.0, 9.0, 4.0, 12.0, 7.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.44572067260742, -35.20658493041992, -33.967445373535156, -32.728309631347656, -31.48917007446289, -30.25003433227539, -29.010896682739258, -27.771759033203125, -26.532621383666992, -25.29348373413086, -24.054346084594727, -22.815208435058594, -21.576072692871094, -20.336933135986328, -19.097797393798828, -17.858659744262695, -16.619522094726562, -15.38038444519043, -14.141246795654297, -12.90211009979248, -11.662972450256348, -10.423834800720215, -9.184698104858398, -7.945560455322266, -6.706422805786133, -5.46728515625, -4.228147983551025, -2.9890105724334717, -1.749873161315918, -0.5107355117797852, 0.7284016609191895, 1.967538833618164, 3.2066802978515625, 4.445817947387695, 5.68495512008667, 6.9240922927856445, 8.163229942321777, 9.40236759185791, 10.641504287719727, 11.88064193725586, 13.119779586791992, 14.358917236328125, 15.598054885864258, 16.83719253540039, 18.07632827758789, 19.315467834472656, 20.554603576660156, 21.79374122619629, 23.032878875732422, 24.272016525268555, 25.511154174804688, 26.75029182434082, 27.989429473876953, 29.228565216064453, 30.467702865600586, 31.70684051513672, 32.94597625732422, 34.18511199951172, 35.424251556396484, 36.663387298583984, 37.90252685546875, 39.14166259765625, 40.380802154541016, 41.619937896728516, 42.85907745361328]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 8.0, 10.0, 10.0, 16.0, 11.0, 11.0, 22.0, 20.0, 17.0, 15.0, 16.0, 24.0, 30.0, 29.0, 33.0, 31.0, 37.0, 40.0, 38.0, 39.0, 28.0, 46.0, 46.0, 30.0, 35.0, 34.0, 31.0, 25.0, 34.0, 11.0, 22.0, 25.0, 19.0, 17.0, 15.0, 21.0, 10.0, 6.0, 14.0, 8.0, 10.0, 7.0, 6.0, 10.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.6484375, -6.4384765625, -6.228515625, -6.0185546875, -5.80859375, -5.5986328125, -5.388671875, -5.1787109375, -4.96875, -4.7587890625, -4.548828125, -4.3388671875, -4.12890625, -3.9189453125, -3.708984375, -3.4990234375, -3.2890625, -3.0791015625, -2.869140625, -2.6591796875, -2.44921875, -2.2392578125, -2.029296875, -1.8193359375, -1.609375, -1.3994140625, -1.189453125, -0.9794921875, -0.76953125, -0.5595703125, -0.349609375, -0.1396484375, 0.0703125, 0.2802734375, 0.490234375, 0.7001953125, 0.91015625, 1.1201171875, 1.330078125, 1.5400390625, 1.75, 1.9599609375, 2.169921875, 2.3798828125, 2.58984375, 2.7998046875, 3.009765625, 3.2197265625, 3.4296875, 3.6396484375, 3.849609375, 4.0595703125, 4.26953125, 4.4794921875, 4.689453125, 4.8994140625, 5.109375, 5.3193359375, 5.529296875, 5.7392578125, 5.94921875, 6.1591796875, 6.369140625, 6.5791015625, 6.7890625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 21.0, 41.0, 51.0, 79.0, 109.0, 200.0, 303.0, 390.0, 612.0, 834.0, 1342.0, 1867.0, 2852.0, 4086.0, 6084.0, 9082.0, 13143.0, 19290.0, 28728.0, 41712.0, 59500.0, 81957.0, 107321.0, 127261.0, 130379.0, 113479.0, 88718.0, 64492.0, 45983.0, 31610.0, 21315.0, 14619.0, 9954.0, 6811.0, 4628.0, 3208.0, 2111.0, 1357.0, 983.0, 628.0, 473.0, 326.0, 199.0, 147.0, 89.0, 64.0, 39.0, 22.0, 11.0, 13.0, 6.0, 4.0, 3.0, 6.0, 1.0], "bins": [-0.830078125, -0.805023193359375, -0.77996826171875, -0.754913330078125, -0.7298583984375, -0.704803466796875, -0.67974853515625, -0.654693603515625, -0.629638671875, -0.604583740234375, -0.57952880859375, -0.554473876953125, -0.5294189453125, -0.504364013671875, -0.47930908203125, -0.454254150390625, -0.42919921875, -0.404144287109375, -0.37908935546875, -0.354034423828125, -0.3289794921875, -0.303924560546875, -0.27886962890625, -0.253814697265625, -0.228759765625, -0.203704833984375, -0.17864990234375, -0.153594970703125, -0.1285400390625, -0.103485107421875, -0.07843017578125, -0.053375244140625, -0.0283203125, -0.003265380859375, 0.02178955078125, 0.046844482421875, 0.0718994140625, 0.096954345703125, 0.12200927734375, 0.147064208984375, 0.172119140625, 0.197174072265625, 0.22222900390625, 0.247283935546875, 0.2723388671875, 0.297393798828125, 0.32244873046875, 0.347503662109375, 0.37255859375, 0.397613525390625, 0.42266845703125, 0.447723388671875, 0.4727783203125, 0.497833251953125, 0.52288818359375, 0.547943115234375, 0.572998046875, 0.598052978515625, 0.62310791015625, 0.648162841796875, 0.6732177734375, 0.698272705078125, 0.72332763671875, 0.748382568359375, 0.7734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 5.0, 6.0, 15.0, 16.0, 17.0, 33.0, 21.0, 19.0, 36.0, 34.0, 25.0, 29.0, 41.0, 33.0, 42.0, 40.0, 37.0, 33.0, 1055.0, 39.0, 42.0, 45.0, 48.0, 42.0, 37.0, 33.0, 23.0, 27.0, 20.0, 21.0, 17.0, 18.0, 11.0, 17.0, 8.0, 8.0, 6.0, 8.0, 3.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.953125, -5.78448486328125, -5.6158447265625, -5.44720458984375, -5.278564453125, -5.10992431640625, -4.9412841796875, -4.77264404296875, -4.60400390625, -4.43536376953125, -4.2667236328125, -4.09808349609375, -3.929443359375, -3.76080322265625, -3.5921630859375, -3.42352294921875, -3.2548828125, -3.08624267578125, -2.9176025390625, -2.74896240234375, -2.580322265625, -2.41168212890625, -2.2430419921875, -2.07440185546875, -1.90576171875, -1.73712158203125, -1.5684814453125, -1.39984130859375, -1.231201171875, -1.06256103515625, -0.8939208984375, -0.72528076171875, -0.556640625, -0.38800048828125, -0.2193603515625, -0.05072021484375, 0.117919921875, 0.28656005859375, 0.4552001953125, 0.62384033203125, 0.79248046875, 0.96112060546875, 1.1297607421875, 1.29840087890625, 1.467041015625, 1.63568115234375, 1.8043212890625, 1.97296142578125, 2.1416015625, 2.31024169921875, 2.4788818359375, 2.64752197265625, 2.816162109375, 2.98480224609375, 3.1534423828125, 3.32208251953125, 3.49072265625, 3.65936279296875, 3.8280029296875, 3.99664306640625, 4.165283203125, 4.33392333984375, 4.5025634765625, 4.67120361328125, 4.83984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 16.0, 17.0, 15.0, 36.0, 39.0, 66.0, 84.0, 126.0, 207.0, 314.0, 527.0, 758.0, 1273.0, 2064.0, 3282.0, 5358.0, 8603.0, 13452.0, 21105.0, 32456.0, 48559.0, 71512.0, 99763.0, 127819.0, 1184187.0, 136895.0, 106249.0, 78649.0, 53664.0, 35781.0, 23394.0, 15084.0, 9636.0, 6097.0, 3841.0, 2393.0, 1460.0, 874.0, 525.0, 350.0, 231.0, 123.0, 104.0, 49.0, 25.0, 31.0, 16.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.62841796875, -0.6102676391601562, -0.5921173095703125, -0.5739669799804688, -0.555816650390625, -0.5376663208007812, -0.5195159912109375, -0.5013656616210938, -0.48321533203125, -0.46506500244140625, -0.4469146728515625, -0.42876434326171875, -0.410614013671875, -0.39246368408203125, -0.3743133544921875, -0.35616302490234375, -0.3380126953125, -0.31986236572265625, -0.3017120361328125, -0.28356170654296875, -0.265411376953125, -0.24726104736328125, -0.2291107177734375, -0.21096038818359375, -0.19281005859375, -0.17465972900390625, -0.1565093994140625, -0.13835906982421875, -0.120208740234375, -0.10205841064453125, -0.0839080810546875, -0.06575775146484375, -0.047607421875, -0.02945709228515625, -0.0113067626953125, 0.00684356689453125, 0.024993896484375, 0.04314422607421875, 0.0612945556640625, 0.07944488525390625, 0.09759521484375, 0.11574554443359375, 0.1338958740234375, 0.15204620361328125, 0.170196533203125, 0.18834686279296875, 0.2064971923828125, 0.22464752197265625, 0.2427978515625, 0.26094818115234375, 0.2790985107421875, 0.29724884033203125, 0.315399169921875, 0.33354949951171875, 0.3516998291015625, 0.36985015869140625, 0.38800048828125, 0.40615081787109375, 0.4243011474609375, 0.44245147705078125, 0.460601806640625, 0.47875213623046875, 0.4969024658203125, 0.5150527954101562, 0.533203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 13.0, 26.0, 24.0, 27.0, 46.0, 106.0, 143.0, 145.0, 131.0, 72.0, 53.0, 28.0, 27.0, 29.0, 15.0, 13.0, 6.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.026031494140625, -0.025250673294067383, -0.024469852447509766, -0.02368903160095215, -0.02290821075439453, -0.022127389907836914, -0.021346569061279297, -0.02056574821472168, -0.019784927368164062, -0.019004106521606445, -0.018223285675048828, -0.01744246482849121, -0.016661643981933594, -0.015880823135375977, -0.01510000228881836, -0.014319181442260742, -0.013538360595703125, -0.012757539749145508, -0.01197671890258789, -0.011195898056030273, -0.010415077209472656, -0.009634256362915039, -0.008853435516357422, -0.008072614669799805, -0.0072917938232421875, -0.00651097297668457, -0.005730152130126953, -0.004949331283569336, -0.004168510437011719, -0.0033876895904541016, -0.0026068687438964844, -0.0018260478973388672, -0.00104522705078125, -0.0002644062042236328, 0.0005164146423339844, 0.0012972354888916016, 0.0020780563354492188, 0.002858877182006836, 0.003639698028564453, 0.00442051887512207, 0.0052013397216796875, 0.005982160568237305, 0.006762981414794922, 0.007543802261352539, 0.008324623107910156, 0.009105443954467773, 0.00988626480102539, 0.010667085647583008, 0.011447906494140625, 0.012228727340698242, 0.01300954818725586, 0.013790369033813477, 0.014571189880371094, 0.015352010726928711, 0.016132831573486328, 0.016913652420043945, 0.017694473266601562, 0.01847529411315918, 0.019256114959716797, 0.020036935806274414, 0.02081775665283203, 0.02159857749938965, 0.022379398345947266, 0.023160219192504883, 0.0239410400390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 7.0, 8.0, 7.0, 10.0, 7.0, 17.0, 20.0, 25.0, 32.0, 83.0, 104.0, 116.0, 203.0, 459.0, 2844.0, 1032658.0, 10576.0, 625.0, 255.0, 132.0, 90.0, 57.0, 45.0, 25.0, 26.0, 24.0, 14.0, 11.0, 13.0, 10.0, 8.0, 3.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.453125, -0.43833160400390625, -0.4235382080078125, -0.40874481201171875, -0.393951416015625, -0.37915802001953125, -0.3643646240234375, -0.34957122802734375, -0.33477783203125, -0.31998443603515625, -0.3051910400390625, -0.29039764404296875, -0.275604248046875, -0.26081085205078125, -0.2460174560546875, -0.23122406005859375, -0.2164306640625, -0.20163726806640625, -0.1868438720703125, -0.17205047607421875, -0.157257080078125, -0.14246368408203125, -0.1276702880859375, -0.11287689208984375, -0.09808349609375, -0.08329010009765625, -0.0684967041015625, -0.05370330810546875, -0.038909912109375, -0.02411651611328125, -0.0093231201171875, 0.00547027587890625, 0.020263671875, 0.03505706787109375, 0.0498504638671875, 0.06464385986328125, 0.079437255859375, 0.09423065185546875, 0.1090240478515625, 0.12381744384765625, 0.13861083984375, 0.15340423583984375, 0.1681976318359375, 0.18299102783203125, 0.197784423828125, 0.21257781982421875, 0.2273712158203125, 0.24216461181640625, 0.2569580078125, 0.27175140380859375, 0.2865447998046875, 0.30133819580078125, 0.316131591796875, 0.33092498779296875, 0.3457183837890625, 0.36051177978515625, 0.37530517578125, 0.39009857177734375, 0.4048919677734375, 0.41968536376953125, 0.434478759765625, 0.44927215576171875, 0.4640655517578125, 0.47885894775390625, 0.49365234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 957.0, 56.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08458857983350754, -0.07367686927318573, -0.06276515871286392, -0.05185345187783241, -0.040941741317510605, -0.030030030757188797, -0.019118323922157288, -0.00820661336183548, 0.002705097198486328, 0.013616806827485561, 0.024528516456484795, 0.03544022515416145, 0.04635193571448326, 0.05726364627480507, 0.06817535310983658, 0.07908706367015839, 0.0899987742304802, 0.100910484790802, 0.11182219535112381, 0.12273390591144562, 0.13364560902118683, 0.14455732703208923, 0.15546903014183044, 0.16638073325157166, 0.17729245126247406, 0.18820415437221527, 0.19911587238311768, 0.2100275754928589, 0.2209392935037613, 0.2318509966135025, 0.2427627146244049, 0.2536744177341461, 0.26458612084388733, 0.27549782395362854, 0.28640952706336975, 0.29732125997543335, 0.30823296308517456, 0.31914466619491577, 0.330056369304657, 0.3409680724143982, 0.3518798053264618, 0.362791508436203, 0.3737032115459442, 0.3846149444580078, 0.395526647567749, 0.40643835067749023, 0.41735005378723145, 0.42826175689697266, 0.43917346000671387, 0.4500851631164551, 0.4609968662261963, 0.4719085991382599, 0.4828203022480011, 0.4937320053577423, 0.5046437382698059, 0.5155554413795471, 0.5264671444892883, 0.5373788475990295, 0.5482905507087708, 0.559202253818512, 0.5701139569282532, 0.5810257196426392, 0.5919374227523804, 0.6028491258621216, 0.6137608289718628]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 8.0, 11.0, 9.0, 12.0, 21.0, 30.0, 32.0, 36.0, 36.0, 54.0, 36.0, 66.0, 65.0, 67.0, 58.0, 62.0, 46.0, 53.0, 54.0, 34.0, 57.0, 28.0, 25.0, 24.0, 25.0, 13.0, 18.0, 7.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03312307596206665, -0.032248929142951965, -0.03137478232383728, -0.030500631779432297, -0.02962648496031761, -0.028752338141202927, -0.027878189459443092, -0.027004040777683258, -0.026129893958568573, -0.025255747139453888, -0.024381598457694054, -0.02350744977593422, -0.022633302956819534, -0.02175915613770485, -0.020885007455945015, -0.02001085877418518, -0.019136711955070496, -0.01826256513595581, -0.017388416454195976, -0.016514267772436142, -0.015640120953321457, -0.014765973202884197, -0.013891825452446938, -0.013017677702009678, -0.012143529951572418, -0.011269382201135159, -0.010395234450697899, -0.00952108670026064, -0.00864693894982338, -0.00777279119938612, -0.00689864344894886, -0.0060244956985116005, -0.005150347948074341, -0.004276200197637081, -0.0034020524471998215, -0.002527904696762562, -0.0016537569463253021, -0.0007796091958880424, 9.453855454921722e-05, 0.0009686863049864769, 0.0018428340554237366, 0.0027169818058609962, 0.003591129556298256, 0.004465277306735516, 0.005339425057172775, 0.006213572807610035, 0.007087720558047295, 0.007961868308484554, 0.008836016058921814, 0.009710163809359074, 0.010584311559796333, 0.011458459310233593, 0.012332607060670853, 0.013206754811108112, 0.014080902561545372, 0.014955050311982632, 0.01582919806241989, 0.016703344881534576, 0.01757749356329441, 0.018451642245054245, 0.01932578906416893, 0.020199935883283615, 0.02107408456504345, 0.021948233246803284, 0.02282238006591797]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 8.0, 10.0, 10.0, 16.0, 11.0, 11.0, 22.0, 20.0, 17.0, 15.0, 17.0, 23.0, 30.0, 29.0, 33.0, 31.0, 36.0, 40.0, 39.0, 39.0, 28.0, 46.0, 46.0, 29.0, 36.0, 35.0, 30.0, 25.0, 34.0, 11.0, 22.0, 25.0, 19.0, 17.0, 15.0, 20.0, 11.0, 6.0, 13.0, 9.0, 10.0, 8.0, 5.0, 10.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.64453125, -6.4346923828125, -6.224853515625, -6.0150146484375, -5.80517578125, -5.5953369140625, -5.385498046875, -5.1756591796875, -4.9658203125, -4.7559814453125, -4.546142578125, -4.3363037109375, -4.12646484375, -3.9166259765625, -3.706787109375, -3.4969482421875, -3.287109375, -3.0772705078125, -2.867431640625, -2.6575927734375, -2.44775390625, -2.2379150390625, -2.028076171875, -1.8182373046875, -1.6083984375, -1.3985595703125, -1.188720703125, -0.9788818359375, -0.76904296875, -0.5592041015625, -0.349365234375, -0.1395263671875, 0.0703125, 0.2801513671875, 0.489990234375, 0.6998291015625, 0.90966796875, 1.1195068359375, 1.329345703125, 1.5391845703125, 1.7490234375, 1.9588623046875, 2.168701171875, 2.3785400390625, 2.58837890625, 2.7982177734375, 3.008056640625, 3.2178955078125, 3.427734375, 3.6375732421875, 3.847412109375, 4.0572509765625, 4.26708984375, 4.4769287109375, 4.686767578125, 4.8966064453125, 5.1064453125, 5.3162841796875, 5.526123046875, 5.7359619140625, 5.94580078125, 6.1556396484375, 6.365478515625, 6.5753173828125, 6.78515625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 2.0, 6.0, 12.0, 13.0, 25.0, 25.0, 32.0, 43.0, 54.0, 83.0, 92.0, 122.0, 151.0, 169.0, 239.0, 317.0, 352.0, 457.0, 619.0, 829.0, 1213.0, 2290.0, 5470.0, 16536.0, 54800.0, 171531.0, 405706.0, 257495.0, 86825.0, 26066.0, 8190.0, 3155.0, 1641.0, 916.0, 655.0, 493.0, 403.0, 333.0, 274.0, 221.0, 148.0, 121.0, 87.0, 73.0, 63.0, 48.0, 37.0, 33.0, 24.0, 11.0, 14.0, 9.0, 8.0, 12.0, 5.0, 2.0, 4.0, 2.0], "bins": [-13.25, -12.8447265625, -12.439453125, -12.0341796875, -11.62890625, -11.2236328125, -10.818359375, -10.4130859375, -10.0078125, -9.6025390625, -9.197265625, -8.7919921875, -8.38671875, -7.9814453125, -7.576171875, -7.1708984375, -6.765625, -6.3603515625, -5.955078125, -5.5498046875, -5.14453125, -4.7392578125, -4.333984375, -3.9287109375, -3.5234375, -3.1181640625, -2.712890625, -2.3076171875, -1.90234375, -1.4970703125, -1.091796875, -0.6865234375, -0.28125, 0.1240234375, 0.529296875, 0.9345703125, 1.33984375, 1.7451171875, 2.150390625, 2.5556640625, 2.9609375, 3.3662109375, 3.771484375, 4.1767578125, 4.58203125, 4.9873046875, 5.392578125, 5.7978515625, 6.203125, 6.6083984375, 7.013671875, 7.4189453125, 7.82421875, 8.2294921875, 8.634765625, 9.0400390625, 9.4453125, 9.8505859375, 10.255859375, 10.6611328125, 11.06640625, 11.4716796875, 11.876953125, 12.2822265625, 12.6875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 7.0, 15.0, 15.0, 15.0, 23.0, 17.0, 29.0, 37.0, 37.0, 39.0, 43.0, 79.0, 86.0, 127.0, 262.0, 1413.0, 226.0, 128.0, 85.0, 56.0, 49.0, 46.0, 32.0, 28.0, 28.0, 19.0, 24.0, 15.0, 12.0, 9.0, 9.0, 3.0, 4.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.046875, -19.388427734375, -18.72998046875, -18.071533203125, -17.4130859375, -16.754638671875, -16.09619140625, -15.437744140625, -14.779296875, -14.120849609375, -13.46240234375, -12.803955078125, -12.1455078125, -11.487060546875, -10.82861328125, -10.170166015625, -9.51171875, -8.853271484375, -8.19482421875, -7.536376953125, -6.8779296875, -6.219482421875, -5.56103515625, -4.902587890625, -4.244140625, -3.585693359375, -2.92724609375, -2.268798828125, -1.6103515625, -0.951904296875, -0.29345703125, 0.364990234375, 1.0234375, 1.681884765625, 2.34033203125, 2.998779296875, 3.6572265625, 4.315673828125, 4.97412109375, 5.632568359375, 6.291015625, 6.949462890625, 7.60791015625, 8.266357421875, 8.9248046875, 9.583251953125, 10.24169921875, 10.900146484375, 11.55859375, 12.217041015625, 12.87548828125, 13.533935546875, 14.1923828125, 14.850830078125, 15.50927734375, 16.167724609375, 16.826171875, 17.484619140625, 18.14306640625, 18.801513671875, 19.4599609375, 20.118408203125, 20.77685546875, 21.435302734375, 22.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 17.0, 31.0, 44.0, 50.0, 86.0, 137.0, 285.0, 517.0, 1069.0, 7230.0, 3129386.0, 4650.0, 1000.0, 447.0, 253.0, 166.0, 82.0, 59.0, 42.0, 29.0, 16.0, 17.0, 14.0, 9.0, 9.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.1875, -121.5537109375, -117.919921875, -114.2861328125, -110.65234375, -107.0185546875, -103.384765625, -99.7509765625, -96.1171875, -92.4833984375, -88.849609375, -85.2158203125, -81.58203125, -77.9482421875, -74.314453125, -70.6806640625, -67.046875, -63.4130859375, -59.779296875, -56.1455078125, -52.51171875, -48.8779296875, -45.244140625, -41.6103515625, -37.9765625, -34.3427734375, -30.708984375, -27.0751953125, -23.44140625, -19.8076171875, -16.173828125, -12.5400390625, -8.90625, -5.2724609375, -1.638671875, 1.9951171875, 5.62890625, 9.2626953125, 12.896484375, 16.5302734375, 20.1640625, 23.7978515625, 27.431640625, 31.0654296875, 34.69921875, 38.3330078125, 41.966796875, 45.6005859375, 49.234375, 52.8681640625, 56.501953125, 60.1357421875, 63.76953125, 67.4033203125, 71.037109375, 74.6708984375, 78.3046875, 81.9384765625, 85.572265625, 89.2060546875, 92.83984375, 96.4736328125, 100.107421875, 103.7412109375, 107.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 18.0, 41.0, 98.0, 179.0, 247.0, 199.0, 119.0, 69.0, 21.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.30699157714844, -68.3917236328125, -65.47645568847656, -62.561187744140625, -59.64592361450195, -56.730655670166016, -53.81538772583008, -50.900123596191406, -47.98485565185547, -45.06958770751953, -42.154319763183594, -39.239051818847656, -36.323787689208984, -33.40851974487305, -30.49325180053711, -27.577985763549805, -24.662715911865234, -21.747447967529297, -18.832181930541992, -15.916913986206055, -13.001646995544434, -10.086380004882812, -7.171112060546875, -4.25584602355957, -1.3405780792236328, 1.5746891498565674, 4.489956378936768, 7.405223846435547, 10.320490837097168, 13.235757827758789, 16.151025772094727, 19.06629180908203, 21.98155975341797, 24.896827697753906, 27.81209373474121, 30.72736167907715, 33.64262771606445, 36.55789566040039, 39.47316360473633, 42.388427734375, 45.30369567871094, 48.218963623046875, 51.13423156738281, 54.04949951171875, 56.96476364135742, 59.88003158569336, 62.7952995300293, 65.71056365966797, 68.62583923339844, 71.54110717773438, 74.45637512207031, 77.37164306640625, 80.28691101074219, 83.20217895507812, 86.11744689941406, 89.03270721435547, 91.9479751586914, 94.86324310302734, 97.77851104736328, 100.69377899169922, 103.60904693603516, 106.52430725097656, 109.4395751953125, 112.35484313964844, 115.27011108398438]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 8.0, 6.0, 13.0, 15.0, 14.0, 12.0, 21.0, 25.0, 22.0, 25.0, 25.0, 33.0, 33.0, 42.0, 44.0, 35.0, 36.0, 41.0, 47.0, 47.0, 44.0, 35.0, 31.0, 32.0, 36.0, 38.0, 41.0, 30.0, 29.0, 24.0, 17.0, 15.0, 7.0, 18.0, 11.0, 8.0, 7.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.09221649169922, -47.382896423339844, -45.67357635498047, -43.964256286621094, -42.254940032958984, -40.54561996459961, -38.836299896240234, -37.12697982788086, -35.417659759521484, -33.70833969116211, -31.999021530151367, -30.289701461791992, -28.580381393432617, -26.871063232421875, -25.1617431640625, -23.452423095703125, -21.743104934692383, -20.033784866333008, -18.324466705322266, -16.61514663696289, -14.905826568603516, -13.196507453918457, -11.487188339233398, -9.777868270874023, -8.068549156188965, -6.359229564666748, -4.649909973144531, -2.9405908584594727, -1.2312712669372559, 0.47804832458496094, 2.1873674392700195, 3.8966875076293945, 5.606006622314453, 7.31532621383667, 9.024645805358887, 10.733964920043945, 12.44328498840332, 14.152604103088379, 15.861923217773438, 17.571243286132812, 19.280563354492188, 20.989883422851562, 22.699201583862305, 24.40852165222168, 26.117841720581055, 27.827159881591797, 29.536479949951172, 31.245800018310547, 32.955116271972656, 34.66443634033203, 36.373756408691406, 38.08307647705078, 39.79239273071289, 41.501712799072266, 43.21103286743164, 44.920352935791016, 46.62967300415039, 48.338993072509766, 50.04831314086914, 51.75762939453125, 53.466949462890625, 55.17626953125, 56.885589599609375, 58.59490966796875, 60.304229736328125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 15.0, 8.0, 7.0, 9.0, 15.0, 21.0, 18.0, 22.0, 22.0, 30.0, 14.0, 37.0, 37.0, 31.0, 41.0, 53.0, 44.0, 29.0, 41.0, 41.0, 34.0, 25.0, 36.0, 38.0, 46.0, 32.0, 22.0, 28.0, 23.0, 16.0, 21.0, 20.0, 25.0, 15.0, 9.0, 8.0, 9.0, 7.0, 6.0, 9.0, 5.0, 4.0, 2.0, 5.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.3203125, -7.0911865234375, -6.862060546875, -6.6329345703125, -6.40380859375, -6.1746826171875, -5.945556640625, -5.7164306640625, -5.4873046875, -5.2581787109375, -5.029052734375, -4.7999267578125, -4.57080078125, -4.3416748046875, -4.112548828125, -3.8834228515625, -3.654296875, -3.4251708984375, -3.196044921875, -2.9669189453125, -2.73779296875, -2.5086669921875, -2.279541015625, -2.0504150390625, -1.8212890625, -1.5921630859375, -1.363037109375, -1.1339111328125, -0.90478515625, -0.6756591796875, -0.446533203125, -0.2174072265625, 0.01171875, 0.2408447265625, 0.469970703125, 0.6990966796875, 0.92822265625, 1.1573486328125, 1.386474609375, 1.6156005859375, 1.8447265625, 2.0738525390625, 2.302978515625, 2.5321044921875, 2.76123046875, 2.9903564453125, 3.219482421875, 3.4486083984375, 3.677734375, 3.9068603515625, 4.135986328125, 4.3651123046875, 4.59423828125, 4.8233642578125, 5.052490234375, 5.2816162109375, 5.5107421875, 5.7398681640625, 5.968994140625, 6.1981201171875, 6.42724609375, 6.6563720703125, 6.885498046875, 7.1146240234375, 7.34375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 11.0, 11.0, 17.0, 35.0, 67.0, 101.0, 185.0, 422.0, 962.0, 2049.0, 5368.0, 19435.0, 147774.0, 1532722.0, 2200989.0, 245471.0, 27587.0, 6747.0, 2347.0, 996.0, 488.0, 231.0, 113.0, 52.0, 29.0, 16.0, 10.0, 10.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.44189453125, -16.8212890625, -16.20068359375, -15.580078125, -14.95947265625, -14.3388671875, -13.71826171875, -13.09765625, -12.47705078125, -11.8564453125, -11.23583984375, -10.615234375, -9.99462890625, -9.3740234375, -8.75341796875, -8.1328125, -7.51220703125, -6.8916015625, -6.27099609375, -5.650390625, -5.02978515625, -4.4091796875, -3.78857421875, -3.16796875, -2.54736328125, -1.9267578125, -1.30615234375, -0.685546875, -0.06494140625, 0.5556640625, 1.17626953125, 1.796875, 2.41748046875, 3.0380859375, 3.65869140625, 4.279296875, 4.89990234375, 5.5205078125, 6.14111328125, 6.76171875, 7.38232421875, 8.0029296875, 8.62353515625, 9.244140625, 9.86474609375, 10.4853515625, 11.10595703125, 11.7265625, 12.34716796875, 12.9677734375, 13.58837890625, 14.208984375, 14.82958984375, 15.4501953125, 16.07080078125, 16.69140625, 17.31201171875, 17.9326171875, 18.55322265625, 19.173828125, 19.79443359375, 20.4150390625, 21.03564453125, 21.65625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 12.0, 32.0, 35.0, 48.0, 95.0, 127.0, 213.0, 313.0, 499.0, 780.0, 671.0, 462.0, 288.0, 156.0, 116.0, 86.0, 45.0, 21.0, 15.0, 26.0, 17.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.875, -13.2119140625, -12.548828125, -11.8857421875, -11.22265625, -10.5595703125, -9.896484375, -9.2333984375, -8.5703125, -7.9072265625, -7.244140625, -6.5810546875, -5.91796875, -5.2548828125, -4.591796875, -3.9287109375, -3.265625, -2.6025390625, -1.939453125, -1.2763671875, -0.61328125, 0.0498046875, 0.712890625, 1.3759765625, 2.0390625, 2.7021484375, 3.365234375, 4.0283203125, 4.69140625, 5.3544921875, 6.017578125, 6.6806640625, 7.34375, 8.0068359375, 8.669921875, 9.3330078125, 9.99609375, 10.6591796875, 11.322265625, 11.9853515625, 12.6484375, 13.3115234375, 13.974609375, 14.6376953125, 15.30078125, 15.9638671875, 16.626953125, 17.2900390625, 17.953125, 18.6162109375, 19.279296875, 19.9423828125, 20.60546875, 21.2685546875, 21.931640625, 22.5947265625, 23.2578125, 23.9208984375, 24.583984375, 25.2470703125, 25.91015625, 26.5732421875, 27.236328125, 27.8994140625, 28.5625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 8.0, 9.0, 9.0, 17.0, 37.0, 75.0, 124.0, 298.0, 731.0, 2257.0, 19488.0, 1195722.0, 2929368.0, 41258.0, 3253.0, 930.0, 392.0, 157.0, 74.0, 39.0, 25.0, 10.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.25, -40.93408203125, -39.6181640625, -38.30224609375, -36.986328125, -35.67041015625, -34.3544921875, -33.03857421875, -31.72265625, -30.40673828125, -29.0908203125, -27.77490234375, -26.458984375, -25.14306640625, -23.8271484375, -22.51123046875, -21.1953125, -19.87939453125, -18.5634765625, -17.24755859375, -15.931640625, -14.61572265625, -13.2998046875, -11.98388671875, -10.66796875, -9.35205078125, -8.0361328125, -6.72021484375, -5.404296875, -4.08837890625, -2.7724609375, -1.45654296875, -0.140625, 1.17529296875, 2.4912109375, 3.80712890625, 5.123046875, 6.43896484375, 7.7548828125, 9.07080078125, 10.38671875, 11.70263671875, 13.0185546875, 14.33447265625, 15.650390625, 16.96630859375, 18.2822265625, 19.59814453125, 20.9140625, 22.22998046875, 23.5458984375, 24.86181640625, 26.177734375, 27.49365234375, 28.8095703125, 30.12548828125, 31.44140625, 32.75732421875, 34.0732421875, 35.38916015625, 36.705078125, 38.02099609375, 39.3369140625, 40.65283203125, 41.96875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 11.0, 54.0, 245.0, 444.0, 216.0, 38.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.20370483398438, -87.2127685546875, -80.22183990478516, -73.23091125488281, -66.23997497558594, -59.24904251098633, -52.25811004638672, -45.26717758178711, -38.2762451171875, -31.28531265258789, -24.29438018798828, -17.303447723388672, -10.312515258789062, -3.321582794189453, 3.6693496704101562, 10.660282135009766, 17.651214599609375, 24.642147064208984, 31.633079528808594, 38.6240119934082, 45.61494445800781, 52.60587692260742, 59.59680938720703, 66.58773803710938, 73.57867431640625, 80.56961059570312, 87.56053924560547, 94.55146789550781, 101.54240417480469, 108.53334045410156, 115.5242691040039, 122.51519775390625, 129.50613403320312, 136.4970703125, 143.48800659179688, 150.4789276123047, 157.46986389160156, 164.46080017089844, 171.45172119140625, 178.44265747070312, 185.43359375, 192.42453002929688, 199.41546630859375, 206.40638732910156, 213.39732360839844, 220.3882598876953, 227.37918090820312, 234.3701171875, 241.36105346679688, 248.35198974609375, 255.34292602539062, 262.3338623046875, 269.32476806640625, 276.3157043457031, 283.306640625, 290.2975769042969, 297.28851318359375, 304.2794494628906, 311.2703857421875, 318.2613220214844, 325.25225830078125, 332.2431640625, 339.2341003417969, 346.22503662109375, 353.2159729003906]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 3.0, 7.0, 10.0, 7.0, 11.0, 12.0, 9.0, 17.0, 17.0, 16.0, 23.0, 14.0, 24.0, 21.0, 25.0, 36.0, 29.0, 40.0, 50.0, 39.0, 31.0, 32.0, 38.0, 38.0, 33.0, 32.0, 33.0, 38.0, 29.0, 30.0, 24.0, 28.0, 41.0, 28.0, 26.0, 11.0, 14.0, 14.0, 12.0, 6.0, 14.0, 6.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.37238311767578, -43.9488639831543, -42.52534484863281, -41.10182571411133, -39.678306579589844, -38.254783630371094, -36.83126449584961, -35.407745361328125, -33.98422622680664, -32.560707092285156, -31.137187957763672, -29.713666915893555, -28.29014778137207, -26.866628646850586, -25.44310760498047, -24.019588470458984, -22.5960693359375, -21.172550201416016, -19.74903106689453, -18.325510025024414, -16.90199089050293, -15.478471755981445, -14.054951667785645, -12.631431579589844, -11.20791244506836, -9.784393310546875, -8.360873222351074, -6.937353610992432, -5.513833999633789, -4.0903143882751465, -2.666794776916504, -1.2432746887207031, 0.18024826049804688, 1.6037678718566895, 3.027287483215332, 4.450807094573975, 5.874326705932617, 7.29784631729126, 8.721365928649902, 10.144886016845703, 11.568405151367188, 12.991924285888672, 14.415444374084473, 15.838964462280273, 17.262483596801758, 18.686002731323242, 20.10952377319336, 21.533042907714844, 22.956562042236328, 24.380081176757812, 25.803600311279297, 27.227121353149414, 28.6506404876709, 30.074159622192383, 31.4976806640625, 32.921199798583984, 34.34471893310547, 35.76823806762695, 37.19175720214844, 38.61527633666992, 40.038795471191406, 41.462318420410156, 42.88583755493164, 44.309356689453125, 45.73287582397461]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 9.0, 9.0, 8.0, 8.0, 23.0, 22.0, 22.0, 35.0, 26.0, 29.0, 35.0, 30.0, 45.0, 42.0, 65.0, 40.0, 40.0, 39.0, 32.0, 35.0, 50.0, 40.0, 47.0, 32.0, 28.0, 28.0, 18.0, 23.0, 24.0, 17.0, 15.0, 8.0, 14.0, 10.0, 12.0, 8.0, 5.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.317138671875, -6.10693359375, -5.896728515625, -5.6865234375, -5.476318359375, -5.26611328125, -5.055908203125, -4.845703125, -4.635498046875, -4.42529296875, -4.215087890625, -4.0048828125, -3.794677734375, -3.58447265625, -3.374267578125, -3.1640625, -2.953857421875, -2.74365234375, -2.533447265625, -2.3232421875, -2.113037109375, -1.90283203125, -1.692626953125, -1.482421875, -1.272216796875, -1.06201171875, -0.851806640625, -0.6416015625, -0.431396484375, -0.22119140625, -0.010986328125, 0.19921875, 0.409423828125, 0.61962890625, 0.829833984375, 1.0400390625, 1.250244140625, 1.46044921875, 1.670654296875, 1.880859375, 2.091064453125, 2.30126953125, 2.511474609375, 2.7216796875, 2.931884765625, 3.14208984375, 3.352294921875, 3.5625, 3.772705078125, 3.98291015625, 4.193115234375, 4.4033203125, 4.613525390625, 4.82373046875, 5.033935546875, 5.244140625, 5.454345703125, 5.66455078125, 5.874755859375, 6.0849609375, 6.295166015625, 6.50537109375, 6.715576171875, 6.92578125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 17.0, 24.0, 28.0, 37.0, 59.0, 80.0, 112.0, 191.0, 253.0, 391.0, 554.0, 875.0, 1241.0, 2019.0, 3220.0, 5085.0, 8242.0, 13376.0, 21468.0, 35251.0, 56205.0, 88722.0, 131033.0, 169336.0, 165444.0, 124499.0, 82927.0, 51876.0, 32847.0, 20006.0, 12334.0, 7497.0, 4791.0, 3011.0, 1925.0, 1205.0, 770.0, 544.0, 357.0, 243.0, 140.0, 128.0, 62.0, 46.0, 20.0, 17.0, 22.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.85791015625, -0.8326187133789062, -0.8073272705078125, -0.7820358276367188, -0.756744384765625, -0.7314529418945312, -0.7061614990234375, -0.6808700561523438, -0.65557861328125, -0.6302871704101562, -0.6049957275390625, -0.5797042846679688, -0.554412841796875, -0.5291213989257812, -0.5038299560546875, -0.47853851318359375, -0.4532470703125, -0.42795562744140625, -0.4026641845703125, -0.37737274169921875, -0.352081298828125, -0.32678985595703125, -0.3014984130859375, -0.27620697021484375, -0.25091552734375, -0.22562408447265625, -0.2003326416015625, -0.17504119873046875, -0.149749755859375, -0.12445831298828125, -0.0991668701171875, -0.07387542724609375, -0.048583984375, -0.02329254150390625, 0.0019989013671875, 0.02729034423828125, 0.052581787109375, 0.07787322998046875, 0.1031646728515625, 0.12845611572265625, 0.15374755859375, 0.17903900146484375, 0.2043304443359375, 0.22962188720703125, 0.254913330078125, 0.28020477294921875, 0.3054962158203125, 0.33078765869140625, 0.3560791015625, 0.38137054443359375, 0.4066619873046875, 0.43195343017578125, 0.457244873046875, 0.48253631591796875, 0.5078277587890625, 0.5331192016601562, 0.55841064453125, 0.5837020874023438, 0.6089935302734375, 0.6342849731445312, 0.659576416015625, 0.6848678588867188, 0.7101593017578125, 0.7354507446289062, 0.7607421875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 5.0, 10.0, 17.0, 15.0, 14.0, 21.0, 19.0, 11.0, 28.0, 23.0, 23.0, 26.0, 32.0, 27.0, 31.0, 27.0, 35.0, 42.0, 42.0, 1072.0, 44.0, 38.0, 24.0, 39.0, 45.0, 29.0, 33.0, 30.0, 34.0, 21.0, 16.0, 21.0, 15.0, 11.0, 16.0, 12.0, 17.0, 10.0, 4.0, 3.0, 3.0, 9.0, 8.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.935546875, -3.810943603515625, -3.68634033203125, -3.561737060546875, -3.4371337890625, -3.312530517578125, -3.18792724609375, -3.063323974609375, -2.938720703125, -2.814117431640625, -2.68951416015625, -2.564910888671875, -2.4403076171875, -2.315704345703125, -2.19110107421875, -2.066497802734375, -1.94189453125, -1.817291259765625, -1.69268798828125, -1.568084716796875, -1.4434814453125, -1.318878173828125, -1.19427490234375, -1.069671630859375, -0.945068359375, -0.820465087890625, -0.69586181640625, -0.571258544921875, -0.4466552734375, -0.322052001953125, -0.19744873046875, -0.072845458984375, 0.0517578125, 0.176361083984375, 0.30096435546875, 0.425567626953125, 0.5501708984375, 0.674774169921875, 0.79937744140625, 0.923980712890625, 1.048583984375, 1.173187255859375, 1.29779052734375, 1.422393798828125, 1.5469970703125, 1.671600341796875, 1.79620361328125, 1.920806884765625, 2.04541015625, 2.170013427734375, 2.29461669921875, 2.419219970703125, 2.5438232421875, 2.668426513671875, 2.79302978515625, 2.917633056640625, 3.042236328125, 3.166839599609375, 3.29144287109375, 3.416046142578125, 3.5406494140625, 3.665252685546875, 3.78985595703125, 3.914459228515625, 4.0390625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 19.0, 33.0, 44.0, 50.0, 80.0, 143.0, 252.0, 349.0, 573.0, 783.0, 1367.0, 2137.0, 3435.0, 5495.0, 8810.0, 14154.0, 22242.0, 34876.0, 53576.0, 80568.0, 114251.0, 153252.0, 1194448.0, 130381.0, 94631.0, 64744.0, 42726.0, 27309.0, 17223.0, 10852.0, 6764.0, 4297.0, 2626.0, 1718.0, 1032.0, 657.0, 431.0, 268.0, 172.0, 132.0, 79.0, 45.0, 29.0, 25.0, 14.0, 7.0, 12.0, 10.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.50537109375, -0.48918914794921875, -0.4730072021484375, -0.45682525634765625, -0.440643310546875, -0.42446136474609375, -0.4082794189453125, -0.39209747314453125, -0.37591552734375, -0.35973358154296875, -0.3435516357421875, -0.32736968994140625, -0.311187744140625, -0.29500579833984375, -0.2788238525390625, -0.26264190673828125, -0.2464599609375, -0.23027801513671875, -0.2140960693359375, -0.19791412353515625, -0.181732177734375, -0.16555023193359375, -0.1493682861328125, -0.13318634033203125, -0.11700439453125, -0.10082244873046875, -0.0846405029296875, -0.06845855712890625, -0.052276611328125, -0.03609466552734375, -0.0199127197265625, -0.00373077392578125, 0.012451171875, 0.02863311767578125, 0.0448150634765625, 0.06099700927734375, 0.077178955078125, 0.09336090087890625, 0.1095428466796875, 0.12572479248046875, 0.14190673828125, 0.15808868408203125, 0.1742706298828125, 0.19045257568359375, 0.206634521484375, 0.22281646728515625, 0.2389984130859375, 0.25518035888671875, 0.2713623046875, 0.28754425048828125, 0.3037261962890625, 0.31990814208984375, 0.336090087890625, 0.35227203369140625, 0.3684539794921875, 0.38463592529296875, 0.40081787109375, 0.41699981689453125, 0.4331817626953125, 0.44936370849609375, 0.465545654296875, 0.48172760009765625, 0.4979095458984375, 0.5140914916992188, 0.5302734375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 3.0, 5.0, 6.0, 10.0, 10.0, 10.0, 18.0, 20.0, 25.0, 37.0, 40.0, 50.0, 76.0, 89.0, 87.0, 104.0, 80.0, 62.0, 55.0, 37.0, 30.0, 23.0, 20.0, 10.0, 15.0, 9.0, 12.0, 11.0, 6.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.01259613037109375, -0.012238025665283203, -0.011879920959472656, -0.01152181625366211, -0.011163711547851562, -0.010805606842041016, -0.010447502136230469, -0.010089397430419922, -0.009731292724609375, -0.009373188018798828, -0.009015083312988281, -0.008656978607177734, -0.008298873901367188, -0.00794076919555664, -0.007582664489746094, -0.007224559783935547, -0.006866455078125, -0.006508350372314453, -0.006150245666503906, -0.005792140960693359, -0.0054340362548828125, -0.005075931549072266, -0.004717826843261719, -0.004359722137451172, -0.004001617431640625, -0.003643512725830078, -0.0032854080200195312, -0.0029273033142089844, -0.0025691986083984375, -0.0022110939025878906, -0.0018529891967773438, -0.0014948844909667969, -0.00113677978515625, -0.0007786750793457031, -0.00042057037353515625, -6.246566772460938e-05, 0.0002956390380859375, 0.0006537437438964844, 0.0010118484497070312, 0.0013699531555175781, 0.001728057861328125, 0.002086162567138672, 0.0024442672729492188, 0.0028023719787597656, 0.0031604766845703125, 0.0035185813903808594, 0.0038766860961914062, 0.004234790802001953, 0.0045928955078125, 0.004951000213623047, 0.005309104919433594, 0.005667209625244141, 0.0060253143310546875, 0.006383419036865234, 0.006741523742675781, 0.007099628448486328, 0.007457733154296875, 0.007815837860107422, 0.008173942565917969, 0.008532047271728516, 0.008890151977539062, 0.00924825668334961, 0.009606361389160156, 0.009964466094970703, 0.01032257080078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 9.0, 6.0, 6.0, 13.0, 11.0, 27.0, 18.0, 38.0, 17.0, 35.0, 41.0, 48.0, 86.0, 119.0, 198.0, 304.0, 594.0, 5222.0, 1020513.0, 19324.0, 810.0, 379.0, 202.0, 144.0, 99.0, 67.0, 42.0, 41.0, 27.0, 19.0, 22.0, 16.0, 11.0, 9.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.184814453125, -0.1785736083984375, -0.172332763671875, -0.1660919189453125, -0.15985107421875, -0.1536102294921875, -0.147369384765625, -0.1411285400390625, -0.1348876953125, -0.1286468505859375, -0.122406005859375, -0.1161651611328125, -0.10992431640625, -0.1036834716796875, -0.097442626953125, -0.0912017822265625, -0.0849609375, -0.0787200927734375, -0.072479248046875, -0.0662384033203125, -0.05999755859375, -0.0537567138671875, -0.047515869140625, -0.0412750244140625, -0.0350341796875, -0.0287933349609375, -0.022552490234375, -0.0163116455078125, -0.01007080078125, -0.0038299560546875, 0.002410888671875, 0.0086517333984375, 0.014892578125, 0.0211334228515625, 0.027374267578125, 0.0336151123046875, 0.03985595703125, 0.0460968017578125, 0.052337646484375, 0.0585784912109375, 0.0648193359375, 0.0710601806640625, 0.077301025390625, 0.0835418701171875, 0.08978271484375, 0.0960235595703125, 0.102264404296875, 0.1085052490234375, 0.11474609375, 0.1209869384765625, 0.127227783203125, 0.1334686279296875, 0.13970947265625, 0.1459503173828125, 0.152191162109375, 0.1584320068359375, 0.1646728515625, 0.1709136962890625, 0.177154541015625, 0.1833953857421875, 0.18963623046875, 0.1958770751953125, 0.202117919921875, 0.2083587646484375, 0.214599609375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 978.0, 34.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04295317083597183, -0.037378452718257904, -0.031803734600543976, -0.026229020208120346, -0.020654302090406418, -0.01507958397269249, -0.00950486958026886, -0.003930151462554932, 0.0016445666551589966, 0.00721928384155035, 0.012794001027941704, 0.018368717283010483, 0.02394343540072441, 0.02951815351843834, 0.03509286791086197, 0.0406675860285759, 0.046242304146289825, 0.051817022264003754, 0.05739174038171768, 0.06296645104885101, 0.06854116916656494, 0.07411588728427887, 0.0796906054019928, 0.08526532351970673, 0.09084004163742065, 0.09641475975513458, 0.10198947787284851, 0.10756419599056244, 0.11313891410827637, 0.1187136322259903, 0.12428834289312363, 0.12986305356025696, 0.13543778657913208, 0.141012504696846, 0.14658722281455994, 0.15216194093227386, 0.1577366590499878, 0.16331137716770172, 0.16888609528541565, 0.17446079850196838, 0.1800355315208435, 0.18561024963855743, 0.19118496775627136, 0.1967596858739853, 0.20233440399169922, 0.20790912210941315, 0.21348384022712708, 0.2190585434436798, 0.22463326156139374, 0.23020797967910767, 0.2357826977968216, 0.24135741591453552, 0.24693213403224945, 0.2525068521499634, 0.2580815553665161, 0.26365628838539124, 0.26923099160194397, 0.2748056948184967, 0.2803804278373718, 0.28595513105392456, 0.2915298640727997, 0.2971045672893524, 0.30267930030822754, 0.3082540035247803, 0.3138287365436554]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 11.0, 20.0, 22.0, 25.0, 30.0, 46.0, 60.0, 47.0, 64.0, 68.0, 71.0, 66.0, 55.0, 57.0, 50.0, 48.0, 50.0, 38.0, 40.0, 41.0, 23.0, 19.0, 11.0, 12.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.018280208110809326, -0.01781718246638775, -0.01735415682196617, -0.016891131177544594, -0.016428105533123016, -0.01596507988870144, -0.015502054244279861, -0.015039028599858284, -0.014576002955436707, -0.014112977311015129, -0.013649951666593552, -0.013186926022171974, -0.012723900377750397, -0.01226087473332882, -0.011797849088907242, -0.011334823444485664, -0.010871797800064087, -0.01040877215564251, -0.009945746511220932, -0.009482720866799355, -0.009019695222377777, -0.0085566695779562, -0.008093643933534622, -0.007630618289113045, -0.007167592644691467, -0.00670456700026989, -0.006241541355848312, -0.005778515711426735, -0.0053154900670051575, -0.00485246442258358, -0.0043894387781620026, -0.003926413133740425, -0.0034633874893188477, -0.00300036184489727, -0.0025373362004756927, -0.0020743105560541153, -0.0016112849116325378, -0.0011482592672109604, -0.0006852336227893829, -0.00022220797836780548, 0.00024081766605377197, 0.0007038433104753494, 0.0011668689548969269, 0.0016298945993185043, 0.002092920243740082, 0.0025559458881616592, 0.0030189715325832367, 0.003481997177004814, 0.003945022821426392, 0.004408048465847969, 0.0048710741102695465, 0.005334099754691124, 0.005797125399112701, 0.006260151043534279, 0.006723176687955856, 0.007186202332377434, 0.007649227976799011, 0.008112253621220589, 0.008575279265642166, 0.009038304910063744, 0.009501330554485321, 0.009964356198906898, 0.010427381843328476, 0.010890407487750053, 0.01135343313217163]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 11.0, 9.0, 9.0, 8.0, 8.0, 23.0, 20.0, 24.0, 35.0, 26.0, 29.0, 34.0, 31.0, 45.0, 42.0, 65.0, 37.0, 43.0, 39.0, 32.0, 35.0, 49.0, 41.0, 45.0, 32.0, 30.0, 28.0, 17.0, 24.0, 24.0, 16.0, 15.0, 9.0, 14.0, 9.0, 13.0, 8.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.321044921875, -6.11083984375, -5.900634765625, -5.6904296875, -5.480224609375, -5.27001953125, -5.059814453125, -4.849609375, -4.639404296875, -4.42919921875, -4.218994140625, -4.0087890625, -3.798583984375, -3.58837890625, -3.378173828125, -3.16796875, -2.957763671875, -2.74755859375, -2.537353515625, -2.3271484375, -2.116943359375, -1.90673828125, -1.696533203125, -1.486328125, -1.276123046875, -1.06591796875, -0.855712890625, -0.6455078125, -0.435302734375, -0.22509765625, -0.014892578125, 0.1953125, 0.405517578125, 0.61572265625, 0.825927734375, 1.0361328125, 1.246337890625, 1.45654296875, 1.666748046875, 1.876953125, 2.087158203125, 2.29736328125, 2.507568359375, 2.7177734375, 2.927978515625, 3.13818359375, 3.348388671875, 3.55859375, 3.768798828125, 3.97900390625, 4.189208984375, 4.3994140625, 4.609619140625, 4.81982421875, 5.030029296875, 5.240234375, 5.450439453125, 5.66064453125, 5.870849609375, 6.0810546875, 6.291259765625, 6.50146484375, 6.711669921875, 6.921875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 8.0, 4.0, 15.0, 18.0, 24.0, 37.0, 48.0, 79.0, 97.0, 125.0, 148.0, 214.0, 311.0, 409.0, 566.0, 726.0, 940.0, 1425.0, 2096.0, 3437.0, 7887.0, 34646.0, 232621.0, 616458.0, 112838.0, 18769.0, 5393.0, 2665.0, 1794.0, 1312.0, 927.0, 647.0, 517.0, 356.0, 270.0, 209.0, 148.0, 102.0, 74.0, 54.0, 36.0, 35.0, 15.0, 20.0, 8.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.78125, -16.261962890625, -15.74267578125, -15.223388671875, -14.7041015625, -14.184814453125, -13.66552734375, -13.146240234375, -12.626953125, -12.107666015625, -11.58837890625, -11.069091796875, -10.5498046875, -10.030517578125, -9.51123046875, -8.991943359375, -8.47265625, -7.953369140625, -7.43408203125, -6.914794921875, -6.3955078125, -5.876220703125, -5.35693359375, -4.837646484375, -4.318359375, -3.799072265625, -3.27978515625, -2.760498046875, -2.2412109375, -1.721923828125, -1.20263671875, -0.683349609375, -0.1640625, 0.355224609375, 0.87451171875, 1.393798828125, 1.9130859375, 2.432373046875, 2.95166015625, 3.470947265625, 3.990234375, 4.509521484375, 5.02880859375, 5.548095703125, 6.0673828125, 6.586669921875, 7.10595703125, 7.625244140625, 8.14453125, 8.663818359375, 9.18310546875, 9.702392578125, 10.2216796875, 10.740966796875, 11.26025390625, 11.779541015625, 12.298828125, 12.818115234375, 13.33740234375, 13.856689453125, 14.3759765625, 14.895263671875, 15.41455078125, 15.933837890625, 16.453125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 6.0, 2.0, 2.0, 4.0, 9.0, 14.0, 9.0, 17.0, 12.0, 20.0, 22.0, 31.0, 35.0, 28.0, 34.0, 51.0, 50.0, 69.0, 121.0, 209.0, 1396.0, 277.0, 158.0, 93.0, 54.0, 46.0, 45.0, 40.0, 32.0, 27.0, 17.0, 25.0, 16.0, 11.0, 11.0, 9.0, 11.0, 10.0, 6.0, 0.0, 4.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.59375, -16.1019287109375, -15.610107421875, -15.1182861328125, -14.62646484375, -14.1346435546875, -13.642822265625, -13.1510009765625, -12.6591796875, -12.1673583984375, -11.675537109375, -11.1837158203125, -10.69189453125, -10.2000732421875, -9.708251953125, -9.2164306640625, -8.724609375, -8.2327880859375, -7.740966796875, -7.2491455078125, -6.75732421875, -6.2655029296875, -5.773681640625, -5.2818603515625, -4.7900390625, -4.2982177734375, -3.806396484375, -3.3145751953125, -2.82275390625, -2.3309326171875, -1.839111328125, -1.3472900390625, -0.85546875, -0.3636474609375, 0.128173828125, 0.6199951171875, 1.11181640625, 1.6036376953125, 2.095458984375, 2.5872802734375, 3.0791015625, 3.5709228515625, 4.062744140625, 4.5545654296875, 5.04638671875, 5.5382080078125, 6.030029296875, 6.5218505859375, 7.013671875, 7.5054931640625, 7.997314453125, 8.4891357421875, 8.98095703125, 9.4727783203125, 9.964599609375, 10.4564208984375, 10.9482421875, 11.4400634765625, 11.931884765625, 12.4237060546875, 12.91552734375, 13.4073486328125, 13.899169921875, 14.3909912109375, 14.8828125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 9.0, 5.0, 17.0, 21.0, 13.0, 20.0, 26.0, 33.0, 50.0, 82.0, 83.0, 141.0, 250.0, 434.0, 827.0, 1957.0, 11040.0, 3109439.0, 16920.0, 2208.0, 868.0, 436.0, 246.0, 171.0, 109.0, 72.0, 49.0, 46.0, 33.0, 24.0, 16.0, 12.0, 12.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.25, -57.1748046875, -55.099609375, -53.0244140625, -50.94921875, -48.8740234375, -46.798828125, -44.7236328125, -42.6484375, -40.5732421875, -38.498046875, -36.4228515625, -34.34765625, -32.2724609375, -30.197265625, -28.1220703125, -26.046875, -23.9716796875, -21.896484375, -19.8212890625, -17.74609375, -15.6708984375, -13.595703125, -11.5205078125, -9.4453125, -7.3701171875, -5.294921875, -3.2197265625, -1.14453125, 0.9306640625, 3.005859375, 5.0810546875, 7.15625, 9.2314453125, 11.306640625, 13.3818359375, 15.45703125, 17.5322265625, 19.607421875, 21.6826171875, 23.7578125, 25.8330078125, 27.908203125, 29.9833984375, 32.05859375, 34.1337890625, 36.208984375, 38.2841796875, 40.359375, 42.4345703125, 44.509765625, 46.5849609375, 48.66015625, 50.7353515625, 52.810546875, 54.8857421875, 56.9609375, 59.0361328125, 61.111328125, 63.1865234375, 65.26171875, 67.3369140625, 69.412109375, 71.4873046875, 73.5625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 23.0, 137.0, 274.0, 299.0, 194.0, 62.0, 15.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-176.9239959716797, -172.71615600585938, -168.50831604003906, -164.3004913330078, -160.0926513671875, -155.8848114013672, -151.67697143554688, -147.46914672851562, -143.2613067626953, -139.053466796875, -134.8456268310547, -130.63780212402344, -126.42996215820312, -122.22212219238281, -118.0142822265625, -113.80644989013672, -109.5986099243164, -105.3907699584961, -101.18293762207031, -96.97509765625, -92.76726531982422, -88.5594253540039, -84.35159301757812, -80.14375305175781, -75.9359130859375, -71.72807312011719, -67.5202407836914, -63.312400817871094, -59.10456848144531, -54.896728515625, -50.68889236450195, -46.481056213378906, -42.273231506347656, -38.06539535522461, -33.85755920410156, -29.649721145629883, -25.441884994506836, -21.23404884338379, -17.02621078491211, -12.818374633789062, -8.610538482666016, -4.4027018547058105, -0.19486522674560547, 4.012971878051758, 8.220808029174805, 12.428644180297852, 16.63648223876953, 20.844318389892578, 25.052154541015625, 29.259990692138672, 33.46782684326172, 37.67566680908203, 41.88349914550781, 46.091339111328125, 50.29917526245117, 54.50701141357422, 58.714847564697266, 62.92268371582031, 67.13052368164062, 71.3383560180664, 75.54619598388672, 79.7540283203125, 83.96186828613281, 88.16970825195312, 92.3775405883789]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 12.0, 8.0, 10.0, 17.0, 15.0, 18.0, 19.0, 14.0, 17.0, 17.0, 31.0, 25.0, 24.0, 27.0, 32.0, 33.0, 40.0, 50.0, 43.0, 34.0, 32.0, 34.0, 45.0, 43.0, 33.0, 35.0, 28.0, 35.0, 29.0, 28.0, 21.0, 20.0, 26.0, 20.0, 16.0, 11.0, 12.0, 6.0, 6.0, 5.0, 2.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-46.40268325805664, -45.01646423339844, -43.630245208740234, -42.24402618408203, -40.857810974121094, -39.47159194946289, -38.08537292480469, -36.699153900146484, -35.31293487548828, -33.92671585083008, -32.540496826171875, -31.154279708862305, -29.768062591552734, -28.38184356689453, -26.995624542236328, -25.609405517578125, -24.223190307617188, -22.836971282958984, -21.450754165649414, -20.06453514099121, -18.67831802368164, -17.292098999023438, -15.905879974365234, -14.519661903381348, -13.133443832397461, -11.747225761413574, -10.361007690429688, -8.974788665771484, -7.588570594787598, -6.202352523803711, -4.816133499145508, -3.429915428161621, -2.043701171875, -0.6574828624725342, 0.7287354469299316, 2.1149539947509766, 3.5011720657348633, 4.88739013671875, 6.273609161376953, 7.65982723236084, 9.046045303344727, 10.432263374328613, 11.8184814453125, 13.204700469970703, 14.59091854095459, 15.977136611938477, 17.36335563659668, 18.74957275390625, 20.135791778564453, 21.522010803222656, 22.908227920532227, 24.29444694519043, 25.6806640625, 27.066883087158203, 28.453102111816406, 29.83932113647461, 31.22553825378418, 32.61175537109375, 33.99797439575195, 35.384193420410156, 36.77041244506836, 38.15663146972656, 39.5428466796875, 40.9290657043457, 42.315284729003906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 8.0, 11.0, 15.0, 13.0, 16.0, 17.0, 14.0, 22.0, 24.0, 33.0, 22.0, 45.0, 48.0, 41.0, 32.0, 43.0, 44.0, 43.0, 44.0, 41.0, 46.0, 50.0, 35.0, 30.0, 39.0, 34.0, 26.0, 20.0, 22.0, 24.0, 13.0, 9.0, 14.0, 17.0, 5.0, 5.0, 3.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7421875, -6.52191162109375, -6.3016357421875, -6.08135986328125, -5.861083984375, -5.64080810546875, -5.4205322265625, -5.20025634765625, -4.97998046875, -4.75970458984375, -4.5394287109375, -4.31915283203125, -4.098876953125, -3.87860107421875, -3.6583251953125, -3.43804931640625, -3.2177734375, -2.99749755859375, -2.7772216796875, -2.55694580078125, -2.336669921875, -2.11639404296875, -1.8961181640625, -1.67584228515625, -1.45556640625, -1.23529052734375, -1.0150146484375, -0.79473876953125, -0.574462890625, -0.35418701171875, -0.1339111328125, 0.08636474609375, 0.306640625, 0.52691650390625, 0.7471923828125, 0.96746826171875, 1.187744140625, 1.40802001953125, 1.6282958984375, 1.84857177734375, 2.06884765625, 2.28912353515625, 2.5093994140625, 2.72967529296875, 2.949951171875, 3.17022705078125, 3.3905029296875, 3.61077880859375, 3.8310546875, 4.05133056640625, 4.2716064453125, 4.49188232421875, 4.712158203125, 4.93243408203125, 5.1527099609375, 5.37298583984375, 5.59326171875, 5.81353759765625, 6.0338134765625, 6.25408935546875, 6.474365234375, 6.69464111328125, 6.9149169921875, 7.13519287109375, 7.35546875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 18.0, 17.0, 28.0, 54.0, 83.0, 171.0, 327.0, 584.0, 1136.0, 2381.0, 5703.0, 17641.0, 104198.0, 1144163.0, 2486860.0, 375153.0, 39207.0, 9504.0, 3680.0, 1618.0, 794.0, 424.0, 234.0, 134.0, 73.0, 38.0, 22.0, 14.0, 6.0, 4.0, 8.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.671875, -14.17041015625, -13.6689453125, -13.16748046875, -12.666015625, -12.16455078125, -11.6630859375, -11.16162109375, -10.66015625, -10.15869140625, -9.6572265625, -9.15576171875, -8.654296875, -8.15283203125, -7.6513671875, -7.14990234375, -6.6484375, -6.14697265625, -5.6455078125, -5.14404296875, -4.642578125, -4.14111328125, -3.6396484375, -3.13818359375, -2.63671875, -2.13525390625, -1.6337890625, -1.13232421875, -0.630859375, -0.12939453125, 0.3720703125, 0.87353515625, 1.375, 1.87646484375, 2.3779296875, 2.87939453125, 3.380859375, 3.88232421875, 4.3837890625, 4.88525390625, 5.38671875, 5.88818359375, 6.3896484375, 6.89111328125, 7.392578125, 7.89404296875, 8.3955078125, 8.89697265625, 9.3984375, 9.89990234375, 10.4013671875, 10.90283203125, 11.404296875, 11.90576171875, 12.4072265625, 12.90869140625, 13.41015625, 13.91162109375, 14.4130859375, 14.91455078125, 15.416015625, 15.91748046875, 16.4189453125, 16.92041015625, 17.421875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 17.0, 19.0, 21.0, 26.0, 45.0, 68.0, 112.0, 142.0, 222.0, 258.0, 348.0, 470.0, 529.0, 492.0, 397.0, 273.0, 182.0, 138.0, 102.0, 67.0, 46.0, 26.0, 21.0, 18.0, 8.0, 6.0, 7.0, 5.0, 0.0, 2.0, 1.0], "bins": [-18.40625, -18.0013427734375, -17.596435546875, -17.1915283203125, -16.78662109375, -16.3817138671875, -15.976806640625, -15.5718994140625, -15.1669921875, -14.7620849609375, -14.357177734375, -13.9522705078125, -13.54736328125, -13.1424560546875, -12.737548828125, -12.3326416015625, -11.927734375, -11.5228271484375, -11.117919921875, -10.7130126953125, -10.30810546875, -9.9031982421875, -9.498291015625, -9.0933837890625, -8.6884765625, -8.2835693359375, -7.878662109375, -7.4737548828125, -7.06884765625, -6.6639404296875, -6.259033203125, -5.8541259765625, -5.44921875, -5.0443115234375, -4.639404296875, -4.2344970703125, -3.82958984375, -3.4246826171875, -3.019775390625, -2.6148681640625, -2.2099609375, -1.8050537109375, -1.400146484375, -0.9952392578125, -0.59033203125, -0.1854248046875, 0.219482421875, 0.6243896484375, 1.029296875, 1.4342041015625, 1.839111328125, 2.2440185546875, 2.64892578125, 3.0538330078125, 3.458740234375, 3.8636474609375, 4.2685546875, 4.6734619140625, 5.078369140625, 5.4832763671875, 5.88818359375, 6.2930908203125, 6.697998046875, 7.1029052734375, 7.5078125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 13.0, 16.0, 16.0, 30.0, 50.0, 84.0, 143.0, 250.0, 468.0, 1150.0, 3681.0, 33689.0, 2580226.0, 1546994.0, 22397.0, 3034.0, 1006.0, 440.0, 232.0, 139.0, 89.0, 49.0, 26.0, 21.0, 17.0, 6.0, 7.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.78125, -18.83642578125, -17.8916015625, -16.94677734375, -16.001953125, -15.05712890625, -14.1123046875, -13.16748046875, -12.22265625, -11.27783203125, -10.3330078125, -9.38818359375, -8.443359375, -7.49853515625, -6.5537109375, -5.60888671875, -4.6640625, -3.71923828125, -2.7744140625, -1.82958984375, -0.884765625, 0.06005859375, 1.0048828125, 1.94970703125, 2.89453125, 3.83935546875, 4.7841796875, 5.72900390625, 6.673828125, 7.61865234375, 8.5634765625, 9.50830078125, 10.453125, 11.39794921875, 12.3427734375, 13.28759765625, 14.232421875, 15.17724609375, 16.1220703125, 17.06689453125, 18.01171875, 18.95654296875, 19.9013671875, 20.84619140625, 21.791015625, 22.73583984375, 23.6806640625, 24.62548828125, 25.5703125, 26.51513671875, 27.4599609375, 28.40478515625, 29.349609375, 30.29443359375, 31.2392578125, 32.18408203125, 33.12890625, 34.07373046875, 35.0185546875, 35.96337890625, 36.908203125, 37.85302734375, 38.7978515625, 39.74267578125, 40.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 304.0, 647.0, 54.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-136.85989379882812, -124.69395446777344, -112.52802276611328, -100.36209106445312, -88.19615173339844, -76.03021240234375, -63.864280700683594, -51.69834899902344, -39.53240966796875, -27.366474151611328, -15.200538635253906, -3.0346031188964844, 9.131332397460938, 21.29726791381836, 33.46320343017578, 45.62913513183594, 57.795074462890625, 69.96101379394531, 82.12694549560547, 94.29287719726562, 106.45881652832031, 118.624755859375, 130.79067993164062, 142.9566192626953, 155.12255859375, 167.2884979248047, 179.45443725585938, 191.620361328125, 203.7863006591797, 215.95223999023438, 228.1181640625, 240.2841033935547, 252.45001220703125, 264.6159362792969, 276.7818908691406, 288.94781494140625, 301.11376953125, 313.2796936035156, 325.44561767578125, 337.611572265625, 349.7774963378906, 361.94342041015625, 374.109375, 386.2752990722656, 398.44122314453125, 410.607177734375, 422.7731018066406, 434.93902587890625, 447.10498046875, 459.2709045410156, 471.4368591308594, 483.602783203125, 495.76873779296875, 507.9346618652344, 520.1005859375, 532.2665405273438, 544.4324951171875, 556.5984497070312, 568.7643432617188, 580.9302978515625, 593.0962524414062, 605.2621459960938, 617.4281005859375, 629.5940551757812, 641.7599487304688]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 6.0, 11.0, 5.0, 7.0, 12.0, 10.0, 13.0, 18.0, 21.0, 22.0, 22.0, 29.0, 27.0, 27.0, 36.0, 42.0, 36.0, 38.0, 40.0, 48.0, 42.0, 44.0, 46.0, 33.0, 28.0, 46.0, 44.0, 20.0, 30.0, 27.0, 30.0, 21.0, 15.0, 17.0, 16.0, 20.0, 13.0, 4.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0], "bins": [-42.56147003173828, -41.305564880371094, -40.04965591430664, -38.79375076293945, -37.537845611572266, -36.28194046020508, -35.026031494140625, -33.77012634277344, -32.51422119140625, -31.25831413269043, -30.002408981323242, -28.746501922607422, -27.490596771240234, -26.234689712524414, -24.978782653808594, -23.722877502441406, -22.466970443725586, -21.211063385009766, -19.955158233642578, -18.699251174926758, -17.44334602355957, -16.18743896484375, -14.931532859802246, -13.675626754760742, -12.419720649719238, -11.163814544677734, -9.90790843963623, -8.652002334594727, -7.3960957527160645, -6.1401896476745605, -4.884283065795898, -3.6283769607543945, -2.3724708557128906, -1.1165646314620972, 0.1393415927886963, 1.3952479362487793, 2.651154041290283, 3.907060146331787, 5.162966728210449, 6.418872833251953, 7.674778938293457, 8.930685043334961, 10.186591148376465, 11.442497253417969, 12.698404312133789, 13.954309463500977, 15.210216522216797, 16.466121673583984, 17.722028732299805, 18.977935791015625, 20.233840942382812, 21.489748001098633, 22.74565315246582, 24.00156021118164, 25.257465362548828, 26.51337242126465, 27.76927947998047, 29.02518653869629, 30.281091690063477, 31.536998748779297, 32.792903900146484, 34.04880905151367, 35.304718017578125, 36.56062316894531, 37.8165283203125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 3.0, 8.0, 6.0, 12.0, 8.0, 11.0, 6.0, 10.0, 12.0, 16.0, 21.0, 16.0, 20.0, 27.0, 28.0, 31.0, 37.0, 36.0, 43.0, 43.0, 40.0, 43.0, 52.0, 47.0, 36.0, 43.0, 31.0, 41.0, 39.0, 36.0, 33.0, 31.0, 17.0, 12.0, 17.0, 13.0, 23.0, 11.0, 9.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76898193359375, -4.6043701171875, -4.43975830078125, -4.275146484375, -4.11053466796875, -3.9459228515625, -3.78131103515625, -3.61669921875, -3.45208740234375, -3.2874755859375, -3.12286376953125, -2.958251953125, -2.79364013671875, -2.6290283203125, -2.46441650390625, -2.2998046875, -2.13519287109375, -1.9705810546875, -1.80596923828125, -1.641357421875, -1.47674560546875, -1.3121337890625, -1.14752197265625, -0.98291015625, -0.81829833984375, -0.6536865234375, -0.48907470703125, -0.324462890625, -0.15985107421875, 0.0047607421875, 0.16937255859375, 0.333984375, 0.49859619140625, 0.6632080078125, 0.82781982421875, 0.992431640625, 1.15704345703125, 1.3216552734375, 1.48626708984375, 1.65087890625, 1.81549072265625, 1.9801025390625, 2.14471435546875, 2.309326171875, 2.47393798828125, 2.6385498046875, 2.80316162109375, 2.9677734375, 3.13238525390625, 3.2969970703125, 3.46160888671875, 3.626220703125, 3.79083251953125, 3.9554443359375, 4.12005615234375, 4.28466796875, 4.44927978515625, 4.6138916015625, 4.77850341796875, 4.943115234375, 5.10772705078125, 5.2723388671875, 5.43695068359375, 5.6015625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 11.0, 11.0, 25.0, 29.0, 55.0, 68.0, 136.0, 214.0, 245.0, 321.0, 531.0, 705.0, 1046.0, 1590.0, 2387.0, 3268.0, 5032.0, 7520.0, 11018.0, 16601.0, 24360.0, 36936.0, 54771.0, 79138.0, 109274.0, 138176.0, 144773.0, 122046.0, 91667.0, 63848.0, 43987.0, 29301.0, 19442.0, 12943.0, 8567.0, 5855.0, 3938.0, 2769.0, 1894.0, 1304.0, 810.0, 634.0, 389.0, 304.0, 200.0, 138.0, 88.0, 64.0, 42.0, 30.0, 22.0, 10.0, 5.0, 6.0, 2.0, 4.0, 5.0], "bins": [-0.52978515625, -0.5138320922851562, -0.4978790283203125, -0.48192596435546875, -0.465972900390625, -0.45001983642578125, -0.4340667724609375, -0.41811370849609375, -0.40216064453125, -0.38620758056640625, -0.3702545166015625, -0.35430145263671875, -0.338348388671875, -0.32239532470703125, -0.3064422607421875, -0.29048919677734375, -0.2745361328125, -0.25858306884765625, -0.2426300048828125, -0.22667694091796875, -0.210723876953125, -0.19477081298828125, -0.1788177490234375, -0.16286468505859375, -0.14691162109375, -0.13095855712890625, -0.1150054931640625, -0.09905242919921875, -0.083099365234375, -0.06714630126953125, -0.0511932373046875, -0.03524017333984375, -0.019287109375, -0.00333404541015625, 0.0126190185546875, 0.02857208251953125, 0.044525146484375, 0.06047821044921875, 0.0764312744140625, 0.09238433837890625, 0.10833740234375, 0.12429046630859375, 0.1402435302734375, 0.15619659423828125, 0.172149658203125, 0.18810272216796875, 0.2040557861328125, 0.22000885009765625, 0.2359619140625, 0.25191497802734375, 0.2678680419921875, 0.28382110595703125, 0.299774169921875, 0.31572723388671875, 0.3316802978515625, 0.34763336181640625, 0.36358642578125, 0.37953948974609375, 0.3954925537109375, 0.41144561767578125, 0.427398681640625, 0.44335174560546875, 0.4593048095703125, 0.47525787353515625, 0.4912109375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 9.0, 5.0, 12.0, 6.0, 6.0, 12.0, 13.0, 22.0, 27.0, 19.0, 29.0, 27.0, 26.0, 43.0, 39.0, 48.0, 33.0, 46.0, 38.0, 1065.0, 48.0, 45.0, 39.0, 34.0, 30.0, 39.0, 31.0, 39.0, 35.0, 26.0, 32.0, 14.0, 11.0, 12.0, 10.0, 17.0, 9.0, 12.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.798828125, -3.685089111328125, -3.57135009765625, -3.457611083984375, -3.3438720703125, -3.230133056640625, -3.11639404296875, -3.002655029296875, -2.888916015625, -2.775177001953125, -2.66143798828125, -2.547698974609375, -2.4339599609375, -2.320220947265625, -2.20648193359375, -2.092742919921875, -1.97900390625, -1.865264892578125, -1.75152587890625, -1.637786865234375, -1.5240478515625, -1.410308837890625, -1.29656982421875, -1.182830810546875, -1.069091796875, -0.955352783203125, -0.84161376953125, -0.727874755859375, -0.6141357421875, -0.500396728515625, -0.38665771484375, -0.272918701171875, -0.1591796875, -0.045440673828125, 0.06829833984375, 0.182037353515625, 0.2957763671875, 0.409515380859375, 0.52325439453125, 0.636993408203125, 0.750732421875, 0.864471435546875, 0.97821044921875, 1.091949462890625, 1.2056884765625, 1.319427490234375, 1.43316650390625, 1.546905517578125, 1.66064453125, 1.774383544921875, 1.88812255859375, 2.001861572265625, 2.1156005859375, 2.229339599609375, 2.34307861328125, 2.456817626953125, 2.570556640625, 2.684295654296875, 2.79803466796875, 2.911773681640625, 3.0255126953125, 3.139251708984375, 3.25299072265625, 3.366729736328125, 3.48046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 24.0, 24.0, 36.0, 45.0, 79.0, 121.0, 168.0, 314.0, 407.0, 679.0, 1061.0, 1631.0, 2546.0, 3959.0, 6613.0, 10285.0, 16459.0, 26198.0, 40201.0, 60862.0, 90007.0, 123793.0, 1093859.0, 251701.0, 118902.0, 85366.0, 57879.0, 37934.0, 24233.0, 15553.0, 9800.0, 6125.0, 3701.0, 2413.0, 1500.0, 908.0, 589.0, 386.0, 260.0, 173.0, 116.0, 66.0, 50.0, 40.0, 17.0, 17.0, 9.0, 10.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.42822265625, -0.4152183532714844, -0.40221405029296875, -0.3892097473144531, -0.3762054443359375, -0.3632011413574219, -0.35019683837890625, -0.3371925354003906, -0.324188232421875, -0.3111839294433594, -0.29817962646484375, -0.2851753234863281, -0.2721710205078125, -0.2591667175292969, -0.24616241455078125, -0.23315811157226562, -0.22015380859375, -0.20714950561523438, -0.19414520263671875, -0.18114089965820312, -0.1681365966796875, -0.15513229370117188, -0.14212799072265625, -0.12912368774414062, -0.116119384765625, -0.10311508178710938, -0.09011077880859375, -0.07710647583007812, -0.0641021728515625, -0.051097869873046875, -0.03809356689453125, -0.025089263916015625, -0.0120849609375, 0.000919342041015625, 0.01392364501953125, 0.026927947998046875, 0.0399322509765625, 0.052936553955078125, 0.06594085693359375, 0.07894515991210938, 0.091949462890625, 0.10495376586914062, 0.11795806884765625, 0.13096237182617188, 0.1439666748046875, 0.15697097778320312, 0.16997528076171875, 0.18297958374023438, 0.19598388671875, 0.20898818969726562, 0.22199249267578125, 0.23499679565429688, 0.2480010986328125, 0.2610054016113281, 0.27400970458984375, 0.2870140075683594, 0.300018310546875, 0.3130226135253906, 0.32602691650390625, 0.3390312194824219, 0.3520355224609375, 0.3650398254394531, 0.37804412841796875, 0.3910484313964844, 0.404052734375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 6.0, 15.0, 15.0, 15.0, 27.0, 34.0, 40.0, 64.0, 61.0, 85.0, 76.0, 81.0, 83.0, 72.0, 66.0, 42.0, 43.0, 38.0, 25.0, 14.0, 17.0, 10.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01157379150390625, -0.011189818382263184, -0.010805845260620117, -0.01042187213897705, -0.010037899017333984, -0.009653925895690918, -0.009269952774047852, -0.008885979652404785, -0.008502006530761719, -0.008118033409118652, -0.007734060287475586, -0.0073500871658325195, -0.006966114044189453, -0.006582140922546387, -0.00619816780090332, -0.005814194679260254, -0.0054302215576171875, -0.005046248435974121, -0.004662275314331055, -0.004278302192687988, -0.003894329071044922, -0.0035103559494018555, -0.003126382827758789, -0.0027424097061157227, -0.0023584365844726562, -0.00197446346282959, -0.0015904903411865234, -0.001206517219543457, -0.0008225440979003906, -0.0004385709762573242, -5.459785461425781e-05, 0.0003293752670288086, 0.000713348388671875, 0.0010973215103149414, 0.0014812946319580078, 0.0018652677536010742, 0.0022492408752441406, 0.002633213996887207, 0.0030171871185302734, 0.00340116024017334, 0.0037851333618164062, 0.004169106483459473, 0.004553079605102539, 0.0049370527267456055, 0.005321025848388672, 0.005704998970031738, 0.006088972091674805, 0.006472945213317871, 0.0068569183349609375, 0.007240891456604004, 0.00762486457824707, 0.008008837699890137, 0.008392810821533203, 0.00877678394317627, 0.009160757064819336, 0.009544730186462402, 0.009928703308105469, 0.010312676429748535, 0.010696649551391602, 0.011080622673034668, 0.011464595794677734, 0.0118485689163208, 0.012232542037963867, 0.012616515159606934, 0.01300048828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 7.0, 13.0, 13.0, 11.0, 15.0, 27.0, 37.0, 49.0, 74.0, 88.0, 135.0, 211.0, 369.0, 622.0, 1564.0, 956303.0, 86514.0, 1053.0, 513.0, 282.0, 184.0, 131.0, 71.0, 66.0, 33.0, 35.0, 21.0, 27.0, 16.0, 8.0, 10.0, 8.0, 7.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.227783203125, -0.2210559844970703, -0.21432876586914062, -0.20760154724121094, -0.20087432861328125, -0.19414710998535156, -0.18741989135742188, -0.1806926727294922, -0.1739654541015625, -0.1672382354736328, -0.16051101684570312, -0.15378379821777344, -0.14705657958984375, -0.14032936096191406, -0.13360214233398438, -0.1268749237060547, -0.120147705078125, -0.11342048645019531, -0.10669326782226562, -0.09996604919433594, -0.09323883056640625, -0.08651161193847656, -0.07978439331054688, -0.07305717468261719, -0.0663299560546875, -0.05960273742675781, -0.052875518798828125, -0.04614830017089844, -0.03942108154296875, -0.03269386291503906, -0.025966644287109375, -0.019239425659179688, -0.01251220703125, -0.0057849884033203125, 0.000942230224609375, 0.0076694488525390625, 0.01439666748046875, 0.021123886108398438, 0.027851104736328125, 0.03457832336425781, 0.0413055419921875, 0.04803276062011719, 0.054759979248046875, 0.06148719787597656, 0.06821441650390625, 0.07494163513183594, 0.08166885375976562, 0.08839607238769531, 0.095123291015625, 0.10185050964355469, 0.10857772827148438, 0.11530494689941406, 0.12203216552734375, 0.12875938415527344, 0.13548660278320312, 0.1422138214111328, 0.1489410400390625, 0.1556682586669922, 0.16239547729492188, 0.16912269592285156, 0.17584991455078125, 0.18257713317871094, 0.18930435180664062, 0.1960315704345703, 0.2027587890625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 726.0, 286.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18916285037994385, -0.184042289853096, -0.17892172932624817, -0.17380118370056152, -0.16868062317371368, -0.16356006264686584, -0.1584395170211792, -0.15331895649433136, -0.14819839596748352, -0.14307783544063568, -0.13795727491378784, -0.1328367292881012, -0.12771616876125336, -0.12259560823440552, -0.11747505515813828, -0.11235450208187103, -0.1072339415550232, -0.10211338102817535, -0.09699282795190811, -0.09187227487564087, -0.08675171434879303, -0.08163115382194519, -0.07651060074567795, -0.0713900476694107, -0.06626948714256287, -0.061148930341005325, -0.056028373539447784, -0.050907816737890244, -0.0457872599363327, -0.04066670313477516, -0.03554614633321762, -0.03042558953166008, -0.02530503273010254, -0.020184475928544998, -0.015063919126987457, -0.009943362325429916, -0.0048228055238723755, 0.0002977512776851654, 0.005418308079242706, 0.010538864880800247, 0.015659421682357788, 0.02077997848391533, 0.02590053528547287, 0.03102109208703041, 0.03614164888858795, 0.04126220569014549, 0.04638276249170303, 0.051503319293260574, 0.056623876094818115, 0.061744432896375656, 0.0668649896979332, 0.07198554277420044, 0.07710610330104828, 0.08222666382789612, 0.08734721690416336, 0.0924677699804306, 0.09758833050727844, 0.10270889103412628, 0.10782944411039352, 0.11294999718666077, 0.1180705577135086, 0.12319111824035645, 0.1283116638660431, 0.13343222439289093, 0.13855278491973877]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 8.0, 17.0, 27.0, 22.0, 42.0, 54.0, 34.0, 60.0, 52.0, 65.0, 71.0, 63.0, 50.0, 70.0, 73.0, 36.0, 56.0, 45.0, 35.0, 27.0, 19.0, 21.0, 13.0, 6.0, 4.0, 6.0, 5.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.018456220626831055, -0.017981894314289093, -0.01750756800174713, -0.01703324168920517, -0.016558915376663208, -0.016084589064121246, -0.015610262751579285, -0.015135936439037323, -0.014661610126495361, -0.0141872838139534, -0.013712957501411438, -0.013238631188869476, -0.012764304876327515, -0.012289978563785553, -0.011815652251243591, -0.01134132593870163, -0.010866999626159668, -0.010392673313617706, -0.009918347001075745, -0.009444020688533783, -0.008969694375991821, -0.00849536806344986, -0.008021041750907898, -0.007546715438365936, -0.007072389125823975, -0.006598062813282013, -0.006123736500740051, -0.00564941018819809, -0.005175083875656128, -0.004700757563114166, -0.004226431250572205, -0.003752104938030243, -0.0032777786254882812, -0.0028034523129463196, -0.002329126000404358, -0.0018547996878623962, -0.0013804733753204346, -0.0009061470627784729, -0.00043182075023651123, 4.250556230545044e-05, 0.0005168318748474121, 0.0009911581873893738, 0.0014654844999313354, 0.0019398108124732971, 0.002414137125015259, 0.0028884634375572205, 0.003362789750099182, 0.003837116062641144, 0.0043114423751831055, 0.004785768687725067, 0.005260095000267029, 0.0057344213128089905, 0.006208747625350952, 0.006683073937892914, 0.0071574002504348755, 0.007631726562976837, 0.008106052875518799, 0.00858037918806076, 0.009054705500602722, 0.009529031813144684, 0.010003358125686646, 0.010477684438228607, 0.010952010750770569, 0.01142633706331253, 0.011900663375854492]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 3.0, 7.0, 7.0, 12.0, 8.0, 11.0, 6.0, 10.0, 12.0, 16.0, 21.0, 16.0, 20.0, 27.0, 28.0, 31.0, 37.0, 36.0, 43.0, 43.0, 40.0, 43.0, 52.0, 47.0, 36.0, 43.0, 32.0, 41.0, 38.0, 37.0, 32.0, 31.0, 17.0, 12.0, 17.0, 13.0, 23.0, 11.0, 9.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76898193359375, -4.6043701171875, -4.43975830078125, -4.275146484375, -4.11053466796875, -3.9459228515625, -3.78131103515625, -3.61669921875, -3.45208740234375, -3.2874755859375, -3.12286376953125, -2.958251953125, -2.79364013671875, -2.6290283203125, -2.46441650390625, -2.2998046875, -2.13519287109375, -1.9705810546875, -1.80596923828125, -1.641357421875, -1.47674560546875, -1.3121337890625, -1.14752197265625, -0.98291015625, -0.81829833984375, -0.6536865234375, -0.48907470703125, -0.324462890625, -0.15985107421875, 0.0047607421875, 0.16937255859375, 0.333984375, 0.49859619140625, 0.6632080078125, 0.82781982421875, 0.992431640625, 1.15704345703125, 1.3216552734375, 1.48626708984375, 1.65087890625, 1.81549072265625, 1.9801025390625, 2.14471435546875, 2.309326171875, 2.47393798828125, 2.6385498046875, 2.80316162109375, 2.9677734375, 3.13238525390625, 3.2969970703125, 3.46160888671875, 3.626220703125, 3.79083251953125, 3.9554443359375, 4.12005615234375, 4.28466796875, 4.44927978515625, 4.6138916015625, 4.77850341796875, 4.943115234375, 5.10772705078125, 5.2723388671875, 5.43695068359375, 5.6015625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 8.0, 6.0, 9.0, 12.0, 14.0, 21.0, 31.0, 31.0, 40.0, 26.0, 51.0, 70.0, 77.0, 114.0, 173.0, 196.0, 253.0, 400.0, 493.0, 764.0, 1291.0, 2383.0, 5482.0, 17218.0, 72136.0, 360406.0, 453109.0, 97799.0, 22187.0, 6727.0, 2706.0, 1401.0, 781.0, 529.0, 412.0, 282.0, 197.0, 160.0, 131.0, 117.0, 82.0, 58.0, 45.0, 46.0, 26.0, 19.0, 11.0, 7.0, 8.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-8.453125, -8.1812744140625, -7.909423828125, -7.6375732421875, -7.36572265625, -7.0938720703125, -6.822021484375, -6.5501708984375, -6.2783203125, -6.0064697265625, -5.734619140625, -5.4627685546875, -5.19091796875, -4.9190673828125, -4.647216796875, -4.3753662109375, -4.103515625, -3.8316650390625, -3.559814453125, -3.2879638671875, -3.01611328125, -2.7442626953125, -2.472412109375, -2.2005615234375, -1.9287109375, -1.6568603515625, -1.385009765625, -1.1131591796875, -0.84130859375, -0.5694580078125, -0.297607421875, -0.0257568359375, 0.24609375, 0.5179443359375, 0.789794921875, 1.0616455078125, 1.33349609375, 1.6053466796875, 1.877197265625, 2.1490478515625, 2.4208984375, 2.6927490234375, 2.964599609375, 3.2364501953125, 3.50830078125, 3.7801513671875, 4.052001953125, 4.3238525390625, 4.595703125, 4.8675537109375, 5.139404296875, 5.4112548828125, 5.68310546875, 5.9549560546875, 6.226806640625, 6.4986572265625, 6.7705078125, 7.0423583984375, 7.314208984375, 7.5860595703125, 7.85791015625, 8.1297607421875, 8.401611328125, 8.6734619140625, 8.9453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 8.0, 5.0, 4.0, 13.0, 13.0, 19.0, 21.0, 25.0, 27.0, 36.0, 38.0, 50.0, 66.0, 101.0, 151.0, 399.0, 1460.0, 164.0, 100.0, 64.0, 49.0, 53.0, 28.0, 29.0, 25.0, 14.0, 15.0, 15.0, 7.0, 5.0, 9.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.484375, -15.953125, -15.421875, -14.890625, -14.359375, -13.828125, -13.296875, -12.765625, -12.234375, -11.703125, -11.171875, -10.640625, -10.109375, -9.578125, -9.046875, -8.515625, -7.984375, -7.453125, -6.921875, -6.390625, -5.859375, -5.328125, -4.796875, -4.265625, -3.734375, -3.203125, -2.671875, -2.140625, -1.609375, -1.078125, -0.546875, -0.015625, 0.515625, 1.046875, 1.578125, 2.109375, 2.640625, 3.171875, 3.703125, 4.234375, 4.765625, 5.296875, 5.828125, 6.359375, 6.890625, 7.421875, 7.953125, 8.484375, 9.015625, 9.546875, 10.078125, 10.609375, 11.140625, 11.671875, 12.203125, 12.734375, 13.265625, 13.796875, 14.328125, 14.859375, 15.390625, 15.921875, 16.453125, 16.984375, 17.515625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 9.0, 18.0, 6.0, 19.0, 29.0, 41.0, 48.0, 82.0, 131.0, 134.0, 238.0, 552.0, 1806.0, 25748.0, 3095216.0, 18678.0, 1575.0, 514.0, 254.0, 183.0, 111.0, 85.0, 58.0, 49.0, 21.0, 27.0, 16.0, 11.0, 9.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.9375, -37.77392578125, -36.6103515625, -35.44677734375, -34.283203125, -33.11962890625, -31.9560546875, -30.79248046875, -29.62890625, -28.46533203125, -27.3017578125, -26.13818359375, -24.974609375, -23.81103515625, -22.6474609375, -21.48388671875, -20.3203125, -19.15673828125, -17.9931640625, -16.82958984375, -15.666015625, -14.50244140625, -13.3388671875, -12.17529296875, -11.01171875, -9.84814453125, -8.6845703125, -7.52099609375, -6.357421875, -5.19384765625, -4.0302734375, -2.86669921875, -1.703125, -0.53955078125, 0.6240234375, 1.78759765625, 2.951171875, 4.11474609375, 5.2783203125, 6.44189453125, 7.60546875, 8.76904296875, 9.9326171875, 11.09619140625, 12.259765625, 13.42333984375, 14.5869140625, 15.75048828125, 16.9140625, 18.07763671875, 19.2412109375, 20.40478515625, 21.568359375, 22.73193359375, 23.8955078125, 25.05908203125, 26.22265625, 27.38623046875, 28.5498046875, 29.71337890625, 30.876953125, 32.04052734375, 33.2041015625, 34.36767578125, 35.53125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 59.0, 455.0, 459.0, 35.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.66342163085938, -64.0647964477539, -59.46617126464844, -54.8675422668457, -50.268917083740234, -45.670291900634766, -41.07166290283203, -36.47303771972656, -31.874412536621094, -27.275787353515625, -22.677160263061523, -18.078533172607422, -13.479907989501953, -8.881282806396484, -4.282655715942383, 0.31597137451171875, 4.9145965576171875, 9.513222694396973, 14.111848831176758, 18.71047592163086, 23.309101104736328, 27.907726287841797, 32.50635528564453, 37.10498046875, 41.70360565185547, 46.30223083496094, 50.900856018066406, 55.49948501586914, 60.09811019897461, 64.69673156738281, 69.29536437988281, 73.89398956298828, 78.49263000488281, 83.09125518798828, 87.68988037109375, 92.28850555419922, 96.88713073730469, 101.48576354980469, 106.08438873291016, 110.68301391601562, 115.2816390991211, 119.88026428222656, 124.47888946533203, 129.0775146484375, 133.6761474609375, 138.27476501464844, 142.87339782714844, 147.47201538085938, 152.07064819335938, 156.66928100585938, 161.2678985595703, 165.8665313720703, 170.46514892578125, 175.06378173828125, 179.6623992919922, 184.2610321044922, 188.85964965820312, 193.45828247070312, 198.05690002441406, 202.65553283691406, 207.254150390625, 211.852783203125, 216.45140075683594, 221.05003356933594, 225.64866638183594]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 4.0, 5.0, 6.0, 9.0, 11.0, 14.0, 21.0, 25.0, 18.0, 26.0, 31.0, 36.0, 28.0, 38.0, 46.0, 44.0, 49.0, 37.0, 40.0, 40.0, 30.0, 36.0, 39.0, 40.0, 41.0, 42.0, 32.0, 36.0, 28.0, 28.0, 15.0, 15.0, 22.0, 14.0, 10.0, 10.0, 4.0, 8.0, 5.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.162355422973633, -30.059326171875, -28.956296920776367, -27.853267669677734, -26.75023651123047, -25.64720916748047, -24.544178009033203, -23.44114875793457, -22.338119506835938, -21.235090255737305, -20.132061004638672, -19.02903175354004, -17.926002502441406, -16.82297134399414, -15.719942092895508, -14.616912841796875, -13.513883590698242, -12.41085433959961, -11.307825088500977, -10.204794883728027, -9.101765632629395, -7.998736381530762, -6.895706653594971, -5.79267692565918, -4.689647674560547, -3.586618185043335, -2.483588695526123, -1.3805592060089111, -0.2775297164916992, 0.8254995346069336, 1.9285292625427246, 3.0315589904785156, 4.134590148925781, 5.237619400024414, 6.340649127960205, 7.443678855895996, 8.546708106994629, 9.649737358093262, 10.752767562866211, 11.855796813964844, 12.958826065063477, 14.06185531616211, 15.164884567260742, 16.267913818359375, 17.37094497680664, 18.47397232055664, 19.577003479003906, 20.68003273010254, 21.783061981201172, 22.886091232299805, 23.989120483398438, 25.09214973449707, 26.195178985595703, 27.29821014404297, 28.4012393951416, 29.504268646240234, 30.607297897338867, 31.7103271484375, 32.813358306884766, 33.916385650634766, 35.01941680908203, 36.12244415283203, 37.2254753112793, 38.32850646972656, 39.43153381347656]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 5.0, 9.0, 8.0, 14.0, 8.0, 9.0, 18.0, 16.0, 18.0, 20.0, 21.0, 26.0, 38.0, 30.0, 42.0, 34.0, 34.0, 38.0, 49.0, 46.0, 48.0, 50.0, 42.0, 34.0, 27.0, 37.0, 34.0, 26.0, 23.0, 27.0, 19.0, 21.0, 16.0, 14.0, 14.0, 11.0, 8.0, 6.0, 11.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.2265625, -6.04150390625, -5.8564453125, -5.67138671875, -5.486328125, -5.30126953125, -5.1162109375, -4.93115234375, -4.74609375, -4.56103515625, -4.3759765625, -4.19091796875, -4.005859375, -3.82080078125, -3.6357421875, -3.45068359375, -3.265625, -3.08056640625, -2.8955078125, -2.71044921875, -2.525390625, -2.34033203125, -2.1552734375, -1.97021484375, -1.78515625, -1.60009765625, -1.4150390625, -1.22998046875, -1.044921875, -0.85986328125, -0.6748046875, -0.48974609375, -0.3046875, -0.11962890625, 0.0654296875, 0.25048828125, 0.435546875, 0.62060546875, 0.8056640625, 0.99072265625, 1.17578125, 1.36083984375, 1.5458984375, 1.73095703125, 1.916015625, 2.10107421875, 2.2861328125, 2.47119140625, 2.65625, 2.84130859375, 3.0263671875, 3.21142578125, 3.396484375, 3.58154296875, 3.7666015625, 3.95166015625, 4.13671875, 4.32177734375, 4.5068359375, 4.69189453125, 4.876953125, 5.06201171875, 5.2470703125, 5.43212890625, 5.6171875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 6.0, 5.0, 10.0, 15.0, 13.0, 16.0, 24.0, 25.0, 41.0, 63.0, 81.0, 108.0, 146.0, 184.0, 288.0, 388.0, 548.0, 990.0, 2071.0, 10068.0, 219963.0, 3385504.0, 550807.0, 16845.0, 2713.0, 1160.0, 671.0, 416.0, 292.0, 220.0, 162.0, 102.0, 82.0, 42.0, 45.0, 34.0, 24.0, 24.0, 24.0, 10.0, 7.0, 6.0, 5.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-33.5625, -32.6201171875, -31.677734375, -30.7353515625, -29.79296875, -28.8505859375, -27.908203125, -26.9658203125, -26.0234375, -25.0810546875, -24.138671875, -23.1962890625, -22.25390625, -21.3115234375, -20.369140625, -19.4267578125, -18.484375, -17.5419921875, -16.599609375, -15.6572265625, -14.71484375, -13.7724609375, -12.830078125, -11.8876953125, -10.9453125, -10.0029296875, -9.060546875, -8.1181640625, -7.17578125, -6.2333984375, -5.291015625, -4.3486328125, -3.40625, -2.4638671875, -1.521484375, -0.5791015625, 0.36328125, 1.3056640625, 2.248046875, 3.1904296875, 4.1328125, 5.0751953125, 6.017578125, 6.9599609375, 7.90234375, 8.8447265625, 9.787109375, 10.7294921875, 11.671875, 12.6142578125, 13.556640625, 14.4990234375, 15.44140625, 16.3837890625, 17.326171875, 18.2685546875, 19.2109375, 20.1533203125, 21.095703125, 22.0380859375, 22.98046875, 23.9228515625, 24.865234375, 25.8076171875, 26.75]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 4.0, 11.0, 20.0, 44.0, 57.0, 59.0, 98.0, 139.0, 202.0, 288.0, 403.0, 442.0, 525.0, 450.0, 374.0, 271.0, 204.0, 131.0, 115.0, 75.0, 54.0, 37.0, 21.0, 13.0, 8.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.875, -11.486328125, -11.09765625, -10.708984375, -10.3203125, -9.931640625, -9.54296875, -9.154296875, -8.765625, -8.376953125, -7.98828125, -7.599609375, -7.2109375, -6.822265625, -6.43359375, -6.044921875, -5.65625, -5.267578125, -4.87890625, -4.490234375, -4.1015625, -3.712890625, -3.32421875, -2.935546875, -2.546875, -2.158203125, -1.76953125, -1.380859375, -0.9921875, -0.603515625, -0.21484375, 0.173828125, 0.5625, 0.951171875, 1.33984375, 1.728515625, 2.1171875, 2.505859375, 2.89453125, 3.283203125, 3.671875, 4.060546875, 4.44921875, 4.837890625, 5.2265625, 5.615234375, 6.00390625, 6.392578125, 6.78125, 7.169921875, 7.55859375, 7.947265625, 8.3359375, 8.724609375, 9.11328125, 9.501953125, 9.890625, 10.279296875, 10.66796875, 11.056640625, 11.4453125, 11.833984375, 12.22265625, 12.611328125, 13.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 35.0, 58.0, 101.0, 295.0, 766.0, 2912.0, 26519.0, 1357101.0, 2741643.0, 58976.0, 4294.0, 1057.0, 322.0, 116.0, 35.0, 19.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-31.78125, -30.96875, -30.15625, -29.34375, -28.53125, -27.71875, -26.90625, -26.09375, -25.28125, -24.46875, -23.65625, -22.84375, -22.03125, -21.21875, -20.40625, -19.59375, -18.78125, -17.96875, -17.15625, -16.34375, -15.53125, -14.71875, -13.90625, -13.09375, -12.28125, -11.46875, -10.65625, -9.84375, -9.03125, -8.21875, -7.40625, -6.59375, -5.78125, -4.96875, -4.15625, -3.34375, -2.53125, -1.71875, -0.90625, -0.09375, 0.71875, 1.53125, 2.34375, 3.15625, 3.96875, 4.78125, 5.59375, 6.40625, 7.21875, 8.03125, 8.84375, 9.65625, 10.46875, 11.28125, 12.09375, 12.90625, 13.71875, 14.53125, 15.34375, 16.15625, 16.96875, 17.78125, 18.59375, 19.40625, 20.21875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 10.0, 8.0, 15.0, 20.0, 33.0, 48.0, 40.0, 65.0, 51.0, 66.0, 77.0, 85.0, 72.0, 77.0, 63.0, 52.0, 53.0, 35.0, 26.0, 34.0, 12.0, 17.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.35721206665039, -46.113197326660156, -43.869178771972656, -41.62516403198242, -39.38114547729492, -37.13713073730469, -34.89311218261719, -32.64909744262695, -30.405080795288086, -28.16106414794922, -25.91704750061035, -23.673030853271484, -21.42901611328125, -19.18499755859375, -16.940982818603516, -14.696966171264648, -12.452949523925781, -10.208932876586914, -7.964916706085205, -5.720900535583496, -3.476883888244629, -1.2328672409057617, 1.011148452758789, 3.2551651000976562, 5.499181747436523, 7.743198394775391, 9.987215042114258, 12.231230735778809, 14.475247383117676, 16.71926498413086, 18.963279724121094, 21.20729637145996, 23.451309204101562, 25.69532585144043, 27.939342498779297, 30.18335723876953, 32.42737579345703, 34.671390533447266, 36.9154052734375, 39.159423828125, 41.4034423828125, 43.647457122802734, 45.891475677490234, 48.13549041748047, 50.37950897216797, 52.6235237121582, 54.86753845214844, 57.11155700683594, 59.35557174682617, 61.599586486816406, 63.843605041503906, 66.0876235961914, 68.33163452148438, 70.57565307617188, 72.81967163085938, 75.06369018554688, 77.30770111083984, 79.55171966552734, 81.79573059082031, 84.03974914550781, 86.28376770019531, 88.52778625488281, 90.77179718017578, 93.01581573486328, 95.25983428955078]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 2.0, 10.0, 8.0, 5.0, 7.0, 12.0, 16.0, 20.0, 12.0, 23.0, 26.0, 32.0, 27.0, 28.0, 37.0, 44.0, 38.0, 50.0, 35.0, 32.0, 29.0, 38.0, 47.0, 38.0, 38.0, 44.0, 37.0, 30.0, 38.0, 30.0, 28.0, 22.0, 15.0, 25.0, 12.0, 8.0, 9.0, 2.0, 7.0, 10.0, 6.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-49.04084014892578, -47.628089904785156, -46.2153434753418, -44.80259704589844, -43.38984680175781, -41.97709655761719, -40.56435012817383, -39.15160369873047, -37.738853454589844, -36.32610321044922, -34.91335678100586, -33.5006103515625, -32.087860107421875, -30.675111770629883, -29.26236343383789, -27.8496150970459, -26.436866760253906, -25.024118423461914, -23.611370086669922, -22.19862174987793, -20.785873413085938, -19.373125076293945, -17.960376739501953, -16.54762840270996, -15.134880065917969, -13.722131729125977, -12.309383392333984, -10.896635055541992, -9.48388671875, -8.071138381958008, -6.658390045166016, -5.245641708374023, -3.8328933715820312, -2.420145034790039, -1.0073966979980469, 0.4053516387939453, 1.8180999755859375, 3.2308483123779297, 4.643596649169922, 6.056344985961914, 7.469093322753906, 8.881841659545898, 10.29458999633789, 11.707338333129883, 13.120086669921875, 14.532835006713867, 15.94558334350586, 17.35833168029785, 18.771080017089844, 20.183828353881836, 21.596576690673828, 23.00932502746582, 24.422073364257812, 25.834821701049805, 27.247570037841797, 28.66031837463379, 30.07306671142578, 31.485815048217773, 32.898563385009766, 34.311309814453125, 35.72406005859375, 37.136810302734375, 38.549556732177734, 39.962303161621094, 41.37505340576172]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 4.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 6.0, 13.0, 12.0, 13.0, 14.0, 14.0, 29.0, 19.0, 26.0, 33.0, 31.0, 46.0, 44.0, 39.0, 36.0, 29.0, 38.0, 48.0, 44.0, 46.0, 47.0, 32.0, 34.0, 39.0, 28.0, 23.0, 35.0, 24.0, 23.0, 24.0, 12.0, 16.0, 10.0, 6.0, 4.0, 7.0, 5.0, 3.0, 5.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-90.0625, -87.51953125, -84.9765625, -82.43359375, -79.890625, -77.34765625, -74.8046875, -72.26171875, -69.71875, -67.17578125, -64.6328125, -62.08984375, -59.546875, -57.00390625, -54.4609375, -51.91796875, -49.375, -46.83203125, -44.2890625, -41.74609375, -39.203125, -36.66015625, -34.1171875, -31.57421875, -29.03125, -26.48828125, -23.9453125, -21.40234375, -18.859375, -16.31640625, -13.7734375, -11.23046875, -8.6875, -6.14453125, -3.6015625, -1.05859375, 1.484375, 4.02734375, 6.5703125, 9.11328125, 11.65625, 14.19921875, 16.7421875, 19.28515625, 21.828125, 24.37109375, 26.9140625, 29.45703125, 32.0, 34.54296875, 37.0859375, 39.62890625, 42.171875, 44.71484375, 47.2578125, 49.80078125, 52.34375, 54.88671875, 57.4296875, 59.97265625, 62.515625, 65.05859375, 67.6015625, 70.14453125, 72.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 9.0, 12.0, 18.0, 32.0, 46.0, 73.0, 124.0, 189.0, 307.0, 470.0, 731.0, 1070.0, 1594.0, 2652.0, 4084.0, 6362.0, 9750.0, 15296.0, 23912.0, 36830.0, 55042.0, 80949.0, 112112.0, 141199.0, 147076.0, 125421.0, 93491.0, 65448.0, 43972.0, 28611.0, 18610.0, 11883.0, 7702.0, 4803.0, 3153.0, 1958.0, 1275.0, 844.0, 491.0, 323.0, 226.0, 141.0, 103.0, 57.0, 39.0, 29.0, 16.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.01953125, -6.80816650390625, -6.5968017578125, -6.38543701171875, -6.174072265625, -5.96270751953125, -5.7513427734375, -5.53997802734375, -5.32861328125, -5.11724853515625, -4.9058837890625, -4.69451904296875, -4.483154296875, -4.27178955078125, -4.0604248046875, -3.84906005859375, -3.6376953125, -3.42633056640625, -3.2149658203125, -3.00360107421875, -2.792236328125, -2.58087158203125, -2.3695068359375, -2.15814208984375, -1.94677734375, -1.73541259765625, -1.5240478515625, -1.31268310546875, -1.101318359375, -0.88995361328125, -0.6785888671875, -0.46722412109375, -0.255859375, -0.04449462890625, 0.1668701171875, 0.37823486328125, 0.589599609375, 0.80096435546875, 1.0123291015625, 1.22369384765625, 1.43505859375, 1.64642333984375, 1.8577880859375, 2.06915283203125, 2.280517578125, 2.49188232421875, 2.7032470703125, 2.91461181640625, 3.1259765625, 3.33734130859375, 3.5487060546875, 3.76007080078125, 3.971435546875, 4.18280029296875, 4.3941650390625, 4.60552978515625, 4.81689453125, 5.02825927734375, 5.2396240234375, 5.45098876953125, 5.662353515625, 5.87371826171875, 6.0850830078125, 6.29644775390625, 6.5078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 14.0, 12.0, 13.0, 11.0, 29.0, 14.0, 24.0, 21.0, 18.0, 29.0, 28.0, 28.0, 31.0, 31.0, 31.0, 37.0, 38.0, 38.0, 1067.0, 33.0, 30.0, 34.0, 46.0, 22.0, 34.0, 39.0, 36.0, 25.0, 22.0, 17.0, 16.0, 20.0, 13.0, 20.0, 16.0, 11.0, 8.0, 5.0, 9.0, 3.0, 10.0, 1.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0], "bins": [-49.03125, -47.52880859375, -46.0263671875, -44.52392578125, -43.021484375, -41.51904296875, -40.0166015625, -38.51416015625, -37.01171875, -35.50927734375, -34.0068359375, -32.50439453125, -31.001953125, -29.49951171875, -27.9970703125, -26.49462890625, -24.9921875, -23.48974609375, -21.9873046875, -20.48486328125, -18.982421875, -17.47998046875, -15.9775390625, -14.47509765625, -12.97265625, -11.47021484375, -9.9677734375, -8.46533203125, -6.962890625, -5.46044921875, -3.9580078125, -2.45556640625, -0.953125, 0.54931640625, 2.0517578125, 3.55419921875, 5.056640625, 6.55908203125, 8.0615234375, 9.56396484375, 11.06640625, 12.56884765625, 14.0712890625, 15.57373046875, 17.076171875, 18.57861328125, 20.0810546875, 21.58349609375, 23.0859375, 24.58837890625, 26.0908203125, 27.59326171875, 29.095703125, 30.59814453125, 32.1005859375, 33.60302734375, 35.10546875, 36.60791015625, 38.1103515625, 39.61279296875, 41.115234375, 42.61767578125, 44.1201171875, 45.62255859375, 47.125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 14.0, 23.0, 28.0, 49.0, 58.0, 100.0, 169.0, 287.0, 458.0, 810.0, 1359.0, 2303.0, 4024.0, 6588.0, 11170.0, 18868.0, 30963.0, 51033.0, 80345.0, 119599.0, 158372.0, 1216013.0, 137800.0, 96616.0, 63047.0, 38572.0, 23617.0, 14137.0, 8251.0, 5082.0, 2994.0, 1817.0, 1044.0, 615.0, 337.0, 229.0, 126.0, 87.0, 51.0, 30.0, 16.0, 13.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.7890625, -6.584716796875, -6.38037109375, -6.176025390625, -5.9716796875, -5.767333984375, -5.56298828125, -5.358642578125, -5.154296875, -4.949951171875, -4.74560546875, -4.541259765625, -4.3369140625, -4.132568359375, -3.92822265625, -3.723876953125, -3.51953125, -3.315185546875, -3.11083984375, -2.906494140625, -2.7021484375, -2.497802734375, -2.29345703125, -2.089111328125, -1.884765625, -1.680419921875, -1.47607421875, -1.271728515625, -1.0673828125, -0.863037109375, -0.65869140625, -0.454345703125, -0.25, -0.045654296875, 0.15869140625, 0.363037109375, 0.5673828125, 0.771728515625, 0.97607421875, 1.180419921875, 1.384765625, 1.589111328125, 1.79345703125, 1.997802734375, 2.2021484375, 2.406494140625, 2.61083984375, 2.815185546875, 3.01953125, 3.223876953125, 3.42822265625, 3.632568359375, 3.8369140625, 4.041259765625, 4.24560546875, 4.449951171875, 4.654296875, 4.858642578125, 5.06298828125, 5.267333984375, 5.4716796875, 5.676025390625, 5.88037109375, 6.084716796875, 6.2890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 6.0, 3.0, 0.0, 5.0, 9.0, 3.0, 5.0, 4.0, 8.0, 12.0, 15.0, 11.0, 19.0, 18.0, 10.0, 25.0, 27.0, 29.0, 54.0, 56.0, 53.0, 54.0, 63.0, 62.0, 60.0, 63.0, 50.0, 43.0, 26.0, 32.0, 32.0, 23.0, 26.0, 15.0, 12.0, 17.0, 8.0, 9.0, 11.0, 3.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040771484375, -0.03925657272338867, -0.037741661071777344, -0.036226749420166016, -0.03471183776855469, -0.03319692611694336, -0.03168201446533203, -0.030167102813720703, -0.028652191162109375, -0.027137279510498047, -0.02562236785888672, -0.02410745620727539, -0.022592544555664062, -0.021077632904052734, -0.019562721252441406, -0.018047809600830078, -0.01653289794921875, -0.015017986297607422, -0.013503074645996094, -0.011988162994384766, -0.010473251342773438, -0.00895833969116211, -0.007443428039550781, -0.005928516387939453, -0.004413604736328125, -0.002898693084716797, -0.0013837814331054688, 0.00013113021850585938, 0.0016460418701171875, 0.0031609535217285156, 0.004675865173339844, 0.006190776824951172, 0.0077056884765625, 0.009220600128173828, 0.010735511779785156, 0.012250423431396484, 0.013765335083007812, 0.01528024673461914, 0.01679515838623047, 0.018310070037841797, 0.019824981689453125, 0.021339893341064453, 0.02285480499267578, 0.02436971664428711, 0.025884628295898438, 0.027399539947509766, 0.028914451599121094, 0.030429363250732422, 0.03194427490234375, 0.03345918655395508, 0.034974098205566406, 0.036489009857177734, 0.03800392150878906, 0.03951883316040039, 0.04103374481201172, 0.04254865646362305, 0.044063568115234375, 0.0455784797668457, 0.04709339141845703, 0.04860830307006836, 0.05012321472167969, 0.051638126373291016, 0.053153038024902344, 0.05466794967651367, 0.056182861328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 13.0, 14.0, 14.0, 25.0, 44.0, 46.0, 49.0, 90.0, 119.0, 188.0, 289.0, 458.0, 740.0, 1475.0, 2551.0, 4933.0, 9980.0, 21692.0, 51267.0, 132629.0, 347913.0, 291011.0, 105107.0, 41829.0, 18193.0, 8411.0, 4200.0, 2141.0, 1215.0, 691.0, 405.0, 246.0, 139.0, 133.0, 72.0, 48.0, 44.0, 35.0, 22.0, 13.0, 13.0, 13.0, 15.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.265625, -0.2577857971191406, -0.24994659423828125, -0.24210739135742188, -0.2342681884765625, -0.22642898559570312, -0.21858978271484375, -0.21075057983398438, -0.202911376953125, -0.19507217407226562, -0.18723297119140625, -0.17939376831054688, -0.1715545654296875, -0.16371536254882812, -0.15587615966796875, -0.14803695678710938, -0.14019775390625, -0.13235855102539062, -0.12451934814453125, -0.11668014526367188, -0.1088409423828125, -0.10100173950195312, -0.09316253662109375, -0.08532333374023438, -0.077484130859375, -0.06964492797851562, -0.06180572509765625, -0.053966522216796875, -0.0461273193359375, -0.038288116455078125, -0.03044891357421875, -0.022609710693359375, -0.0147705078125, -0.006931304931640625, 0.00090789794921875, 0.008747100830078125, 0.0165863037109375, 0.024425506591796875, 0.03226470947265625, 0.040103912353515625, 0.047943115234375, 0.055782318115234375, 0.06362152099609375, 0.07146072387695312, 0.0792999267578125, 0.08713912963867188, 0.09497833251953125, 0.10281753540039062, 0.11065673828125, 0.11849594116210938, 0.12633514404296875, 0.13417434692382812, 0.1420135498046875, 0.14985275268554688, 0.15769195556640625, 0.16553115844726562, 0.173370361328125, 0.18120956420898438, 0.18904876708984375, 0.19688796997070312, 0.2047271728515625, 0.21256637573242188, 0.22040557861328125, 0.22824478149414062, 0.236083984375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 9.0, 9.0, 12.0, 16.0, 21.0, 26.0, 43.0, 56.0, 50.0, 60.0, 104.0, 107.0, 77.0, 88.0, 81.0, 64.0, 60.0, 36.0, 28.0, 16.0, 14.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.12564866244792938, -0.1230572760105133, -0.12046589702367783, -0.11787451058626175, -0.11528313159942627, -0.11269174516201019, -0.11010036617517471, -0.10750897973775864, -0.10491760075092316, -0.10232621431350708, -0.0997348353266716, -0.09714344888925552, -0.09455206990242004, -0.09196068346500397, -0.08936930447816849, -0.08677791804075241, -0.08418653160333633, -0.08159514516592026, -0.07900376617908478, -0.0764123797416687, -0.07382100075483322, -0.07122961431741714, -0.06863823533058167, -0.06604684889316559, -0.06345546245574951, -0.060864079743623734, -0.058272697031497955, -0.05568131431937218, -0.0530899316072464, -0.05049854516983032, -0.047907162457704544, -0.045315779745578766, -0.042724404484033585, -0.040133021771907806, -0.03754163905978203, -0.03495025634765625, -0.03235886991024017, -0.029767489060759544, -0.027176104485988617, -0.02458472177386284, -0.02199333906173706, -0.019401956349611282, -0.016810573637485504, -0.014219189062714577, -0.011627806350588799, -0.00903642363846302, -0.0064450399950146675, -0.0038536563515663147, -0.0012622736394405365, 0.001329109538346529, 0.0039204927161335945, 0.00651187589392066, 0.009103259071707726, 0.011694641783833504, 0.014286025427281857, 0.01687740907073021, 0.019468791782855988, 0.022060174494981766, 0.024651557207107544, 0.02724294178187847, 0.02983432449400425, 0.03242570906877518, 0.035017091780900955, 0.03760847449302673, 0.04019985720515251]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 5.0, 8.0, 7.0, 11.0, 16.0, 17.0, 20.0, 27.0, 22.0, 37.0, 27.0, 30.0, 30.0, 43.0, 49.0, 39.0, 53.0, 45.0, 40.0, 48.0, 43.0, 38.0, 39.0, 30.0, 42.0, 34.0, 35.0, 25.0, 25.0, 21.0, 13.0, 22.0, 14.0, 11.0, 8.0, 6.0, 3.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04023468494415283, -0.03889888897538185, -0.03756309300661087, -0.03622729703783989, -0.03489150106906891, -0.03355570510029793, -0.03221990913152695, -0.030884113162755966, -0.029548317193984985, -0.028212521225214005, -0.026876725256443024, -0.025540929287672043, -0.024205133318901062, -0.02286933735013008, -0.0215335413813591, -0.02019774541258812, -0.01886194944381714, -0.017526153475046158, -0.016190357506275177, -0.014854561537504196, -0.013518765568733215, -0.012182969599962234, -0.010847173631191254, -0.009511377662420273, -0.008175581693649292, -0.006839785724878311, -0.00550398975610733, -0.0041681937873363495, -0.0028323978185653687, -0.0014966018497943878, -0.00016080588102340698, 0.0011749900877475739, 0.0025107860565185547, 0.0038465820252895355, 0.005182377994060516, 0.006518173962831497, 0.007853969931602478, 0.009189765900373459, 0.01052556186914444, 0.01186135783791542, 0.013197153806686401, 0.014532949775457382, 0.015868745744228363, 0.017204541712999344, 0.018540337681770325, 0.019876133650541306, 0.021211929619312286, 0.022547725588083267, 0.023883521556854248, 0.02521931752562523, 0.02655511349439621, 0.02789090946316719, 0.02922670543193817, 0.030562501400709152, 0.03189829736948013, 0.033234093338251114, 0.034569889307022095, 0.035905685275793076, 0.037241481244564056, 0.03857727721333504, 0.03991307318210602, 0.041248869150877, 0.04258466511964798, 0.04392046108841896, 0.04525625705718994]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 8.0, 6.0, 14.0, 10.0, 14.0, 14.0, 15.0, 27.0, 20.0, 28.0, 30.0, 33.0, 45.0, 44.0, 39.0, 37.0, 29.0, 40.0, 47.0, 42.0, 48.0, 47.0, 29.0, 37.0, 37.0, 29.0, 21.0, 37.0, 24.0, 23.0, 24.0, 11.0, 17.0, 9.0, 6.0, 4.0, 7.0, 5.0, 3.0, 5.0, 9.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0], "bins": [-90.0, -87.45703125, -84.9140625, -82.37109375, -79.828125, -77.28515625, -74.7421875, -72.19921875, -69.65625, -67.11328125, -64.5703125, -62.02734375, -59.484375, -56.94140625, -54.3984375, -51.85546875, -49.3125, -46.76953125, -44.2265625, -41.68359375, -39.140625, -36.59765625, -34.0546875, -31.51171875, -28.96875, -26.42578125, -23.8828125, -21.33984375, -18.796875, -16.25390625, -13.7109375, -11.16796875, -8.625, -6.08203125, -3.5390625, -0.99609375, 1.546875, 4.08984375, 6.6328125, 9.17578125, 11.71875, 14.26171875, 16.8046875, 19.34765625, 21.890625, 24.43359375, 26.9765625, 29.51953125, 32.0625, 34.60546875, 37.1484375, 39.69140625, 42.234375, 44.77734375, 47.3203125, 49.86328125, 52.40625, 54.94921875, 57.4921875, 60.03515625, 62.578125, 65.12109375, 67.6640625, 70.20703125, 72.75]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 10.0, 12.0, 17.0, 23.0, 24.0, 38.0, 53.0, 85.0, 109.0, 169.0, 301.0, 405.0, 722.0, 1619.0, 4029.0, 13151.0, 55800.0, 267513.0, 500104.0, 157433.0, 32785.0, 8368.0, 2868.0, 1162.0, 615.0, 379.0, 212.0, 166.0, 93.0, 74.0, 58.0, 29.0, 25.0, 13.0, 23.0, 9.0, 6.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-14.9921875, -14.555419921875, -14.11865234375, -13.681884765625, -13.2451171875, -12.808349609375, -12.37158203125, -11.934814453125, -11.498046875, -11.061279296875, -10.62451171875, -10.187744140625, -9.7509765625, -9.314208984375, -8.87744140625, -8.440673828125, -8.00390625, -7.567138671875, -7.13037109375, -6.693603515625, -6.2568359375, -5.820068359375, -5.38330078125, -4.946533203125, -4.509765625, -4.072998046875, -3.63623046875, -3.199462890625, -2.7626953125, -2.325927734375, -1.88916015625, -1.452392578125, -1.015625, -0.578857421875, -0.14208984375, 0.294677734375, 0.7314453125, 1.168212890625, 1.60498046875, 2.041748046875, 2.478515625, 2.915283203125, 3.35205078125, 3.788818359375, 4.2255859375, 4.662353515625, 5.09912109375, 5.535888671875, 5.97265625, 6.409423828125, 6.84619140625, 7.282958984375, 7.7197265625, 8.156494140625, 8.59326171875, 9.030029296875, 9.466796875, 9.903564453125, 10.34033203125, 10.777099609375, 11.2138671875, 11.650634765625, 12.08740234375, 12.524169921875, 12.9609375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 4.0, 20.0, 26.0, 37.0, 51.0, 47.0, 70.0, 87.0, 90.0, 2131.0, 107.0, 86.0, 88.0, 52.0, 37.0, 25.0, 31.0, 15.0, 12.0, 7.0, 5.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-257.5, -249.375, -241.25, -233.125, -225.0, -216.875, -208.75, -200.625, -192.5, -184.375, -176.25, -168.125, -160.0, -151.875, -143.75, -135.625, -127.5, -119.375, -111.25, -103.125, -95.0, -86.875, -78.75, -70.625, -62.5, -54.375, -46.25, -38.125, -30.0, -21.875, -13.75, -5.625, 2.5, 10.625, 18.75, 26.875, 35.0, 43.125, 51.25, 59.375, 67.5, 75.625, 83.75, 91.875, 100.0, 108.125, 116.25, 124.375, 132.5, 140.625, 148.75, 156.875, 165.0, 173.125, 181.25, 189.375, 197.5, 205.625, 213.75, 221.875, 230.0, 238.125, 246.25, 254.375, 262.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 11.0, 15.0, 15.0, 26.0, 32.0, 58.0, 81.0, 124.0, 242.0, 430.0, 962.0, 2660.0, 15009.0, 2790471.0, 323549.0, 8337.0, 1852.0, 815.0, 395.0, 219.0, 111.0, 80.0, 42.0, 37.0, 25.0, 22.0, 13.0, 8.0, 13.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-40.5625, -39.365234375, -38.16796875, -36.970703125, -35.7734375, -34.576171875, -33.37890625, -32.181640625, -30.984375, -29.787109375, -28.58984375, -27.392578125, -26.1953125, -24.998046875, -23.80078125, -22.603515625, -21.40625, -20.208984375, -19.01171875, -17.814453125, -16.6171875, -15.419921875, -14.22265625, -13.025390625, -11.828125, -10.630859375, -9.43359375, -8.236328125, -7.0390625, -5.841796875, -4.64453125, -3.447265625, -2.25, -1.052734375, 0.14453125, 1.341796875, 2.5390625, 3.736328125, 4.93359375, 6.130859375, 7.328125, 8.525390625, 9.72265625, 10.919921875, 12.1171875, 13.314453125, 14.51171875, 15.708984375, 16.90625, 18.103515625, 19.30078125, 20.498046875, 21.6953125, 22.892578125, 24.08984375, 25.287109375, 26.484375, 27.681640625, 28.87890625, 30.076171875, 31.2734375, 32.470703125, 33.66796875, 34.865234375, 36.0625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 15.0, 26.0, 49.0, 83.0, 121.0, 129.0, 173.0, 144.0, 100.0, 58.0, 24.0, 26.0, 13.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.86422729492188, -174.43331909179688, -168.00241088867188, -161.57150268554688, -155.14060974121094, -148.70970153808594, -142.27879333496094, -135.84788513183594, -129.4169921875, -122.986083984375, -116.55518341064453, -110.12427520751953, -103.69337463378906, -97.26246643066406, -90.83155822753906, -84.40065002441406, -77.96974182128906, -71.53883361816406, -65.1079330444336, -58.677024841308594, -52.24612045288086, -45.815216064453125, -39.384307861328125, -32.95340347290039, -26.522499084472656, -20.091594696044922, -13.660688400268555, -7.2297821044921875, -0.7988777160644531, 5.632026672363281, 12.062934875488281, 18.493839263916016, 24.924728393554688, 31.355632781982422, 37.786537170410156, 44.217445373535156, 50.64834976196289, 57.079254150390625, 63.510162353515625, 69.94107055664062, 76.3719711303711, 82.8028793334961, 89.23377990722656, 95.66468811035156, 102.09559631347656, 108.52649688720703, 114.95740509033203, 121.3883056640625, 127.8192138671875, 134.2501220703125, 140.6810302734375, 147.1119384765625, 153.54283142089844, 159.97373962402344, 166.40464782714844, 172.83555603027344, 179.26644897460938, 185.69735717773438, 192.12826538085938, 198.55917358398438, 204.9900665283203, 211.4209747314453, 217.8518829345703, 224.2827911376953, 230.7136993408203]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 20.0, 20.0, 21.0, 21.0, 20.0, 27.0, 35.0, 38.0, 39.0, 39.0, 32.0, 50.0, 46.0, 48.0, 43.0, 50.0, 63.0, 43.0, 57.0, 25.0, 35.0, 40.0, 20.0, 31.0, 11.0, 13.0, 13.0, 18.0, 7.0, 8.0, 7.0, 3.0, 10.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-192.01649475097656, -185.93333435058594, -179.85018920898438, -173.76702880859375, -167.6838836669922, -161.60072326660156, -155.517578125, -149.43441772460938, -143.3512725830078, -137.2681121826172, -131.18496704101562, -125.10181427001953, -119.01866149902344, -112.93550872802734, -106.85235595703125, -100.76919555664062, -94.68604278564453, -88.60289001464844, -82.51973724365234, -76.43658447265625, -70.35343170166016, -64.27027893066406, -58.1871223449707, -52.10396957397461, -46.020816802978516, -39.93766403198242, -33.85451126098633, -27.7713565826416, -21.688203811645508, -15.605051040649414, -9.521896362304688, -3.4387435913085938, 2.6444091796875, 8.727561950683594, 14.810715675354004, 20.893869400024414, 26.977022171020508, 33.06017303466797, 39.14332962036133, 45.22648239135742, 51.309635162353516, 57.39278793334961, 63.4759407043457, 69.55909729003906, 75.64225006103516, 81.72540283203125, 87.80855560302734, 93.89170837402344, 99.97486114501953, 106.05801391601562, 112.14116668701172, 118.22431945800781, 124.3074722290039, 130.390625, 136.47378540039062, 142.5569305419922, 148.6400909423828, 154.72325134277344, 160.806396484375, 166.88955688476562, 172.9727020263672, 179.0558624267578, 185.13900756835938, 191.22216796875, 197.30531311035156]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 6.0, 8.0, 15.0, 25.0, 25.0, 41.0, 62.0, 62.0, 94.0, 144.0, 196.0, 223.0, 334.0, 487.0, 641.0, 838.0, 1250.0, 1628.0, 2150.0, 2960.0, 4443.0, 1015452.0, 5300.0, 3236.0, 2318.0, 1699.0, 1298.0, 996.0, 733.0, 527.0, 376.0, 294.0, 192.0, 144.0, 75.0, 84.0, 45.0, 37.0, 24.0, 24.0, 14.0, 10.0, 14.0, 4.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.988479614257812, -28.100051879882812, -27.211626052856445, -26.323198318481445, -25.434772491455078, -24.546344757080078, -23.657917022705078, -22.76949119567871, -21.88106346130371, -20.99263572692871, -20.104209899902344, -19.215782165527344, -18.327356338500977, -17.438928604125977, -16.55050277709961, -15.66207504272461, -14.773648262023926, -13.885221481323242, -12.996794700622559, -12.108367919921875, -11.219940185546875, -10.331513404846191, -9.443086624145508, -8.554658889770508, -7.666232585906982, -6.777805805206299, -5.889378547668457, -5.000951766967773, -4.11252498626709, -3.224097728729248, -2.3356709480285645, -1.4472436904907227, -0.5588169097900391, 0.32961004972457886, 1.2180370092391968, 2.10646390914917, 2.9948909282684326, 3.8833179473876953, 4.771744728088379, 5.660171985626221, 6.548598766326904, 7.437025547027588, 8.32545280456543, 9.213879585266113, 10.102306365966797, 10.990734100341797, 11.879159927368164, 12.767587661743164, 13.656014442443848, 14.544441223144531, 15.432868003845215, 16.3212947845459, 17.2097225189209, 18.098148345947266, 18.986576080322266, 19.875003814697266, 20.763429641723633, 21.651857376098633, 22.540283203125, 23.4287109375, 24.317136764526367, 25.205564498901367, 26.093990325927734, 26.982418060302734, 27.870845794677734]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 8.0, 10.0, 18.0, 16.0, 34.0, 50.0, 44.0, 82.0, 119.0, 423.0, 51460200.0, 1846.0, 146.0, 57.0, 34.0, 21.0, 15.0, 9.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1636.43115234375, -1560.9873046875, -1485.5435791015625, -1410.0997314453125, -1334.656005859375, -1259.212158203125, -1183.768310546875, -1108.3245849609375, -1032.880859375, -957.4370727539062, -881.9932861328125, -806.5494384765625, -731.105712890625, -655.661865234375, -580.2180786132812, -504.7742919921875, -429.3304443359375, -353.88665771484375, -278.44287109375, -202.99905395507812, -127.55526733398438, -52.111480712890625, 23.33233642578125, 98.776123046875, 174.21990966796875, 249.6636962890625, 325.10748291015625, 400.5513000488281, 475.9950866699219, 551.4388427734375, 626.8826904296875, 702.3264770507812, 777.770263671875, 853.2140502929688, 928.6578369140625, 1004.1016845703125, 1079.54541015625, 1154.9892578125, 1230.43310546875, 1305.8768310546875, 1381.320556640625, 1456.764404296875, 1532.2081298828125, 1607.6519775390625, 1683.095703125, 1758.53955078125, 1833.9833984375, 1909.4271240234375, 1984.8709716796875, 2060.314697265625, 2135.758544921875, 2211.202392578125, 2286.646240234375, 2362.08984375, 2437.53369140625, 2512.9775390625, 2588.42138671875, 2663.865234375, 2739.30908203125, 2814.752685546875, 2890.196533203125, 2965.640380859375, 3041.084228515625, 3116.52783203125, 3191.9716796875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 17.0, 31.0, 47.0, 72.0, 92.0, 133.0, 185.0, 319.0, 503.0, 757.0, 1073.0, 1675.0, 2559.0, 3994.0, 6028.0, 9356.0, 14356.0, 22049.0, 33355.0, 50326.0, 77273.0, 115130.0, 167785.0, 236371.0, 320406.0, 575526.0, 3316191.0, 397875.0, 289824.0, 209603.0, 145909.0, 99920.0, 66447.0, 43667.0, 28727.0, 18625.0, 12305.0, 7843.0, 5284.0, 3354.0, 2192.0, 1506.0, 958.0, 609.0, 426.0, 286.0, 153.0, 110.0, 89.0, 60.0, 21.0, 10.0, 12.0, 7.0, 2.0, 2.0], "bins": [-1.8564453125, -1.8023529052734375, -1.748260498046875, -1.6941680908203125, -1.64007568359375, -1.5859832763671875, -1.531890869140625, -1.4777984619140625, -1.4237060546875, -1.3696136474609375, -1.315521240234375, -1.2614288330078125, -1.20733642578125, -1.1532440185546875, -1.099151611328125, -1.0450592041015625, -0.990966796875, -0.9368743896484375, -0.882781982421875, -0.8286895751953125, -0.77459716796875, -0.7205047607421875, -0.666412353515625, -0.6123199462890625, -0.5582275390625, -0.5041351318359375, -0.450042724609375, -0.3959503173828125, -0.34185791015625, -0.2877655029296875, -0.233673095703125, -0.1795806884765625, -0.12548828125, -0.0713958740234375, -0.017303466796875, 0.0367889404296875, 0.09088134765625, 0.1449737548828125, 0.199066162109375, 0.2531585693359375, 0.3072509765625, 0.3613433837890625, 0.415435791015625, 0.4695281982421875, 0.52362060546875, 0.5777130126953125, 0.631805419921875, 0.6858978271484375, 0.739990234375, 0.7940826416015625, 0.848175048828125, 0.9022674560546875, 0.95635986328125, 1.0104522705078125, 1.064544677734375, 1.1186370849609375, 1.1727294921875, 1.2268218994140625, 1.280914306640625, 1.3350067138671875, 1.38909912109375, 1.4431915283203125, 1.497283935546875, 1.5513763427734375, 1.60546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 6.0, 4.0, 3.0, 5.0, 3.0, 7.0, 7.0, 8.0, 10.0, 6.0, 12.0, 19.0, 15.0, 17.0, 22.0, 18.0, 12.0, 26.0, 19.0, 29.0, 33.0, 37.0, 24.0, 39.0, 42.0, 46.0, 156.0, 860.0, 102.0, 36.0, 29.0, 29.0, 29.0, 34.0, 33.0, 24.0, 28.0, 24.0, 22.0, 23.0, 11.0, 22.0, 16.0, 12.0, 10.0, 16.0, 7.0, 9.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-20.640625, -19.959716796875, -19.27880859375, -18.597900390625, -17.9169921875, -17.236083984375, -16.55517578125, -15.874267578125, -15.193359375, -14.512451171875, -13.83154296875, -13.150634765625, -12.4697265625, -11.788818359375, -11.10791015625, -10.427001953125, -9.74609375, -9.065185546875, -8.38427734375, -7.703369140625, -7.0224609375, -6.341552734375, -5.66064453125, -4.979736328125, -4.298828125, -3.617919921875, -2.93701171875, -2.256103515625, -1.5751953125, -0.894287109375, -0.21337890625, 0.467529296875, 1.1484375, 1.829345703125, 2.51025390625, 3.191162109375, 3.8720703125, 4.552978515625, 5.23388671875, 5.914794921875, 6.595703125, 7.276611328125, 7.95751953125, 8.638427734375, 9.3193359375, 10.000244140625, 10.68115234375, 11.362060546875, 12.04296875, 12.723876953125, 13.40478515625, 14.085693359375, 14.7666015625, 15.447509765625, 16.12841796875, 16.809326171875, 17.490234375, 18.171142578125, 18.85205078125, 19.532958984375, 20.2138671875, 20.894775390625, 21.57568359375, 22.256591796875, 22.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 6.0, 4.0, 10.0, 22.0, 32.0, 56.0, 89.0, 138.0, 196.0, 315.0, 465.0, 789.0, 1151.0, 1786.0, 2719.0, 4550.0, 6798.0, 10410.0, 16415.0, 25952.0, 41036.0, 64065.0, 102128.0, 160847.0, 244240.0, 352221.0, 747143.0, 3271704.0, 415378.0, 287014.0, 193855.0, 123902.0, 78912.0, 49802.0, 31807.0, 20089.0, 12541.0, 8074.0, 5198.0, 3462.0, 2217.0, 1403.0, 920.0, 538.0, 383.0, 249.0, 138.0, 111.0, 49.0, 45.0, 20.0, 19.0, 21.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.841796875, -1.786346435546875, -1.73089599609375, -1.675445556640625, -1.6199951171875, -1.564544677734375, -1.50909423828125, -1.453643798828125, -1.398193359375, -1.342742919921875, -1.28729248046875, -1.231842041015625, -1.1763916015625, -1.120941162109375, -1.06549072265625, -1.010040283203125, -0.95458984375, -0.899139404296875, -0.84368896484375, -0.788238525390625, -0.7327880859375, -0.677337646484375, -0.62188720703125, -0.566436767578125, -0.510986328125, -0.455535888671875, -0.40008544921875, -0.344635009765625, -0.2891845703125, -0.233734130859375, -0.17828369140625, -0.122833251953125, -0.0673828125, -0.011932373046875, 0.04351806640625, 0.098968505859375, 0.1544189453125, 0.209869384765625, 0.26531982421875, 0.320770263671875, 0.376220703125, 0.431671142578125, 0.48712158203125, 0.542572021484375, 0.5980224609375, 0.653472900390625, 0.70892333984375, 0.764373779296875, 0.81982421875, 0.875274658203125, 0.93072509765625, 0.986175537109375, 1.0416259765625, 1.097076416015625, 1.15252685546875, 1.207977294921875, 1.263427734375, 1.318878173828125, 1.37432861328125, 1.429779052734375, 1.4852294921875, 1.540679931640625, 1.59613037109375, 1.651580810546875, 1.70703125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 12.0, 16.0, 10.0, 10.0, 11.0, 23.0, 14.0, 20.0, 19.0, 29.0, 28.0, 25.0, 25.0, 43.0, 39.0, 49.0, 47.0, 192.0, 886.0, 52.0, 54.0, 39.0, 31.0, 43.0, 40.0, 41.0, 22.0, 22.0, 22.0, 23.0, 20.0, 17.0, 19.0, 12.0, 11.0, 6.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.559326171875, -26.72802734375, -25.896728515625, -25.0654296875, -24.234130859375, -23.40283203125, -22.571533203125, -21.740234375, -20.908935546875, -20.07763671875, -19.246337890625, -18.4150390625, -17.583740234375, -16.75244140625, -15.921142578125, -15.08984375, -14.258544921875, -13.42724609375, -12.595947265625, -11.7646484375, -10.933349609375, -10.10205078125, -9.270751953125, -8.439453125, -7.608154296875, -6.77685546875, -5.945556640625, -5.1142578125, -4.282958984375, -3.45166015625, -2.620361328125, -1.7890625, -0.957763671875, -0.12646484375, 0.704833984375, 1.5361328125, 2.367431640625, 3.19873046875, 4.030029296875, 4.861328125, 5.692626953125, 6.52392578125, 7.355224609375, 8.1865234375, 9.017822265625, 9.84912109375, 10.680419921875, 11.51171875, 12.343017578125, 13.17431640625, 14.005615234375, 14.8369140625, 15.668212890625, 16.49951171875, 17.330810546875, 18.162109375, 18.993408203125, 19.82470703125, 20.656005859375, 21.4873046875, 22.318603515625, 23.14990234375, 23.981201171875, 24.8125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 9.0, 12.0, 17.0, 16.0, 18.0, 20.0, 22.0, 39.0, 52.0, 72.0, 120.0, 158.0, 275.0, 542.0, 1147.0, 2395.0, 6004.0, 14073.0, 35172.0, 96012.0, 5682834.0, 322843.0, 78570.0, 29692.0, 11917.0, 4942.0, 2142.0, 1066.0, 447.0, 258.0, 137.0, 140.0, 62.0, 43.0, 20.0, 22.0, 25.0, 26.0, 26.0, 14.0, 7.0, 9.0, 12.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.7421875, -10.4429931640625, -10.143798828125, -9.8446044921875, -9.54541015625, -9.2462158203125, -8.947021484375, -8.6478271484375, -8.3486328125, -8.0494384765625, -7.750244140625, -7.4510498046875, -7.15185546875, -6.8526611328125, -6.553466796875, -6.2542724609375, -5.955078125, -5.6558837890625, -5.356689453125, -5.0574951171875, -4.75830078125, -4.4591064453125, -4.159912109375, -3.8607177734375, -3.5615234375, -3.2623291015625, -2.963134765625, -2.6639404296875, -2.36474609375, -2.0655517578125, -1.766357421875, -1.4671630859375, -1.16796875, -0.8687744140625, -0.569580078125, -0.2703857421875, 0.02880859375, 0.3280029296875, 0.627197265625, 0.9263916015625, 1.2255859375, 1.5247802734375, 1.823974609375, 2.1231689453125, 2.42236328125, 2.7215576171875, 3.020751953125, 3.3199462890625, 3.619140625, 3.9183349609375, 4.217529296875, 4.5167236328125, 4.81591796875, 5.1151123046875, 5.414306640625, 5.7135009765625, 6.0126953125, 6.3118896484375, 6.611083984375, 6.9102783203125, 7.20947265625, 7.5086669921875, 7.807861328125, 8.1070556640625, 8.40625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 13.0, 8.0, 16.0, 21.0, 19.0, 11.0, 27.0, 35.0, 30.0, 28.0, 43.0, 34.0, 48.0, 40.0, 39.0, 105.0, 1002.0, 63.0, 45.0, 50.0, 30.0, 41.0, 37.0, 33.0, 30.0, 25.0, 25.0, 20.0, 12.0, 19.0, 11.0, 14.0, 6.0, 9.0, 9.0, 2.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.234375, -27.267333984375, -26.30029296875, -25.333251953125, -24.3662109375, -23.399169921875, -22.43212890625, -21.465087890625, -20.498046875, -19.531005859375, -18.56396484375, -17.596923828125, -16.6298828125, -15.662841796875, -14.69580078125, -13.728759765625, -12.76171875, -11.794677734375, -10.82763671875, -9.860595703125, -8.8935546875, -7.926513671875, -6.95947265625, -5.992431640625, -5.025390625, -4.058349609375, -3.09130859375, -2.124267578125, -1.1572265625, -0.190185546875, 0.77685546875, 1.743896484375, 2.7109375, 3.677978515625, 4.64501953125, 5.612060546875, 6.5791015625, 7.546142578125, 8.51318359375, 9.480224609375, 10.447265625, 11.414306640625, 12.38134765625, 13.348388671875, 14.3154296875, 15.282470703125, 16.24951171875, 17.216552734375, 18.18359375, 19.150634765625, 20.11767578125, 21.084716796875, 22.0517578125, 23.018798828125, 23.98583984375, 24.952880859375, 25.919921875, 26.886962890625, 27.85400390625, 28.821044921875, 29.7880859375, 30.755126953125, 31.72216796875, 32.689208984375, 33.65625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 9.0, 30.0, 118.0, 491.0, 268.0, 63.0, 18.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.91288757324219, -69.02229309082031, -65.13169860839844, -61.2411003112793, -57.35050582885742, -53.45990753173828, -49.569313049316406, -45.67871856689453, -41.788124084472656, -37.89752960205078, -34.00693130493164, -30.116336822509766, -26.22574234008789, -22.335145950317383, -18.444549560546875, -14.553955078125, -10.66335678100586, -6.772761344909668, -2.8821654319763184, 1.0084304809570312, 4.899025917053223, 8.789621353149414, 12.680217742919922, 16.570812225341797, 20.461408615112305, 24.352005004882812, 28.242599487304688, 32.13319396972656, 36.0237922668457, 39.91438674926758, 43.80498504638672, 47.695579528808594, 51.58617401123047, 55.476768493652344, 59.367366790771484, 63.25796127319336, 67.1485595703125, 71.03915405273438, 74.92974853515625, 78.82034301757812, 82.7109375, 86.60153198242188, 90.49212646484375, 94.38272094726562, 98.27332305908203, 102.1639175415039, 106.05451202392578, 109.94510650634766, 113.83570861816406, 117.72630310058594, 121.61689758300781, 125.50749206542969, 129.39808654785156, 133.28868103027344, 137.17929077148438, 141.06988525390625, 144.96046447753906, 148.85105895996094, 152.7416534423828, 156.6322479248047, 160.52284240722656, 164.41343688964844, 168.30404663085938, 172.19464111328125, 176.08523559570312]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 13.0, 7.0, 12.0, 12.0, 36.0, 41.0, 71.0, 77.0, 84.0, 115.0, 109.0, 104.0, 71.0, 63.0, 56.0, 33.0, 29.0, 18.0, 9.0, 7.0, 5.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.44094848632812, -98.71145629882812, -94.98196411132812, -91.25247192382812, -87.52297973632812, -83.79348754882812, -80.06399536132812, -76.33450317382812, -72.60501098632812, -68.87551879882812, -65.14602661132812, -61.416534423828125, -57.687042236328125, -53.957550048828125, -50.22806167602539, -46.49856948852539, -42.769081115722656, -39.039588928222656, -35.310096740722656, -31.58060646057129, -27.85111427307129, -24.12162208557129, -20.392131805419922, -16.662639617919922, -12.933147430419922, -9.203655242919922, -5.474164009094238, -1.7446727752685547, 1.9848194122314453, 5.714311599731445, 9.443801879882812, 13.173294067382812, 16.902786254882812, 20.632278442382812, 24.361770629882812, 28.09126091003418, 31.82075309753418, 35.55024719238281, 39.27973556518555, 43.00922775268555, 46.73871994018555, 50.46821212768555, 54.19770431518555, 57.92719268798828, 61.65668487548828, 65.38617706298828, 69.11566925048828, 72.84516143798828, 76.57465362548828, 80.30414581298828, 84.03363800048828, 87.76313018798828, 91.49262237548828, 95.22211456298828, 98.95159912109375, 102.68109130859375, 106.41058349609375, 110.14007568359375, 113.86956787109375, 117.59906005859375, 121.32855224609375, 125.05804443359375, 128.78753662109375, 132.51702880859375, 136.24652099609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 12.0, 16.0, 16.0, 19.0, 35.0, 29.0, 76.0, 77.0, 141.0, 183.0, 285.0, 423.0, 692.0, 1115.0, 1762.0, 2999.0, 5326.0, 10740.0, 25830.0, 99941.0, 3921796.0, 81608.0, 21130.0, 8570.0, 4365.0, 2537.0, 1489.0, 961.0, 624.0, 424.0, 289.0, 235.0, 173.0, 92.0, 71.0, 57.0, 37.0, 34.0, 24.0, 12.0, 4.0, 7.0, 6.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5589752197265625, -0.539337158203125, -0.5196990966796875, -0.50006103515625, -0.4804229736328125, -0.460784912109375, -0.4411468505859375, -0.4215087890625, -0.4018707275390625, -0.382232666015625, -0.3625946044921875, -0.34295654296875, -0.3233184814453125, -0.303680419921875, -0.2840423583984375, -0.264404296875, -0.2447662353515625, -0.225128173828125, -0.2054901123046875, -0.18585205078125, -0.1662139892578125, -0.146575927734375, -0.1269378662109375, -0.1072998046875, -0.0876617431640625, -0.068023681640625, -0.0483856201171875, -0.02874755859375, -0.0091094970703125, 0.010528564453125, 0.0301666259765625, 0.0498046875, 0.0694427490234375, 0.089080810546875, 0.1087188720703125, 0.12835693359375, 0.1479949951171875, 0.167633056640625, 0.1872711181640625, 0.2069091796875, 0.2265472412109375, 0.246185302734375, 0.2658233642578125, 0.28546142578125, 0.3050994873046875, 0.324737548828125, 0.3443756103515625, 0.364013671875, 0.3836517333984375, 0.403289794921875, 0.4229278564453125, 0.44256591796875, 0.4622039794921875, 0.481842041015625, 0.5014801025390625, 0.5211181640625, 0.5407562255859375, 0.560394287109375, 0.5800323486328125, 0.59967041015625, 0.6193084716796875, 0.638946533203125, 0.6585845947265625, 0.67822265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 8.0, 6.0, 5.0, 8.0, 10.0, 10.0, 18.0, 14.0, 546.0, 247.0, 16.0, 17.0, 16.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.326934814453125, -0.31475830078125, -0.302581787109375, -0.2904052734375, -0.278228759765625, -0.26605224609375, -0.253875732421875, -0.24169921875, -0.229522705078125, -0.21734619140625, -0.205169677734375, -0.1929931640625, -0.180816650390625, -0.16864013671875, -0.156463623046875, -0.144287109375, -0.132110595703125, -0.11993408203125, -0.107757568359375, -0.0955810546875, -0.083404541015625, -0.07122802734375, -0.059051513671875, -0.046875, -0.034698486328125, -0.02252197265625, -0.010345458984375, 0.0018310546875, 0.014007568359375, 0.02618408203125, 0.038360595703125, 0.050537109375, 0.062713623046875, 0.07489013671875, 0.087066650390625, 0.0992431640625, 0.111419677734375, 0.12359619140625, 0.135772705078125, 0.14794921875, 0.160125732421875, 0.17230224609375, 0.184478759765625, 0.1966552734375, 0.208831787109375, 0.22100830078125, 0.233184814453125, 0.245361328125, 0.257537841796875, 0.26971435546875, 0.281890869140625, 0.2940673828125, 0.306243896484375, 0.31842041015625, 0.330596923828125, 0.3427734375, 0.354949951171875, 0.36712646484375, 0.379302978515625, 0.3914794921875, 0.403656005859375, 0.41583251953125, 0.428009033203125, 0.440185546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 9.0, 6.0, 10.0, 6.0, 25.0, 28.0, 34.0, 60.0, 88.0, 130.0, 219.0, 315.0, 604.0, 1210.0, 2869.0, 7986.0, 33705.0, 327517.0, 3666475.0, 125632.0, 18520.0, 5136.0, 1713.0, 843.0, 435.0, 255.0, 144.0, 88.0, 65.0, 37.0, 29.0, 14.0, 18.0, 14.0, 13.0, 12.0, 6.0, 4.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6638946533203125, -0.641265869140625, -0.6186370849609375, -0.59600830078125, -0.5733795166015625, -0.550750732421875, -0.5281219482421875, -0.5054931640625, -0.4828643798828125, -0.460235595703125, -0.4376068115234375, -0.41497802734375, -0.3923492431640625, -0.369720458984375, -0.3470916748046875, -0.324462890625, -0.3018341064453125, -0.279205322265625, -0.2565765380859375, -0.23394775390625, -0.2113189697265625, -0.188690185546875, -0.1660614013671875, -0.1434326171875, -0.1208038330078125, -0.098175048828125, -0.0755462646484375, -0.05291748046875, -0.0302886962890625, -0.007659912109375, 0.0149688720703125, 0.03759765625, 0.0602264404296875, 0.082855224609375, 0.1054840087890625, 0.12811279296875, 0.1507415771484375, 0.173370361328125, 0.1959991455078125, 0.2186279296875, 0.2412567138671875, 0.263885498046875, 0.2865142822265625, 0.30914306640625, 0.3317718505859375, 0.354400634765625, 0.3770294189453125, 0.399658203125, 0.4222869873046875, 0.444915771484375, 0.4675445556640625, 0.49017333984375, 0.5128021240234375, 0.535430908203125, 0.5580596923828125, 0.5806884765625, 0.6033172607421875, 0.625946044921875, 0.6485748291015625, 0.67120361328125, 0.6938323974609375, 0.716461181640625, 0.7390899658203125, 0.76171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 12.0, 17.0, 18.0, 37.0, 50.0, 76.0, 147.0, 251.0, 678.0, 1817.0, 499.0, 178.0, 100.0, 55.0, 40.0, 31.0, 12.0, 8.0, 11.0, 4.0, 2.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.4619140625, -0.4484748840332031, -0.43503570556640625, -0.4215965270996094, -0.4081573486328125, -0.3947181701660156, -0.38127899169921875, -0.3678398132324219, -0.354400634765625, -0.3409614562988281, -0.32752227783203125, -0.3140830993652344, -0.3006439208984375, -0.2872047424316406, -0.27376556396484375, -0.2603263854980469, -0.24688720703125, -0.23344802856445312, -0.22000885009765625, -0.20656967163085938, -0.1931304931640625, -0.17969131469726562, -0.16625213623046875, -0.15281295776367188, -0.139373779296875, -0.12593460083007812, -0.11249542236328125, -0.09905624389648438, -0.0856170654296875, -0.07217788696289062, -0.05873870849609375, -0.045299530029296875, -0.0318603515625, -0.018421173095703125, -0.00498199462890625, 0.008457183837890625, 0.0218963623046875, 0.035335540771484375, 0.04877471923828125, 0.062213897705078125, 0.075653076171875, 0.08909225463867188, 0.10253143310546875, 0.11597061157226562, 0.1294097900390625, 0.14284896850585938, 0.15628814697265625, 0.16972732543945312, 0.18316650390625, 0.19660568237304688, 0.21004486083984375, 0.22348403930664062, 0.2369232177734375, 0.2503623962402344, 0.26380157470703125, 0.2772407531738281, 0.290679931640625, 0.3041191101074219, 0.31755828857421875, 0.3309974670410156, 0.3444366455078125, 0.3578758239746094, 0.37131500244140625, 0.3847541809082031, 0.398193359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 16.0, 46.0, 398.0, 485.0, 47.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0191986560821533, -1.8531420230865479, -1.687085509300232, -1.521028995513916, -1.3549723625183105, -1.188915729522705, -1.0228592157363892, -0.8568027019500732, -0.6907460689544678, -0.5246894955635071, -0.3586329221725464, -0.1925763487815857, -0.026519775390625, 0.1395367980003357, 0.3055933713912964, 0.4716498851776123, 0.6377065181732178, 0.8037630915641785, 0.9698196649551392, 1.135876178741455, 1.3019328117370605, 1.467989444732666, 1.634045958518982, 1.8001024723052979, 1.9661591053009033, 2.132215738296509, 2.298272132873535, 2.4643287658691406, 2.630385398864746, 2.7964420318603516, 2.962498664855957, 3.1285550594329834, 3.294611930847168, 3.4606685638427734, 3.626725196838379, 3.7927815914154053, 3.9588382244110107, 4.124894618988037, 4.290951251983643, 4.457007884979248, 4.6230645179748535, 4.789121150970459, 4.9551777839660645, 5.12123441696167, 5.287290573120117, 5.453347206115723, 5.619403839111328, 5.785460472106934, 5.951517105102539, 6.1175737380981445, 6.28363037109375, 6.4496870040893555, 6.615743637084961, 6.781799793243408, 6.947856426239014, 7.113913059234619, 7.279969692230225, 7.44602632522583, 7.6120829582214355, 7.778139591217041, 7.944195747375488, 8.110252380371094, 8.2763090133667, 8.442365646362305, 8.60842227935791]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 7.0, 6.0, 9.0, 15.0, 30.0, 26.0, 54.0, 56.0, 49.0, 75.0, 97.0, 88.0, 110.0, 78.0, 70.0, 61.0, 55.0, 38.0, 28.0, 15.0, 10.0, 1.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.696762800216675, -2.6279690265655518, -2.5591752529144287, -2.4903814792633057, -2.4215877056121826, -2.3527939319610596, -2.2840001583099365, -2.2152063846588135, -2.1464126110076904, -2.0776188373565674, -2.0088250637054443, -1.9400312900543213, -1.8712375164031982, -1.8024437427520752, -1.7336499691009521, -1.664856195449829, -1.596062421798706, -1.527268648147583, -1.45847487449646, -1.389681100845337, -1.3208873271942139, -1.2520935535430908, -1.1832997798919678, -1.1145060062408447, -1.0457122325897217, -0.9769184589385986, -0.9081246852874756, -0.8393309116363525, -0.7705371379852295, -0.7017433643341064, -0.6329495906829834, -0.5641558170318604, -0.4953620433807373, -0.42656826972961426, -0.3577744960784912, -0.28898072242736816, -0.22018694877624512, -0.15139317512512207, -0.08259940147399902, -0.013805627822875977, 0.05498814582824707, 0.12378191947937012, 0.19257569313049316, 0.2613694667816162, 0.33016324043273926, 0.3989570140838623, 0.46775078773498535, 0.5365445613861084, 0.6053383350372314, 0.6741321086883545, 0.7429258823394775, 0.8117196559906006, 0.8805134296417236, 0.9493072032928467, 1.0181009769439697, 1.0868947505950928, 1.1556885242462158, 1.2244822978973389, 1.293276071548462, 1.362069845199585, 1.430863618850708, 1.499657392501831, 1.568451166152954, 1.6372449398040771, 1.7060387134552002]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 10.0, 15.0, 13.0, 30.0, 44.0, 51.0, 82.0, 141.0, 202.0, 281.0, 467.0, 652.0, 993.0, 1552.0, 2510.0, 4151.0, 7419.0, 14816.0, 36958.0, 881914.0, 55205.0, 19055.0, 8979.0, 4834.0, 2898.0, 1820.0, 1189.0, 749.0, 514.0, 337.0, 224.0, 144.0, 87.0, 82.0, 33.0, 31.0, 24.0, 13.0, 15.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6064453125, -1.560089111328125, -1.51373291015625, -1.467376708984375, -1.4210205078125, -1.374664306640625, -1.32830810546875, -1.281951904296875, -1.235595703125, -1.189239501953125, -1.14288330078125, -1.096527099609375, -1.0501708984375, -1.003814697265625, -0.95745849609375, -0.911102294921875, -0.86474609375, -0.818389892578125, -0.77203369140625, -0.725677490234375, -0.6793212890625, -0.632965087890625, -0.58660888671875, -0.540252685546875, -0.493896484375, -0.447540283203125, -0.40118408203125, -0.354827880859375, -0.3084716796875, -0.262115478515625, -0.21575927734375, -0.169403076171875, -0.123046875, -0.076690673828125, -0.03033447265625, 0.016021728515625, 0.0623779296875, 0.108734130859375, 0.15509033203125, 0.201446533203125, 0.247802734375, 0.294158935546875, 0.34051513671875, 0.386871337890625, 0.4332275390625, 0.479583740234375, 0.52593994140625, 0.572296142578125, 0.61865234375, 0.665008544921875, 0.71136474609375, 0.757720947265625, 0.8040771484375, 0.850433349609375, 0.89678955078125, 0.943145751953125, 0.989501953125, 1.035858154296875, 1.08221435546875, 1.128570556640625, 1.1749267578125, 1.221282958984375, 1.26763916015625, 1.313995361328125, 1.3603515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 5.0, 0.0, 5.0, 5.0, 6.0, 6.0, 8.0, 10.0, 10.0, 9.0, 13.0, 15.0, 204.0, 583.0, 24.0, 11.0, 20.0, 8.0, 4.0, 9.0, 8.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.2909126281738281, -0.27933502197265625, -0.2677574157714844, -0.2561798095703125, -0.24460220336914062, -0.23302459716796875, -0.22144699096679688, -0.209869384765625, -0.19829177856445312, -0.18671417236328125, -0.17513656616210938, -0.1635589599609375, -0.15198135375976562, -0.14040374755859375, -0.12882614135742188, -0.11724853515625, -0.10567092895507812, -0.09409332275390625, -0.08251571655273438, -0.0709381103515625, -0.059360504150390625, -0.04778289794921875, -0.036205291748046875, -0.024627685546875, -0.013050079345703125, -0.00147247314453125, 0.010105133056640625, 0.0216827392578125, 0.033260345458984375, 0.04483795166015625, 0.056415557861328125, 0.0679931640625, 0.07957077026367188, 0.09114837646484375, 0.10272598266601562, 0.1143035888671875, 0.12588119506835938, 0.13745880126953125, 0.14903640747070312, 0.160614013671875, 0.17219161987304688, 0.18376922607421875, 0.19534683227539062, 0.2069244384765625, 0.21850204467773438, 0.23007965087890625, 0.24165725708007812, 0.25323486328125, 0.2648124694824219, 0.27639007568359375, 0.2879676818847656, 0.2995452880859375, 0.3111228942871094, 0.32270050048828125, 0.3342781066894531, 0.345855712890625, 0.3574333190917969, 0.36901092529296875, 0.3805885314941406, 0.3921661376953125, 0.4037437438964844, 0.41532135009765625, 0.4268989562988281, 0.4384765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 10.0, 13.0, 10.0, 19.0, 31.0, 53.0, 95.0, 141.0, 239.0, 481.0, 1088.0, 3051.0, 12274.0, 73053.0, 627428.0, 286668.0, 33705.0, 6624.0, 1922.0, 735.0, 349.0, 197.0, 129.0, 83.0, 50.0, 33.0, 23.0, 16.0, 12.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3896484375, -1.345947265625, -1.30224609375, -1.258544921875, -1.21484375, -1.171142578125, -1.12744140625, -1.083740234375, -1.0400390625, -0.996337890625, -0.95263671875, -0.908935546875, -0.865234375, -0.821533203125, -0.77783203125, -0.734130859375, -0.6904296875, -0.646728515625, -0.60302734375, -0.559326171875, -0.515625, -0.471923828125, -0.42822265625, -0.384521484375, -0.3408203125, -0.297119140625, -0.25341796875, -0.209716796875, -0.166015625, -0.122314453125, -0.07861328125, -0.034912109375, 0.0087890625, 0.052490234375, 0.09619140625, 0.139892578125, 0.18359375, 0.227294921875, 0.27099609375, 0.314697265625, 0.3583984375, 0.402099609375, 0.44580078125, 0.489501953125, 0.533203125, 0.576904296875, 0.62060546875, 0.664306640625, 0.7080078125, 0.751708984375, 0.79541015625, 0.839111328125, 0.8828125, 0.926513671875, 0.97021484375, 1.013916015625, 1.0576171875, 1.101318359375, 1.14501953125, 1.188720703125, 1.232421875, 1.276123046875, 1.31982421875, 1.363525390625, 1.4072265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 10.0, 11.0, 7.0, 12.0, 13.0, 13.0, 23.0, 22.0, 26.0, 27.0, 31.0, 29.0, 35.0, 41.0, 32.0, 41.0, 45.0, 45.0, 35.0, 44.0, 46.0, 47.0, 48.0, 46.0, 32.0, 46.0, 30.0, 29.0, 27.0, 13.0, 16.0, 11.0, 11.0, 10.0, 7.0, 6.0, 5.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.435546875, -1.392852783203125, -1.35015869140625, -1.307464599609375, -1.2647705078125, -1.222076416015625, -1.17938232421875, -1.136688232421875, -1.093994140625, -1.051300048828125, -1.00860595703125, -0.965911865234375, -0.9232177734375, -0.880523681640625, -0.83782958984375, -0.795135498046875, -0.75244140625, -0.709747314453125, -0.66705322265625, -0.624359130859375, -0.5816650390625, -0.538970947265625, -0.49627685546875, -0.453582763671875, -0.410888671875, -0.368194580078125, -0.32550048828125, -0.282806396484375, -0.2401123046875, -0.197418212890625, -0.15472412109375, -0.112030029296875, -0.0693359375, -0.026641845703125, 0.01605224609375, 0.058746337890625, 0.1014404296875, 0.144134521484375, 0.18682861328125, 0.229522705078125, 0.272216796875, 0.314910888671875, 0.35760498046875, 0.400299072265625, 0.4429931640625, 0.485687255859375, 0.52838134765625, 0.571075439453125, 0.61376953125, 0.656463623046875, 0.69915771484375, 0.741851806640625, 0.7845458984375, 0.827239990234375, 0.86993408203125, 0.912628173828125, 0.955322265625, 0.998016357421875, 1.04071044921875, 1.083404541015625, 1.1260986328125, 1.168792724609375, 1.21148681640625, 1.254180908203125, 1.296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 10.0, 16.0, 35.0, 51.0, 98.0, 269.0, 801.0, 4939.0, 709463.0, 327380.0, 4236.0, 769.0, 256.0, 91.0, 59.0, 32.0, 19.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.88671875, -2.8126373291015625, -2.738555908203125, -2.6644744873046875, -2.59039306640625, -2.5163116455078125, -2.442230224609375, -2.3681488037109375, -2.2940673828125, -2.2199859619140625, -2.145904541015625, -2.0718231201171875, -1.99774169921875, -1.9236602783203125, -1.849578857421875, -1.7754974365234375, -1.701416015625, -1.6273345947265625, -1.553253173828125, -1.4791717529296875, -1.40509033203125, -1.3310089111328125, -1.256927490234375, -1.1828460693359375, -1.1087646484375, -1.0346832275390625, -0.960601806640625, -0.8865203857421875, -0.81243896484375, -0.7383575439453125, -0.664276123046875, -0.5901947021484375, -0.51611328125, -0.4420318603515625, -0.367950439453125, -0.2938690185546875, -0.21978759765625, -0.1457061767578125, -0.071624755859375, 0.0024566650390625, 0.0765380859375, 0.1506195068359375, 0.224700927734375, 0.2987823486328125, 0.37286376953125, 0.4469451904296875, 0.521026611328125, 0.5951080322265625, 0.669189453125, 0.7432708740234375, 0.817352294921875, 0.8914337158203125, 0.96551513671875, 1.0395965576171875, 1.113677978515625, 1.1877593994140625, 1.2618408203125, 1.3359222412109375, 1.410003662109375, 1.4840850830078125, 1.55816650390625, 1.6322479248046875, 1.706329345703125, 1.7804107666015625, 1.8544921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 8.0, 6.0, 5.0, 10.0, 10.0, 10.0, 19.0, 15.0, 28.0, 38.0, 62.0, 91.0, 81.0, 125.0, 111.0, 104.0, 73.0, 62.0, 49.0, 23.0, 29.0, 11.0, 6.0, 7.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.233287811279297e-05, -5.0693750381469727e-05, -4.9054622650146484e-05, -4.741549491882324e-05, -4.57763671875e-05, -4.413723945617676e-05, -4.2498111724853516e-05, -4.0858983993530273e-05, -3.921985626220703e-05, -3.758072853088379e-05, -3.594160079956055e-05, -3.4302473068237305e-05, -3.266334533691406e-05, -3.102421760559082e-05, -2.9385089874267578e-05, -2.7745962142944336e-05, -2.6106834411621094e-05, -2.446770668029785e-05, -2.282857894897461e-05, -2.1189451217651367e-05, -1.9550323486328125e-05, -1.7911195755004883e-05, -1.627206802368164e-05, -1.4632940292358398e-05, -1.2993812561035156e-05, -1.1354684829711914e-05, -9.715557098388672e-06, -8.07642936706543e-06, -6.4373016357421875e-06, -4.798173904418945e-06, -3.159046173095703e-06, -1.519918441772461e-06, 1.1920928955078125e-07, 1.7583370208740234e-06, 3.3974647521972656e-06, 5.036592483520508e-06, 6.67572021484375e-06, 8.314847946166992e-06, 9.953975677490234e-06, 1.1593103408813477e-05, 1.3232231140136719e-05, 1.4871358871459961e-05, 1.6510486602783203e-05, 1.8149614334106445e-05, 1.9788742065429688e-05, 2.142786979675293e-05, 2.3066997528076172e-05, 2.4706125259399414e-05, 2.6345252990722656e-05, 2.79843807220459e-05, 2.962350845336914e-05, 3.126263618469238e-05, 3.2901763916015625e-05, 3.454089164733887e-05, 3.618001937866211e-05, 3.781914710998535e-05, 3.9458274841308594e-05, 4.1097402572631836e-05, 4.273653030395508e-05, 4.437565803527832e-05, 4.601478576660156e-05, 4.7653913497924805e-05, 4.929304122924805e-05, 5.093216896057129e-05, 5.257129669189453e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 8.0, 9.0, 7.0, 19.0, 38.0, 45.0, 74.0, 159.0, 381.0, 739.0, 2006.0, 8676.0, 114507.0, 871439.0, 42575.0, 5139.0, 1461.0, 613.0, 295.0, 149.0, 63.0, 57.0, 25.0, 18.0, 15.0, 6.0, 8.0, 5.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.986328125, -0.953826904296875, -0.92132568359375, -0.888824462890625, -0.8563232421875, -0.823822021484375, -0.79132080078125, -0.758819580078125, -0.726318359375, -0.693817138671875, -0.66131591796875, -0.628814697265625, -0.5963134765625, -0.563812255859375, -0.53131103515625, -0.498809814453125, -0.46630859375, -0.433807373046875, -0.40130615234375, -0.368804931640625, -0.3363037109375, -0.303802490234375, -0.27130126953125, -0.238800048828125, -0.206298828125, -0.173797607421875, -0.14129638671875, -0.108795166015625, -0.0762939453125, -0.043792724609375, -0.01129150390625, 0.021209716796875, 0.0537109375, 0.086212158203125, 0.11871337890625, 0.151214599609375, 0.1837158203125, 0.216217041015625, 0.24871826171875, 0.281219482421875, 0.313720703125, 0.346221923828125, 0.37872314453125, 0.411224365234375, 0.4437255859375, 0.476226806640625, 0.50872802734375, 0.541229248046875, 0.57373046875, 0.606231689453125, 0.63873291015625, 0.671234130859375, 0.7037353515625, 0.736236572265625, 0.76873779296875, 0.801239013671875, 0.833740234375, 0.866241455078125, 0.89874267578125, 0.931243896484375, 0.9637451171875, 0.996246337890625, 1.02874755859375, 1.061248779296875, 1.09375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 13.0, 23.0, 21.0, 52.0, 82.0, 137.0, 173.0, 167.0, 126.0, 82.0, 36.0, 29.0, 26.0, 7.0, 11.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5596160888671875, -1.510833740234375, -1.4620513916015625, -1.41326904296875, -1.3644866943359375, -1.315704345703125, -1.2669219970703125, -1.2181396484375, -1.1693572998046875, -1.120574951171875, -1.0717926025390625, -1.02301025390625, -0.9742279052734375, -0.925445556640625, -0.8766632080078125, -0.827880859375, -0.7790985107421875, -0.730316162109375, -0.6815338134765625, -0.63275146484375, -0.5839691162109375, -0.535186767578125, -0.4864044189453125, -0.4376220703125, -0.3888397216796875, -0.340057373046875, -0.2912750244140625, -0.24249267578125, -0.1937103271484375, -0.144927978515625, -0.0961456298828125, -0.04736328125, 0.0014190673828125, 0.050201416015625, 0.0989837646484375, 0.14776611328125, 0.1965484619140625, 0.245330810546875, 0.2941131591796875, 0.3428955078125, 0.3916778564453125, 0.440460205078125, 0.4892425537109375, 0.53802490234375, 0.5868072509765625, 0.635589599609375, 0.6843719482421875, 0.733154296875, 0.7819366455078125, 0.830718994140625, 0.8795013427734375, 0.92828369140625, 0.9770660400390625, 1.025848388671875, 1.0746307373046875, 1.1234130859375, 1.1721954345703125, 1.220977783203125, 1.2697601318359375, 1.31854248046875, 1.3673248291015625, 1.416107177734375, 1.4648895263671875, 1.513671875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 15.0, 55.0, 301.0, 513.0, 79.0, 15.0, 12.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.141454696655273, -15.250275611877441, -14.35909652709961, -13.467917442321777, -12.576738357543945, -11.685559272766113, -10.794380187988281, -9.90320110321045, -9.012022018432617, -8.120842933654785, -7.229663848876953, -6.338484764099121, -5.447305679321289, -4.556126594543457, -3.664947509765625, -2.773768424987793, -1.882589340209961, -0.9914102554321289, -0.10023117065429688, 0.7909479141235352, 1.6821269989013672, 2.573306083679199, 3.4644851684570312, 4.355664253234863, 5.246843338012695, 6.138022422790527, 7.029201507568359, 7.920380592346191, 8.811559677124023, 9.702738761901855, 10.593917846679688, 11.48509693145752, 12.376274108886719, 13.26745319366455, 14.158632278442383, 15.049811363220215, 15.940990447998047, 16.832168579101562, 17.72334861755371, 18.61452865600586, 19.505706787109375, 20.39688491821289, 21.28806495666504, 22.179244995117188, 23.070423126220703, 23.96160125732422, 24.852781295776367, 25.743961334228516, 26.63513946533203, 27.526317596435547, 28.417497634887695, 29.308677673339844, 30.19985580444336, 31.091033935546875, 31.982213973999023, 32.87339401245117, 33.76457214355469, 34.6557502746582, 35.54692840576172, 36.4381103515625, 37.329288482666016, 38.22046661376953, 39.11164855957031, 40.00282669067383, 40.894004821777344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 2.0, 5.0, 5.0, 4.0, 6.0, 16.0, 18.0, 31.0, 44.0, 61.0, 93.0, 112.0, 143.0, 115.0, 86.0, 68.0, 42.0, 25.0, 19.0, 15.0, 11.0, 9.0, 7.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-22.497350692749023, -21.807695388793945, -21.118038177490234, -20.428382873535156, -19.738727569580078, -19.049072265625, -18.35941505432129, -17.66975975036621, -16.980104446411133, -16.290449142456055, -15.60079288482666, -14.911136627197266, -14.221481323242188, -13.531825065612793, -12.842168807983398, -12.15251350402832, -11.462857246398926, -10.773200988769531, -10.083545684814453, -9.393889427185059, -8.70423412322998, -8.014577865600586, -7.32492208480835, -6.635266304016113, -5.945610523223877, -5.255954742431641, -4.566298961639404, -3.876642942428589, -3.1869871616363525, -2.497331380844116, -1.8076753616333008, -1.1180195808410645, -0.4283638000488281, 0.261292040348053, 0.9509478807449341, 1.64060378074646, 2.3302595615386963, 3.0199153423309326, 3.709571361541748, 4.399227142333984, 5.088882923126221, 5.778538703918457, 6.468194484710693, 7.15785026550293, 7.847506523132324, 8.537161827087402, 9.226818084716797, 9.916473388671875, 10.60612964630127, 11.295785903930664, 11.985441207885742, 12.675097465515137, 13.364752769470215, 14.05440902709961, 14.744064331054688, 15.433720588684082, 16.123376846313477, 16.813032150268555, 17.502689361572266, 18.192344665527344, 18.881999969482422, 19.5716552734375, 20.26131248474121, 20.95096778869629, 21.640623092651367]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 9.0, 10.0, 7.0, 18.0, 32.0, 43.0, 91.0, 103.0, 228.0, 433.0, 901.0, 2067.0, 6022.0, 25759.0, 3098938.0, 1028853.0, 21645.0, 5324.0, 1841.0, 887.0, 432.0, 243.0, 120.0, 86.0, 61.0, 47.0, 29.0, 7.0, 8.0, 13.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.335845947265625, -3.21661376953125, -3.097381591796875, -2.9781494140625, -2.858917236328125, -2.73968505859375, -2.620452880859375, -2.501220703125, -2.381988525390625, -2.26275634765625, -2.143524169921875, -2.0242919921875, -1.905059814453125, -1.78582763671875, -1.666595458984375, -1.54736328125, -1.428131103515625, -1.30889892578125, -1.189666748046875, -1.0704345703125, -0.951202392578125, -0.83197021484375, -0.712738037109375, -0.593505859375, -0.474273681640625, -0.35504150390625, -0.235809326171875, -0.1165771484375, 0.002655029296875, 0.12188720703125, 0.241119384765625, 0.3603515625, 0.479583740234375, 0.59881591796875, 0.718048095703125, 0.8372802734375, 0.956512451171875, 1.07574462890625, 1.194976806640625, 1.314208984375, 1.433441162109375, 1.55267333984375, 1.671905517578125, 1.7911376953125, 1.910369873046875, 2.02960205078125, 2.148834228515625, 2.26806640625, 2.387298583984375, 2.50653076171875, 2.625762939453125, 2.7449951171875, 2.864227294921875, 2.98345947265625, 3.102691650390625, 3.221923828125, 3.341156005859375, 3.46038818359375, 3.579620361328125, 3.6988525390625, 3.818084716796875, 3.93731689453125, 4.056549072265625, 4.17578125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 6.0, 17.0, 12.0, 13.0, 17.0, 34.0, 100.0, 393.0, 252.0, 52.0, 23.0, 19.0, 12.0, 12.0, 6.0, 5.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3828125, -0.3699302673339844, -0.35704803466796875, -0.3441658020019531, -0.3312835693359375, -0.3184013366699219, -0.30551910400390625, -0.2926368713378906, -0.279754638671875, -0.2668724060058594, -0.25399017333984375, -0.24110794067382812, -0.2282257080078125, -0.21534347534179688, -0.20246124267578125, -0.18957901000976562, -0.17669677734375, -0.16381454467773438, -0.15093231201171875, -0.13805007934570312, -0.1251678466796875, -0.11228561401367188, -0.09940338134765625, -0.08652114868164062, -0.073638916015625, -0.060756683349609375, -0.04787445068359375, -0.034992218017578125, -0.0221099853515625, -0.009227752685546875, 0.00365447998046875, 0.016536712646484375, 0.0294189453125, 0.042301177978515625, 0.05518341064453125, 0.06806564331054688, 0.0809478759765625, 0.09383010864257812, 0.10671234130859375, 0.11959457397460938, 0.132476806640625, 0.14535903930664062, 0.15824127197265625, 0.17112350463867188, 0.1840057373046875, 0.19688796997070312, 0.20977020263671875, 0.22265243530273438, 0.23553466796875, 0.24841690063476562, 0.26129913330078125, 0.2741813659667969, 0.2870635986328125, 0.2999458312988281, 0.31282806396484375, 0.3257102966308594, 0.338592529296875, 0.3514747619628906, 0.36435699462890625, 0.3772392272949219, 0.3901214599609375, 0.4030036926269531, 0.41588592529296875, 0.4287681579589844, 0.441650390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 13.0, 11.0, 14.0, 25.0, 45.0, 58.0, 127.0, 261.0, 539.0, 1376.0, 4078.0, 21077.0, 551520.0, 3571400.0, 35365.0, 5498.0, 1610.0, 636.0, 264.0, 157.0, 74.0, 47.0, 22.0, 18.0, 10.0, 8.0, 4.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.478118896484375, -1.41131591796875, -1.344512939453125, -1.2777099609375, -1.210906982421875, -1.14410400390625, -1.077301025390625, -1.010498046875, -0.943695068359375, -0.87689208984375, -0.810089111328125, -0.7432861328125, -0.676483154296875, -0.60968017578125, -0.542877197265625, -0.47607421875, -0.409271240234375, -0.34246826171875, -0.275665283203125, -0.2088623046875, -0.142059326171875, -0.07525634765625, -0.008453369140625, 0.058349609375, 0.125152587890625, 0.19195556640625, 0.258758544921875, 0.3255615234375, 0.392364501953125, 0.45916748046875, 0.525970458984375, 0.5927734375, 0.659576416015625, 0.72637939453125, 0.793182373046875, 0.8599853515625, 0.926788330078125, 0.99359130859375, 1.060394287109375, 1.127197265625, 1.194000244140625, 1.26080322265625, 1.327606201171875, 1.3944091796875, 1.461212158203125, 1.52801513671875, 1.594818115234375, 1.66162109375, 1.728424072265625, 1.79522705078125, 1.862030029296875, 1.9288330078125, 1.995635986328125, 2.06243896484375, 2.129241943359375, 2.196044921875, 2.262847900390625, 2.32965087890625, 2.396453857421875, 2.4632568359375, 2.530059814453125, 2.59686279296875, 2.663665771484375, 2.73046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 13.0, 15.0, 12.0, 14.0, 38.0, 61.0, 68.0, 113.0, 237.0, 613.0, 1817.0, 579.0, 185.0, 103.0, 55.0, 38.0, 25.0, 17.0, 14.0, 11.0, 12.0, 2.0, 8.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4072265625, -0.3960838317871094, -0.38494110107421875, -0.3737983703613281, -0.3626556396484375, -0.3515129089355469, -0.34037017822265625, -0.3292274475097656, -0.318084716796875, -0.3069419860839844, -0.29579925537109375, -0.2846565246582031, -0.2735137939453125, -0.2623710632324219, -0.25122833251953125, -0.24008560180664062, -0.22894287109375, -0.21780014038085938, -0.20665740966796875, -0.19551467895507812, -0.1843719482421875, -0.17322921752929688, -0.16208648681640625, -0.15094375610351562, -0.139801025390625, -0.12865829467773438, -0.11751556396484375, -0.10637283325195312, -0.0952301025390625, -0.08408737182617188, -0.07294464111328125, -0.061801910400390625, -0.0506591796875, -0.039516448974609375, -0.02837371826171875, -0.017230987548828125, -0.0060882568359375, 0.005054473876953125, 0.01619720458984375, 0.027339935302734375, 0.038482666015625, 0.049625396728515625, 0.06076812744140625, 0.07191085815429688, 0.0830535888671875, 0.09419631958007812, 0.10533905029296875, 0.11648178100585938, 0.12762451171875, 0.13876724243164062, 0.14990997314453125, 0.16105270385742188, 0.1721954345703125, 0.18333816528320312, 0.19448089599609375, 0.20562362670898438, 0.216766357421875, 0.22790908813476562, 0.23905181884765625, 0.2501945495605469, 0.2613372802734375, 0.2724800109863281, 0.28362274169921875, 0.2947654724121094, 0.305908203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 15.0, 152.0, 802.0, 18.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.02397346496582, -19.668811798095703, -19.313648223876953, -18.958486557006836, -18.60332489013672, -18.24816131591797, -17.89299964904785, -17.537837982177734, -17.182674407958984, -16.827512741088867, -16.472349166870117, -16.1171875, -15.762024879455566, -15.406862258911133, -15.051700592041016, -14.696537971496582, -14.341376304626465, -13.986213684082031, -13.631052017211914, -13.27588939666748, -12.920726776123047, -12.56556510925293, -12.210402488708496, -11.855239868164062, -11.500078201293945, -11.144915580749512, -10.789753913879395, -10.434591293334961, -10.079428672790527, -9.724266052246094, -9.369104385375977, -9.013941764831543, -8.65877914428711, -8.303616523742676, -7.9484543800354, -7.593292236328125, -7.238129615783691, -6.882967472076416, -6.527805328369141, -6.172642707824707, -5.817480087280273, -5.462317943572998, -5.1071553230285645, -4.751993179321289, -4.3968305587768555, -4.04166841506958, -3.6865062713623047, -3.33134388923645, -2.9761815071105957, -2.621019124984741, -2.2658567428588867, -1.9106945991516113, -1.5555322170257568, -1.2003698348999023, -0.845207691192627, -0.49004530906677246, -0.13488292694091797, 0.22027939558029175, 0.5754417181015015, 0.9306039810180664, 1.285766363143921, 1.6409287452697754, 1.9960908889770508, 2.3512532711029053, 2.7064156532287598]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 11.0, 13.0, 23.0, 21.0, 36.0, 42.0, 48.0, 56.0, 61.0, 50.0, 56.0, 72.0, 68.0, 73.0, 54.0, 47.0, 57.0, 34.0, 29.0, 25.0, 20.0, 20.0, 9.0, 7.0, 12.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4993104934692383, -1.4471986293792725, -1.3950867652893066, -1.3429749011993408, -1.2908631563186646, -1.2387512922286987, -1.186639428138733, -1.134527564048767, -1.0824156999588013, -1.0303038358688354, -0.9781920313835144, -0.9260801672935486, -0.8739683032035828, -0.8218564987182617, -0.7697446346282959, -0.7176327705383301, -0.665520966053009, -0.6134091019630432, -0.5612972974777222, -0.5091854333877563, -0.4570735692977905, -0.4049617350101471, -0.35284990072250366, -0.30073803663253784, -0.2486262023448944, -0.19651435315608978, -0.14440250396728516, -0.09229066967964172, -0.0401788204908371, 0.01193302869796753, 0.06404486298561096, 0.11615672707557678, 0.16826856136322021, 0.22038041055202484, 0.27249225974082947, 0.3246040940284729, 0.3767159581184387, 0.42882779240608215, 0.4809396266937256, 0.5330514907836914, 0.5851633548736572, 0.637275218963623, 0.6893870234489441, 0.7414988875389099, 0.7936107516288757, 0.8457225561141968, 0.8978344202041626, 0.9499462842941284, 1.0020580291748047, 1.0541698932647705, 1.1062817573547363, 1.1583936214447021, 1.2105053663253784, 1.2626172304153442, 1.31472909450531, 1.3668409585952759, 1.4189528226852417, 1.4710646867752075, 1.5231765508651733, 1.5752882957458496, 1.6274001598358154, 1.6795120239257812, 1.731623888015747, 1.783735752105713, 1.8358476161956787]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 15.0, 9.0, 17.0, 29.0, 34.0, 43.0, 82.0, 88.0, 136.0, 272.0, 461.0, 766.0, 1510.0, 3280.0, 8532.0, 29035.0, 580104.0, 384297.0, 25708.0, 7742.0, 3082.0, 1436.0, 740.0, 396.0, 243.0, 157.0, 101.0, 65.0, 48.0, 31.0, 25.0, 18.0, 14.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.2890625, -2.2196044921875, -2.150146484375, -2.0806884765625, -2.01123046875, -1.9417724609375, -1.872314453125, -1.8028564453125, -1.7333984375, -1.6639404296875, -1.594482421875, -1.5250244140625, -1.45556640625, -1.3861083984375, -1.316650390625, -1.2471923828125, -1.177734375, -1.1082763671875, -1.038818359375, -0.9693603515625, -0.89990234375, -0.8304443359375, -0.760986328125, -0.6915283203125, -0.6220703125, -0.5526123046875, -0.483154296875, -0.4136962890625, -0.34423828125, -0.2747802734375, -0.205322265625, -0.1358642578125, -0.06640625, 0.0030517578125, 0.072509765625, 0.1419677734375, 0.21142578125, 0.2808837890625, 0.350341796875, 0.4197998046875, 0.4892578125, 0.5587158203125, 0.628173828125, 0.6976318359375, 0.76708984375, 0.8365478515625, 0.906005859375, 0.9754638671875, 1.044921875, 1.1143798828125, 1.183837890625, 1.2532958984375, 1.32275390625, 1.3922119140625, 1.461669921875, 1.5311279296875, 1.6005859375, 1.6700439453125, 1.739501953125, 1.8089599609375, 1.87841796875, 1.9478759765625, 2.017333984375, 2.0867919921875, 2.15625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 12.0, 14.0, 19.0, 30.0, 128.0, 341.0, 269.0, 92.0, 24.0, 12.0, 13.0, 7.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3843536376953125, -0.371002197265625, -0.3576507568359375, -0.34429931640625, -0.3309478759765625, -0.317596435546875, -0.3042449951171875, -0.2908935546875, -0.2775421142578125, -0.264190673828125, -0.2508392333984375, -0.23748779296875, -0.2241363525390625, -0.210784912109375, -0.1974334716796875, -0.18408203125, -0.1707305908203125, -0.157379150390625, -0.1440277099609375, -0.13067626953125, -0.1173248291015625, -0.103973388671875, -0.0906219482421875, -0.0772705078125, -0.0639190673828125, -0.050567626953125, -0.0372161865234375, -0.02386474609375, -0.0105133056640625, 0.002838134765625, 0.0161895751953125, 0.029541015625, 0.0428924560546875, 0.056243896484375, 0.0695953369140625, 0.08294677734375, 0.0962982177734375, 0.109649658203125, 0.1230010986328125, 0.1363525390625, 0.1497039794921875, 0.163055419921875, 0.1764068603515625, 0.18975830078125, 0.2031097412109375, 0.216461181640625, 0.2298126220703125, 0.2431640625, 0.2565155029296875, 0.269866943359375, 0.2832183837890625, 0.29656982421875, 0.3099212646484375, 0.323272705078125, 0.3366241455078125, 0.3499755859375, 0.3633270263671875, 0.376678466796875, 0.3900299072265625, 0.40338134765625, 0.4167327880859375, 0.430084228515625, 0.4434356689453125, 0.456787109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 7.0, 12.0, 19.0, 21.0, 24.0, 44.0, 44.0, 72.0, 85.0, 139.0, 195.0, 330.0, 559.0, 1093.0, 2480.0, 7001.0, 24795.0, 113666.0, 529330.0, 294299.0, 54141.0, 13145.0, 3884.0, 1481.0, 659.0, 340.0, 207.0, 126.0, 100.0, 59.0, 40.0, 45.0, 22.0, 16.0, 17.0, 8.0, 9.0, 7.0, 7.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.205078125, -1.1747817993164062, -1.1444854736328125, -1.1141891479492188, -1.083892822265625, -1.0535964965820312, -1.0233001708984375, -0.9930038452148438, -0.96270751953125, -0.9324111938476562, -0.9021148681640625, -0.8718185424804688, -0.841522216796875, -0.8112258911132812, -0.7809295654296875, -0.7506332397460938, -0.7203369140625, -0.6900405883789062, -0.6597442626953125, -0.6294479370117188, -0.599151611328125, -0.5688552856445312, -0.5385589599609375, -0.5082626342773438, -0.47796630859375, -0.44766998291015625, -0.4173736572265625, -0.38707733154296875, -0.356781005859375, -0.32648468017578125, -0.2961883544921875, -0.26589202880859375, -0.235595703125, -0.20529937744140625, -0.1750030517578125, -0.14470672607421875, -0.114410400390625, -0.08411407470703125, -0.0538177490234375, -0.02352142333984375, 0.00677490234375, 0.03707122802734375, 0.0673675537109375, 0.09766387939453125, 0.127960205078125, 0.15825653076171875, 0.1885528564453125, 0.21884918212890625, 0.2491455078125, 0.27944183349609375, 0.3097381591796875, 0.34003448486328125, 0.370330810546875, 0.40062713623046875, 0.4309234619140625, 0.46121978759765625, 0.49151611328125, 0.5218124389648438, 0.5521087646484375, 0.5824050903320312, 0.612701416015625, 0.6429977416992188, 0.6732940673828125, 0.7035903930664062, 0.73388671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 12.0, 11.0, 17.0, 21.0, 26.0, 27.0, 34.0, 39.0, 28.0, 32.0, 37.0, 52.0, 46.0, 36.0, 51.0, 37.0, 45.0, 52.0, 43.0, 50.0, 40.0, 39.0, 27.0, 34.0, 20.0, 20.0, 18.0, 23.0, 13.0, 14.0, 9.0, 5.0, 7.0, 2.0, 7.0, 3.0, 1.0, 1.0], "bins": [-1.0517578125, -1.0261688232421875, -1.000579833984375, -0.9749908447265625, -0.94940185546875, -0.9238128662109375, -0.898223876953125, -0.8726348876953125, -0.8470458984375, -0.8214569091796875, -0.795867919921875, -0.7702789306640625, -0.74468994140625, -0.7191009521484375, -0.693511962890625, -0.6679229736328125, -0.642333984375, -0.6167449951171875, -0.591156005859375, -0.5655670166015625, -0.53997802734375, -0.5143890380859375, -0.488800048828125, -0.4632110595703125, -0.4376220703125, -0.4120330810546875, -0.386444091796875, -0.3608551025390625, -0.33526611328125, -0.3096771240234375, -0.284088134765625, -0.2584991455078125, -0.23291015625, -0.2073211669921875, -0.181732177734375, -0.1561431884765625, -0.13055419921875, -0.1049652099609375, -0.079376220703125, -0.0537872314453125, -0.0281982421875, -0.0026092529296875, 0.022979736328125, 0.0485687255859375, 0.07415771484375, 0.0997467041015625, 0.125335693359375, 0.1509246826171875, 0.176513671875, 0.2021026611328125, 0.227691650390625, 0.2532806396484375, 0.27886962890625, 0.3044586181640625, 0.330047607421875, 0.3556365966796875, 0.3812255859375, 0.4068145751953125, 0.432403564453125, 0.4579925537109375, 0.48358154296875, 0.5091705322265625, 0.534759521484375, 0.5603485107421875, 0.5859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 16.0, 23.0, 33.0, 64.0, 157.0, 379.0, 1118.0, 6428.0, 926036.0, 109851.0, 3212.0, 695.0, 250.0, 124.0, 49.0, 30.0, 27.0, 12.0, 7.0, 5.0, 4.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314453125, -3.216522216796875, -3.11859130859375, -3.020660400390625, -2.9227294921875, -2.824798583984375, -2.72686767578125, -2.628936767578125, -2.531005859375, -2.433074951171875, -2.33514404296875, -2.237213134765625, -2.1392822265625, -2.041351318359375, -1.94342041015625, -1.845489501953125, -1.74755859375, -1.649627685546875, -1.55169677734375, -1.453765869140625, -1.3558349609375, -1.257904052734375, -1.15997314453125, -1.062042236328125, -0.964111328125, -0.866180419921875, -0.76824951171875, -0.670318603515625, -0.5723876953125, -0.474456787109375, -0.37652587890625, -0.278594970703125, -0.1806640625, -0.082733154296875, 0.01519775390625, 0.113128662109375, 0.2110595703125, 0.308990478515625, 0.40692138671875, 0.504852294921875, 0.602783203125, 0.700714111328125, 0.79864501953125, 0.896575927734375, 0.9945068359375, 1.092437744140625, 1.19036865234375, 1.288299560546875, 1.38623046875, 1.484161376953125, 1.58209228515625, 1.680023193359375, 1.7779541015625, 1.875885009765625, 1.97381591796875, 2.071746826171875, 2.169677734375, 2.267608642578125, 2.36553955078125, 2.463470458984375, 2.5614013671875, 2.659332275390625, 2.75726318359375, 2.855194091796875, 2.953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 6.0, 9.0, 11.0, 14.0, 24.0, 57.0, 63.0, 149.0, 298.0, 159.0, 69.0, 46.0, 25.0, 15.0, 11.0, 5.0, 8.0, 3.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003046989440917969, -0.0002963319420814514, -0.00028796494007110596, -0.0002795979380607605, -0.00027123093605041504, -0.0002628639340400696, -0.0002544969320297241, -0.00024612993001937866, -0.0002377629280090332, -0.00022939592599868774, -0.00022102892398834229, -0.00021266192197799683, -0.00020429491996765137, -0.0001959279179573059, -0.00018756091594696045, -0.000179193913936615, -0.00017082691192626953, -0.00016245990991592407, -0.0001540929079055786, -0.00014572590589523315, -0.0001373589038848877, -0.00012899190187454224, -0.00012062489986419678, -0.00011225789785385132, -0.00010389089584350586, -9.55238938331604e-05, -8.715689182281494e-05, -7.878988981246948e-05, -7.042288780212402e-05, -6.205588579177856e-05, -5.3688883781433105e-05, -4.5321881771087646e-05, -3.695487976074219e-05, -2.858787775039673e-05, -2.022087574005127e-05, -1.185387372970581e-05, -3.4868717193603516e-06, 4.880130290985107e-06, 1.3247132301330566e-05, 2.1614134311676025e-05, 2.9981136322021484e-05, 3.834813833236694e-05, 4.67151403427124e-05, 5.508214235305786e-05, 6.344914436340332e-05, 7.181614637374878e-05, 8.018314838409424e-05, 8.85501503944397e-05, 9.691715240478516e-05, 0.00010528415441513062, 0.00011365115642547607, 0.00012201815843582153, 0.000130385160446167, 0.00013875216245651245, 0.0001471191644668579, 0.00015548616647720337, 0.00016385316848754883, 0.0001722201704978943, 0.00018058717250823975, 0.0001889541745185852, 0.00019732117652893066, 0.00020568817853927612, 0.00021405518054962158, 0.00022242218255996704, 0.0002307891845703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 12.0, 15.0, 36.0, 47.0, 91.0, 208.0, 464.0, 1209.0, 6105.0, 189533.0, 835427.0, 12638.0, 1755.0, 525.0, 243.0, 106.0, 65.0, 25.0, 17.0, 6.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.19134521484375, -2.1307373046875, -2.07012939453125, -2.009521484375, -1.94891357421875, -1.8883056640625, -1.82769775390625, -1.76708984375, -1.70648193359375, -1.6458740234375, -1.58526611328125, -1.524658203125, -1.46405029296875, -1.4034423828125, -1.34283447265625, -1.2822265625, -1.22161865234375, -1.1610107421875, -1.10040283203125, -1.039794921875, -0.97918701171875, -0.9185791015625, -0.85797119140625, -0.79736328125, -0.73675537109375, -0.6761474609375, -0.61553955078125, -0.554931640625, -0.49432373046875, -0.4337158203125, -0.37310791015625, -0.3125, -0.25189208984375, -0.1912841796875, -0.13067626953125, -0.070068359375, -0.00946044921875, 0.0511474609375, 0.11175537109375, 0.17236328125, 0.23297119140625, 0.2935791015625, 0.35418701171875, 0.414794921875, 0.47540283203125, 0.5360107421875, 0.59661865234375, 0.6572265625, 0.71783447265625, 0.7784423828125, 0.83905029296875, 0.899658203125, 0.96026611328125, 1.0208740234375, 1.08148193359375, 1.14208984375, 1.20269775390625, 1.2633056640625, 1.32391357421875, 1.384521484375, 1.44512939453125, 1.5057373046875, 1.56634521484375, 1.626953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 16.0, 34.0, 51.0, 78.0, 150.0, 196.0, 161.0, 131.0, 67.0, 38.0, 28.0, 18.0, 10.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.283966064453125, -1.24371337890625, -1.203460693359375, -1.1632080078125, -1.122955322265625, -1.08270263671875, -1.042449951171875, -1.002197265625, -0.961944580078125, -0.92169189453125, -0.881439208984375, -0.8411865234375, -0.800933837890625, -0.76068115234375, -0.720428466796875, -0.68017578125, -0.639923095703125, -0.59967041015625, -0.559417724609375, -0.5191650390625, -0.478912353515625, -0.43865966796875, -0.398406982421875, -0.358154296875, -0.317901611328125, -0.27764892578125, -0.237396240234375, -0.1971435546875, -0.156890869140625, -0.11663818359375, -0.076385498046875, -0.0361328125, 0.004119873046875, 0.04437255859375, 0.084625244140625, 0.1248779296875, 0.165130615234375, 0.20538330078125, 0.245635986328125, 0.285888671875, 0.326141357421875, 0.36639404296875, 0.406646728515625, 0.4468994140625, 0.487152099609375, 0.52740478515625, 0.567657470703125, 0.60791015625, 0.648162841796875, 0.68841552734375, 0.728668212890625, 0.7689208984375, 0.809173583984375, 0.84942626953125, 0.889678955078125, 0.929931640625, 0.970184326171875, 1.01043701171875, 1.050689697265625, 1.0909423828125, 1.131195068359375, 1.17144775390625, 1.211700439453125, 1.251953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 57.0, 775.0, 148.0, 14.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.953643798828125, -23.853364944458008, -22.75308609008789, -21.65280532836914, -20.552526473999023, -19.452247619628906, -18.351966857910156, -17.25168800354004, -16.151409149169922, -15.051130294799805, -13.950850486755371, -12.850570678710938, -11.75029182434082, -10.650012969970703, -9.54973316192627, -8.449453353881836, -7.349174499511719, -6.248895168304443, -5.148615837097168, -4.048336505889893, -2.948057174682617, -1.8477778434753418, -0.7474985122680664, 0.352780818939209, 1.4530601501464844, 2.5533394813537598, 3.653618812561035, 4.7538981437683105, 5.854177474975586, 6.954456806182861, 8.054736137390137, 9.15501594543457, 10.255294799804688, 11.355573654174805, 12.455853462219238, 13.556133270263672, 14.656412124633789, 15.756690979003906, 16.856971740722656, 17.957250595092773, 19.05752944946289, 20.157808303833008, 21.258087158203125, 22.358367919921875, 23.458646774291992, 24.55892562866211, 25.65920639038086, 26.759485244750977, 27.859764099121094, 28.96004295349121, 30.060321807861328, 31.160602569580078, 32.26087951660156, 33.36116027832031, 34.46144104003906, 35.56171798706055, 36.6619987487793, 37.76227951049805, 38.86255645751953, 39.96283721923828, 41.06311798095703, 42.163394927978516, 43.263675689697266, 44.36395263671875, 45.4642333984375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 1.0, 11.0, 11.0, 26.0, 33.0, 42.0, 57.0, 57.0, 90.0, 96.0, 108.0, 92.0, 72.0, 65.0, 52.0, 41.0, 31.0, 25.0, 14.0, 11.0, 7.0, 3.0, 6.0, 8.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.809890747070312, -10.494063377380371, -10.17823600769043, -9.862409591674805, -9.546582221984863, -9.230754852294922, -8.914928436279297, -8.599101066589355, -8.283273696899414, -7.967446327209473, -7.6516194343566895, -7.335792541503906, -7.019965171813965, -6.704137802124023, -6.38831090927124, -6.072484016418457, -5.756656646728516, -5.440829277038574, -5.125002384185791, -4.809175491333008, -4.493348121643066, -4.177520751953125, -3.861693859100342, -3.5458667278289795, -3.230039596557617, -2.914212465286255, -2.5983853340148926, -2.2825582027435303, -1.966731071472168, -1.6509039402008057, -1.3350768089294434, -1.019249677658081, -0.7034215927124023, -0.38759446144104004, -0.07176733016967773, 0.24405980110168457, 0.5598869323730469, 0.8757140636444092, 1.1915411949157715, 1.5073683261871338, 1.823195457458496, 2.1390225887298584, 2.4548497200012207, 2.770676851272583, 3.0865039825439453, 3.4023311138153076, 3.71815824508667, 4.033985137939453, 4.3498125076293945, 4.665639877319336, 4.981466770172119, 5.297293663024902, 5.613121032714844, 5.928948402404785, 6.244775295257568, 6.560602188110352, 6.876429557800293, 7.192256927490234, 7.508083820343018, 7.823910713195801, 8.139738082885742, 8.455565452575684, 8.771392822265625, 9.08721923828125, 9.403046607971191]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 9.0, 8.0, 4.0, 5.0, 10.0, 14.0, 11.0, 18.0, 26.0, 47.0, 52.0, 83.0, 99.0, 214.0, 370.0, 736.0, 1884.0, 5449.0, 56606.0, 4106014.0, 16871.0, 3105.0, 1114.0, 567.0, 321.0, 190.0, 156.0, 91.0, 58.0, 32.0, 23.0, 21.0, 11.0, 12.0, 5.0, 4.0, 9.0, 3.0, 5.0, 6.0, 8.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7578125, -6.5347900390625, -6.311767578125, -6.0887451171875, -5.86572265625, -5.6427001953125, -5.419677734375, -5.1966552734375, -4.9736328125, -4.7506103515625, -4.527587890625, -4.3045654296875, -4.08154296875, -3.8585205078125, -3.635498046875, -3.4124755859375, -3.189453125, -2.9664306640625, -2.743408203125, -2.5203857421875, -2.29736328125, -2.0743408203125, -1.851318359375, -1.6282958984375, -1.4052734375, -1.1822509765625, -0.959228515625, -0.7362060546875, -0.51318359375, -0.2901611328125, -0.067138671875, 0.1558837890625, 0.37890625, 0.6019287109375, 0.824951171875, 1.0479736328125, 1.27099609375, 1.4940185546875, 1.717041015625, 1.9400634765625, 2.1630859375, 2.3861083984375, 2.609130859375, 2.8321533203125, 3.05517578125, 3.2781982421875, 3.501220703125, 3.7242431640625, 3.947265625, 4.1702880859375, 4.393310546875, 4.6163330078125, 4.83935546875, 5.0623779296875, 5.285400390625, 5.5084228515625, 5.7314453125, 5.9544677734375, 6.177490234375, 6.4005126953125, 6.62353515625, 6.8465576171875, 7.069580078125, 7.2926025390625, 7.515625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 19.0, 20.0, 31.0, 72.0, 237.0, 313.0, 191.0, 52.0, 26.0, 9.0, 9.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.435821533203125, -0.42095947265625, -0.406097412109375, -0.3912353515625, -0.376373291015625, -0.36151123046875, -0.346649169921875, -0.331787109375, -0.316925048828125, -0.30206298828125, -0.287200927734375, -0.2723388671875, -0.257476806640625, -0.24261474609375, -0.227752685546875, -0.212890625, -0.198028564453125, -0.18316650390625, -0.168304443359375, -0.1534423828125, -0.138580322265625, -0.12371826171875, -0.108856201171875, -0.093994140625, -0.079132080078125, -0.06427001953125, -0.049407958984375, -0.0345458984375, -0.019683837890625, -0.00482177734375, 0.010040283203125, 0.02490234375, 0.039764404296875, 0.05462646484375, 0.069488525390625, 0.0843505859375, 0.099212646484375, 0.11407470703125, 0.128936767578125, 0.143798828125, 0.158660888671875, 0.17352294921875, 0.188385009765625, 0.2032470703125, 0.218109130859375, 0.23297119140625, 0.247833251953125, 0.2626953125, 0.277557373046875, 0.29241943359375, 0.307281494140625, 0.3221435546875, 0.337005615234375, 0.35186767578125, 0.366729736328125, 0.381591796875, 0.396453857421875, 0.41131591796875, 0.426177978515625, 0.4410400390625, 0.455902099609375, 0.47076416015625, 0.485626220703125, 0.50048828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 11.0, 5.0, 10.0, 19.0, 21.0, 44.0, 62.0, 151.0, 487.0, 3568.0, 1929681.0, 2255723.0, 3576.0, 561.0, 160.0, 70.0, 50.0, 21.0, 17.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.7637939453125, -6.558837890625, -6.3538818359375, -6.14892578125, -5.9439697265625, -5.739013671875, -5.5340576171875, -5.3291015625, -5.1241455078125, -4.919189453125, -4.7142333984375, -4.50927734375, -4.3043212890625, -4.099365234375, -3.8944091796875, -3.689453125, -3.4844970703125, -3.279541015625, -3.0745849609375, -2.86962890625, -2.6646728515625, -2.459716796875, -2.2547607421875, -2.0498046875, -1.8448486328125, -1.639892578125, -1.4349365234375, -1.22998046875, -1.0250244140625, -0.820068359375, -0.6151123046875, -0.41015625, -0.2052001953125, -0.000244140625, 0.2047119140625, 0.40966796875, 0.6146240234375, 0.819580078125, 1.0245361328125, 1.2294921875, 1.4344482421875, 1.639404296875, 1.8443603515625, 2.04931640625, 2.2542724609375, 2.459228515625, 2.6641845703125, 2.869140625, 3.0740966796875, 3.279052734375, 3.4840087890625, 3.68896484375, 3.8939208984375, 4.098876953125, 4.3038330078125, 4.5087890625, 4.7137451171875, 4.918701171875, 5.1236572265625, 5.32861328125, 5.5335693359375, 5.738525390625, 5.9434814453125, 6.1484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 5.0, 5.0, 11.0, 12.0, 17.0, 38.0, 40.0, 66.0, 116.0, 333.0, 922.0, 1735.0, 388.0, 141.0, 74.0, 48.0, 32.0, 18.0, 16.0, 9.0, 10.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.392578125, -0.3795814514160156, -0.36658477783203125, -0.3535881042480469, -0.3405914306640625, -0.3275947570800781, -0.31459808349609375, -0.3016014099121094, -0.288604736328125, -0.2756080627441406, -0.26261138916015625, -0.24961471557617188, -0.2366180419921875, -0.22362136840820312, -0.21062469482421875, -0.19762802124023438, -0.18463134765625, -0.17163467407226562, -0.15863800048828125, -0.14564132690429688, -0.1326446533203125, -0.11964797973632812, -0.10665130615234375, -0.09365463256835938, -0.080657958984375, -0.06766128540039062, -0.05466461181640625, -0.041667938232421875, -0.0286712646484375, -0.015674591064453125, -0.00267791748046875, 0.010318756103515625, 0.0233154296875, 0.036312103271484375, 0.04930877685546875, 0.062305450439453125, 0.0753021240234375, 0.08829879760742188, 0.10129547119140625, 0.11429214477539062, 0.127288818359375, 0.14028549194335938, 0.15328216552734375, 0.16627883911132812, 0.1792755126953125, 0.19227218627929688, 0.20526885986328125, 0.21826553344726562, 0.23126220703125, 0.24425888061523438, 0.25725555419921875, 0.2702522277832031, 0.2832489013671875, 0.2962455749511719, 0.30924224853515625, 0.3222389221191406, 0.335235595703125, 0.3482322692871094, 0.36122894287109375, 0.3742256164550781, 0.3872222900390625, 0.4002189636230469, 0.41321563720703125, 0.4262123107910156, 0.439208984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 15.0, 19.0, 87.0, 446.0, 326.0, 78.0, 14.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9233076572418213, -2.795870304107666, -2.6684327125549316, -2.5409953594207764, -2.413558006286621, -2.2861204147338867, -2.1586830615997314, -2.031245708465576, -1.9038081169128418, -1.776370644569397, -1.6489331722259521, -1.5214958190917969, -1.394058346748352, -1.2666208744049072, -1.139183521270752, -1.0117460489273071, -0.8843085765838623, -0.7568711042404175, -0.6294336915016174, -0.5019962787628174, -0.37455880641937256, -0.24712133407592773, -0.11968392133712769, 0.007753491401672363, 0.1351909637451172, 0.2626284062862396, 0.39006584882736206, 0.5175032615661621, 0.6449407339096069, 0.7723782062530518, 0.8998156189918518, 1.0272530317306519, 1.1546907424926758, 1.2821282148361206, 1.4095656871795654, 1.5370030403137207, 1.6644405126571655, 1.7918779850006104, 1.9193153381347656, 2.0467529296875, 2.1741902828216553, 2.3016276359558105, 2.429065227508545, 2.5565025806427, 2.6839399337768555, 2.81137752532959, 2.938814878463745, 3.0662522315979004, 3.1936898231506348, 3.32112717628479, 3.4485647678375244, 3.5760021209716797, 3.703439712524414, 3.8308770656585693, 3.9583144187927246, 4.085752010345459, 4.213189125061035, 4.3406267166137695, 4.468063831329346, 4.59550142288208, 4.7229390144348145, 4.850376129150391, 4.977813720703125, 5.105251312255859, 5.232688903808594]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 10.0, 8.0, 12.0, 17.0, 34.0, 25.0, 41.0, 45.0, 74.0, 65.0, 64.0, 72.0, 72.0, 71.0, 65.0, 67.0, 54.0, 46.0, 39.0, 22.0, 21.0, 18.0, 8.0, 9.0, 5.0, 5.0, 9.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55598783493042, -1.502063512802124, -1.4481391906738281, -1.3942149877548218, -1.3402906656265259, -1.28636634349823, -1.2324421405792236, -1.1785178184509277, -1.1245934963226318, -1.070669174194336, -1.01674485206604, -0.9628206491470337, -0.9088963270187378, -0.8549720048904419, -0.8010477423667908, -0.7471234798431396, -0.6931991577148438, -0.6392748355865479, -0.5853505730628967, -0.5314263105392456, -0.4775019884109497, -0.4235776960849762, -0.3696534037590027, -0.3157291114330292, -0.26180481910705566, -0.20788052678108215, -0.15395623445510864, -0.10003194212913513, -0.04610764980316162, 0.00781664252281189, 0.0617409348487854, 0.11566522717475891, 0.16958951950073242, 0.22351381182670593, 0.27743810415267944, 0.33136239647865295, 0.38528668880462646, 0.4392109811306, 0.4931352734565735, 0.5470595359802246, 0.6009838581085205, 0.6549081802368164, 0.7088324427604675, 0.7627567052841187, 0.8166810274124146, 0.8706053495407104, 0.9245296120643616, 0.9784538745880127, 1.0323781967163086, 1.0863025188446045, 1.1402268409729004, 1.1941510438919067, 1.2480753660202026, 1.3019996881484985, 1.3559238910675049, 1.4098482131958008, 1.4637725353240967, 1.5176968574523926, 1.5716211795806885, 1.6255453824996948, 1.6794697046279907, 1.7333940267562866, 1.787318229675293, 1.8412425518035889, 1.8951668739318848]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 7.0, 2.0, 10.0, 9.0, 17.0, 30.0, 35.0, 57.0, 94.0, 142.0, 227.0, 475.0, 1068.0, 2968.0, 16447.0, 844299.0, 171051.0, 8016.0, 1917.0, 742.0, 358.0, 205.0, 141.0, 76.0, 50.0, 27.0, 22.0, 18.0, 10.0, 11.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.474609375, -3.37188720703125, -3.2691650390625, -3.16644287109375, -3.063720703125, -2.96099853515625, -2.8582763671875, -2.75555419921875, -2.65283203125, -2.55010986328125, -2.4473876953125, -2.34466552734375, -2.241943359375, -2.13922119140625, -2.0364990234375, -1.93377685546875, -1.8310546875, -1.72833251953125, -1.6256103515625, -1.52288818359375, -1.420166015625, -1.31744384765625, -1.2147216796875, -1.11199951171875, -1.00927734375, -0.90655517578125, -0.8038330078125, -0.70111083984375, -0.598388671875, -0.49566650390625, -0.3929443359375, -0.29022216796875, -0.1875, -0.08477783203125, 0.0179443359375, 0.12066650390625, 0.223388671875, 0.32611083984375, 0.4288330078125, 0.53155517578125, 0.63427734375, 0.73699951171875, 0.8397216796875, 0.94244384765625, 1.045166015625, 1.14788818359375, 1.2506103515625, 1.35333251953125, 1.4560546875, 1.55877685546875, 1.6614990234375, 1.76422119140625, 1.866943359375, 1.96966552734375, 2.0723876953125, 2.17510986328125, 2.27783203125, 2.38055419921875, 2.4832763671875, 2.58599853515625, 2.688720703125, 2.79144287109375, 2.8941650390625, 2.99688720703125, 3.099609375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 11.0, 8.0, 14.0, 38.0, 84.0, 242.0, 286.0, 182.0, 80.0, 30.0, 13.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3917083740234375, -0.377899169921875, -0.3640899658203125, -0.35028076171875, -0.3364715576171875, -0.322662353515625, -0.3088531494140625, -0.2950439453125, -0.2812347412109375, -0.267425537109375, -0.2536163330078125, -0.23980712890625, -0.2259979248046875, -0.212188720703125, -0.1983795166015625, -0.1845703125, -0.1707611083984375, -0.156951904296875, -0.1431427001953125, -0.12933349609375, -0.1155242919921875, -0.101715087890625, -0.0879058837890625, -0.0740966796875, -0.0602874755859375, -0.046478271484375, -0.0326690673828125, -0.01885986328125, -0.0050506591796875, 0.008758544921875, 0.0225677490234375, 0.036376953125, 0.0501861572265625, 0.063995361328125, 0.0778045654296875, 0.09161376953125, 0.1054229736328125, 0.119232177734375, 0.1330413818359375, 0.1468505859375, 0.1606597900390625, 0.174468994140625, 0.1882781982421875, 0.20208740234375, 0.2158966064453125, 0.229705810546875, 0.2435150146484375, 0.25732421875, 0.2711334228515625, 0.284942626953125, 0.2987518310546875, 0.31256103515625, 0.3263702392578125, 0.340179443359375, 0.3539886474609375, 0.3677978515625, 0.3816070556640625, 0.395416259765625, 0.4092254638671875, 0.42303466796875, 0.4368438720703125, 0.450653076171875, 0.4644622802734375, 0.478271484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 7.0, 8.0, 9.0, 10.0, 15.0, 31.0, 31.0, 54.0, 67.0, 103.0, 132.0, 190.0, 306.0, 497.0, 952.0, 2168.0, 6686.0, 28392.0, 198540.0, 676400.0, 106607.0, 18510.0, 4849.0, 1776.0, 797.0, 461.0, 267.0, 187.0, 142.0, 83.0, 75.0, 50.0, 52.0, 29.0, 16.0, 11.0, 11.0, 13.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6455078125, -1.5976104736328125, -1.549713134765625, -1.5018157958984375, -1.45391845703125, -1.4060211181640625, -1.358123779296875, -1.3102264404296875, -1.2623291015625, -1.2144317626953125, -1.166534423828125, -1.1186370849609375, -1.07073974609375, -1.0228424072265625, -0.974945068359375, -0.9270477294921875, -0.879150390625, -0.8312530517578125, -0.783355712890625, -0.7354583740234375, -0.68756103515625, -0.6396636962890625, -0.591766357421875, -0.5438690185546875, -0.4959716796875, -0.4480743408203125, -0.400177001953125, -0.3522796630859375, -0.30438232421875, -0.2564849853515625, -0.208587646484375, -0.1606903076171875, -0.11279296875, -0.0648956298828125, -0.016998291015625, 0.0308990478515625, 0.07879638671875, 0.1266937255859375, 0.174591064453125, 0.2224884033203125, 0.2703857421875, 0.3182830810546875, 0.366180419921875, 0.4140777587890625, 0.46197509765625, 0.5098724365234375, 0.557769775390625, 0.6056671142578125, 0.653564453125, 0.7014617919921875, 0.749359130859375, 0.7972564697265625, 0.84515380859375, 0.8930511474609375, 0.940948486328125, 0.9888458251953125, 1.0367431640625, 1.0846405029296875, 1.132537841796875, 1.1804351806640625, 1.22833251953125, 1.2762298583984375, 1.324127197265625, 1.3720245361328125, 1.419921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 10.0, 3.0, 5.0, 4.0, 8.0, 16.0, 11.0, 10.0, 20.0, 20.0, 29.0, 14.0, 28.0, 24.0, 28.0, 42.0, 35.0, 50.0, 39.0, 51.0, 44.0, 53.0, 40.0, 35.0, 49.0, 44.0, 43.0, 34.0, 31.0, 28.0, 20.0, 25.0, 14.0, 18.0, 12.0, 13.0, 14.0, 12.0, 5.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8974609375, -0.8691329956054688, -0.8408050537109375, -0.8124771118164062, -0.784149169921875, -0.7558212280273438, -0.7274932861328125, -0.6991653442382812, -0.67083740234375, -0.6425094604492188, -0.6141815185546875, -0.5858535766601562, -0.557525634765625, -0.5291976928710938, -0.5008697509765625, -0.47254180908203125, -0.4442138671875, -0.41588592529296875, -0.3875579833984375, -0.35923004150390625, -0.330902099609375, -0.30257415771484375, -0.2742462158203125, -0.24591827392578125, -0.21759033203125, -0.18926239013671875, -0.1609344482421875, -0.13260650634765625, -0.104278564453125, -0.07595062255859375, -0.0476226806640625, -0.01929473876953125, 0.009033203125, 0.03736114501953125, 0.0656890869140625, 0.09401702880859375, 0.122344970703125, 0.15067291259765625, 0.1790008544921875, 0.20732879638671875, 0.23565673828125, 0.26398468017578125, 0.2923126220703125, 0.32064056396484375, 0.348968505859375, 0.37729644775390625, 0.4056243896484375, 0.43395233154296875, 0.4622802734375, 0.49060821533203125, 0.5189361572265625, 0.5472640991210938, 0.575592041015625, 0.6039199829101562, 0.6322479248046875, 0.6605758666992188, 0.68890380859375, 0.7172317504882812, 0.7455596923828125, 0.7738876342773438, 0.802215576171875, 0.8305435180664062, 0.8588714599609375, 0.8871994018554688, 0.91552734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 13.0, 10.0, 21.0, 27.0, 98.0, 171.0, 470.0, 2036.0, 62313.0, 975164.0, 6799.0, 900.0, 291.0, 117.0, 48.0, 28.0, 22.0, 9.0, 7.0, 8.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.12347412109375, -2.0555419921875, -1.98760986328125, -1.919677734375, -1.85174560546875, -1.7838134765625, -1.71588134765625, -1.64794921875, -1.58001708984375, -1.5120849609375, -1.44415283203125, -1.376220703125, -1.30828857421875, -1.2403564453125, -1.17242431640625, -1.1044921875, -1.03656005859375, -0.9686279296875, -0.90069580078125, -0.832763671875, -0.76483154296875, -0.6968994140625, -0.62896728515625, -0.56103515625, -0.49310302734375, -0.4251708984375, -0.35723876953125, -0.289306640625, -0.22137451171875, -0.1534423828125, -0.08551025390625, -0.017578125, 0.05035400390625, 0.1182861328125, 0.18621826171875, 0.254150390625, 0.32208251953125, 0.3900146484375, 0.45794677734375, 0.52587890625, 0.59381103515625, 0.6617431640625, 0.72967529296875, 0.797607421875, 0.86553955078125, 0.9334716796875, 1.00140380859375, 1.0693359375, 1.13726806640625, 1.2052001953125, 1.27313232421875, 1.341064453125, 1.40899658203125, 1.4769287109375, 1.54486083984375, 1.61279296875, 1.68072509765625, 1.7486572265625, 1.81658935546875, 1.884521484375, 1.95245361328125, 2.0203857421875, 2.08831787109375, 2.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 8.0, 10.0, 11.0, 19.0, 12.0, 19.0, 28.0, 42.0, 63.0, 77.0, 122.0, 190.0, 101.0, 67.0, 62.0, 39.0, 32.0, 16.0, 14.0, 16.0, 7.0, 9.0, 11.0, 1.0, 7.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020933151245117188, -0.00020265765488147736, -0.00019598379731178284, -0.00018930993974208832, -0.0001826360821723938, -0.00017596222460269928, -0.00016928836703300476, -0.00016261450946331024, -0.00015594065189361572, -0.0001492667943239212, -0.00014259293675422668, -0.00013591907918453217, -0.00012924522161483765, -0.00012257136404514313, -0.00011589750647544861, -0.00010922364890575409, -0.00010254979133605957, -9.587593376636505e-05, -8.920207619667053e-05, -8.252821862697601e-05, -7.58543610572815e-05, -6.918050348758698e-05, -6.250664591789246e-05, -5.583278834819794e-05, -4.915893077850342e-05, -4.24850732088089e-05, -3.581121563911438e-05, -2.913735806941986e-05, -2.2463500499725342e-05, -1.5789642930030823e-05, -9.115785360336304e-06, -2.4419277906417847e-06, 4.231929779052734e-06, 1.0905787348747253e-05, 1.7579644918441772e-05, 2.425350248813629e-05, 3.092736005783081e-05, 3.760121762752533e-05, 4.427507519721985e-05, 5.094893276691437e-05, 5.762279033660889e-05, 6.42966479063034e-05, 7.097050547599792e-05, 7.764436304569244e-05, 8.431822061538696e-05, 9.099207818508148e-05, 9.7665935754776e-05, 0.00010433979332447052, 0.00011101365089416504, 0.00011768750846385956, 0.00012436136603355408, 0.0001310352236032486, 0.00013770908117294312, 0.00014438293874263763, 0.00015105679631233215, 0.00015773065388202667, 0.0001644045114517212, 0.0001710783690214157, 0.00017775222659111023, 0.00018442608416080475, 0.00019109994173049927, 0.0001977737993001938, 0.0002044476568698883, 0.00021112151443958282, 0.00021779537200927734]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 10.0, 9.0, 12.0, 13.0, 25.0, 27.0, 53.0, 64.0, 91.0, 144.0, 307.0, 627.0, 1626.0, 5751.0, 38465.0, 714386.0, 262820.0, 18314.0, 3552.0, 1163.0, 478.0, 226.0, 118.0, 77.0, 38.0, 28.0, 34.0, 14.0, 19.0, 13.0, 6.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.07452392578125, -1.0396728515625, -1.00482177734375, -0.969970703125, -0.93511962890625, -0.9002685546875, -0.86541748046875, -0.83056640625, -0.79571533203125, -0.7608642578125, -0.72601318359375, -0.691162109375, -0.65631103515625, -0.6214599609375, -0.58660888671875, -0.5517578125, -0.51690673828125, -0.4820556640625, -0.44720458984375, -0.412353515625, -0.37750244140625, -0.3426513671875, -0.30780029296875, -0.27294921875, -0.23809814453125, -0.2032470703125, -0.16839599609375, -0.133544921875, -0.09869384765625, -0.0638427734375, -0.02899169921875, 0.005859375, 0.04071044921875, 0.0755615234375, 0.11041259765625, 0.145263671875, 0.18011474609375, 0.2149658203125, 0.24981689453125, 0.28466796875, 0.31951904296875, 0.3543701171875, 0.38922119140625, 0.424072265625, 0.45892333984375, 0.4937744140625, 0.52862548828125, 0.5634765625, 0.59832763671875, 0.6331787109375, 0.66802978515625, 0.702880859375, 0.73773193359375, 0.7725830078125, 0.80743408203125, 0.84228515625, 0.87713623046875, 0.9119873046875, 0.94683837890625, 0.981689453125, 1.01654052734375, 1.0513916015625, 1.08624267578125, 1.12109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 9.0, 15.0, 22.0, 24.0, 28.0, 35.0, 45.0, 49.0, 83.0, 92.0, 104.0, 100.0, 88.0, 63.0, 48.0, 37.0, 34.0, 28.0, 18.0, 8.0, 9.0, 9.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6201171875, -0.6022491455078125, -0.584381103515625, -0.5665130615234375, -0.54864501953125, -0.5307769775390625, -0.512908935546875, -0.4950408935546875, -0.4771728515625, -0.4593048095703125, -0.441436767578125, -0.4235687255859375, -0.40570068359375, -0.3878326416015625, -0.369964599609375, -0.3520965576171875, -0.334228515625, -0.3163604736328125, -0.298492431640625, -0.2806243896484375, -0.26275634765625, -0.2448883056640625, -0.227020263671875, -0.2091522216796875, -0.1912841796875, -0.1734161376953125, -0.155548095703125, -0.1376800537109375, -0.11981201171875, -0.1019439697265625, -0.084075927734375, -0.0662078857421875, -0.04833984375, -0.0304718017578125, -0.012603759765625, 0.0052642822265625, 0.02313232421875, 0.0410003662109375, 0.058868408203125, 0.0767364501953125, 0.0946044921875, 0.1124725341796875, 0.130340576171875, 0.1482086181640625, 0.16607666015625, 0.1839447021484375, 0.201812744140625, 0.2196807861328125, 0.237548828125, 0.2554168701171875, 0.273284912109375, 0.2911529541015625, 0.30902099609375, 0.3268890380859375, 0.344757080078125, 0.3626251220703125, 0.3804931640625, 0.3983612060546875, 0.416229248046875, 0.4340972900390625, 0.45196533203125, 0.4698333740234375, 0.487701416015625, 0.5055694580078125, 0.5234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 57.0, 777.0, 156.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.993803024291992, -20.389400482177734, -18.78499984741211, -17.180599212646484, -15.576196670532227, -13.971795082092285, -12.367393493652344, -10.762991905212402, -9.158590316772461, -7.5541887283325195, -5.949787139892578, -4.345385551452637, -2.7409839630126953, -1.136582374572754, 0.4678192138671875, 2.072220802307129, 3.6766223907470703, 5.281023979187012, 6.885425567626953, 8.489827156066895, 10.094228744506836, 11.698630332946777, 13.303031921386719, 14.90743350982666, 16.5118350982666, 18.11623764038086, 19.720638275146484, 21.32503890991211, 22.929441452026367, 24.533843994140625, 26.13824462890625, 27.742645263671875, 29.3470458984375, 30.951446533203125, 32.55584716796875, 34.16025161743164, 35.764652252197266, 37.36905288696289, 38.97345733642578, 40.577857971191406, 42.18225860595703, 43.786659240722656, 45.39105987548828, 46.99546432495117, 48.5998649597168, 50.20426559448242, 51.80867004394531, 53.41307067871094, 55.01747131347656, 56.62187194824219, 58.22627258300781, 59.8306770324707, 61.43507766723633, 63.03947830200195, 64.64388275146484, 66.24828338623047, 67.8526840209961, 69.45708465576172, 71.06148529052734, 72.66588592529297, 74.27029418945312, 75.87469482421875, 77.47909545898438, 79.08349609375, 80.68789672851562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 11.0, 12.0, 31.0, 40.0, 38.0, 51.0, 56.0, 83.0, 91.0, 88.0, 75.0, 93.0, 78.0, 62.0, 42.0, 41.0, 33.0, 20.0, 18.0, 13.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.905634880065918, -10.500060081481934, -10.094484329223633, -9.688909530639648, -9.283334732055664, -8.87775993347168, -8.472184181213379, -8.066609382629395, -7.661034107208252, -7.255458831787109, -6.849884033203125, -6.444308757781982, -6.03873348236084, -5.6331586837768555, -5.227583408355713, -4.82200813293457, -4.416433334350586, -4.010858058929443, -3.605283260345459, -3.1997079849243164, -2.794132947921753, -2.3885579109191895, -1.9829826354980469, -1.5774075984954834, -1.17183256149292, -0.7662574648857117, -0.3606823682785034, 0.04489278793334961, 0.4504678249359131, 0.8560428619384766, 1.2616181373596191, 1.6671931743621826, 2.0727691650390625, 2.478344202041626, 2.8839192390441895, 3.289494514465332, 3.6950695514678955, 4.100644588470459, 4.506219863891602, 4.911794662475586, 5.3173699378967285, 5.722945213317871, 6.1285200119018555, 6.534095287322998, 6.939670562744141, 7.345245361328125, 7.750820636749268, 8.15639591217041, 8.561970710754395, 8.967545509338379, 9.37312126159668, 9.778696060180664, 10.184270858764648, 10.589845657348633, 10.995421409606934, 11.400996208190918, 11.806571960449219, 12.212146759033203, 12.617722511291504, 13.023297309875488, 13.428872108459473, 13.834447860717773, 14.240022659301758, 14.645597457885742, 15.051172256469727]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 12.0, 24.0, 54.0, 147.0, 539.0, 32199.0, 4159905.0, 1016.0, 252.0, 71.0, 27.0, 12.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.421875, -21.677734375, -20.93359375, -20.189453125, -19.4453125, -18.701171875, -17.95703125, -17.212890625, -16.46875, -15.724609375, -14.98046875, -14.236328125, -13.4921875, -12.748046875, -12.00390625, -11.259765625, -10.515625, -9.771484375, -9.02734375, -8.283203125, -7.5390625, -6.794921875, -6.05078125, -5.306640625, -4.5625, -3.818359375, -3.07421875, -2.330078125, -1.5859375, -0.841796875, -0.09765625, 0.646484375, 1.390625, 2.134765625, 2.87890625, 3.623046875, 4.3671875, 5.111328125, 5.85546875, 6.599609375, 7.34375, 8.087890625, 8.83203125, 9.576171875, 10.3203125, 11.064453125, 11.80859375, 12.552734375, 13.296875, 14.041015625, 14.78515625, 15.529296875, 16.2734375, 17.017578125, 17.76171875, 18.505859375, 19.25, 19.994140625, 20.73828125, 21.482421875, 22.2265625, 22.970703125, 23.71484375, 24.458984375, 25.203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 11.0, 20.0, 44.0, 83.0, 168.0, 244.0, 205.0, 113.0, 72.0, 15.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53955078125, -0.5213775634765625, -0.503204345703125, -0.4850311279296875, -0.46685791015625, -0.4486846923828125, -0.430511474609375, -0.4123382568359375, -0.3941650390625, -0.3759918212890625, -0.357818603515625, -0.3396453857421875, -0.32147216796875, -0.3032989501953125, -0.285125732421875, -0.2669525146484375, -0.248779296875, -0.2306060791015625, -0.212432861328125, -0.1942596435546875, -0.17608642578125, -0.1579132080078125, -0.139739990234375, -0.1215667724609375, -0.1033935546875, -0.0852203369140625, -0.067047119140625, -0.0488739013671875, -0.03070068359375, -0.0125274658203125, 0.005645751953125, 0.0238189697265625, 0.0419921875, 0.0601654052734375, 0.078338623046875, 0.0965118408203125, 0.11468505859375, 0.1328582763671875, 0.151031494140625, 0.1692047119140625, 0.1873779296875, 0.2055511474609375, 0.223724365234375, 0.2418975830078125, 0.26007080078125, 0.2782440185546875, 0.296417236328125, 0.3145904541015625, 0.332763671875, 0.3509368896484375, 0.369110107421875, 0.3872833251953125, 0.40545654296875, 0.4236297607421875, 0.441802978515625, 0.4599761962890625, 0.4781494140625, 0.4963226318359375, 0.514495849609375, 0.5326690673828125, 0.55084228515625, 0.5690155029296875, 0.587188720703125, 0.6053619384765625, 0.62353515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 15.0, 14.0, 24.0, 44.0, 67.0, 124.0, 310.0, 1080.0, 7145.0, 200989.0, 3960467.0, 20620.0, 2357.0, 527.0, 190.0, 117.0, 74.0, 50.0, 29.0, 14.0, 13.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.568359375, -3.460906982421875, -3.35345458984375, -3.246002197265625, -3.1385498046875, -3.031097412109375, -2.92364501953125, -2.816192626953125, -2.708740234375, -2.601287841796875, -2.49383544921875, -2.386383056640625, -2.2789306640625, -2.171478271484375, -2.06402587890625, -1.956573486328125, -1.84912109375, -1.741668701171875, -1.63421630859375, -1.526763916015625, -1.4193115234375, -1.311859130859375, -1.20440673828125, -1.096954345703125, -0.989501953125, -0.882049560546875, -0.77459716796875, -0.667144775390625, -0.5596923828125, -0.452239990234375, -0.34478759765625, -0.237335205078125, -0.1298828125, -0.022430419921875, 0.08502197265625, 0.192474365234375, 0.2999267578125, 0.407379150390625, 0.51483154296875, 0.622283935546875, 0.729736328125, 0.837188720703125, 0.94464111328125, 1.052093505859375, 1.1595458984375, 1.266998291015625, 1.37445068359375, 1.481903076171875, 1.58935546875, 1.696807861328125, 1.80426025390625, 1.911712646484375, 2.0191650390625, 2.126617431640625, 2.23406982421875, 2.341522216796875, 2.448974609375, 2.556427001953125, 2.66387939453125, 2.771331787109375, 2.8787841796875, 2.986236572265625, 3.09368896484375, 3.201141357421875, 3.30859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 10.0, 12.0, 22.0, 34.0, 106.0, 262.0, 1172.0, 1838.0, 318.0, 125.0, 54.0, 30.0, 20.0, 18.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349609375, -0.33129119873046875, -0.3129730224609375, -0.29465484619140625, -0.276336669921875, -0.25801849365234375, -0.2397003173828125, -0.22138214111328125, -0.20306396484375, -0.18474578857421875, -0.1664276123046875, -0.14810943603515625, -0.129791259765625, -0.11147308349609375, -0.0931549072265625, -0.07483673095703125, -0.0565185546875, -0.03820037841796875, -0.0198822021484375, -0.00156402587890625, 0.016754150390625, 0.03507232666015625, 0.0533905029296875, 0.07170867919921875, 0.09002685546875, 0.10834503173828125, 0.1266632080078125, 0.14498138427734375, 0.163299560546875, 0.18161773681640625, 0.1999359130859375, 0.21825408935546875, 0.236572265625, 0.25489044189453125, 0.2732086181640625, 0.29152679443359375, 0.309844970703125, 0.32816314697265625, 0.3464813232421875, 0.36479949951171875, 0.38311767578125, 0.40143585205078125, 0.4197540283203125, 0.43807220458984375, 0.456390380859375, 0.47470855712890625, 0.4930267333984375, 0.5113449096679688, 0.5296630859375, 0.5479812622070312, 0.5662994384765625, 0.5846176147460938, 0.602935791015625, 0.6212539672851562, 0.6395721435546875, 0.6578903198242188, 0.67620849609375, 0.6945266723632812, 0.7128448486328125, 0.7311630249023438, 0.749481201171875, 0.7677993774414062, 0.7861175537109375, 0.8044357299804688, 0.82275390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 11.0, 26.0, 46.0, 87.0, 187.0, 190.0, 185.0, 113.0, 76.0, 33.0, 13.0, 12.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0713757276535034, -1.0100514888763428, -0.9487271308898926, -0.8874028325080872, -0.8260785341262817, -0.7647542357444763, -0.7034299373626709, -0.6421056389808655, -0.5807813405990601, -0.5194570422172546, -0.4581327438354492, -0.3968084454536438, -0.3354841470718384, -0.27415984869003296, -0.21283555030822754, -0.15151125192642212, -0.0901869535446167, -0.02886265516281128, 0.03246164321899414, 0.09378594160079956, 0.15511023998260498, 0.2164345383644104, 0.2777588367462158, 0.33908313512802124, 0.40040743350982666, 0.4617317318916321, 0.5230560302734375, 0.5843803286552429, 0.6457046270370483, 0.7070289254188538, 0.7683532238006592, 0.8296775221824646, 0.8910017013549805, 0.9523259997367859, 1.0136502981185913, 1.074974536895752, 1.1362988948822021, 1.1976232528686523, 1.258947491645813, 1.3202717304229736, 1.3815960884094238, 1.442920446395874, 1.5042446851730347, 1.5655689239501953, 1.6268932819366455, 1.6882176399230957, 1.7495418787002563, 1.810866117477417, 1.8721904754638672, 1.9335148334503174, 1.994839072227478, 2.0561633110046387, 2.117487668991089, 2.178812026977539, 2.24013614654541, 2.3014605045318604, 2.3627848625183105, 2.4241092205047607, 2.485433578491211, 2.546757698059082, 2.6080820560455322, 2.6694064140319824, 2.7307305335998535, 2.7920548915863037, 2.853379249572754]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 11.0, 15.0, 12.0, 20.0, 23.0, 19.0, 28.0, 29.0, 33.0, 37.0, 44.0, 43.0, 50.0, 60.0, 51.0, 48.0, 53.0, 51.0, 32.0, 49.0, 42.0, 42.0, 44.0, 33.0, 21.0, 21.0, 24.0, 17.0, 14.0, 8.0, 5.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.4748361110687256, -1.4331227540969849, -1.3914093971252441, -1.3496960401535034, -1.3079826831817627, -1.266269326210022, -1.2245559692382812, -1.1828426122665405, -1.1411292552947998, -1.099415898323059, -1.0577025413513184, -1.0159891843795776, -0.9742758274078369, -0.9325624704360962, -0.8908491134643555, -0.8491357564926147, -0.8074224591255188, -0.7657091021537781, -0.7239957451820374, -0.6822823882102966, -0.6405690312385559, -0.5988556742668152, -0.5571423768997192, -0.5154290199279785, -0.4737156331539154, -0.4320022761821747, -0.39028891921043396, -0.3485755920410156, -0.3068622350692749, -0.2651488780975342, -0.22343552112579346, -0.18172216415405273, -0.140008807182312, -0.09829545021057129, -0.05658210068941116, -0.014868751168251038, 0.026844605803489685, 0.06855796277523041, 0.11027130484580994, 0.15198466181755066, 0.19369801878929138, 0.2354113757610321, 0.2771247327327728, 0.31883805990219116, 0.3605514168739319, 0.4022647738456726, 0.44397813081741333, 0.48569148778915405, 0.5274048447608948, 0.5691182017326355, 0.6108315587043762, 0.6525449156761169, 0.6942582726478577, 0.7359716296195984, 0.7776849269866943, 0.8193982839584351, 0.8611116409301758, 0.9028249979019165, 0.9445383548736572, 0.986251711845398, 1.0279650688171387, 1.0696784257888794, 1.1113917827606201, 1.1531051397323608, 1.1948184967041016]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 5.0, 9.0, 8.0, 8.0, 15.0, 28.0, 34.0, 54.0, 83.0, 172.0, 332.0, 654.0, 1738.0, 6733.0, 198019.0, 821593.0, 14562.0, 2705.0, 865.0, 424.0, 208.0, 119.0, 56.0, 44.0, 26.0, 12.0, 7.0, 9.0, 8.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.44140625, -3.334442138671875, -3.22747802734375, -3.120513916015625, -3.0135498046875, -2.906585693359375, -2.79962158203125, -2.692657470703125, -2.585693359375, -2.478729248046875, -2.37176513671875, -2.264801025390625, -2.1578369140625, -2.050872802734375, -1.94390869140625, -1.836944580078125, -1.72998046875, -1.623016357421875, -1.51605224609375, -1.409088134765625, -1.3021240234375, -1.195159912109375, -1.08819580078125, -0.981231689453125, -0.874267578125, -0.767303466796875, -0.66033935546875, -0.553375244140625, -0.4464111328125, -0.339447021484375, -0.23248291015625, -0.125518798828125, -0.0185546875, 0.088409423828125, 0.19537353515625, 0.302337646484375, 0.4093017578125, 0.516265869140625, 0.62322998046875, 0.730194091796875, 0.837158203125, 0.944122314453125, 1.05108642578125, 1.158050537109375, 1.2650146484375, 1.371978759765625, 1.47894287109375, 1.585906982421875, 1.69287109375, 1.799835205078125, 1.90679931640625, 2.013763427734375, 2.1207275390625, 2.227691650390625, 2.33465576171875, 2.441619873046875, 2.548583984375, 2.655548095703125, 2.76251220703125, 2.869476318359375, 2.9764404296875, 3.083404541015625, 3.19036865234375, 3.297332763671875, 3.404296875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 11.0, 16.0, 49.0, 120.0, 201.0, 236.0, 169.0, 108.0, 56.0, 17.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5086288452148438, -0.4913787841796875, -0.47412872314453125, -0.456878662109375, -0.43962860107421875, -0.4223785400390625, -0.40512847900390625, -0.38787841796875, -0.37062835693359375, -0.3533782958984375, -0.33612823486328125, -0.318878173828125, -0.30162811279296875, -0.2843780517578125, -0.26712799072265625, -0.2498779296875, -0.23262786865234375, -0.2153778076171875, -0.19812774658203125, -0.180877685546875, -0.16362762451171875, -0.1463775634765625, -0.12912750244140625, -0.11187744140625, -0.09462738037109375, -0.0773773193359375, -0.06012725830078125, -0.042877197265625, -0.02562713623046875, -0.0083770751953125, 0.00887298583984375, 0.026123046875, 0.04337310791015625, 0.0606231689453125, 0.07787322998046875, 0.095123291015625, 0.11237335205078125, 0.1296234130859375, 0.14687347412109375, 0.16412353515625, 0.18137359619140625, 0.1986236572265625, 0.21587371826171875, 0.233123779296875, 0.25037384033203125, 0.2676239013671875, 0.28487396240234375, 0.3021240234375, 0.31937408447265625, 0.3366241455078125, 0.35387420654296875, 0.371124267578125, 0.38837432861328125, 0.4056243896484375, 0.42287445068359375, 0.44012451171875, 0.45737457275390625, 0.4746246337890625, 0.49187469482421875, 0.509124755859375, 0.5263748168945312, 0.5436248779296875, 0.5608749389648438, 0.578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 11.0, 16.0, 37.0, 63.0, 95.0, 185.0, 341.0, 713.0, 1943.0, 9001.0, 106353.0, 823657.0, 94625.0, 8264.0, 1873.0, 655.0, 319.0, 147.0, 82.0, 55.0, 32.0, 21.0, 8.0, 11.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.226165771484375, -2.15545654296875, -2.084747314453125, -2.0140380859375, -1.943328857421875, -1.87261962890625, -1.801910400390625, -1.731201171875, -1.660491943359375, -1.58978271484375, -1.519073486328125, -1.4483642578125, -1.377655029296875, -1.30694580078125, -1.236236572265625, -1.16552734375, -1.094818115234375, -1.02410888671875, -0.953399658203125, -0.8826904296875, -0.811981201171875, -0.74127197265625, -0.670562744140625, -0.599853515625, -0.529144287109375, -0.45843505859375, -0.387725830078125, -0.3170166015625, -0.246307373046875, -0.17559814453125, -0.104888916015625, -0.0341796875, 0.036529541015625, 0.10723876953125, 0.177947998046875, 0.2486572265625, 0.319366455078125, 0.39007568359375, 0.460784912109375, 0.531494140625, 0.602203369140625, 0.67291259765625, 0.743621826171875, 0.8143310546875, 0.885040283203125, 0.95574951171875, 1.026458740234375, 1.09716796875, 1.167877197265625, 1.23858642578125, 1.309295654296875, 1.3800048828125, 1.450714111328125, 1.52142333984375, 1.592132568359375, 1.662841796875, 1.733551025390625, 1.80426025390625, 1.874969482421875, 1.9456787109375, 2.016387939453125, 2.08709716796875, 2.157806396484375, 2.228515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 0.0, 7.0, 2.0, 5.0, 3.0, 13.0, 15.0, 21.0, 23.0, 28.0, 41.0, 44.0, 56.0, 68.0, 59.0, 80.0, 61.0, 64.0, 69.0, 61.0, 54.0, 49.0, 39.0, 42.0, 29.0, 20.0, 17.0, 4.0, 5.0, 2.0, 3.0, 3.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5830078125, -1.533172607421875, -1.48333740234375, -1.433502197265625, -1.3836669921875, -1.333831787109375, -1.28399658203125, -1.234161376953125, -1.184326171875, -1.134490966796875, -1.08465576171875, -1.034820556640625, -0.9849853515625, -0.935150146484375, -0.88531494140625, -0.835479736328125, -0.78564453125, -0.735809326171875, -0.68597412109375, -0.636138916015625, -0.5863037109375, -0.536468505859375, -0.48663330078125, -0.436798095703125, -0.386962890625, -0.337127685546875, -0.28729248046875, -0.237457275390625, -0.1876220703125, -0.137786865234375, -0.08795166015625, -0.038116455078125, 0.01171875, 0.061553955078125, 0.11138916015625, 0.161224365234375, 0.2110595703125, 0.260894775390625, 0.31072998046875, 0.360565185546875, 0.410400390625, 0.460235595703125, 0.51007080078125, 0.559906005859375, 0.6097412109375, 0.659576416015625, 0.70941162109375, 0.759246826171875, 0.80908203125, 0.858917236328125, 0.90875244140625, 0.958587646484375, 1.0084228515625, 1.058258056640625, 1.10809326171875, 1.157928466796875, 1.207763671875, 1.257598876953125, 1.30743408203125, 1.357269287109375, 1.4071044921875, 1.456939697265625, 1.50677490234375, 1.556610107421875, 1.6064453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 19.0, 15.0, 39.0, 93.0, 187.0, 678.0, 3735.0, 917426.0, 123641.0, 1955.0, 468.0, 145.0, 69.0, 33.0, 20.0, 9.0, 11.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.115234375, -2.048828125, -1.982421875, -1.916015625, -1.849609375, -1.783203125, -1.716796875, -1.650390625, -1.583984375, -1.517578125, -1.451171875, -1.384765625, -1.318359375, -1.251953125, -1.185546875, -1.119140625, -1.052734375, -0.986328125, -0.919921875, -0.853515625, -0.787109375, -0.720703125, -0.654296875, -0.587890625, -0.521484375, -0.455078125, -0.388671875, -0.322265625, -0.255859375, -0.189453125, -0.123046875, -0.056640625, 0.009765625, 0.076171875, 0.142578125, 0.208984375, 0.275390625, 0.341796875, 0.408203125, 0.474609375, 0.541015625, 0.607421875, 0.673828125, 0.740234375, 0.806640625, 0.873046875, 0.939453125, 1.005859375, 1.072265625, 1.138671875, 1.205078125, 1.271484375, 1.337890625, 1.404296875, 1.470703125, 1.537109375, 1.603515625, 1.669921875, 1.736328125, 1.802734375, 1.869140625, 1.935546875, 2.001953125, 2.068359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 7.0, 7.0, 8.0, 15.0, 15.0, 15.0, 14.0, 24.0, 19.0, 22.0, 25.0, 43.0, 69.0, 132.0, 146.0, 117.0, 64.0, 40.0, 26.0, 23.0, 21.0, 30.0, 16.0, 20.0, 9.0, 12.0, 8.0, 4.0, 6.0, 8.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00014448165893554688, -0.0001402720808982849, -0.00013606250286102295, -0.00013185292482376099, -0.00012764334678649902, -0.00012343376874923706, -0.0001192241907119751, -0.00011501461267471313, -0.00011080503463745117, -0.00010659545660018921, -0.00010238587856292725, -9.817630052566528e-05, -9.396672248840332e-05, -8.975714445114136e-05, -8.55475664138794e-05, -8.133798837661743e-05, -7.712841033935547e-05, -7.29188323020935e-05, -6.870925426483154e-05, -6.449967622756958e-05, -6.029009819030762e-05, -5.6080520153045654e-05, -5.187094211578369e-05, -4.766136407852173e-05, -4.3451786041259766e-05, -3.92422080039978e-05, -3.503262996673584e-05, -3.082305192947388e-05, -2.6613473892211914e-05, -2.240389585494995e-05, -1.8194317817687988e-05, -1.3984739780426025e-05, -9.775161743164062e-06, -5.5655837059021e-06, -1.3560056686401367e-06, 2.853572368621826e-06, 7.063150405883789e-06, 1.1272728443145752e-05, 1.5482306480407715e-05, 1.9691884517669678e-05, 2.390146255493164e-05, 2.8111040592193604e-05, 3.2320618629455566e-05, 3.653019666671753e-05, 4.073977470397949e-05, 4.4949352741241455e-05, 4.915893077850342e-05, 5.336850881576538e-05, 5.7578086853027344e-05, 6.17876648902893e-05, 6.599724292755127e-05, 7.020682096481323e-05, 7.44163990020752e-05, 7.862597703933716e-05, 8.283555507659912e-05, 8.704513311386108e-05, 9.125471115112305e-05, 9.546428918838501e-05, 9.967386722564697e-05, 0.00010388344526290894, 0.0001080930233001709, 0.00011230260133743286, 0.00011651217937469482, 0.00012072175741195679, 0.00012493133544921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 9.0, 8.0, 9.0, 13.0, 20.0, 32.0, 47.0, 82.0, 138.0, 291.0, 684.0, 2234.0, 12326.0, 421525.0, 592050.0, 15196.0, 2462.0, 776.0, 299.0, 139.0, 85.0, 32.0, 34.0, 28.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-1.6513671875, -1.6138763427734375, -1.576385498046875, -1.5388946533203125, -1.50140380859375, -1.4639129638671875, -1.426422119140625, -1.3889312744140625, -1.3514404296875, -1.3139495849609375, -1.276458740234375, -1.2389678955078125, -1.20147705078125, -1.1639862060546875, -1.126495361328125, -1.0890045166015625, -1.051513671875, -1.0140228271484375, -0.976531982421875, -0.9390411376953125, -0.90155029296875, -0.8640594482421875, -0.826568603515625, -0.7890777587890625, -0.7515869140625, -0.7140960693359375, -0.676605224609375, -0.6391143798828125, -0.60162353515625, -0.5641326904296875, -0.526641845703125, -0.4891510009765625, -0.45166015625, -0.4141693115234375, -0.376678466796875, -0.3391876220703125, -0.30169677734375, -0.2642059326171875, -0.226715087890625, -0.1892242431640625, -0.1517333984375, -0.1142425537109375, -0.076751708984375, -0.0392608642578125, -0.00177001953125, 0.0357208251953125, 0.073211669921875, 0.1107025146484375, 0.148193359375, 0.1856842041015625, 0.223175048828125, 0.2606658935546875, 0.29815673828125, 0.3356475830078125, 0.373138427734375, 0.4106292724609375, 0.4481201171875, 0.4856109619140625, 0.523101806640625, 0.5605926513671875, 0.59808349609375, 0.6355743408203125, 0.673065185546875, 0.7105560302734375, 0.748046875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 2.0, 7.0, 12.0, 12.0, 14.0, 25.0, 32.0, 59.0, 81.0, 100.0, 99.0, 140.0, 113.0, 89.0, 67.0, 40.0, 36.0, 19.0, 14.0, 11.0, 9.0, 5.0, 6.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5768051147460938, -0.5564422607421875, -0.5360794067382812, -0.515716552734375, -0.49535369873046875, -0.4749908447265625, -0.45462799072265625, -0.43426513671875, -0.41390228271484375, -0.3935394287109375, -0.37317657470703125, -0.352813720703125, -0.33245086669921875, -0.3120880126953125, -0.29172515869140625, -0.2713623046875, -0.25099945068359375, -0.2306365966796875, -0.21027374267578125, -0.189910888671875, -0.16954803466796875, -0.1491851806640625, -0.12882232666015625, -0.10845947265625, -0.08809661865234375, -0.0677337646484375, -0.04737091064453125, -0.027008056640625, -0.00664520263671875, 0.0137176513671875, 0.03408050537109375, 0.054443359375, 0.07480621337890625, 0.0951690673828125, 0.11553192138671875, 0.135894775390625, 0.15625762939453125, 0.1766204833984375, 0.19698333740234375, 0.21734619140625, 0.23770904541015625, 0.2580718994140625, 0.27843475341796875, 0.298797607421875, 0.31916046142578125, 0.3395233154296875, 0.35988616943359375, 0.3802490234375, 0.40061187744140625, 0.4209747314453125, 0.44133758544921875, 0.461700439453125, 0.48206329345703125, 0.5024261474609375, 0.5227890014648438, 0.54315185546875, 0.5635147094726562, 0.5838775634765625, 0.6042404174804688, 0.624603271484375, 0.6449661254882812, 0.6653289794921875, 0.6856918334960938, 0.7060546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 12.0, 51.0, 415.0, 476.0, 47.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.725003242492676, -13.811201095581055, -12.897398948669434, -11.983596801757812, -11.069794654846191, -10.15599250793457, -9.242189407348633, -8.328388214111328, -7.414585590362549, -6.500783443450928, -5.586981296539307, -4.673178672790527, -3.7593767642974854, -2.845574378967285, -1.931772232055664, -1.017970085144043, -0.10416793823242188, 0.809634268283844, 1.7234364748001099, 2.6372387409210205, 3.5510408878326416, 4.464843273162842, 5.378645420074463, 6.292447566986084, 7.206249713897705, 8.120052337646484, 9.033854484558105, 9.947656631469727, 10.861458778381348, 11.775260925292969, 12.68906307220459, 13.602865219116211, 14.516668319702148, 15.43047046661377, 16.34427261352539, 17.258075714111328, 18.171876907348633, 19.08568000793457, 19.999481201171875, 20.913284301757812, 21.827085494995117, 22.740888595581055, 23.65468978881836, 24.568492889404297, 25.4822940826416, 26.39609718322754, 27.309898376464844, 28.22370147705078, 29.13750457763672, 30.051307678222656, 30.96510887145996, 31.8789119720459, 32.7927131652832, 33.70651626586914, 34.62031936645508, 35.53411865234375, 36.44792175292969, 37.361724853515625, 38.27552795410156, 39.189327239990234, 40.10313034057617, 41.01693344116211, 41.93073654174805, 42.84453582763672, 43.758338928222656]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 5.0, 7.0, 12.0, 12.0, 17.0, 24.0, 24.0, 23.0, 24.0, 26.0, 21.0, 38.0, 32.0, 40.0, 43.0, 31.0, 42.0, 46.0, 36.0, 52.0, 38.0, 38.0, 43.0, 37.0, 48.0, 32.0, 35.0, 30.0, 26.0, 14.0, 15.0, 18.0, 12.0, 12.0, 14.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.249598503112793, -6.043041229248047, -5.836483955383301, -5.629927158355713, -5.423369884490967, -5.216812610626221, -5.010255336761475, -4.803698539733887, -4.597141265869141, -4.3905839920043945, -4.184026718139648, -3.9774696826934814, -3.7709126472473145, -3.5643553733825684, -3.3577980995178223, -3.1512410640716553, -2.944683790206909, -2.738126516342163, -2.531569480895996, -2.32501220703125, -2.118455171585083, -1.911897897720337, -1.7053407430648804, -1.4987835884094238, -1.2922264337539673, -1.0856692790985107, -0.8791121244430542, -0.6725549101829529, -0.46599775552749634, -0.259440541267395, -0.05288338661193848, 0.15367376804351807, 0.3602309226989746, 0.5667880773544312, 0.7733452320098877, 0.979902446269989, 1.1864595413208008, 1.3930168151855469, 1.5995739698410034, 1.80613112449646, 2.012688159942627, 2.219245433807373, 2.42580246925354, 2.632359743118286, 2.838916778564453, 3.045474052429199, 3.2520313262939453, 3.4585883617401123, 3.6651456356048584, 3.8717029094696045, 4.0782599449157715, 4.284817218780518, 4.491374492645264, 4.697931289672852, 4.904488563537598, 5.111045837402344, 5.31760311126709, 5.524160385131836, 5.730717658996582, 5.93727445602417, 6.143831729888916, 6.350389003753662, 6.556946277618408, 6.763503074645996, 6.970060348510742]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 13.0, 12.0, 19.0, 31.0, 90.0, 216.0, 679.0, 3989.0, 3669764.0, 514695.0, 3578.0, 741.0, 236.0, 103.0, 43.0, 23.0, 25.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.69024658203125, -5.4937744140625, -5.29730224609375, -5.100830078125, -4.90435791015625, -4.7078857421875, -4.51141357421875, -4.31494140625, -4.11846923828125, -3.9219970703125, -3.72552490234375, -3.529052734375, -3.33258056640625, -3.1361083984375, -2.93963623046875, -2.7431640625, -2.54669189453125, -2.3502197265625, -2.15374755859375, -1.957275390625, -1.76080322265625, -1.5643310546875, -1.36785888671875, -1.17138671875, -0.97491455078125, -0.7784423828125, -0.58197021484375, -0.385498046875, -0.18902587890625, 0.0074462890625, 0.20391845703125, 0.400390625, 0.59686279296875, 0.7933349609375, 0.98980712890625, 1.186279296875, 1.38275146484375, 1.5792236328125, 1.77569580078125, 1.97216796875, 2.16864013671875, 2.3651123046875, 2.56158447265625, 2.758056640625, 2.95452880859375, 3.1510009765625, 3.34747314453125, 3.5439453125, 3.74041748046875, 3.9368896484375, 4.13336181640625, 4.329833984375, 4.52630615234375, 4.7227783203125, 4.91925048828125, 5.11572265625, 5.31219482421875, 5.5086669921875, 5.70513916015625, 5.901611328125, 6.09808349609375, 6.2945556640625, 6.49102783203125, 6.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 19.0, 39.0, 67.0, 103.0, 171.0, 182.0, 163.0, 114.0, 64.0, 38.0, 16.0, 9.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55419921875, -0.5354461669921875, -0.516693115234375, -0.4979400634765625, -0.47918701171875, -0.4604339599609375, -0.441680908203125, -0.4229278564453125, -0.4041748046875, -0.3854217529296875, -0.366668701171875, -0.3479156494140625, -0.32916259765625, -0.3104095458984375, -0.291656494140625, -0.2729034423828125, -0.254150390625, -0.2353973388671875, -0.216644287109375, -0.1978912353515625, -0.17913818359375, -0.1603851318359375, -0.141632080078125, -0.1228790283203125, -0.1041259765625, -0.0853729248046875, -0.066619873046875, -0.0478668212890625, -0.02911376953125, -0.0103607177734375, 0.008392333984375, 0.0271453857421875, 0.0458984375, 0.0646514892578125, 0.083404541015625, 0.1021575927734375, 0.12091064453125, 0.1396636962890625, 0.158416748046875, 0.1771697998046875, 0.1959228515625, 0.2146759033203125, 0.233428955078125, 0.2521820068359375, 0.27093505859375, 0.2896881103515625, 0.308441162109375, 0.3271942138671875, 0.345947265625, 0.3647003173828125, 0.383453369140625, 0.4022064208984375, 0.42095947265625, 0.4397125244140625, 0.458465576171875, 0.4772186279296875, 0.4959716796875, 0.5147247314453125, 0.533477783203125, 0.5522308349609375, 0.57098388671875, 0.5897369384765625, 0.608489990234375, 0.6272430419921875, 0.64599609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 12.0, 17.0, 23.0, 41.0, 78.0, 119.0, 234.0, 686.0, 3731.0, 51739.0, 4087290.0, 45586.0, 3632.0, 639.0, 229.0, 93.0, 55.0, 23.0, 14.0, 15.0, 7.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.09228515625, -2.0068359375, -1.92138671875, -1.8359375, -1.75048828125, -1.6650390625, -1.57958984375, -1.494140625, -1.40869140625, -1.3232421875, -1.23779296875, -1.15234375, -1.06689453125, -0.9814453125, -0.89599609375, -0.810546875, -0.72509765625, -0.6396484375, -0.55419921875, -0.46875, -0.38330078125, -0.2978515625, -0.21240234375, -0.126953125, -0.04150390625, 0.0439453125, 0.12939453125, 0.21484375, 0.30029296875, 0.3857421875, 0.47119140625, 0.556640625, 0.64208984375, 0.7275390625, 0.81298828125, 0.8984375, 0.98388671875, 1.0693359375, 1.15478515625, 1.240234375, 1.32568359375, 1.4111328125, 1.49658203125, 1.58203125, 1.66748046875, 1.7529296875, 1.83837890625, 1.923828125, 2.00927734375, 2.0947265625, 2.18017578125, 2.265625, 2.35107421875, 2.4365234375, 2.52197265625, 2.607421875, 2.69287109375, 2.7783203125, 2.86376953125, 2.94921875, 3.03466796875, 3.1201171875, 3.20556640625, 3.291015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 5.0, 10.0, 10.0, 18.0, 26.0, 31.0, 56.0, 143.0, 442.0, 2241.0, 726.0, 193.0, 66.0, 37.0, 21.0, 11.0, 13.0, 12.0, 4.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7181053161621094, -0.7008590698242188, -0.6836128234863281, -0.6663665771484375, -0.6491203308105469, -0.6318740844726562, -0.6146278381347656, -0.597381591796875, -0.5801353454589844, -0.5628890991210938, -0.5456428527832031, -0.5283966064453125, -0.5111503601074219, -0.49390411376953125, -0.4766578674316406, -0.45941162109375, -0.4421653747558594, -0.42491912841796875, -0.4076728820800781, -0.3904266357421875, -0.3731803894042969, -0.35593414306640625, -0.3386878967285156, -0.321441650390625, -0.3041954040527344, -0.28694915771484375, -0.2697029113769531, -0.2524566650390625, -0.23521041870117188, -0.21796417236328125, -0.20071792602539062, -0.1834716796875, -0.16622543334960938, -0.14897918701171875, -0.13173294067382812, -0.1144866943359375, -0.09724044799804688, -0.07999420166015625, -0.06274795532226562, -0.045501708984375, -0.028255462646484375, -0.01100921630859375, 0.006237030029296875, 0.0234832763671875, 0.040729522705078125, 0.05797576904296875, 0.07522201538085938, 0.09246826171875, 0.10971450805664062, 0.12696075439453125, 0.14420700073242188, 0.1614532470703125, 0.17869949340820312, 0.19594573974609375, 0.21319198608398438, 0.230438232421875, 0.24768447875976562, 0.26493072509765625, 0.2821769714355469, 0.2994232177734375, 0.3166694641113281, 0.33391571044921875, 0.3511619567871094, 0.368408203125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 15.0, 76.0, 315.0, 411.0, 146.0, 22.0, 9.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.168980360031128, -2.042003631591797, -1.9150269031524658, -1.7880500555038452, -1.6610733270645142, -1.534096598625183, -1.4071197509765625, -1.2801430225372314, -1.1531662940979004, -1.0261895656585693, -0.8992127776145935, -0.7722359895706177, -0.6452592611312866, -0.5182825326919556, -0.39130574464797974, -0.2643289566040039, -0.13735222816467285, -0.01037546992301941, 0.11660128831863403, 0.24357804656028748, 0.3705548048019409, 0.497531533241272, 0.6245083212852478, 0.7514851093292236, 0.8784618377685547, 1.0054385662078857, 1.1324152946472168, 1.2593921422958374, 1.3863688707351685, 1.5133455991744995, 1.6403224468231201, 1.7672991752624512, 1.8942756652832031, 2.021252393722534, 2.1482291221618652, 2.2752058506011963, 2.4021825790405273, 2.5291595458984375, 2.6561362743377686, 2.7831130027770996, 2.9100897312164307, 3.0370664596557617, 3.1640431880950928, 3.291019916534424, 3.417996883392334, 3.544973373413086, 3.671950340270996, 3.798927068710327, 3.925903797149658, 4.052880764007568, 4.17985725402832, 4.3068342208862305, 4.433810710906982, 4.560787677764893, 4.6877641677856445, 4.814741134643555, 4.941718101501465, 5.068695068359375, 5.195671558380127, 5.322648525238037, 5.449625015258789, 5.576601982116699, 5.703578472137451, 5.830555438995361, 5.957531929016113]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 16.0, 13.0, 28.0, 30.0, 38.0, 38.0, 48.0, 53.0, 60.0, 68.0, 73.0, 65.0, 68.0, 55.0, 64.0, 50.0, 52.0, 41.0, 25.0, 26.0, 15.0, 23.0, 14.0, 4.0, 11.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8195555210113525, -1.7663153409957886, -1.7130751609802246, -1.6598351001739502, -1.6065949201583862, -1.5533547401428223, -1.5001146793365479, -1.4468744993209839, -1.39363431930542, -1.340394139289856, -1.287153959274292, -1.2339138984680176, -1.1806737184524536, -1.1274335384368896, -1.0741934776306152, -1.0209532976150513, -0.9677131175994873, -0.9144729375839233, -0.8612328171730042, -0.807992696762085, -0.754752516746521, -0.701512336730957, -0.6482722163200378, -0.5950320959091187, -0.5417919158935547, -0.4885517656803131, -0.43531161546707153, -0.38207146525382996, -0.3288313150405884, -0.2755911648273468, -0.22235101461410522, -0.16911086440086365, -0.11587071418762207, -0.0626305639743805, -0.009390413761138916, 0.04384973645210266, 0.09708988666534424, 0.15033003687858582, 0.2035701870918274, 0.25681033730506897, 0.31005048751831055, 0.3632906377315521, 0.4165307879447937, 0.4697709381580353, 0.5230110883712769, 0.5762512683868408, 0.62949138879776, 0.6827315092086792, 0.7359716892242432, 0.7892118692398071, 0.8424519896507263, 0.8956921100616455, 0.9489322900772095, 1.0021724700927734, 1.0554125308990479, 1.1086527109146118, 1.1618928909301758, 1.2151330709457397, 1.2683732509613037, 1.3216133117675781, 1.374853491783142, 1.428093671798706, 1.4813337326049805, 1.5345739126205444, 1.5878140926361084]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 12.0, 15.0, 35.0, 36.0, 45.0, 78.0, 96.0, 158.0, 274.0, 464.0, 764.0, 1701.0, 5331.0, 29863.0, 390853.0, 562894.0, 44876.0, 6750.0, 2062.0, 946.0, 494.0, 267.0, 176.0, 120.0, 70.0, 53.0, 31.0, 22.0, 15.0, 15.0, 11.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.7021484375, -1.6549835205078125, -1.607818603515625, -1.5606536865234375, -1.51348876953125, -1.4663238525390625, -1.419158935546875, -1.3719940185546875, -1.3248291015625, -1.2776641845703125, -1.230499267578125, -1.1833343505859375, -1.13616943359375, -1.0890045166015625, -1.041839599609375, -0.9946746826171875, -0.947509765625, -0.9003448486328125, -0.853179931640625, -0.8060150146484375, -0.75885009765625, -0.7116851806640625, -0.664520263671875, -0.6173553466796875, -0.5701904296875, -0.5230255126953125, -0.475860595703125, -0.4286956787109375, -0.38153076171875, -0.3343658447265625, -0.287200927734375, -0.2400360107421875, -0.19287109375, -0.1457061767578125, -0.098541259765625, -0.0513763427734375, -0.00421142578125, 0.0429534912109375, 0.090118408203125, 0.1372833251953125, 0.1844482421875, 0.2316131591796875, 0.278778076171875, 0.3259429931640625, 0.37310791015625, 0.4202728271484375, 0.467437744140625, 0.5146026611328125, 0.561767578125, 0.6089324951171875, 0.656097412109375, 0.7032623291015625, 0.75042724609375, 0.7975921630859375, 0.844757080078125, 0.8919219970703125, 0.9390869140625, 0.9862518310546875, 1.033416748046875, 1.0805816650390625, 1.12774658203125, 1.1749114990234375, 1.222076416015625, 1.2692413330078125, 1.31640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 11.0, 19.0, 25.0, 67.0, 117.0, 150.0, 172.0, 159.0, 138.0, 73.0, 40.0, 15.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.4896392822265625, -0.471954345703125, -0.4542694091796875, -0.43658447265625, -0.4188995361328125, -0.401214599609375, -0.3835296630859375, -0.3658447265625, -0.3481597900390625, -0.330474853515625, -0.3127899169921875, -0.29510498046875, -0.2774200439453125, -0.259735107421875, -0.2420501708984375, -0.224365234375, -0.2066802978515625, -0.188995361328125, -0.1713104248046875, -0.15362548828125, -0.1359405517578125, -0.118255615234375, -0.1005706787109375, -0.0828857421875, -0.0652008056640625, -0.047515869140625, -0.0298309326171875, -0.01214599609375, 0.0055389404296875, 0.023223876953125, 0.0409088134765625, 0.05859375, 0.0762786865234375, 0.093963623046875, 0.1116485595703125, 0.12933349609375, 0.1470184326171875, 0.164703369140625, 0.1823883056640625, 0.2000732421875, 0.2177581787109375, 0.235443115234375, 0.2531280517578125, 0.27081298828125, 0.2884979248046875, 0.306182861328125, 0.3238677978515625, 0.341552734375, 0.3592376708984375, 0.376922607421875, 0.3946075439453125, 0.41229248046875, 0.4299774169921875, 0.447662353515625, 0.4653472900390625, 0.4830322265625, 0.5007171630859375, 0.518402099609375, 0.5360870361328125, 0.55377197265625, 0.5714569091796875, 0.589141845703125, 0.6068267822265625, 0.62451171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 14.0, 15.0, 12.0, 16.0, 26.0, 31.0, 31.0, 66.0, 74.0, 103.0, 127.0, 203.0, 298.0, 458.0, 730.0, 1419.0, 3400.0, 9498.0, 36599.0, 198796.0, 580055.0, 169263.0, 31879.0, 8850.0, 3069.0, 1410.0, 770.0, 390.0, 246.0, 192.0, 151.0, 111.0, 59.0, 52.0, 43.0, 25.0, 19.0, 12.0, 3.0, 5.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.0372314453125, -1.003173828125, -0.9691162109375, -0.93505859375, -0.9010009765625, -0.866943359375, -0.8328857421875, -0.798828125, -0.7647705078125, -0.730712890625, -0.6966552734375, -0.66259765625, -0.6285400390625, -0.594482421875, -0.5604248046875, -0.5263671875, -0.4923095703125, -0.458251953125, -0.4241943359375, -0.39013671875, -0.3560791015625, -0.322021484375, -0.2879638671875, -0.25390625, -0.2198486328125, -0.185791015625, -0.1517333984375, -0.11767578125, -0.0836181640625, -0.049560546875, -0.0155029296875, 0.0185546875, 0.0526123046875, 0.086669921875, 0.1207275390625, 0.15478515625, 0.1888427734375, 0.222900390625, 0.2569580078125, 0.291015625, 0.3250732421875, 0.359130859375, 0.3931884765625, 0.42724609375, 0.4613037109375, 0.495361328125, 0.5294189453125, 0.5634765625, 0.5975341796875, 0.631591796875, 0.6656494140625, 0.69970703125, 0.7337646484375, 0.767822265625, 0.8018798828125, 0.8359375, 0.8699951171875, 0.904052734375, 0.9381103515625, 0.97216796875, 1.0062255859375, 1.040283203125, 1.0743408203125, 1.1083984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 11.0, 17.0, 18.0, 15.0, 22.0, 29.0, 30.0, 44.0, 42.0, 44.0, 52.0, 56.0, 66.0, 47.0, 55.0, 51.0, 44.0, 43.0, 52.0, 35.0, 44.0, 23.0, 25.0, 17.0, 13.0, 12.0, 8.0, 7.0, 12.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.46875, -1.42742919921875, -1.3861083984375, -1.34478759765625, -1.303466796875, -1.26214599609375, -1.2208251953125, -1.17950439453125, -1.13818359375, -1.09686279296875, -1.0555419921875, -1.01422119140625, -0.972900390625, -0.93157958984375, -0.8902587890625, -0.84893798828125, -0.8076171875, -0.76629638671875, -0.7249755859375, -0.68365478515625, -0.642333984375, -0.60101318359375, -0.5596923828125, -0.51837158203125, -0.47705078125, -0.43572998046875, -0.3944091796875, -0.35308837890625, -0.311767578125, -0.27044677734375, -0.2291259765625, -0.18780517578125, -0.146484375, -0.10516357421875, -0.0638427734375, -0.02252197265625, 0.018798828125, 0.06011962890625, 0.1014404296875, 0.14276123046875, 0.18408203125, 0.22540283203125, 0.2667236328125, 0.30804443359375, 0.349365234375, 0.39068603515625, 0.4320068359375, 0.47332763671875, 0.5146484375, 0.55596923828125, 0.5972900390625, 0.63861083984375, 0.679931640625, 0.72125244140625, 0.7625732421875, 0.80389404296875, 0.84521484375, 0.88653564453125, 0.9278564453125, 0.96917724609375, 1.010498046875, 1.05181884765625, 1.0931396484375, 1.13446044921875, 1.17578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 3.0, 5.0, 10.0, 11.0, 14.0, 23.0, 37.0, 69.0, 115.0, 278.0, 668.0, 1951.0, 10290.0, 294282.0, 718138.0, 18384.0, 2695.0, 884.0, 312.0, 153.0, 89.0, 40.0, 26.0, 21.0, 10.0, 14.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6494140625, -0.6278533935546875, -0.606292724609375, -0.5847320556640625, -0.56317138671875, -0.5416107177734375, -0.520050048828125, -0.4984893798828125, -0.4769287109375, -0.4553680419921875, -0.433807373046875, -0.4122467041015625, -0.39068603515625, -0.3691253662109375, -0.347564697265625, -0.3260040283203125, -0.304443359375, -0.2828826904296875, -0.261322021484375, -0.2397613525390625, -0.21820068359375, -0.1966400146484375, -0.175079345703125, -0.1535186767578125, -0.1319580078125, -0.1103973388671875, -0.088836669921875, -0.0672760009765625, -0.04571533203125, -0.0241546630859375, -0.002593994140625, 0.0189666748046875, 0.04052734375, 0.0620880126953125, 0.083648681640625, 0.1052093505859375, 0.12677001953125, 0.1483306884765625, 0.169891357421875, 0.1914520263671875, 0.2130126953125, 0.2345733642578125, 0.256134033203125, 0.2776947021484375, 0.29925537109375, 0.3208160400390625, 0.342376708984375, 0.3639373779296875, 0.385498046875, 0.4070587158203125, 0.428619384765625, 0.4501800537109375, 0.47174072265625, 0.4933013916015625, 0.514862060546875, 0.5364227294921875, 0.5579833984375, 0.5795440673828125, 0.601104736328125, 0.6226654052734375, 0.64422607421875, 0.6657867431640625, 0.687347412109375, 0.7089080810546875, 0.73046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 10.0, 13.0, 19.0, 21.0, 39.0, 40.0, 59.0, 119.0, 184.0, 177.0, 100.0, 74.0, 51.0, 32.0, 15.0, 17.0, 13.0, 7.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.0003383159637451172, -0.00033166538923978806, -0.0003250148147344589, -0.0003183642402291298, -0.00031171366572380066, -0.0003050630912184715, -0.0002984125167131424, -0.00029176194220781326, -0.00028511136770248413, -0.000278460793197155, -0.00027181021869182587, -0.00026515964418649673, -0.0002585090696811676, -0.00025185849517583847, -0.00024520792067050934, -0.0002385573461651802, -0.00023190677165985107, -0.00022525619715452194, -0.0002186056226491928, -0.00021195504814386368, -0.00020530447363853455, -0.00019865389913320541, -0.00019200332462787628, -0.00018535275012254715, -0.00017870217561721802, -0.00017205160111188889, -0.00016540102660655975, -0.00015875045210123062, -0.0001520998775959015, -0.00014544930309057236, -0.00013879872858524323, -0.0001321481540799141, -0.00012549757957458496, -0.00011884700506925583, -0.0001121964305639267, -0.00010554585605859756, -9.889528155326843e-05, -9.22447070479393e-05, -8.559413254261017e-05, -7.894355803728104e-05, -7.22929835319519e-05, -6.564240902662277e-05, -5.899183452129364e-05, -5.234126001596451e-05, -4.5690685510635376e-05, -3.9040111005306244e-05, -3.238953649997711e-05, -2.573896199464798e-05, -1.9088387489318848e-05, -1.2437812983989716e-05, -5.7872384786605835e-06, 8.633360266685486e-07, 7.513910531997681e-06, 1.4164485037326813e-05, 2.0815059542655945e-05, 2.7465634047985077e-05, 3.411620855331421e-05, 4.076678305864334e-05, 4.741735756397247e-05, 5.4067932069301605e-05, 6.071850657463074e-05, 6.736908107995987e-05, 7.4019655585289e-05, 8.067023009061813e-05, 8.732080459594727e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 13.0, 14.0, 13.0, 25.0, 40.0, 72.0, 169.0, 382.0, 971.0, 3404.0, 29954.0, 850326.0, 152663.0, 7750.0, 1672.0, 614.0, 241.0, 88.0, 37.0, 36.0, 17.0, 17.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5946044921875, -0.570556640625, -0.5465087890625, -0.5224609375, -0.4984130859375, -0.474365234375, -0.4503173828125, -0.42626953125, -0.4022216796875, -0.378173828125, -0.3541259765625, -0.330078125, -0.3060302734375, -0.281982421875, -0.2579345703125, -0.23388671875, -0.2098388671875, -0.185791015625, -0.1617431640625, -0.1376953125, -0.1136474609375, -0.089599609375, -0.0655517578125, -0.04150390625, -0.0174560546875, 0.006591796875, 0.0306396484375, 0.0546875, 0.0787353515625, 0.102783203125, 0.1268310546875, 0.15087890625, 0.1749267578125, 0.198974609375, 0.2230224609375, 0.2470703125, 0.2711181640625, 0.295166015625, 0.3192138671875, 0.34326171875, 0.3673095703125, 0.391357421875, 0.4154052734375, 0.439453125, 0.4635009765625, 0.487548828125, 0.5115966796875, 0.53564453125, 0.5596923828125, 0.583740234375, 0.6077880859375, 0.6318359375, 0.6558837890625, 0.679931640625, 0.7039794921875, 0.72802734375, 0.7520751953125, 0.776123046875, 0.8001708984375, 0.82421875, 0.8482666015625, 0.872314453125, 0.8963623046875, 0.92041015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 9.0, 9.0, 7.0, 8.0, 18.0, 13.0, 26.0, 38.0, 55.0, 75.0, 84.0, 137.0, 135.0, 118.0, 83.0, 49.0, 46.0, 23.0, 15.0, 17.0, 12.0, 8.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.55517578125, -0.5388450622558594, -0.5225143432617188, -0.5061836242675781, -0.4898529052734375, -0.4735221862792969, -0.45719146728515625, -0.4408607482910156, -0.424530029296875, -0.4081993103027344, -0.39186859130859375, -0.3755378723144531, -0.3592071533203125, -0.3428764343261719, -0.32654571533203125, -0.3102149963378906, -0.29388427734375, -0.2775535583496094, -0.26122283935546875, -0.24489212036132812, -0.2285614013671875, -0.21223068237304688, -0.19589996337890625, -0.17956924438476562, -0.163238525390625, -0.14690780639648438, -0.13057708740234375, -0.11424636840820312, -0.0979156494140625, -0.08158493041992188, -0.06525421142578125, -0.048923492431640625, -0.0325927734375, -0.016262054443359375, 6.866455078125e-05, 0.016399383544921875, 0.0327301025390625, 0.049060821533203125, 0.06539154052734375, 0.08172225952148438, 0.098052978515625, 0.11438369750976562, 0.13071441650390625, 0.14704513549804688, 0.1633758544921875, 0.17970657348632812, 0.19603729248046875, 0.21236801147460938, 0.22869873046875, 0.24502944946289062, 0.26136016845703125, 0.2776908874511719, 0.2940216064453125, 0.3103523254394531, 0.32668304443359375, 0.3430137634277344, 0.359344482421875, 0.3756752014160156, 0.39200592041015625, 0.4083366394042969, 0.4246673583984375, 0.4409980773925781, 0.45732879638671875, 0.4736595153808594, 0.489990234375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 14.0, 49.0, 131.0, 334.0, 309.0, 103.0, 29.0, 13.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.298676490783691, -9.85159683227539, -9.404518127441406, -8.957438468933105, -8.510358810424805, -8.06328010559082, -7.6162004470825195, -7.169121265411377, -6.722042083740234, -6.274962902069092, -5.827883720397949, -5.380804061889648, -4.933724880218506, -4.486645698547363, -4.0395660400390625, -3.59248685836792, -3.1454076766967773, -2.6983284950256348, -2.251249074935913, -1.804169774055481, -1.3570904731750488, -0.9100112915039062, -0.46293187141418457, -0.01585245132446289, 0.4312267303466797, 0.8783060312271118, 1.325385332107544, 1.772464632987976, 2.219543933868408, 2.666623115539551, 3.1137025356292725, 3.560781955718994, 4.00786018371582, 4.454939365386963, 4.9020185470581055, 5.349098205566406, 5.796177387237549, 6.243256568908691, 6.690336227416992, 7.137415409088135, 7.584494590759277, 8.031574249267578, 8.478652954101562, 8.925732612609863, 9.372812271118164, 9.819890975952148, 10.26697063446045, 10.71405029296875, 11.161128997802734, 11.608208656311035, 12.05528736114502, 12.50236701965332, 12.949445724487305, 13.396525382995605, 13.843605041503906, 14.29068374633789, 14.737763404846191, 15.184843063354492, 15.631921768188477, 16.07900047302246, 16.526081085205078, 16.973159790039062, 17.420238494873047, 17.867319107055664, 18.31439781188965]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 6.0, 6.0, 5.0, 15.0, 12.0, 16.0, 18.0, 32.0, 24.0, 38.0, 39.0, 31.0, 37.0, 40.0, 55.0, 53.0, 44.0, 49.0, 47.0, 43.0, 43.0, 45.0, 36.0, 29.0, 35.0, 37.0, 30.0, 15.0, 24.0, 24.0, 16.0, 16.0, 13.0, 7.0, 8.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.905524253845215, -7.677194595336914, -7.4488654136657715, -7.220535755157471, -6.992206573486328, -6.763876914978027, -6.535547256469727, -6.307218074798584, -6.078888416290283, -5.850558757781982, -5.62222957611084, -5.393899917602539, -5.1655707359313965, -4.937241077423096, -4.708911895751953, -4.480582237243652, -4.252252578735352, -4.023922920227051, -3.795593738555908, -3.5672640800476074, -3.3389346599578857, -3.110605239868164, -2.8822758197784424, -2.6539463996887207, -2.425617218017578, -2.1972877979278564, -1.9689582586288452, -1.7406288385391235, -1.5122992992401123, -1.2839698791503906, -1.055640459060669, -0.8273109197616577, -0.5989813804626465, -0.37065190076828003, -0.14232245087623596, 0.0860069990158081, 0.31433647871017456, 0.542665958404541, 0.7709953784942627, 0.9993249177932739, 1.2276543378829956, 1.4559837579727173, 1.6843132972717285, 1.9126427173614502, 2.140972137451172, 2.3693017959594727, 2.5976309776306152, 2.825960636138916, 3.0542900562286377, 3.2826194763183594, 3.510948896408081, 3.7392783164978027, 3.9676079750061035, 4.195937156677246, 4.424266815185547, 4.652596473693848, 4.88092565536499, 5.109255313873291, 5.337584495544434, 5.565914154052734, 5.794243335723877, 6.022572994232178, 6.25090217590332, 6.479231834411621, 6.707561492919922]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 9.0, 13.0, 18.0, 28.0, 46.0, 93.0, 198.0, 380.0, 933.0, 3191.0, 23649.0, 4079324.0, 77949.0, 5890.0, 1431.0, 524.0, 245.0, 123.0, 76.0, 52.0, 35.0, 17.0, 15.0, 9.0, 10.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.0350341796875, -1.958740234375, -1.8824462890625, -1.80615234375, -1.7298583984375, -1.653564453125, -1.5772705078125, -1.5009765625, -1.4246826171875, -1.348388671875, -1.2720947265625, -1.19580078125, -1.1195068359375, -1.043212890625, -0.9669189453125, -0.890625, -0.8143310546875, -0.738037109375, -0.6617431640625, -0.58544921875, -0.5091552734375, -0.432861328125, -0.3565673828125, -0.2802734375, -0.2039794921875, -0.127685546875, -0.0513916015625, 0.02490234375, 0.1011962890625, 0.177490234375, 0.2537841796875, 0.330078125, 0.4063720703125, 0.482666015625, 0.5589599609375, 0.63525390625, 0.7115478515625, 0.787841796875, 0.8641357421875, 0.9404296875, 1.0167236328125, 1.093017578125, 1.1693115234375, 1.24560546875, 1.3218994140625, 1.398193359375, 1.4744873046875, 1.55078125, 1.6270751953125, 1.703369140625, 1.7796630859375, 1.85595703125, 1.9322509765625, 2.008544921875, 2.0848388671875, 2.1611328125, 2.2374267578125, 2.313720703125, 2.3900146484375, 2.46630859375, 2.5426025390625, 2.618896484375, 2.6951904296875, 2.771484375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 14.0, 23.0, 37.0, 64.0, 100.0, 127.0, 170.0, 147.0, 121.0, 68.0, 55.0, 35.0, 18.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49169921875, -0.47399139404296875, -0.4562835693359375, -0.43857574462890625, -0.420867919921875, -0.40316009521484375, -0.3854522705078125, -0.36774444580078125, -0.35003662109375, -0.33232879638671875, -0.3146209716796875, -0.29691314697265625, -0.279205322265625, -0.26149749755859375, -0.2437896728515625, -0.22608184814453125, -0.2083740234375, -0.19066619873046875, -0.1729583740234375, -0.15525054931640625, -0.137542724609375, -0.11983489990234375, -0.1021270751953125, -0.08441925048828125, -0.06671142578125, -0.04900360107421875, -0.0312957763671875, -0.01358795166015625, 0.004119873046875, 0.02182769775390625, 0.0395355224609375, 0.05724334716796875, 0.074951171875, 0.09265899658203125, 0.1103668212890625, 0.12807464599609375, 0.145782470703125, 0.16349029541015625, 0.1811981201171875, 0.19890594482421875, 0.21661376953125, 0.23432159423828125, 0.2520294189453125, 0.26973724365234375, 0.287445068359375, 0.30515289306640625, 0.3228607177734375, 0.34056854248046875, 0.3582763671875, 0.37598419189453125, 0.3936920166015625, 0.41139984130859375, 0.429107666015625, 0.44681549072265625, 0.4645233154296875, 0.48223114013671875, 0.49993896484375, 0.5176467895507812, 0.5353546142578125, 0.5530624389648438, 0.570770263671875, 0.5884780883789062, 0.6061859130859375, 0.6238937377929688, 0.6416015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 10.0, 18.0, 16.0, 43.0, 88.0, 214.0, 682.0, 2499.0, 12292.0, 628850.0, 3528463.0, 16903.0, 2867.0, 877.0, 252.0, 98.0, 46.0, 21.0, 12.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7958984375, -1.7399139404296875, -1.683929443359375, -1.6279449462890625, -1.57196044921875, -1.5159759521484375, -1.459991455078125, -1.4040069580078125, -1.3480224609375, -1.2920379638671875, -1.236053466796875, -1.1800689697265625, -1.12408447265625, -1.0680999755859375, -1.012115478515625, -0.9561309814453125, -0.900146484375, -0.8441619873046875, -0.788177490234375, -0.7321929931640625, -0.67620849609375, -0.6202239990234375, -0.564239501953125, -0.5082550048828125, -0.4522705078125, -0.3962860107421875, -0.340301513671875, -0.2843170166015625, -0.22833251953125, -0.1723480224609375, -0.116363525390625, -0.0603790283203125, -0.00439453125, 0.0515899658203125, 0.107574462890625, 0.1635589599609375, 0.21954345703125, 0.2755279541015625, 0.331512451171875, 0.3874969482421875, 0.4434814453125, 0.4994659423828125, 0.555450439453125, 0.6114349365234375, 0.66741943359375, 0.7234039306640625, 0.779388427734375, 0.8353729248046875, 0.891357421875, 0.9473419189453125, 1.003326416015625, 1.0593109130859375, 1.11529541015625, 1.1712799072265625, 1.227264404296875, 1.2832489013671875, 1.3392333984375, 1.3952178955078125, 1.451202392578125, 1.5071868896484375, 1.56317138671875, 1.6191558837890625, 1.675140380859375, 1.7311248779296875, 1.787109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 8.0, 10.0, 18.0, 26.0, 39.0, 73.0, 186.0, 606.0, 2106.0, 543.0, 192.0, 87.0, 43.0, 32.0, 15.0, 15.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3125, -0.30255889892578125, -0.2926177978515625, -0.28267669677734375, -0.272735595703125, -0.26279449462890625, -0.2528533935546875, -0.24291229248046875, -0.23297119140625, -0.22303009033203125, -0.2130889892578125, -0.20314788818359375, -0.193206787109375, -0.18326568603515625, -0.1733245849609375, -0.16338348388671875, -0.1534423828125, -0.14350128173828125, -0.1335601806640625, -0.12361907958984375, -0.113677978515625, -0.10373687744140625, -0.0937957763671875, -0.08385467529296875, -0.07391357421875, -0.06397247314453125, -0.0540313720703125, -0.04409027099609375, -0.034149169921875, -0.02420806884765625, -0.0142669677734375, -0.00432586669921875, 0.005615234375, 0.01555633544921875, 0.0254974365234375, 0.03543853759765625, 0.045379638671875, 0.05532073974609375, 0.0652618408203125, 0.07520294189453125, 0.08514404296875, 0.09508514404296875, 0.1050262451171875, 0.11496734619140625, 0.124908447265625, 0.13484954833984375, 0.1447906494140625, 0.15473175048828125, 0.1646728515625, 0.17461395263671875, 0.1845550537109375, 0.19449615478515625, 0.204437255859375, 0.21437835693359375, 0.2243194580078125, 0.23426055908203125, 0.24420166015625, 0.25414276123046875, 0.2640838623046875, 0.27402496337890625, 0.283966064453125, 0.29390716552734375, 0.3038482666015625, 0.31378936767578125, 0.32373046875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 14.0, 39.0, 192.0, 437.0, 269.0, 44.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.591681480407715, -4.488351821899414, -4.385021686553955, -4.281692028045654, -4.1783623695373535, -4.075032711029053, -3.9717025756835938, -3.868372917175293, -3.765043258666992, -3.6617133617401123, -3.5583837032318115, -3.4550538063049316, -3.351724147796631, -3.248394250869751, -3.145064353942871, -3.0417346954345703, -2.9384047985076904, -2.8350749015808105, -2.7317452430725098, -2.62841534614563, -2.525085687637329, -2.421755790710449, -2.3184261322021484, -2.2150962352752686, -2.1117663383483887, -2.008436441421509, -1.905106782913208, -1.8017768859863281, -1.6984472274780273, -1.5951173305511475, -1.4917875528335571, -1.3884577751159668, -1.285127878189087, -1.1817981004714966, -1.0784683227539062, -0.9751384854316711, -0.8718087077140808, -0.7684789299964905, -0.6651490926742554, -0.561819314956665, -0.4584895372390747, -0.3551597595214844, -0.25182995200157166, -0.14850014448165894, -0.045170366764068604, 0.05815941095352173, 0.16148924827575684, 0.26481902599334717, 0.3681488037109375, 0.47147858142852783, 0.5748083591461182, 0.6781381964683533, 0.7814679741859436, 0.8847977519035339, 0.988127589225769, 1.0914573669433594, 1.1947871446609497, 1.29811692237854, 1.4014467000961304, 1.5047764778137207, 1.6081063747406006, 1.7114360332489014, 1.8147659301757812, 1.9180957078933716, 2.021425485610962]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 8.0, 6.0, 11.0, 14.0, 14.0, 17.0, 14.0, 24.0, 37.0, 35.0, 42.0, 46.0, 41.0, 43.0, 44.0, 60.0, 60.0, 52.0, 59.0, 44.0, 41.0, 44.0, 44.0, 27.0, 31.0, 29.0, 20.0, 22.0, 16.0, 13.0, 9.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.089052438735962, -1.0584359169006348, -1.0278193950653076, -0.9972027540206909, -0.9665862321853638, -0.9359697103500366, -0.9053531289100647, -0.8747365474700928, -0.8441200256347656, -0.8135035037994385, -0.7828869223594666, -0.7522703409194946, -0.7216538190841675, -0.6910372972488403, -0.6604207158088684, -0.6298041343688965, -0.5991876125335693, -0.5685710906982422, -0.5379545092582703, -0.5073379278182983, -0.4767214059829712, -0.44610485434532166, -0.4154883027076721, -0.3848717510700226, -0.35425519943237305, -0.3236386477947235, -0.293022096157074, -0.26240554451942444, -0.2317889928817749, -0.20117244124412537, -0.17055588960647583, -0.1399393379688263, -0.10932278633117676, -0.07870623469352722, -0.048089683055877686, -0.01747313141822815, 0.013143420219421387, 0.04375997185707092, 0.07437652349472046, 0.10499307513237, 0.13560962677001953, 0.16622617840766907, 0.1968427300453186, 0.22745928168296814, 0.2580758333206177, 0.2886923849582672, 0.31930893659591675, 0.3499254882335663, 0.3805420398712158, 0.41115859150886536, 0.4417751431465149, 0.47239169478416443, 0.503008246421814, 0.5336247682571411, 0.564241349697113, 0.594857931137085, 0.6254744529724121, 0.6560909748077393, 0.6867075562477112, 0.7173241376876831, 0.7479406595230103, 0.7785571813583374, 0.8091737627983093, 0.8397903442382812, 0.8704068660736084]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 8.0, 6.0, 28.0, 35.0, 31.0, 56.0, 104.0, 191.0, 319.0, 646.0, 1487.0, 4737.0, 28402.0, 460831.0, 512121.0, 31361.0, 5121.0, 1580.0, 662.0, 331.0, 177.0, 114.0, 68.0, 40.0, 33.0, 18.0, 11.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.923828125, -1.868896484375, -1.81396484375, -1.759033203125, -1.7041015625, -1.649169921875, -1.59423828125, -1.539306640625, -1.484375, -1.429443359375, -1.37451171875, -1.319580078125, -1.2646484375, -1.209716796875, -1.15478515625, -1.099853515625, -1.044921875, -0.989990234375, -0.93505859375, -0.880126953125, -0.8251953125, -0.770263671875, -0.71533203125, -0.660400390625, -0.60546875, -0.550537109375, -0.49560546875, -0.440673828125, -0.3857421875, -0.330810546875, -0.27587890625, -0.220947265625, -0.166015625, -0.111083984375, -0.05615234375, -0.001220703125, 0.0537109375, 0.108642578125, 0.16357421875, 0.218505859375, 0.2734375, 0.328369140625, 0.38330078125, 0.438232421875, 0.4931640625, 0.548095703125, 0.60302734375, 0.657958984375, 0.712890625, 0.767822265625, 0.82275390625, 0.877685546875, 0.9326171875, 0.987548828125, 1.04248046875, 1.097412109375, 1.15234375, 1.207275390625, 1.26220703125, 1.317138671875, 1.3720703125, 1.427001953125, 1.48193359375, 1.536865234375, 1.591796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 24.0, 24.0, 60.0, 84.0, 132.0, 139.0, 162.0, 119.0, 96.0, 71.0, 41.0, 17.0, 7.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4697456359863281, -0.45243072509765625, -0.4351158142089844, -0.4178009033203125, -0.4004859924316406, -0.38317108154296875, -0.3658561706542969, -0.348541259765625, -0.3312263488769531, -0.31391143798828125, -0.2965965270996094, -0.2792816162109375, -0.2619667053222656, -0.24465179443359375, -0.22733688354492188, -0.21002197265625, -0.19270706176757812, -0.17539215087890625, -0.15807723999023438, -0.1407623291015625, -0.12344741821289062, -0.10613250732421875, -0.08881759643554688, -0.071502685546875, -0.054187774658203125, -0.03687286376953125, -0.019557952880859375, -0.0022430419921875, 0.015071868896484375, 0.03238677978515625, 0.049701690673828125, 0.0670166015625, 0.08433151245117188, 0.10164642333984375, 0.11896133422851562, 0.1362762451171875, 0.15359115600585938, 0.17090606689453125, 0.18822097778320312, 0.205535888671875, 0.22285079956054688, 0.24016571044921875, 0.2574806213378906, 0.2747955322265625, 0.2921104431152344, 0.30942535400390625, 0.3267402648925781, 0.34405517578125, 0.3613700866699219, 0.37868499755859375, 0.3959999084472656, 0.4133148193359375, 0.4306297302246094, 0.44794464111328125, 0.4652595520019531, 0.482574462890625, 0.4998893737792969, 0.5172042846679688, 0.5345191955566406, 0.5518341064453125, 0.5691490173339844, 0.5864639282226562, 0.6037788391113281, 0.62109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 3.0, 15.0, 5.0, 16.0, 16.0, 26.0, 30.0, 55.0, 66.0, 107.0, 140.0, 221.0, 339.0, 549.0, 908.0, 1956.0, 4961.0, 17286.0, 85799.0, 460706.0, 387037.0, 65898.0, 14031.0, 4234.0, 1620.0, 883.0, 521.0, 343.0, 213.0, 171.0, 113.0, 78.0, 67.0, 30.0, 26.0, 21.0, 14.0, 10.0, 11.0, 7.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.98046875, -0.9497604370117188, -0.9190521240234375, -0.8883438110351562, -0.857635498046875, -0.8269271850585938, -0.7962188720703125, -0.7655105590820312, -0.73480224609375, -0.7040939331054688, -0.6733856201171875, -0.6426773071289062, -0.611968994140625, -0.5812606811523438, -0.5505523681640625, -0.5198440551757812, -0.4891357421875, -0.45842742919921875, -0.4277191162109375, -0.39701080322265625, -0.366302490234375, -0.33559417724609375, -0.3048858642578125, -0.27417755126953125, -0.24346923828125, -0.21276092529296875, -0.1820526123046875, -0.15134429931640625, -0.120635986328125, -0.08992767333984375, -0.0592193603515625, -0.02851104736328125, 0.002197265625, 0.03290557861328125, 0.0636138916015625, 0.09432220458984375, 0.125030517578125, 0.15573883056640625, 0.1864471435546875, 0.21715545654296875, 0.24786376953125, 0.27857208251953125, 0.3092803955078125, 0.33998870849609375, 0.370697021484375, 0.40140533447265625, 0.4321136474609375, 0.46282196044921875, 0.4935302734375, 0.5242385864257812, 0.5549468994140625, 0.5856552124023438, 0.616363525390625, 0.6470718383789062, 0.6777801513671875, 0.7084884643554688, 0.73919677734375, 0.7699050903320312, 0.8006134033203125, 0.8313217163085938, 0.862030029296875, 0.8927383422851562, 0.9234466552734375, 0.9541549682617188, 0.98486328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 6.0, 17.0, 11.0, 13.0, 8.0, 18.0, 25.0, 30.0, 32.0, 33.0, 37.0, 46.0, 50.0, 38.0, 40.0, 50.0, 55.0, 40.0, 48.0, 40.0, 35.0, 38.0, 36.0, 25.0, 26.0, 22.0, 19.0, 15.0, 25.0, 20.0, 17.0, 7.0, 11.0, 8.0, 4.0, 9.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88818359375, -0.8559799194335938, -0.8237762451171875, -0.7915725708007812, -0.759368896484375, -0.7271652221679688, -0.6949615478515625, -0.6627578735351562, -0.63055419921875, -0.5983505249023438, -0.5661468505859375, -0.5339431762695312, -0.501739501953125, -0.46953582763671875, -0.4373321533203125, -0.40512847900390625, -0.3729248046875, -0.34072113037109375, -0.3085174560546875, -0.27631378173828125, -0.244110107421875, -0.21190643310546875, -0.1797027587890625, -0.14749908447265625, -0.11529541015625, -0.08309173583984375, -0.0508880615234375, -0.01868438720703125, 0.013519287109375, 0.04572296142578125, 0.0779266357421875, 0.11013031005859375, 0.142333984375, 0.17453765869140625, 0.2067413330078125, 0.23894500732421875, 0.271148681640625, 0.30335235595703125, 0.3355560302734375, 0.36775970458984375, 0.39996337890625, 0.43216705322265625, 0.4643707275390625, 0.49657440185546875, 0.528778076171875, 0.5609817504882812, 0.5931854248046875, 0.6253890991210938, 0.6575927734375, 0.6897964477539062, 0.7220001220703125, 0.7542037963867188, 0.786407470703125, 0.8186111450195312, 0.8508148193359375, 0.8830184936523438, 0.91522216796875, 0.9474258422851562, 0.9796295166015625, 1.0118331909179688, 1.044036865234375, 1.0762405395507812, 1.1084442138671875, 1.1406478881835938, 1.1728515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 15.0, 10.0, 20.0, 34.0, 50.0, 82.0, 154.0, 337.0, 902.0, 3412.0, 33519.0, 874066.0, 127379.0, 6265.0, 1288.0, 489.0, 220.0, 120.0, 62.0, 36.0, 28.0, 16.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5846824645996094, -0.5682907104492188, -0.5518989562988281, -0.5355072021484375, -0.5191154479980469, -0.5027236938476562, -0.4863319396972656, -0.469940185546875, -0.4535484313964844, -0.43715667724609375, -0.4207649230957031, -0.4043731689453125, -0.3879814147949219, -0.37158966064453125, -0.3551979064941406, -0.33880615234375, -0.3224143981933594, -0.30602264404296875, -0.2896308898925781, -0.2732391357421875, -0.2568473815917969, -0.24045562744140625, -0.22406387329101562, -0.207672119140625, -0.19128036499023438, -0.17488861083984375, -0.15849685668945312, -0.1421051025390625, -0.12571334838867188, -0.10932159423828125, -0.09292984008789062, -0.0765380859375, -0.060146331787109375, -0.04375457763671875, -0.027362823486328125, -0.0109710693359375, 0.005420684814453125, 0.02181243896484375, 0.038204193115234375, 0.054595947265625, 0.07098770141601562, 0.08737945556640625, 0.10377120971679688, 0.1201629638671875, 0.13655471801757812, 0.15294647216796875, 0.16933822631835938, 0.18572998046875, 0.20212173461914062, 0.21851348876953125, 0.23490524291992188, 0.2512969970703125, 0.2676887512207031, 0.28408050537109375, 0.3004722595214844, 0.316864013671875, 0.3332557678222656, 0.34964752197265625, 0.3660392761230469, 0.3824310302734375, 0.3988227844238281, 0.41521453857421875, 0.4316062927246094, 0.447998046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 15.0, 6.0, 16.0, 21.0, 25.0, 37.0, 48.0, 64.0, 142.0, 166.0, 143.0, 85.0, 56.0, 38.0, 25.0, 21.0, 18.0, 13.0, 8.0, 9.0, 3.0, 3.0, 5.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014090538024902344, -0.0001371670514345169, -0.00013342872262001038, -0.00012969039380550385, -0.00012595206499099731, -0.00012221373617649078, -0.00011847540736198425, -0.00011473707854747772, -0.00011099874973297119, -0.00010726042091846466, -0.00010352209210395813, -9.97837632894516e-05, -9.604543447494507e-05, -9.230710566043854e-05, -8.856877684593201e-05, -8.483044803142548e-05, -8.109211921691895e-05, -7.735379040241241e-05, -7.361546158790588e-05, -6.987713277339935e-05, -6.613880395889282e-05, -6.240047514438629e-05, -5.866214632987976e-05, -5.492381751537323e-05, -5.11854887008667e-05, -4.744715988636017e-05, -4.370883107185364e-05, -3.997050225734711e-05, -3.6232173442840576e-05, -3.2493844628334045e-05, -2.8755515813827515e-05, -2.5017186999320984e-05, -2.1278858184814453e-05, -1.7540529370307922e-05, -1.3802200555801392e-05, -1.006387174129486e-05, -6.32554292678833e-06, -2.5872141122817993e-06, 1.1511147022247314e-06, 4.889443516731262e-06, 8.627772331237793e-06, 1.2366101145744324e-05, 1.6104429960250854e-05, 1.9842758774757385e-05, 2.3581087589263916e-05, 2.7319416403770447e-05, 3.105774521827698e-05, 3.479607403278351e-05, 3.853440284729004e-05, 4.227273166179657e-05, 4.60110604763031e-05, 4.974938929080963e-05, 5.348771810531616e-05, 5.722604691982269e-05, 6.0964375734329224e-05, 6.470270454883575e-05, 6.844103336334229e-05, 7.217936217784882e-05, 7.591769099235535e-05, 7.965601980686188e-05, 8.339434862136841e-05, 8.713267743587494e-05, 9.087100625038147e-05, 9.4609335064888e-05, 9.834766387939453e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 18.0, 16.0, 29.0, 34.0, 89.0, 186.0, 479.0, 1630.0, 9739.0, 502863.0, 520804.0, 10224.0, 1534.0, 492.0, 205.0, 75.0, 39.0, 40.0, 18.0, 12.0, 7.0, 8.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7138671875, -0.6922378540039062, -0.6706085205078125, -0.6489791870117188, -0.627349853515625, -0.6057205200195312, -0.5840911865234375, -0.5624618530273438, -0.54083251953125, -0.5192031860351562, -0.4975738525390625, -0.47594451904296875, -0.454315185546875, -0.43268585205078125, -0.4110565185546875, -0.38942718505859375, -0.3677978515625, -0.34616851806640625, -0.3245391845703125, -0.30290985107421875, -0.281280517578125, -0.25965118408203125, -0.2380218505859375, -0.21639251708984375, -0.19476318359375, -0.17313385009765625, -0.1515045166015625, -0.12987518310546875, -0.108245849609375, -0.08661651611328125, -0.0649871826171875, -0.04335784912109375, -0.021728515625, -9.918212890625e-05, 0.0215301513671875, 0.04315948486328125, 0.064788818359375, 0.08641815185546875, 0.1080474853515625, 0.12967681884765625, 0.15130615234375, 0.17293548583984375, 0.1945648193359375, 0.21619415283203125, 0.237823486328125, 0.25945281982421875, 0.2810821533203125, 0.30271148681640625, 0.3243408203125, 0.34597015380859375, 0.3675994873046875, 0.38922882080078125, 0.410858154296875, 0.43248748779296875, 0.4541168212890625, 0.47574615478515625, 0.49737548828125, 0.5190048217773438, 0.5406341552734375, 0.5622634887695312, 0.583892822265625, 0.6055221557617188, 0.6271514892578125, 0.6487808227539062, 0.67041015625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 8.0, 13.0, 30.0, 69.0, 110.0, 130.0, 193.0, 149.0, 126.0, 74.0, 35.0, 14.0, 12.0, 13.0, 5.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63037109375, -0.6136627197265625, -0.596954345703125, -0.5802459716796875, -0.56353759765625, -0.5468292236328125, -0.530120849609375, -0.5134124755859375, -0.4967041015625, -0.4799957275390625, -0.463287353515625, -0.4465789794921875, -0.42987060546875, -0.4131622314453125, -0.396453857421875, -0.3797454833984375, -0.363037109375, -0.3463287353515625, -0.329620361328125, -0.3129119873046875, -0.29620361328125, -0.2794952392578125, -0.262786865234375, -0.2460784912109375, -0.2293701171875, -0.2126617431640625, -0.195953369140625, -0.1792449951171875, -0.16253662109375, -0.1458282470703125, -0.129119873046875, -0.1124114990234375, -0.095703125, -0.0789947509765625, -0.062286376953125, -0.0455780029296875, -0.02886962890625, -0.0121612548828125, 0.004547119140625, 0.0212554931640625, 0.0379638671875, 0.0546722412109375, 0.071380615234375, 0.0880889892578125, 0.10479736328125, 0.1215057373046875, 0.138214111328125, 0.1549224853515625, 0.171630859375, 0.1883392333984375, 0.205047607421875, 0.2217559814453125, 0.23846435546875, 0.2551727294921875, 0.271881103515625, 0.2885894775390625, 0.3052978515625, 0.3220062255859375, 0.338714599609375, 0.3554229736328125, 0.37213134765625, 0.3888397216796875, 0.405548095703125, 0.4222564697265625, 0.43896484375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 7.0, 19.0, 38.0, 47.0, 95.0, 155.0, 205.0, 174.0, 128.0, 49.0, 34.0, 14.0, 14.0, 10.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.40093469619751, -5.198666572570801, -4.996398448944092, -4.794130325317383, -4.591862201690674, -4.389594078063965, -4.187325954437256, -3.985057830810547, -3.782789707183838, -3.580521583557129, -3.37825345993042, -3.175985336303711, -2.973717212677002, -2.771449089050293, -2.569180965423584, -2.366912841796875, -2.164644718170166, -1.962376594543457, -1.760108470916748, -1.557840347290039, -1.35557222366333, -1.153304100036621, -0.9510359764099121, -0.7487678527832031, -0.5464997291564941, -0.34423160552978516, -0.14196348190307617, 0.06030464172363281, 0.2625727653503418, 0.4648408889770508, 0.6671090126037598, 0.8693771362304688, 1.071645736694336, 1.273913860321045, 1.476181983947754, 1.678450107574463, 1.8807182312011719, 2.082986354827881, 2.28525447845459, 2.487522602081299, 2.689790725708008, 2.892058849334717, 3.094326972961426, 3.2965950965881348, 3.4988632202148438, 3.7011313438415527, 3.9033994674682617, 4.105667591094971, 4.30793571472168, 4.510203838348389, 4.712471961975098, 4.914740085601807, 5.117008209228516, 5.319276332855225, 5.521544456481934, 5.723812580108643, 5.926080703735352, 6.1283488273620605, 6.3306169509887695, 6.5328850746154785, 6.7351531982421875, 6.9374213218688965, 7.1396894454956055, 7.3419575691223145, 7.544225692749023]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 6.0, 13.0, 17.0, 16.0, 26.0, 21.0, 45.0, 25.0, 58.0, 56.0, 56.0, 66.0, 79.0, 62.0, 69.0, 47.0, 60.0, 59.0, 48.0, 29.0, 27.0, 25.0, 15.0, 20.0, 12.0, 7.0, 5.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.962808609008789, -8.708889961242676, -8.454971313476562, -8.20105266571045, -7.947134494781494, -7.693215847015381, -7.439297676086426, -7.1853790283203125, -6.931460380554199, -6.677541732788086, -6.423623085021973, -6.169704914093018, -5.915786266326904, -5.661867618560791, -5.407949447631836, -5.154030799865723, -4.900112152099609, -4.646193504333496, -4.392274856567383, -4.138356685638428, -3.8844380378723145, -3.630519390106201, -3.376600980758667, -3.122682571411133, -2.8687639236450195, -2.6148452758789062, -2.360926866531372, -2.107008457183838, -1.8530898094177246, -1.5991712808609009, -1.3452527523040771, -1.0913342237472534, -0.8374161720275879, -0.5834976434707642, -0.32957911491394043, -0.0756605863571167, 0.17825794219970703, 0.43217647075653076, 0.6860949993133545, 0.9400135278701782, 1.193932056427002, 1.4478505849838257, 1.7017691135406494, 1.9556876420974731, 2.209606170654297, 2.46352481842041, 2.7174432277679443, 2.9713616371154785, 3.225280284881592, 3.479198932647705, 3.7331173419952393, 3.9870357513427734, 4.240954399108887, 4.494873046875, 4.748791694641113, 5.002709865570068, 5.256628513336182, 5.510547161102295, 5.76446533203125, 6.018383979797363, 6.272302627563477, 6.52622127532959, 6.780139923095703, 7.034058094024658, 7.2879767417907715]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 10.0, 11.0, 18.0, 30.0, 33.0, 61.0, 100.0, 148.0, 289.0, 657.0, 1492.0, 4789.0, 25431.0, 2687333.0, 1441119.0, 24294.0, 4948.0, 1753.0, 767.0, 375.0, 228.0, 136.0, 70.0, 49.0, 42.0, 28.0, 20.0, 9.0, 7.0, 6.0, 14.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.669921875, -1.6080322265625, -1.546142578125, -1.4842529296875, -1.42236328125, -1.3604736328125, -1.298583984375, -1.2366943359375, -1.1748046875, -1.1129150390625, -1.051025390625, -0.9891357421875, -0.92724609375, -0.8653564453125, -0.803466796875, -0.7415771484375, -0.6796875, -0.6177978515625, -0.555908203125, -0.4940185546875, -0.43212890625, -0.3702392578125, -0.308349609375, -0.2464599609375, -0.1845703125, -0.1226806640625, -0.060791015625, 0.0010986328125, 0.06298828125, 0.1248779296875, 0.186767578125, 0.2486572265625, 0.310546875, 0.3724365234375, 0.434326171875, 0.4962158203125, 0.55810546875, 0.6199951171875, 0.681884765625, 0.7437744140625, 0.8056640625, 0.8675537109375, 0.929443359375, 0.9913330078125, 1.05322265625, 1.1151123046875, 1.177001953125, 1.2388916015625, 1.30078125, 1.3626708984375, 1.424560546875, 1.4864501953125, 1.54833984375, 1.6102294921875, 1.672119140625, 1.7340087890625, 1.7958984375, 1.8577880859375, 1.919677734375, 1.9815673828125, 2.04345703125, 2.1053466796875, 2.167236328125, 2.2291259765625, 2.291015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 15.0, 32.0, 41.0, 88.0, 90.0, 114.0, 136.0, 138.0, 126.0, 75.0, 57.0, 38.0, 13.0, 10.0, 9.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50146484375, -0.48340606689453125, -0.4653472900390625, -0.44728851318359375, -0.429229736328125, -0.41117095947265625, -0.3931121826171875, -0.37505340576171875, -0.35699462890625, -0.33893585205078125, -0.3208770751953125, -0.30281829833984375, -0.284759521484375, -0.26670074462890625, -0.2486419677734375, -0.23058319091796875, -0.2125244140625, -0.19446563720703125, -0.1764068603515625, -0.15834808349609375, -0.140289306640625, -0.12223052978515625, -0.1041717529296875, -0.08611297607421875, -0.06805419921875, -0.04999542236328125, -0.0319366455078125, -0.01387786865234375, 0.004180908203125, 0.02223968505859375, 0.0402984619140625, 0.05835723876953125, 0.076416015625, 0.09447479248046875, 0.1125335693359375, 0.13059234619140625, 0.148651123046875, 0.16670989990234375, 0.1847686767578125, 0.20282745361328125, 0.22088623046875, 0.23894500732421875, 0.2570037841796875, 0.27506256103515625, 0.293121337890625, 0.31118011474609375, 0.3292388916015625, 0.34729766845703125, 0.3653564453125, 0.38341522216796875, 0.4014739990234375, 0.41953277587890625, 0.437591552734375, 0.45565032958984375, 0.4737091064453125, 0.49176788330078125, 0.50982666015625, 0.5278854370117188, 0.5459442138671875, 0.5640029907226562, 0.582061767578125, 0.6001205444335938, 0.6181793212890625, 0.6362380981445312, 0.654296875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 12.0, 26.0, 47.0, 93.0, 177.0, 410.0, 1040.0, 5012.0, 182848.0, 3988846.0, 12714.0, 1866.0, 646.0, 265.0, 115.0, 69.0, 30.0, 18.0, 11.0, 6.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.212921142578125, -2.12506103515625, -2.037200927734375, -1.9493408203125, -1.861480712890625, -1.77362060546875, -1.685760498046875, -1.597900390625, -1.510040283203125, -1.42218017578125, -1.334320068359375, -1.2464599609375, -1.158599853515625, -1.07073974609375, -0.982879638671875, -0.89501953125, -0.807159423828125, -0.71929931640625, -0.631439208984375, -0.5435791015625, -0.455718994140625, -0.36785888671875, -0.279998779296875, -0.192138671875, -0.104278564453125, -0.01641845703125, 0.071441650390625, 0.1593017578125, 0.247161865234375, 0.33502197265625, 0.422882080078125, 0.5107421875, 0.598602294921875, 0.68646240234375, 0.774322509765625, 0.8621826171875, 0.950042724609375, 1.03790283203125, 1.125762939453125, 1.213623046875, 1.301483154296875, 1.38934326171875, 1.477203369140625, 1.5650634765625, 1.652923583984375, 1.74078369140625, 1.828643798828125, 1.91650390625, 2.004364013671875, 2.09222412109375, 2.180084228515625, 2.2679443359375, 2.355804443359375, 2.44366455078125, 2.531524658203125, 2.619384765625, 2.707244873046875, 2.79510498046875, 2.882965087890625, 2.9708251953125, 3.058685302734375, 3.14654541015625, 3.234405517578125, 3.322265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 10.0, 18.0, 28.0, 57.0, 188.0, 1219.0, 2092.0, 294.0, 70.0, 31.0, 26.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9541549682617188, -0.9224700927734375, -0.8907852172851562, -0.859100341796875, -0.8274154663085938, -0.7957305908203125, -0.7640457153320312, -0.73236083984375, -0.7006759643554688, -0.6689910888671875, -0.6373062133789062, -0.605621337890625, -0.5739364624023438, -0.5422515869140625, -0.5105667114257812, -0.4788818359375, -0.44719696044921875, -0.4155120849609375, -0.38382720947265625, -0.352142333984375, -0.32045745849609375, -0.2887725830078125, -0.25708770751953125, -0.22540283203125, -0.19371795654296875, -0.1620330810546875, -0.13034820556640625, -0.098663330078125, -0.06697845458984375, -0.0352935791015625, -0.00360870361328125, 0.028076171875, 0.05976104736328125, 0.0914459228515625, 0.12313079833984375, 0.154815673828125, 0.18650054931640625, 0.2181854248046875, 0.24987030029296875, 0.28155517578125, 0.31324005126953125, 0.3449249267578125, 0.37660980224609375, 0.408294677734375, 0.43997955322265625, 0.4716644287109375, 0.5033493041992188, 0.5350341796875, 0.5667190551757812, 0.5984039306640625, 0.6300888061523438, 0.661773681640625, 0.6934585571289062, 0.7251434326171875, 0.7568283081054688, 0.78851318359375, 0.8201980590820312, 0.8518829345703125, 0.8835678100585938, 0.915252685546875, 0.9469375610351562, 0.9786224365234375, 1.0103073120117188, 1.0419921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 3.0, 11.0, 18.0, 57.0, 129.0, 221.0, 250.0, 171.0, 67.0, 32.0, 18.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6571035385131836, -2.562452554702759, -2.467801809310913, -2.3731508255004883, -2.2785000801086426, -2.1838490962982178, -2.089198112487793, -1.9945472478866577, -1.8998963832855225, -1.8052455186843872, -1.710594654083252, -1.6159436702728271, -1.521292805671692, -1.4266419410705566, -1.3319909572601318, -1.2373400926589966, -1.1426892280578613, -1.048038363456726, -0.953387439250946, -0.858736515045166, -0.7640856504440308, -0.6694347858428955, -0.5747838616371155, -0.48013293743133545, -0.3854820728302002, -0.29083117842674255, -0.1961802840232849, -0.10152938961982727, -0.006878495216369629, 0.08777239918708801, 0.18242329359054565, 0.2770742177963257, 0.37172484397888184, 0.4663757383823395, 0.5610266327857971, 0.6556775569915771, 0.7503284215927124, 0.8449792861938477, 0.9396302103996277, 1.0342811346054077, 1.128931999206543, 1.2235828638076782, 1.3182337284088135, 1.4128847122192383, 1.5075355768203735, 1.6021864414215088, 1.6968374252319336, 1.7914882898330688, 1.886139154434204, 1.9807900190353394, 2.0754408836364746, 2.1700918674468994, 2.264742851257324, 2.35939359664917, 2.4540445804595947, 2.5486955642700195, 2.6433463096618652, 2.73799729347229, 2.8326480388641357, 2.9272990226745605, 3.0219497680664062, 3.116600751876831, 3.211251735687256, 3.3059024810791016, 3.4005534648895264]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 13.0, 19.0, 27.0, 35.0, 63.0, 85.0, 118.0, 118.0, 152.0, 82.0, 94.0, 74.0, 39.0, 36.0, 15.0, 11.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.897249698638916, -3.7748000621795654, -3.652350425720215, -3.5299010276794434, -3.4074513912200928, -3.285001754760742, -3.1625521183013916, -3.040102481842041, -2.9176530838012695, -2.795203447341919, -2.6727538108825684, -2.550304412841797, -2.4278547763824463, -2.3054051399230957, -2.182955503463745, -2.0605058670043945, -1.938056230545044, -1.8156065940856934, -1.6931570768356323, -1.5707074403762817, -1.4482579231262207, -1.3258082866668701, -1.2033586502075195, -1.080909013748169, -0.9584594964981079, -0.8360099196434021, -0.7135603427886963, -0.5911107063293457, -0.4686611294746399, -0.3462115526199341, -0.2237619161605835, -0.10131233930587769, 0.021137237548828125, 0.14358682930469513, 0.26603642106056213, 0.38848602771759033, 0.5109356045722961, 0.633385181427002, 0.7558348178863525, 0.8782843947410583, 1.0007339715957642, 1.1231836080551147, 1.2456331253051758, 1.3680827617645264, 1.490532398223877, 1.612981915473938, 1.7354315519332886, 1.8578810691833496, 1.9803307056427002, 2.102780342102051, 2.2252299785614014, 2.347679615020752, 2.4701290130615234, 2.592578649520874, 2.7150282859802246, 2.837477922439575, 2.959927558898926, 3.0823771953582764, 3.204826831817627, 3.3272762298583984, 3.449725866317749, 3.5721755027770996, 3.69462513923645, 3.817074775695801, 3.9395241737365723]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 11.0, 9.0, 21.0, 25.0, 38.0, 71.0, 132.0, 266.0, 582.0, 1348.0, 3975.0, 26566.0, 683457.0, 313892.0, 13308.0, 2809.0, 1096.0, 460.0, 221.0, 117.0, 69.0, 39.0, 17.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.63671875, -2.56707763671875, -2.4974365234375, -2.42779541015625, -2.358154296875, -2.28851318359375, -2.2188720703125, -2.14923095703125, -2.07958984375, -2.00994873046875, -1.9403076171875, -1.87066650390625, -1.801025390625, -1.73138427734375, -1.6617431640625, -1.59210205078125, -1.5224609375, -1.45281982421875, -1.3831787109375, -1.31353759765625, -1.243896484375, -1.17425537109375, -1.1046142578125, -1.03497314453125, -0.96533203125, -0.89569091796875, -0.8260498046875, -0.75640869140625, -0.686767578125, -0.61712646484375, -0.5474853515625, -0.47784423828125, -0.408203125, -0.33856201171875, -0.2689208984375, -0.19927978515625, -0.129638671875, -0.05999755859375, 0.0096435546875, 0.07928466796875, 0.14892578125, 0.21856689453125, 0.2882080078125, 0.35784912109375, 0.427490234375, 0.49713134765625, 0.5667724609375, 0.63641357421875, 0.7060546875, 0.77569580078125, 0.8453369140625, 0.91497802734375, 0.984619140625, 1.05426025390625, 1.1239013671875, 1.19354248046875, 1.26318359375, 1.33282470703125, 1.4024658203125, 1.47210693359375, 1.541748046875, 1.61138916015625, 1.6810302734375, 1.75067138671875, 1.8203125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 21.0, 37.0, 53.0, 84.0, 103.0, 119.0, 142.0, 129.0, 113.0, 71.0, 53.0, 27.0, 10.0, 7.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.474853515625, -0.4575538635253906, -0.44025421142578125, -0.4229545593261719, -0.4056549072265625, -0.3883552551269531, -0.37105560302734375, -0.3537559509277344, -0.336456298828125, -0.3191566467285156, -0.30185699462890625, -0.2845573425292969, -0.2672576904296875, -0.24995803833007812, -0.23265838623046875, -0.21535873413085938, -0.19805908203125, -0.18075942993164062, -0.16345977783203125, -0.14616012573242188, -0.1288604736328125, -0.11156082153320312, -0.09426116943359375, -0.07696151733398438, -0.059661865234375, -0.042362213134765625, -0.02506256103515625, -0.007762908935546875, 0.0095367431640625, 0.026836395263671875, 0.04413604736328125, 0.061435699462890625, 0.0787353515625, 0.09603500366210938, 0.11333465576171875, 0.13063430786132812, 0.1479339599609375, 0.16523361206054688, 0.18253326416015625, 0.19983291625976562, 0.217132568359375, 0.23443222045898438, 0.25173187255859375, 0.2690315246582031, 0.2863311767578125, 0.3036308288574219, 0.32093048095703125, 0.3382301330566406, 0.35552978515625, 0.3728294372558594, 0.39012908935546875, 0.4074287414550781, 0.4247283935546875, 0.4420280456542969, 0.45932769775390625, 0.4766273498535156, 0.493927001953125, 0.5112266540527344, 0.5285263061523438, 0.5458259582519531, 0.5631256103515625, 0.5804252624511719, 0.5977249145507812, 0.6150245666503906, 0.63232421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 6.0, 3.0, 6.0, 13.0, 9.0, 14.0, 18.0, 34.0, 55.0, 79.0, 124.0, 224.0, 483.0, 1054.0, 3060.0, 14219.0, 131048.0, 714665.0, 161128.0, 16537.0, 3424.0, 1168.0, 501.0, 246.0, 145.0, 91.0, 49.0, 45.0, 27.0, 14.0, 8.0, 12.0, 8.0, 9.0, 2.0, 7.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.658203125, -1.612823486328125, -1.56744384765625, -1.522064208984375, -1.4766845703125, -1.431304931640625, -1.38592529296875, -1.340545654296875, -1.295166015625, -1.249786376953125, -1.20440673828125, -1.159027099609375, -1.1136474609375, -1.068267822265625, -1.02288818359375, -0.977508544921875, -0.93212890625, -0.886749267578125, -0.84136962890625, -0.795989990234375, -0.7506103515625, -0.705230712890625, -0.65985107421875, -0.614471435546875, -0.569091796875, -0.523712158203125, -0.47833251953125, -0.432952880859375, -0.3875732421875, -0.342193603515625, -0.29681396484375, -0.251434326171875, -0.2060546875, -0.160675048828125, -0.11529541015625, -0.069915771484375, -0.0245361328125, 0.020843505859375, 0.06622314453125, 0.111602783203125, 0.156982421875, 0.202362060546875, 0.24774169921875, 0.293121337890625, 0.3385009765625, 0.383880615234375, 0.42926025390625, 0.474639892578125, 0.52001953125, 0.565399169921875, 0.61077880859375, 0.656158447265625, 0.7015380859375, 0.746917724609375, 0.79229736328125, 0.837677001953125, 0.883056640625, 0.928436279296875, 0.97381591796875, 1.019195556640625, 1.0645751953125, 1.109954833984375, 1.15533447265625, 1.200714111328125, 1.24609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 8.0, 10.0, 14.0, 9.0, 28.0, 26.0, 29.0, 33.0, 56.0, 48.0, 51.0, 58.0, 53.0, 53.0, 45.0, 59.0, 57.0, 48.0, 50.0, 47.0, 59.0, 32.0, 23.0, 22.0, 21.0, 10.0, 14.0, 3.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.8564453125, -1.810150146484375, -1.76385498046875, -1.717559814453125, -1.6712646484375, -1.624969482421875, -1.57867431640625, -1.532379150390625, -1.486083984375, -1.439788818359375, -1.39349365234375, -1.347198486328125, -1.3009033203125, -1.254608154296875, -1.20831298828125, -1.162017822265625, -1.11572265625, -1.069427490234375, -1.02313232421875, -0.976837158203125, -0.9305419921875, -0.884246826171875, -0.83795166015625, -0.791656494140625, -0.745361328125, -0.699066162109375, -0.65277099609375, -0.606475830078125, -0.5601806640625, -0.513885498046875, -0.46759033203125, -0.421295166015625, -0.375, -0.328704833984375, -0.28240966796875, -0.236114501953125, -0.1898193359375, -0.143524169921875, -0.09722900390625, -0.050933837890625, -0.004638671875, 0.041656494140625, 0.08795166015625, 0.134246826171875, 0.1805419921875, 0.226837158203125, 0.27313232421875, 0.319427490234375, 0.36572265625, 0.412017822265625, 0.45831298828125, 0.504608154296875, 0.5509033203125, 0.597198486328125, 0.64349365234375, 0.689788818359375, 0.736083984375, 0.782379150390625, 0.82867431640625, 0.874969482421875, 0.9212646484375, 0.967559814453125, 1.01385498046875, 1.060150146484375, 1.1064453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 18.0, 32.0, 74.0, 99.0, 267.0, 785.0, 2666.0, 17493.0, 954147.0, 66408.0, 4600.0, 1206.0, 395.0, 181.0, 67.0, 42.0, 17.0, 9.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.337890625, -1.3041763305664062, -1.2704620361328125, -1.2367477416992188, -1.203033447265625, -1.1693191528320312, -1.1356048583984375, -1.1018905639648438, -1.06817626953125, -1.0344619750976562, -1.0007476806640625, -0.9670333862304688, -0.933319091796875, -0.8996047973632812, -0.8658905029296875, -0.8321762084960938, -0.7984619140625, -0.7647476196289062, -0.7310333251953125, -0.6973190307617188, -0.663604736328125, -0.6298904418945312, -0.5961761474609375, -0.5624618530273438, -0.52874755859375, -0.49503326416015625, -0.4613189697265625, -0.42760467529296875, -0.393890380859375, -0.36017608642578125, -0.3264617919921875, -0.29274749755859375, -0.259033203125, -0.22531890869140625, -0.1916046142578125, -0.15789031982421875, -0.124176025390625, -0.09046173095703125, -0.0567474365234375, -0.02303314208984375, 0.01068115234375, 0.04439544677734375, 0.0781097412109375, 0.11182403564453125, 0.145538330078125, 0.17925262451171875, 0.2129669189453125, 0.24668121337890625, 0.2803955078125, 0.31410980224609375, 0.3478240966796875, 0.38153839111328125, 0.415252685546875, 0.44896697998046875, 0.4826812744140625, 0.5163955688476562, 0.55010986328125, 0.5838241577148438, 0.6175384521484375, 0.6512527465820312, 0.684967041015625, 0.7186813354492188, 0.7523956298828125, 0.7861099243164062, 0.81982421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 14.0, 9.0, 23.0, 16.0, 36.0, 35.0, 73.0, 118.0, 152.0, 164.0, 104.0, 59.0, 32.0, 36.0, 21.0, 16.0, 17.0, 9.0, 12.0, 10.0, 9.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00015914440155029297, -0.00015533901751041412, -0.00015153363347053528, -0.00014772824943065643, -0.0001439228653907776, -0.00014011748135089874, -0.0001363120973110199, -0.00013250671327114105, -0.0001287013292312622, -0.00012489594519138336, -0.00012109056115150452, -0.00011728517711162567, -0.00011347979307174683, -0.00010967440903186798, -0.00010586902499198914, -0.00010206364095211029, -9.825825691223145e-05, -9.44528728723526e-05, -9.064748883247375e-05, -8.684210479259491e-05, -8.303672075271606e-05, -7.923133671283722e-05, -7.542595267295837e-05, -7.162056863307953e-05, -6.781518459320068e-05, -6.400980055332184e-05, -6.020441651344299e-05, -5.639903247356415e-05, -5.25936484336853e-05, -4.878826439380646e-05, -4.498288035392761e-05, -4.117749631404877e-05, -3.737211227416992e-05, -3.356672823429108e-05, -2.976134419441223e-05, -2.5955960154533386e-05, -2.215057611465454e-05, -1.8345192074775696e-05, -1.453980803489685e-05, -1.0734423995018005e-05, -6.92903995513916e-06, -3.123655915260315e-06, 6.817281246185303e-07, 4.4871121644973755e-06, 8.29249620437622e-06, 1.2097880244255066e-05, 1.590326428413391e-05, 1.9708648324012756e-05, 2.35140323638916e-05, 2.7319416403770447e-05, 3.112480044364929e-05, 3.493018448352814e-05, 3.873556852340698e-05, 4.254095256328583e-05, 4.634633660316467e-05, 5.015172064304352e-05, 5.395710468292236e-05, 5.776248872280121e-05, 6.156787276268005e-05, 6.53732568025589e-05, 6.917864084243774e-05, 7.298402488231659e-05, 7.678940892219543e-05, 8.059479296207428e-05, 8.440017700195312e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 11.0, 18.0, 22.0, 29.0, 56.0, 119.0, 261.0, 643.0, 2321.0, 13394.0, 598927.0, 418458.0, 11243.0, 2075.0, 580.0, 195.0, 95.0, 43.0, 20.0, 13.0, 8.0, 9.0, 8.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.532867431640625, -0.50616455078125, -0.479461669921875, -0.4527587890625, -0.426055908203125, -0.39935302734375, -0.372650146484375, -0.345947265625, -0.319244384765625, -0.29254150390625, -0.265838623046875, -0.2391357421875, -0.212432861328125, -0.18572998046875, -0.159027099609375, -0.13232421875, -0.105621337890625, -0.07891845703125, -0.052215576171875, -0.0255126953125, 0.001190185546875, 0.02789306640625, 0.054595947265625, 0.081298828125, 0.108001708984375, 0.13470458984375, 0.161407470703125, 0.1881103515625, 0.214813232421875, 0.24151611328125, 0.268218994140625, 0.294921875, 0.321624755859375, 0.34832763671875, 0.375030517578125, 0.4017333984375, 0.428436279296875, 0.45513916015625, 0.481842041015625, 0.508544921875, 0.535247802734375, 0.56195068359375, 0.588653564453125, 0.6153564453125, 0.642059326171875, 0.66876220703125, 0.695465087890625, 0.72216796875, 0.748870849609375, 0.77557373046875, 0.802276611328125, 0.8289794921875, 0.855682373046875, 0.88238525390625, 0.909088134765625, 0.935791015625, 0.962493896484375, 0.98919677734375, 1.015899658203125, 1.0426025390625, 1.069305419921875, 1.09600830078125, 1.122711181640625, 1.1494140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 11.0, 15.0, 30.0, 33.0, 51.0, 84.0, 120.0, 155.0, 165.0, 111.0, 69.0, 60.0, 26.0, 14.0, 9.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.48291015625, -0.46431732177734375, -0.4457244873046875, -0.42713165283203125, -0.408538818359375, -0.38994598388671875, -0.3713531494140625, -0.35276031494140625, -0.33416748046875, -0.31557464599609375, -0.2969818115234375, -0.27838897705078125, -0.259796142578125, -0.24120330810546875, -0.2226104736328125, -0.20401763916015625, -0.1854248046875, -0.16683197021484375, -0.1482391357421875, -0.12964630126953125, -0.111053466796875, -0.09246063232421875, -0.0738677978515625, -0.05527496337890625, -0.03668212890625, -0.01808929443359375, 0.0005035400390625, 0.01909637451171875, 0.037689208984375, 0.05628204345703125, 0.0748748779296875, 0.09346771240234375, 0.112060546875, 0.13065338134765625, 0.1492462158203125, 0.16783905029296875, 0.186431884765625, 0.20502471923828125, 0.2236175537109375, 0.24221038818359375, 0.26080322265625, 0.27939605712890625, 0.2979888916015625, 0.31658172607421875, 0.335174560546875, 0.35376739501953125, 0.3723602294921875, 0.39095306396484375, 0.4095458984375, 0.42813873291015625, 0.4467315673828125, 0.46532440185546875, 0.483917236328125, 0.5025100708007812, 0.5211029052734375, 0.5396957397460938, 0.55828857421875, 0.5768814086914062, 0.5954742431640625, 0.6140670776367188, 0.632659912109375, 0.6512527465820312, 0.6698455810546875, 0.6884384155273438, 0.70703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 12.0, 19.0, 15.0, 51.0, 88.0, 170.0, 202.0, 168.0, 119.0, 65.0, 40.0, 19.0, 15.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.624582290649414, -10.381489753723145, -10.138396263122559, -9.895303726196289, -9.652210235595703, -9.409117698669434, -9.166025161743164, -8.922931671142578, -8.679839134216309, -8.436746597290039, -8.193653106689453, -7.950560569763184, -7.707467555999756, -7.464374542236328, -7.2212815284729, -6.978188514709473, -6.735095500946045, -6.492002487182617, -6.2489094734191895, -6.005816459655762, -5.762723922729492, -5.5196309089660645, -5.276537895202637, -5.033444881439209, -4.790351867675781, -4.5472588539123535, -4.304165840148926, -4.061073303222656, -3.8179802894592285, -3.574887275695801, -3.331794261932373, -3.0887012481689453, -2.845608711242676, -2.602515697479248, -2.3594229221343994, -2.1163299083709717, -1.8732370138168335, -1.6301441192626953, -1.3870511054992676, -1.1439582109451294, -0.9008653163909912, -0.657772421836853, -0.41467946767807007, -0.1715865135192871, 0.07150638103485107, 0.31459927558898926, 0.557692289352417, 0.8007851839065552, 1.0438780784606934, 1.2869709730148315, 1.5300638675689697, 1.7731568813323975, 2.016249656677246, 2.259342670440674, 2.5024356842041016, 2.7455286979675293, 2.988621473312378, 3.2317144870758057, 3.4748072624206543, 3.717900276184082, 3.9609932899475098, 4.2040863037109375, 4.447178840637207, 4.690271854400635, 4.9333648681640625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 13.0, 10.0, 9.0, 16.0, 16.0, 19.0, 23.0, 39.0, 30.0, 40.0, 39.0, 44.0, 52.0, 66.0, 47.0, 60.0, 68.0, 47.0, 55.0, 51.0, 38.0, 32.0, 28.0, 16.0, 26.0, 18.0, 23.0, 18.0, 8.0, 12.0, 10.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-8.529154777526855, -8.273794174194336, -8.0184326171875, -7.763071537017822, -7.5077104568481445, -7.252349853515625, -6.996988773345947, -6.7416276931762695, -6.486266613006592, -6.230905532836914, -5.975544452667236, -5.720183372497559, -5.464822769165039, -5.209461212158203, -4.954100608825684, -4.698739528656006, -4.443378448486328, -4.18801736831665, -3.9326562881469727, -3.677295446395874, -3.4219343662261963, -3.1665732860565186, -2.91121244430542, -2.655851364135742, -2.4004902839660645, -2.1451292037963867, -1.8897682428359985, -1.6344072818756104, -1.3790462017059326, -1.1236851215362549, -0.8683241605758667, -0.6129631996154785, -0.357602596282959, -0.10224157571792603, 0.15311944484710693, 0.4084804654121399, 0.6638414859771729, 0.9192025661468506, 1.1745635271072388, 1.429924488067627, 1.6852855682373047, 1.9406466484069824, 2.19600772857666, 2.451368570327759, 2.7067296504974365, 2.9620907306671143, 3.217451572418213, 3.4728126525878906, 3.7281737327575684, 3.983534812927246, 4.238895893096924, 4.494256973266602, 4.749617576599121, 5.004979133605957, 5.260339736938477, 5.515700817108154, 5.771061897277832, 6.02642297744751, 6.2817840576171875, 6.537145137786865, 6.792506217956543, 7.0478668212890625, 7.30322790145874, 7.558588981628418, 7.813950061798096]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 14.0, 12.0, 27.0, 54.0, 76.0, 145.0, 236.0, 475.0, 1033.0, 3987.0, 30120.0, 4038069.0, 108748.0, 7807.0, 1909.0, 703.0, 311.0, 217.0, 118.0, 72.0, 54.0, 30.0, 16.0, 14.0, 5.0, 12.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.512939453125, -1.45166015625, -1.390380859375, -1.3291015625, -1.267822265625, -1.20654296875, -1.145263671875, -1.083984375, -1.022705078125, -0.96142578125, -0.900146484375, -0.8388671875, -0.777587890625, -0.71630859375, -0.655029296875, -0.59375, -0.532470703125, -0.47119140625, -0.409912109375, -0.3486328125, -0.287353515625, -0.22607421875, -0.164794921875, -0.103515625, -0.042236328125, 0.01904296875, 0.080322265625, 0.1416015625, 0.202880859375, 0.26416015625, 0.325439453125, 0.38671875, 0.447998046875, 0.50927734375, 0.570556640625, 0.6318359375, 0.693115234375, 0.75439453125, 0.815673828125, 0.876953125, 0.938232421875, 0.99951171875, 1.060791015625, 1.1220703125, 1.183349609375, 1.24462890625, 1.305908203125, 1.3671875, 1.428466796875, 1.48974609375, 1.551025390625, 1.6123046875, 1.673583984375, 1.73486328125, 1.796142578125, 1.857421875, 1.918701171875, 1.97998046875, 2.041259765625, 2.1025390625, 2.163818359375, 2.22509765625, 2.286376953125, 2.34765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 7.0, 8.0, 28.0, 33.0, 53.0, 58.0, 80.0, 112.0, 111.0, 118.0, 109.0, 94.0, 59.0, 50.0, 28.0, 12.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.455810546875, -0.4388771057128906, -0.42194366455078125, -0.4050102233886719, -0.3880767822265625, -0.3711433410644531, -0.35420989990234375, -0.3372764587402344, -0.320343017578125, -0.3034095764160156, -0.28647613525390625, -0.2695426940917969, -0.2526092529296875, -0.23567581176757812, -0.21874237060546875, -0.20180892944335938, -0.18487548828125, -0.16794204711914062, -0.15100860595703125, -0.13407516479492188, -0.1171417236328125, -0.10020828247070312, -0.08327484130859375, -0.06634140014648438, -0.049407958984375, -0.032474517822265625, -0.01554107666015625, 0.001392364501953125, 0.0183258056640625, 0.035259246826171875, 0.05219268798828125, 0.06912612915039062, 0.0860595703125, 0.10299301147460938, 0.11992645263671875, 0.13685989379882812, 0.1537933349609375, 0.17072677612304688, 0.18766021728515625, 0.20459365844726562, 0.221527099609375, 0.23846054077148438, 0.25539398193359375, 0.2723274230957031, 0.2892608642578125, 0.3061943054199219, 0.32312774658203125, 0.3400611877441406, 0.35699462890625, 0.3739280700683594, 0.39086151123046875, 0.4077949523925781, 0.4247283935546875, 0.4416618347167969, 0.45859527587890625, 0.4755287170410156, 0.492462158203125, 0.5093955993652344, 0.5263290405273438, 0.5432624816894531, 0.5601959228515625, 0.5771293640136719, 0.5940628051757812, 0.6109962463378906, 0.6279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 9.0, 8.0, 21.0, 55.0, 97.0, 210.0, 463.0, 1074.0, 3357.0, 18676.0, 2133484.0, 2013184.0, 18354.0, 3418.0, 1073.0, 419.0, 195.0, 79.0, 40.0, 24.0, 9.0, 10.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5009765625, -1.4554901123046875, -1.410003662109375, -1.3645172119140625, -1.31903076171875, -1.2735443115234375, -1.228057861328125, -1.1825714111328125, -1.1370849609375, -1.0915985107421875, -1.046112060546875, -1.0006256103515625, -0.95513916015625, -0.9096527099609375, -0.864166259765625, -0.8186798095703125, -0.773193359375, -0.7277069091796875, -0.682220458984375, -0.6367340087890625, -0.59124755859375, -0.5457611083984375, -0.500274658203125, -0.4547882080078125, -0.4093017578125, -0.3638153076171875, -0.318328857421875, -0.2728424072265625, -0.22735595703125, -0.1818695068359375, -0.136383056640625, -0.0908966064453125, -0.04541015625, 7.62939453125e-05, 0.045562744140625, 0.0910491943359375, 0.13653564453125, 0.1820220947265625, 0.227508544921875, 0.2729949951171875, 0.3184814453125, 0.3639678955078125, 0.409454345703125, 0.4549407958984375, 0.50042724609375, 0.5459136962890625, 0.591400146484375, 0.6368865966796875, 0.682373046875, 0.7278594970703125, 0.773345947265625, 0.8188323974609375, 0.86431884765625, 0.9098052978515625, 0.955291748046875, 1.0007781982421875, 1.0462646484375, 1.0917510986328125, 1.137237548828125, 1.1827239990234375, 1.22821044921875, 1.2736968994140625, 1.319183349609375, 1.3646697998046875, 1.41015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 6.0, 7.0, 13.0, 28.0, 34.0, 63.0, 135.0, 399.0, 2146.0, 821.0, 198.0, 95.0, 48.0, 21.0, 15.0, 12.0, 5.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5462379455566406, -0.5309524536132812, -0.5156669616699219, -0.5003814697265625, -0.4850959777832031, -0.46981048583984375, -0.4545249938964844, -0.439239501953125, -0.4239540100097656, -0.40866851806640625, -0.3933830261230469, -0.3780975341796875, -0.3628120422363281, -0.34752655029296875, -0.3322410583496094, -0.31695556640625, -0.3016700744628906, -0.28638458251953125, -0.2710990905761719, -0.2558135986328125, -0.24052810668945312, -0.22524261474609375, -0.20995712280273438, -0.194671630859375, -0.17938613891601562, -0.16410064697265625, -0.14881515502929688, -0.1335296630859375, -0.11824417114257812, -0.10295867919921875, -0.08767318725585938, -0.0723876953125, -0.057102203369140625, -0.04181671142578125, -0.026531219482421875, -0.0112457275390625, 0.004039764404296875, 0.01932525634765625, 0.034610748291015625, 0.049896240234375, 0.06518173217773438, 0.08046722412109375, 0.09575271606445312, 0.1110382080078125, 0.12632369995117188, 0.14160919189453125, 0.15689468383789062, 0.17218017578125, 0.18746566772460938, 0.20275115966796875, 0.21803665161132812, 0.2333221435546875, 0.24860763549804688, 0.26389312744140625, 0.2791786193847656, 0.294464111328125, 0.3097496032714844, 0.32503509521484375, 0.3403205871582031, 0.3556060791015625, 0.3708915710449219, 0.38617706298828125, 0.4014625549316406, 0.416748046875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 32.0, 93.0, 314.0, 349.0, 138.0, 41.0, 12.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765956878662109, -4.652946949005127, -4.5399370193481445, -4.426926612854004, -4.3139166831970215, -4.200906753540039, -4.087896347045898, -3.974886417388916, -3.8618764877319336, -3.748866558074951, -3.6358563899993896, -3.522846221923828, -3.4098362922668457, -3.2968263626098633, -3.1838161945343018, -3.0708060264587402, -2.957796096801758, -2.8447861671447754, -2.731775999069214, -2.6187658309936523, -2.50575590133667, -2.3927459716796875, -2.279735803604126, -2.1667256355285645, -2.053715705871582, -1.94070565700531, -1.827695608139038, -1.7146855592727661, -1.6016755104064941, -1.4886654615402222, -1.3756554126739502, -1.2626453638076782, -1.1496353149414062, -1.0366252660751343, -0.9236152172088623, -0.8106051683425903, -0.6975951194763184, -0.5845850706100464, -0.4715750217437744, -0.35856497287750244, -0.24555492401123047, -0.1325448751449585, -0.019534826278686523, 0.09347522258758545, 0.20648527145385742, 0.3194953203201294, 0.43250536918640137, 0.5455154180526733, 0.6585254669189453, 0.7715355157852173, 0.8845455646514893, 0.9975556135177612, 1.1105656623840332, 1.2235757112503052, 1.3365857601165771, 1.4495958089828491, 1.562605857849121, 1.675615906715393, 1.788625955581665, 1.901636004447937, 2.014646053314209, 2.1276559829711914, 2.240666151046753, 2.3536763191223145, 2.466686248779297]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 12.0, 14.0, 10.0, 26.0, 25.0, 29.0, 47.0, 66.0, 60.0, 69.0, 75.0, 67.0, 76.0, 71.0, 53.0, 47.0, 58.0, 48.0, 45.0, 21.0, 20.0, 15.0, 14.0, 16.0, 11.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8561229705810547, -1.8031017780303955, -1.7500805854797363, -1.6970593929290771, -1.644038200378418, -1.5910170078277588, -1.5379959344863892, -1.48497474193573, -1.4319535493850708, -1.3789323568344116, -1.3259111642837524, -1.2728899717330933, -1.2198688983917236, -1.1668477058410645, -1.1138265132904053, -1.060805320739746, -1.007784128189087, -0.9547629356384277, -0.9017417430877686, -0.8487206101417542, -0.795699417591095, -0.7426782250404358, -0.6896570920944214, -0.6366358995437622, -0.583614706993103, -0.5305935144424438, -0.47757235169410706, -0.42455118894577026, -0.3715299963951111, -0.3185088038444519, -0.2654876410961151, -0.21246647834777832, -0.1594454050064087, -0.1064242273569107, -0.05340304970741272, -0.0003818720579147339, 0.05263930559158325, 0.10566049814224243, 0.15868166089057922, 0.21170282363891602, 0.2647240161895752, 0.3177452087402344, 0.37076637148857117, 0.42378753423690796, 0.47680872678756714, 0.5298299193382263, 0.5828510522842407, 0.6358722448348999, 0.6888934373855591, 0.7419146299362183, 0.7949358224868774, 0.8479569554328918, 0.900978147983551, 0.9539993405342102, 1.0070204734802246, 1.0600416660308838, 1.113062858581543, 1.1660840511322021, 1.2191052436828613, 1.2721264362335205, 1.3251476287841797, 1.3781688213348389, 1.4311898946762085, 1.4842110872268677, 1.5372322797775269]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 16.0, 26.0, 28.0, 40.0, 64.0, 81.0, 147.0, 187.0, 293.0, 549.0, 956.0, 1683.0, 3755.0, 12152.0, 65324.0, 509301.0, 389009.0, 47855.0, 9997.0, 3341.0, 1556.0, 829.0, 451.0, 265.0, 223.0, 141.0, 76.0, 70.0, 38.0, 26.0, 22.0, 12.0, 11.0, 6.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.259765625, -1.2146453857421875, -1.169525146484375, -1.1244049072265625, -1.07928466796875, -1.0341644287109375, -0.989044189453125, -0.9439239501953125, -0.8988037109375, -0.8536834716796875, -0.808563232421875, -0.7634429931640625, -0.71832275390625, -0.6732025146484375, -0.628082275390625, -0.5829620361328125, -0.537841796875, -0.4927215576171875, -0.447601318359375, -0.4024810791015625, -0.35736083984375, -0.3122406005859375, -0.267120361328125, -0.2220001220703125, -0.1768798828125, -0.1317596435546875, -0.086639404296875, -0.0415191650390625, 0.00360107421875, 0.0487213134765625, 0.093841552734375, 0.1389617919921875, 0.18408203125, 0.2292022705078125, 0.274322509765625, 0.3194427490234375, 0.36456298828125, 0.4096832275390625, 0.454803466796875, 0.4999237060546875, 0.5450439453125, 0.5901641845703125, 0.635284423828125, 0.6804046630859375, 0.72552490234375, 0.7706451416015625, 0.815765380859375, 0.8608856201171875, 0.906005859375, 0.9511260986328125, 0.996246337890625, 1.0413665771484375, 1.08648681640625, 1.1316070556640625, 1.176727294921875, 1.2218475341796875, 1.2669677734375, 1.3120880126953125, 1.357208251953125, 1.4023284912109375, 1.44744873046875, 1.4925689697265625, 1.537689208984375, 1.5828094482421875, 1.6279296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 12.0, 29.0, 43.0, 46.0, 66.0, 88.0, 96.0, 122.0, 119.0, 115.0, 85.0, 59.0, 48.0, 22.0, 7.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.473388671875, -0.4563255310058594, -0.43926239013671875, -0.4221992492675781, -0.4051361083984375, -0.3880729675292969, -0.37100982666015625, -0.3539466857910156, -0.336883544921875, -0.3198204040527344, -0.30275726318359375, -0.2856941223144531, -0.2686309814453125, -0.2515678405761719, -0.23450469970703125, -0.21744155883789062, -0.20037841796875, -0.18331527709960938, -0.16625213623046875, -0.14918899536132812, -0.1321258544921875, -0.11506271362304688, -0.09799957275390625, -0.08093643188476562, -0.063873291015625, -0.046810150146484375, -0.02974700927734375, -0.012683868408203125, 0.0043792724609375, 0.021442413330078125, 0.03850555419921875, 0.055568695068359375, 0.0726318359375, 0.08969497680664062, 0.10675811767578125, 0.12382125854492188, 0.1408843994140625, 0.15794754028320312, 0.17501068115234375, 0.19207382202148438, 0.209136962890625, 0.22620010375976562, 0.24326324462890625, 0.2603263854980469, 0.2773895263671875, 0.2944526672363281, 0.31151580810546875, 0.3285789489746094, 0.34564208984375, 0.3627052307128906, 0.37976837158203125, 0.3968315124511719, 0.4138946533203125, 0.4309577941894531, 0.44802093505859375, 0.4650840759277344, 0.482147216796875, 0.4992103576660156, 0.5162734985351562, 0.5333366394042969, 0.5503997802734375, 0.5674629211425781, 0.5845260620117188, 0.6015892028808594, 0.61865234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 7.0, 7.0, 10.0, 16.0, 18.0, 45.0, 48.0, 57.0, 87.0, 151.0, 244.0, 376.0, 730.0, 1439.0, 3758.0, 14317.0, 82607.0, 487600.0, 382066.0, 58165.0, 10800.0, 3188.0, 1231.0, 574.0, 343.0, 218.0, 136.0, 100.0, 71.0, 43.0, 38.0, 17.0, 12.0, 11.0, 3.0, 3.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0697021484375, -1.033935546875, -0.9981689453125, -0.96240234375, -0.9266357421875, -0.890869140625, -0.8551025390625, -0.8193359375, -0.7835693359375, -0.747802734375, -0.7120361328125, -0.67626953125, -0.6405029296875, -0.604736328125, -0.5689697265625, -0.533203125, -0.4974365234375, -0.461669921875, -0.4259033203125, -0.39013671875, -0.3543701171875, -0.318603515625, -0.2828369140625, -0.2470703125, -0.2113037109375, -0.175537109375, -0.1397705078125, -0.10400390625, -0.0682373046875, -0.032470703125, 0.0032958984375, 0.0390625, 0.0748291015625, 0.110595703125, 0.1463623046875, 0.18212890625, 0.2178955078125, 0.253662109375, 0.2894287109375, 0.3251953125, 0.3609619140625, 0.396728515625, 0.4324951171875, 0.46826171875, 0.5040283203125, 0.539794921875, 0.5755615234375, 0.611328125, 0.6470947265625, 0.682861328125, 0.7186279296875, 0.75439453125, 0.7901611328125, 0.825927734375, 0.8616943359375, 0.8974609375, 0.9332275390625, 0.968994140625, 1.0047607421875, 1.04052734375, 1.0762939453125, 1.112060546875, 1.1478271484375, 1.18359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 5.0, 5.0, 9.0, 9.0, 16.0, 8.0, 22.0, 25.0, 36.0, 32.0, 55.0, 43.0, 43.0, 52.0, 61.0, 42.0, 58.0, 64.0, 56.0, 42.0, 47.0, 35.0, 45.0, 54.0, 28.0, 20.0, 22.0, 13.0, 8.0, 14.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.47332763671875, -1.4271240234375, -1.38092041015625, -1.334716796875, -1.28851318359375, -1.2423095703125, -1.19610595703125, -1.14990234375, -1.10369873046875, -1.0574951171875, -1.01129150390625, -0.965087890625, -0.91888427734375, -0.8726806640625, -0.82647705078125, -0.7802734375, -0.73406982421875, -0.6878662109375, -0.64166259765625, -0.595458984375, -0.54925537109375, -0.5030517578125, -0.45684814453125, -0.41064453125, -0.36444091796875, -0.3182373046875, -0.27203369140625, -0.225830078125, -0.17962646484375, -0.1334228515625, -0.08721923828125, -0.041015625, 0.00518798828125, 0.0513916015625, 0.09759521484375, 0.143798828125, 0.19000244140625, 0.2362060546875, 0.28240966796875, 0.32861328125, 0.37481689453125, 0.4210205078125, 0.46722412109375, 0.513427734375, 0.55963134765625, 0.6058349609375, 0.65203857421875, 0.6982421875, 0.74444580078125, 0.7906494140625, 0.83685302734375, 0.883056640625, 0.92926025390625, 0.9754638671875, 1.02166748046875, 1.06787109375, 1.11407470703125, 1.1602783203125, 1.20648193359375, 1.252685546875, 1.29888916015625, 1.3450927734375, 1.39129638671875, 1.4375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 11.0, 11.0, 12.0, 22.0, 40.0, 60.0, 141.0, 276.0, 766.0, 2270.0, 12692.0, 273368.0, 722191.0, 31028.0, 3865.0, 1038.0, 389.0, 179.0, 89.0, 40.0, 23.0, 14.0, 13.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.62890625, -0.608734130859375, -0.58856201171875, -0.568389892578125, -0.5482177734375, -0.528045654296875, -0.50787353515625, -0.487701416015625, -0.467529296875, -0.447357177734375, -0.42718505859375, -0.407012939453125, -0.3868408203125, -0.366668701171875, -0.34649658203125, -0.326324462890625, -0.30615234375, -0.285980224609375, -0.26580810546875, -0.245635986328125, -0.2254638671875, -0.205291748046875, -0.18511962890625, -0.164947509765625, -0.144775390625, -0.124603271484375, -0.10443115234375, -0.084259033203125, -0.0640869140625, -0.043914794921875, -0.02374267578125, -0.003570556640625, 0.0166015625, 0.036773681640625, 0.05694580078125, 0.077117919921875, 0.0972900390625, 0.117462158203125, 0.13763427734375, 0.157806396484375, 0.177978515625, 0.198150634765625, 0.21832275390625, 0.238494873046875, 0.2586669921875, 0.278839111328125, 0.29901123046875, 0.319183349609375, 0.33935546875, 0.359527587890625, 0.37969970703125, 0.399871826171875, 0.4200439453125, 0.440216064453125, 0.46038818359375, 0.480560302734375, 0.500732421875, 0.520904541015625, 0.54107666015625, 0.561248779296875, 0.5814208984375, 0.601593017578125, 0.62176513671875, 0.641937255859375, 0.662109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 8.0, 7.0, 7.0, 8.0, 13.0, 18.0, 24.0, 34.0, 34.0, 52.0, 56.0, 65.0, 86.0, 98.0, 107.0, 85.0, 56.0, 55.0, 27.0, 22.0, 20.0, 15.0, 14.0, 16.0, 8.0, 6.0, 7.0, 6.0, 4.0, 5.0, 4.0, 8.0, 3.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.21487808227539e-05, -8.963234722614288e-05, -8.711591362953186e-05, -8.459948003292084e-05, -8.208304643630981e-05, -7.956661283969879e-05, -7.705017924308777e-05, -7.453374564647675e-05, -7.201731204986572e-05, -6.95008784532547e-05, -6.698444485664368e-05, -6.446801126003265e-05, -6.195157766342163e-05, -5.943514406681061e-05, -5.6918710470199585e-05, -5.440227687358856e-05, -5.188584327697754e-05, -4.9369409680366516e-05, -4.685297608375549e-05, -4.433654248714447e-05, -4.182010889053345e-05, -3.9303675293922424e-05, -3.67872416973114e-05, -3.427080810070038e-05, -3.1754374504089355e-05, -2.9237940907478333e-05, -2.672150731086731e-05, -2.4205073714256287e-05, -2.1688640117645264e-05, -1.917220652103424e-05, -1.6655772924423218e-05, -1.4139339327812195e-05, -1.1622905731201172e-05, -9.106472134590149e-06, -6.590038537979126e-06, -4.073604941368103e-06, -1.55717134475708e-06, 9.592622518539429e-07, 3.475695848464966e-06, 5.992129445075989e-06, 8.508563041687012e-06, 1.1024996638298035e-05, 1.3541430234909058e-05, 1.605786383152008e-05, 1.8574297428131104e-05, 2.1090731024742126e-05, 2.360716462135315e-05, 2.6123598217964172e-05, 2.8640031814575195e-05, 3.115646541118622e-05, 3.367289900779724e-05, 3.6189332604408264e-05, 3.870576620101929e-05, 4.122219979763031e-05, 4.373863339424133e-05, 4.6255066990852356e-05, 4.877150058746338e-05, 5.12879341840744e-05, 5.3804367780685425e-05, 5.632080137729645e-05, 5.883723497390747e-05, 6.13536685705185e-05, 6.387010216712952e-05, 6.638653576374054e-05, 6.890296936035156e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 5.0, 8.0, 15.0, 24.0, 31.0, 50.0, 82.0, 123.0, 222.0, 430.0, 927.0, 2479.0, 9125.0, 53985.0, 478992.0, 440188.0, 49239.0, 8406.0, 2318.0, 901.0, 391.0, 217.0, 125.0, 81.0, 55.0, 33.0, 29.0, 18.0, 8.0, 5.0, 9.0, 4.0, 7.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.3617820739746094, -0.34929656982421875, -0.3368110656738281, -0.3243255615234375, -0.3118400573730469, -0.29935455322265625, -0.2868690490722656, -0.274383544921875, -0.2618980407714844, -0.24941253662109375, -0.23692703247070312, -0.2244415283203125, -0.21195602416992188, -0.19947052001953125, -0.18698501586914062, -0.17449951171875, -0.16201400756835938, -0.14952850341796875, -0.13704299926757812, -0.1245574951171875, -0.11207199096679688, -0.09958648681640625, -0.08710098266601562, -0.074615478515625, -0.062129974365234375, -0.04964447021484375, -0.037158966064453125, -0.0246734619140625, -0.012187957763671875, 0.00029754638671875, 0.012783050537109375, 0.0252685546875, 0.037754058837890625, 0.05023956298828125, 0.06272506713867188, 0.0752105712890625, 0.08769607543945312, 0.10018157958984375, 0.11266708374023438, 0.125152587890625, 0.13763809204101562, 0.15012359619140625, 0.16260910034179688, 0.1750946044921875, 0.18758010864257812, 0.20006561279296875, 0.21255111694335938, 0.22503662109375, 0.23752212524414062, 0.25000762939453125, 0.2624931335449219, 0.2749786376953125, 0.2874641418457031, 0.29994964599609375, 0.3124351501464844, 0.324920654296875, 0.3374061584472656, 0.34989166259765625, 0.3623771667480469, 0.3748626708984375, 0.3873481750488281, 0.39983367919921875, 0.4123191833496094, 0.4248046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 3.0, 5.0, 13.0, 8.0, 17.0, 19.0, 22.0, 39.0, 40.0, 58.0, 67.0, 107.0, 98.0, 108.0, 89.0, 75.0, 56.0, 37.0, 35.0, 23.0, 28.0, 8.0, 12.0, 3.0, 6.0, 3.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279052734375, -0.266937255859375, -0.25482177734375, -0.242706298828125, -0.2305908203125, -0.218475341796875, -0.20635986328125, -0.194244384765625, -0.18212890625, -0.170013427734375, -0.15789794921875, -0.145782470703125, -0.1336669921875, -0.121551513671875, -0.10943603515625, -0.097320556640625, -0.085205078125, -0.073089599609375, -0.06097412109375, -0.048858642578125, -0.0367431640625, -0.024627685546875, -0.01251220703125, -0.000396728515625, 0.01171875, 0.023834228515625, 0.03594970703125, 0.048065185546875, 0.0601806640625, 0.072296142578125, 0.08441162109375, 0.096527099609375, 0.108642578125, 0.120758056640625, 0.13287353515625, 0.144989013671875, 0.1571044921875, 0.169219970703125, 0.18133544921875, 0.193450927734375, 0.20556640625, 0.217681884765625, 0.22979736328125, 0.241912841796875, 0.2540283203125, 0.266143798828125, 0.27825927734375, 0.290374755859375, 0.302490234375, 0.314605712890625, 0.32672119140625, 0.338836669921875, 0.3509521484375, 0.363067626953125, 0.37518310546875, 0.387298583984375, 0.3994140625, 0.411529541015625, 0.42364501953125, 0.435760498046875, 0.4478759765625, 0.459991455078125, 0.47210693359375, 0.484222412109375, 0.496337890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 10.0, 18.0, 25.0, 36.0, 57.0, 97.0, 120.0, 163.0, 133.0, 107.0, 77.0, 62.0, 32.0, 17.0, 10.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.429243087768555, -7.225990295410156, -7.022737979888916, -6.819485664367676, -6.616232872009277, -6.412980079650879, -6.209727764129639, -6.006475448608398, -5.80322265625, -5.599969863891602, -5.396717548370361, -5.193465232849121, -4.990212440490723, -4.786959648132324, -4.583707332611084, -4.380455017089844, -4.177202224731445, -3.973949670791626, -3.7706971168518066, -3.5674445629119873, -3.364192008972168, -3.1609394550323486, -2.9576869010925293, -2.75443434715271, -2.5511817932128906, -2.3479292392730713, -2.144676685333252, -1.9414241313934326, -1.7381715774536133, -1.534919023513794, -1.3316664695739746, -1.1284139156341553, -0.9251613616943359, -0.7219088077545166, -0.5186562538146973, -0.31540369987487793, -0.1121511459350586, 0.09110140800476074, 0.2943539619445801, 0.4976065158843994, 0.7008590698242188, 0.9041116237640381, 1.1073641777038574, 1.3106167316436768, 1.513869285583496, 1.7171218395233154, 1.9203743934631348, 2.123626947402954, 2.3268795013427734, 2.5301320552825928, 2.733384609222412, 2.9366371631622314, 3.139889717102051, 3.34314227104187, 3.5463948249816895, 3.749647378921509, 3.952899932861328, 4.156152725219727, 4.359405040740967, 4.562657356262207, 4.7659101486206055, 4.969162940979004, 5.172415256500244, 5.375667572021484, 5.578920364379883]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 9.0, 9.0, 15.0, 14.0, 6.0, 15.0, 23.0, 21.0, 37.0, 35.0, 29.0, 40.0, 42.0, 47.0, 45.0, 41.0, 47.0, 48.0, 55.0, 47.0, 49.0, 32.0, 45.0, 30.0, 31.0, 30.0, 24.0, 21.0, 23.0, 21.0, 12.0, 10.0, 13.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.620080947875977, -8.367776870727539, -8.115472793579102, -7.863168716430664, -7.610864162445068, -7.358560085296631, -7.106256008148193, -6.853951930999756, -6.60164737701416, -6.349343299865723, -6.097039222717285, -5.844735145568848, -5.592430591583252, -5.3401265144348145, -5.087822437286377, -4.8355183601379395, -4.583214282989502, -4.3309102058410645, -4.078606128692627, -3.8263018131256104, -3.5739974975585938, -3.3216934204101562, -3.0693893432617188, -2.8170852661132812, -2.5647809505462646, -2.312476873397827, -2.0601725578308105, -1.807868480682373, -1.555564284324646, -1.303260087966919, -1.0509560108184814, -0.7986518144607544, -0.5463480949401855, -0.2940439283847809, -0.04173976182937622, 0.21056437492370605, 0.4628685712814331, 0.7151727676391602, 0.9674768447875977, 1.2197810411453247, 1.4720852375030518, 1.7243894338607788, 1.9766936302185059, 2.2289977073669434, 2.481301784515381, 2.7336061000823975, 2.985910177230835, 3.2382144927978516, 3.490518569946289, 3.7428226470947266, 3.995126962661743, 4.247430801391602, 4.499735355377197, 4.752039432525635, 5.004343509674072, 5.25664758682251, 5.5089521408081055, 5.761256217956543, 6.0135602951049805, 6.265864372253418, 6.518168926239014, 6.770473003387451, 7.022777080535889, 7.275081157684326, 7.527385234832764]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 16.0, 17.0, 15.0, 35.0, 31.0, 65.0, 79.0, 108.0, 182.0, 351.0, 687.0, 1464.0, 3535.0, 11537.0, 93108.0, 3990981.0, 74893.0, 10438.0, 3533.0, 1463.0, 683.0, 362.0, 212.0, 133.0, 97.0, 63.0, 39.0, 34.0, 23.0, 16.0, 18.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5966796875, -1.5424957275390625, -1.488311767578125, -1.4341278076171875, -1.37994384765625, -1.3257598876953125, -1.271575927734375, -1.2173919677734375, -1.1632080078125, -1.1090240478515625, -1.054840087890625, -1.0006561279296875, -0.94647216796875, -0.8922882080078125, -0.838104248046875, -0.7839202880859375, -0.729736328125, -0.6755523681640625, -0.621368408203125, -0.5671844482421875, -0.51300048828125, -0.4588165283203125, -0.404632568359375, -0.3504486083984375, -0.2962646484375, -0.2420806884765625, -0.187896728515625, -0.1337127685546875, -0.07952880859375, -0.0253448486328125, 0.028839111328125, 0.0830230712890625, 0.13720703125, 0.1913909912109375, 0.245574951171875, 0.2997589111328125, 0.35394287109375, 0.4081268310546875, 0.462310791015625, 0.5164947509765625, 0.5706787109375, 0.6248626708984375, 0.679046630859375, 0.7332305908203125, 0.78741455078125, 0.8415985107421875, 0.895782470703125, 0.9499664306640625, 1.004150390625, 1.0583343505859375, 1.112518310546875, 1.1667022705078125, 1.22088623046875, 1.2750701904296875, 1.329254150390625, 1.3834381103515625, 1.4376220703125, 1.4918060302734375, 1.545989990234375, 1.6001739501953125, 1.65435791015625, 1.7085418701171875, 1.762725830078125, 1.8169097900390625, 1.87109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 15.0, 29.0, 44.0, 48.0, 68.0, 88.0, 106.0, 104.0, 108.0, 103.0, 89.0, 54.0, 39.0, 32.0, 18.0, 11.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60009765625, -0.5811691284179688, -0.5622406005859375, -0.5433120727539062, -0.524383544921875, -0.5054550170898438, -0.4865264892578125, -0.46759796142578125, -0.44866943359375, -0.42974090576171875, -0.4108123779296875, -0.39188385009765625, -0.372955322265625, -0.35402679443359375, -0.3350982666015625, -0.31616973876953125, -0.2972412109375, -0.27831268310546875, -0.2593841552734375, -0.24045562744140625, -0.221527099609375, -0.20259857177734375, -0.1836700439453125, -0.16474151611328125, -0.14581298828125, -0.12688446044921875, -0.1079559326171875, -0.08902740478515625, -0.070098876953125, -0.05117034912109375, -0.0322418212890625, -0.01331329345703125, 0.005615234375, 0.02454376220703125, 0.0434722900390625, 0.06240081787109375, 0.081329345703125, 0.10025787353515625, 0.1191864013671875, 0.13811492919921875, 0.15704345703125, 0.17597198486328125, 0.1949005126953125, 0.21382904052734375, 0.232757568359375, 0.25168609619140625, 0.2706146240234375, 0.28954315185546875, 0.3084716796875, 0.32740020751953125, 0.3463287353515625, 0.36525726318359375, 0.384185791015625, 0.40311431884765625, 0.4220428466796875, 0.44097137451171875, 0.45989990234375, 0.47882843017578125, 0.4977569580078125, 0.5166854858398438, 0.535614013671875, 0.5545425415039062, 0.5734710693359375, 0.5923995971679688, 0.611328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 14.0, 39.0, 79.0, 294.0, 994.0, 4326.0, 53940.0, 4089738.0, 39631.0, 3854.0, 940.0, 280.0, 88.0, 33.0, 17.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.50225830078125, -1.4322509765625, -1.36224365234375, -1.292236328125, -1.22222900390625, -1.1522216796875, -1.08221435546875, -1.01220703125, -0.94219970703125, -0.8721923828125, -0.80218505859375, -0.732177734375, -0.66217041015625, -0.5921630859375, -0.52215576171875, -0.4521484375, -0.38214111328125, -0.3121337890625, -0.24212646484375, -0.172119140625, -0.10211181640625, -0.0321044921875, 0.03790283203125, 0.10791015625, 0.17791748046875, 0.2479248046875, 0.31793212890625, 0.387939453125, 0.45794677734375, 0.5279541015625, 0.59796142578125, 0.66796875, 0.73797607421875, 0.8079833984375, 0.87799072265625, 0.947998046875, 1.01800537109375, 1.0880126953125, 1.15802001953125, 1.22802734375, 1.29803466796875, 1.3680419921875, 1.43804931640625, 1.508056640625, 1.57806396484375, 1.6480712890625, 1.71807861328125, 1.7880859375, 1.85809326171875, 1.9281005859375, 1.99810791015625, 2.068115234375, 2.13812255859375, 2.2081298828125, 2.27813720703125, 2.34814453125, 2.41815185546875, 2.4881591796875, 2.55816650390625, 2.628173828125, 2.69818115234375, 2.7681884765625, 2.83819580078125, 2.908203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 3.0, 11.0, 19.0, 28.0, 52.0, 104.0, 224.0, 1195.0, 1769.0, 327.0, 121.0, 71.0, 47.0, 26.0, 15.0, 11.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.564453125, -0.54571533203125, -0.5269775390625, -0.50823974609375, -0.489501953125, -0.47076416015625, -0.4520263671875, -0.43328857421875, -0.41455078125, -0.39581298828125, -0.3770751953125, -0.35833740234375, -0.339599609375, -0.32086181640625, -0.3021240234375, -0.28338623046875, -0.2646484375, -0.24591064453125, -0.2271728515625, -0.20843505859375, -0.189697265625, -0.17095947265625, -0.1522216796875, -0.13348388671875, -0.11474609375, -0.09600830078125, -0.0772705078125, -0.05853271484375, -0.039794921875, -0.02105712890625, -0.0023193359375, 0.01641845703125, 0.03515625, 0.05389404296875, 0.0726318359375, 0.09136962890625, 0.110107421875, 0.12884521484375, 0.1475830078125, 0.16632080078125, 0.18505859375, 0.20379638671875, 0.2225341796875, 0.24127197265625, 0.260009765625, 0.27874755859375, 0.2974853515625, 0.31622314453125, 0.3349609375, 0.35369873046875, 0.3724365234375, 0.39117431640625, 0.409912109375, 0.42864990234375, 0.4473876953125, 0.46612548828125, 0.48486328125, 0.50360107421875, 0.5223388671875, 0.54107666015625, 0.559814453125, 0.57855224609375, 0.5972900390625, 0.61602783203125, 0.634765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 16.0, 134.0, 597.0, 234.0, 21.0, 9.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443396806716919, -2.1563329696655273, -1.8692693710327148, -1.5822056531906128, -1.2951419353485107, -1.0080782175064087, -0.7210144996643066, -0.43395066261291504, -0.14688706398010254, 0.1401766538619995, 0.42724037170410156, 0.7143040895462036, 1.0013678073883057, 1.2884315252304077, 1.5754952430725098, 1.8625590801239014, 2.149622678756714, 2.4366865158081055, 2.723750114440918, 3.0108137130737305, 3.297877550125122, 3.5849413871765137, 3.872004985809326, 4.159069061279297, 4.446132659912109, 4.733196258544922, 5.020259857177734, 5.307323932647705, 5.594387531280518, 5.88145112991333, 6.168515205383301, 6.455578804016113, 6.742642402648926, 7.029706001281738, 7.316769599914551, 7.6038336753845215, 7.890897274017334, 8.177961349487305, 8.465024948120117, 8.75208854675293, 9.039152145385742, 9.326215744018555, 9.613279342651367, 9.90034294128418, 10.187406539916992, 10.474471092224121, 10.761534690856934, 11.048598289489746, 11.335661888122559, 11.622725486755371, 11.909789085388184, 12.196852684020996, 12.483917236328125, 12.770980834960938, 13.05804443359375, 13.345108032226562, 13.632171630859375, 13.919235229492188, 14.206298828125, 14.493362426757812, 14.780426025390625, 15.067490577697754, 15.354554176330566, 15.641617774963379, 15.928681373596191]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 4.0, 5.0, 9.0, 18.0, 16.0, 26.0, 26.0, 31.0, 24.0, 38.0, 37.0, 35.0, 42.0, 55.0, 58.0, 50.0, 36.0, 44.0, 57.0, 45.0, 49.0, 33.0, 33.0, 39.0, 31.0, 24.0, 18.0, 18.0, 13.0, 16.0, 16.0, 9.0, 7.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7116096019744873, -1.6607743501663208, -1.6099392175674438, -1.5591039657592773, -1.5082688331604004, -1.4574335813522339, -1.4065983295440674, -1.3557631969451904, -1.304927945137024, -1.2540926933288574, -1.2032575607299805, -1.152422308921814, -1.1015870571136475, -1.0507519245147705, -0.999916672706604, -0.9490814805030823, -0.8982462882995605, -0.8474110960960388, -0.7965759038925171, -0.7457406520843506, -0.6949054598808289, -0.6440702676773071, -0.5932350158691406, -0.5423998236656189, -0.49156463146209717, -0.44072943925857544, -0.3898942172527313, -0.3390589952468872, -0.2882238030433655, -0.23738861083984375, -0.18655338883399963, -0.13571816682815552, -0.08488297462463379, -0.03404776751995087, 0.016787439584732056, 0.06762264668941498, 0.1184578537940979, 0.16929304599761963, 0.22012826800346375, 0.27096349000930786, 0.3217986822128296, 0.3726338744163513, 0.42346909642219543, 0.47430431842803955, 0.5251395106315613, 0.575974702835083, 0.6268099546432495, 0.6776451468467712, 0.728480339050293, 0.7793155312538147, 0.8301507234573364, 0.8809859752655029, 0.9318211674690247, 0.9826563596725464, 1.033491611480713, 1.0843267440795898, 1.1351619958877563, 1.1859972476959229, 1.2368323802947998, 1.2876676321029663, 1.3385028839111328, 1.3893380165100098, 1.4401732683181763, 1.4910085201263428, 1.5418436527252197]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 13.0, 16.0, 15.0, 30.0, 42.0, 69.0, 84.0, 171.0, 279.0, 542.0, 1181.0, 2723.0, 9471.0, 56675.0, 668246.0, 274137.0, 25540.0, 5519.0, 1905.0, 787.0, 452.0, 233.0, 134.0, 80.0, 66.0, 43.0, 22.0, 6.0, 14.0, 8.0, 10.0, 5.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6953125, -1.6402740478515625, -1.585235595703125, -1.5301971435546875, -1.47515869140625, -1.4201202392578125, -1.365081787109375, -1.3100433349609375, -1.2550048828125, -1.1999664306640625, -1.144927978515625, -1.0898895263671875, -1.03485107421875, -0.9798126220703125, -0.924774169921875, -0.8697357177734375, -0.814697265625, -0.7596588134765625, -0.704620361328125, -0.6495819091796875, -0.59454345703125, -0.5395050048828125, -0.484466552734375, -0.4294281005859375, -0.3743896484375, -0.3193511962890625, -0.264312744140625, -0.2092742919921875, -0.15423583984375, -0.0991973876953125, -0.044158935546875, 0.0108795166015625, 0.06591796875, 0.1209564208984375, 0.175994873046875, 0.2310333251953125, 0.28607177734375, 0.3411102294921875, 0.396148681640625, 0.4511871337890625, 0.5062255859375, 0.5612640380859375, 0.616302490234375, 0.6713409423828125, 0.72637939453125, 0.7814178466796875, 0.836456298828125, 0.8914947509765625, 0.946533203125, 1.0015716552734375, 1.056610107421875, 1.1116485595703125, 1.16668701171875, 1.2217254638671875, 1.276763916015625, 1.3318023681640625, 1.3868408203125, 1.4418792724609375, 1.496917724609375, 1.5519561767578125, 1.60699462890625, 1.6620330810546875, 1.717071533203125, 1.7721099853515625, 1.8271484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 8.0, 17.0, 40.0, 33.0, 68.0, 77.0, 92.0, 108.0, 124.0, 106.0, 77.0, 82.0, 55.0, 39.0, 22.0, 9.0, 11.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.64453125, -0.625152587890625, -0.60577392578125, -0.586395263671875, -0.5670166015625, -0.547637939453125, -0.52825927734375, -0.508880615234375, -0.489501953125, -0.470123291015625, -0.45074462890625, -0.431365966796875, -0.4119873046875, -0.392608642578125, -0.37322998046875, -0.353851318359375, -0.33447265625, -0.315093994140625, -0.29571533203125, -0.276336669921875, -0.2569580078125, -0.237579345703125, -0.21820068359375, -0.198822021484375, -0.179443359375, -0.160064697265625, -0.14068603515625, -0.121307373046875, -0.1019287109375, -0.082550048828125, -0.06317138671875, -0.043792724609375, -0.0244140625, -0.005035400390625, 0.01434326171875, 0.033721923828125, 0.0531005859375, 0.072479248046875, 0.09185791015625, 0.111236572265625, 0.130615234375, 0.149993896484375, 0.16937255859375, 0.188751220703125, 0.2081298828125, 0.227508544921875, 0.24688720703125, 0.266265869140625, 0.28564453125, 0.305023193359375, 0.32440185546875, 0.343780517578125, 0.3631591796875, 0.382537841796875, 0.40191650390625, 0.421295166015625, 0.440673828125, 0.460052490234375, 0.47943115234375, 0.498809814453125, 0.5181884765625, 0.537567138671875, 0.55694580078125, 0.576324462890625, 0.595703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 8.0, 4.0, 10.0, 18.0, 19.0, 42.0, 42.0, 68.0, 67.0, 109.0, 159.0, 253.0, 439.0, 832.0, 2176.0, 7868.0, 42560.0, 386552.0, 533299.0, 59074.0, 9975.0, 2687.0, 974.0, 460.0, 275.0, 183.0, 109.0, 94.0, 51.0, 32.0, 31.0, 22.0, 14.0, 12.0, 10.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.359954833984375, -1.31756591796875, -1.275177001953125, -1.2327880859375, -1.190399169921875, -1.14801025390625, -1.105621337890625, -1.063232421875, -1.020843505859375, -0.97845458984375, -0.936065673828125, -0.8936767578125, -0.851287841796875, -0.80889892578125, -0.766510009765625, -0.72412109375, -0.681732177734375, -0.63934326171875, -0.596954345703125, -0.5545654296875, -0.512176513671875, -0.46978759765625, -0.427398681640625, -0.385009765625, -0.342620849609375, -0.30023193359375, -0.257843017578125, -0.2154541015625, -0.173065185546875, -0.13067626953125, -0.088287353515625, -0.0458984375, -0.003509521484375, 0.03887939453125, 0.081268310546875, 0.1236572265625, 0.166046142578125, 0.20843505859375, 0.250823974609375, 0.293212890625, 0.335601806640625, 0.37799072265625, 0.420379638671875, 0.4627685546875, 0.505157470703125, 0.54754638671875, 0.589935302734375, 0.63232421875, 0.674713134765625, 0.71710205078125, 0.759490966796875, 0.8018798828125, 0.844268798828125, 0.88665771484375, 0.929046630859375, 0.971435546875, 1.013824462890625, 1.05621337890625, 1.098602294921875, 1.1409912109375, 1.183380126953125, 1.22576904296875, 1.268157958984375, 1.310546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 7.0, 10.0, 12.0, 11.0, 10.0, 15.0, 24.0, 23.0, 25.0, 37.0, 31.0, 28.0, 41.0, 43.0, 35.0, 65.0, 54.0, 45.0, 56.0, 46.0, 58.0, 48.0, 38.0, 43.0, 37.0, 28.0, 30.0, 16.0, 16.0, 5.0, 12.0, 12.0, 13.0, 10.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6572265625, -1.610321044921875, -1.56341552734375, -1.516510009765625, -1.4696044921875, -1.422698974609375, -1.37579345703125, -1.328887939453125, -1.281982421875, -1.235076904296875, -1.18817138671875, -1.141265869140625, -1.0943603515625, -1.047454833984375, -1.00054931640625, -0.953643798828125, -0.90673828125, -0.859832763671875, -0.81292724609375, -0.766021728515625, -0.7191162109375, -0.672210693359375, -0.62530517578125, -0.578399658203125, -0.531494140625, -0.484588623046875, -0.43768310546875, -0.390777587890625, -0.3438720703125, -0.296966552734375, -0.25006103515625, -0.203155517578125, -0.15625, -0.109344482421875, -0.06243896484375, -0.015533447265625, 0.0313720703125, 0.078277587890625, 0.12518310546875, 0.172088623046875, 0.218994140625, 0.265899658203125, 0.31280517578125, 0.359710693359375, 0.4066162109375, 0.453521728515625, 0.50042724609375, 0.547332763671875, 0.59423828125, 0.641143798828125, 0.68804931640625, 0.734954833984375, 0.7818603515625, 0.828765869140625, 0.87567138671875, 0.922576904296875, 0.969482421875, 1.016387939453125, 1.06329345703125, 1.110198974609375, 1.1571044921875, 1.204010009765625, 1.25091552734375, 1.297821044921875, 1.3447265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 11.0, 30.0, 44.0, 148.0, 708.0, 8281.0, 1005315.0, 32505.0, 1160.0, 260.0, 53.0, 25.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4423828125, -1.40301513671875, -1.3636474609375, -1.32427978515625, -1.284912109375, -1.24554443359375, -1.2061767578125, -1.16680908203125, -1.12744140625, -1.08807373046875, -1.0487060546875, -1.00933837890625, -0.969970703125, -0.93060302734375, -0.8912353515625, -0.85186767578125, -0.8125, -0.77313232421875, -0.7337646484375, -0.69439697265625, -0.655029296875, -0.61566162109375, -0.5762939453125, -0.53692626953125, -0.49755859375, -0.45819091796875, -0.4188232421875, -0.37945556640625, -0.340087890625, -0.30072021484375, -0.2613525390625, -0.22198486328125, -0.1826171875, -0.14324951171875, -0.1038818359375, -0.06451416015625, -0.025146484375, 0.01422119140625, 0.0535888671875, 0.09295654296875, 0.13232421875, 0.17169189453125, 0.2110595703125, 0.25042724609375, 0.289794921875, 0.32916259765625, 0.3685302734375, 0.40789794921875, 0.447265625, 0.48663330078125, 0.5260009765625, 0.56536865234375, 0.604736328125, 0.64410400390625, 0.6834716796875, 0.72283935546875, 0.76220703125, 0.80157470703125, 0.8409423828125, 0.88031005859375, 0.919677734375, 0.95904541015625, 0.9984130859375, 1.03778076171875, 1.0771484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 12.0, 10.0, 17.0, 23.0, 32.0, 66.0, 94.0, 158.0, 213.0, 145.0, 77.0, 40.0, 32.0, 23.0, 15.0, 11.0, 6.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014197826385498047, -0.00013698451220989227, -0.00013199076056480408, -0.00012699700891971588, -0.00012200325727462769, -0.00011700950562953949, -0.0001120157539844513, -0.0001070220023393631, -0.0001020282506942749, -9.70344990491867e-05, -9.204074740409851e-05, -8.704699575901031e-05, -8.205324411392212e-05, -7.705949246883392e-05, -7.206574082374573e-05, -6.707198917865753e-05, -6.207823753356934e-05, -5.708448588848114e-05, -5.2090734243392944e-05, -4.709698259830475e-05, -4.210323095321655e-05, -3.710947930812836e-05, -3.211572766304016e-05, -2.7121976017951965e-05, -2.212822437286377e-05, -1.7134472727775574e-05, -1.2140721082687378e-05, -7.146969437599182e-06, -2.1532177925109863e-06, 2.8405338525772095e-06, 7.834285497665405e-06, 1.2828037142753601e-05, 1.7821788787841797e-05, 2.2815540432929993e-05, 2.780929207801819e-05, 3.2803043723106384e-05, 3.779679536819458e-05, 4.2790547013282776e-05, 4.778429865837097e-05, 5.277805030345917e-05, 5.777180194854736e-05, 6.276555359363556e-05, 6.775930523872375e-05, 7.275305688381195e-05, 7.774680852890015e-05, 8.274056017398834e-05, 8.773431181907654e-05, 9.272806346416473e-05, 9.772181510925293e-05, 0.00010271556675434113, 0.00010770931839942932, 0.00011270307004451752, 0.00011769682168960571, 0.0001226905733346939, 0.0001276843249797821, 0.0001326780766248703, 0.0001376718282699585, 0.0001426655799150467, 0.0001476593315601349, 0.00015265308320522308, 0.00015764683485031128, 0.00016264058649539948, 0.00016763433814048767, 0.00017262808978557587, 0.00017762184143066406]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 13.0, 29.0, 52.0, 118.0, 353.0, 1909.0, 307127.0, 735673.0, 2589.0, 424.0, 131.0, 56.0, 37.0, 17.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9609375, -0.9192657470703125, -0.877593994140625, -0.8359222412109375, -0.79425048828125, -0.7525787353515625, -0.710906982421875, -0.6692352294921875, -0.6275634765625, -0.5858917236328125, -0.544219970703125, -0.5025482177734375, -0.46087646484375, -0.4192047119140625, -0.377532958984375, -0.3358612060546875, -0.294189453125, -0.2525177001953125, -0.210845947265625, -0.1691741943359375, -0.12750244140625, -0.0858306884765625, -0.044158935546875, -0.0024871826171875, 0.0391845703125, 0.0808563232421875, 0.122528076171875, 0.1641998291015625, 0.20587158203125, 0.2475433349609375, 0.289215087890625, 0.3308868408203125, 0.37255859375, 0.4142303466796875, 0.455902099609375, 0.4975738525390625, 0.53924560546875, 0.5809173583984375, 0.622589111328125, 0.6642608642578125, 0.7059326171875, 0.7476043701171875, 0.789276123046875, 0.8309478759765625, 0.87261962890625, 0.9142913818359375, 0.955963134765625, 0.9976348876953125, 1.039306640625, 1.0809783935546875, 1.122650146484375, 1.1643218994140625, 1.20599365234375, 1.2476654052734375, 1.289337158203125, 1.3310089111328125, 1.3726806640625, 1.4143524169921875, 1.456024169921875, 1.4976959228515625, 1.53936767578125, 1.5810394287109375, 1.622711181640625, 1.6643829345703125, 1.7060546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 15.0, 19.0, 35.0, 74.0, 200.0, 299.0, 204.0, 87.0, 41.0, 24.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6896591186523438, -0.6591033935546875, -0.6285476684570312, -0.597991943359375, -0.5674362182617188, -0.5368804931640625, -0.5063247680664062, -0.47576904296875, -0.44521331787109375, -0.4146575927734375, -0.38410186767578125, -0.353546142578125, -0.32299041748046875, -0.2924346923828125, -0.26187896728515625, -0.2313232421875, -0.20076751708984375, -0.1702117919921875, -0.13965606689453125, -0.109100341796875, -0.07854461669921875, -0.0479888916015625, -0.01743316650390625, 0.01312255859375, 0.04367828369140625, 0.0742340087890625, 0.10478973388671875, 0.135345458984375, 0.16590118408203125, 0.1964569091796875, 0.22701263427734375, 0.257568359375, 0.28812408447265625, 0.3186798095703125, 0.34923553466796875, 0.379791259765625, 0.41034698486328125, 0.4409027099609375, 0.47145843505859375, 0.50201416015625, 0.5325698852539062, 0.5631256103515625, 0.5936813354492188, 0.624237060546875, 0.6547927856445312, 0.6853485107421875, 0.7159042358398438, 0.7464599609375, 0.7770156860351562, 0.8075714111328125, 0.8381271362304688, 0.868682861328125, 0.8992385864257812, 0.9297943115234375, 0.9603500366210938, 0.99090576171875, 1.0214614868164062, 1.0520172119140625, 1.0825729370117188, 1.113128662109375, 1.1436843872070312, 1.1742401123046875, 1.2047958374023438, 1.2353515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 16.0, 21.0, 42.0, 171.0, 307.0, 257.0, 112.0, 53.0, 18.0, 8.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.163463592529297, -11.769636154174805, -11.375809669494629, -10.981982231140137, -10.588154792785645, -10.194328308105469, -9.800500869750977, -9.406673431396484, -9.012845993041992, -8.6190185546875, -8.225192070007324, -7.831364631652832, -7.43753719329834, -7.043710231781006, -6.649883270263672, -6.25605583190918, -5.862229347229004, -5.46840238571167, -5.074574947357178, -4.680747985839844, -4.286920547485352, -3.8930935859680176, -3.4992666244506836, -3.1054394245147705, -2.7116122245788574, -2.3177850246429443, -1.9239579439163208, -1.5301308631896973, -1.1363036632537842, -0.7424764633178711, -0.3486495018005371, 0.04517769813537598, 0.43900489807128906, 0.8328320384025574, 1.2266591787338257, 1.6204862594604492, 2.0143134593963623, 2.4081406593322754, 2.8019676208496094, 3.1957948207855225, 3.5896220207214355, 3.9834492206573486, 4.377276420593262, 4.771103382110596, 5.16493034362793, 5.558757781982422, 5.952584743499756, 6.34641170501709, 6.740239143371582, 7.134066104888916, 7.527893543243408, 7.921720504760742, 8.315547943115234, 8.709375381469727, 9.103201866149902, 9.497029304504395, 9.89085578918457, 10.284683227539062, 10.678509712219238, 11.07233715057373, 11.466164588928223, 11.859991073608398, 12.25381851196289, 12.647645950317383, 13.041473388671875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 11.0, 10.0, 12.0, 14.0, 14.0, 18.0, 22.0, 21.0, 22.0, 36.0, 23.0, 51.0, 51.0, 58.0, 49.0, 52.0, 50.0, 50.0, 44.0, 51.0, 43.0, 34.0, 49.0, 34.0, 35.0, 24.0, 16.0, 20.0, 16.0, 10.0, 10.0, 12.0, 10.0, 4.0, 11.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0], "bins": [-9.796653747558594, -9.548315048217773, -9.299976348876953, -9.05163860321045, -8.803299903869629, -8.554961204528809, -8.306622505187988, -8.058284759521484, -7.809946060180664, -7.561607360839844, -7.313269138336182, -7.064930438995361, -6.816592216491699, -6.568253517150879, -6.319914817810059, -6.0715765953063965, -5.823237895965576, -5.574899196624756, -5.326560974121094, -5.078222274780273, -4.829884052276611, -4.581545352935791, -4.333207130432129, -4.084868431091309, -3.8365299701690674, -3.588191509246826, -3.339853048324585, -3.0915145874023438, -2.8431758880615234, -2.5948376655578613, -2.346498966217041, -2.0981605052948, -1.8498215675354004, -1.6014831066131592, -1.353144645690918, -1.1048060655593872, -0.856467604637146, -0.6081291437149048, -0.359790563583374, -0.11145210266113281, 0.1368863582611084, 0.385224848985672, 0.6335633397102356, 0.8819018602371216, 1.1302403211593628, 1.378578782081604, 1.6269173622131348, 1.875255823135376, 2.123594284057617, 2.3719327449798584, 2.6202712059020996, 2.86860990524292, 3.116948127746582, 3.3652868270874023, 3.6136252880096436, 3.8619637489318848, 4.110301971435547, 4.358640670776367, 4.606978893280029, 4.85531759262085, 5.103655815124512, 5.351994514465332, 5.600333213806152, 5.8486714363098145, 6.097010135650635]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 0.0, 5.0, 2.0, 5.0, 7.0, 9.0, 12.0, 6.0, 19.0, 17.0, 27.0, 37.0, 41.0, 54.0, 57.0, 100.0, 139.0, 273.0, 392.0, 734.0, 1718.0, 3988.0, 11620.0, 54090.0, 3711002.0, 370534.0, 26397.0, 7184.0, 2753.0, 1236.0, 668.0, 375.0, 197.0, 144.0, 117.0, 69.0, 54.0, 42.0, 34.0, 22.0, 30.0, 17.0, 8.0, 9.0, 7.0, 5.0, 5.0, 7.0, 10.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.1982421875, -1.1593475341796875, -1.120452880859375, -1.0815582275390625, -1.04266357421875, -1.0037689208984375, -0.964874267578125, -0.9259796142578125, -0.8870849609375, -0.8481903076171875, -0.809295654296875, -0.7704010009765625, -0.73150634765625, -0.6926116943359375, -0.653717041015625, -0.6148223876953125, -0.575927734375, -0.5370330810546875, -0.498138427734375, -0.4592437744140625, -0.42034912109375, -0.3814544677734375, -0.342559814453125, -0.3036651611328125, -0.2647705078125, -0.2258758544921875, -0.186981201171875, -0.1480865478515625, -0.10919189453125, -0.0702972412109375, -0.031402587890625, 0.0074920654296875, 0.04638671875, 0.0852813720703125, 0.124176025390625, 0.1630706787109375, 0.20196533203125, 0.2408599853515625, 0.279754638671875, 0.3186492919921875, 0.3575439453125, 0.3964385986328125, 0.435333251953125, 0.4742279052734375, 0.51312255859375, 0.5520172119140625, 0.590911865234375, 0.6298065185546875, 0.668701171875, 0.7075958251953125, 0.746490478515625, 0.7853851318359375, 0.82427978515625, 0.8631744384765625, 0.902069091796875, 0.9409637451171875, 0.9798583984375, 1.0187530517578125, 1.057647705078125, 1.0965423583984375, 1.13543701171875, 1.1743316650390625, 1.213226318359375, 1.2521209716796875, 1.291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 11.0, 31.0, 56.0, 60.0, 68.0, 76.0, 117.0, 118.0, 109.0, 119.0, 80.0, 50.0, 32.0, 22.0, 13.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7685546875, -0.746856689453125, -0.72515869140625, -0.703460693359375, -0.6817626953125, -0.660064697265625, -0.63836669921875, -0.616668701171875, -0.594970703125, -0.573272705078125, -0.55157470703125, -0.529876708984375, -0.5081787109375, -0.486480712890625, -0.46478271484375, -0.443084716796875, -0.42138671875, -0.399688720703125, -0.37799072265625, -0.356292724609375, -0.3345947265625, -0.312896728515625, -0.29119873046875, -0.269500732421875, -0.247802734375, -0.226104736328125, -0.20440673828125, -0.182708740234375, -0.1610107421875, -0.139312744140625, -0.11761474609375, -0.095916748046875, -0.07421875, -0.052520751953125, -0.03082275390625, -0.009124755859375, 0.0125732421875, 0.034271240234375, 0.05596923828125, 0.077667236328125, 0.099365234375, 0.121063232421875, 0.14276123046875, 0.164459228515625, 0.1861572265625, 0.207855224609375, 0.22955322265625, 0.251251220703125, 0.27294921875, 0.294647216796875, 0.31634521484375, 0.338043212890625, 0.3597412109375, 0.381439208984375, 0.40313720703125, 0.424835205078125, 0.446533203125, 0.468231201171875, 0.48992919921875, 0.511627197265625, 0.5333251953125, 0.555023193359375, 0.57672119140625, 0.598419189453125, 0.6201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 13.0, 35.0, 71.0, 120.0, 304.0, 705.0, 2023.0, 13032.0, 3853043.0, 315566.0, 6800.0, 1480.0, 603.0, 254.0, 118.0, 61.0, 30.0, 11.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.359375, -2.289703369140625, -2.22003173828125, -2.150360107421875, -2.0806884765625, -2.011016845703125, -1.94134521484375, -1.871673583984375, -1.802001953125, -1.732330322265625, -1.66265869140625, -1.592987060546875, -1.5233154296875, -1.453643798828125, -1.38397216796875, -1.314300537109375, -1.24462890625, -1.174957275390625, -1.10528564453125, -1.035614013671875, -0.9659423828125, -0.896270751953125, -0.82659912109375, -0.756927490234375, -0.687255859375, -0.617584228515625, -0.54791259765625, -0.478240966796875, -0.4085693359375, -0.338897705078125, -0.26922607421875, -0.199554443359375, -0.1298828125, -0.060211181640625, 0.00946044921875, 0.079132080078125, 0.1488037109375, 0.218475341796875, 0.28814697265625, 0.357818603515625, 0.427490234375, 0.497161865234375, 0.56683349609375, 0.636505126953125, 0.7061767578125, 0.775848388671875, 0.84552001953125, 0.915191650390625, 0.98486328125, 1.054534912109375, 1.12420654296875, 1.193878173828125, 1.2635498046875, 1.333221435546875, 1.40289306640625, 1.472564697265625, 1.542236328125, 1.611907958984375, 1.68157958984375, 1.751251220703125, 1.8209228515625, 1.890594482421875, 1.96026611328125, 2.029937744140625, 2.099609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 10.0, 17.0, 33.0, 49.0, 167.0, 1073.0, 2208.0, 298.0, 89.0, 45.0, 22.0, 20.0, 9.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5113983154296875, -0.491058349609375, -0.4707183837890625, -0.45037841796875, -0.4300384521484375, -0.409698486328125, -0.3893585205078125, -0.3690185546875, -0.3486785888671875, -0.328338623046875, -0.3079986572265625, -0.28765869140625, -0.2673187255859375, -0.246978759765625, -0.2266387939453125, -0.206298828125, -0.1859588623046875, -0.165618896484375, -0.1452789306640625, -0.12493896484375, -0.1045989990234375, -0.084259033203125, -0.0639190673828125, -0.0435791015625, -0.0232391357421875, -0.002899169921875, 0.0174407958984375, 0.03778076171875, 0.0581207275390625, 0.078460693359375, 0.0988006591796875, 0.119140625, 0.1394805908203125, 0.159820556640625, 0.1801605224609375, 0.20050048828125, 0.2208404541015625, 0.241180419921875, 0.2615203857421875, 0.2818603515625, 0.3022003173828125, 0.322540283203125, 0.3428802490234375, 0.36322021484375, 0.3835601806640625, 0.403900146484375, 0.4242401123046875, 0.444580078125, 0.4649200439453125, 0.485260009765625, 0.5055999755859375, 0.52593994140625, 0.5462799072265625, 0.566619873046875, 0.5869598388671875, 0.6072998046875, 0.6276397705078125, 0.647979736328125, 0.6683197021484375, 0.68865966796875, 0.7089996337890625, 0.729339599609375, 0.7496795654296875, 0.77001953125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 22.0, 96.0, 328.0, 355.0, 148.0, 38.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1776537895202637, -3.0316455364227295, -2.885637044906616, -2.739628791809082, -2.5936203002929688, -2.4476120471954346, -2.3016037940979004, -2.155595302581787, -2.009587049484253, -1.8635786771774292, -1.7175703048706055, -1.5715620517730713, -1.4255536794662476, -1.2795453071594238, -1.1335370540618896, -0.9875286817550659, -0.8415203094482422, -0.6955119371414185, -0.5495036244392395, -0.40349528193473816, -0.2574869394302368, -0.11147856712341309, 0.03452974557876587, 0.18053805828094482, 0.32654643058776855, 0.4725547730922699, 0.6185631155967712, 0.7645714282989502, 0.9105798006057739, 1.0565881729125977, 1.2025964260101318, 1.3486047983169556, 1.4946131706237793, 1.640621542930603, 1.7866299152374268, 1.932638168334961, 2.078646659851074, 2.2246549129486084, 2.3706631660461426, 2.516671657562256, 2.66267991065979, 2.808688163757324, 2.9546966552734375, 3.1007049083709717, 3.246713161468506, 3.392721652984619, 3.5387299060821533, 3.6847381591796875, 3.830746650695801, 3.976754903793335, 4.122763156890869, 4.268771648406982, 4.414780139923096, 4.560788154602051, 4.706796646118164, 4.852805137634277, 4.998813629150391, 5.144822120666504, 5.290830135345459, 5.436838626861572, 5.5828471183776855, 5.728855133056641, 5.874863624572754, 6.020872116088867, 6.166880130767822]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 13.0, 23.0, 22.0, 36.0, 56.0, 43.0, 58.0, 80.0, 84.0, 74.0, 74.0, 66.0, 61.0, 70.0, 52.0, 44.0, 47.0, 36.0, 17.0, 17.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9207372665405273, -1.852354645729065, -1.783972144126892, -1.7155895233154297, -1.6472070217132568, -1.5788244009017944, -1.510441780090332, -1.4420592784881592, -1.3736766576766968, -1.3052940368652344, -1.2369115352630615, -1.1685289144515991, -1.1001462936401367, -1.0317637920379639, -0.9633811712265015, -0.8949986100196838, -0.8266160488128662, -0.7582334876060486, -0.689850926399231, -0.6214683055877686, -0.5530857443809509, -0.4847031831741333, -0.4163205921649933, -0.34793800115585327, -0.27955543994903564, -0.21117286384105682, -0.142790287733078, -0.07440771162509918, -0.006025135517120361, 0.062357425689697266, 0.13074001669883728, 0.1991226077079773, 0.267505407333374, 0.33588796854019165, 0.40427055954933167, 0.4726531505584717, 0.5410357117652893, 0.6094182729721069, 0.6778008937835693, 0.746183454990387, 0.8145660161972046, 0.8829485774040222, 0.9513311386108398, 1.0197137594223022, 1.0880963802337646, 1.1564788818359375, 1.2248615026474, 1.2932441234588623, 1.3616266250610352, 1.4300092458724976, 1.4983917474746704, 1.5667743682861328, 1.6351568698883057, 1.703539490699768, 1.7719221115112305, 1.8403046131134033, 1.9086872339248657, 1.9770698547363281, 2.045452356338501, 2.113834857940674, 2.182217597961426, 2.2506000995635986, 2.3189826011657715, 2.3873653411865234, 2.4557478427886963]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 21.0, 42.0, 132.0, 273.0, 921.0, 4979.0, 184829.0, 840916.0, 14082.0, 1622.0, 440.0, 167.0, 53.0, 36.0, 9.0, 7.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.63671875, -3.52716064453125, -3.4176025390625, -3.30804443359375, -3.198486328125, -3.08892822265625, -2.9793701171875, -2.86981201171875, -2.76025390625, -2.65069580078125, -2.5411376953125, -2.43157958984375, -2.322021484375, -2.21246337890625, -2.1029052734375, -1.99334716796875, -1.8837890625, -1.77423095703125, -1.6646728515625, -1.55511474609375, -1.445556640625, -1.33599853515625, -1.2264404296875, -1.11688232421875, -1.00732421875, -0.89776611328125, -0.7882080078125, -0.67864990234375, -0.569091796875, -0.45953369140625, -0.3499755859375, -0.24041748046875, -0.130859375, -0.02130126953125, 0.0882568359375, 0.19781494140625, 0.307373046875, 0.41693115234375, 0.5264892578125, 0.63604736328125, 0.74560546875, 0.85516357421875, 0.9647216796875, 1.07427978515625, 1.183837890625, 1.29339599609375, 1.4029541015625, 1.51251220703125, 1.6220703125, 1.73162841796875, 1.8411865234375, 1.95074462890625, 2.060302734375, 2.16986083984375, 2.2794189453125, 2.38897705078125, 2.49853515625, 2.60809326171875, 2.7176513671875, 2.82720947265625, 2.936767578125, 3.04632568359375, 3.1558837890625, 3.26544189453125, 3.375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 11.0, 9.0, 25.0, 39.0, 62.0, 62.0, 81.0, 93.0, 125.0, 126.0, 109.0, 93.0, 59.0, 42.0, 25.0, 15.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.80517578125, -0.782684326171875, -0.76019287109375, -0.737701416015625, -0.7152099609375, -0.692718505859375, -0.67022705078125, -0.647735595703125, -0.625244140625, -0.602752685546875, -0.58026123046875, -0.557769775390625, -0.5352783203125, -0.512786865234375, -0.49029541015625, -0.467803955078125, -0.4453125, -0.422821044921875, -0.40032958984375, -0.377838134765625, -0.3553466796875, -0.332855224609375, -0.31036376953125, -0.287872314453125, -0.265380859375, -0.242889404296875, -0.22039794921875, -0.197906494140625, -0.1754150390625, -0.152923583984375, -0.13043212890625, -0.107940673828125, -0.08544921875, -0.062957763671875, -0.04046630859375, -0.017974853515625, 0.0045166015625, 0.027008056640625, 0.04949951171875, 0.071990966796875, 0.094482421875, 0.116973876953125, 0.13946533203125, 0.161956787109375, 0.1844482421875, 0.206939697265625, 0.22943115234375, 0.251922607421875, 0.2744140625, 0.296905517578125, 0.31939697265625, 0.341888427734375, 0.3643798828125, 0.386871337890625, 0.40936279296875, 0.431854248046875, 0.454345703125, 0.476837158203125, 0.49932861328125, 0.521820068359375, 0.5443115234375, 0.566802978515625, 0.58929443359375, 0.611785888671875, 0.63427734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 8.0, 12.0, 11.0, 15.0, 20.0, 30.0, 38.0, 59.0, 65.0, 106.0, 136.0, 211.0, 423.0, 1118.0, 3359.0, 13662.0, 87528.0, 663825.0, 238887.0, 29776.0, 6022.0, 1737.0, 666.0, 307.0, 163.0, 108.0, 67.0, 52.0, 42.0, 32.0, 12.0, 16.0, 7.0, 11.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.023681640625, -0.98388671875, -0.944091796875, -0.904296875, -0.864501953125, -0.82470703125, -0.784912109375, -0.7451171875, -0.705322265625, -0.66552734375, -0.625732421875, -0.5859375, -0.546142578125, -0.50634765625, -0.466552734375, -0.4267578125, -0.386962890625, -0.34716796875, -0.307373046875, -0.267578125, -0.227783203125, -0.18798828125, -0.148193359375, -0.1083984375, -0.068603515625, -0.02880859375, 0.010986328125, 0.05078125, 0.090576171875, 0.13037109375, 0.170166015625, 0.2099609375, 0.249755859375, 0.28955078125, 0.329345703125, 0.369140625, 0.408935546875, 0.44873046875, 0.488525390625, 0.5283203125, 0.568115234375, 0.60791015625, 0.647705078125, 0.6875, 0.727294921875, 0.76708984375, 0.806884765625, 0.8466796875, 0.886474609375, 0.92626953125, 0.966064453125, 1.005859375, 1.045654296875, 1.08544921875, 1.125244140625, 1.1650390625, 1.204833984375, 1.24462890625, 1.284423828125, 1.32421875, 1.364013671875, 1.40380859375, 1.443603515625, 1.4833984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 10.0, 4.0, 12.0, 17.0, 18.0, 17.0, 26.0, 24.0, 37.0, 30.0, 26.0, 23.0, 33.0, 39.0, 53.0, 39.0, 31.0, 57.0, 31.0, 50.0, 47.0, 39.0, 38.0, 36.0, 30.0, 27.0, 34.0, 18.0, 16.0, 13.0, 17.0, 12.0, 14.0, 11.0, 10.0, 8.0, 4.0, 9.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.216796875, -1.178497314453125, -1.14019775390625, -1.101898193359375, -1.0635986328125, -1.025299072265625, -0.98699951171875, -0.948699951171875, -0.910400390625, -0.872100830078125, -0.83380126953125, -0.795501708984375, -0.7572021484375, -0.718902587890625, -0.68060302734375, -0.642303466796875, -0.60400390625, -0.565704345703125, -0.52740478515625, -0.489105224609375, -0.4508056640625, -0.412506103515625, -0.37420654296875, -0.335906982421875, -0.297607421875, -0.259307861328125, -0.22100830078125, -0.182708740234375, -0.1444091796875, -0.106109619140625, -0.06781005859375, -0.029510498046875, 0.0087890625, 0.047088623046875, 0.08538818359375, 0.123687744140625, 0.1619873046875, 0.200286865234375, 0.23858642578125, 0.276885986328125, 0.315185546875, 0.353485107421875, 0.39178466796875, 0.430084228515625, 0.4683837890625, 0.506683349609375, 0.54498291015625, 0.583282470703125, 0.62158203125, 0.659881591796875, 0.69818115234375, 0.736480712890625, 0.7747802734375, 0.813079833984375, 0.85137939453125, 0.889678955078125, 0.927978515625, 0.966278076171875, 1.00457763671875, 1.042877197265625, 1.0811767578125, 1.119476318359375, 1.15777587890625, 1.196075439453125, 1.234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 12.0, 15.0, 24.0, 40.0, 86.0, 164.0, 347.0, 947.0, 3354.0, 34046.0, 872948.0, 127775.0, 6474.0, 1352.0, 471.0, 215.0, 91.0, 67.0, 36.0, 25.0, 13.0, 8.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6648483276367188, -0.6431732177734375, -0.6214981079101562, -0.599822998046875, -0.5781478881835938, -0.5564727783203125, -0.5347976684570312, -0.51312255859375, -0.49144744873046875, -0.4697723388671875, -0.44809722900390625, -0.426422119140625, -0.40474700927734375, -0.3830718994140625, -0.36139678955078125, -0.3397216796875, -0.31804656982421875, -0.2963714599609375, -0.27469635009765625, -0.253021240234375, -0.23134613037109375, -0.2096710205078125, -0.18799591064453125, -0.16632080078125, -0.14464569091796875, -0.1229705810546875, -0.10129547119140625, -0.079620361328125, -0.05794525146484375, -0.0362701416015625, -0.01459503173828125, 0.007080078125, 0.02875518798828125, 0.0504302978515625, 0.07210540771484375, 0.093780517578125, 0.11545562744140625, 0.1371307373046875, 0.15880584716796875, 0.18048095703125, 0.20215606689453125, 0.2238311767578125, 0.24550628662109375, 0.267181396484375, 0.28885650634765625, 0.3105316162109375, 0.33220672607421875, 0.3538818359375, 0.37555694580078125, 0.3972320556640625, 0.41890716552734375, 0.440582275390625, 0.46225738525390625, 0.4839324951171875, 0.5056076049804688, 0.52728271484375, 0.5489578247070312, 0.5706329345703125, 0.5923080444335938, 0.613983154296875, 0.6356582641601562, 0.6573333740234375, 0.6790084838867188, 0.70068359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 8.0, 15.0, 6.0, 4.0, 14.0, 11.0, 17.0, 19.0, 36.0, 56.0, 104.0, 154.0, 195.0, 101.0, 69.0, 35.0, 25.0, 18.0, 20.0, 13.0, 13.0, 9.0, 6.0, 5.0, 7.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001609325408935547, -0.000155741348862648, -0.00015055015683174133, -0.00014535896480083466, -0.00014016777276992798, -0.0001349765807390213, -0.00012978538870811462, -0.00012459419667720795, -0.00011940300464630127, -0.00011421181261539459, -0.00010902062058448792, -0.00010382942855358124, -9.863823652267456e-05, -9.344704449176788e-05, -8.82558524608612e-05, -8.306466042995453e-05, -7.787346839904785e-05, -7.268227636814117e-05, -6.74910843372345e-05, -6.229989230632782e-05, -5.710870027542114e-05, -5.1917508244514465e-05, -4.672631621360779e-05, -4.153512418270111e-05, -3.6343932151794434e-05, -3.1152740120887756e-05, -2.596154808998108e-05, -2.0770356059074402e-05, -1.5579164028167725e-05, -1.0387971997261047e-05, -5.19677996635437e-06, -5.587935447692871e-09, 5.185604095458984e-06, 1.0376796126365662e-05, 1.556798815727234e-05, 2.0759180188179016e-05, 2.5950372219085693e-05, 3.114156424999237e-05, 3.633275628089905e-05, 4.1523948311805725e-05, 4.67151403427124e-05, 5.190633237361908e-05, 5.709752440452576e-05, 6.228871643543243e-05, 6.747990846633911e-05, 7.267110049724579e-05, 7.786229252815247e-05, 8.305348455905914e-05, 8.824467658996582e-05, 9.34358686208725e-05, 9.862706065177917e-05, 0.00010381825268268585, 0.00010900944471359253, 0.0001142006367444992, 0.00011939182877540588, 0.00012458302080631256, 0.00012977421283721924, 0.00013496540486812592, 0.0001401565968990326, 0.00014534778892993927, 0.00015053898096084595, 0.00015573017299175262, 0.0001609213650226593, 0.00016611255705356598, 0.00017130374908447266]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 2.0, 2.0, 10.0, 9.0, 17.0, 18.0, 21.0, 35.0, 53.0, 86.0, 236.0, 522.0, 1642.0, 6999.0, 72310.0, 849656.0, 105496.0, 8448.0, 1829.0, 606.0, 250.0, 110.0, 69.0, 25.0, 31.0, 17.0, 14.0, 6.0, 5.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4173316955566406, -0.40033721923828125, -0.3833427429199219, -0.3663482666015625, -0.3493537902832031, -0.33235931396484375, -0.3153648376464844, -0.298370361328125, -0.2813758850097656, -0.26438140869140625, -0.24738693237304688, -0.2303924560546875, -0.21339797973632812, -0.19640350341796875, -0.17940902709960938, -0.16241455078125, -0.14542007446289062, -0.12842559814453125, -0.11143112182617188, -0.0944366455078125, -0.07744216918945312, -0.06044769287109375, -0.043453216552734375, -0.026458740234375, -0.009464263916015625, 0.00753021240234375, 0.024524688720703125, 0.0415191650390625, 0.058513641357421875, 0.07550811767578125, 0.09250259399414062, 0.1094970703125, 0.12649154663085938, 0.14348602294921875, 0.16048049926757812, 0.1774749755859375, 0.19446945190429688, 0.21146392822265625, 0.22845840454101562, 0.245452880859375, 0.2624473571777344, 0.27944183349609375, 0.2964363098144531, 0.3134307861328125, 0.3304252624511719, 0.34741973876953125, 0.3644142150878906, 0.38140869140625, 0.3984031677246094, 0.41539764404296875, 0.4323921203613281, 0.4493865966796875, 0.4663810729980469, 0.48337554931640625, 0.5003700256347656, 0.517364501953125, 0.5343589782714844, 0.5513534545898438, 0.5683479309082031, 0.5853424072265625, 0.6023368835449219, 0.6193313598632812, 0.6363258361816406, 0.6533203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 10.0, 20.0, 26.0, 31.0, 57.0, 64.0, 94.0, 139.0, 124.0, 121.0, 80.0, 58.0, 35.0, 41.0, 19.0, 15.0, 12.0, 8.0, 10.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3400077819824219, -0.32479095458984375, -0.3095741271972656, -0.2943572998046875, -0.2791404724121094, -0.26392364501953125, -0.24870681762695312, -0.233489990234375, -0.21827316284179688, -0.20305633544921875, -0.18783950805664062, -0.1726226806640625, -0.15740585327148438, -0.14218902587890625, -0.12697219848632812, -0.11175537109375, -0.09653854370117188, -0.08132171630859375, -0.06610488891601562, -0.0508880615234375, -0.035671234130859375, -0.02045440673828125, -0.005237579345703125, 0.009979248046875, 0.025196075439453125, 0.04041290283203125, 0.055629730224609375, 0.0708465576171875, 0.08606338500976562, 0.10128021240234375, 0.11649703979492188, 0.1317138671875, 0.14693069458007812, 0.16214752197265625, 0.17736434936523438, 0.1925811767578125, 0.20779800415039062, 0.22301483154296875, 0.23823165893554688, 0.253448486328125, 0.2686653137207031, 0.28388214111328125, 0.2990989685058594, 0.3143157958984375, 0.3295326232910156, 0.34474945068359375, 0.3599662780761719, 0.37518310546875, 0.3903999328613281, 0.40561676025390625, 0.4208335876464844, 0.4360504150390625, 0.4512672424316406, 0.46648406982421875, 0.4817008972167969, 0.496917724609375, 0.5121345520019531, 0.5273513793945312, 0.5425682067871094, 0.5577850341796875, 0.5730018615722656, 0.5882186889648438, 0.6034355163574219, 0.61865234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 45.0, 533.0, 381.0, 44.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.19060516357422, -41.18220901489258, -40.17381286621094, -39.1654167175293, -38.157020568847656, -37.148624420166016, -36.140228271484375, -35.131832122802734, -34.123435974121094, -33.11503982543945, -32.10664367675781, -31.098247528076172, -30.08985137939453, -29.08145523071289, -28.07305908203125, -27.06466293334961, -26.056264877319336, -25.047868728637695, -24.039472579956055, -23.031076431274414, -22.022680282592773, -21.014284133911133, -20.00588607788086, -18.99748992919922, -17.989093780517578, -16.980697631835938, -15.972301483154297, -14.963905334472656, -13.955509185791016, -12.947113037109375, -11.938715934753418, -10.930319786071777, -9.921924591064453, -8.913528442382812, -7.905132293701172, -6.896735668182373, -5.888339519500732, -4.879943370819092, -3.871546745300293, -2.8631505966186523, -1.8547544479370117, -0.8463581800460815, 0.16203808784484863, 1.1704344749450684, 2.178830623626709, 3.1872267723083496, 4.195623397827148, 5.204019546508789, 6.21241569519043, 7.22081184387207, 8.229207992553711, 9.237604141235352, 10.246000289916992, 11.254396438598633, 12.26279354095459, 13.27118968963623, 14.279585838317871, 15.287981986999512, 16.29637908935547, 17.30477523803711, 18.31317138671875, 19.32156753540039, 20.32996368408203, 21.338359832763672, 22.346755981445312]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 11.0, 8.0, 17.0, 18.0, 13.0, 26.0, 24.0, 35.0, 25.0, 24.0, 32.0, 39.0, 45.0, 36.0, 36.0, 37.0, 43.0, 43.0, 47.0, 41.0, 37.0, 32.0, 40.0, 35.0, 34.0, 31.0, 33.0, 22.0, 13.0, 15.0, 23.0, 12.0, 13.0, 9.0, 9.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.6352081298828125, -6.434624195098877, -6.234039783477783, -6.033455848693848, -5.832871913909912, -5.632287979125977, -5.431703567504883, -5.231119632720947, -5.030535697937012, -4.829951763153076, -4.629367351531982, -4.428783416748047, -4.228199481964111, -4.027615547180176, -3.827031135559082, -3.6264472007751465, -3.4258627891540527, -3.225278615951538, -3.0246946811676025, -2.824110507965088, -2.6235265731811523, -2.4229423999786377, -2.222358226776123, -2.0217742919921875, -1.8211901187896729, -1.6206060647964478, -1.4200220108032227, -1.219437837600708, -1.018853783607483, -0.8182697296142578, -0.6176855564117432, -0.41710150241851807, -0.21651744842529297, -0.015933364629745483, 0.184650719165802, 0.3852348327636719, 0.585818886756897, 0.7864029407501221, 0.9869871139526367, 1.1875711679458618, 1.388155221939087, 1.588739275932312, 1.789323329925537, 1.9899075031280518, 2.1904916763305664, 2.391075611114502, 2.5916597843170166, 2.7922439575195312, 2.992827892303467, 3.1934120655059814, 3.393996000289917, 3.5945801734924316, 3.795164108276367, 3.995748281478882, 4.1963324546813965, 4.396916389465332, 4.597500801086426, 4.798084735870361, 4.998669147491455, 5.199253082275391, 5.399837017059326, 5.600420951843262, 5.8010053634643555, 6.001589298248291, 6.202173233032227]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 10.0, 15.0, 32.0, 46.0, 98.0, 134.0, 237.0, 571.0, 1589.0, 6611.0, 54836.0, 4068334.0, 52615.0, 6222.0, 1643.0, 623.0, 279.0, 147.0, 82.0, 51.0, 39.0, 22.0, 11.0, 14.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.39739990234375, -3.2928466796875, -3.18829345703125, -3.083740234375, -2.97918701171875, -2.8746337890625, -2.77008056640625, -2.66552734375, -2.56097412109375, -2.4564208984375, -2.35186767578125, -2.247314453125, -2.14276123046875, -2.0382080078125, -1.93365478515625, -1.8291015625, -1.72454833984375, -1.6199951171875, -1.51544189453125, -1.410888671875, -1.30633544921875, -1.2017822265625, -1.09722900390625, -0.99267578125, -0.88812255859375, -0.7835693359375, -0.67901611328125, -0.574462890625, -0.46990966796875, -0.3653564453125, -0.26080322265625, -0.15625, -0.05169677734375, 0.0528564453125, 0.15740966796875, 0.261962890625, 0.36651611328125, 0.4710693359375, 0.57562255859375, 0.68017578125, 0.78472900390625, 0.8892822265625, 0.99383544921875, 1.098388671875, 1.20294189453125, 1.3074951171875, 1.41204833984375, 1.5166015625, 1.62115478515625, 1.7257080078125, 1.83026123046875, 1.934814453125, 2.03936767578125, 2.1439208984375, 2.24847412109375, 2.35302734375, 2.45758056640625, 2.5621337890625, 2.66668701171875, 2.771240234375, 2.87579345703125, 2.9803466796875, 3.08489990234375, 3.189453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 7.0, 20.0, 28.0, 40.0, 64.0, 76.0, 80.0, 118.0, 106.0, 128.0, 104.0, 72.0, 53.0, 34.0, 21.0, 15.0, 10.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.82421875, -0.80096435546875, -0.7777099609375, -0.75445556640625, -0.731201171875, -0.70794677734375, -0.6846923828125, -0.66143798828125, -0.63818359375, -0.61492919921875, -0.5916748046875, -0.56842041015625, -0.545166015625, -0.52191162109375, -0.4986572265625, -0.47540283203125, -0.4521484375, -0.42889404296875, -0.4056396484375, -0.38238525390625, -0.359130859375, -0.33587646484375, -0.3126220703125, -0.28936767578125, -0.26611328125, -0.24285888671875, -0.2196044921875, -0.19635009765625, -0.173095703125, -0.14984130859375, -0.1265869140625, -0.10333251953125, -0.080078125, -0.05682373046875, -0.0335693359375, -0.01031494140625, 0.012939453125, 0.03619384765625, 0.0594482421875, 0.08270263671875, 0.10595703125, 0.12921142578125, 0.1524658203125, 0.17572021484375, 0.198974609375, 0.22222900390625, 0.2454833984375, 0.26873779296875, 0.2919921875, 0.31524658203125, 0.3385009765625, 0.36175537109375, 0.385009765625, 0.40826416015625, 0.4315185546875, 0.45477294921875, 0.47802734375, 0.50128173828125, 0.5245361328125, 0.54779052734375, 0.571044921875, 0.59429931640625, 0.6175537109375, 0.64080810546875, 0.6640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 13.0, 47.0, 134.0, 259.0, 717.0, 1751.0, 12108.0, 4126033.0, 48600.0, 2957.0, 987.0, 379.0, 177.0, 72.0, 21.0, 11.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.12066650390625, -3.9718017578125, -3.82293701171875, -3.674072265625, -3.52520751953125, -3.3763427734375, -3.22747802734375, -3.07861328125, -2.92974853515625, -2.7808837890625, -2.63201904296875, -2.483154296875, -2.33428955078125, -2.1854248046875, -2.03656005859375, -1.8876953125, -1.73883056640625, -1.5899658203125, -1.44110107421875, -1.292236328125, -1.14337158203125, -0.9945068359375, -0.84564208984375, -0.69677734375, -0.54791259765625, -0.3990478515625, -0.25018310546875, -0.101318359375, 0.04754638671875, 0.1964111328125, 0.34527587890625, 0.494140625, 0.64300537109375, 0.7918701171875, 0.94073486328125, 1.089599609375, 1.23846435546875, 1.3873291015625, 1.53619384765625, 1.68505859375, 1.83392333984375, 1.9827880859375, 2.13165283203125, 2.280517578125, 2.42938232421875, 2.5782470703125, 2.72711181640625, 2.8759765625, 3.02484130859375, 3.1737060546875, 3.32257080078125, 3.471435546875, 3.62030029296875, 3.7691650390625, 3.91802978515625, 4.06689453125, 4.21575927734375, 4.3646240234375, 4.51348876953125, 4.662353515625, 4.81121826171875, 4.9600830078125, 5.10894775390625, 5.2578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 8.0, 12.0, 25.0, 51.0, 144.0, 2746.0, 904.0, 86.0, 38.0, 21.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.1987457275390625, -1.157257080078125, -1.1157684326171875, -1.07427978515625, -1.0327911376953125, -0.991302490234375, -0.9498138427734375, -0.9083251953125, -0.8668365478515625, -0.825347900390625, -0.7838592529296875, -0.74237060546875, -0.7008819580078125, -0.659393310546875, -0.6179046630859375, -0.576416015625, -0.5349273681640625, -0.493438720703125, -0.4519500732421875, -0.41046142578125, -0.3689727783203125, -0.327484130859375, -0.2859954833984375, -0.2445068359375, -0.2030181884765625, -0.161529541015625, -0.1200408935546875, -0.07855224609375, -0.0370635986328125, 0.004425048828125, 0.0459136962890625, 0.08740234375, 0.1288909912109375, 0.170379638671875, 0.2118682861328125, 0.25335693359375, 0.2948455810546875, 0.336334228515625, 0.3778228759765625, 0.4193115234375, 0.4608001708984375, 0.502288818359375, 0.5437774658203125, 0.58526611328125, 0.6267547607421875, 0.668243408203125, 0.7097320556640625, 0.751220703125, 0.7927093505859375, 0.834197998046875, 0.8756866455078125, 0.91717529296875, 0.9586639404296875, 1.000152587890625, 1.0416412353515625, 1.0831298828125, 1.1246185302734375, 1.166107177734375, 1.2075958251953125, 1.24908447265625, 1.2905731201171875, 1.332061767578125, 1.3735504150390625, 1.4150390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 18.0, 54.0, 178.0, 397.0, 236.0, 72.0, 23.0, 12.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344240188598633, -8.164571762084961, -7.9849042892456055, -7.805236339569092, -7.625568389892578, -7.4459004402160645, -7.266232490539551, -7.086564540863037, -6.906896591186523, -6.72722864151001, -6.547560691833496, -6.367892742156982, -6.188224792480469, -6.008556842803955, -5.828888893127441, -5.649220943450928, -5.469552993774414, -5.2898850440979, -5.110217094421387, -4.930549144744873, -4.750881195068359, -4.571213245391846, -4.391545295715332, -4.211877346038818, -4.0322089195251465, -3.852540969848633, -3.672873020172119, -3.4932050704956055, -3.313537120819092, -3.133869171142578, -2.9542012214660645, -2.774533271789551, -2.594865322113037, -2.4151973724365234, -2.2355294227600098, -2.055861473083496, -1.8761935234069824, -1.6965255737304688, -1.5168575048446655, -1.3371895551681519, -1.1575216054916382, -0.9778536558151245, -0.7981857061386108, -0.6185176968574524, -0.4388497471809387, -0.25918179750442505, -0.0795137882232666, 0.10015416145324707, 0.27982211112976074, 0.4594900608062744, 0.6391580104827881, 0.8188260197639465, 0.9984939694404602, 1.178161859512329, 1.3578299283981323, 1.537497878074646, 1.7171658277511597, 1.8968337774276733, 2.0765018463134766, 2.2561697959899902, 2.435837745666504, 2.6155056953430176, 2.7951736450195312, 2.974841594696045, 3.1545095443725586]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 5.0, 11.0, 19.0, 25.0, 37.0, 40.0, 44.0, 53.0, 55.0, 76.0, 85.0, 77.0, 64.0, 70.0, 67.0, 45.0, 60.0, 40.0, 30.0, 25.0, 24.0, 19.0, 3.0, 5.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5115015506744385, -2.4132091999053955, -2.3149166107177734, -2.2166242599487305, -2.1183319091796875, -2.0200395584106445, -1.9217469692230225, -1.8234546184539795, -1.725162148475647, -1.6268696784973145, -1.5285773277282715, -1.430284857749939, -1.3319923877716064, -1.2337000370025635, -1.135407567024231, -1.0371150970458984, -0.9388227462768555, -0.8405303359031677, -0.74223792552948, -0.6439454555511475, -0.5456530451774597, -0.447360634803772, -0.34906816482543945, -0.2507757544517517, -0.15248334407806396, -0.05419091880321503, 0.04410150647163391, 0.14239394664764404, 0.2406863570213318, 0.33897876739501953, 0.43727123737335205, 0.5355636477470398, 0.6338562965393066, 0.7321487069129944, 0.8304411172866821, 0.9287335872650146, 1.0270259380340576, 1.1253184080123901, 1.2236108779907227, 1.3219032287597656, 1.4201956987380981, 1.5184881687164307, 1.6167805194854736, 1.7150729894638062, 1.8133654594421387, 1.9116578102111816, 2.0099501609802246, 2.1082427501678467, 2.2065351009368896, 2.3048274517059326, 2.4031200408935547, 2.5014123916625977, 2.5997047424316406, 2.6979970932006836, 2.7962896823883057, 2.8945820331573486, 2.9928746223449707, 3.0911669731140137, 3.1894595623016357, 3.2877519130706787, 3.3860442638397217, 3.4843368530273438, 3.5826292037963867, 3.6809215545654297, 3.7792139053344727]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 13.0, 35.0, 48.0, 89.0, 229.0, 546.0, 1571.0, 6114.0, 67485.0, 834735.0, 125955.0, 8615.0, 1935.0, 640.0, 257.0, 133.0, 63.0, 24.0, 24.0, 6.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.9117431640625, -2.819580078125, -2.7274169921875, -2.63525390625, -2.5430908203125, -2.450927734375, -2.3587646484375, -2.2666015625, -2.1744384765625, -2.082275390625, -1.9901123046875, -1.89794921875, -1.8057861328125, -1.713623046875, -1.6214599609375, -1.529296875, -1.4371337890625, -1.344970703125, -1.2528076171875, -1.16064453125, -1.0684814453125, -0.976318359375, -0.8841552734375, -0.7919921875, -0.6998291015625, -0.607666015625, -0.5155029296875, -0.42333984375, -0.3311767578125, -0.239013671875, -0.1468505859375, -0.0546875, 0.0374755859375, 0.129638671875, 0.2218017578125, 0.31396484375, 0.4061279296875, 0.498291015625, 0.5904541015625, 0.6826171875, 0.7747802734375, 0.866943359375, 0.9591064453125, 1.05126953125, 1.1434326171875, 1.235595703125, 1.3277587890625, 1.419921875, 1.5120849609375, 1.604248046875, 1.6964111328125, 1.78857421875, 1.8807373046875, 1.972900390625, 2.0650634765625, 2.1572265625, 2.2493896484375, 2.341552734375, 2.4337158203125, 2.52587890625, 2.6180419921875, 2.710205078125, 2.8023681640625, 2.89453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 15.0, 26.0, 37.0, 51.0, 78.0, 79.0, 107.0, 121.0, 120.0, 111.0, 63.0, 60.0, 43.0, 32.0, 14.0, 14.0, 9.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.85205078125, -0.8275222778320312, -0.8029937744140625, -0.7784652709960938, -0.753936767578125, -0.7294082641601562, -0.7048797607421875, -0.6803512573242188, -0.65582275390625, -0.6312942504882812, -0.6067657470703125, -0.5822372436523438, -0.557708740234375, -0.5331802368164062, -0.5086517333984375, -0.48412322998046875, -0.4595947265625, -0.43506622314453125, -0.4105377197265625, -0.38600921630859375, -0.361480712890625, -0.33695220947265625, -0.3124237060546875, -0.28789520263671875, -0.26336669921875, -0.23883819580078125, -0.2143096923828125, -0.18978118896484375, -0.165252685546875, -0.14072418212890625, -0.1161956787109375, -0.09166717529296875, -0.067138671875, -0.04261016845703125, -0.0180816650390625, 0.00644683837890625, 0.030975341796875, 0.05550384521484375, 0.0800323486328125, 0.10456085205078125, 0.12908935546875, 0.15361785888671875, 0.1781463623046875, 0.20267486572265625, 0.227203369140625, 0.25173187255859375, 0.2762603759765625, 0.30078887939453125, 0.3253173828125, 0.34984588623046875, 0.3743743896484375, 0.39890289306640625, 0.423431396484375, 0.44795989990234375, 0.4724884033203125, 0.49701690673828125, 0.52154541015625, 0.5460739135742188, 0.5706024169921875, 0.5951309204101562, 0.619659423828125, 0.6441879272460938, 0.6687164306640625, 0.6932449340820312, 0.7177734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 5.0, 4.0, 4.0, 12.0, 18.0, 23.0, 29.0, 44.0, 47.0, 74.0, 129.0, 228.0, 473.0, 993.0, 2793.0, 12059.0, 110784.0, 802845.0, 102035.0, 11434.0, 2605.0, 906.0, 379.0, 209.0, 138.0, 83.0, 60.0, 31.0, 29.0, 21.0, 8.0, 14.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.7188720703125, -1.648681640625, -1.5784912109375, -1.50830078125, -1.4381103515625, -1.367919921875, -1.2977294921875, -1.2275390625, -1.1573486328125, -1.087158203125, -1.0169677734375, -0.94677734375, -0.8765869140625, -0.806396484375, -0.7362060546875, -0.666015625, -0.5958251953125, -0.525634765625, -0.4554443359375, -0.38525390625, -0.3150634765625, -0.244873046875, -0.1746826171875, -0.1044921875, -0.0343017578125, 0.035888671875, 0.1060791015625, 0.17626953125, 0.2464599609375, 0.316650390625, 0.3868408203125, 0.45703125, 0.5272216796875, 0.597412109375, 0.6676025390625, 0.73779296875, 0.8079833984375, 0.878173828125, 0.9483642578125, 1.0185546875, 1.0887451171875, 1.158935546875, 1.2291259765625, 1.29931640625, 1.3695068359375, 1.439697265625, 1.5098876953125, 1.580078125, 1.6502685546875, 1.720458984375, 1.7906494140625, 1.86083984375, 1.9310302734375, 2.001220703125, 2.0714111328125, 2.1416015625, 2.2117919921875, 2.281982421875, 2.3521728515625, 2.42236328125, 2.4925537109375, 2.562744140625, 2.6329345703125, 2.703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 12.0, 10.0, 20.0, 16.0, 33.0, 35.0, 32.0, 33.0, 52.0, 59.0, 50.0, 63.0, 75.0, 78.0, 69.0, 38.0, 63.0, 43.0, 42.0, 42.0, 21.0, 12.0, 14.0, 13.0, 13.0, 7.0, 5.0, 3.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.9375, -2.86407470703125, -2.7906494140625, -2.71722412109375, -2.643798828125, -2.57037353515625, -2.4969482421875, -2.42352294921875, -2.35009765625, -2.27667236328125, -2.2032470703125, -2.12982177734375, -2.056396484375, -1.98297119140625, -1.9095458984375, -1.83612060546875, -1.7626953125, -1.68927001953125, -1.6158447265625, -1.54241943359375, -1.468994140625, -1.39556884765625, -1.3221435546875, -1.24871826171875, -1.17529296875, -1.10186767578125, -1.0284423828125, -0.95501708984375, -0.881591796875, -0.80816650390625, -0.7347412109375, -0.66131591796875, -0.587890625, -0.51446533203125, -0.4410400390625, -0.36761474609375, -0.294189453125, -0.22076416015625, -0.1473388671875, -0.07391357421875, -0.00048828125, 0.07293701171875, 0.1463623046875, 0.21978759765625, 0.293212890625, 0.36663818359375, 0.4400634765625, 0.51348876953125, 0.5869140625, 0.66033935546875, 0.7337646484375, 0.80718994140625, 0.880615234375, 0.95404052734375, 1.0274658203125, 1.10089111328125, 1.17431640625, 1.24774169921875, 1.3211669921875, 1.39459228515625, 1.468017578125, 1.54144287109375, 1.6148681640625, 1.68829345703125, 1.76171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 13.0, 18.0, 21.0, 39.0, 57.0, 94.0, 209.0, 392.0, 718.0, 1878.0, 6803.0, 56840.0, 920025.0, 51514.0, 6550.0, 1809.0, 721.0, 343.0, 209.0, 131.0, 64.0, 36.0, 27.0, 11.0, 7.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1637115478515625, -1.121368408203125, -1.0790252685546875, -1.03668212890625, -0.9943389892578125, -0.951995849609375, -0.9096527099609375, -0.8673095703125, -0.8249664306640625, -0.782623291015625, -0.7402801513671875, -0.69793701171875, -0.6555938720703125, -0.613250732421875, -0.5709075927734375, -0.528564453125, -0.4862213134765625, -0.443878173828125, -0.4015350341796875, -0.35919189453125, -0.3168487548828125, -0.274505615234375, -0.2321624755859375, -0.1898193359375, -0.1474761962890625, -0.105133056640625, -0.0627899169921875, -0.02044677734375, 0.0218963623046875, 0.064239501953125, 0.1065826416015625, 0.14892578125, 0.1912689208984375, 0.233612060546875, 0.2759552001953125, 0.31829833984375, 0.3606414794921875, 0.402984619140625, 0.4453277587890625, 0.4876708984375, 0.5300140380859375, 0.572357177734375, 0.6147003173828125, 0.65704345703125, 0.6993865966796875, 0.741729736328125, 0.7840728759765625, 0.826416015625, 0.8687591552734375, 0.911102294921875, 0.9534454345703125, 0.99578857421875, 1.0381317138671875, 1.080474853515625, 1.1228179931640625, 1.1651611328125, 1.2075042724609375, 1.249847412109375, 1.2921905517578125, 1.33453369140625, 1.3768768310546875, 1.419219970703125, 1.4615631103515625, 1.50390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 5.0, 8.0, 7.0, 13.0, 12.0, 16.0, 22.0, 39.0, 49.0, 49.0, 68.0, 116.0, 166.0, 116.0, 73.0, 59.0, 37.0, 31.0, 28.0, 19.0, 14.0, 6.0, 15.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015270709991455078, -0.00014816038310527802, -0.00014361366629600525, -0.00013906694948673248, -0.00013452023267745972, -0.00012997351586818695, -0.00012542679905891418, -0.00012088008224964142, -0.00011633336544036865, -0.00011178664863109589, -0.00010723993182182312, -0.00010269321501255035, -9.814649820327759e-05, -9.359978139400482e-05, -8.905306458473206e-05, -8.450634777545929e-05, -7.995963096618652e-05, -7.541291415691376e-05, -7.086619734764099e-05, -6.631948053836823e-05, -6.177276372909546e-05, -5.722604691982269e-05, -5.267933011054993e-05, -4.813261330127716e-05, -4.3585896492004395e-05, -3.903917968273163e-05, -3.449246287345886e-05, -2.9945746064186096e-05, -2.539902925491333e-05, -2.0852312445640564e-05, -1.6305595636367798e-05, -1.1758878827095032e-05, -7.212162017822266e-06, -2.6654452085494995e-06, 1.8812716007232666e-06, 6.427988409996033e-06, 1.0974705219268799e-05, 1.5521422028541565e-05, 2.006813883781433e-05, 2.4614855647087097e-05, 2.9161572456359863e-05, 3.370828926563263e-05, 3.8255006074905396e-05, 4.280172288417816e-05, 4.734843969345093e-05, 5.1895156502723694e-05, 5.644187331199646e-05, 6.0988590121269226e-05, 6.553530693054199e-05, 7.008202373981476e-05, 7.462874054908752e-05, 7.917545735836029e-05, 8.372217416763306e-05, 8.826889097690582e-05, 9.281560778617859e-05, 9.736232459545135e-05, 0.00010190904140472412, 0.00010645575821399689, 0.00011100247502326965, 0.00011554919183254242, 0.00012009590864181519, 0.00012464262545108795, 0.00012918934226036072, 0.00013373605906963348, 0.00013828277587890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 5.0, 4.0, 5.0, 9.0, 8.0, 14.0, 22.0, 36.0, 43.0, 81.0, 160.0, 270.0, 577.0, 1162.0, 4131.0, 23635.0, 477978.0, 509012.0, 24647.0, 4230.0, 1319.0, 546.0, 258.0, 154.0, 94.0, 53.0, 30.0, 16.0, 16.0, 14.0, 4.0, 3.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.125, -1.092864990234375, -1.06072998046875, -1.028594970703125, -0.9964599609375, -0.964324951171875, -0.93218994140625, -0.900054931640625, -0.867919921875, -0.835784912109375, -0.80364990234375, -0.771514892578125, -0.7393798828125, -0.707244873046875, -0.67510986328125, -0.642974853515625, -0.61083984375, -0.578704833984375, -0.54656982421875, -0.514434814453125, -0.4822998046875, -0.450164794921875, -0.41802978515625, -0.385894775390625, -0.353759765625, -0.321624755859375, -0.28948974609375, -0.257354736328125, -0.2252197265625, -0.193084716796875, -0.16094970703125, -0.128814697265625, -0.0966796875, -0.064544677734375, -0.03240966796875, -0.000274658203125, 0.0318603515625, 0.063995361328125, 0.09613037109375, 0.128265380859375, 0.160400390625, 0.192535400390625, 0.22467041015625, 0.256805419921875, 0.2889404296875, 0.321075439453125, 0.35321044921875, 0.385345458984375, 0.41748046875, 0.449615478515625, 0.48175048828125, 0.513885498046875, 0.5460205078125, 0.578155517578125, 0.61029052734375, 0.642425537109375, 0.674560546875, 0.706695556640625, 0.73883056640625, 0.770965576171875, 0.8031005859375, 0.835235595703125, 0.86737060546875, 0.899505615234375, 0.931640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 7.0, 9.0, 9.0, 22.0, 17.0, 17.0, 48.0, 53.0, 116.0, 181.0, 184.0, 110.0, 69.0, 39.0, 24.0, 15.0, 23.0, 7.0, 17.0, 4.0, 3.0, 3.0, 4.0, 5.0, 10.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.44140625, -1.4086990356445312, -1.3759918212890625, -1.3432846069335938, -1.310577392578125, -1.2778701782226562, -1.2451629638671875, -1.2124557495117188, -1.17974853515625, -1.1470413208007812, -1.1143341064453125, -1.0816268920898438, -1.048919677734375, -1.0162124633789062, -0.9835052490234375, -0.9507980346679688, -0.9180908203125, -0.8853836059570312, -0.8526763916015625, -0.8199691772460938, -0.787261962890625, -0.7545547485351562, -0.7218475341796875, -0.6891403198242188, -0.65643310546875, -0.6237258911132812, -0.5910186767578125, -0.5583114624023438, -0.525604248046875, -0.49289703369140625, -0.4601898193359375, -0.42748260498046875, -0.394775390625, -0.36206817626953125, -0.3293609619140625, -0.29665374755859375, -0.263946533203125, -0.23123931884765625, -0.1985321044921875, -0.16582489013671875, -0.13311767578125, -0.10041046142578125, -0.0677032470703125, -0.03499603271484375, -0.002288818359375, 0.03041839599609375, 0.0631256103515625, 0.09583282470703125, 0.1285400390625, 0.16124725341796875, 0.1939544677734375, 0.22666168212890625, 0.259368896484375, 0.29207611083984375, 0.3247833251953125, 0.35749053955078125, 0.39019775390625, 0.42290496826171875, 0.4556121826171875, 0.48831939697265625, 0.521026611328125, 0.5537338256835938, 0.5864410400390625, 0.6191482543945312, 0.65185546875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 4.0, 8.0, 14.0, 47.0, 85.0, 188.0, 247.0, 204.0, 110.0, 49.0, 28.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.90314483642578, -23.355697631835938, -22.808250427246094, -22.260805130004883, -21.71335792541504, -21.165910720825195, -20.618465423583984, -20.07101821899414, -19.523571014404297, -18.976123809814453, -18.42867660522461, -17.8812313079834, -17.333784103393555, -16.78633689880371, -16.2388916015625, -15.691444396972656, -15.143997192382812, -14.596549987792969, -14.049103736877441, -13.501657485961914, -12.95421028137207, -12.406763076782227, -11.8593168258667, -11.311870574951172, -10.764423370361328, -10.216976165771484, -9.669529914855957, -9.12208366394043, -8.574636459350586, -8.027189254760742, -7.479743003845215, -6.932296276092529, -6.384847640991211, -5.837400913238525, -5.28995418548584, -4.742507457733154, -4.195060729980469, -3.647614002227783, -3.1001672744750977, -2.552720546722412, -2.0052738189697266, -1.457827091217041, -0.9103803634643555, -0.3629336357116699, 0.18451309204101562, 0.7319598197937012, 1.2794065475463867, 1.8268532752990723, 2.374300003051758, 2.9217467308044434, 3.469193458557129, 4.0166401863098145, 4.5640869140625, 5.1115336418151855, 5.658980369567871, 6.206427097320557, 6.753873825073242, 7.301320552825928, 7.848767280578613, 8.39621353149414, 8.943660736083984, 9.491107940673828, 10.038554191589355, 10.586000442504883, 11.133447647094727]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 1.0, 8.0, 3.0, 8.0, 7.0, 5.0, 15.0, 8.0, 16.0, 30.0, 22.0, 27.0, 27.0, 34.0, 22.0, 49.0, 34.0, 42.0, 49.0, 47.0, 54.0, 50.0, 31.0, 35.0, 48.0, 40.0, 47.0, 42.0, 35.0, 20.0, 23.0, 24.0, 15.0, 9.0, 15.0, 13.0, 8.0, 10.0, 13.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.676092147827148, -13.295989990234375, -12.915887832641602, -12.535785675048828, -12.155682563781738, -11.775580406188965, -11.395478248596191, -11.015376091003418, -10.635273933410645, -10.255171775817871, -9.875069618225098, -9.494966506958008, -9.114864349365234, -8.734762191772461, -8.354660034179688, -7.974557876586914, -7.594455242156982, -7.214353084564209, -6.834250450134277, -6.454148292541504, -6.0740461349487305, -5.693943977355957, -5.313841342926025, -4.933739185333252, -4.55363655090332, -4.173534393310547, -3.7934319972991943, -3.413329601287842, -3.0332274436950684, -2.653125047683716, -2.2730226516723633, -1.8929204940795898, -1.5128183364868164, -1.1327160596847534, -0.7526137232780457, -0.3725113868713379, 0.007590889930725098, 0.3876931667327881, 0.7677955627441406, 1.147897720336914, 1.5280001163482666, 1.9081023931503296, 2.2882046699523926, 2.668307065963745, 3.0484094619750977, 3.428511619567871, 3.8086140155792236, 4.188715934753418, 4.56881856918335, 4.948920726776123, 5.329023361206055, 5.709125518798828, 6.089227676391602, 6.469329833984375, 6.849432468414307, 7.22953462600708, 7.609637260437012, 7.989739418029785, 8.369841575622559, 8.749944686889648, 9.130046844482422, 9.510149002075195, 9.890251159667969, 10.270353317260742, 10.650455474853516]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 14.0, 13.0, 20.0, 30.0, 51.0, 76.0, 128.0, 181.0, 320.0, 621.0, 1274.0, 2716.0, 7260.0, 27701.0, 346602.0, 3727281.0, 60375.0, 12098.0, 3954.0, 1676.0, 798.0, 423.0, 206.0, 153.0, 91.0, 68.0, 37.0, 18.0, 26.0, 17.0, 12.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.125274658203125, -2.05718994140625, -1.989105224609375, -1.9210205078125, -1.852935791015625, -1.78485107421875, -1.716766357421875, -1.648681640625, -1.580596923828125, -1.51251220703125, -1.444427490234375, -1.3763427734375, -1.308258056640625, -1.24017333984375, -1.172088623046875, -1.10400390625, -1.035919189453125, -0.96783447265625, -0.899749755859375, -0.8316650390625, -0.763580322265625, -0.69549560546875, -0.627410888671875, -0.559326171875, -0.491241455078125, -0.42315673828125, -0.355072021484375, -0.2869873046875, -0.218902587890625, -0.15081787109375, -0.082733154296875, -0.0146484375, 0.053436279296875, 0.12152099609375, 0.189605712890625, 0.2576904296875, 0.325775146484375, 0.39385986328125, 0.461944580078125, 0.530029296875, 0.598114013671875, 0.66619873046875, 0.734283447265625, 0.8023681640625, 0.870452880859375, 0.93853759765625, 1.006622314453125, 1.07470703125, 1.142791748046875, 1.21087646484375, 1.278961181640625, 1.3470458984375, 1.415130615234375, 1.48321533203125, 1.551300048828125, 1.619384765625, 1.687469482421875, 1.75555419921875, 1.823638916015625, 1.8917236328125, 1.959808349609375, 2.02789306640625, 2.095977783203125, 2.1640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 6.0, 10.0, 17.0, 17.0, 25.0, 36.0, 45.0, 59.0, 76.0, 60.0, 93.0, 91.0, 96.0, 84.0, 72.0, 75.0, 33.0, 32.0, 23.0, 11.0, 21.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8751983642578125, -0.849029541015625, -0.8228607177734375, -0.79669189453125, -0.7705230712890625, -0.744354248046875, -0.7181854248046875, -0.6920166015625, -0.6658477783203125, -0.639678955078125, -0.6135101318359375, -0.58734130859375, -0.5611724853515625, -0.535003662109375, -0.5088348388671875, -0.482666015625, -0.4564971923828125, -0.430328369140625, -0.4041595458984375, -0.37799072265625, -0.3518218994140625, -0.325653076171875, -0.2994842529296875, -0.2733154296875, -0.2471466064453125, -0.220977783203125, -0.1948089599609375, -0.16864013671875, -0.1424713134765625, -0.116302490234375, -0.0901336669921875, -0.06396484375, -0.0377960205078125, -0.011627197265625, 0.0145416259765625, 0.04071044921875, 0.0668792724609375, 0.093048095703125, 0.1192169189453125, 0.1453857421875, 0.1715545654296875, 0.197723388671875, 0.2238922119140625, 0.25006103515625, 0.2762298583984375, 0.302398681640625, 0.3285675048828125, 0.354736328125, 0.3809051513671875, 0.407073974609375, 0.4332427978515625, 0.45941162109375, 0.4855804443359375, 0.511749267578125, 0.5379180908203125, 0.5640869140625, 0.5902557373046875, 0.616424560546875, 0.6425933837890625, 0.66876220703125, 0.6949310302734375, 0.721099853515625, 0.7472686767578125, 0.7734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 15.0, 19.0, 66.0, 102.0, 217.0, 456.0, 1004.0, 2536.0, 7985.0, 46152.0, 3875644.0, 236231.0, 16817.0, 4229.0, 1513.0, 688.0, 298.0, 152.0, 74.0, 31.0, 22.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.034942626953125, -1.95269775390625, -1.870452880859375, -1.7882080078125, -1.705963134765625, -1.62371826171875, -1.541473388671875, -1.459228515625, -1.376983642578125, -1.29473876953125, -1.212493896484375, -1.1302490234375, -1.048004150390625, -0.96575927734375, -0.883514404296875, -0.80126953125, -0.719024658203125, -0.63677978515625, -0.554534912109375, -0.4722900390625, -0.390045166015625, -0.30780029296875, -0.225555419921875, -0.143310546875, -0.061065673828125, 0.02117919921875, 0.103424072265625, 0.1856689453125, 0.267913818359375, 0.35015869140625, 0.432403564453125, 0.5146484375, 0.596893310546875, 0.67913818359375, 0.761383056640625, 0.8436279296875, 0.925872802734375, 1.00811767578125, 1.090362548828125, 1.172607421875, 1.254852294921875, 1.33709716796875, 1.419342041015625, 1.5015869140625, 1.583831787109375, 1.66607666015625, 1.748321533203125, 1.83056640625, 1.912811279296875, 1.99505615234375, 2.077301025390625, 2.1595458984375, 2.241790771484375, 2.32403564453125, 2.406280517578125, 2.488525390625, 2.570770263671875, 2.65301513671875, 2.735260009765625, 2.8175048828125, 2.899749755859375, 2.98199462890625, 3.064239501953125, 3.146484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 9.0, 9.0, 18.0, 31.0, 60.0, 103.0, 353.0, 2480.0, 646.0, 162.0, 60.0, 30.0, 23.0, 18.0, 11.0, 6.0, 8.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.15826416015625, -1.1192626953125, -1.08026123046875, -1.041259765625, -1.00225830078125, -0.9632568359375, -0.92425537109375, -0.88525390625, -0.84625244140625, -0.8072509765625, -0.76824951171875, -0.729248046875, -0.69024658203125, -0.6512451171875, -0.61224365234375, -0.5732421875, -0.53424072265625, -0.4952392578125, -0.45623779296875, -0.417236328125, -0.37823486328125, -0.3392333984375, -0.30023193359375, -0.26123046875, -0.22222900390625, -0.1832275390625, -0.14422607421875, -0.105224609375, -0.06622314453125, -0.0272216796875, 0.01177978515625, 0.05078125, 0.08978271484375, 0.1287841796875, 0.16778564453125, 0.206787109375, 0.24578857421875, 0.2847900390625, 0.32379150390625, 0.36279296875, 0.40179443359375, 0.4407958984375, 0.47979736328125, 0.518798828125, 0.55780029296875, 0.5968017578125, 0.63580322265625, 0.6748046875, 0.71380615234375, 0.7528076171875, 0.79180908203125, 0.830810546875, 0.86981201171875, 0.9088134765625, 0.94781494140625, 0.98681640625, 1.02581787109375, 1.0648193359375, 1.10382080078125, 1.142822265625, 1.18182373046875, 1.2208251953125, 1.25982666015625, 1.298828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 14.0, 30.0, 127.0, 367.0, 323.0, 103.0, 33.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.952731132507324, -8.632033348083496, -8.311336517333984, -7.990638732910156, -7.669940948486328, -7.349243640899658, -7.028546333312988, -6.70784854888916, -6.38715124130249, -6.06645393371582, -5.745756149291992, -5.425058841705322, -5.104361534118652, -4.783663749694824, -4.462966442108154, -4.142269134521484, -3.8215713500976562, -3.5008738040924072, -3.180176258087158, -2.8594789505004883, -2.5387814044952393, -2.2180838584899902, -1.8973864316940308, -1.5766890048980713, -1.2559914588928223, -0.935293972492218, -0.6145964860916138, -0.2938989996910095, 0.026798486709594727, 0.34749603271484375, 0.6681934595108032, 0.9888908863067627, 1.3095874786376953, 1.6302850246429443, 1.9509824514389038, 2.2716798782348633, 2.5923774242401123, 2.9130749702453613, 3.2337722778320312, 3.5544698238372803, 3.8751673698425293, 4.195864677429199, 4.516562461853027, 4.837259769439697, 5.157957077026367, 5.478654861450195, 5.799352169036865, 6.120049476623535, 6.440747261047363, 6.761444568634033, 7.082142353057861, 7.402839660644531, 7.723537445068359, 8.044235229492188, 8.3649320602417, 8.685629844665527, 9.006326675415039, 9.327024459838867, 9.647721290588379, 9.968419075012207, 10.289116859436035, 10.609813690185547, 10.930511474609375, 11.251209259033203, 11.571907043457031]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 11.0, 8.0, 10.0, 12.0, 13.0, 23.0, 45.0, 28.0, 27.0, 37.0, 40.0, 48.0, 50.0, 52.0, 56.0, 55.0, 55.0, 64.0, 45.0, 54.0, 38.0, 38.0, 37.0, 26.0, 22.0, 22.0, 20.0, 15.0, 10.0, 7.0, 11.0, 4.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.089986801147461, -3.980909585952759, -3.8718323707580566, -3.7627551555633545, -3.6536779403686523, -3.54460072517395, -3.435523509979248, -3.326446056365967, -3.2173690795898438, -3.1082918643951416, -2.9992146492004395, -2.8901374340057373, -2.781060218811035, -2.671983003616333, -2.562905788421631, -2.4538283348083496, -2.3447511196136475, -2.2356739044189453, -2.126596689224243, -2.017519474029541, -1.9084422588348389, -1.7993650436401367, -1.690287709236145, -1.5812104940414429, -1.4721332788467407, -1.3630560636520386, -1.2539788484573364, -1.1449015140533447, -1.0358242988586426, -0.9267471432685852, -0.8176698684692383, -0.7085926532745361, -0.599515438079834, -0.49043822288513184, -0.3813609778881073, -0.27228373289108276, -0.16320651769638062, -0.05412930250167847, 0.05494797229766846, 0.1640251874923706, 0.27310240268707275, 0.3821796178817749, 0.49125686287879944, 0.600334107875824, 0.7094113230705261, 0.8184885382652283, 0.9275658130645752, 1.0366430282592773, 1.1457202434539795, 1.2547974586486816, 1.3638746738433838, 1.472951889038086, 1.582029104232788, 1.6911063194274902, 1.800183653831482, 1.909260869026184, 2.018338203430176, 2.127415418624878, 2.23649263381958, 2.3455698490142822, 2.4546470642089844, 2.5637242794036865, 2.6728014945983887, 2.78187894821167, 2.890955924987793]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 2.0, 15.0, 14.0, 15.0, 35.0, 49.0, 79.0, 129.0, 213.0, 399.0, 732.0, 1482.0, 3655.0, 10186.0, 35659.0, 167572.0, 528251.0, 231787.0, 47536.0, 12652.0, 4374.0, 1803.0, 866.0, 427.0, 233.0, 143.0, 90.0, 56.0, 29.0, 24.0, 19.0, 4.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7744140625, -1.7216033935546875, -1.668792724609375, -1.6159820556640625, -1.56317138671875, -1.5103607177734375, -1.457550048828125, -1.4047393798828125, -1.3519287109375, -1.2991180419921875, -1.246307373046875, -1.1934967041015625, -1.14068603515625, -1.0878753662109375, -1.035064697265625, -0.9822540283203125, -0.929443359375, -0.8766326904296875, -0.823822021484375, -0.7710113525390625, -0.71820068359375, -0.6653900146484375, -0.612579345703125, -0.5597686767578125, -0.5069580078125, -0.4541473388671875, -0.401336669921875, -0.3485260009765625, -0.29571533203125, -0.2429046630859375, -0.190093994140625, -0.1372833251953125, -0.08447265625, -0.0316619873046875, 0.021148681640625, 0.0739593505859375, 0.12677001953125, 0.1795806884765625, 0.232391357421875, 0.2852020263671875, 0.3380126953125, 0.3908233642578125, 0.443634033203125, 0.4964447021484375, 0.54925537109375, 0.6020660400390625, 0.654876708984375, 0.7076873779296875, 0.760498046875, 0.8133087158203125, 0.866119384765625, 0.9189300537109375, 0.97174072265625, 1.0245513916015625, 1.077362060546875, 1.1301727294921875, 1.1829833984375, 1.2357940673828125, 1.288604736328125, 1.3414154052734375, 1.39422607421875, 1.4470367431640625, 1.499847412109375, 1.5526580810546875, 1.60546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 6.0, 9.0, 16.0, 20.0, 36.0, 42.0, 43.0, 74.0, 68.0, 86.0, 91.0, 82.0, 98.0, 81.0, 64.0, 54.0, 42.0, 28.0, 16.0, 13.0, 11.0, 8.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.923828125, -0.897430419921875, -0.87103271484375, -0.844635009765625, -0.8182373046875, -0.791839599609375, -0.76544189453125, -0.739044189453125, -0.712646484375, -0.686248779296875, -0.65985107421875, -0.633453369140625, -0.6070556640625, -0.580657958984375, -0.55426025390625, -0.527862548828125, -0.50146484375, -0.475067138671875, -0.44866943359375, -0.422271728515625, -0.3958740234375, -0.369476318359375, -0.34307861328125, -0.316680908203125, -0.290283203125, -0.263885498046875, -0.23748779296875, -0.211090087890625, -0.1846923828125, -0.158294677734375, -0.13189697265625, -0.105499267578125, -0.0791015625, -0.052703857421875, -0.02630615234375, 9.1552734375e-05, 0.0264892578125, 0.052886962890625, 0.07928466796875, 0.105682373046875, 0.132080078125, 0.158477783203125, 0.18487548828125, 0.211273193359375, 0.2376708984375, 0.264068603515625, 0.29046630859375, 0.316864013671875, 0.34326171875, 0.369659423828125, 0.39605712890625, 0.422454833984375, 0.4488525390625, 0.475250244140625, 0.50164794921875, 0.528045654296875, 0.554443359375, 0.580841064453125, 0.60723876953125, 0.633636474609375, 0.6600341796875, 0.686431884765625, 0.71282958984375, 0.739227294921875, 0.765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 8.0, 8.0, 10.0, 14.0, 15.0, 25.0, 34.0, 49.0, 55.0, 81.0, 123.0, 224.0, 331.0, 641.0, 1681.0, 5089.0, 22673.0, 165278.0, 694291.0, 131247.0, 19077.0, 4585.0, 1403.0, 645.0, 328.0, 189.0, 144.0, 84.0, 58.0, 40.0, 37.0, 18.0, 12.0, 16.0, 13.0, 5.0, 9.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.29888916015625, -2.2208251953125, -2.14276123046875, -2.064697265625, -1.98663330078125, -1.9085693359375, -1.83050537109375, -1.75244140625, -1.67437744140625, -1.5963134765625, -1.51824951171875, -1.440185546875, -1.36212158203125, -1.2840576171875, -1.20599365234375, -1.1279296875, -1.04986572265625, -0.9718017578125, -0.89373779296875, -0.815673828125, -0.73760986328125, -0.6595458984375, -0.58148193359375, -0.50341796875, -0.42535400390625, -0.3472900390625, -0.26922607421875, -0.191162109375, -0.11309814453125, -0.0350341796875, 0.04302978515625, 0.12109375, 0.19915771484375, 0.2772216796875, 0.35528564453125, 0.433349609375, 0.51141357421875, 0.5894775390625, 0.66754150390625, 0.74560546875, 0.82366943359375, 0.9017333984375, 0.97979736328125, 1.057861328125, 1.13592529296875, 1.2139892578125, 1.29205322265625, 1.3701171875, 1.44818115234375, 1.5262451171875, 1.60430908203125, 1.682373046875, 1.76043701171875, 1.8385009765625, 1.91656494140625, 1.99462890625, 2.07269287109375, 2.1507568359375, 2.22882080078125, 2.306884765625, 2.38494873046875, 2.4630126953125, 2.54107666015625, 2.619140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 6.0, 12.0, 8.0, 10.0, 22.0, 18.0, 17.0, 21.0, 20.0, 36.0, 45.0, 43.0, 39.0, 39.0, 48.0, 43.0, 38.0, 42.0, 56.0, 45.0, 40.0, 54.0, 35.0, 31.0, 35.0, 32.0, 24.0, 27.0, 18.0, 9.0, 11.0, 12.0, 11.0, 8.0, 6.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.583984375, -2.495147705078125, -2.40631103515625, -2.317474365234375, -2.2286376953125, -2.139801025390625, -2.05096435546875, -1.962127685546875, -1.873291015625, -1.784454345703125, -1.69561767578125, -1.606781005859375, -1.5179443359375, -1.429107666015625, -1.34027099609375, -1.251434326171875, -1.16259765625, -1.073760986328125, -0.98492431640625, -0.896087646484375, -0.8072509765625, -0.718414306640625, -0.62957763671875, -0.540740966796875, -0.451904296875, -0.363067626953125, -0.27423095703125, -0.185394287109375, -0.0965576171875, -0.007720947265625, 0.08111572265625, 0.169952392578125, 0.2587890625, 0.347625732421875, 0.43646240234375, 0.525299072265625, 0.6141357421875, 0.702972412109375, 0.79180908203125, 0.880645751953125, 0.969482421875, 1.058319091796875, 1.14715576171875, 1.235992431640625, 1.3248291015625, 1.413665771484375, 1.50250244140625, 1.591339111328125, 1.68017578125, 1.769012451171875, 1.85784912109375, 1.946685791015625, 2.0355224609375, 2.124359130859375, 2.21319580078125, 2.302032470703125, 2.390869140625, 2.479705810546875, 2.56854248046875, 2.657379150390625, 2.7462158203125, 2.835052490234375, 2.92388916015625, 3.012725830078125, 3.1015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 26.0, 23.0, 37.0, 51.0, 118.0, 254.0, 542.0, 1566.0, 7437.0, 111285.0, 873031.0, 47441.0, 4741.0, 1101.0, 422.0, 220.0, 109.0, 55.0, 34.0, 17.0, 9.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.720703125, -1.6691436767578125, -1.617584228515625, -1.5660247802734375, -1.51446533203125, -1.4629058837890625, -1.411346435546875, -1.3597869873046875, -1.3082275390625, -1.2566680908203125, -1.205108642578125, -1.1535491943359375, -1.10198974609375, -1.0504302978515625, -0.998870849609375, -0.9473114013671875, -0.895751953125, -0.8441925048828125, -0.792633056640625, -0.7410736083984375, -0.68951416015625, -0.6379547119140625, -0.586395263671875, -0.5348358154296875, -0.4832763671875, -0.4317169189453125, -0.380157470703125, -0.3285980224609375, -0.27703857421875, -0.2254791259765625, -0.173919677734375, -0.1223602294921875, -0.07080078125, -0.0192413330078125, 0.032318115234375, 0.0838775634765625, 0.13543701171875, 0.1869964599609375, 0.238555908203125, 0.2901153564453125, 0.3416748046875, 0.3932342529296875, 0.444793701171875, 0.4963531494140625, 0.54791259765625, 0.5994720458984375, 0.651031494140625, 0.7025909423828125, 0.754150390625, 0.8057098388671875, 0.857269287109375, 0.9088287353515625, 0.96038818359375, 1.0119476318359375, 1.063507080078125, 1.1150665283203125, 1.1666259765625, 1.2181854248046875, 1.269744873046875, 1.3213043212890625, 1.37286376953125, 1.4244232177734375, 1.475982666015625, 1.5275421142578125, 1.5791015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 9.0, 24.0, 23.0, 33.0, 62.0, 66.0, 99.0, 99.0, 114.0, 100.0, 99.0, 70.0, 50.0, 30.0, 34.0, 20.0, 19.0, 10.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001323223114013672, -0.00012771226465702057, -0.00012310221791267395, -0.00011849217116832733, -0.00011388212442398071, -0.0001092720776796341, -0.00010466203093528748, -0.00010005198419094086, -9.544193744659424e-05, -9.083189070224762e-05, -8.6221843957901e-05, -8.161179721355438e-05, -7.700175046920776e-05, -7.239170372486115e-05, -6.778165698051453e-05, -6.317161023616791e-05, -5.856156349182129e-05, -5.395151674747467e-05, -4.934147000312805e-05, -4.473142325878143e-05, -4.0121376514434814e-05, -3.5511329770088196e-05, -3.090128302574158e-05, -2.629123628139496e-05, -2.168118953704834e-05, -1.707114279270172e-05, -1.2461096048355103e-05, -7.851049304008484e-06, -3.2410025596618652e-06, 1.3690441846847534e-06, 5.979090929031372e-06, 1.058913767337799e-05, 1.519918441772461e-05, 1.9809231162071228e-05, 2.4419277906417847e-05, 2.9029324650764465e-05, 3.3639371395111084e-05, 3.82494181394577e-05, 4.285946488380432e-05, 4.746951162815094e-05, 5.207955837249756e-05, 5.668960511684418e-05, 6.12996518611908e-05, 6.590969860553741e-05, 7.051974534988403e-05, 7.512979209423065e-05, 7.973983883857727e-05, 8.434988558292389e-05, 8.895993232727051e-05, 9.356997907161713e-05, 9.818002581596375e-05, 0.00010279007256031036, 0.00010740011930465698, 0.0001120101660490036, 0.00011662021279335022, 0.00012123025953769684, 0.00012584030628204346, 0.00013045035302639008, 0.0001350603997707367, 0.0001396704465150833, 0.00014428049325942993, 0.00014889054000377655, 0.00015350058674812317, 0.0001581106334924698, 0.0001627206802368164]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 10.0, 15.0, 26.0, 43.0, 77.0, 134.0, 260.0, 549.0, 1323.0, 4823.0, 32107.0, 525813.0, 448288.0, 28377.0, 4471.0, 1151.0, 529.0, 238.0, 130.0, 75.0, 35.0, 24.0, 12.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.1223907470703125, -1.083648681640625, -1.0449066162109375, -1.00616455078125, -0.9674224853515625, -0.928680419921875, -0.8899383544921875, -0.8511962890625, -0.8124542236328125, -0.773712158203125, -0.7349700927734375, -0.69622802734375, -0.6574859619140625, -0.618743896484375, -0.5800018310546875, -0.541259765625, -0.5025177001953125, -0.463775634765625, -0.4250335693359375, -0.38629150390625, -0.3475494384765625, -0.308807373046875, -0.2700653076171875, -0.2313232421875, -0.1925811767578125, -0.153839111328125, -0.1150970458984375, -0.07635498046875, -0.0376129150390625, 0.001129150390625, 0.0398712158203125, 0.07861328125, 0.1173553466796875, 0.156097412109375, 0.1948394775390625, 0.23358154296875, 0.2723236083984375, 0.311065673828125, 0.3498077392578125, 0.3885498046875, 0.4272918701171875, 0.466033935546875, 0.5047760009765625, 0.54351806640625, 0.5822601318359375, 0.621002197265625, 0.6597442626953125, 0.698486328125, 0.7372283935546875, 0.775970458984375, 0.8147125244140625, 0.85345458984375, 0.8921966552734375, 0.930938720703125, 0.9696807861328125, 1.0084228515625, 1.0471649169921875, 1.085906982421875, 1.1246490478515625, 1.16339111328125, 1.2021331787109375, 1.240875244140625, 1.2796173095703125, 1.318359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 7.0, 11.0, 10.0, 8.0, 17.0, 26.0, 31.0, 41.0, 59.0, 88.0, 119.0, 137.0, 134.0, 91.0, 55.0, 39.0, 30.0, 20.0, 14.0, 16.0, 11.0, 11.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.0867919921875, -1.048583984375, -1.0103759765625, -0.97216796875, -0.9339599609375, -0.895751953125, -0.8575439453125, -0.8193359375, -0.7811279296875, -0.742919921875, -0.7047119140625, -0.66650390625, -0.6282958984375, -0.590087890625, -0.5518798828125, -0.513671875, -0.4754638671875, -0.437255859375, -0.3990478515625, -0.36083984375, -0.3226318359375, -0.284423828125, -0.2462158203125, -0.2080078125, -0.1697998046875, -0.131591796875, -0.0933837890625, -0.05517578125, -0.0169677734375, 0.021240234375, 0.0594482421875, 0.09765625, 0.1358642578125, 0.174072265625, 0.2122802734375, 0.25048828125, 0.2886962890625, 0.326904296875, 0.3651123046875, 0.4033203125, 0.4415283203125, 0.479736328125, 0.5179443359375, 0.55615234375, 0.5943603515625, 0.632568359375, 0.6707763671875, 0.708984375, 0.7471923828125, 0.785400390625, 0.8236083984375, 0.86181640625, 0.9000244140625, 0.938232421875, 0.9764404296875, 1.0146484375, 1.0528564453125, 1.091064453125, 1.1292724609375, 1.16748046875, 1.2056884765625, 1.243896484375, 1.2821044921875, 1.3203125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 11.0, 30.0, 75.0, 225.0, 329.0, 197.0, 77.0, 28.0, 18.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.165355682373047, -16.234865188598633, -15.304374694824219, -14.373884201049805, -13.44339370727539, -12.512903213500977, -11.582412719726562, -10.651922225952148, -9.721431732177734, -8.79094123840332, -7.860450744628906, -6.929960250854492, -5.999469757080078, -5.068978786468506, -4.138488292694092, -3.2079977989196777, -2.2775068283081055, -1.3470163345336914, -0.4165257215499878, 0.5139648914337158, 1.4444553852081299, 2.374946117401123, 3.305436611175537, 4.235927104949951, 5.166417598724365, 6.096908092498779, 7.027398586273193, 7.957889556884766, 8.88838005065918, 9.818870544433594, 10.749361038208008, 11.679851531982422, 12.610342025756836, 13.54083251953125, 14.471323013305664, 15.401813507080078, 16.332304000854492, 17.262794494628906, 18.19328498840332, 19.123775482177734, 20.05426597595215, 20.984756469726562, 21.915246963500977, 22.84573745727539, 23.776227951049805, 24.70671844482422, 25.637208938598633, 26.567699432373047, 27.498191833496094, 28.428682327270508, 29.359172821044922, 30.289663314819336, 31.22015380859375, 32.1506462097168, 33.08113479614258, 34.011627197265625, 34.942115783691406, 35.87260818481445, 36.803096771240234, 37.73358917236328, 38.66407775878906, 39.59457015991211, 40.52505874633789, 41.45555114746094, 42.38603973388672]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 12.0, 7.0, 7.0, 12.0, 13.0, 18.0, 18.0, 25.0, 29.0, 34.0, 36.0, 47.0, 41.0, 51.0, 58.0, 66.0, 61.0, 64.0, 61.0, 52.0, 44.0, 46.0, 37.0, 30.0, 29.0, 21.0, 17.0, 11.0, 10.0, 8.0, 5.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.446754455566406, -21.841707229614258, -21.23666000366211, -20.631614685058594, -20.026567459106445, -19.421520233154297, -18.81647491455078, -18.211427688598633, -17.606380462646484, -17.001333236694336, -16.396286010742188, -15.791240692138672, -15.186193466186523, -14.581146240234375, -13.976099967956543, -13.371053695678711, -12.766006469726562, -12.160959243774414, -11.555912971496582, -10.95086669921875, -10.345819473266602, -9.740772247314453, -9.135725975036621, -8.530679702758789, -7.925632476806641, -7.32058572769165, -6.71553897857666, -6.11049222946167, -5.50544548034668, -4.9003987312316895, -4.295351982116699, -3.690305233001709, -3.0852584838867188, -2.4802117347717285, -1.8751649856567383, -1.270118236541748, -0.6650714874267578, -0.06002473831176758, 0.5450220108032227, 1.150068759918213, 1.7551155090332031, 2.3601622581481934, 2.9652090072631836, 3.570255756378174, 4.175302505493164, 4.780349254608154, 5.3853960037231445, 5.990442752838135, 6.595489501953125, 7.200536251068115, 7.8055830001831055, 8.410629272460938, 9.015676498413086, 9.620723724365234, 10.225769996643066, 10.830816268920898, 11.435863494873047, 12.040910720825195, 12.645956993103027, 13.25100326538086, 13.856050491333008, 14.461097717285156, 15.066143989562988, 15.67119026184082, 16.27623748779297]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 2.0, 10.0, 15.0, 17.0, 31.0, 56.0, 89.0, 117.0, 189.0, 327.0, 546.0, 997.0, 1905.0, 4284.0, 11626.0, 48438.0, 3806806.0, 277488.0, 26864.0, 7877.0, 3093.0, 1566.0, 782.0, 441.0, 257.0, 174.0, 86.0, 59.0, 43.0, 21.0, 16.0, 13.0, 13.0, 7.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6259765625, -1.57489013671875, -1.5238037109375, -1.47271728515625, -1.421630859375, -1.37054443359375, -1.3194580078125, -1.26837158203125, -1.21728515625, -1.16619873046875, -1.1151123046875, -1.06402587890625, -1.012939453125, -0.96185302734375, -0.9107666015625, -0.85968017578125, -0.80859375, -0.75750732421875, -0.7064208984375, -0.65533447265625, -0.604248046875, -0.55316162109375, -0.5020751953125, -0.45098876953125, -0.39990234375, -0.34881591796875, -0.2977294921875, -0.24664306640625, -0.195556640625, -0.14447021484375, -0.0933837890625, -0.04229736328125, 0.0087890625, 0.05987548828125, 0.1109619140625, 0.16204833984375, 0.213134765625, 0.26422119140625, 0.3153076171875, 0.36639404296875, 0.41748046875, 0.46856689453125, 0.5196533203125, 0.57073974609375, 0.621826171875, 0.67291259765625, 0.7239990234375, 0.77508544921875, 0.826171875, 0.87725830078125, 0.9283447265625, 0.97943115234375, 1.030517578125, 1.08160400390625, 1.1326904296875, 1.18377685546875, 1.23486328125, 1.28594970703125, 1.3370361328125, 1.38812255859375, 1.439208984375, 1.49029541015625, 1.5413818359375, 1.59246826171875, 1.6435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 8.0, 6.0, 12.0, 20.0, 27.0, 31.0, 33.0, 41.0, 71.0, 75.0, 69.0, 87.0, 81.0, 89.0, 63.0, 67.0, 50.0, 36.0, 35.0, 18.0, 12.0, 17.0, 9.0, 9.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.033203125, -1.003662109375, -0.97412109375, -0.944580078125, -0.9150390625, -0.885498046875, -0.85595703125, -0.826416015625, -0.796875, -0.767333984375, -0.73779296875, -0.708251953125, -0.6787109375, -0.649169921875, -0.61962890625, -0.590087890625, -0.560546875, -0.531005859375, -0.50146484375, -0.471923828125, -0.4423828125, -0.412841796875, -0.38330078125, -0.353759765625, -0.32421875, -0.294677734375, -0.26513671875, -0.235595703125, -0.2060546875, -0.176513671875, -0.14697265625, -0.117431640625, -0.087890625, -0.058349609375, -0.02880859375, 0.000732421875, 0.0302734375, 0.059814453125, 0.08935546875, 0.118896484375, 0.1484375, 0.177978515625, 0.20751953125, 0.237060546875, 0.2666015625, 0.296142578125, 0.32568359375, 0.355224609375, 0.384765625, 0.414306640625, 0.44384765625, 0.473388671875, 0.5029296875, 0.532470703125, 0.56201171875, 0.591552734375, 0.62109375, 0.650634765625, 0.68017578125, 0.709716796875, 0.7392578125, 0.768798828125, 0.79833984375, 0.827880859375, 0.857421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 6.0, 7.0, 9.0, 15.0, 17.0, 35.0, 50.0, 85.0, 110.0, 147.0, 183.0, 299.0, 496.0, 766.0, 1299.0, 2426.0, 5072.0, 13918.0, 82174.0, 3978668.0, 83305.0, 13977.0, 5292.0, 2389.0, 1260.0, 793.0, 497.0, 301.0, 217.0, 134.0, 83.0, 67.0, 57.0, 45.0, 30.0, 22.0, 12.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7265625, -1.665985107421875, -1.60540771484375, -1.544830322265625, -1.4842529296875, -1.423675537109375, -1.36309814453125, -1.302520751953125, -1.241943359375, -1.181365966796875, -1.12078857421875, -1.060211181640625, -0.9996337890625, -0.939056396484375, -0.87847900390625, -0.817901611328125, -0.75732421875, -0.696746826171875, -0.63616943359375, -0.575592041015625, -0.5150146484375, -0.454437255859375, -0.39385986328125, -0.333282470703125, -0.272705078125, -0.212127685546875, -0.15155029296875, -0.090972900390625, -0.0303955078125, 0.030181884765625, 0.09075927734375, 0.151336669921875, 0.2119140625, 0.272491455078125, 0.33306884765625, 0.393646240234375, 0.4542236328125, 0.514801025390625, 0.57537841796875, 0.635955810546875, 0.696533203125, 0.757110595703125, 0.81768798828125, 0.878265380859375, 0.9388427734375, 0.999420166015625, 1.05999755859375, 1.120574951171875, 1.18115234375, 1.241729736328125, 1.30230712890625, 1.362884521484375, 1.4234619140625, 1.484039306640625, 1.54461669921875, 1.605194091796875, 1.665771484375, 1.726348876953125, 1.78692626953125, 1.847503662109375, 1.9080810546875, 1.968658447265625, 2.02923583984375, 2.089813232421875, 2.150390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 9.0, 8.0, 23.0, 28.0, 94.0, 689.0, 3024.0, 105.0, 26.0, 19.0, 16.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.62615966796875, -0.6053466796875, -0.58453369140625, -0.563720703125, -0.54290771484375, -0.5220947265625, -0.50128173828125, -0.48046875, -0.45965576171875, -0.4388427734375, -0.41802978515625, -0.397216796875, -0.37640380859375, -0.3555908203125, -0.33477783203125, -0.31396484375, -0.29315185546875, -0.2723388671875, -0.25152587890625, -0.230712890625, -0.20989990234375, -0.1890869140625, -0.16827392578125, -0.1474609375, -0.12664794921875, -0.1058349609375, -0.08502197265625, -0.064208984375, -0.04339599609375, -0.0225830078125, -0.00177001953125, 0.01904296875, 0.03985595703125, 0.0606689453125, 0.08148193359375, 0.102294921875, 0.12310791015625, 0.1439208984375, 0.16473388671875, 0.185546875, 0.20635986328125, 0.2271728515625, 0.24798583984375, 0.268798828125, 0.28961181640625, 0.3104248046875, 0.33123779296875, 0.35205078125, 0.37286376953125, 0.3936767578125, 0.41448974609375, 0.435302734375, 0.45611572265625, 0.4769287109375, 0.49774169921875, 0.5185546875, 0.53936767578125, 0.5601806640625, 0.58099365234375, 0.601806640625, 0.62261962890625, 0.6434326171875, 0.66424560546875, 0.68505859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 15.0, 50.0, 146.0, 265.0, 271.0, 149.0, 66.0, 27.0, 9.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5270354747772217, -2.422767400741577, -2.3184990882873535, -2.214231014251709, -2.1099629402160645, -2.00569486618042, -1.9014266729354858, -1.7971584796905518, -1.6928904056549072, -1.5886223316192627, -1.4843541383743286, -1.3800859451293945, -1.27581787109375, -1.1715497970581055, -1.0672816038131714, -0.9630134701728821, -0.8587453365325928, -0.7544772028923035, -0.6502090692520142, -0.5459409356117249, -0.44167280197143555, -0.33740466833114624, -0.23313653469085693, -0.12886840105056763, -0.02460026741027832, 0.07966786623001099, 0.1839359998703003, 0.2882041335105896, 0.3924722671508789, 0.4967404007911682, 0.6010085344314575, 0.7052766680717468, 0.809544563293457, 0.9138126969337463, 1.0180808305740356, 1.1223490238189697, 1.2266170978546143, 1.3308851718902588, 1.4351533651351929, 1.539421558380127, 1.6436896324157715, 1.747957706451416, 1.85222589969635, 1.9564940929412842, 2.0607621669769287, 2.1650302410125732, 2.269298553466797, 2.3735666275024414, 2.477834701538086, 2.5821027755737305, 2.686370849609375, 2.7906391620635986, 2.894907236099243, 2.9991753101348877, 3.1034436225891113, 3.207711696624756, 3.3119797706604004, 3.416247844696045, 3.5205159187316895, 3.624784231185913, 3.7290523052215576, 3.833320379257202, 3.937588691711426, 4.04185676574707, 4.146124839782715]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 1.0, 16.0, 16.0, 10.0, 15.0, 19.0, 29.0, 22.0, 26.0, 39.0, 27.0, 49.0, 42.0, 38.0, 55.0, 56.0, 55.0, 57.0, 50.0, 40.0, 43.0, 52.0, 18.0, 30.0, 30.0, 29.0, 25.0, 21.0, 16.0, 15.0, 18.0, 7.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1421548128128052, -1.1085011959075928, -1.0748475790023804, -1.041193962097168, -1.0075403451919556, -0.9738867282867432, -0.9402331709861755, -0.9065795540809631, -0.8729259371757507, -0.8392723202705383, -0.8056187033653259, -0.7719650864601135, -0.7383115291595459, -0.7046579122543335, -0.6710042953491211, -0.6373506784439087, -0.6036970615386963, -0.5700434446334839, -0.5363898277282715, -0.5027362108230591, -0.46908262372016907, -0.43542900681495667, -0.40177541971206665, -0.36812180280685425, -0.33446818590164185, -0.30081456899642944, -0.26716095209121704, -0.23350736498832703, -0.19985374808311462, -0.16620013117790222, -0.132546529173851, -0.0988929271697998, -0.06523919105529785, -0.031585581600666046, 0.0020680278539657593, 0.035721637308597565, 0.06937524676322937, 0.10302886366844177, 0.13668246567249298, 0.1703360676765442, 0.2039896845817566, 0.237643301486969, 0.2712969183921814, 0.3049505054950714, 0.3386041224002838, 0.3722577393054962, 0.40591132640838623, 0.43956494331359863, 0.47321856021881104, 0.5068721771240234, 0.5405257940292358, 0.5741794109344482, 0.6078330278396606, 0.641486644744873, 0.6751402020454407, 0.7087938189506531, 0.7424474358558655, 0.7761010527610779, 0.8097546696662903, 0.8434082865715027, 0.8770618438720703, 0.9107154607772827, 0.9443690776824951, 0.9780226945877075, 1.01167631149292]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 9.0, 14.0, 22.0, 30.0, 52.0, 94.0, 179.0, 359.0, 758.0, 1902.0, 4993.0, 14944.0, 61381.0, 304661.0, 492006.0, 126946.0, 27020.0, 8089.0, 2873.0, 1139.0, 541.0, 237.0, 119.0, 53.0, 42.0, 27.0, 17.0, 10.0, 13.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.024993896484375, -1.96014404296875, -1.895294189453125, -1.8304443359375, -1.765594482421875, -1.70074462890625, -1.635894775390625, -1.571044921875, -1.506195068359375, -1.44134521484375, -1.376495361328125, -1.3116455078125, -1.246795654296875, -1.18194580078125, -1.117095947265625, -1.05224609375, -0.987396240234375, -0.92254638671875, -0.857696533203125, -0.7928466796875, -0.727996826171875, -0.66314697265625, -0.598297119140625, -0.533447265625, -0.468597412109375, -0.40374755859375, -0.338897705078125, -0.2740478515625, -0.209197998046875, -0.14434814453125, -0.079498291015625, -0.0146484375, 0.050201416015625, 0.11505126953125, 0.179901123046875, 0.2447509765625, 0.309600830078125, 0.37445068359375, 0.439300537109375, 0.504150390625, 0.569000244140625, 0.63385009765625, 0.698699951171875, 0.7635498046875, 0.828399658203125, 0.89324951171875, 0.958099365234375, 1.02294921875, 1.087799072265625, 1.15264892578125, 1.217498779296875, 1.2823486328125, 1.347198486328125, 1.41204833984375, 1.476898193359375, 1.541748046875, 1.606597900390625, 1.67144775390625, 1.736297607421875, 1.8011474609375, 1.865997314453125, 1.93084716796875, 1.995697021484375, 2.060546875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 2.0, 1.0, 5.0, 11.0, 9.0, 15.0, 17.0, 20.0, 18.0, 51.0, 34.0, 63.0, 71.0, 77.0, 78.0, 82.0, 71.0, 88.0, 60.0, 55.0, 47.0, 31.0, 25.0, 8.0, 11.0, 8.0, 13.0, 11.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.015228271484375, -0.98553466796875, -0.955841064453125, -0.9261474609375, -0.896453857421875, -0.86676025390625, -0.837066650390625, -0.807373046875, -0.777679443359375, -0.74798583984375, -0.718292236328125, -0.6885986328125, -0.658905029296875, -0.62921142578125, -0.599517822265625, -0.56982421875, -0.540130615234375, -0.51043701171875, -0.480743408203125, -0.4510498046875, -0.421356201171875, -0.39166259765625, -0.361968994140625, -0.332275390625, -0.302581787109375, -0.27288818359375, -0.243194580078125, -0.2135009765625, -0.183807373046875, -0.15411376953125, -0.124420166015625, -0.0947265625, -0.065032958984375, -0.03533935546875, -0.005645751953125, 0.0240478515625, 0.053741455078125, 0.08343505859375, 0.113128662109375, 0.142822265625, 0.172515869140625, 0.20220947265625, 0.231903076171875, 0.2615966796875, 0.291290283203125, 0.32098388671875, 0.350677490234375, 0.38037109375, 0.410064697265625, 0.43975830078125, 0.469451904296875, 0.4991455078125, 0.528839111328125, 0.55853271484375, 0.588226318359375, 0.617919921875, 0.647613525390625, 0.67730712890625, 0.707000732421875, 0.7366943359375, 0.766387939453125, 0.79608154296875, 0.825775146484375, 0.85546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 8.0, 11.0, 19.0, 20.0, 30.0, 47.0, 94.0, 128.0, 223.0, 348.0, 837.0, 2147.0, 7782.0, 52471.0, 691443.0, 264166.0, 21616.0, 4379.0, 1419.0, 601.0, 290.0, 186.0, 85.0, 54.0, 39.0, 25.0, 22.0, 12.0, 14.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.38671875, -3.26910400390625, -3.1514892578125, -3.03387451171875, -2.916259765625, -2.79864501953125, -2.6810302734375, -2.56341552734375, -2.44580078125, -2.32818603515625, -2.2105712890625, -2.09295654296875, -1.975341796875, -1.85772705078125, -1.7401123046875, -1.62249755859375, -1.5048828125, -1.38726806640625, -1.2696533203125, -1.15203857421875, -1.034423828125, -0.91680908203125, -0.7991943359375, -0.68157958984375, -0.56396484375, -0.44635009765625, -0.3287353515625, -0.21112060546875, -0.093505859375, 0.02410888671875, 0.1417236328125, 0.25933837890625, 0.376953125, 0.49456787109375, 0.6121826171875, 0.72979736328125, 0.847412109375, 0.96502685546875, 1.0826416015625, 1.20025634765625, 1.31787109375, 1.43548583984375, 1.5531005859375, 1.67071533203125, 1.788330078125, 1.90594482421875, 2.0235595703125, 2.14117431640625, 2.2587890625, 2.37640380859375, 2.4940185546875, 2.61163330078125, 2.729248046875, 2.84686279296875, 2.9644775390625, 3.08209228515625, 3.19970703125, 3.31732177734375, 3.4349365234375, 3.55255126953125, 3.670166015625, 3.78778076171875, 3.9053955078125, 4.02301025390625, 4.140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 6.0, 5.0, 14.0, 16.0, 18.0, 26.0, 25.0, 39.0, 46.0, 34.0, 53.0, 54.0, 56.0, 51.0, 63.0, 61.0, 62.0, 52.0, 56.0, 47.0, 41.0, 16.0, 28.0, 18.0, 21.0, 16.0, 10.0, 7.0, 11.0, 6.0, 4.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.44921875, -5.3037109375, -5.158203125, -5.0126953125, -4.8671875, -4.7216796875, -4.576171875, -4.4306640625, -4.28515625, -4.1396484375, -3.994140625, -3.8486328125, -3.703125, -3.5576171875, -3.412109375, -3.2666015625, -3.12109375, -2.9755859375, -2.830078125, -2.6845703125, -2.5390625, -2.3935546875, -2.248046875, -2.1025390625, -1.95703125, -1.8115234375, -1.666015625, -1.5205078125, -1.375, -1.2294921875, -1.083984375, -0.9384765625, -0.79296875, -0.6474609375, -0.501953125, -0.3564453125, -0.2109375, -0.0654296875, 0.080078125, 0.2255859375, 0.37109375, 0.5166015625, 0.662109375, 0.8076171875, 0.953125, 1.0986328125, 1.244140625, 1.3896484375, 1.53515625, 1.6806640625, 1.826171875, 1.9716796875, 2.1171875, 2.2626953125, 2.408203125, 2.5537109375, 2.69921875, 2.8447265625, 2.990234375, 3.1357421875, 3.28125, 3.4267578125, 3.572265625, 3.7177734375, 3.86328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 27.0, 34.0, 69.0, 220.0, 999.0, 18740.0, 1016897.0, 10406.0, 841.0, 196.0, 58.0, 30.0, 14.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2916259765625, -5.137939453125, -4.9842529296875, -4.83056640625, -4.6768798828125, -4.523193359375, -4.3695068359375, -4.2158203125, -4.0621337890625, -3.908447265625, -3.7547607421875, -3.60107421875, -3.4473876953125, -3.293701171875, -3.1400146484375, -2.986328125, -2.8326416015625, -2.678955078125, -2.5252685546875, -2.37158203125, -2.2178955078125, -2.064208984375, -1.9105224609375, -1.7568359375, -1.6031494140625, -1.449462890625, -1.2957763671875, -1.14208984375, -0.9884033203125, -0.834716796875, -0.6810302734375, -0.52734375, -0.3736572265625, -0.219970703125, -0.0662841796875, 0.08740234375, 0.2410888671875, 0.394775390625, 0.5484619140625, 0.7021484375, 0.8558349609375, 1.009521484375, 1.1632080078125, 1.31689453125, 1.4705810546875, 1.624267578125, 1.7779541015625, 1.931640625, 2.0853271484375, 2.239013671875, 2.3927001953125, 2.54638671875, 2.7000732421875, 2.853759765625, 3.0074462890625, 3.1611328125, 3.3148193359375, 3.468505859375, 3.6221923828125, 3.77587890625, 3.9295654296875, 4.083251953125, 4.2369384765625, 4.390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 11.0, 16.0, 48.0, 72.0, 136.0, 174.0, 193.0, 138.0, 89.0, 51.0, 36.0, 20.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032901763916015625, -0.00032103434205055237, -0.0003130510449409485, -0.0003050677478313446, -0.0002970844507217407, -0.00028910115361213684, -0.00028111785650253296, -0.0002731345593929291, -0.0002651512622833252, -0.0002571679651737213, -0.00024918466806411743, -0.00024120137095451355, -0.00023321807384490967, -0.00022523477673530579, -0.0002172514796257019, -0.00020926818251609802, -0.00020128488540649414, -0.00019330158829689026, -0.00018531829118728638, -0.0001773349940776825, -0.0001693516969680786, -0.00016136839985847473, -0.00015338510274887085, -0.00014540180563926697, -0.00013741850852966309, -0.0001294352114200592, -0.00012145191431045532, -0.00011346861720085144, -0.00010548532009124756, -9.750202298164368e-05, -8.95187258720398e-05, -8.153542876243591e-05, -7.355213165283203e-05, -6.556883454322815e-05, -5.758553743362427e-05, -4.9602240324020386e-05, -4.1618943214416504e-05, -3.363564610481262e-05, -2.565234899520874e-05, -1.766905188560486e-05, -9.685754776000977e-06, -1.7024576663970947e-06, 6.280839443206787e-06, 1.4264136552810669e-05, 2.224743366241455e-05, 3.0230730772018433e-05, 3.8214027881622314e-05, 4.6197324991226196e-05, 5.418062210083008e-05, 6.216391921043396e-05, 7.014721632003784e-05, 7.813051342964172e-05, 8.61138105392456e-05, 9.409710764884949e-05, 0.00010208040475845337, 0.00011006370186805725, 0.00011804699897766113, 0.00012603029608726501, 0.0001340135931968689, 0.00014199689030647278, 0.00014998018741607666, 0.00015796348452568054, 0.00016594678163528442, 0.0001739300787448883, 0.0001819133758544922]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 13.0, 19.0, 24.0, 29.0, 54.0, 61.0, 81.0, 145.0, 293.0, 607.0, 1470.0, 4677.0, 21265.0, 188244.0, 723907.0, 89279.0, 12911.0, 3159.0, 1094.0, 485.0, 245.0, 143.0, 96.0, 56.0, 42.0, 28.0, 18.0, 12.0, 19.0, 13.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.123046875, -1.0883331298828125, -1.053619384765625, -1.0189056396484375, -0.98419189453125, -0.9494781494140625, -0.914764404296875, -0.8800506591796875, -0.8453369140625, -0.8106231689453125, -0.775909423828125, -0.7411956787109375, -0.70648193359375, -0.6717681884765625, -0.637054443359375, -0.6023406982421875, -0.567626953125, -0.5329132080078125, -0.498199462890625, -0.4634857177734375, -0.42877197265625, -0.3940582275390625, -0.359344482421875, -0.3246307373046875, -0.2899169921875, -0.2552032470703125, -0.220489501953125, -0.1857757568359375, -0.15106201171875, -0.1163482666015625, -0.081634521484375, -0.0469207763671875, -0.01220703125, 0.0225067138671875, 0.057220458984375, 0.0919342041015625, 0.12664794921875, 0.1613616943359375, 0.196075439453125, 0.2307891845703125, 0.2655029296875, 0.3002166748046875, 0.334930419921875, 0.3696441650390625, 0.40435791015625, 0.4390716552734375, 0.473785400390625, 0.5084991455078125, 0.543212890625, 0.5779266357421875, 0.612640380859375, 0.6473541259765625, 0.68206787109375, 0.7167816162109375, 0.751495361328125, 0.7862091064453125, 0.8209228515625, 0.8556365966796875, 0.890350341796875, 0.9250640869140625, 0.95977783203125, 0.9944915771484375, 1.029205322265625, 1.0639190673828125, 1.0986328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 2.0, 2.0, 12.0, 11.0, 15.0, 17.0, 27.0, 22.0, 25.0, 40.0, 84.0, 94.0, 109.0, 127.0, 106.0, 76.0, 58.0, 37.0, 24.0, 20.0, 26.0, 12.0, 9.0, 8.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6123046875, -1.5688934326171875, -1.525482177734375, -1.4820709228515625, -1.43865966796875, -1.3952484130859375, -1.351837158203125, -1.3084259033203125, -1.2650146484375, -1.2216033935546875, -1.178192138671875, -1.1347808837890625, -1.09136962890625, -1.0479583740234375, -1.004547119140625, -0.9611358642578125, -0.917724609375, -0.8743133544921875, -0.830902099609375, -0.7874908447265625, -0.74407958984375, -0.7006683349609375, -0.657257080078125, -0.6138458251953125, -0.5704345703125, -0.5270233154296875, -0.483612060546875, -0.4402008056640625, -0.39678955078125, -0.3533782958984375, -0.309967041015625, -0.2665557861328125, -0.22314453125, -0.1797332763671875, -0.136322021484375, -0.0929107666015625, -0.04949951171875, -0.0060882568359375, 0.037322998046875, 0.0807342529296875, 0.1241455078125, 0.1675567626953125, 0.210968017578125, 0.2543792724609375, 0.29779052734375, 0.3412017822265625, 0.384613037109375, 0.4280242919921875, 0.471435546875, 0.5148468017578125, 0.558258056640625, 0.6016693115234375, 0.64508056640625, 0.6884918212890625, 0.731903076171875, 0.7753143310546875, 0.8187255859375, 0.8621368408203125, 0.905548095703125, 0.9489593505859375, 0.99237060546875, 1.0357818603515625, 1.079193115234375, 1.1226043701171875, 1.166015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 9.0, 20.0, 41.0, 55.0, 100.0, 187.0, 192.0, 161.0, 92.0, 55.0, 34.0, 19.0, 10.0, 15.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.407970428466797, -21.664745330810547, -20.921520233154297, -20.178295135498047, -19.435070037841797, -18.69184684753418, -17.94862174987793, -17.20539665222168, -16.46217155456543, -15.71894645690918, -14.97572135925293, -14.232497215270996, -13.489272117614746, -12.746047019958496, -12.002822875976562, -11.259597778320312, -10.516372680664062, -9.773147583007812, -9.029922485351562, -8.286698341369629, -7.543473243713379, -6.800248146057129, -6.057023525238037, -5.313798904418945, -4.570573806762695, -3.8273489475250244, -3.0841240882873535, -2.3408992290496826, -1.5976743698120117, -0.8544495105743408, -0.11122465133666992, 0.6319999694824219, 1.3752250671386719, 2.1184499263763428, 2.8616747856140137, 3.6048996448516846, 4.3481245040893555, 5.0913496017456055, 5.834574222564697, 6.577798843383789, 7.321023941040039, 8.064249038696289, 8.807474136352539, 9.550698280334473, 10.293923377990723, 11.037148475646973, 11.780372619628906, 12.523597717285156, 13.266822814941406, 14.010047912597656, 14.753273010253906, 15.49649715423584, 16.239723205566406, 16.982946395874023, 17.726171493530273, 18.469396591186523, 19.212621688842773, 19.955846786499023, 20.699071884155273, 21.442296981811523, 22.18552017211914, 22.92874526977539, 23.67197036743164, 24.41519546508789, 25.15842056274414]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 8.0, 13.0, 12.0, 15.0, 16.0, 26.0, 26.0, 28.0, 32.0, 50.0, 50.0, 54.0, 47.0, 56.0, 60.0, 61.0, 57.0, 46.0, 50.0, 48.0, 31.0, 28.0, 27.0, 17.0, 20.0, 17.0, 17.0, 13.0, 16.0, 10.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.595840454101562, -21.9388484954834, -21.2818546295166, -20.624862670898438, -19.96786880493164, -19.310876846313477, -18.653884887695312, -17.996891021728516, -17.33989906311035, -16.682907104492188, -16.02591323852539, -15.368921279907227, -14.711928367614746, -14.054935455322266, -13.397942543029785, -12.740949630737305, -12.083956718444824, -11.426963806152344, -10.769970893859863, -10.112977981567383, -9.455986022949219, -8.798993110656738, -8.142000198364258, -7.4850077629089355, -6.828014850616455, -6.171021938323975, -5.514029502868652, -4.857036590576172, -4.200043678283691, -3.543051242828369, -2.8860583305358887, -2.2290658950805664, -1.572072982788086, -0.9150802493095398, -0.25808751583099365, 0.39890527725219727, 1.0558979511260986, 1.712890625, 2.3698835372924805, 3.0268759727478027, 3.683868885040283, 4.340861797332764, 4.997854232788086, 5.654847145080566, 6.311840057373047, 6.968832492828369, 7.62582540512085, 8.282817840576172, 8.939810752868652, 9.596803665161133, 10.253796577453613, 10.910789489746094, 11.567781448364258, 12.224774360656738, 12.881767272949219, 13.538759231567383, 14.19575309753418, 14.85274600982666, 15.50973892211914, 16.166730880737305, 16.8237247467041, 17.480716705322266, 18.137710571289062, 18.794702529907227, 19.45169448852539]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 3.0, 10.0, 9.0, 25.0, 25.0, 31.0, 44.0, 52.0, 81.0, 109.0, 173.0, 269.0, 373.0, 585.0, 1061.0, 1975.0, 3685.0, 9147.0, 26680.0, 124950.0, 3776067.0, 194514.0, 33843.0, 10872.0, 4495.0, 2166.0, 1150.0, 616.0, 383.0, 293.0, 166.0, 122.0, 86.0, 61.0, 47.0, 29.0, 24.0, 10.0, 9.0, 9.0, 8.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.455078125, -1.405914306640625, -1.35675048828125, -1.307586669921875, -1.2584228515625, -1.209259033203125, -1.16009521484375, -1.110931396484375, -1.061767578125, -1.012603759765625, -0.96343994140625, -0.914276123046875, -0.8651123046875, -0.815948486328125, -0.76678466796875, -0.717620849609375, -0.66845703125, -0.619293212890625, -0.57012939453125, -0.520965576171875, -0.4718017578125, -0.422637939453125, -0.37347412109375, -0.324310302734375, -0.275146484375, -0.225982666015625, -0.17681884765625, -0.127655029296875, -0.0784912109375, -0.029327392578125, 0.01983642578125, 0.069000244140625, 0.1181640625, 0.167327880859375, 0.21649169921875, 0.265655517578125, 0.3148193359375, 0.363983154296875, 0.41314697265625, 0.462310791015625, 0.511474609375, 0.560638427734375, 0.60980224609375, 0.658966064453125, 0.7081298828125, 0.757293701171875, 0.80645751953125, 0.855621337890625, 0.90478515625, 0.953948974609375, 1.00311279296875, 1.052276611328125, 1.1014404296875, 1.150604248046875, 1.19976806640625, 1.248931884765625, 1.298095703125, 1.347259521484375, 1.39642333984375, 1.445587158203125, 1.4947509765625, 1.543914794921875, 1.59307861328125, 1.642242431640625, 1.69140625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 15.0, 6.0, 4.0, 8.0, 13.0, 17.0, 30.0, 33.0, 25.0, 46.0, 62.0, 79.0, 84.0, 78.0, 99.0, 82.0, 65.0, 62.0, 43.0, 31.0, 31.0, 22.0, 16.0, 14.0, 8.0, 5.0, 2.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2294921875, -1.195098876953125, -1.16070556640625, -1.126312255859375, -1.0919189453125, -1.057525634765625, -1.02313232421875, -0.988739013671875, -0.954345703125, -0.919952392578125, -0.88555908203125, -0.851165771484375, -0.8167724609375, -0.782379150390625, -0.74798583984375, -0.713592529296875, -0.67919921875, -0.644805908203125, -0.61041259765625, -0.576019287109375, -0.5416259765625, -0.507232666015625, -0.47283935546875, -0.438446044921875, -0.404052734375, -0.369659423828125, -0.33526611328125, -0.300872802734375, -0.2664794921875, -0.232086181640625, -0.19769287109375, -0.163299560546875, -0.12890625, -0.094512939453125, -0.06011962890625, -0.025726318359375, 0.0086669921875, 0.043060302734375, 0.07745361328125, 0.111846923828125, 0.146240234375, 0.180633544921875, 0.21502685546875, 0.249420166015625, 0.2838134765625, 0.318206787109375, 0.35260009765625, 0.386993408203125, 0.42138671875, 0.455780029296875, 0.49017333984375, 0.524566650390625, 0.5589599609375, 0.593353271484375, 0.62774658203125, 0.662139892578125, 0.696533203125, 0.730926513671875, 0.76531982421875, 0.799713134765625, 0.8341064453125, 0.868499755859375, 0.90289306640625, 0.937286376953125, 0.9716796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 9.0, 20.0, 19.0, 21.0, 28.0, 34.0, 54.0, 76.0, 117.0, 185.0, 351.0, 747.0, 1535.0, 4040.0, 12544.0, 53110.0, 1053265.0, 2990178.0, 57388.0, 12978.0, 4244.0, 1687.0, 709.0, 346.0, 194.0, 111.0, 75.0, 53.0, 37.0, 27.0, 15.0, 18.0, 14.0, 8.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.09429931640625, -2.0245361328125, -1.95477294921875, -1.885009765625, -1.81524658203125, -1.7454833984375, -1.67572021484375, -1.60595703125, -1.53619384765625, -1.4664306640625, -1.39666748046875, -1.326904296875, -1.25714111328125, -1.1873779296875, -1.11761474609375, -1.0478515625, -0.97808837890625, -0.9083251953125, -0.83856201171875, -0.768798828125, -0.69903564453125, -0.6292724609375, -0.55950927734375, -0.48974609375, -0.41998291015625, -0.3502197265625, -0.28045654296875, -0.210693359375, -0.14093017578125, -0.0711669921875, -0.00140380859375, 0.068359375, 0.13812255859375, 0.2078857421875, 0.27764892578125, 0.347412109375, 0.41717529296875, 0.4869384765625, 0.55670166015625, 0.62646484375, 0.69622802734375, 0.7659912109375, 0.83575439453125, 0.905517578125, 0.97528076171875, 1.0450439453125, 1.11480712890625, 1.1845703125, 1.25433349609375, 1.3240966796875, 1.39385986328125, 1.463623046875, 1.53338623046875, 1.6031494140625, 1.67291259765625, 1.74267578125, 1.81243896484375, 1.8822021484375, 1.95196533203125, 2.021728515625, 2.09149169921875, 2.1612548828125, 2.23101806640625, 2.30078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 18.0, 28.0, 67.0, 181.0, 2728.0, 777.0, 136.0, 59.0, 31.0, 16.0, 3.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2672500610351562, -1.2346954345703125, -1.2021408081054688, -1.169586181640625, -1.1370315551757812, -1.1044769287109375, -1.0719223022460938, -1.03936767578125, -1.0068130493164062, -0.9742584228515625, -0.9417037963867188, -0.909149169921875, -0.8765945434570312, -0.8440399169921875, -0.8114852905273438, -0.7789306640625, -0.7463760375976562, -0.7138214111328125, -0.6812667846679688, -0.648712158203125, -0.6161575317382812, -0.5836029052734375, -0.5510482788085938, -0.51849365234375, -0.48593902587890625, -0.4533843994140625, -0.42082977294921875, -0.388275146484375, -0.35572052001953125, -0.3231658935546875, -0.29061126708984375, -0.258056640625, -0.22550201416015625, -0.1929473876953125, -0.16039276123046875, -0.127838134765625, -0.09528350830078125, -0.0627288818359375, -0.03017425537109375, 0.00238037109375, 0.03493499755859375, 0.0674896240234375, 0.10004425048828125, 0.132598876953125, 0.16515350341796875, 0.1977081298828125, 0.23026275634765625, 0.2628173828125, 0.29537200927734375, 0.3279266357421875, 0.36048126220703125, 0.393035888671875, 0.42559051513671875, 0.4581451416015625, 0.49069976806640625, 0.52325439453125, 0.5558090209960938, 0.5883636474609375, 0.6209182739257812, 0.653472900390625, 0.6860275268554688, 0.7185821533203125, 0.7511367797851562, 0.78369140625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 17.0, 25.0, 27.0, 44.0, 59.0, 41.0, 58.0, 87.0, 76.0, 81.0, 78.0, 65.0, 67.0, 56.0, 45.0, 47.0, 27.0, 28.0, 16.0, 11.0, 7.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.822250485420227, -1.7732852697372437, -1.7243200540542603, -1.6753548383712769, -1.626389503479004, -1.5774242877960205, -1.528459072113037, -1.4794938564300537, -1.4305286407470703, -1.381563425064087, -1.3325982093811035, -1.2836329936981201, -1.2346677780151367, -1.1857024431228638, -1.1367372274398804, -1.087772011756897, -1.0388067960739136, -0.9898415803909302, -0.9408763647079468, -0.8919110894203186, -0.8429458737373352, -0.7939806580543518, -0.7450153827667236, -0.6960501670837402, -0.6470849514007568, -0.5981197357177734, -0.54915452003479, -0.5001892447471619, -0.45122402906417847, -0.40225881338119507, -0.3532935678958893, -0.3043283224105835, -0.25536322593688965, -0.20639799535274506, -0.15743276476860046, -0.10846753418445587, -0.05950230360031128, -0.010537073016166687, 0.038428157567977905, 0.08739340305328369, 0.1363586187362671, 0.18532384932041168, 0.23428907990455627, 0.28325432538986206, 0.33221954107284546, 0.38118475675582886, 0.43015000224113464, 0.47911524772644043, 0.5280804634094238, 0.5770456790924072, 0.6260108947753906, 0.6749761700630188, 0.7239413857460022, 0.7729066014289856, 0.8218718767166138, 0.8708370923995972, 0.9198023080825806, 0.968767523765564, 1.0177327394485474, 1.0666979551315308, 1.1156632900238037, 1.164628505706787, 1.2135937213897705, 1.262558937072754, 1.3115241527557373]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 5.0, 4.0, 6.0, 13.0, 14.0, 11.0, 17.0, 23.0, 19.0, 34.0, 25.0, 39.0, 42.0, 37.0, 43.0, 38.0, 40.0, 59.0, 51.0, 47.0, 39.0, 45.0, 39.0, 36.0, 39.0, 32.0, 31.0, 34.0, 30.0, 20.0, 11.0, 13.0, 11.0, 8.0, 13.0, 4.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.4191548824310303, -1.3746458292007446, -1.3301368951797485, -1.285627841949463, -1.2411187887191772, -1.1966097354888916, -1.1521008014678955, -1.1075917482376099, -1.0630826950073242, -1.0185736417770386, -0.9740646481513977, -0.9295556545257568, -0.8850466012954712, -0.8405376076698303, -0.7960286140441895, -0.7515195608139038, -0.7070106267929077, -0.6625016331672668, -0.6179925799369812, -0.5734835863113403, -0.5289745330810547, -0.4844655394554138, -0.43995654582977295, -0.3954475224018097, -0.35093849897384644, -0.3064294755458832, -0.2619204521179199, -0.21741145849227905, -0.1729024350643158, -0.12839341163635254, -0.08388441801071167, -0.03937539458274841, 0.005133628845214844, 0.049642644822597504, 0.09415166079998016, 0.13866066932678223, 0.18316969275474548, 0.22767871618270874, 0.2721877098083496, 0.31669673323631287, 0.3612057566642761, 0.4057147800922394, 0.45022380352020264, 0.4947327971458435, 0.5392417907714844, 0.58375084400177, 0.6282598376274109, 0.6727688312530518, 0.7172778844833374, 0.7617868781089783, 0.8062959313392639, 0.8508049249649048, 0.8953139781951904, 0.9398229718208313, 0.9843319654464722, 1.0288410186767578, 1.073349952697754, 1.1178590059280396, 1.1623679399490356, 1.2068769931793213, 1.251386046409607, 1.2958950996398926, 1.3404040336608887, 1.3849130868911743, 1.42942214012146]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 7.0, 7.0, 2.0, 9.0, 11.0, 12.0, 19.0, 40.0, 47.0, 93.0, 142.0, 253.0, 587.0, 1356.0, 3827.0, 13567.0, 69348.0, 458122.0, 420698.0, 62146.0, 12193.0, 3609.0, 1286.0, 556.0, 257.0, 126.0, 62.0, 63.0, 23.0, 30.0, 14.0, 10.0, 12.0, 7.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.166015625, -2.09124755859375, -2.0164794921875, -1.94171142578125, -1.866943359375, -1.79217529296875, -1.7174072265625, -1.64263916015625, -1.56787109375, -1.49310302734375, -1.4183349609375, -1.34356689453125, -1.268798828125, -1.19403076171875, -1.1192626953125, -1.04449462890625, -0.9697265625, -0.89495849609375, -0.8201904296875, -0.74542236328125, -0.670654296875, -0.59588623046875, -0.5211181640625, -0.44635009765625, -0.37158203125, -0.29681396484375, -0.2220458984375, -0.14727783203125, -0.072509765625, 0.00225830078125, 0.0770263671875, 0.15179443359375, 0.2265625, 0.30133056640625, 0.3760986328125, 0.45086669921875, 0.525634765625, 0.60040283203125, 0.6751708984375, 0.74993896484375, 0.82470703125, 0.89947509765625, 0.9742431640625, 1.04901123046875, 1.123779296875, 1.19854736328125, 1.2733154296875, 1.34808349609375, 1.4228515625, 1.49761962890625, 1.5723876953125, 1.64715576171875, 1.721923828125, 1.79669189453125, 1.8714599609375, 1.94622802734375, 2.02099609375, 2.09576416015625, 2.1705322265625, 2.24530029296875, 2.320068359375, 2.39483642578125, 2.4696044921875, 2.54437255859375, 2.619140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 7.0, 15.0, 14.0, 37.0, 20.0, 35.0, 40.0, 54.0, 72.0, 72.0, 73.0, 86.0, 78.0, 81.0, 62.0, 51.0, 50.0, 26.0, 25.0, 21.0, 15.0, 10.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.26953125, -1.2364349365234375, -1.203338623046875, -1.1702423095703125, -1.13714599609375, -1.1040496826171875, -1.070953369140625, -1.0378570556640625, -1.0047607421875, -0.9716644287109375, -0.938568115234375, -0.9054718017578125, -0.87237548828125, -0.8392791748046875, -0.806182861328125, -0.7730865478515625, -0.739990234375, -0.7068939208984375, -0.673797607421875, -0.6407012939453125, -0.60760498046875, -0.5745086669921875, -0.541412353515625, -0.5083160400390625, -0.4752197265625, -0.4421234130859375, -0.409027099609375, -0.3759307861328125, -0.34283447265625, -0.3097381591796875, -0.276641845703125, -0.2435455322265625, -0.21044921875, -0.1773529052734375, -0.144256591796875, -0.1111602783203125, -0.07806396484375, -0.0449676513671875, -0.011871337890625, 0.0212249755859375, 0.0543212890625, 0.0874176025390625, 0.120513916015625, 0.1536102294921875, 0.18670654296875, 0.2198028564453125, 0.252899169921875, 0.2859954833984375, 0.319091796875, 0.3521881103515625, 0.385284423828125, 0.4183807373046875, 0.45147705078125, 0.4845733642578125, 0.517669677734375, 0.5507659912109375, 0.5838623046875, 0.6169586181640625, 0.650054931640625, 0.6831512451171875, 0.71624755859375, 0.7493438720703125, 0.782440185546875, 0.8155364990234375, 0.8486328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 3.0, 6.0, 17.0, 12.0, 22.0, 29.0, 42.0, 75.0, 153.0, 325.0, 1022.0, 4938.0, 95001.0, 913593.0, 29230.0, 2781.0, 718.0, 259.0, 118.0, 61.0, 41.0, 27.0, 22.0, 11.0, 9.0, 11.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.94281005859375, -4.7684326171875, -4.59405517578125, -4.419677734375, -4.24530029296875, -4.0709228515625, -3.89654541015625, -3.72216796875, -3.54779052734375, -3.3734130859375, -3.19903564453125, -3.024658203125, -2.85028076171875, -2.6759033203125, -2.50152587890625, -2.3271484375, -2.15277099609375, -1.9783935546875, -1.80401611328125, -1.629638671875, -1.45526123046875, -1.2808837890625, -1.10650634765625, -0.93212890625, -0.75775146484375, -0.5833740234375, -0.40899658203125, -0.234619140625, -0.06024169921875, 0.1141357421875, 0.28851318359375, 0.462890625, 0.63726806640625, 0.8116455078125, 0.98602294921875, 1.160400390625, 1.33477783203125, 1.5091552734375, 1.68353271484375, 1.85791015625, 2.03228759765625, 2.2066650390625, 2.38104248046875, 2.555419921875, 2.72979736328125, 2.9041748046875, 3.07855224609375, 3.2529296875, 3.42730712890625, 3.6016845703125, 3.77606201171875, 3.950439453125, 4.12481689453125, 4.2991943359375, 4.47357177734375, 4.64794921875, 4.82232666015625, 4.9967041015625, 5.17108154296875, 5.345458984375, 5.51983642578125, 5.6942138671875, 5.86859130859375, 6.04296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 9.0, 6.0, 13.0, 19.0, 19.0, 19.0, 31.0, 36.0, 41.0, 47.0, 49.0, 54.0, 60.0, 58.0, 55.0, 57.0, 77.0, 53.0, 38.0, 39.0, 35.0, 33.0, 29.0, 19.0, 12.0, 14.0, 17.0, 11.0, 10.0, 5.0, 3.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.75994873046875, -3.6175537109375, -3.47515869140625, -3.332763671875, -3.19036865234375, -3.0479736328125, -2.90557861328125, -2.76318359375, -2.62078857421875, -2.4783935546875, -2.33599853515625, -2.193603515625, -2.05120849609375, -1.9088134765625, -1.76641845703125, -1.6240234375, -1.48162841796875, -1.3392333984375, -1.19683837890625, -1.054443359375, -0.91204833984375, -0.7696533203125, -0.62725830078125, -0.48486328125, -0.34246826171875, -0.2000732421875, -0.05767822265625, 0.084716796875, 0.22711181640625, 0.3695068359375, 0.51190185546875, 0.654296875, 0.79669189453125, 0.9390869140625, 1.08148193359375, 1.223876953125, 1.36627197265625, 1.5086669921875, 1.65106201171875, 1.79345703125, 1.93585205078125, 2.0782470703125, 2.22064208984375, 2.363037109375, 2.50543212890625, 2.6478271484375, 2.79022216796875, 2.9326171875, 3.07501220703125, 3.2174072265625, 3.35980224609375, 3.502197265625, 3.64459228515625, 3.7869873046875, 3.92938232421875, 4.07177734375, 4.21417236328125, 4.3565673828125, 4.49896240234375, 4.641357421875, 4.78375244140625, 4.9261474609375, 5.06854248046875, 5.2109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 15.0, 22.0, 14.0, 20.0, 25.0, 47.0, 56.0, 67.0, 112.0, 202.0, 363.0, 807.0, 2472.0, 15050.0, 420887.0, 585484.0, 18092.0, 2870.0, 928.0, 380.0, 200.0, 125.0, 74.0, 56.0, 36.0, 40.0, 19.0, 11.0, 19.0, 10.0, 7.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.80078125, -2.7271575927734375, -2.653533935546875, -2.5799102783203125, -2.50628662109375, -2.4326629638671875, -2.359039306640625, -2.2854156494140625, -2.2117919921875, -2.1381683349609375, -2.064544677734375, -1.9909210205078125, -1.91729736328125, -1.8436737060546875, -1.770050048828125, -1.6964263916015625, -1.622802734375, -1.5491790771484375, -1.475555419921875, -1.4019317626953125, -1.32830810546875, -1.2546844482421875, -1.181060791015625, -1.1074371337890625, -1.0338134765625, -0.9601898193359375, -0.886566162109375, -0.8129425048828125, -0.73931884765625, -0.6656951904296875, -0.592071533203125, -0.5184478759765625, -0.44482421875, -0.3712005615234375, -0.297576904296875, -0.2239532470703125, -0.15032958984375, -0.0767059326171875, -0.003082275390625, 0.0705413818359375, 0.1441650390625, 0.2177886962890625, 0.291412353515625, 0.3650360107421875, 0.43865966796875, 0.5122833251953125, 0.585906982421875, 0.6595306396484375, 0.733154296875, 0.8067779541015625, 0.880401611328125, 0.9540252685546875, 1.02764892578125, 1.1012725830078125, 1.174896240234375, 1.2485198974609375, 1.3221435546875, 1.3957672119140625, 1.469390869140625, 1.5430145263671875, 1.61663818359375, 1.6902618408203125, 1.763885498046875, 1.8375091552734375, 1.9111328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 19.0, 35.0, 43.0, 94.0, 141.0, 177.0, 156.0, 135.0, 96.0, 34.0, 31.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0003345012664794922, -0.00032736361026763916, -0.00032022595405578613, -0.0003130882978439331, -0.0003059506416320801, -0.00029881298542022705, -0.000291675329208374, -0.000284537672996521, -0.00027740001678466797, -0.00027026236057281494, -0.0002631247043609619, -0.0002559870481491089, -0.00024884939193725586, -0.00024171173572540283, -0.0002345740795135498, -0.00022743642330169678, -0.00022029876708984375, -0.00021316111087799072, -0.0002060234546661377, -0.00019888579845428467, -0.00019174814224243164, -0.0001846104860305786, -0.00017747282981872559, -0.00017033517360687256, -0.00016319751739501953, -0.0001560598611831665, -0.00014892220497131348, -0.00014178454875946045, -0.00013464689254760742, -0.0001275092363357544, -0.00012037158012390137, -0.00011323392391204834, -0.00010609626770019531, -9.895861148834229e-05, -9.182095527648926e-05, -8.468329906463623e-05, -7.75456428527832e-05, -7.040798664093018e-05, -6.327033042907715e-05, -5.613267421722412e-05, -4.8995018005371094e-05, -4.1857361793518066e-05, -3.471970558166504e-05, -2.7582049369812012e-05, -2.0444393157958984e-05, -1.3306736946105957e-05, -6.16908073425293e-06, 9.685754776000977e-07, 8.106231689453125e-06, 1.5243887901306152e-05, 2.238154411315918e-05, 2.9519200325012207e-05, 3.6656856536865234e-05, 4.379451274871826e-05, 5.093216896057129e-05, 5.8069825172424316e-05, 6.520748138427734e-05, 7.234513759613037e-05, 7.94827938079834e-05, 8.662045001983643e-05, 9.375810623168945e-05, 0.00010089576244354248, 0.00010803341865539551, 0.00011517107486724854, 0.00012230873107910156]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 16.0, 28.0, 28.0, 72.0, 136.0, 240.0, 683.0, 2320.0, 22255.0, 937447.0, 79577.0, 4089.0, 915.0, 337.0, 177.0, 74.0, 54.0, 26.0, 14.0, 19.0, 11.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.59405517578125, -2.4888916015625, -2.38372802734375, -2.278564453125, -2.17340087890625, -2.0682373046875, -1.96307373046875, -1.85791015625, -1.75274658203125, -1.6475830078125, -1.54241943359375, -1.437255859375, -1.33209228515625, -1.2269287109375, -1.12176513671875, -1.0166015625, -0.91143798828125, -0.8062744140625, -0.70111083984375, -0.595947265625, -0.49078369140625, -0.3856201171875, -0.28045654296875, -0.17529296875, -0.07012939453125, 0.0350341796875, 0.14019775390625, 0.245361328125, 0.35052490234375, 0.4556884765625, 0.56085205078125, 0.666015625, 0.77117919921875, 0.8763427734375, 0.98150634765625, 1.086669921875, 1.19183349609375, 1.2969970703125, 1.40216064453125, 1.50732421875, 1.61248779296875, 1.7176513671875, 1.82281494140625, 1.927978515625, 2.03314208984375, 2.1383056640625, 2.24346923828125, 2.3486328125, 2.45379638671875, 2.5589599609375, 2.66412353515625, 2.769287109375, 2.87445068359375, 2.9796142578125, 3.08477783203125, 3.18994140625, 3.29510498046875, 3.4002685546875, 3.50543212890625, 3.610595703125, 3.71575927734375, 3.8209228515625, 3.92608642578125, 4.03125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 12.0, 23.0, 32.0, 49.0, 86.0, 147.0, 176.0, 158.0, 117.0, 66.0, 48.0, 31.0, 18.0, 7.0, 10.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -3.0199737548828125, -2.942291259765625, -2.8646087646484375, -2.78692626953125, -2.7092437744140625, -2.631561279296875, -2.5538787841796875, -2.4761962890625, -2.3985137939453125, -2.320831298828125, -2.2431488037109375, -2.16546630859375, -2.0877838134765625, -2.010101318359375, -1.9324188232421875, -1.854736328125, -1.7770538330078125, -1.699371337890625, -1.6216888427734375, -1.54400634765625, -1.4663238525390625, -1.388641357421875, -1.3109588623046875, -1.2332763671875, -1.1555938720703125, -1.077911376953125, -1.0002288818359375, -0.92254638671875, -0.8448638916015625, -0.767181396484375, -0.6894989013671875, -0.61181640625, -0.5341339111328125, -0.456451416015625, -0.3787689208984375, -0.30108642578125, -0.2234039306640625, -0.145721435546875, -0.0680389404296875, 0.0096435546875, 0.0873260498046875, 0.165008544921875, 0.2426910400390625, 0.32037353515625, 0.3980560302734375, 0.475738525390625, 0.5534210205078125, 0.631103515625, 0.7087860107421875, 0.786468505859375, 0.8641510009765625, 0.94183349609375, 1.0195159912109375, 1.097198486328125, 1.1748809814453125, 1.2525634765625, 1.3302459716796875, 1.407928466796875, 1.4856109619140625, 1.56329345703125, 1.6409759521484375, 1.718658447265625, 1.7963409423828125, 1.8740234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 10.0, 8.0, 24.0, 33.0, 65.0, 89.0, 141.0, 150.0, 183.0, 102.0, 78.0, 59.0, 29.0, 11.0, 7.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.10253143310547, -19.405010223388672, -18.707489013671875, -18.009967803955078, -17.31244659423828, -16.614925384521484, -15.917405128479004, -15.219884872436523, -14.522363662719727, -13.82484245300293, -13.127321243286133, -12.429800033569336, -11.732279777526855, -11.034758567810059, -10.337237358093262, -9.639717102050781, -8.942194938659668, -8.244673728942871, -7.547152996063232, -6.8496317863464355, -6.152111053466797, -5.45458984375, -4.757068634033203, -4.0595479011535645, -3.3620266914367676, -2.66450572013855, -1.9669846296310425, -1.2694635391235352, -0.5719425678253174, 0.1255784034729004, 0.8230996131896973, 1.520620346069336, 2.218141555786133, 2.9156625270843506, 3.6131834983825684, 4.310704708099365, 5.008225440979004, 5.705746650695801, 6.403267860412598, 7.100788593292236, 7.798309803009033, 8.495830535888672, 9.193351745605469, 9.890872955322266, 10.588394165039062, 11.28591537475586, 11.983436584472656, 12.680956840515137, 13.378478050231934, 14.07599925994873, 14.773520469665527, 15.471040725708008, 16.168561935424805, 16.8660831451416, 17.5636043548584, 18.261125564575195, 18.958646774291992, 19.65616798400879, 20.353689193725586, 21.051210403442383, 21.74873161315918, 22.446250915527344, 23.14377212524414, 23.841293334960938, 24.538814544677734]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 4.0, 3.0, 7.0, 5.0, 8.0, 8.0, 13.0, 20.0, 21.0, 23.0, 28.0, 26.0, 45.0, 39.0, 47.0, 41.0, 52.0, 68.0, 47.0, 58.0, 47.0, 58.0, 55.0, 47.0, 37.0, 38.0, 33.0, 17.0, 20.0, 22.0, 9.0, 8.0, 8.0, 7.0, 7.0, 8.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.755983352661133, -15.202385902404785, -14.648787498474121, -14.095190048217773, -13.54159164428711, -12.987994194030762, -12.434396743774414, -11.88079833984375, -11.327200889587402, -10.773603439331055, -10.22000503540039, -9.666407585144043, -9.112810134887695, -8.559211730957031, -8.005614280700684, -7.452016353607178, -6.898418426513672, -6.344820499420166, -5.79122257232666, -5.2376251220703125, -4.684027194976807, -4.130429267883301, -3.576831579208374, -3.0232338905334473, -2.4696359634399414, -1.916038155555725, -1.3624403476715088, -0.8088425397872925, -0.25524473190307617, 0.2983531951904297, 0.8519508838653564, 1.4055485725402832, 1.959146499633789, 2.512744426727295, 3.0663421154022217, 3.6199398040771484, 4.173537731170654, 4.72713565826416, 5.280733108520508, 5.834331035614014, 6.3879289627075195, 6.941526889801025, 7.495124816894531, 8.048722267150879, 8.602319717407227, 9.15591812133789, 9.709515571594238, 10.263113021850586, 10.81671142578125, 11.370308876037598, 11.923907279968262, 12.47750473022461, 13.031103134155273, 13.584700584411621, 14.138298034667969, 14.691896438598633, 15.24549388885498, 15.799091339111328, 16.352689743041992, 16.906288146972656, 17.459884643554688, 18.01348304748535, 18.567081451416016, 19.120677947998047, 19.67427635192871]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 8.0, 11.0, 6.0, 11.0, 12.0, 21.0, 33.0, 62.0, 101.0, 176.0, 399.0, 1196.0, 4567.0, 49335.0, 4107947.0, 25557.0, 3233.0, 907.0, 355.0, 167.0, 73.0, 39.0, 27.0, 13.0, 6.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.18896484375, -5.0380859375, -4.88720703125, -4.736328125, -4.58544921875, -4.4345703125, -4.28369140625, -4.1328125, -3.98193359375, -3.8310546875, -3.68017578125, -3.529296875, -3.37841796875, -3.2275390625, -3.07666015625, -2.92578125, -2.77490234375, -2.6240234375, -2.47314453125, -2.322265625, -2.17138671875, -2.0205078125, -1.86962890625, -1.71875, -1.56787109375, -1.4169921875, -1.26611328125, -1.115234375, -0.96435546875, -0.8134765625, -0.66259765625, -0.51171875, -0.36083984375, -0.2099609375, -0.05908203125, 0.091796875, 0.24267578125, 0.3935546875, 0.54443359375, 0.6953125, 0.84619140625, 0.9970703125, 1.14794921875, 1.298828125, 1.44970703125, 1.6005859375, 1.75146484375, 1.90234375, 2.05322265625, 2.2041015625, 2.35498046875, 2.505859375, 2.65673828125, 2.8076171875, 2.95849609375, 3.109375, 3.26025390625, 3.4111328125, 3.56201171875, 3.712890625, 3.86376953125, 4.0146484375, 4.16552734375, 4.31640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 9.0, 13.0, 15.0, 23.0, 32.0, 40.0, 44.0, 65.0, 78.0, 96.0, 100.0, 95.0, 82.0, 63.0, 64.0, 42.0, 33.0, 25.0, 16.0, 10.0, 16.0, 8.0, 3.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4951171875, -1.454345703125, -1.41357421875, -1.372802734375, -1.33203125, -1.291259765625, -1.25048828125, -1.209716796875, -1.1689453125, -1.128173828125, -1.08740234375, -1.046630859375, -1.005859375, -0.965087890625, -0.92431640625, -0.883544921875, -0.8427734375, -0.802001953125, -0.76123046875, -0.720458984375, -0.6796875, -0.638916015625, -0.59814453125, -0.557373046875, -0.5166015625, -0.475830078125, -0.43505859375, -0.394287109375, -0.353515625, -0.312744140625, -0.27197265625, -0.231201171875, -0.1904296875, -0.149658203125, -0.10888671875, -0.068115234375, -0.02734375, 0.013427734375, 0.05419921875, 0.094970703125, 0.1357421875, 0.176513671875, 0.21728515625, 0.258056640625, 0.298828125, 0.339599609375, 0.38037109375, 0.421142578125, 0.4619140625, 0.502685546875, 0.54345703125, 0.584228515625, 0.625, 0.665771484375, 0.70654296875, 0.747314453125, 0.7880859375, 0.828857421875, 0.86962890625, 0.910400390625, 0.951171875, 0.991943359375, 1.03271484375, 1.073486328125, 1.1142578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 21.0, 12.0, 22.0, 27.0, 32.0, 49.0, 60.0, 91.0, 136.0, 227.0, 361.0, 650.0, 1336.0, 2869.0, 6836.0, 22212.0, 127820.0, 3912299.0, 89575.0, 18128.0, 6023.0, 2576.0, 1311.0, 610.0, 315.0, 196.0, 137.0, 79.0, 80.0, 35.0, 42.0, 21.0, 29.0, 14.0, 13.0, 7.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.71484375, -1.652313232421875, -1.58978271484375, -1.527252197265625, -1.4647216796875, -1.402191162109375, -1.33966064453125, -1.277130126953125, -1.214599609375, -1.152069091796875, -1.08953857421875, -1.027008056640625, -0.9644775390625, -0.901947021484375, -0.83941650390625, -0.776885986328125, -0.71435546875, -0.651824951171875, -0.58929443359375, -0.526763916015625, -0.4642333984375, -0.401702880859375, -0.33917236328125, -0.276641845703125, -0.214111328125, -0.151580810546875, -0.08905029296875, -0.026519775390625, 0.0360107421875, 0.098541259765625, 0.16107177734375, 0.223602294921875, 0.2861328125, 0.348663330078125, 0.41119384765625, 0.473724365234375, 0.5362548828125, 0.598785400390625, 0.66131591796875, 0.723846435546875, 0.786376953125, 0.848907470703125, 0.91143798828125, 0.973968505859375, 1.0364990234375, 1.099029541015625, 1.16156005859375, 1.224090576171875, 1.28662109375, 1.349151611328125, 1.41168212890625, 1.474212646484375, 1.5367431640625, 1.599273681640625, 1.66180419921875, 1.724334716796875, 1.786865234375, 1.849395751953125, 1.91192626953125, 1.974456787109375, 2.0369873046875, 2.099517822265625, 2.16204833984375, 2.224578857421875, 2.287109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 7.0, 20.0, 20.0, 53.0, 100.0, 419.0, 3192.0, 152.0, 43.0, 29.0, 24.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.4217529296875, -0.397216796875, -0.3726806640625, -0.34814453125, -0.3236083984375, -0.299072265625, -0.2745361328125, -0.25, -0.2254638671875, -0.200927734375, -0.1763916015625, -0.15185546875, -0.1273193359375, -0.102783203125, -0.0782470703125, -0.0537109375, -0.0291748046875, -0.004638671875, 0.0198974609375, 0.04443359375, 0.0689697265625, 0.093505859375, 0.1180419921875, 0.142578125, 0.1671142578125, 0.191650390625, 0.2161865234375, 0.24072265625, 0.2652587890625, 0.289794921875, 0.3143310546875, 0.3388671875, 0.3634033203125, 0.387939453125, 0.4124755859375, 0.43701171875, 0.4615478515625, 0.486083984375, 0.5106201171875, 0.53515625, 0.5596923828125, 0.584228515625, 0.6087646484375, 0.63330078125, 0.6578369140625, 0.682373046875, 0.7069091796875, 0.7314453125, 0.7559814453125, 0.780517578125, 0.8050537109375, 0.82958984375, 0.8541259765625, 0.878662109375, 0.9031982421875, 0.927734375, 0.9522705078125, 0.976806640625, 1.0013427734375, 1.02587890625, 1.0504150390625, 1.074951171875, 1.0994873046875, 1.1240234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 11.0, 12.0, 31.0, 54.0, 98.0, 95.0, 165.0, 166.0, 138.0, 108.0, 54.0, 31.0, 24.0, 8.0, 6.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3960165977478027, -1.3235034942626953, -1.2509905099868774, -1.1784775257110596, -1.1059644222259521, -1.0334513187408447, -0.9609383344650269, -0.8884252905845642, -0.8159122467041016, -0.7433992028236389, -0.6708861589431763, -0.5983731150627136, -0.525860071182251, -0.45334702730178833, -0.3808339834213257, -0.30832093954086304, -0.2358078956604004, -0.16329485177993774, -0.0907818078994751, -0.01826876401901245, 0.054244279861450195, 0.12675732374191284, 0.1992703676223755, 0.27178341150283813, 0.3442964553833008, 0.4168094992637634, 0.4893225431442261, 0.5618355870246887, 0.6343486309051514, 0.706861674785614, 0.7793747186660767, 0.8518877625465393, 0.924400806427002, 0.9969138503074646, 1.0694268941879272, 1.1419398784637451, 1.2144529819488525, 1.28696608543396, 1.3594790697097778, 1.4319920539855957, 1.5045051574707031, 1.5770182609558105, 1.6495312452316284, 1.7220442295074463, 1.7945573329925537, 1.8670704364776611, 1.939583420753479, 2.012096405029297, 2.0846095085144043, 2.1571226119995117, 2.229635715484619, 2.3021485805511475, 2.374661684036255, 2.4471747875213623, 2.5196876525878906, 2.592200756072998, 2.6647138595581055, 2.737226963043213, 2.8097400665283203, 2.8822529315948486, 2.954766035079956, 3.0272791385650635, 3.099792003631592, 3.172305107116699, 3.2448182106018066]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 8.0, 4.0, 3.0, 4.0, 7.0, 9.0, 9.0, 14.0, 15.0, 25.0, 24.0, 30.0, 34.0, 48.0, 40.0, 45.0, 44.0, 50.0, 54.0, 61.0, 60.0, 50.0, 55.0, 47.0, 36.0, 42.0, 39.0, 25.0, 20.0, 22.0, 13.0, 16.0, 12.0, 11.0, 9.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.322563886642456, -1.2858307361602783, -1.2490975856781006, -1.2123644351959229, -1.1756314039230347, -1.138898253440857, -1.1021651029586792, -1.0654319524765015, -1.0286988019943237, -0.991965651512146, -0.955232560634613, -0.9184994101524353, -0.8817662596702576, -0.8450331687927246, -0.8083000183105469, -0.7715668678283691, -0.7348337769508362, -0.6981006264686584, -0.6613675355911255, -0.6246343851089478, -0.58790123462677, -0.5511680841445923, -0.5144349932670593, -0.4777018427848816, -0.44096872210502625, -0.4042356014251709, -0.36750245094299316, -0.3307693302631378, -0.29403620958328247, -0.25730305910110474, -0.2205699384212494, -0.18383678793907166, -0.1471036672592163, -0.11037053167819977, -0.07363740354776382, -0.03690427541732788, -0.00017113983631134033, 0.0365619957447052, 0.07329511642456055, 0.11002826690673828, 0.14676138758659363, 0.18349452316761017, 0.2202276587486267, 0.25696077942848206, 0.2936939001083374, 0.33042705059051514, 0.3671601712703705, 0.4038933217525482, 0.44062644243240356, 0.4773595631122589, 0.5140926837921143, 0.550825834274292, 0.5875589847564697, 0.6242921352386475, 0.6610252261161804, 0.6977583765983582, 0.7344914674758911, 0.7712246179580688, 0.8079577088356018, 0.8446908593177795, 0.8814240097999573, 0.9181571006774902, 0.954890251159668, 0.9916234016418457, 1.0283565521240234]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 4.0, 11.0, 5.0, 15.0, 23.0, 46.0, 87.0, 131.0, 301.0, 789.0, 2342.0, 11015.0, 94360.0, 738519.0, 178771.0, 16914.0, 3411.0, 1041.0, 381.0, 179.0, 92.0, 42.0, 27.0, 13.0, 10.0, 4.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.630859375, -3.531707763671875, -3.43255615234375, -3.333404541015625, -3.2342529296875, -3.135101318359375, -3.03594970703125, -2.936798095703125, -2.837646484375, -2.738494873046875, -2.63934326171875, -2.540191650390625, -2.4410400390625, -2.341888427734375, -2.24273681640625, -2.143585205078125, -2.04443359375, -1.945281982421875, -1.84613037109375, -1.746978759765625, -1.6478271484375, -1.548675537109375, -1.44952392578125, -1.350372314453125, -1.251220703125, -1.152069091796875, -1.05291748046875, -0.953765869140625, -0.8546142578125, -0.755462646484375, -0.65631103515625, -0.557159423828125, -0.4580078125, -0.358856201171875, -0.25970458984375, -0.160552978515625, -0.0614013671875, 0.037750244140625, 0.13690185546875, 0.236053466796875, 0.335205078125, 0.434356689453125, 0.53350830078125, 0.632659912109375, 0.7318115234375, 0.830963134765625, 0.93011474609375, 1.029266357421875, 1.12841796875, 1.227569580078125, 1.32672119140625, 1.425872802734375, 1.5250244140625, 1.624176025390625, 1.72332763671875, 1.822479248046875, 1.921630859375, 2.020782470703125, 2.11993408203125, 2.219085693359375, 2.3182373046875, 2.417388916015625, 2.51654052734375, 2.615692138671875, 2.71484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 8.0, 1.0, 4.0, 6.0, 5.0, 10.0, 21.0, 18.0, 24.0, 27.0, 38.0, 53.0, 61.0, 79.0, 84.0, 89.0, 78.0, 67.0, 73.0, 55.0, 48.0, 43.0, 17.0, 26.0, 20.0, 16.0, 10.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.390625, -1.3539276123046875, -1.317230224609375, -1.2805328369140625, -1.24383544921875, -1.2071380615234375, -1.170440673828125, -1.1337432861328125, -1.0970458984375, -1.0603485107421875, -1.023651123046875, -0.9869537353515625, -0.95025634765625, -0.9135589599609375, -0.876861572265625, -0.8401641845703125, -0.803466796875, -0.7667694091796875, -0.730072021484375, -0.6933746337890625, -0.65667724609375, -0.6199798583984375, -0.583282470703125, -0.5465850830078125, -0.5098876953125, -0.4731903076171875, -0.436492919921875, -0.3997955322265625, -0.36309814453125, -0.3264007568359375, -0.289703369140625, -0.2530059814453125, -0.21630859375, -0.1796112060546875, -0.142913818359375, -0.1062164306640625, -0.06951904296875, -0.0328216552734375, 0.003875732421875, 0.0405731201171875, 0.0772705078125, 0.1139678955078125, 0.150665283203125, 0.1873626708984375, 0.22406005859375, 0.2607574462890625, 0.297454833984375, 0.3341522216796875, 0.370849609375, 0.4075469970703125, 0.444244384765625, 0.4809417724609375, 0.51763916015625, 0.5543365478515625, 0.591033935546875, 0.6277313232421875, 0.6644287109375, 0.7011260986328125, 0.737823486328125, 0.7745208740234375, 0.81121826171875, 0.8479156494140625, 0.884613037109375, 0.9213104248046875, 0.9580078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 13.0, 17.0, 27.0, 31.0, 64.0, 96.0, 153.0, 309.0, 565.0, 1699.0, 9291.0, 275303.0, 734775.0, 21884.0, 2618.0, 855.0, 336.0, 162.0, 108.0, 72.0, 43.0, 28.0, 25.0, 20.0, 8.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.263885498046875, -3.13909912109375, -3.014312744140625, -2.8895263671875, -2.764739990234375, -2.63995361328125, -2.515167236328125, -2.390380859375, -2.265594482421875, -2.14080810546875, -2.016021728515625, -1.8912353515625, -1.766448974609375, -1.64166259765625, -1.516876220703125, -1.39208984375, -1.267303466796875, -1.14251708984375, -1.017730712890625, -0.8929443359375, -0.768157958984375, -0.64337158203125, -0.518585205078125, -0.393798828125, -0.269012451171875, -0.14422607421875, -0.019439697265625, 0.1053466796875, 0.230133056640625, 0.35491943359375, 0.479705810546875, 0.6044921875, 0.729278564453125, 0.85406494140625, 0.978851318359375, 1.1036376953125, 1.228424072265625, 1.35321044921875, 1.477996826171875, 1.602783203125, 1.727569580078125, 1.85235595703125, 1.977142333984375, 2.1019287109375, 2.226715087890625, 2.35150146484375, 2.476287841796875, 2.60107421875, 2.725860595703125, 2.85064697265625, 2.975433349609375, 3.1002197265625, 3.225006103515625, 3.34979248046875, 3.474578857421875, 3.599365234375, 3.724151611328125, 3.84893798828125, 3.973724365234375, 4.0985107421875, 4.223297119140625, 4.34808349609375, 4.472869873046875, 4.59765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 6.0, 8.0, 9.0, 13.0, 8.0, 11.0, 16.0, 9.0, 19.0, 34.0, 27.0, 36.0, 31.0, 43.0, 43.0, 37.0, 48.0, 49.0, 38.0, 44.0, 48.0, 41.0, 50.0, 42.0, 49.0, 33.0, 32.0, 21.0, 34.0, 31.0, 13.0, 16.0, 12.0, 14.0, 7.0, 10.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.298828125, -3.19293212890625, -3.0870361328125, -2.98114013671875, -2.875244140625, -2.76934814453125, -2.6634521484375, -2.55755615234375, -2.45166015625, -2.34576416015625, -2.2398681640625, -2.13397216796875, -2.028076171875, -1.92218017578125, -1.8162841796875, -1.71038818359375, -1.6044921875, -1.49859619140625, -1.3927001953125, -1.28680419921875, -1.180908203125, -1.07501220703125, -0.9691162109375, -0.86322021484375, -0.75732421875, -0.65142822265625, -0.5455322265625, -0.43963623046875, -0.333740234375, -0.22784423828125, -0.1219482421875, -0.01605224609375, 0.08984375, 0.19573974609375, 0.3016357421875, 0.40753173828125, 0.513427734375, 0.61932373046875, 0.7252197265625, 0.83111572265625, 0.93701171875, 1.04290771484375, 1.1488037109375, 1.25469970703125, 1.360595703125, 1.46649169921875, 1.5723876953125, 1.67828369140625, 1.7841796875, 1.89007568359375, 1.9959716796875, 2.10186767578125, 2.207763671875, 2.31365966796875, 2.4195556640625, 2.52545166015625, 2.63134765625, 2.73724365234375, 2.8431396484375, 2.94903564453125, 3.054931640625, 3.16082763671875, 3.2667236328125, 3.37261962890625, 3.478515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 13.0, 18.0, 31.0, 54.0, 74.0, 131.0, 278.0, 766.0, 2824.0, 27913.0, 923585.0, 86576.0, 4461.0, 1006.0, 385.0, 190.0, 99.0, 56.0, 24.0, 13.0, 8.0, 7.0, 6.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.138671875, -2.071075439453125, -2.00347900390625, -1.935882568359375, -1.8682861328125, -1.800689697265625, -1.73309326171875, -1.665496826171875, -1.597900390625, -1.530303955078125, -1.46270751953125, -1.395111083984375, -1.3275146484375, -1.259918212890625, -1.19232177734375, -1.124725341796875, -1.05712890625, -0.989532470703125, -0.92193603515625, -0.854339599609375, -0.7867431640625, -0.719146728515625, -0.65155029296875, -0.583953857421875, -0.516357421875, -0.448760986328125, -0.38116455078125, -0.313568115234375, -0.2459716796875, -0.178375244140625, -0.11077880859375, -0.043182373046875, 0.0244140625, 0.092010498046875, 0.15960693359375, 0.227203369140625, 0.2947998046875, 0.362396240234375, 0.42999267578125, 0.497589111328125, 0.565185546875, 0.632781982421875, 0.70037841796875, 0.767974853515625, 0.8355712890625, 0.903167724609375, 0.97076416015625, 1.038360595703125, 1.10595703125, 1.173553466796875, 1.24114990234375, 1.308746337890625, 1.3763427734375, 1.443939208984375, 1.51153564453125, 1.579132080078125, 1.646728515625, 1.714324951171875, 1.78192138671875, 1.849517822265625, 1.9171142578125, 1.984710693359375, 2.05230712890625, 2.119903564453125, 2.1875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 8.0, 10.0, 15.0, 20.0, 40.0, 75.0, 110.0, 159.0, 159.0, 149.0, 91.0, 78.0, 43.0, 24.0, 11.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002090930938720703, -0.00020320340991020203, -0.00019731372594833374, -0.00019142404198646545, -0.00018553435802459717, -0.00017964467406272888, -0.0001737549901008606, -0.0001678653061389923, -0.00016197562217712402, -0.00015608593821525574, -0.00015019625425338745, -0.00014430657029151917, -0.00013841688632965088, -0.0001325272023677826, -0.0001266375184059143, -0.00012074783444404602, -0.00011485815048217773, -0.00010896846652030945, -0.00010307878255844116, -9.718909859657288e-05, -9.129941463470459e-05, -8.54097306728363e-05, -7.952004671096802e-05, -7.363036274909973e-05, -6.774067878723145e-05, -6.185099482536316e-05, -5.596131086349487e-05, -5.007162690162659e-05, -4.41819429397583e-05, -3.8292258977890015e-05, -3.240257501602173e-05, -2.6512891054153442e-05, -2.0623207092285156e-05, -1.473352313041687e-05, -8.843839168548584e-06, -2.954155206680298e-06, 2.9355287551879883e-06, 8.825212717056274e-06, 1.471489667892456e-05, 2.0604580640792847e-05, 2.6494264602661133e-05, 3.238394856452942e-05, 3.8273632526397705e-05, 4.416331648826599e-05, 5.005300045013428e-05, 5.5942684412002563e-05, 6.183236837387085e-05, 6.772205233573914e-05, 7.361173629760742e-05, 7.950142025947571e-05, 8.5391104221344e-05, 9.128078818321228e-05, 9.717047214508057e-05, 0.00010306015610694885, 0.00010894984006881714, 0.00011483952403068542, 0.00012072920799255371, 0.000126618891954422, 0.00013250857591629028, 0.00013839825987815857, 0.00014428794384002686, 0.00015017762780189514, 0.00015606731176376343, 0.00016195699572563171, 0.0001678466796875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 14.0, 24.0, 31.0, 54.0, 96.0, 136.0, 295.0, 629.0, 1752.0, 5947.0, 51530.0, 805263.0, 167308.0, 11323.0, 2428.0, 860.0, 396.0, 183.0, 95.0, 55.0, 39.0, 16.0, 17.0, 10.0, 9.0, 4.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3291015625, -1.2827606201171875, -1.236419677734375, -1.1900787353515625, -1.14373779296875, -1.0973968505859375, -1.051055908203125, -1.0047149658203125, -0.9583740234375, -0.9120330810546875, -0.865692138671875, -0.8193511962890625, -0.77301025390625, -0.7266693115234375, -0.680328369140625, -0.6339874267578125, -0.587646484375, -0.5413055419921875, -0.494964599609375, -0.4486236572265625, -0.40228271484375, -0.3559417724609375, -0.309600830078125, -0.2632598876953125, -0.2169189453125, -0.1705780029296875, -0.124237060546875, -0.0778961181640625, -0.03155517578125, 0.0147857666015625, 0.061126708984375, 0.1074676513671875, 0.15380859375, 0.2001495361328125, 0.246490478515625, 0.2928314208984375, 0.33917236328125, 0.3855133056640625, 0.431854248046875, 0.4781951904296875, 0.5245361328125, 0.5708770751953125, 0.617218017578125, 0.6635589599609375, 0.70989990234375, 0.7562408447265625, 0.802581787109375, 0.8489227294921875, 0.895263671875, 0.9416046142578125, 0.987945556640625, 1.0342864990234375, 1.08062744140625, 1.1269683837890625, 1.173309326171875, 1.2196502685546875, 1.2659912109375, 1.3123321533203125, 1.358673095703125, 1.4050140380859375, 1.45135498046875, 1.4976959228515625, 1.544036865234375, 1.5903778076171875, 1.63671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 13.0, 18.0, 20.0, 30.0, 85.0, 77.0, 115.0, 123.0, 140.0, 115.0, 91.0, 55.0, 33.0, 29.0, 21.0, 9.0, 6.0, 0.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.584808349609375, -1.53680419921875, -1.488800048828125, -1.4407958984375, -1.392791748046875, -1.34478759765625, -1.296783447265625, -1.248779296875, -1.200775146484375, -1.15277099609375, -1.104766845703125, -1.0567626953125, -1.008758544921875, -0.96075439453125, -0.912750244140625, -0.86474609375, -0.816741943359375, -0.76873779296875, -0.720733642578125, -0.6727294921875, -0.624725341796875, -0.57672119140625, -0.528717041015625, -0.480712890625, -0.432708740234375, -0.38470458984375, -0.336700439453125, -0.2886962890625, -0.240692138671875, -0.19268798828125, -0.144683837890625, -0.0966796875, -0.048675537109375, -0.00067138671875, 0.047332763671875, 0.0953369140625, 0.143341064453125, 0.19134521484375, 0.239349365234375, 0.287353515625, 0.335357666015625, 0.38336181640625, 0.431365966796875, 0.4793701171875, 0.527374267578125, 0.57537841796875, 0.623382568359375, 0.67138671875, 0.719390869140625, 0.76739501953125, 0.815399169921875, 0.8634033203125, 0.911407470703125, 0.95941162109375, 1.007415771484375, 1.055419921875, 1.103424072265625, 1.15142822265625, 1.199432373046875, 1.2474365234375, 1.295440673828125, 1.34344482421875, 1.391448974609375, 1.439453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 12.0, 77.0, 519.0, 365.0, 32.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.524555206298828, -20.250925064086914, -17.977294921875, -15.703664779663086, -13.430034637451172, -11.156404495239258, -8.882774353027344, -6.60914421081543, -4.335514068603516, -2.0618839263916016, 0.2117462158203125, 2.4853763580322266, 4.759006500244141, 7.032636642456055, 9.306266784667969, 11.579896926879883, 13.853527069091797, 16.12715721130371, 18.400787353515625, 20.67441749572754, 22.948047637939453, 25.221677780151367, 27.49530792236328, 29.768938064575195, 32.04256820678711, 34.316200256347656, 36.58982849121094, 38.86345672607422, 41.137088775634766, 43.41072082519531, 45.684349060058594, 47.957977294921875, 50.23161315917969, 52.50524139404297, 54.778873443603516, 57.05250549316406, 59.326133728027344, 61.599761962890625, 63.87339401245117, 66.14702606201172, 68.420654296875, 70.69428253173828, 72.96791076660156, 75.24154663085938, 77.51517486572266, 79.78880310058594, 82.06243896484375, 84.33606719970703, 86.60969543457031, 88.8833236694336, 91.15695190429688, 93.43058776855469, 95.70421600341797, 97.97784423828125, 100.25148010253906, 102.52510833740234, 104.79873657226562, 107.0723648071289, 109.34599304199219, 111.61962890625, 113.89325714111328, 116.16688537597656, 118.44052124023438, 120.71414947509766, 122.98777770996094]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 7.0, 10.0, 22.0, 26.0, 16.0, 21.0, 21.0, 42.0, 54.0, 51.0, 61.0, 55.0, 69.0, 56.0, 62.0, 65.0, 63.0, 41.0, 39.0, 36.0, 31.0, 30.0, 31.0, 16.0, 11.0, 23.0, 8.0, 11.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.545770645141602, -12.991360664367676, -12.43695068359375, -11.882540702819824, -11.328130722045898, -10.773721694946289, -10.219311714172363, -9.664901733398438, -9.110491752624512, -8.556081771850586, -8.00167179107666, -7.447262287139893, -6.892852306365967, -6.338442325592041, -5.784032821655273, -5.229622840881348, -4.675212860107422, -4.120802879333496, -3.5663931369781494, -3.0119833946228027, -2.457573413848877, -1.9031634330749512, -1.3487536907196045, -0.7943439483642578, -0.23993396759033203, 0.3144758939743042, 0.8688857555389404, 1.4232956171035767, 1.977705478668213, 2.5321154594421387, 3.0865252017974854, 3.640934944152832, 4.195343017578125, 4.749752998352051, 5.304162979125977, 5.858572483062744, 6.41298246383667, 6.967392444610596, 7.521801948547363, 8.076211929321289, 8.630621910095215, 9.18503189086914, 9.739441871643066, 10.293851852416992, 10.848260879516602, 11.402671813964844, 11.957080841064453, 12.511490821838379, 13.065900802612305, 13.62031078338623, 14.174720764160156, 14.729130744934082, 15.283540725708008, 15.837949752807617, 16.39236068725586, 16.94676971435547, 17.501178741455078, 18.055587768554688, 18.60999870300293, 19.16440773010254, 19.71881866455078, 20.27322769165039, 20.827638626098633, 21.382047653198242, 21.936458587646484]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 7.0, 10.0, 17.0, 18.0, 27.0, 39.0, 68.0, 105.0, 166.0, 305.0, 449.0, 896.0, 1721.0, 4053.0, 12532.0, 62663.0, 3610412.0, 448723.0, 36775.0, 8850.0, 3195.0, 1476.0, 737.0, 417.0, 210.0, 131.0, 84.0, 55.0, 40.0, 27.0, 27.0, 7.0, 7.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.6441497802734375, -1.589080810546875, -1.5340118408203125, -1.47894287109375, -1.4238739013671875, -1.368804931640625, -1.3137359619140625, -1.2586669921875, -1.2035980224609375, -1.148529052734375, -1.0934600830078125, -1.03839111328125, -0.9833221435546875, -0.928253173828125, -0.8731842041015625, -0.818115234375, -0.7630462646484375, -0.707977294921875, -0.6529083251953125, -0.59783935546875, -0.5427703857421875, -0.487701416015625, -0.4326324462890625, -0.3775634765625, -0.3224945068359375, -0.267425537109375, -0.2123565673828125, -0.15728759765625, -0.1022186279296875, -0.047149658203125, 0.0079193115234375, 0.06298828125, 0.1180572509765625, 0.173126220703125, 0.2281951904296875, 0.28326416015625, 0.3383331298828125, 0.393402099609375, 0.4484710693359375, 0.5035400390625, 0.5586090087890625, 0.613677978515625, 0.6687469482421875, 0.72381591796875, 0.7788848876953125, 0.833953857421875, 0.8890228271484375, 0.944091796875, 0.9991607666015625, 1.054229736328125, 1.1092987060546875, 1.16436767578125, 1.2194366455078125, 1.274505615234375, 1.3295745849609375, 1.3846435546875, 1.4397125244140625, 1.494781494140625, 1.5498504638671875, 1.60491943359375, 1.6599884033203125, 1.715057373046875, 1.7701263427734375, 1.8251953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 7.0, 14.0, 17.0, 24.0, 29.0, 40.0, 35.0, 73.0, 59.0, 84.0, 86.0, 72.0, 74.0, 73.0, 63.0, 53.0, 28.0, 42.0, 21.0, 26.0, 18.0, 13.0, 12.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.003997802734375, -0.97088623046875, -0.937774658203125, -0.9046630859375, -0.871551513671875, -0.83843994140625, -0.805328369140625, -0.772216796875, -0.739105224609375, -0.70599365234375, -0.672882080078125, -0.6397705078125, -0.606658935546875, -0.57354736328125, -0.540435791015625, -0.50732421875, -0.474212646484375, -0.44110107421875, -0.407989501953125, -0.3748779296875, -0.341766357421875, -0.30865478515625, -0.275543212890625, -0.242431640625, -0.209320068359375, -0.17620849609375, -0.143096923828125, -0.1099853515625, -0.076873779296875, -0.04376220703125, -0.010650634765625, 0.0224609375, 0.055572509765625, 0.08868408203125, 0.121795654296875, 0.1549072265625, 0.188018798828125, 0.22113037109375, 0.254241943359375, 0.287353515625, 0.320465087890625, 0.35357666015625, 0.386688232421875, 0.4197998046875, 0.452911376953125, 0.48602294921875, 0.519134521484375, 0.55224609375, 0.585357666015625, 0.61846923828125, 0.651580810546875, 0.6846923828125, 0.717803955078125, 0.75091552734375, 0.784027099609375, 0.817138671875, 0.850250244140625, 0.88336181640625, 0.916473388671875, 0.9495849609375, 0.982696533203125, 1.01580810546875, 1.048919677734375, 1.08203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 9.0, 12.0, 26.0, 31.0, 55.0, 87.0, 153.0, 297.0, 458.0, 1049.0, 1903.0, 4323.0, 10937.0, 35063.0, 184502.0, 3572591.0, 310045.0, 48790.0, 13958.0, 5170.0, 2372.0, 1101.0, 574.0, 298.0, 197.0, 104.0, 63.0, 36.0, 25.0, 12.0, 7.0, 12.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.0939178466796875, -1.056976318359375, -1.0200347900390625, -0.98309326171875, -0.9461517333984375, -0.909210205078125, -0.8722686767578125, -0.8353271484375, -0.7983856201171875, -0.761444091796875, -0.7245025634765625, -0.68756103515625, -0.6506195068359375, -0.613677978515625, -0.5767364501953125, -0.539794921875, -0.5028533935546875, -0.465911865234375, -0.4289703369140625, -0.39202880859375, -0.3550872802734375, -0.318145751953125, -0.2812042236328125, -0.2442626953125, -0.2073211669921875, -0.170379638671875, -0.1334381103515625, -0.09649658203125, -0.0595550537109375, -0.022613525390625, 0.0143280029296875, 0.05126953125, 0.0882110595703125, 0.125152587890625, 0.1620941162109375, 0.19903564453125, 0.2359771728515625, 0.272918701171875, 0.3098602294921875, 0.3468017578125, 0.3837432861328125, 0.420684814453125, 0.4576263427734375, 0.49456787109375, 0.5315093994140625, 0.568450927734375, 0.6053924560546875, 0.642333984375, 0.6792755126953125, 0.716217041015625, 0.7531585693359375, 0.79010009765625, 0.8270416259765625, 0.863983154296875, 0.9009246826171875, 0.9378662109375, 0.9748077392578125, 1.011749267578125, 1.0486907958984375, 1.08563232421875, 1.1225738525390625, 1.159515380859375, 1.1964569091796875, 1.2333984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 10.0, 11.0, 16.0, 30.0, 38.0, 54.0, 86.0, 148.0, 288.0, 1735.0, 955.0, 278.0, 132.0, 99.0, 49.0, 35.0, 27.0, 25.0, 7.0, 6.0, 8.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40380859375, -0.3862152099609375, -0.368621826171875, -0.3510284423828125, -0.33343505859375, -0.3158416748046875, -0.298248291015625, -0.2806549072265625, -0.2630615234375, -0.2454681396484375, -0.227874755859375, -0.2102813720703125, -0.19268798828125, -0.1750946044921875, -0.157501220703125, -0.1399078369140625, -0.122314453125, -0.1047210693359375, -0.087127685546875, -0.0695343017578125, -0.05194091796875, -0.0343475341796875, -0.016754150390625, 0.0008392333984375, 0.0184326171875, 0.0360260009765625, 0.053619384765625, 0.0712127685546875, 0.08880615234375, 0.1063995361328125, 0.123992919921875, 0.1415863037109375, 0.1591796875, 0.1767730712890625, 0.194366455078125, 0.2119598388671875, 0.22955322265625, 0.2471466064453125, 0.264739990234375, 0.2823333740234375, 0.2999267578125, 0.3175201416015625, 0.335113525390625, 0.3527069091796875, 0.37030029296875, 0.3878936767578125, 0.405487060546875, 0.4230804443359375, 0.440673828125, 0.4582672119140625, 0.475860595703125, 0.4934539794921875, 0.51104736328125, 0.5286407470703125, 0.546234130859375, 0.5638275146484375, 0.5814208984375, 0.5990142822265625, 0.616607666015625, 0.6342010498046875, 0.65179443359375, 0.6693878173828125, 0.686981201171875, 0.7045745849609375, 0.72216796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 7.0, 11.0, 16.0, 33.0, 51.0, 76.0, 95.0, 127.0, 138.0, 118.0, 97.0, 81.0, 55.0, 31.0, 27.0, 13.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822126865386963, -2.7299299240112305, -2.637733221054077, -2.545536518096924, -2.4533395767211914, -2.361142635345459, -2.2689459323883057, -2.1767492294311523, -2.08455228805542, -1.992355465888977, -1.9001586437225342, -1.8079618215560913, -1.7157649993896484, -1.6235681772232056, -1.5313713550567627, -1.4391745328903198, -1.346977710723877, -1.254780888557434, -1.1625840663909912, -1.0703872442245483, -0.9781904220581055, -0.8859935998916626, -0.7937967777252197, -0.7015999555587769, -0.609403133392334, -0.5172063112258911, -0.42500948905944824, -0.33281266689300537, -0.2406158447265625, -0.14841902256011963, -0.05622220039367676, 0.03597462177276611, 0.12817144393920898, 0.22036826610565186, 0.3125650882720947, 0.4047619104385376, 0.49695873260498047, 0.5891555547714233, 0.6813523769378662, 0.7735491991043091, 0.865746021270752, 0.9579428434371948, 1.0501396656036377, 1.1423364877700806, 1.2345333099365234, 1.3267301321029663, 1.4189269542694092, 1.511123776435852, 1.603320598602295, 1.6955174207687378, 1.7877142429351807, 1.8799110651016235, 1.9721078872680664, 2.064304828643799, 2.156501531600952, 2.2486982345581055, 2.340895175933838, 2.4330921173095703, 2.5252888202667236, 2.617485523223877, 2.7096824645996094, 2.801879405975342, 2.894076108932495, 2.9862728118896484, 3.078469753265381]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 4.0, 5.0, 5.0, 6.0, 18.0, 13.0, 15.0, 20.0, 20.0, 32.0, 38.0, 32.0, 39.0, 49.0, 48.0, 45.0, 55.0, 57.0, 49.0, 54.0, 58.0, 36.0, 47.0, 44.0, 41.0, 30.0, 27.0, 18.0, 11.0, 16.0, 15.0, 11.0, 10.0, 6.0, 12.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.2364330291748047, -2.172072410583496, -2.1077117919921875, -2.043351411819458, -1.9789907932281494, -1.9146301746368408, -1.8502695560455322, -1.7859089374542236, -1.7215484380722046, -1.657187819480896, -1.592827320098877, -1.5284667015075684, -1.4641060829162598, -1.3997455835342407, -1.3353849649429321, -1.271024465560913, -1.2066638469696045, -1.142303228378296, -1.0779427289962769, -1.0135821104049683, -0.9492215514183044, -0.8848609924316406, -0.820500373840332, -0.7561398148536682, -0.6917792558670044, -0.6274186968803406, -0.5630581378936768, -0.49869751930236816, -0.43433696031570435, -0.3699764013290405, -0.3056158125400543, -0.24125522375106812, -0.1768946647644043, -0.11253409087657928, -0.04817351698875427, 0.01618705689907074, 0.08054763078689575, 0.14490818977355957, 0.20926877856254578, 0.273629367351532, 0.3379899263381958, 0.4023504853248596, 0.4667110741138458, 0.531071662902832, 0.5954322218894958, 0.6597927808761597, 0.7241533994674683, 0.7885139584541321, 0.8528745174407959, 0.9172350764274597, 0.9815956354141235, 1.0459562540054321, 1.1103167533874512, 1.1746773719787598, 1.2390379905700684, 1.303398609161377, 1.367759108543396, 1.4321197271347046, 1.4964802265167236, 1.5608408451080322, 1.6252014636993408, 1.6895619630813599, 1.7539225816726685, 1.8182830810546875, 1.882643699645996]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 16.0, 16.0, 42.0, 84.0, 172.0, 471.0, 1796.0, 11020.0, 159562.0, 792191.0, 74647.0, 6623.0, 1241.0, 348.0, 156.0, 56.0, 38.0, 16.0, 11.0, 8.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.835845947265625, -2.72833251953125, -2.620819091796875, -2.5133056640625, -2.405792236328125, -2.29827880859375, -2.190765380859375, -2.083251953125, -1.975738525390625, -1.86822509765625, -1.760711669921875, -1.6531982421875, -1.545684814453125, -1.43817138671875, -1.330657958984375, -1.22314453125, -1.115631103515625, -1.00811767578125, -0.900604248046875, -0.7930908203125, -0.685577392578125, -0.57806396484375, -0.470550537109375, -0.363037109375, -0.255523681640625, -0.14801025390625, -0.040496826171875, 0.0670166015625, 0.174530029296875, 0.28204345703125, 0.389556884765625, 0.4970703125, 0.604583740234375, 0.71209716796875, 0.819610595703125, 0.9271240234375, 1.034637451171875, 1.14215087890625, 1.249664306640625, 1.357177734375, 1.464691162109375, 1.57220458984375, 1.679718017578125, 1.7872314453125, 1.894744873046875, 2.00225830078125, 2.109771728515625, 2.21728515625, 2.324798583984375, 2.43231201171875, 2.539825439453125, 2.6473388671875, 2.754852294921875, 2.86236572265625, 2.969879150390625, 3.077392578125, 3.184906005859375, 3.29241943359375, 3.399932861328125, 3.5074462890625, 3.614959716796875, 3.72247314453125, 3.829986572265625, 3.9375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 10.0, 3.0, 12.0, 6.0, 13.0, 13.0, 22.0, 26.0, 26.0, 34.0, 38.0, 51.0, 58.0, 67.0, 68.0, 72.0, 61.0, 67.0, 59.0, 66.0, 36.0, 30.0, 26.0, 28.0, 33.0, 16.0, 18.0, 13.0, 9.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.966796875, -0.9382095336914062, -0.9096221923828125, -0.8810348510742188, -0.852447509765625, -0.8238601684570312, -0.7952728271484375, -0.7666854858398438, -0.73809814453125, -0.7095108032226562, -0.6809234619140625, -0.6523361206054688, -0.623748779296875, -0.5951614379882812, -0.5665740966796875, -0.5379867553710938, -0.5093994140625, -0.48081207275390625, -0.4522247314453125, -0.42363739013671875, -0.395050048828125, -0.36646270751953125, -0.3378753662109375, -0.30928802490234375, -0.28070068359375, -0.25211334228515625, -0.2235260009765625, -0.19493865966796875, -0.166351318359375, -0.13776397705078125, -0.1091766357421875, -0.08058929443359375, -0.052001953125, -0.02341461181640625, 0.0051727294921875, 0.03376007080078125, 0.062347412109375, 0.09093475341796875, 0.1195220947265625, 0.14810943603515625, 0.17669677734375, 0.20528411865234375, 0.2338714599609375, 0.26245880126953125, 0.291046142578125, 0.31963348388671875, 0.3482208251953125, 0.37680816650390625, 0.4053955078125, 0.43398284912109375, 0.4625701904296875, 0.49115753173828125, 0.519744873046875, 0.5483322143554688, 0.5769195556640625, 0.6055068969726562, 0.63409423828125, 0.6626815795898438, 0.6912689208984375, 0.7198562622070312, 0.748443603515625, 0.7770309448242188, 0.8056182861328125, 0.8342056274414062, 0.86279296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 4.0, 6.0, 10.0, 10.0, 21.0, 30.0, 41.0, 52.0, 127.0, 180.0, 417.0, 861.0, 2532.0, 14022.0, 321077.0, 677931.0, 25437.0, 3575.0, 1166.0, 484.0, 214.0, 123.0, 80.0, 66.0, 28.0, 17.0, 10.0, 9.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.703125, -3.5946044921875, -3.486083984375, -3.3775634765625, -3.26904296875, -3.1605224609375, -3.052001953125, -2.9434814453125, -2.8349609375, -2.7264404296875, -2.617919921875, -2.5093994140625, -2.40087890625, -2.2923583984375, -2.183837890625, -2.0753173828125, -1.966796875, -1.8582763671875, -1.749755859375, -1.6412353515625, -1.53271484375, -1.4241943359375, -1.315673828125, -1.2071533203125, -1.0986328125, -0.9901123046875, -0.881591796875, -0.7730712890625, -0.66455078125, -0.5560302734375, -0.447509765625, -0.3389892578125, -0.23046875, -0.1219482421875, -0.013427734375, 0.0950927734375, 0.20361328125, 0.3121337890625, 0.420654296875, 0.5291748046875, 0.6376953125, 0.7462158203125, 0.854736328125, 0.9632568359375, 1.07177734375, 1.1802978515625, 1.288818359375, 1.3973388671875, 1.505859375, 1.6143798828125, 1.722900390625, 1.8314208984375, 1.93994140625, 2.0484619140625, 2.156982421875, 2.2655029296875, 2.3740234375, 2.4825439453125, 2.591064453125, 2.6995849609375, 2.80810546875, 2.9166259765625, 3.025146484375, 3.1336669921875, 3.2421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 11.0, 14.0, 16.0, 15.0, 23.0, 24.0, 13.0, 27.0, 36.0, 42.0, 34.0, 38.0, 39.0, 41.0, 44.0, 40.0, 47.0, 37.0, 38.0, 46.0, 46.0, 31.0, 38.0, 30.0, 25.0, 21.0, 29.0, 25.0, 17.0, 12.0, 13.0, 8.0, 6.0, 6.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7265625, -2.6446533203125, -2.562744140625, -2.4808349609375, -2.39892578125, -2.3170166015625, -2.235107421875, -2.1531982421875, -2.0712890625, -1.9893798828125, -1.907470703125, -1.8255615234375, -1.74365234375, -1.6617431640625, -1.579833984375, -1.4979248046875, -1.416015625, -1.3341064453125, -1.252197265625, -1.1702880859375, -1.08837890625, -1.0064697265625, -0.924560546875, -0.8426513671875, -0.7607421875, -0.6788330078125, -0.596923828125, -0.5150146484375, -0.43310546875, -0.3511962890625, -0.269287109375, -0.1873779296875, -0.10546875, -0.0235595703125, 0.058349609375, 0.1402587890625, 0.22216796875, 0.3040771484375, 0.385986328125, 0.4678955078125, 0.5498046875, 0.6317138671875, 0.713623046875, 0.7955322265625, 0.87744140625, 0.9593505859375, 1.041259765625, 1.1231689453125, 1.205078125, 1.2869873046875, 1.368896484375, 1.4508056640625, 1.53271484375, 1.6146240234375, 1.696533203125, 1.7784423828125, 1.8603515625, 1.9422607421875, 2.024169921875, 2.1060791015625, 2.18798828125, 2.2698974609375, 2.351806640625, 2.4337158203125, 2.515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 13.0, 23.0, 31.0, 101.0, 205.0, 572.0, 2166.0, 19961.0, 802985.0, 213734.0, 6881.0, 1207.0, 345.0, 150.0, 88.0, 38.0, 19.0, 10.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4870681762695312, -1.4487457275390625, -1.4104232788085938, -1.372100830078125, -1.3337783813476562, -1.2954559326171875, -1.2571334838867188, -1.21881103515625, -1.1804885864257812, -1.1421661376953125, -1.1038436889648438, -1.065521240234375, -1.0271987915039062, -0.9888763427734375, -0.9505538940429688, -0.9122314453125, -0.8739089965820312, -0.8355865478515625, -0.7972640991210938, -0.758941650390625, -0.7206192016601562, -0.6822967529296875, -0.6439743041992188, -0.60565185546875, -0.5673294067382812, -0.5290069580078125, -0.49068450927734375, -0.452362060546875, -0.41403961181640625, -0.3757171630859375, -0.33739471435546875, -0.299072265625, -0.26074981689453125, -0.2224273681640625, -0.18410491943359375, -0.145782470703125, -0.10746002197265625, -0.0691375732421875, -0.03081512451171875, 0.00750732421875, 0.04582977294921875, 0.0841522216796875, 0.12247467041015625, 0.160797119140625, 0.19911956787109375, 0.2374420166015625, 0.27576446533203125, 0.3140869140625, 0.35240936279296875, 0.3907318115234375, 0.42905426025390625, 0.467376708984375, 0.5056991577148438, 0.5440216064453125, 0.5823440551757812, 0.62066650390625, 0.6589889526367188, 0.6973114013671875, 0.7356338500976562, 0.773956298828125, 0.8122787475585938, 0.8506011962890625, 0.8889236450195312, 0.92724609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 6.0, 4.0, 15.0, 6.0, 9.0, 13.0, 24.0, 17.0, 25.0, 31.0, 35.0, 44.0, 46.0, 66.0, 80.0, 93.0, 77.0, 65.0, 65.0, 38.0, 52.0, 31.0, 34.0, 18.0, 28.0, 15.0, 11.0, 9.0, 9.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.273124694824219e-05, -8.041225373744965e-05, -7.80932605266571e-05, -7.577426731586456e-05, -7.345527410507202e-05, -7.113628089427948e-05, -6.881728768348694e-05, -6.64982944726944e-05, -6.417930126190186e-05, -6.186030805110931e-05, -5.954131484031677e-05, -5.722232162952423e-05, -5.490332841873169e-05, -5.258433520793915e-05, -5.0265341997146606e-05, -4.7946348786354065e-05, -4.5627355575561523e-05, -4.330836236476898e-05, -4.098936915397644e-05, -3.86703759431839e-05, -3.635138273239136e-05, -3.4032389521598816e-05, -3.1713396310806274e-05, -2.9394403100013733e-05, -2.707540988922119e-05, -2.475641667842865e-05, -2.243742346763611e-05, -2.0118430256843567e-05, -1.7799437046051025e-05, -1.5480443835258484e-05, -1.3161450624465942e-05, -1.0842457413673401e-05, -8.52346420288086e-06, -6.204470992088318e-06, -3.885477781295776e-06, -1.5664845705032349e-06, 7.525086402893066e-07, 3.071501851081848e-06, 5.39049506187439e-06, 7.709488272666931e-06, 1.0028481483459473e-05, 1.2347474694252014e-05, 1.4666467905044556e-05, 1.6985461115837097e-05, 1.930445432662964e-05, 2.162344753742218e-05, 2.394244074821472e-05, 2.6261433959007263e-05, 2.8580427169799805e-05, 3.0899420380592346e-05, 3.321841359138489e-05, 3.553740680217743e-05, 3.785640001296997e-05, 4.017539322376251e-05, 4.2494386434555054e-05, 4.4813379645347595e-05, 4.713237285614014e-05, 4.945136606693268e-05, 5.177035927772522e-05, 5.408935248851776e-05, 5.64083456993103e-05, 5.8727338910102844e-05, 6.104633212089539e-05, 6.336532533168793e-05, 6.568431854248047e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 11.0, 15.0, 26.0, 31.0, 69.0, 106.0, 221.0, 488.0, 1252.0, 4332.0, 35015.0, 737976.0, 252342.0, 12548.0, 2540.0, 844.0, 352.0, 138.0, 82.0, 46.0, 39.0, 21.0, 13.0, 4.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0489578247070312, -1.0188140869140625, -0.9886703491210938, -0.958526611328125, -0.9283828735351562, -0.8982391357421875, -0.8680953979492188, -0.83795166015625, -0.8078079223632812, -0.7776641845703125, -0.7475204467773438, -0.717376708984375, -0.6872329711914062, -0.6570892333984375, -0.6269454956054688, -0.5968017578125, -0.5666580200195312, -0.5365142822265625, -0.5063705444335938, -0.476226806640625, -0.44608306884765625, -0.4159393310546875, -0.38579559326171875, -0.35565185546875, -0.32550811767578125, -0.2953643798828125, -0.26522064208984375, -0.235076904296875, -0.20493316650390625, -0.1747894287109375, -0.14464569091796875, -0.114501953125, -0.08435821533203125, -0.0542144775390625, -0.02407073974609375, 0.006072998046875, 0.03621673583984375, 0.0663604736328125, 0.09650421142578125, 0.12664794921875, 0.15679168701171875, 0.1869354248046875, 0.21707916259765625, 0.247222900390625, 0.27736663818359375, 0.3075103759765625, 0.33765411376953125, 0.3677978515625, 0.39794158935546875, 0.4280853271484375, 0.45822906494140625, 0.488372802734375, 0.5185165405273438, 0.5486602783203125, 0.5788040161132812, 0.60894775390625, 0.6390914916992188, 0.6692352294921875, 0.6993789672851562, 0.729522705078125, 0.7596664428710938, 0.7898101806640625, 0.8199539184570312, 0.85009765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 11.0, 4.0, 14.0, 21.0, 32.0, 39.0, 48.0, 47.0, 77.0, 108.0, 108.0, 102.0, 98.0, 66.0, 65.0, 46.0, 22.0, 20.0, 20.0, 12.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.6812744140625, -0.657470703125, -0.6336669921875, -0.60986328125, -0.5860595703125, -0.562255859375, -0.5384521484375, -0.5146484375, -0.4908447265625, -0.467041015625, -0.4432373046875, -0.41943359375, -0.3956298828125, -0.371826171875, -0.3480224609375, -0.32421875, -0.3004150390625, -0.276611328125, -0.2528076171875, -0.22900390625, -0.2052001953125, -0.181396484375, -0.1575927734375, -0.1337890625, -0.1099853515625, -0.086181640625, -0.0623779296875, -0.03857421875, -0.0147705078125, 0.009033203125, 0.0328369140625, 0.056640625, 0.0804443359375, 0.104248046875, 0.1280517578125, 0.15185546875, 0.1756591796875, 0.199462890625, 0.2232666015625, 0.2470703125, 0.2708740234375, 0.294677734375, 0.3184814453125, 0.34228515625, 0.3660888671875, 0.389892578125, 0.4136962890625, 0.4375, 0.4613037109375, 0.485107421875, 0.5089111328125, 0.53271484375, 0.5565185546875, 0.580322265625, 0.6041259765625, 0.6279296875, 0.6517333984375, 0.675537109375, 0.6993408203125, 0.72314453125, 0.7469482421875, 0.770751953125, 0.7945556640625, 0.818359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 18.0, 29.0, 53.0, 103.0, 150.0, 204.0, 188.0, 119.0, 71.0, 26.0, 14.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.43756866455078, -15.863180160522461, -15.28879165649414, -14.71440315246582, -14.1400146484375, -13.56562614440918, -12.991238594055176, -12.416850090026855, -11.842461585998535, -11.268073081970215, -10.693684577941895, -10.119296073913574, -9.54490852355957, -8.97052001953125, -8.39613151550293, -7.821743011474609, -7.247354507446289, -6.672966003417969, -6.098577499389648, -5.524189472198486, -4.949800968170166, -4.375412464141846, -3.8010241985321045, -3.2266359329223633, -2.652247428894043, -2.0778589248657227, -1.5034706592559814, -0.9290822744369507, -0.3546938896179199, 0.2196946144104004, 0.7940828800201416, 1.3684711456298828, 1.942861557006836, 2.5172500610351562, 3.0916383266448975, 3.6660265922546387, 4.240415096282959, 4.814803600311279, 5.389191627502441, 5.963580131530762, 6.537968635559082, 7.112357139587402, 7.686745643615723, 8.261134147644043, 8.835521697998047, 9.409910202026367, 9.984298706054688, 10.558687210083008, 11.133075714111328, 11.707464218139648, 12.281852722167969, 12.856241226196289, 13.43062973022461, 14.00501823425293, 14.579405784606934, 15.153794288635254, 15.728182792663574, 16.302570343017578, 16.8769588470459, 17.45134735107422, 18.02573585510254, 18.60012435913086, 19.17451286315918, 19.7489013671875, 20.32328987121582]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 8.0, 15.0, 9.0, 20.0, 13.0, 23.0, 34.0, 25.0, 46.0, 32.0, 48.0, 45.0, 49.0, 59.0, 52.0, 44.0, 63.0, 54.0, 51.0, 41.0, 39.0, 42.0, 28.0, 28.0, 21.0, 9.0, 19.0, 14.0, 8.0, 10.0, 8.0, 3.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.533100128173828, -15.084814071655273, -14.636527061462402, -14.188241004943848, -13.739953994750977, -13.291667938232422, -12.843381881713867, -12.395095825195312, -11.946808815002441, -11.498522758483887, -11.050235748291016, -10.601949691772461, -10.153663635253906, -9.705376625061035, -9.25709056854248, -8.80880355834961, -8.360517501831055, -7.912230968475342, -7.463944435119629, -7.015658378601074, -6.567371845245361, -6.119085311889648, -5.670799255371094, -5.222512722015381, -4.774226188659668, -4.325939655303955, -3.8776533603668213, -3.4293670654296875, -2.9810805320739746, -2.5327939987182617, -2.084507703781128, -1.6362214088439941, -1.1879348754882812, -0.7396484613418579, -0.29136204719543457, 0.15692436695098877, 0.6052107810974121, 1.053497314453125, 1.5017836093902588, 1.9500699043273926, 2.3983564376831055, 2.8466429710388184, 3.294929265975952, 3.743215560913086, 4.191502094268799, 4.639788627624512, 5.088074684143066, 5.536361217498779, 5.984647750854492, 6.432934284210205, 6.881220817565918, 7.329506874084473, 7.7777934074401855, 8.226079940795898, 8.674365997314453, 9.122652053833008, 9.570939064025879, 10.019225120544434, 10.467512130737305, 10.91579818725586, 11.364084243774414, 11.812371253967285, 12.26065731048584, 12.708944320678711, 13.157230377197266]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 8.0, 12.0, 8.0, 19.0, 28.0, 54.0, 84.0, 163.0, 468.0, 1732.0, 12918.0, 598551.0, 3540691.0, 35028.0, 3305.0, 715.0, 238.0, 100.0, 54.0, 35.0, 15.0, 17.0, 12.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.233245849609375, -2.15399169921875, -2.074737548828125, -1.9954833984375, -1.916229248046875, -1.83697509765625, -1.757720947265625, -1.678466796875, -1.599212646484375, -1.51995849609375, -1.440704345703125, -1.3614501953125, -1.282196044921875, -1.20294189453125, -1.123687744140625, -1.04443359375, -0.965179443359375, -0.88592529296875, -0.806671142578125, -0.7274169921875, -0.648162841796875, -0.56890869140625, -0.489654541015625, -0.410400390625, -0.331146240234375, -0.25189208984375, -0.172637939453125, -0.0933837890625, -0.014129638671875, 0.06512451171875, 0.144378662109375, 0.2236328125, 0.302886962890625, 0.38214111328125, 0.461395263671875, 0.5406494140625, 0.619903564453125, 0.69915771484375, 0.778411865234375, 0.857666015625, 0.936920166015625, 1.01617431640625, 1.095428466796875, 1.1746826171875, 1.253936767578125, 1.33319091796875, 1.412445068359375, 1.49169921875, 1.570953369140625, 1.65020751953125, 1.729461669921875, 1.8087158203125, 1.887969970703125, 1.96722412109375, 2.046478271484375, 2.125732421875, 2.204986572265625, 2.28424072265625, 2.363494873046875, 2.4427490234375, 2.522003173828125, 2.60125732421875, 2.680511474609375, 2.759765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 10.0, 15.0, 14.0, 23.0, 39.0, 49.0, 52.0, 55.0, 72.0, 72.0, 62.0, 86.0, 65.0, 62.0, 66.0, 39.0, 59.0, 34.0, 26.0, 20.0, 29.0, 11.0, 13.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.96728515625, -0.9398193359375, -0.912353515625, -0.8848876953125, -0.857421875, -0.8299560546875, -0.802490234375, -0.7750244140625, -0.74755859375, -0.7200927734375, -0.692626953125, -0.6651611328125, -0.6376953125, -0.6102294921875, -0.582763671875, -0.5552978515625, -0.52783203125, -0.5003662109375, -0.472900390625, -0.4454345703125, -0.41796875, -0.3905029296875, -0.363037109375, -0.3355712890625, -0.30810546875, -0.2806396484375, -0.253173828125, -0.2257080078125, -0.1982421875, -0.1707763671875, -0.143310546875, -0.1158447265625, -0.08837890625, -0.0609130859375, -0.033447265625, -0.0059814453125, 0.021484375, 0.0489501953125, 0.076416015625, 0.1038818359375, 0.13134765625, 0.1588134765625, 0.186279296875, 0.2137451171875, 0.2412109375, 0.2686767578125, 0.296142578125, 0.3236083984375, 0.35107421875, 0.3785400390625, 0.406005859375, 0.4334716796875, 0.4609375, 0.4884033203125, 0.515869140625, 0.5433349609375, 0.57080078125, 0.5982666015625, 0.625732421875, 0.6531982421875, 0.6806640625, 0.7081298828125, 0.735595703125, 0.7630615234375, 0.79052734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 10.0, 12.0, 22.0, 29.0, 31.0, 87.0, 144.0, 415.0, 1274.0, 5908.0, 50866.0, 3402375.0, 705490.0, 23158.0, 3261.0, 736.0, 232.0, 78.0, 51.0, 23.0, 11.0, 13.0, 10.0, 5.0, 8.0, 5.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.28125, -2.21759033203125, -2.1539306640625, -2.09027099609375, -2.026611328125, -1.96295166015625, -1.8992919921875, -1.83563232421875, -1.77197265625, -1.70831298828125, -1.6446533203125, -1.58099365234375, -1.517333984375, -1.45367431640625, -1.3900146484375, -1.32635498046875, -1.2626953125, -1.19903564453125, -1.1353759765625, -1.07171630859375, -1.008056640625, -0.94439697265625, -0.8807373046875, -0.81707763671875, -0.75341796875, -0.68975830078125, -0.6260986328125, -0.56243896484375, -0.498779296875, -0.43511962890625, -0.3714599609375, -0.30780029296875, -0.244140625, -0.18048095703125, -0.1168212890625, -0.05316162109375, 0.010498046875, 0.07415771484375, 0.1378173828125, 0.20147705078125, 0.26513671875, 0.32879638671875, 0.3924560546875, 0.45611572265625, 0.519775390625, 0.58343505859375, 0.6470947265625, 0.71075439453125, 0.7744140625, 0.83807373046875, 0.9017333984375, 0.96539306640625, 1.029052734375, 1.09271240234375, 1.1563720703125, 1.22003173828125, 1.28369140625, 1.34735107421875, 1.4110107421875, 1.47467041015625, 1.538330078125, 1.60198974609375, 1.6656494140625, 1.72930908203125, 1.79296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 1.0, 9.0, 14.0, 18.0, 21.0, 37.0, 71.0, 124.0, 258.0, 512.0, 924.0, 894.0, 549.0, 251.0, 123.0, 82.0, 48.0, 30.0, 22.0, 19.0, 19.0, 11.0, 8.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6275177001953125, -1.578277587890625, -1.5290374755859375, -1.47979736328125, -1.4305572509765625, -1.381317138671875, -1.3320770263671875, -1.2828369140625, -1.2335968017578125, -1.184356689453125, -1.1351165771484375, -1.08587646484375, -1.0366363525390625, -0.987396240234375, -0.9381561279296875, -0.888916015625, -0.8396759033203125, -0.790435791015625, -0.7411956787109375, -0.69195556640625, -0.6427154541015625, -0.593475341796875, -0.5442352294921875, -0.4949951171875, -0.4457550048828125, -0.396514892578125, -0.3472747802734375, -0.29803466796875, -0.2487945556640625, -0.199554443359375, -0.1503143310546875, -0.10107421875, -0.0518341064453125, -0.002593994140625, 0.0466461181640625, 0.09588623046875, 0.1451263427734375, 0.194366455078125, 0.2436065673828125, 0.2928466796875, 0.3420867919921875, 0.391326904296875, 0.4405670166015625, 0.48980712890625, 0.5390472412109375, 0.588287353515625, 0.6375274658203125, 0.686767578125, 0.7360076904296875, 0.785247802734375, 0.8344879150390625, 0.88372802734375, 0.9329681396484375, 0.982208251953125, 1.0314483642578125, 1.0806884765625, 1.1299285888671875, 1.179168701171875, 1.2284088134765625, 1.27764892578125, 1.3268890380859375, 1.376129150390625, 1.4253692626953125, 1.474609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 19.0, 65.0, 160.0, 295.0, 259.0, 126.0, 30.0, 21.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.698305130004883, -20.1650333404541, -19.631763458251953, -19.098491668701172, -18.56521987915039, -18.03194808959961, -17.498676300048828, -16.96540641784668, -16.4321346282959, -15.898862838745117, -15.365592002868652, -14.832321166992188, -14.299049377441406, -13.765777587890625, -13.23250675201416, -12.699235916137695, -12.165964126586914, -11.632692337036133, -11.099421501159668, -10.566150665283203, -10.032878875732422, -9.49960708618164, -8.966336250305176, -8.433065414428711, -7.89979362487793, -7.366522312164307, -6.833250999450684, -6.2999796867370605, -5.7667083740234375, -5.2334370613098145, -4.700165748596191, -4.166894435882568, -3.633625030517578, -3.100353717803955, -2.567082405090332, -2.033811092376709, -1.500539779663086, -0.9672684669494629, -0.43399715423583984, 0.0992741584777832, 0.6325454711914062, 1.1658167839050293, 1.6990880966186523, 2.2323594093322754, 2.7656307220458984, 3.2989020347595215, 3.8321733474731445, 4.365444660186768, 4.898715972900391, 5.431987285614014, 5.965258598327637, 6.49852991104126, 7.031801223754883, 7.565072536468506, 8.098343849182129, 8.631614685058594, 9.164886474609375, 9.698158264160156, 10.231429100036621, 10.764699935913086, 11.297971725463867, 11.831243515014648, 12.364514350891113, 12.897785186767578, 13.43105697631836]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 23.0, 11.0, 23.0, 22.0, 25.0, 32.0, 37.0, 49.0, 47.0, 60.0, 59.0, 58.0, 56.0, 46.0, 47.0, 62.0, 50.0, 39.0, 39.0, 32.0, 40.0, 34.0, 20.0, 10.0, 12.0, 13.0, 5.0, 6.0, 7.0, 7.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.867152690887451, -7.651735782623291, -7.436319351196289, -7.220902442932129, -7.005485534667969, -6.790068626403809, -6.574651718139648, -6.3592352867126465, -6.143818378448486, -5.928401470184326, -5.712985038757324, -5.497568130493164, -5.282151222229004, -5.066734313964844, -4.851317405700684, -4.635900974273682, -4.4204840660095215, -4.205067157745361, -3.9896504878997803, -3.774233818054199, -3.558816909790039, -3.343400001525879, -3.127983331680298, -2.912566661834717, -2.6971497535705566, -2.4817328453063965, -2.2663161754608154, -2.0508995056152344, -1.8354825973510742, -1.6200658082962036, -1.404649019241333, -1.1892322301864624, -0.9738154411315918, -0.7583986520767212, -0.5429818630218506, -0.32756507396698, -0.11214828491210938, 0.10326850414276123, 0.31868529319763184, 0.5341020822525024, 0.749518871307373, 0.9649356603622437, 1.1803524494171143, 1.3957692384719849, 1.6111860275268555, 1.826602816581726, 2.0420196056365967, 2.2574362754821777, 2.472853183746338, 2.688270092010498, 2.903686761856079, 3.11910343170166, 3.3345203399658203, 3.5499372482299805, 3.7653539180755615, 3.9807705879211426, 4.196187496185303, 4.411604404449463, 4.627020835876465, 4.842437744140625, 5.057854652404785, 5.273271560668945, 5.4886884689331055, 5.704104900360107, 5.919521808624268]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 12.0, 15.0, 16.0, 28.0, 44.0, 67.0, 138.0, 210.0, 331.0, 615.0, 1095.0, 2040.0, 3989.0, 8894.0, 20999.0, 54873.0, 153538.0, 361619.0, 275041.0, 100494.0, 36803.0, 14600.0, 6372.0, 3132.0, 1570.0, 833.0, 472.0, 297.0, 165.0, 88.0, 60.0, 34.0, 24.0, 12.0, 9.0, 8.0, 6.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8281631469726562, -0.8003692626953125, -0.7725753784179688, -0.744781494140625, -0.7169876098632812, -0.6891937255859375, -0.6613998413085938, -0.63360595703125, -0.6058120727539062, -0.5780181884765625, -0.5502243041992188, -0.522430419921875, -0.49463653564453125, -0.4668426513671875, -0.43904876708984375, -0.4112548828125, -0.38346099853515625, -0.3556671142578125, -0.32787322998046875, -0.300079345703125, -0.27228546142578125, -0.2444915771484375, -0.21669769287109375, -0.18890380859375, -0.16110992431640625, -0.1333160400390625, -0.10552215576171875, -0.077728271484375, -0.04993438720703125, -0.0221405029296875, 0.00565338134765625, 0.033447265625, 0.06124114990234375, 0.0890350341796875, 0.11682891845703125, 0.144622802734375, 0.17241668701171875, 0.2002105712890625, 0.22800445556640625, 0.25579833984375, 0.28359222412109375, 0.3113861083984375, 0.33917999267578125, 0.366973876953125, 0.39476776123046875, 0.4225616455078125, 0.45035552978515625, 0.4781494140625, 0.5059432983398438, 0.5337371826171875, 0.5615310668945312, 0.589324951171875, 0.6171188354492188, 0.6449127197265625, 0.6727066040039062, 0.70050048828125, 0.7282943725585938, 0.7560882568359375, 0.7838821411132812, 0.811676025390625, 0.8394699096679688, 0.8672637939453125, 0.8950576782226562, 0.9228515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 5.0, 6.0, 10.0, 16.0, 24.0, 25.0, 42.0, 49.0, 64.0, 59.0, 62.0, 83.0, 80.0, 84.0, 81.0, 70.0, 63.0, 47.0, 33.0, 35.0, 14.0, 19.0, 16.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98681640625, -0.958221435546875, -0.92962646484375, -0.901031494140625, -0.8724365234375, -0.843841552734375, -0.81524658203125, -0.786651611328125, -0.758056640625, -0.729461669921875, -0.70086669921875, -0.672271728515625, -0.6436767578125, -0.615081787109375, -0.58648681640625, -0.557891845703125, -0.529296875, -0.500701904296875, -0.47210693359375, -0.443511962890625, -0.4149169921875, -0.386322021484375, -0.35772705078125, -0.329132080078125, -0.300537109375, -0.271942138671875, -0.24334716796875, -0.214752197265625, -0.1861572265625, -0.157562255859375, -0.12896728515625, -0.100372314453125, -0.07177734375, -0.043182373046875, -0.01458740234375, 0.014007568359375, 0.0426025390625, 0.071197509765625, 0.09979248046875, 0.128387451171875, 0.156982421875, 0.185577392578125, 0.21417236328125, 0.242767333984375, 0.2713623046875, 0.299957275390625, 0.32855224609375, 0.357147216796875, 0.3857421875, 0.414337158203125, 0.44293212890625, 0.471527099609375, 0.5001220703125, 0.528717041015625, 0.55731201171875, 0.585906982421875, 0.614501953125, 0.643096923828125, 0.67169189453125, 0.700286865234375, 0.7288818359375, 0.757476806640625, 0.78607177734375, 0.814666748046875, 0.84326171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 3.0, 13.0, 13.0, 30.0, 24.0, 57.0, 60.0, 99.0, 148.0, 249.0, 518.0, 800.0, 1844.0, 6255.0, 55964.0, 813623.0, 152719.0, 10976.0, 2617.0, 1096.0, 557.0, 318.0, 220.0, 118.0, 74.0, 48.0, 40.0, 15.0, 19.0, 11.0, 8.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.289031982421875, -2.21673583984375, -2.144439697265625, -2.0721435546875, -1.999847412109375, -1.92755126953125, -1.855255126953125, -1.782958984375, -1.710662841796875, -1.63836669921875, -1.566070556640625, -1.4937744140625, -1.421478271484375, -1.34918212890625, -1.276885986328125, -1.20458984375, -1.132293701171875, -1.05999755859375, -0.987701416015625, -0.9154052734375, -0.843109130859375, -0.77081298828125, -0.698516845703125, -0.626220703125, -0.553924560546875, -0.48162841796875, -0.409332275390625, -0.3370361328125, -0.264739990234375, -0.19244384765625, -0.120147705078125, -0.0478515625, 0.024444580078125, 0.09674072265625, 0.169036865234375, 0.2413330078125, 0.313629150390625, 0.38592529296875, 0.458221435546875, 0.530517578125, 0.602813720703125, 0.67510986328125, 0.747406005859375, 0.8197021484375, 0.891998291015625, 0.96429443359375, 1.036590576171875, 1.10888671875, 1.181182861328125, 1.25347900390625, 1.325775146484375, 1.3980712890625, 1.470367431640625, 1.54266357421875, 1.614959716796875, 1.687255859375, 1.759552001953125, 1.83184814453125, 1.904144287109375, 1.9764404296875, 2.048736572265625, 2.12103271484375, 2.193328857421875, 2.265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 8.0, 5.0, 7.0, 10.0, 6.0, 16.0, 10.0, 16.0, 18.0, 15.0, 16.0, 19.0, 30.0, 32.0, 37.0, 33.0, 40.0, 44.0, 46.0, 39.0, 46.0, 42.0, 44.0, 39.0, 38.0, 38.0, 35.0, 32.0, 32.0, 36.0, 26.0, 23.0, 26.0, 17.0, 10.0, 18.0, 12.0, 10.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.0078125, -1.944610595703125, -1.88140869140625, -1.818206787109375, -1.7550048828125, -1.691802978515625, -1.62860107421875, -1.565399169921875, -1.502197265625, -1.438995361328125, -1.37579345703125, -1.312591552734375, -1.2493896484375, -1.186187744140625, -1.12298583984375, -1.059783935546875, -0.99658203125, -0.933380126953125, -0.87017822265625, -0.806976318359375, -0.7437744140625, -0.680572509765625, -0.61737060546875, -0.554168701171875, -0.490966796875, -0.427764892578125, -0.36456298828125, -0.301361083984375, -0.2381591796875, -0.174957275390625, -0.11175537109375, -0.048553466796875, 0.0146484375, 0.077850341796875, 0.14105224609375, 0.204254150390625, 0.2674560546875, 0.330657958984375, 0.39385986328125, 0.457061767578125, 0.520263671875, 0.583465576171875, 0.64666748046875, 0.709869384765625, 0.7730712890625, 0.836273193359375, 0.89947509765625, 0.962677001953125, 1.02587890625, 1.089080810546875, 1.15228271484375, 1.215484619140625, 1.2786865234375, 1.341888427734375, 1.40509033203125, 1.468292236328125, 1.531494140625, 1.594696044921875, 1.65789794921875, 1.721099853515625, 1.7843017578125, 1.847503662109375, 1.91070556640625, 1.973907470703125, 2.037109375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 7.0, 19.0, 14.0, 19.0, 23.0, 40.0, 74.0, 138.0, 233.0, 390.0, 994.0, 3136.0, 20259.0, 563784.0, 436430.0, 18105.0, 2948.0, 981.0, 408.0, 199.0, 129.0, 71.0, 39.0, 21.0, 18.0, 15.0, 14.0, 7.0, 6.0, 7.0, 1.0, 2.0, 5.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-0.96337890625, -0.9358367919921875, -0.908294677734375, -0.8807525634765625, -0.85321044921875, -0.8256683349609375, -0.798126220703125, -0.7705841064453125, -0.7430419921875, -0.7154998779296875, -0.687957763671875, -0.6604156494140625, -0.63287353515625, -0.6053314208984375, -0.577789306640625, -0.5502471923828125, -0.522705078125, -0.4951629638671875, -0.467620849609375, -0.4400787353515625, -0.41253662109375, -0.3849945068359375, -0.357452392578125, -0.3299102783203125, -0.3023681640625, -0.2748260498046875, -0.247283935546875, -0.2197418212890625, -0.19219970703125, -0.1646575927734375, -0.137115478515625, -0.1095733642578125, -0.08203125, -0.0544891357421875, -0.026947021484375, 0.0005950927734375, 0.02813720703125, 0.0556793212890625, 0.083221435546875, 0.1107635498046875, 0.1383056640625, 0.1658477783203125, 0.193389892578125, 0.2209320068359375, 0.24847412109375, 0.2760162353515625, 0.303558349609375, 0.3311004638671875, 0.358642578125, 0.3861846923828125, 0.413726806640625, 0.4412689208984375, 0.46881103515625, 0.4963531494140625, 0.523895263671875, 0.5514373779296875, 0.5789794921875, 0.6065216064453125, 0.634063720703125, 0.6616058349609375, 0.68914794921875, 0.7166900634765625, 0.744232177734375, 0.7717742919921875, 0.79931640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 6.0, 12.0, 5.0, 9.0, 7.0, 13.0, 18.0, 29.0, 25.0, 32.0, 36.0, 52.0, 65.0, 84.0, 91.0, 86.0, 84.0, 66.0, 52.0, 46.0, 26.0, 29.0, 16.0, 16.0, 10.0, 13.0, 9.0, 12.0, 8.0, 9.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.064508438110352e-05, -7.827114313840866e-05, -7.58972018957138e-05, -7.352326065301895e-05, -7.11493194103241e-05, -6.877537816762924e-05, -6.640143692493439e-05, -6.402749568223953e-05, -6.165355443954468e-05, -5.927961319684982e-05, -5.690567195415497e-05, -5.4531730711460114e-05, -5.215778946876526e-05, -4.9783848226070404e-05, -4.740990698337555e-05, -4.5035965740680695e-05, -4.266202449798584e-05, -4.0288083255290985e-05, -3.791414201259613e-05, -3.5540200769901276e-05, -3.316625952720642e-05, -3.0792318284511566e-05, -2.841837704181671e-05, -2.6044435799121857e-05, -2.3670494556427002e-05, -2.1296553313732147e-05, -1.8922612071037292e-05, -1.6548670828342438e-05, -1.4174729585647583e-05, -1.1800788342952728e-05, -9.426847100257874e-06, -7.052905857563019e-06, -4.678964614868164e-06, -2.3050233721733093e-06, 6.891787052154541e-08, 2.4428591132164e-06, 4.816800355911255e-06, 7.19074159860611e-06, 9.564682841300964e-06, 1.1938624083995819e-05, 1.4312565326690674e-05, 1.668650656938553e-05, 1.9060447812080383e-05, 2.1434389054775238e-05, 2.3808330297470093e-05, 2.6182271540164948e-05, 2.8556212782859802e-05, 3.093015402555466e-05, 3.330409526824951e-05, 3.5678036510944366e-05, 3.805197775363922e-05, 4.0425918996334076e-05, 4.279986023902893e-05, 4.5173801481723785e-05, 4.754774272441864e-05, 4.9921683967113495e-05, 5.229562520980835e-05, 5.4669566452503204e-05, 5.704350769519806e-05, 5.9417448937892914e-05, 6.179139018058777e-05, 6.416533142328262e-05, 6.653927266597748e-05, 6.891321390867233e-05, 7.128715515136719e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 3.0, 5.0, 7.0, 16.0, 18.0, 21.0, 37.0, 56.0, 88.0, 186.0, 277.0, 473.0, 1064.0, 2710.0, 10019.0, 98444.0, 836598.0, 84622.0, 9158.0, 2518.0, 1034.0, 478.0, 274.0, 151.0, 92.0, 64.0, 38.0, 34.0, 24.0, 9.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7038726806640625, -0.678253173828125, -0.6526336669921875, -0.62701416015625, -0.6013946533203125, -0.575775146484375, -0.5501556396484375, -0.5245361328125, -0.4989166259765625, -0.473297119140625, -0.4476776123046875, -0.42205810546875, -0.3964385986328125, -0.370819091796875, -0.3451995849609375, -0.319580078125, -0.2939605712890625, -0.268341064453125, -0.2427215576171875, -0.21710205078125, -0.1914825439453125, -0.165863037109375, -0.1402435302734375, -0.1146240234375, -0.0890045166015625, -0.063385009765625, -0.0377655029296875, -0.01214599609375, 0.0134735107421875, 0.039093017578125, 0.0647125244140625, 0.09033203125, 0.1159515380859375, 0.141571044921875, 0.1671905517578125, 0.19281005859375, 0.2184295654296875, 0.244049072265625, 0.2696685791015625, 0.2952880859375, 0.3209075927734375, 0.346527099609375, 0.3721466064453125, 0.39776611328125, 0.4233856201171875, 0.449005126953125, 0.4746246337890625, 0.500244140625, 0.5258636474609375, 0.551483154296875, 0.5771026611328125, 0.60272216796875, 0.6283416748046875, 0.653961181640625, 0.6795806884765625, 0.7052001953125, 0.7308197021484375, 0.756439208984375, 0.7820587158203125, 0.80767822265625, 0.8332977294921875, 0.858917236328125, 0.8845367431640625, 0.91015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 5.0, 6.0, 9.0, 19.0, 17.0, 28.0, 35.0, 32.0, 48.0, 56.0, 65.0, 90.0, 101.0, 79.0, 74.0, 70.0, 56.0, 39.0, 49.0, 31.0, 21.0, 11.0, 18.0, 12.0, 4.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54443359375, -0.5223312377929688, -0.5002288818359375, -0.47812652587890625, -0.456024169921875, -0.43392181396484375, -0.4118194580078125, -0.38971710205078125, -0.36761474609375, -0.34551239013671875, -0.3234100341796875, -0.30130767822265625, -0.279205322265625, -0.25710296630859375, -0.2350006103515625, -0.21289825439453125, -0.1907958984375, -0.16869354248046875, -0.1465911865234375, -0.12448883056640625, -0.102386474609375, -0.08028411865234375, -0.0581817626953125, -0.03607940673828125, -0.01397705078125, 0.00812530517578125, 0.0302276611328125, 0.05233001708984375, 0.074432373046875, 0.09653472900390625, 0.1186370849609375, 0.14073944091796875, 0.162841796875, 0.18494415283203125, 0.2070465087890625, 0.22914886474609375, 0.251251220703125, 0.27335357666015625, 0.2954559326171875, 0.31755828857421875, 0.33966064453125, 0.36176300048828125, 0.3838653564453125, 0.40596771240234375, 0.428070068359375, 0.45017242431640625, 0.4722747802734375, 0.49437713623046875, 0.5164794921875, 0.5385818481445312, 0.5606842041015625, 0.5827865600585938, 0.604888916015625, 0.6269912719726562, 0.6490936279296875, 0.6711959838867188, 0.69329833984375, 0.7154006958007812, 0.7375030517578125, 0.7596054077148438, 0.781707763671875, 0.8038101196289062, 0.8259124755859375, 0.8480148315429688, 0.8701171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 12.0, 28.0, 70.0, 208.0, 360.0, 200.0, 87.0, 18.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.452632904052734, -15.788700103759766, -15.124768257141113, -14.460835456848145, -13.796902656555176, -13.132970809936523, -12.469038009643555, -11.805105209350586, -11.141172409057617, -10.477239608764648, -9.813307762145996, -9.149374961853027, -8.485442161560059, -7.821509838104248, -7.1575775146484375, -6.493644714355469, -5.829712867736816, -5.165780544281006, -4.501847743988037, -3.8379154205322266, -3.173982858657837, -2.5100502967834473, -1.8461179733276367, -1.182185173034668, -0.5182528495788574, 0.14567965269088745, 0.8096121549606323, 1.4735445976257324, 2.137477159500122, 2.8014097213745117, 3.4653420448303223, 4.129274845123291, 4.793207168579102, 5.457139492034912, 6.121072292327881, 6.785004615783691, 7.44893741607666, 8.112869262695312, 8.776802062988281, 9.44073486328125, 10.104667663574219, 10.768600463867188, 11.43253231048584, 12.096465110778809, 12.760397911071777, 13.42432975769043, 14.088262557983398, 14.752195358276367, 15.41612720489502, 16.080059051513672, 16.74399185180664, 17.40792465209961, 18.071857452392578, 18.735790252685547, 19.399723052978516, 20.063655853271484, 20.72758674621582, 21.39151954650879, 22.055452346801758, 22.719383239746094, 23.383316040039062, 24.04724884033203, 24.711181640625, 25.37511444091797, 26.039047241210938]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 6.0, 7.0, 9.0, 8.0, 5.0, 11.0, 10.0, 16.0, 21.0, 19.0, 15.0, 18.0, 36.0, 33.0, 31.0, 36.0, 38.0, 40.0, 45.0, 50.0, 51.0, 45.0, 43.0, 48.0, 40.0, 36.0, 27.0, 37.0, 27.0, 26.0, 28.0, 22.0, 26.0, 12.0, 16.0, 10.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0], "bins": [-9.18872356414795, -8.937575340270996, -8.68642807006836, -8.435279846191406, -8.184131622314453, -7.932984352111816, -7.681836128234863, -7.430688381195068, -7.179540634155273, -6.9283928871154785, -6.677245140075684, -6.4260969161987305, -6.1749491691589355, -5.923801422119141, -5.6726531982421875, -5.421505451202393, -5.170357704162598, -4.919209957122803, -4.668062210083008, -4.416913986206055, -4.16576623916626, -3.914618492126465, -3.663470506668091, -3.412322521209717, -3.161174774169922, -2.910027027130127, -2.658879041671753, -2.407731056213379, -2.156583309173584, -1.9054354429244995, -1.654287576675415, -1.4031397104263306, -1.1519923210144043, -0.9008444547653198, -0.6496965885162354, -0.3985487222671509, -0.1474008560180664, 0.10374701023101807, 0.35489487648010254, 0.606042742729187, 0.8571906089782715, 1.108338475227356, 1.3594863414764404, 1.610634207725525, 1.8617820739746094, 2.1129298210144043, 2.3640778064727783, 2.6152257919311523, 2.8663735389709473, 3.117521286010742, 3.368669271469116, 3.6198172569274902, 3.870965003967285, 4.12211275100708, 4.373260498046875, 4.624408721923828, 4.875556468963623, 5.126704216003418, 5.377852439880371, 5.629000186920166, 5.880147933959961, 6.131295680999756, 6.382443428039551, 6.633591651916504, 6.884739398956299]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 11.0, 11.0, 18.0, 24.0, 45.0, 61.0, 98.0, 152.0, 274.0, 737.0, 4133806.0, 58006.0, 419.0, 219.0, 138.0, 76.0, 58.0, 40.0, 23.0, 16.0, 14.0, 13.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.15283203125, -7.8603515625, -7.56787109375, -7.275390625, -6.98291015625, -6.6904296875, -6.39794921875, -6.10546875, -5.81298828125, -5.5205078125, -5.22802734375, -4.935546875, -4.64306640625, -4.3505859375, -4.05810546875, -3.765625, -3.47314453125, -3.1806640625, -2.88818359375, -2.595703125, -2.30322265625, -2.0107421875, -1.71826171875, -1.42578125, -1.13330078125, -0.8408203125, -0.54833984375, -0.255859375, 0.03662109375, 0.3291015625, 0.62158203125, 0.9140625, 1.20654296875, 1.4990234375, 1.79150390625, 2.083984375, 2.37646484375, 2.6689453125, 2.96142578125, 3.25390625, 3.54638671875, 3.8388671875, 4.13134765625, 4.423828125, 4.71630859375, 5.0087890625, 5.30126953125, 5.59375, 5.88623046875, 6.1787109375, 6.47119140625, 6.763671875, 7.05615234375, 7.3486328125, 7.64111328125, 7.93359375, 8.22607421875, 8.5185546875, 8.81103515625, 9.103515625, 9.39599609375, 9.6884765625, 9.98095703125, 10.2734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 9.0, 18.0, 33.0, 25.0, 61.0, 79.0, 80.0, 98.0, 102.0, 125.0, 97.0, 77.0, 65.0, 38.0, 37.0, 18.0, 12.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.42578125, -1.3906097412109375, -1.355438232421875, -1.3202667236328125, -1.28509521484375, -1.2499237060546875, -1.214752197265625, -1.1795806884765625, -1.1444091796875, -1.1092376708984375, -1.074066162109375, -1.0388946533203125, -1.00372314453125, -0.9685516357421875, -0.933380126953125, -0.8982086181640625, -0.863037109375, -0.8278656005859375, -0.792694091796875, -0.7575225830078125, -0.72235107421875, -0.6871795654296875, -0.652008056640625, -0.6168365478515625, -0.5816650390625, -0.5464935302734375, -0.511322021484375, -0.4761505126953125, -0.44097900390625, -0.4058074951171875, -0.370635986328125, -0.3354644775390625, -0.30029296875, -0.2651214599609375, -0.229949951171875, -0.1947784423828125, -0.15960693359375, -0.1244354248046875, -0.089263916015625, -0.0540924072265625, -0.0189208984375, 0.0162506103515625, 0.051422119140625, 0.0865936279296875, 0.12176513671875, 0.1569366455078125, 0.192108154296875, 0.2272796630859375, 0.262451171875, 0.2976226806640625, 0.332794189453125, 0.3679656982421875, 0.40313720703125, 0.4383087158203125, 0.473480224609375, 0.5086517333984375, 0.5438232421875, 0.5789947509765625, 0.614166259765625, 0.6493377685546875, 0.68450927734375, 0.7196807861328125, 0.754852294921875, 0.7900238037109375, 0.8251953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 13.0, 23.0, 44.0, 80.0, 152.0, 396.0, 872.0, 2076.0, 5978.0, 22948.0, 167268.0, 3409878.0, 526373.0, 41951.0, 10107.0, 3489.0, 1463.0, 582.0, 264.0, 132.0, 72.0, 37.0, 21.0, 12.0, 10.0, 4.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1318359375, -1.1001129150390625, -1.068389892578125, -1.0366668701171875, -1.00494384765625, -0.9732208251953125, -0.941497802734375, -0.9097747802734375, -0.8780517578125, -0.8463287353515625, -0.814605712890625, -0.7828826904296875, -0.75115966796875, -0.7194366455078125, -0.687713623046875, -0.6559906005859375, -0.624267578125, -0.5925445556640625, -0.560821533203125, -0.5290985107421875, -0.49737548828125, -0.4656524658203125, -0.433929443359375, -0.4022064208984375, -0.3704833984375, -0.3387603759765625, -0.307037353515625, -0.2753143310546875, -0.24359130859375, -0.2118682861328125, -0.180145263671875, -0.1484222412109375, -0.11669921875, -0.0849761962890625, -0.053253173828125, -0.0215301513671875, 0.01019287109375, 0.0419158935546875, 0.073638916015625, 0.1053619384765625, 0.1370849609375, 0.1688079833984375, 0.200531005859375, 0.2322540283203125, 0.26397705078125, 0.2957000732421875, 0.327423095703125, 0.3591461181640625, 0.390869140625, 0.4225921630859375, 0.454315185546875, 0.4860382080078125, 0.51776123046875, 0.5494842529296875, 0.581207275390625, 0.6129302978515625, 0.6446533203125, 0.6763763427734375, 0.708099365234375, 0.7398223876953125, 0.77154541015625, 0.8032684326171875, 0.834991455078125, 0.8667144775390625, 0.8984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 11.0, 11.0, 25.0, 41.0, 48.0, 92.0, 179.0, 317.0, 660.0, 981.0, 796.0, 399.0, 220.0, 99.0, 48.0, 38.0, 25.0, 18.0, 9.0, 9.0, 5.0, 4.0, 6.0, 1.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.048828125, -1.01458740234375, -0.9803466796875, -0.94610595703125, -0.911865234375, -0.87762451171875, -0.8433837890625, -0.80914306640625, -0.77490234375, -0.74066162109375, -0.7064208984375, -0.67218017578125, -0.637939453125, -0.60369873046875, -0.5694580078125, -0.53521728515625, -0.5009765625, -0.46673583984375, -0.4324951171875, -0.39825439453125, -0.364013671875, -0.32977294921875, -0.2955322265625, -0.26129150390625, -0.22705078125, -0.19281005859375, -0.1585693359375, -0.12432861328125, -0.090087890625, -0.05584716796875, -0.0216064453125, 0.01263427734375, 0.046875, 0.08111572265625, 0.1153564453125, 0.14959716796875, 0.183837890625, 0.21807861328125, 0.2523193359375, 0.28656005859375, 0.32080078125, 0.35504150390625, 0.3892822265625, 0.42352294921875, 0.457763671875, 0.49200439453125, 0.5262451171875, 0.56048583984375, 0.5947265625, 0.62896728515625, 0.6632080078125, 0.69744873046875, 0.731689453125, 0.76593017578125, 0.8001708984375, 0.83441162109375, 0.86865234375, 0.90289306640625, 0.9371337890625, 0.97137451171875, 1.005615234375, 1.03985595703125, 1.0740966796875, 1.10833740234375, 1.142578125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 36.0, 171.0, 362.0, 292.0, 92.0, 21.0, 9.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.129640579223633, -18.661569595336914, -18.193498611450195, -17.725427627563477, -17.257356643676758, -16.78928565979004, -16.32121467590332, -15.853143692016602, -15.385072708129883, -14.917001724243164, -14.448930740356445, -13.980859756469727, -13.512788772583008, -13.044717788696289, -12.57664680480957, -12.108575820922852, -11.640504837036133, -11.172433853149414, -10.704362869262695, -10.236291885375977, -9.768220901489258, -9.300149917602539, -8.83207893371582, -8.364007949829102, -7.895937919616699, -7.4278669357299805, -6.959795951843262, -6.491724967956543, -6.023653984069824, -5.5555830001831055, -5.087512016296387, -4.619441032409668, -4.151370048522949, -3.6832990646362305, -3.2152280807495117, -2.747157096862793, -2.279086112976074, -1.8110153675079346, -1.3429443836212158, -0.8748733997344971, -0.4068024158477783, 0.06126853823661804, 0.5293394923210144, 0.9974104166030884, 1.4654814004898071, 1.9335522651672363, 2.401623249053955, 2.869694232940674, 3.3377652168273926, 3.8058362007141113, 4.27390718460083, 4.741978168487549, 5.210049152374268, 5.678119659423828, 6.146190643310547, 6.614261627197266, 7.082332611083984, 7.550403594970703, 8.018474578857422, 8.48654556274414, 8.95461654663086, 9.422687530517578, 9.890758514404297, 10.358829498291016, 10.826900482177734]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 5.0, 10.0, 6.0, 12.0, 18.0, 13.0, 25.0, 29.0, 40.0, 38.0, 36.0, 37.0, 45.0, 54.0, 56.0, 57.0, 53.0, 55.0, 52.0, 43.0, 52.0, 48.0, 27.0, 32.0, 33.0, 27.0, 20.0, 13.0, 14.0, 12.0, 9.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8907530307769775, -2.758129596710205, -2.6255059242248535, -2.492882490158081, -2.3602588176727295, -2.227635383605957, -2.0950117111206055, -1.962388277053833, -1.829764723777771, -1.697141170501709, -1.564517617225647, -1.431894063949585, -1.2992706298828125, -1.166646957397461, -1.0340235233306885, -0.9013999700546265, -0.7687764167785645, -0.6361528635025024, -0.5035293102264404, -0.3709058165550232, -0.23828226327896118, -0.10565871000289917, 0.026964783668518066, 0.15958833694458008, 0.2922118902206421, 0.4248354434967041, 0.5574589967727661, 0.6900824904441833, 0.8227060437202454, 0.9553295969963074, 1.0879530906677246, 1.2205766439437866, 1.3531999588012695, 1.4858235120773315, 1.6184470653533936, 1.751070499420166, 1.8836941719055176, 2.01631760597229, 2.1489410400390625, 2.281564712524414, 2.4141883850097656, 2.546811819076538, 2.6794354915618896, 2.812058925628662, 2.9446825981140137, 3.077306032180786, 3.2099294662475586, 3.34255313873291, 3.4751765727996826, 3.607800006866455, 3.7404236793518066, 3.873047113418579, 4.005670547485352, 4.138294219970703, 4.270917892456055, 4.403541564941406, 4.5361647605896, 4.668788433074951, 4.8014116287231445, 4.934035301208496, 5.066658973693848, 5.199282646179199, 5.331905841827393, 5.464529514312744, 5.597153186798096]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 10.0, 6.0, 10.0, 14.0, 22.0, 36.0, 54.0, 55.0, 98.0, 131.0, 167.0, 299.0, 472.0, 706.0, 1290.0, 2258.0, 4404.0, 9078.0, 20458.0, 50685.0, 134769.0, 328357.0, 298775.0, 116575.0, 43923.0, 18238.0, 8373.0, 4070.0, 2100.0, 1198.0, 680.0, 386.0, 259.0, 162.0, 137.0, 89.0, 63.0, 47.0, 31.0, 17.0, 9.0, 10.0, 7.0, 6.0, 8.0, 0.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.74462890625, -0.722015380859375, -0.69940185546875, -0.676788330078125, -0.6541748046875, -0.631561279296875, -0.60894775390625, -0.586334228515625, -0.563720703125, -0.541107177734375, -0.51849365234375, -0.495880126953125, -0.4732666015625, -0.450653076171875, -0.42803955078125, -0.405426025390625, -0.3828125, -0.360198974609375, -0.33758544921875, -0.314971923828125, -0.2923583984375, -0.269744873046875, -0.24713134765625, -0.224517822265625, -0.201904296875, -0.179290771484375, -0.15667724609375, -0.134063720703125, -0.1114501953125, -0.088836669921875, -0.06622314453125, -0.043609619140625, -0.02099609375, 0.001617431640625, 0.02423095703125, 0.046844482421875, 0.0694580078125, 0.092071533203125, 0.11468505859375, 0.137298583984375, 0.159912109375, 0.182525634765625, 0.20513916015625, 0.227752685546875, 0.2503662109375, 0.272979736328125, 0.29559326171875, 0.318206787109375, 0.3408203125, 0.363433837890625, 0.38604736328125, 0.408660888671875, 0.4312744140625, 0.453887939453125, 0.47650146484375, 0.499114990234375, 0.521728515625, 0.544342041015625, 0.56695556640625, 0.589569091796875, 0.6121826171875, 0.634796142578125, 0.65740966796875, 0.680023193359375, 0.70263671875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 1.0, 7.0, 15.0, 14.0, 25.0, 30.0, 43.0, 58.0, 69.0, 83.0, 84.0, 78.0, 100.0, 90.0, 66.0, 65.0, 47.0, 47.0, 37.0, 13.0, 15.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9574356079101562, -0.9290313720703125, -0.9006271362304688, -0.872222900390625, -0.8438186645507812, -0.8154144287109375, -0.7870101928710938, -0.75860595703125, -0.7302017211914062, -0.7017974853515625, -0.6733932495117188, -0.644989013671875, -0.6165847778320312, -0.5881805419921875, -0.5597763061523438, -0.5313720703125, -0.5029678344726562, -0.4745635986328125, -0.44615936279296875, -0.417755126953125, -0.38935089111328125, -0.3609466552734375, -0.33254241943359375, -0.30413818359375, -0.27573394775390625, -0.2473297119140625, -0.21892547607421875, -0.190521240234375, -0.16211700439453125, -0.1337127685546875, -0.10530853271484375, -0.076904296875, -0.04850006103515625, -0.0200958251953125, 0.00830841064453125, 0.036712646484375, 0.06511688232421875, 0.0935211181640625, 0.12192535400390625, 0.15032958984375, 0.17873382568359375, 0.2071380615234375, 0.23554229736328125, 0.263946533203125, 0.29235076904296875, 0.3207550048828125, 0.34915924072265625, 0.3775634765625, 0.40596771240234375, 0.4343719482421875, 0.46277618408203125, 0.491180419921875, 0.5195846557617188, 0.5479888916015625, 0.5763931274414062, 0.60479736328125, 0.6332015991210938, 0.6616058349609375, 0.6900100708007812, 0.718414306640625, 0.7468185424804688, 0.7752227783203125, 0.8036270141601562, 0.83203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 22.0, 22.0, 31.0, 47.0, 106.0, 195.0, 407.0, 1006.0, 3431.0, 32453.0, 763599.0, 232417.0, 11430.0, 2021.0, 702.0, 327.0, 138.0, 84.0, 33.0, 25.0, 15.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.732421875, -2.658172607421875, -2.58392333984375, -2.509674072265625, -2.4354248046875, -2.361175537109375, -2.28692626953125, -2.212677001953125, -2.138427734375, -2.064178466796875, -1.98992919921875, -1.915679931640625, -1.8414306640625, -1.767181396484375, -1.69293212890625, -1.618682861328125, -1.54443359375, -1.470184326171875, -1.39593505859375, -1.321685791015625, -1.2474365234375, -1.173187255859375, -1.09893798828125, -1.024688720703125, -0.950439453125, -0.876190185546875, -0.80194091796875, -0.727691650390625, -0.6534423828125, -0.579193115234375, -0.50494384765625, -0.430694580078125, -0.3564453125, -0.282196044921875, -0.20794677734375, -0.133697509765625, -0.0594482421875, 0.014801025390625, 0.08905029296875, 0.163299560546875, 0.237548828125, 0.311798095703125, 0.38604736328125, 0.460296630859375, 0.5345458984375, 0.608795166015625, 0.68304443359375, 0.757293701171875, 0.83154296875, 0.905792236328125, 0.98004150390625, 1.054290771484375, 1.1285400390625, 1.202789306640625, 1.27703857421875, 1.351287841796875, 1.425537109375, 1.499786376953125, 1.57403564453125, 1.648284912109375, 1.7225341796875, 1.796783447265625, 1.87103271484375, 1.945281982421875, 2.01953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 9.0, 9.0, 12.0, 15.0, 18.0, 17.0, 19.0, 25.0, 25.0, 33.0, 28.0, 33.0, 38.0, 41.0, 36.0, 44.0, 49.0, 38.0, 40.0, 35.0, 41.0, 47.0, 31.0, 36.0, 27.0, 29.0, 22.0, 24.0, 24.0, 18.0, 16.0, 18.0, 15.0, 11.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.650390625, -1.6019439697265625, -1.553497314453125, -1.5050506591796875, -1.45660400390625, -1.4081573486328125, -1.359710693359375, -1.3112640380859375, -1.2628173828125, -1.2143707275390625, -1.165924072265625, -1.1174774169921875, -1.06903076171875, -1.0205841064453125, -0.972137451171875, -0.9236907958984375, -0.875244140625, -0.8267974853515625, -0.778350830078125, -0.7299041748046875, -0.68145751953125, -0.6330108642578125, -0.584564208984375, -0.5361175537109375, -0.4876708984375, -0.4392242431640625, -0.390777587890625, -0.3423309326171875, -0.29388427734375, -0.2454376220703125, -0.196990966796875, -0.1485443115234375, -0.10009765625, -0.0516510009765625, -0.003204345703125, 0.0452423095703125, 0.09368896484375, 0.1421356201171875, 0.190582275390625, 0.2390289306640625, 0.2874755859375, 0.3359222412109375, 0.384368896484375, 0.4328155517578125, 0.48126220703125, 0.5297088623046875, 0.578155517578125, 0.6266021728515625, 0.675048828125, 0.7234954833984375, 0.771942138671875, 0.8203887939453125, 0.86883544921875, 0.9172821044921875, 0.965728759765625, 1.0141754150390625, 1.0626220703125, 1.1110687255859375, 1.159515380859375, 1.2079620361328125, 1.25640869140625, 1.3048553466796875, 1.353302001953125, 1.4017486572265625, 1.4501953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 23.0, 28.0, 32.0, 75.0, 153.0, 289.0, 764.0, 3296.0, 32004.0, 952363.0, 53777.0, 4036.0, 1004.0, 338.0, 143.0, 76.0, 42.0, 26.0, 14.0, 8.0, 10.0, 12.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.07421875, -1.0378875732421875, -1.001556396484375, -0.9652252197265625, -0.92889404296875, -0.8925628662109375, -0.856231689453125, -0.8199005126953125, -0.7835693359375, -0.7472381591796875, -0.710906982421875, -0.6745758056640625, -0.63824462890625, -0.6019134521484375, -0.565582275390625, -0.5292510986328125, -0.492919921875, -0.4565887451171875, -0.420257568359375, -0.3839263916015625, -0.34759521484375, -0.3112640380859375, -0.274932861328125, -0.2386016845703125, -0.2022705078125, -0.1659393310546875, -0.129608154296875, -0.0932769775390625, -0.05694580078125, -0.0206146240234375, 0.015716552734375, 0.0520477294921875, 0.08837890625, 0.1247100830078125, 0.161041259765625, 0.1973724365234375, 0.23370361328125, 0.2700347900390625, 0.306365966796875, 0.3426971435546875, 0.3790283203125, 0.4153594970703125, 0.451690673828125, 0.4880218505859375, 0.52435302734375, 0.5606842041015625, 0.597015380859375, 0.6333465576171875, 0.669677734375, 0.7060089111328125, 0.742340087890625, 0.7786712646484375, 0.81500244140625, 0.8513336181640625, 0.887664794921875, 0.9239959716796875, 0.9603271484375, 0.9966583251953125, 1.032989501953125, 1.0693206787109375, 1.10565185546875, 1.1419830322265625, 1.178314208984375, 1.2146453857421875, 1.2509765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 9.0, 8.0, 12.0, 9.0, 18.0, 22.0, 43.0, 65.0, 82.0, 119.0, 137.0, 132.0, 83.0, 68.0, 39.0, 36.0, 24.0, 22.0, 7.0, 12.0, 16.0, 5.0, 10.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.822845458984375e-05, -9.521190077066422e-05, -9.219534695148468e-05, -8.917879313230515e-05, -8.616223931312561e-05, -8.314568549394608e-05, -8.012913167476654e-05, -7.7112577855587e-05, -7.409602403640747e-05, -7.107947021722794e-05, -6.80629163980484e-05, -6.504636257886887e-05, -6.202980875968933e-05, -5.9013254940509796e-05, -5.599670112133026e-05, -5.2980147302150726e-05, -4.996359348297119e-05, -4.6947039663791656e-05, -4.393048584461212e-05, -4.091393202543259e-05, -3.789737820625305e-05, -3.488082438707352e-05, -3.186427056789398e-05, -2.8847716748714447e-05, -2.5831162929534912e-05, -2.2814609110355377e-05, -1.9798055291175842e-05, -1.6781501471996307e-05, -1.3764947652816772e-05, -1.0748393833637238e-05, -7.731840014457703e-06, -4.715286195278168e-06, -1.6987323760986328e-06, 1.317821443080902e-06, 4.334375262260437e-06, 7.350929081439972e-06, 1.0367482900619507e-05, 1.3384036719799042e-05, 1.6400590538978577e-05, 1.941714435815811e-05, 2.2433698177337646e-05, 2.545025199651718e-05, 2.8466805815696716e-05, 3.148335963487625e-05, 3.4499913454055786e-05, 3.751646727323532e-05, 4.0533021092414856e-05, 4.354957491159439e-05, 4.6566128730773926e-05, 4.958268254995346e-05, 5.2599236369132996e-05, 5.561579018831253e-05, 5.8632344007492065e-05, 6.16488978266716e-05, 6.466545164585114e-05, 6.768200546503067e-05, 7.06985592842102e-05, 7.371511310338974e-05, 7.673166692256927e-05, 7.974822074174881e-05, 8.276477456092834e-05, 8.578132838010788e-05, 8.879788219928741e-05, 9.181443601846695e-05, 9.483098983764648e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 7.0, 5.0, 11.0, 13.0, 19.0, 39.0, 46.0, 78.0, 134.0, 247.0, 460.0, 1022.0, 2925.0, 12762.0, 167054.0, 803437.0, 50231.0, 6619.0, 1869.0, 757.0, 320.0, 208.0, 94.0, 56.0, 36.0, 28.0, 28.0, 9.0, 11.0, 5.0, 8.0, 1.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7666015625, -0.7448883056640625, -0.723175048828125, -0.7014617919921875, -0.67974853515625, -0.6580352783203125, -0.636322021484375, -0.6146087646484375, -0.5928955078125, -0.5711822509765625, -0.549468994140625, -0.5277557373046875, -0.50604248046875, -0.4843292236328125, -0.462615966796875, -0.4409027099609375, -0.419189453125, -0.3974761962890625, -0.375762939453125, -0.3540496826171875, -0.33233642578125, -0.3106231689453125, -0.288909912109375, -0.2671966552734375, -0.2454833984375, -0.2237701416015625, -0.202056884765625, -0.1803436279296875, -0.15863037109375, -0.1369171142578125, -0.115203857421875, -0.0934906005859375, -0.07177734375, -0.0500640869140625, -0.028350830078125, -0.0066375732421875, 0.01507568359375, 0.0367889404296875, 0.058502197265625, 0.0802154541015625, 0.1019287109375, 0.1236419677734375, 0.145355224609375, 0.1670684814453125, 0.18878173828125, 0.2104949951171875, 0.232208251953125, 0.2539215087890625, 0.275634765625, 0.2973480224609375, 0.319061279296875, 0.3407745361328125, 0.36248779296875, 0.3842010498046875, 0.405914306640625, 0.4276275634765625, 0.4493408203125, 0.4710540771484375, 0.492767333984375, 0.5144805908203125, 0.53619384765625, 0.5579071044921875, 0.579620361328125, 0.6013336181640625, 0.623046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 8.0, 5.0, 19.0, 21.0, 29.0, 37.0, 36.0, 55.0, 67.0, 86.0, 90.0, 88.0, 97.0, 74.0, 59.0, 58.0, 37.0, 26.0, 26.0, 19.0, 22.0, 10.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5209732055664062, -0.5048370361328125, -0.48870086669921875, -0.472564697265625, -0.45642852783203125, -0.4402923583984375, -0.42415618896484375, -0.40802001953125, -0.39188385009765625, -0.3757476806640625, -0.35961151123046875, -0.343475341796875, -0.32733917236328125, -0.3112030029296875, -0.29506683349609375, -0.2789306640625, -0.26279449462890625, -0.2466583251953125, -0.23052215576171875, -0.214385986328125, -0.19824981689453125, -0.1821136474609375, -0.16597747802734375, -0.14984130859375, -0.13370513916015625, -0.1175689697265625, -0.10143280029296875, -0.085296630859375, -0.06916046142578125, -0.0530242919921875, -0.03688812255859375, -0.020751953125, -0.00461578369140625, 0.0115203857421875, 0.02765655517578125, 0.043792724609375, 0.05992889404296875, 0.0760650634765625, 0.09220123291015625, 0.10833740234375, 0.12447357177734375, 0.1406097412109375, 0.15674591064453125, 0.172882080078125, 0.18901824951171875, 0.2051544189453125, 0.22129058837890625, 0.2374267578125, 0.25356292724609375, 0.2696990966796875, 0.28583526611328125, 0.301971435546875, 0.31810760498046875, 0.3342437744140625, 0.35037994384765625, 0.36651611328125, 0.38265228271484375, 0.3987884521484375, 0.41492462158203125, 0.431060791015625, 0.44719696044921875, 0.4633331298828125, 0.47946929931640625, 0.49560546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 31.0, 83.0, 263.0, 334.0, 173.0, 56.0, 23.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.919252395629883, -22.401060104370117, -21.88286590576172, -21.364673614501953, -20.846481323242188, -20.32828712463379, -19.810094833374023, -19.291902542114258, -18.77370834350586, -18.255516052246094, -17.737321853637695, -17.21912956237793, -16.700937271118164, -16.182743072509766, -15.66455078125, -15.146357536315918, -14.628165245056152, -14.10997200012207, -13.591779708862305, -13.073586463928223, -12.55539321899414, -12.037200927734375, -11.519007682800293, -11.000814437866211, -10.482622146606445, -9.964428901672363, -9.446236610412598, -8.928043365478516, -8.409850120544434, -7.89165735244751, -7.373464584350586, -6.855271339416504, -6.337078094482422, -5.818885326385498, -5.300692081451416, -4.782499313354492, -4.26430606842041, -3.7461133003234863, -3.2279205322265625, -2.7097275257110596, -2.1915345191955566, -1.6733415126800537, -1.1551486253738403, -0.636955738067627, -0.11876273155212402, 0.3994302749633789, 0.9176230430603027, 1.4358160495758057, 1.9540090560913086, 2.4722020626068115, 2.9903950691223145, 3.5085878372192383, 4.02678108215332, 4.544973850250244, 5.063166618347168, 5.58135986328125, 6.099552631378174, 6.617745399475098, 7.13593864440918, 7.6541314125061035, 8.172324180603027, 8.69051742553711, 9.208709716796875, 9.726902961730957, 10.245096206665039]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 5.0, 7.0, 8.0, 13.0, 5.0, 20.0, 18.0, 14.0, 21.0, 18.0, 36.0, 40.0, 37.0, 34.0, 42.0, 56.0, 47.0, 67.0, 57.0, 52.0, 44.0, 43.0, 58.0, 24.0, 35.0, 21.0, 15.0, 26.0, 30.0, 18.0, 7.0, 20.0, 7.0, 10.0, 12.0, 4.0, 9.0, 5.0, 1.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.808499336242676, -6.574554920196533, -6.340610504150391, -6.106666564941406, -5.872722148895264, -5.638777732849121, -5.404833793640137, -5.170889377593994, -4.936944961547852, -4.703000545501709, -4.469056129455566, -4.235112190246582, -4.0011677742004395, -3.767223358154297, -3.5332791805267334, -3.29933500289917, -3.0653905868530273, -2.8314461708068848, -2.5975019931793213, -2.363557815551758, -2.1296133995056152, -1.8956691026687622, -1.6617248058319092, -1.4277805089950562, -1.1938362121582031, -0.9598919153213501, -0.7259476184844971, -0.49200332164764404, -0.258059024810791, -0.02411472797393799, 0.20982956886291504, 0.44377386569976807, 0.6777181625366211, 0.9116624593734741, 1.1456067562103271, 1.3795510530471802, 1.6134953498840332, 1.8474396467208862, 2.0813839435577393, 2.3153281211853027, 2.5492725372314453, 2.783216953277588, 3.0171611309051514, 3.251105308532715, 3.4850497245788574, 3.718994140625, 3.9529383182525635, 4.186882495880127, 4.4208269119262695, 4.654771327972412, 4.888715744018555, 5.122659683227539, 5.356604099273682, 5.590548515319824, 5.824492454528809, 6.058436870574951, 6.292381286621094, 6.526325702667236, 6.760270118713379, 6.994214057922363, 7.228158473968506, 7.462102890014648, 7.696046829223633, 7.929991245269775, 8.163935661315918]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 7.0, 11.0, 20.0, 32.0, 40.0, 81.0, 128.0, 191.0, 422.0, 1039.0, 3308.0, 16675.0, 192017.0, 3529800.0, 419879.0, 23823.0, 4441.0, 1229.0, 484.0, 229.0, 146.0, 79.0, 53.0, 38.0, 38.0, 17.0, 13.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2626953125, -1.2308120727539062, -1.1989288330078125, -1.1670455932617188, -1.135162353515625, -1.1032791137695312, -1.0713958740234375, -1.0395126342773438, -1.00762939453125, -0.9757461547851562, -0.9438629150390625, -0.9119796752929688, -0.880096435546875, -0.8482131958007812, -0.8163299560546875, -0.7844467163085938, -0.7525634765625, -0.7206802368164062, -0.6887969970703125, -0.6569137573242188, -0.625030517578125, -0.5931472778320312, -0.5612640380859375, -0.5293807983398438, -0.49749755859375, -0.46561431884765625, -0.4337310791015625, -0.40184783935546875, -0.369964599609375, -0.33808135986328125, -0.3061981201171875, -0.27431488037109375, -0.242431640625, -0.21054840087890625, -0.1786651611328125, -0.14678192138671875, -0.114898681640625, -0.08301544189453125, -0.0511322021484375, -0.01924896240234375, 0.01263427734375, 0.04451751708984375, 0.0764007568359375, 0.10828399658203125, 0.140167236328125, 0.17205047607421875, 0.2039337158203125, 0.23581695556640625, 0.2677001953125, 0.29958343505859375, 0.3314666748046875, 0.36334991455078125, 0.395233154296875, 0.42711639404296875, 0.4589996337890625, 0.49088287353515625, 0.52276611328125, 0.5546493530273438, 0.5865325927734375, 0.6184158325195312, 0.650299072265625, 0.6821823120117188, 0.7140655517578125, 0.7459487915039062, 0.77783203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 6.0, 6.0, 18.0, 28.0, 26.0, 30.0, 63.0, 62.0, 83.0, 98.0, 103.0, 91.0, 96.0, 85.0, 71.0, 41.0, 38.0, 22.0, 21.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9244003295898438, -0.8961639404296875, -0.8679275512695312, -0.839691162109375, -0.8114547729492188, -0.7832183837890625, -0.7549819946289062, -0.72674560546875, -0.6985092163085938, -0.6702728271484375, -0.6420364379882812, -0.613800048828125, -0.5855636596679688, -0.5573272705078125, -0.5290908813476562, -0.5008544921875, -0.47261810302734375, -0.4443817138671875, -0.41614532470703125, -0.387908935546875, -0.35967254638671875, -0.3314361572265625, -0.30319976806640625, -0.27496337890625, -0.24672698974609375, -0.2184906005859375, -0.19025421142578125, -0.162017822265625, -0.13378143310546875, -0.1055450439453125, -0.07730865478515625, -0.049072265625, -0.02083587646484375, 0.0074005126953125, 0.03563690185546875, 0.063873291015625, 0.09210968017578125, 0.1203460693359375, 0.14858245849609375, 0.17681884765625, 0.20505523681640625, 0.2332916259765625, 0.26152801513671875, 0.289764404296875, 0.31800079345703125, 0.3462371826171875, 0.37447357177734375, 0.4027099609375, 0.43094635009765625, 0.4591827392578125, 0.48741912841796875, 0.515655517578125, 0.5438919067382812, 0.5721282958984375, 0.6003646850585938, 0.62860107421875, 0.6568374633789062, 0.6850738525390625, 0.7133102416992188, 0.741546630859375, 0.7697830200195312, 0.7980194091796875, 0.8262557983398438, 0.8544921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 22.0, 38.0, 63.0, 138.0, 293.0, 772.0, 3267.0, 29310.0, 2471930.0, 1660037.0, 24659.0, 2753.0, 610.0, 224.0, 81.0, 31.0, 22.0, 8.0, 11.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9344024658203125, -1.883453369140625, -1.8325042724609375, -1.78155517578125, -1.7306060791015625, -1.679656982421875, -1.6287078857421875, -1.5777587890625, -1.5268096923828125, -1.475860595703125, -1.4249114990234375, -1.37396240234375, -1.3230133056640625, -1.272064208984375, -1.2211151123046875, -1.170166015625, -1.1192169189453125, -1.068267822265625, -1.0173187255859375, -0.96636962890625, -0.9154205322265625, -0.864471435546875, -0.8135223388671875, -0.7625732421875, -0.7116241455078125, -0.660675048828125, -0.6097259521484375, -0.55877685546875, -0.5078277587890625, -0.456878662109375, -0.4059295654296875, -0.35498046875, -0.3040313720703125, -0.253082275390625, -0.2021331787109375, -0.15118408203125, -0.1002349853515625, -0.049285888671875, 0.0016632080078125, 0.0526123046875, 0.1035614013671875, 0.154510498046875, 0.2054595947265625, 0.25640869140625, 0.3073577880859375, 0.358306884765625, 0.4092559814453125, 0.460205078125, 0.5111541748046875, 0.562103271484375, 0.6130523681640625, 0.66400146484375, 0.7149505615234375, 0.765899658203125, 0.8168487548828125, 0.8677978515625, 0.9187469482421875, 0.969696044921875, 1.0206451416015625, 1.07159423828125, 1.1225433349609375, 1.173492431640625, 1.2244415283203125, 1.275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 9.0, 10.0, 6.0, 12.0, 18.0, 35.0, 48.0, 69.0, 114.0, 304.0, 598.0, 951.0, 865.0, 477.0, 239.0, 106.0, 68.0, 44.0, 34.0, 19.0, 11.0, 12.0, 8.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4091796875, -1.3698883056640625, -1.330596923828125, -1.2913055419921875, -1.25201416015625, -1.2127227783203125, -1.173431396484375, -1.1341400146484375, -1.0948486328125, -1.0555572509765625, -1.016265869140625, -0.9769744873046875, -0.93768310546875, -0.8983917236328125, -0.859100341796875, -0.8198089599609375, -0.780517578125, -0.7412261962890625, -0.701934814453125, -0.6626434326171875, -0.62335205078125, -0.5840606689453125, -0.544769287109375, -0.5054779052734375, -0.4661865234375, -0.4268951416015625, -0.387603759765625, -0.3483123779296875, -0.30902099609375, -0.2697296142578125, -0.230438232421875, -0.1911468505859375, -0.15185546875, -0.1125640869140625, -0.073272705078125, -0.0339813232421875, 0.00531005859375, 0.0446014404296875, 0.083892822265625, 0.1231842041015625, 0.1624755859375, 0.2017669677734375, 0.241058349609375, 0.2803497314453125, 0.31964111328125, 0.3589324951171875, 0.398223876953125, 0.4375152587890625, 0.476806640625, 0.5160980224609375, 0.555389404296875, 0.5946807861328125, 0.63397216796875, 0.6732635498046875, 0.712554931640625, 0.7518463134765625, 0.7911376953125, 0.8304290771484375, 0.869720458984375, 0.9090118408203125, 0.94830322265625, 0.9875946044921875, 1.026885986328125, 1.0661773681640625, 1.10546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 21.0, 62.0, 183.0, 344.0, 236.0, 103.0, 19.0, 9.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.195302963256836, -11.739367485046387, -11.283432960510254, -10.827497482299805, -10.371562957763672, -9.915627479553223, -9.45969295501709, -9.00375747680664, -8.547822952270508, -8.091887474060059, -7.635952949523926, -7.180017948150635, -6.724082946777344, -6.2681474685668945, -5.812212944030762, -5.3562774658203125, -4.9003424644470215, -4.4444074630737305, -3.9884724617004395, -3.5325374603271484, -3.0766024589538574, -2.6206672191619873, -2.1647322177886963, -1.7087972164154053, -1.2528622150421143, -0.7969272136688232, -0.34099215269088745, 0.11494290828704834, 0.5708779096603394, 1.02681303024292, 1.482748031616211, 1.938683032989502, 2.394618034362793, 2.850553035736084, 3.306488037109375, 3.762423038482666, 4.218358039855957, 4.674293518066406, 5.130228042602539, 5.586163520812988, 6.042098045349121, 6.498033046722412, 6.953968048095703, 7.409903049468994, 7.865838050842285, 8.321773529052734, 8.777708053588867, 9.233643531799316, 9.689579010009766, 10.145514488220215, 10.601449012756348, 11.057384490966797, 11.51331901550293, 11.969254493713379, 12.425189018249512, 12.881124496459961, 13.337059020996094, 13.792994499206543, 14.248929023742676, 14.704864501953125, 15.160799026489258, 15.616734504699707, 16.072669982910156, 16.52860450744629, 16.984539031982422]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 6.0, 10.0, 6.0, 19.0, 11.0, 14.0, 19.0, 27.0, 28.0, 43.0, 41.0, 42.0, 56.0, 58.0, 49.0, 66.0, 58.0, 54.0, 55.0, 50.0, 49.0, 40.0, 36.0, 25.0, 17.0, 21.0, 22.0, 14.0, 9.0, 12.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.975935935974121, -4.809560775756836, -4.643185615539551, -4.476810932159424, -4.310435771942139, -4.1440606117248535, -3.9776854515075684, -3.811310291290283, -3.644935369491577, -3.478560209274292, -3.312185287475586, -3.145810127258301, -2.9794349670410156, -2.8130600452423096, -2.6466848850250244, -2.4803099632263184, -2.313934803009033, -2.147559642791748, -1.981184720993042, -1.8148095607757568, -1.6484345197677612, -1.4820594787597656, -1.3156843185424805, -1.1493092775344849, -0.9829342365264893, -0.8165591955184937, -0.6501840949058533, -0.4838090240955353, -0.3174339532852173, -0.15105891227722168, 0.015316188335418701, 0.18169128894805908, 0.3480663299560547, 0.5144413709640503, 0.6808164715766907, 0.847191572189331, 1.0135666131973267, 1.1799416542053223, 1.3463168144226074, 1.512691855430603, 1.6790668964385986, 1.8454419374465942, 2.01181697845459, 2.178192138671875, 2.34456729888916, 2.510942220687866, 2.6773173809051514, 2.8436923027038574, 3.0100674629211426, 3.1764426231384277, 3.342817544937134, 3.509192705154419, 3.675567626953125, 3.84194278717041, 4.008317947387695, 4.1746931076049805, 4.341068267822266, 4.507443428039551, 4.673818588256836, 4.840193271636963, 5.006568431854248, 5.172943592071533, 5.339318752288818, 5.5056939125061035, 5.6720685958862305]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 15.0, 15.0, 14.0, 28.0, 41.0, 56.0, 69.0, 127.0, 186.0, 243.0, 385.0, 681.0, 1165.0, 2219.0, 4604.0, 9824.0, 23457.0, 59631.0, 154248.0, 312223.0, 275130.0, 122370.0, 46872.0, 18565.0, 8027.0, 3794.0, 1885.0, 1036.0, 545.0, 389.0, 225.0, 148.0, 104.0, 65.0, 48.0, 30.0, 37.0, 17.0, 8.0, 8.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.58331298828125, -0.5631103515625, -0.54290771484375, -0.522705078125, -0.50250244140625, -0.4822998046875, -0.46209716796875, -0.44189453125, -0.42169189453125, -0.4014892578125, -0.38128662109375, -0.361083984375, -0.34088134765625, -0.3206787109375, -0.30047607421875, -0.2802734375, -0.26007080078125, -0.2398681640625, -0.21966552734375, -0.199462890625, -0.17926025390625, -0.1590576171875, -0.13885498046875, -0.11865234375, -0.09844970703125, -0.0782470703125, -0.05804443359375, -0.037841796875, -0.01763916015625, 0.0025634765625, 0.02276611328125, 0.04296875, 0.06317138671875, 0.0833740234375, 0.10357666015625, 0.123779296875, 0.14398193359375, 0.1641845703125, 0.18438720703125, 0.20458984375, 0.22479248046875, 0.2449951171875, 0.26519775390625, 0.285400390625, 0.30560302734375, 0.3258056640625, 0.34600830078125, 0.3662109375, 0.38641357421875, 0.4066162109375, 0.42681884765625, 0.447021484375, 0.46722412109375, 0.4874267578125, 0.50762939453125, 0.52783203125, 0.54803466796875, 0.5682373046875, 0.58843994140625, 0.608642578125, 0.62884521484375, 0.6490478515625, 0.66925048828125, 0.689453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 16.0, 25.0, 26.0, 42.0, 50.0, 67.0, 72.0, 92.0, 97.0, 104.0, 76.0, 79.0, 63.0, 52.0, 49.0, 30.0, 14.0, 14.0, 4.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8449172973632812, -0.8192291259765625, -0.7935409545898438, -0.767852783203125, -0.7421646118164062, -0.7164764404296875, -0.6907882690429688, -0.66510009765625, -0.6394119262695312, -0.6137237548828125, -0.5880355834960938, -0.562347412109375, -0.5366592407226562, -0.5109710693359375, -0.48528289794921875, -0.4595947265625, -0.43390655517578125, -0.4082183837890625, -0.38253021240234375, -0.356842041015625, -0.33115386962890625, -0.3054656982421875, -0.27977752685546875, -0.25408935546875, -0.22840118408203125, -0.2027130126953125, -0.17702484130859375, -0.151336669921875, -0.12564849853515625, -0.0999603271484375, -0.07427215576171875, -0.048583984375, -0.02289581298828125, 0.0027923583984375, 0.02848052978515625, 0.054168701171875, 0.07985687255859375, 0.1055450439453125, 0.13123321533203125, 0.15692138671875, 0.18260955810546875, 0.2082977294921875, 0.23398590087890625, 0.259674072265625, 0.28536224365234375, 0.3110504150390625, 0.33673858642578125, 0.3624267578125, 0.38811492919921875, 0.4138031005859375, 0.43949127197265625, 0.465179443359375, 0.49086761474609375, 0.5165557861328125, 0.5422439575195312, 0.56793212890625, 0.5936203002929688, 0.6193084716796875, 0.6449966430664062, 0.670684814453125, 0.6963729858398438, 0.7220611572265625, 0.7477493286132812, 0.7734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 8.0, 6.0, 15.0, 16.0, 13.0, 27.0, 31.0, 47.0, 59.0, 79.0, 130.0, 169.0, 242.0, 292.0, 478.0, 730.0, 1209.0, 2458.0, 7311.0, 42912.0, 551185.0, 392141.0, 36717.0, 6575.0, 2326.0, 1181.0, 627.0, 443.0, 316.0, 222.0, 146.0, 115.0, 83.0, 61.0, 39.0, 39.0, 28.0, 16.0, 20.0, 11.0, 7.0, 10.0, 5.0, 6.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.5046844482421875, -1.457611083984375, -1.4105377197265625, -1.36346435546875, -1.3163909912109375, -1.269317626953125, -1.2222442626953125, -1.1751708984375, -1.1280975341796875, -1.081024169921875, -1.0339508056640625, -0.98687744140625, -0.9398040771484375, -0.892730712890625, -0.8456573486328125, -0.798583984375, -0.7515106201171875, -0.704437255859375, -0.6573638916015625, -0.61029052734375, -0.5632171630859375, -0.516143798828125, -0.4690704345703125, -0.4219970703125, -0.3749237060546875, -0.327850341796875, -0.2807769775390625, -0.23370361328125, -0.1866302490234375, -0.139556884765625, -0.0924835205078125, -0.04541015625, 0.0016632080078125, 0.048736572265625, 0.0958099365234375, 0.14288330078125, 0.1899566650390625, 0.237030029296875, 0.2841033935546875, 0.3311767578125, 0.3782501220703125, 0.425323486328125, 0.4723968505859375, 0.51947021484375, 0.5665435791015625, 0.613616943359375, 0.6606903076171875, 0.707763671875, 0.7548370361328125, 0.801910400390625, 0.8489837646484375, 0.89605712890625, 0.9431304931640625, 0.990203857421875, 1.0372772216796875, 1.0843505859375, 1.1314239501953125, 1.178497314453125, 1.2255706787109375, 1.27264404296875, 1.3197174072265625, 1.366790771484375, 1.4138641357421875, 1.4609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 7.0, 9.0, 5.0, 13.0, 12.0, 7.0, 11.0, 16.0, 20.0, 18.0, 14.0, 25.0, 32.0, 33.0, 33.0, 49.0, 58.0, 43.0, 43.0, 39.0, 42.0, 49.0, 45.0, 48.0, 37.0, 38.0, 39.0, 27.0, 17.0, 24.0, 17.0, 20.0, 19.0, 14.0, 16.0, 13.0, 7.0, 6.0, 10.0, 2.0, 8.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-1.94140625, -1.8848114013671875, -1.828216552734375, -1.7716217041015625, -1.71502685546875, -1.6584320068359375, -1.601837158203125, -1.5452423095703125, -1.4886474609375, -1.4320526123046875, -1.375457763671875, -1.3188629150390625, -1.26226806640625, -1.2056732177734375, -1.149078369140625, -1.0924835205078125, -1.035888671875, -0.9792938232421875, -0.922698974609375, -0.8661041259765625, -0.80950927734375, -0.7529144287109375, -0.696319580078125, -0.6397247314453125, -0.5831298828125, -0.5265350341796875, -0.469940185546875, -0.4133453369140625, -0.35675048828125, -0.3001556396484375, -0.243560791015625, -0.1869659423828125, -0.13037109375, -0.0737762451171875, -0.017181396484375, 0.0394134521484375, 0.09600830078125, 0.1526031494140625, 0.209197998046875, 0.2657928466796875, 0.3223876953125, 0.3789825439453125, 0.435577392578125, 0.4921722412109375, 0.54876708984375, 0.6053619384765625, 0.661956787109375, 0.7185516357421875, 0.775146484375, 0.8317413330078125, 0.888336181640625, 0.9449310302734375, 1.00152587890625, 1.0581207275390625, 1.114715576171875, 1.1713104248046875, 1.2279052734375, 1.2845001220703125, 1.341094970703125, 1.3976898193359375, 1.45428466796875, 1.5108795166015625, 1.567474365234375, 1.6240692138671875, 1.6806640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 7.0, 18.0, 14.0, 28.0, 38.0, 52.0, 99.0, 179.0, 271.0, 678.0, 1843.0, 5841.0, 33848.0, 668913.0, 307529.0, 22064.0, 4465.0, 1363.0, 621.0, 317.0, 133.0, 79.0, 44.0, 37.0, 21.0, 18.0, 3.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59912109375, -0.5809097290039062, -0.5626983642578125, -0.5444869995117188, -0.526275634765625, -0.5080642700195312, -0.4898529052734375, -0.47164154052734375, -0.45343017578125, -0.43521881103515625, -0.4170074462890625, -0.39879608154296875, -0.380584716796875, -0.36237335205078125, -0.3441619873046875, -0.32595062255859375, -0.3077392578125, -0.28952789306640625, -0.2713165283203125, -0.25310516357421875, -0.234893798828125, -0.21668243408203125, -0.1984710693359375, -0.18025970458984375, -0.16204833984375, -0.14383697509765625, -0.1256256103515625, -0.10741424560546875, -0.089202880859375, -0.07099151611328125, -0.0527801513671875, -0.03456878662109375, -0.016357421875, 0.00185394287109375, 0.0200653076171875, 0.03827667236328125, 0.056488037109375, 0.07469940185546875, 0.0929107666015625, 0.11112213134765625, 0.12933349609375, 0.14754486083984375, 0.1657562255859375, 0.18396759033203125, 0.202178955078125, 0.22039031982421875, 0.2386016845703125, 0.25681304931640625, 0.2750244140625, 0.29323577880859375, 0.3114471435546875, 0.32965850830078125, 0.347869873046875, 0.36608123779296875, 0.3842926025390625, 0.40250396728515625, 0.42071533203125, 0.43892669677734375, 0.4571380615234375, 0.47534942626953125, 0.493560791015625, 0.5117721557617188, 0.5299835205078125, 0.5481948852539062, 0.56640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 6.0, 9.0, 5.0, 18.0, 23.0, 19.0, 35.0, 38.0, 49.0, 63.0, 91.0, 108.0, 118.0, 79.0, 84.0, 59.0, 33.0, 41.0, 19.0, 22.0, 19.0, 22.0, 12.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00011360645294189453, -0.00011077430099248886, -0.00010794214904308319, -0.00010510999709367752, -0.00010227784514427185, -9.944569319486618e-05, -9.661354124546051e-05, -9.378138929605484e-05, -9.094923734664917e-05, -8.81170853972435e-05, -8.528493344783783e-05, -8.245278149843216e-05, -7.962062954902649e-05, -7.678847759962082e-05, -7.395632565021515e-05, -7.112417370080948e-05, -6.829202175140381e-05, -6.545986980199814e-05, -6.262771785259247e-05, -5.97955659031868e-05, -5.696341395378113e-05, -5.413126200437546e-05, -5.129911005496979e-05, -4.846695810556412e-05, -4.563480615615845e-05, -4.280265420675278e-05, -3.997050225734711e-05, -3.713835030794144e-05, -3.4306198358535767e-05, -3.1474046409130096e-05, -2.8641894459724426e-05, -2.5809742510318756e-05, -2.2977590560913086e-05, -2.0145438611507416e-05, -1.7313286662101746e-05, -1.4481134712696075e-05, -1.1648982763290405e-05, -8.816830813884735e-06, -5.984678864479065e-06, -3.1525269150733948e-06, -3.203749656677246e-07, 2.5117769837379456e-06, 5.343928933143616e-06, 8.176080882549286e-06, 1.1008232831954956e-05, 1.3840384781360626e-05, 1.6672536730766296e-05, 1.9504688680171967e-05, 2.2336840629577637e-05, 2.5168992578983307e-05, 2.8001144528388977e-05, 3.083329647779465e-05, 3.366544842720032e-05, 3.649760037660599e-05, 3.932975232601166e-05, 4.216190427541733e-05, 4.4994056224823e-05, 4.782620817422867e-05, 5.065836012363434e-05, 5.349051207304001e-05, 5.632266402244568e-05, 5.915481597185135e-05, 6.198696792125702e-05, 6.481911987066269e-05, 6.765127182006836e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 13.0, 18.0, 37.0, 44.0, 70.0, 112.0, 207.0, 378.0, 710.0, 1893.0, 6822.0, 56294.0, 863266.0, 104752.0, 9680.0, 2350.0, 883.0, 421.0, 226.0, 137.0, 75.0, 51.0, 43.0, 21.0, 12.0, 13.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68994140625, -0.670562744140625, -0.65118408203125, -0.631805419921875, -0.6124267578125, -0.593048095703125, -0.57366943359375, -0.554290771484375, -0.534912109375, -0.515533447265625, -0.49615478515625, -0.476776123046875, -0.4573974609375, -0.438018798828125, -0.41864013671875, -0.399261474609375, -0.3798828125, -0.360504150390625, -0.34112548828125, -0.321746826171875, -0.3023681640625, -0.282989501953125, -0.26361083984375, -0.244232177734375, -0.224853515625, -0.205474853515625, -0.18609619140625, -0.166717529296875, -0.1473388671875, -0.127960205078125, -0.10858154296875, -0.089202880859375, -0.06982421875, -0.050445556640625, -0.03106689453125, -0.011688232421875, 0.0076904296875, 0.027069091796875, 0.04644775390625, 0.065826416015625, 0.085205078125, 0.104583740234375, 0.12396240234375, 0.143341064453125, 0.1627197265625, 0.182098388671875, 0.20147705078125, 0.220855712890625, 0.240234375, 0.259613037109375, 0.27899169921875, 0.298370361328125, 0.3177490234375, 0.337127685546875, 0.35650634765625, 0.375885009765625, 0.395263671875, 0.414642333984375, 0.43402099609375, 0.453399658203125, 0.4727783203125, 0.492156982421875, 0.51153564453125, 0.530914306640625, 0.55029296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 9.0, 12.0, 18.0, 19.0, 25.0, 34.0, 47.0, 64.0, 98.0, 107.0, 104.0, 107.0, 108.0, 59.0, 47.0, 31.0, 26.0, 15.0, 18.0, 9.0, 8.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5864791870117188, -0.5684661865234375, -0.5504531860351562, -0.532440185546875, -0.5144271850585938, -0.4964141845703125, -0.47840118408203125, -0.46038818359375, -0.44237518310546875, -0.4243621826171875, -0.40634918212890625, -0.388336181640625, -0.37032318115234375, -0.3523101806640625, -0.33429718017578125, -0.3162841796875, -0.29827117919921875, -0.2802581787109375, -0.26224517822265625, -0.244232177734375, -0.22621917724609375, -0.2082061767578125, -0.19019317626953125, -0.17218017578125, -0.15416717529296875, -0.1361541748046875, -0.11814117431640625, -0.100128173828125, -0.08211517333984375, -0.0641021728515625, -0.04608917236328125, -0.028076171875, -0.01006317138671875, 0.0079498291015625, 0.02596282958984375, 0.043975830078125, 0.06198883056640625, 0.0800018310546875, 0.09801483154296875, 0.11602783203125, 0.13404083251953125, 0.1520538330078125, 0.17006683349609375, 0.188079833984375, 0.20609283447265625, 0.2241058349609375, 0.24211883544921875, 0.2601318359375, 0.27814483642578125, 0.2961578369140625, 0.31417083740234375, 0.332183837890625, 0.35019683837890625, 0.3682098388671875, 0.38622283935546875, 0.40423583984375, 0.42224884033203125, 0.4402618408203125, 0.45827484130859375, 0.476287841796875, 0.49430084228515625, 0.5123138427734375, 0.5303268432617188, 0.54833984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 39.0, 77.0, 212.0, 346.0, 185.0, 66.0, 29.0, 18.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.19564437866211, -21.73833465576172, -21.281023025512695, -20.823713302612305, -20.36640167236328, -19.90909194946289, -19.451780319213867, -18.994470596313477, -18.537158966064453, -18.079849243164062, -17.62253761291504, -17.16522789001465, -16.707916259765625, -16.250606536865234, -15.793295860290527, -15.33598518371582, -14.87867546081543, -14.421364784240723, -13.964054107666016, -13.506743431091309, -13.049432754516602, -12.592123031616211, -12.134812355041504, -11.677501678466797, -11.22019100189209, -10.762880325317383, -10.305569648742676, -9.848258972167969, -9.390949249267578, -8.933637619018555, -8.476327896118164, -8.019017219543457, -7.561707019805908, -7.104396343231201, -6.647086143493652, -6.189775466918945, -5.732464790344238, -5.275154113769531, -4.817843437194824, -4.360533237457275, -3.9032225608825684, -3.4459118843078613, -2.9886014461517334, -2.5312910079956055, -2.0739803314208984, -1.6166696548461914, -1.1593592166900635, -0.7020487785339355, -0.24473810195922852, 0.21257245540618896, 0.6698830127716064, 1.127193570137024, 1.5845041275024414, 2.0418148040771484, 2.4991252422332764, 2.9564356803894043, 3.4137463569641113, 3.8710570335388184, 4.328367233276367, 4.785677909851074, 5.242988586425781, 5.700299263000488, 6.157609939575195, 6.614920139312744, 7.072230815887451]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 4.0, 7.0, 11.0, 10.0, 7.0, 17.0, 18.0, 14.0, 15.0, 15.0, 18.0, 33.0, 32.0, 32.0, 24.0, 41.0, 39.0, 45.0, 53.0, 84.0, 53.0, 62.0, 53.0, 41.0, 34.0, 30.0, 36.0, 28.0, 21.0, 24.0, 15.0, 21.0, 12.0, 9.0, 8.0, 9.0, 7.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.471921920776367, -6.248087406158447, -6.024252891540527, -5.800418376922607, -5.5765838623046875, -5.352749824523926, -5.128914833068848, -4.905080795288086, -4.681246280670166, -4.457411766052246, -4.233577251434326, -4.009742736816406, -3.7859084606170654, -3.5620739459991455, -3.3382394313812256, -3.1144051551818848, -2.8905704021453857, -2.666735887527466, -2.442901372909546, -2.219067096710205, -1.9952325820922852, -1.7713980674743652, -1.5475635528564453, -1.323729157447815, -1.099894642829895, -0.8760601878166199, -0.6522257328033447, -0.4283912181854248, -0.20455676317214966, 0.01927769184112549, 0.2431122064590454, 0.4669466018676758, 0.6907811164855957, 0.9146155714988708, 1.138450026512146, 1.362284541130066, 1.5861189365386963, 1.8099534511566162, 2.033787965774536, 2.257622241973877, 2.481456756591797, 2.705291271209717, 2.9291257858276367, 3.1529603004455566, 3.3767945766448975, 3.6006290912628174, 3.8244636058807373, 4.048297882080078, 4.272132873535156, 4.495967388153076, 4.719801902770996, 4.943636417388916, 5.167470932006836, 5.391304969787598, 5.615139961242676, 5.8389739990234375, 6.062808513641357, 6.286643028259277, 6.510477542877197, 6.734312057495117, 6.958146572113037, 7.181981086730957, 7.405815124511719, 7.629649639129639, 7.853484153747559]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 5.0, 7.0, 13.0, 9.0, 24.0, 43.0, 73.0, 122.0, 225.0, 473.0, 1012.0, 2842.0, 9793.0, 48000.0, 508167.0, 3087990.0, 477593.0, 44336.0, 8839.0, 2690.0, 976.0, 463.0, 244.0, 146.0, 66.0, 45.0, 30.0, 14.0, 18.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7170028686523438, -0.6962127685546875, -0.6754226684570312, -0.654632568359375, -0.6338424682617188, -0.6130523681640625, -0.5922622680664062, -0.57147216796875, -0.5506820678710938, -0.5298919677734375, -0.5091018676757812, -0.488311767578125, -0.46752166748046875, -0.4467315673828125, -0.42594146728515625, -0.4051513671875, -0.38436126708984375, -0.3635711669921875, -0.34278106689453125, -0.321990966796875, -0.30120086669921875, -0.2804107666015625, -0.25962066650390625, -0.23883056640625, -0.21804046630859375, -0.1972503662109375, -0.17646026611328125, -0.155670166015625, -0.13488006591796875, -0.1140899658203125, -0.09329986572265625, -0.072509765625, -0.05171966552734375, -0.0309295654296875, -0.01013946533203125, 0.010650634765625, 0.03144073486328125, 0.0522308349609375, 0.07302093505859375, 0.09381103515625, 0.11460113525390625, 0.1353912353515625, 0.15618133544921875, 0.176971435546875, 0.19776153564453125, 0.2185516357421875, 0.23934173583984375, 0.2601318359375, 0.28092193603515625, 0.3017120361328125, 0.32250213623046875, 0.343292236328125, 0.36408233642578125, 0.3848724365234375, 0.40566253662109375, 0.42645263671875, 0.44724273681640625, 0.4680328369140625, 0.48882293701171875, 0.509613037109375, 0.5304031372070312, 0.5511932373046875, 0.5719833374023438, 0.5927734375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 4.0, 11.0, 30.0, 22.0, 39.0, 53.0, 66.0, 77.0, 90.0, 85.0, 105.0, 75.0, 84.0, 63.0, 54.0, 40.0, 30.0, 19.0, 14.0, 8.0, 7.0, 1.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8504791259765625, -0.825469970703125, -0.8004608154296875, -0.77545166015625, -0.7504425048828125, -0.725433349609375, -0.7004241943359375, -0.6754150390625, -0.6504058837890625, -0.625396728515625, -0.6003875732421875, -0.57537841796875, -0.5503692626953125, -0.525360107421875, -0.5003509521484375, -0.475341796875, -0.4503326416015625, -0.425323486328125, -0.4003143310546875, -0.37530517578125, -0.3502960205078125, -0.325286865234375, -0.3002777099609375, -0.2752685546875, -0.2502593994140625, -0.225250244140625, -0.2002410888671875, -0.17523193359375, -0.1502227783203125, -0.125213623046875, -0.1002044677734375, -0.0751953125, -0.0501861572265625, -0.025177001953125, -0.0001678466796875, 0.02484130859375, 0.0498504638671875, 0.074859619140625, 0.0998687744140625, 0.1248779296875, 0.1498870849609375, 0.174896240234375, 0.1999053955078125, 0.22491455078125, 0.2499237060546875, 0.274932861328125, 0.2999420166015625, 0.324951171875, 0.3499603271484375, 0.374969482421875, 0.3999786376953125, 0.42498779296875, 0.4499969482421875, 0.475006103515625, 0.5000152587890625, 0.5250244140625, 0.5500335693359375, 0.575042724609375, 0.6000518798828125, 0.62506103515625, 0.6500701904296875, 0.675079345703125, 0.7000885009765625, 0.72509765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 36.0, 55.0, 91.0, 185.0, 532.0, 2272.0, 25967.0, 3783608.0, 371839.0, 8048.0, 1125.0, 310.0, 107.0, 47.0, 24.0, 9.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1953125, -2.1372222900390625, -2.079132080078125, -2.0210418701171875, -1.96295166015625, -1.9048614501953125, -1.846771240234375, -1.7886810302734375, -1.7305908203125, -1.6725006103515625, -1.614410400390625, -1.5563201904296875, -1.49822998046875, -1.4401397705078125, -1.382049560546875, -1.3239593505859375, -1.265869140625, -1.2077789306640625, -1.149688720703125, -1.0915985107421875, -1.03350830078125, -0.9754180908203125, -0.917327880859375, -0.8592376708984375, -0.8011474609375, -0.7430572509765625, -0.684967041015625, -0.6268768310546875, -0.56878662109375, -0.5106964111328125, -0.452606201171875, -0.3945159912109375, -0.33642578125, -0.2783355712890625, -0.220245361328125, -0.1621551513671875, -0.10406494140625, -0.0459747314453125, 0.012115478515625, 0.0702056884765625, 0.1282958984375, 0.1863861083984375, 0.244476318359375, 0.3025665283203125, 0.36065673828125, 0.4187469482421875, 0.476837158203125, 0.5349273681640625, 0.593017578125, 0.6511077880859375, 0.709197998046875, 0.7672882080078125, 0.82537841796875, 0.8834686279296875, 0.941558837890625, 0.9996490478515625, 1.0577392578125, 1.1158294677734375, 1.173919677734375, 1.2320098876953125, 1.29010009765625, 1.3481903076171875, 1.406280517578125, 1.4643707275390625, 1.5224609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 8.0, 15.0, 19.0, 26.0, 53.0, 88.0, 205.0, 520.0, 1063.0, 1024.0, 485.0, 255.0, 124.0, 65.0, 42.0, 24.0, 17.0, 13.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6474609375, -1.6063766479492188, -1.5652923583984375, -1.5242080688476562, -1.483123779296875, -1.4420394897460938, -1.4009552001953125, -1.3598709106445312, -1.31878662109375, -1.2777023315429688, -1.2366180419921875, -1.1955337524414062, -1.154449462890625, -1.1133651733398438, -1.0722808837890625, -1.0311965942382812, -0.9901123046875, -0.9490280151367188, -0.9079437255859375, -0.8668594360351562, -0.825775146484375, -0.7846908569335938, -0.7436065673828125, -0.7025222778320312, -0.66143798828125, -0.6203536987304688, -0.5792694091796875, -0.5381851196289062, -0.497100830078125, -0.45601654052734375, -0.4149322509765625, -0.37384796142578125, -0.332763671875, -0.29167938232421875, -0.2505950927734375, -0.20951080322265625, -0.168426513671875, -0.12734222412109375, -0.0862579345703125, -0.04517364501953125, -0.00408935546875, 0.03699493408203125, 0.0780792236328125, 0.11916351318359375, 0.160247802734375, 0.20133209228515625, 0.2424163818359375, 0.28350067138671875, 0.3245849609375, 0.36566925048828125, 0.4067535400390625, 0.44783782958984375, 0.488922119140625, 0.5300064086914062, 0.5710906982421875, 0.6121749877929688, 0.65325927734375, 0.6943435668945312, 0.7354278564453125, 0.7765121459960938, 0.817596435546875, 0.8586807250976562, 0.8997650146484375, 0.9408493041992188, 0.98193359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 13.0, 44.0, 79.0, 154.0, 239.0, 242.0, 118.0, 38.0, 30.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.334019660949707, -9.047407150268555, -8.760793685913086, -8.474181175231934, -8.187568664550781, -7.900955677032471, -7.61434268951416, -7.327730178833008, -7.041117191314697, -6.754504203796387, -6.467891693115234, -6.181278705596924, -5.894665718078613, -5.608053207397461, -5.32144021987915, -5.03482723236084, -4.7482147216796875, -4.461601734161377, -4.174989223480225, -3.888376235961914, -3.6017634868621826, -3.315150737762451, -3.0285377502441406, -2.741925001144409, -2.4553122520446777, -2.1686995029449463, -1.8820866346359253, -1.5954737663269043, -1.3088610172271729, -1.0222482681274414, -0.7356353998184204, -0.4490225315093994, -0.16241073608398438, 0.12420207262039185, 0.41081488132476807, 0.6974276900291443, 0.9840404987335205, 1.270653247833252, 1.557266116142273, 1.843878984451294, 2.1304917335510254, 2.417104482650757, 2.7037172317504883, 2.990330219268799, 3.2769429683685303, 3.5635557174682617, 3.8501687049865723, 4.136781692504883, 4.423394203186035, 4.710007190704346, 4.996619701385498, 5.283232688903809, 5.569845199584961, 5.8564581871032715, 6.143071174621582, 6.429683685302734, 6.716296672821045, 7.0029096603393555, 7.289522171020508, 7.576135158538818, 7.862748146057129, 8.149360656738281, 8.435973167419434, 8.722586631774902, 9.009199142456055]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 10.0, 5.0, 7.0, 20.0, 14.0, 16.0, 16.0, 19.0, 28.0, 28.0, 37.0, 35.0, 44.0, 38.0, 46.0, 47.0, 62.0, 51.0, 46.0, 55.0, 44.0, 48.0, 38.0, 40.0, 30.0, 29.0, 19.0, 32.0, 19.0, 12.0, 11.0, 16.0, 4.0, 10.0, 3.0, 6.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3766865730285645, -4.241964340209961, -4.107242107391357, -3.972520112991333, -3.8377978801727295, -3.703075647354126, -3.5683536529541016, -3.433631420135498, -3.2989091873168945, -3.164186954498291, -3.0294647216796875, -2.894742727279663, -2.7600204944610596, -2.625298261642456, -2.4905762672424316, -2.355854034423828, -2.2211318016052246, -2.086409568786621, -1.9516874551773071, -1.8169653415679932, -1.6822431087493896, -1.5475208759307861, -1.4127987623214722, -1.2780766487121582, -1.1433544158935547, -1.0086321830749512, -0.8739100694656372, -0.7391878962516785, -0.6044657230377197, -0.469743549823761, -0.33502137660980225, -0.2002992033958435, -0.06557655334472656, 0.06914561986923218, 0.20386779308319092, 0.33858996629714966, 0.4733121395111084, 0.6080343127250671, 0.7427564859390259, 0.8774786591529846, 1.0122008323669434, 1.1469230651855469, 1.2816451787948608, 1.4163672924041748, 1.5510895252227783, 1.6858117580413818, 1.8205338716506958, 1.9552559852600098, 2.0899782180786133, 2.224700450897217, 2.3594226837158203, 2.4941446781158447, 2.6288669109344482, 2.7635891437530518, 2.898311138153076, 3.0330333709716797, 3.167755603790283, 3.3024778366088867, 3.4372000694274902, 3.5719220638275146, 3.706644296646118, 3.8413665294647217, 3.976088523864746, 4.11081075668335, 4.245532989501953]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 9.0, 15.0, 20.0, 43.0, 45.0, 88.0, 160.0, 273.0, 607.0, 1091.0, 2639.0, 6787.0, 20665.0, 80607.0, 340930.0, 437857.0, 113879.0, 28102.0, 8621.0, 3290.0, 1401.0, 657.0, 323.0, 179.0, 101.0, 60.0, 38.0, 27.0, 15.0, 7.0, 9.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.05859375, -1.0300750732421875, -1.001556396484375, -0.9730377197265625, -0.94451904296875, -0.9160003662109375, -0.887481689453125, -0.8589630126953125, -0.8304443359375, -0.8019256591796875, -0.773406982421875, -0.7448883056640625, -0.71636962890625, -0.6878509521484375, -0.659332275390625, -0.6308135986328125, -0.602294921875, -0.5737762451171875, -0.545257568359375, -0.5167388916015625, -0.48822021484375, -0.4597015380859375, -0.431182861328125, -0.4026641845703125, -0.3741455078125, -0.3456268310546875, -0.317108154296875, -0.2885894775390625, -0.26007080078125, -0.2315521240234375, -0.203033447265625, -0.1745147705078125, -0.14599609375, -0.1174774169921875, -0.088958740234375, -0.0604400634765625, -0.03192138671875, -0.0034027099609375, 0.025115966796875, 0.0536346435546875, 0.0821533203125, 0.1106719970703125, 0.139190673828125, 0.1677093505859375, 0.19622802734375, 0.2247467041015625, 0.253265380859375, 0.2817840576171875, 0.310302734375, 0.3388214111328125, 0.367340087890625, 0.3958587646484375, 0.42437744140625, 0.4528961181640625, 0.481414794921875, 0.5099334716796875, 0.5384521484375, 0.5669708251953125, 0.595489501953125, 0.6240081787109375, 0.65252685546875, 0.6810455322265625, 0.709564208984375, 0.7380828857421875, 0.7666015625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 7.0, 9.0, 8.0, 19.0, 28.0, 28.0, 38.0, 54.0, 60.0, 82.0, 110.0, 78.0, 86.0, 85.0, 56.0, 83.0, 43.0, 48.0, 22.0, 21.0, 12.0, 9.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.85400390625, -0.8294296264648438, -0.8048553466796875, -0.7802810668945312, -0.755706787109375, -0.7311325073242188, -0.7065582275390625, -0.6819839477539062, -0.65740966796875, -0.6328353881835938, -0.6082611083984375, -0.5836868286132812, -0.559112548828125, -0.5345382690429688, -0.5099639892578125, -0.48538970947265625, -0.4608154296875, -0.43624114990234375, -0.4116668701171875, -0.38709259033203125, -0.362518310546875, -0.33794403076171875, -0.3133697509765625, -0.28879547119140625, -0.26422119140625, -0.23964691162109375, -0.2150726318359375, -0.19049835205078125, -0.165924072265625, -0.14134979248046875, -0.1167755126953125, -0.09220123291015625, -0.067626953125, -0.04305267333984375, -0.0184783935546875, 0.00609588623046875, 0.030670166015625, 0.05524444580078125, 0.0798187255859375, 0.10439300537109375, 0.12896728515625, 0.15354156494140625, 0.1781158447265625, 0.20269012451171875, 0.227264404296875, 0.25183868408203125, 0.2764129638671875, 0.30098724365234375, 0.3255615234375, 0.35013580322265625, 0.3747100830078125, 0.39928436279296875, 0.423858642578125, 0.44843292236328125, 0.4730072021484375, 0.49758148193359375, 0.52215576171875, 0.5467300415039062, 0.5713043212890625, 0.5958786010742188, 0.620452880859375, 0.6450271606445312, 0.6696014404296875, 0.6941757202148438, 0.71875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 12.0, 16.0, 26.0, 29.0, 29.0, 62.0, 72.0, 125.0, 215.0, 350.0, 558.0, 1205.0, 3399.0, 22804.0, 630962.0, 365553.0, 17389.0, 3058.0, 1160.0, 605.0, 341.0, 203.0, 130.0, 77.0, 53.0, 40.0, 32.0, 10.0, 9.0, 9.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5101776123046875, -1.447113037109375, -1.3840484619140625, -1.32098388671875, -1.2579193115234375, -1.194854736328125, -1.1317901611328125, -1.0687255859375, -1.0056610107421875, -0.942596435546875, -0.8795318603515625, -0.81646728515625, -0.7534027099609375, -0.690338134765625, -0.6272735595703125, -0.564208984375, -0.5011444091796875, -0.438079833984375, -0.3750152587890625, -0.31195068359375, -0.2488861083984375, -0.185821533203125, -0.1227569580078125, -0.0596923828125, 0.0033721923828125, 0.066436767578125, 0.1295013427734375, 0.19256591796875, 0.2556304931640625, 0.318695068359375, 0.3817596435546875, 0.44482421875, 0.5078887939453125, 0.570953369140625, 0.6340179443359375, 0.69708251953125, 0.7601470947265625, 0.823211669921875, 0.8862762451171875, 0.9493408203125, 1.0124053955078125, 1.075469970703125, 1.1385345458984375, 1.20159912109375, 1.2646636962890625, 1.327728271484375, 1.3907928466796875, 1.453857421875, 1.5169219970703125, 1.579986572265625, 1.6430511474609375, 1.70611572265625, 1.7691802978515625, 1.832244873046875, 1.8953094482421875, 1.9583740234375, 2.0214385986328125, 2.084503173828125, 2.1475677490234375, 2.21063232421875, 2.2736968994140625, 2.336761474609375, 2.3998260498046875, 2.462890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 1.0, 10.0, 7.0, 14.0, 7.0, 17.0, 21.0, 18.0, 36.0, 25.0, 22.0, 33.0, 36.0, 30.0, 28.0, 53.0, 50.0, 59.0, 57.0, 57.0, 61.0, 50.0, 33.0, 35.0, 33.0, 42.0, 23.0, 33.0, 20.0, 22.0, 14.0, 11.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.5524749755859375, -1.496551513671875, -1.4406280517578125, -1.38470458984375, -1.3287811279296875, -1.272857666015625, -1.2169342041015625, -1.1610107421875, -1.1050872802734375, -1.049163818359375, -0.9932403564453125, -0.93731689453125, -0.8813934326171875, -0.825469970703125, -0.7695465087890625, -0.713623046875, -0.6576995849609375, -0.601776123046875, -0.5458526611328125, -0.48992919921875, -0.4340057373046875, -0.378082275390625, -0.3221588134765625, -0.2662353515625, -0.2103118896484375, -0.154388427734375, -0.0984649658203125, -0.04254150390625, 0.0133819580078125, 0.069305419921875, 0.1252288818359375, 0.18115234375, 0.2370758056640625, 0.292999267578125, 0.3489227294921875, 0.40484619140625, 0.4607696533203125, 0.516693115234375, 0.5726165771484375, 0.6285400390625, 0.6844635009765625, 0.740386962890625, 0.7963104248046875, 0.85223388671875, 0.9081573486328125, 0.964080810546875, 1.0200042724609375, 1.075927734375, 1.1318511962890625, 1.187774658203125, 1.2436981201171875, 1.29962158203125, 1.3555450439453125, 1.411468505859375, 1.4673919677734375, 1.5233154296875, 1.5792388916015625, 1.635162353515625, 1.6910858154296875, 1.74700927734375, 1.8029327392578125, 1.858856201171875, 1.9147796630859375, 1.970703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 11.0, 17.0, 9.0, 19.0, 13.0, 19.0, 32.0, 59.0, 81.0, 146.0, 271.0, 710.0, 1947.0, 10253.0, 175761.0, 824561.0, 28864.0, 3811.0, 1056.0, 412.0, 210.0, 96.0, 53.0, 38.0, 23.0, 21.0, 11.0, 7.0, 9.0, 6.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6276626586914062, -0.6054229736328125, -0.5831832885742188, -0.560943603515625, -0.5387039184570312, -0.5164642333984375, -0.49422454833984375, -0.47198486328125, -0.44974517822265625, -0.4275054931640625, -0.40526580810546875, -0.383026123046875, -0.36078643798828125, -0.3385467529296875, -0.31630706787109375, -0.2940673828125, -0.27182769775390625, -0.2495880126953125, -0.22734832763671875, -0.205108642578125, -0.18286895751953125, -0.1606292724609375, -0.13838958740234375, -0.11614990234375, -0.09391021728515625, -0.0716705322265625, -0.04943084716796875, -0.027191162109375, -0.00495147705078125, 0.0172882080078125, 0.03952789306640625, 0.061767578125, 0.08400726318359375, 0.1062469482421875, 0.12848663330078125, 0.150726318359375, 0.17296600341796875, 0.1952056884765625, 0.21744537353515625, 0.23968505859375, 0.26192474365234375, 0.2841644287109375, 0.30640411376953125, 0.328643798828125, 0.35088348388671875, 0.3731231689453125, 0.39536285400390625, 0.4176025390625, 0.43984222412109375, 0.4620819091796875, 0.48432159423828125, 0.506561279296875, 0.5288009643554688, 0.5510406494140625, 0.5732803344726562, 0.59552001953125, 0.6177597045898438, 0.6399993896484375, 0.6622390747070312, 0.684478759765625, 0.7067184448242188, 0.7289581298828125, 0.7511978149414062, 0.7734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 3.0, 7.0, 9.0, 8.0, 7.0, 12.0, 10.0, 24.0, 21.0, 24.0, 31.0, 45.0, 69.0, 82.0, 117.0, 103.0, 83.0, 91.0, 58.0, 35.0, 32.0, 25.0, 22.0, 9.0, 11.0, 10.0, 17.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.730722427368164e-05, -7.474608719348907e-05, -7.218495011329651e-05, -6.962381303310394e-05, -6.706267595291138e-05, -6.450153887271881e-05, -6.194040179252625e-05, -5.937926471233368e-05, -5.681812763214111e-05, -5.425699055194855e-05, -5.169585347175598e-05, -4.9134716391563416e-05, -4.657357931137085e-05, -4.4012442231178284e-05, -4.145130515098572e-05, -3.889016807079315e-05, -3.6329030990600586e-05, -3.376789391040802e-05, -3.1206756830215454e-05, -2.8645619750022888e-05, -2.6084482669830322e-05, -2.3523345589637756e-05, -2.096220850944519e-05, -1.8401071429252625e-05, -1.583993434906006e-05, -1.3278797268867493e-05, -1.0717660188674927e-05, -8.15652310848236e-06, -5.595386028289795e-06, -3.034248948097229e-06, -4.731118679046631e-07, 2.088025212287903e-06, 4.649162292480469e-06, 7.210299372673035e-06, 9.7714364528656e-06, 1.2332573533058167e-05, 1.4893710613250732e-05, 1.74548476934433e-05, 2.0015984773635864e-05, 2.257712185382843e-05, 2.5138258934020996e-05, 2.7699396014213562e-05, 3.0260533094406128e-05, 3.2821670174598694e-05, 3.538280725479126e-05, 3.7943944334983826e-05, 4.050508141517639e-05, 4.306621849536896e-05, 4.5627355575561523e-05, 4.818849265575409e-05, 5.0749629735946655e-05, 5.331076681613922e-05, 5.587190389633179e-05, 5.843304097652435e-05, 6.099417805671692e-05, 6.355531513690948e-05, 6.611645221710205e-05, 6.867758929729462e-05, 7.123872637748718e-05, 7.379986345767975e-05, 7.636100053787231e-05, 7.892213761806488e-05, 8.148327469825745e-05, 8.404441177845001e-05, 8.660554885864258e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 6.0, 8.0, 21.0, 23.0, 35.0, 53.0, 92.0, 175.0, 388.0, 922.0, 2847.0, 19398.0, 784106.0, 227706.0, 9544.0, 1951.0, 641.0, 284.0, 126.0, 87.0, 56.0, 35.0, 16.0, 9.0, 8.0, 9.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49609375, -0.4743804931640625, -0.452667236328125, -0.4309539794921875, -0.40924072265625, -0.3875274658203125, -0.365814208984375, -0.3441009521484375, -0.3223876953125, -0.3006744384765625, -0.278961181640625, -0.2572479248046875, -0.23553466796875, -0.2138214111328125, -0.192108154296875, -0.1703948974609375, -0.148681640625, -0.1269683837890625, -0.105255126953125, -0.0835418701171875, -0.06182861328125, -0.0401153564453125, -0.018402099609375, 0.0033111572265625, 0.0250244140625, 0.0467376708984375, 0.068450927734375, 0.0901641845703125, 0.11187744140625, 0.1335906982421875, 0.155303955078125, 0.1770172119140625, 0.19873046875, 0.2204437255859375, 0.242156982421875, 0.2638702392578125, 0.28558349609375, 0.3072967529296875, 0.329010009765625, 0.3507232666015625, 0.3724365234375, 0.3941497802734375, 0.415863037109375, 0.4375762939453125, 0.45928955078125, 0.4810028076171875, 0.502716064453125, 0.5244293212890625, 0.546142578125, 0.5678558349609375, 0.589569091796875, 0.6112823486328125, 0.63299560546875, 0.6547088623046875, 0.676422119140625, 0.6981353759765625, 0.7198486328125, 0.7415618896484375, 0.763275146484375, 0.7849884033203125, 0.80670166015625, 0.8284149169921875, 0.850128173828125, 0.8718414306640625, 0.8935546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 5.0, 3.0, 7.0, 16.0, 18.0, 28.0, 46.0, 58.0, 74.0, 96.0, 125.0, 112.0, 109.0, 90.0, 59.0, 56.0, 28.0, 18.0, 14.0, 7.0, 6.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.544921875, -0.5286026000976562, -0.5122833251953125, -0.49596405029296875, -0.479644775390625, -0.46332550048828125, -0.4470062255859375, -0.43068695068359375, -0.41436767578125, -0.39804840087890625, -0.3817291259765625, -0.36540985107421875, -0.349090576171875, -0.33277130126953125, -0.3164520263671875, -0.30013275146484375, -0.2838134765625, -0.26749420166015625, -0.2511749267578125, -0.23485565185546875, -0.218536376953125, -0.20221710205078125, -0.1858978271484375, -0.16957855224609375, -0.15325927734375, -0.13694000244140625, -0.1206207275390625, -0.10430145263671875, -0.087982177734375, -0.07166290283203125, -0.0553436279296875, -0.03902435302734375, -0.022705078125, -0.00638580322265625, 0.0099334716796875, 0.02625274658203125, 0.042572021484375, 0.05889129638671875, 0.0752105712890625, 0.09152984619140625, 0.10784912109375, 0.12416839599609375, 0.1404876708984375, 0.15680694580078125, 0.173126220703125, 0.18944549560546875, 0.2057647705078125, 0.22208404541015625, 0.2384033203125, 0.25472259521484375, 0.2710418701171875, 0.28736114501953125, 0.303680419921875, 0.31999969482421875, 0.3363189697265625, 0.35263824462890625, 0.36895751953125, 0.38527679443359375, 0.4015960693359375, 0.41791534423828125, 0.434234619140625, 0.45055389404296875, 0.4668731689453125, 0.48319244384765625, 0.49951171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 33.0, 45.0, 101.0, 165.0, 269.0, 186.0, 84.0, 45.0, 18.0, 10.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.406059265136719, -13.091744422912598, -12.777429580688477, -12.463113784790039, -12.148798942565918, -11.834484100341797, -11.520169258117676, -11.205854415893555, -10.891538619995117, -10.577223777770996, -10.262908935546875, -9.948593139648438, -9.634278297424316, -9.319963455200195, -9.005648612976074, -8.691333770751953, -8.377018928527832, -8.062704086303711, -7.748388767242432, -7.4340739250183105, -7.119758605957031, -6.80544376373291, -6.491128921508789, -6.176814079284668, -5.862498760223389, -5.548183917999268, -5.233868598937988, -4.919553756713867, -4.605238914489746, -4.290923595428467, -3.9766087532043457, -3.6622936725616455, -3.3479795455932617, -3.0336644649505615, -2.7193493843078613, -2.4050345420837402, -2.09071946144104, -1.7764043807983398, -1.4620894193649292, -1.1477744579315186, -0.8334593772888184, -0.5191443562507629, -0.20482933521270752, 0.1094856858253479, 0.4238007068634033, 0.7381157875061035, 1.0524307489395142, 1.3667457103729248, 1.681060791015625, 1.9953758716583252, 2.3096909523010254, 2.6240057945251465, 2.9383208751678467, 3.252635955810547, 3.566950798034668, 3.881265878677368, 4.195580959320068, 4.5098958015441895, 4.824211120605469, 5.13852596282959, 5.452840805053711, 5.76715612411499, 6.081470966339111, 6.395786285400391, 6.710101127624512]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 3.0, 5.0, 5.0, 7.0, 7.0, 12.0, 15.0, 19.0, 20.0, 18.0, 20.0, 27.0, 21.0, 33.0, 33.0, 39.0, 42.0, 76.0, 60.0, 69.0, 88.0, 58.0, 46.0, 28.0, 25.0, 24.0, 26.0, 21.0, 35.0, 19.0, 21.0, 12.0, 17.0, 7.0, 5.0, 5.0, 7.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.3751115798950195, -7.153839588165283, -6.932567596435547, -6.7112956047058105, -6.490023612976074, -6.26875114440918, -6.047479152679443, -5.826207160949707, -5.604935169219971, -5.383663177490234, -5.162391185760498, -4.941119194030762, -4.719846725463867, -4.498575210571289, -4.2773027420043945, -4.056030750274658, -3.834758758544922, -3.6134867668151855, -3.392214775085449, -3.170942544937134, -2.9496705532073975, -2.728398561477661, -2.5071263313293457, -2.2858543395996094, -2.064582347869873, -1.8433103561401367, -1.6220382452011108, -1.400766134262085, -1.1794941425323486, -0.9582221508026123, -0.7369500398635864, -0.5156779289245605, -0.2944064140319824, -0.07313436269760132, 0.14813768863677979, 0.3694097399711609, 0.590681791305542, 0.8119537830352783, 1.0332258939743042, 1.25449800491333, 1.4757699966430664, 1.6970419883728027, 1.9183140993118286, 2.1395862102508545, 2.360858201980591, 2.582130193710327, 2.8034024238586426, 3.024674415588379, 3.2459464073181152, 3.4672183990478516, 3.688490390777588, 3.9097626209259033, 4.131034851074219, 4.352306365966797, 4.573578834533691, 4.794850826263428, 5.016122817993164, 5.2373948097229, 5.458666801452637, 5.679938793182373, 5.901210784912109, 6.122483253479004, 6.34375524520874, 6.565027236938477, 6.786299228668213]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 12.0, 11.0, 11.0, 29.0, 36.0, 60.0, 120.0, 305.0, 656.0, 1942.0, 9935.0, 149303.0, 3719025.0, 297144.0, 12021.0, 2269.0, 707.0, 279.0, 169.0, 93.0, 53.0, 29.0, 24.0, 16.0, 9.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.9617156982421875, -0.930267333984375, -0.8988189697265625, -0.86737060546875, -0.8359222412109375, -0.804473876953125, -0.7730255126953125, -0.7415771484375, -0.7101287841796875, -0.678680419921875, -0.6472320556640625, -0.61578369140625, -0.5843353271484375, -0.552886962890625, -0.5214385986328125, -0.489990234375, -0.4585418701171875, -0.427093505859375, -0.3956451416015625, -0.36419677734375, -0.3327484130859375, -0.301300048828125, -0.2698516845703125, -0.2384033203125, -0.2069549560546875, -0.175506591796875, -0.1440582275390625, -0.11260986328125, -0.0811614990234375, -0.049713134765625, -0.0182647705078125, 0.01318359375, 0.0446319580078125, 0.076080322265625, 0.1075286865234375, 0.13897705078125, 0.1704254150390625, 0.201873779296875, 0.2333221435546875, 0.2647705078125, 0.2962188720703125, 0.327667236328125, 0.3591156005859375, 0.39056396484375, 0.4220123291015625, 0.453460693359375, 0.4849090576171875, 0.516357421875, 0.5478057861328125, 0.579254150390625, 0.6107025146484375, 0.64215087890625, 0.6735992431640625, 0.705047607421875, 0.7364959716796875, 0.7679443359375, 0.7993927001953125, 0.830841064453125, 0.8622894287109375, 0.89373779296875, 0.9251861572265625, 0.956634521484375, 0.9880828857421875, 1.01953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 18.0, 17.0, 30.0, 34.0, 40.0, 64.0, 61.0, 99.0, 86.0, 95.0, 92.0, 82.0, 64.0, 53.0, 49.0, 33.0, 22.0, 10.0, 10.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8671875, -0.8426132202148438, -0.8180389404296875, -0.7934646606445312, -0.768890380859375, -0.7443161010742188, -0.7197418212890625, -0.6951675415039062, -0.67059326171875, -0.6460189819335938, -0.6214447021484375, -0.5968704223632812, -0.572296142578125, -0.5477218627929688, -0.5231475830078125, -0.49857330322265625, -0.4739990234375, -0.44942474365234375, -0.4248504638671875, -0.40027618408203125, -0.375701904296875, -0.35112762451171875, -0.3265533447265625, -0.30197906494140625, -0.27740478515625, -0.25283050537109375, -0.2282562255859375, -0.20368194580078125, -0.179107666015625, -0.15453338623046875, -0.1299591064453125, -0.10538482666015625, -0.080810546875, -0.05623626708984375, -0.0316619873046875, -0.00708770751953125, 0.017486572265625, 0.04206085205078125, 0.0666351318359375, 0.09120941162109375, 0.11578369140625, 0.14035797119140625, 0.1649322509765625, 0.18950653076171875, 0.214080810546875, 0.23865509033203125, 0.2632293701171875, 0.28780364990234375, 0.3123779296875, 0.33695220947265625, 0.3615264892578125, 0.38610076904296875, 0.410675048828125, 0.43524932861328125, 0.4598236083984375, 0.48439788818359375, 0.50897216796875, 0.5335464477539062, 0.5581207275390625, 0.5826950073242188, 0.607269287109375, 0.6318435668945312, 0.6564178466796875, 0.6809921264648438, 0.70556640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 8.0, 10.0, 6.0, 16.0, 25.0, 32.0, 85.0, 119.0, 262.0, 505.0, 1088.0, 2641.0, 9104.0, 63157.0, 3368683.0, 711049.0, 27958.0, 5567.0, 2077.0, 905.0, 421.0, 244.0, 117.0, 66.0, 43.0, 18.0, 12.0, 13.0, 9.0, 7.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93115234375, -0.8999252319335938, -0.8686981201171875, -0.8374710083007812, -0.806243896484375, -0.7750167846679688, -0.7437896728515625, -0.7125625610351562, -0.68133544921875, -0.6501083374023438, -0.6188812255859375, -0.5876541137695312, -0.556427001953125, -0.5251998901367188, -0.4939727783203125, -0.46274566650390625, -0.4315185546875, -0.40029144287109375, -0.3690643310546875, -0.33783721923828125, -0.306610107421875, -0.27538299560546875, -0.2441558837890625, -0.21292877197265625, -0.18170166015625, -0.15047454833984375, -0.1192474365234375, -0.08802032470703125, -0.056793212890625, -0.02556610107421875, 0.0056610107421875, 0.03688812255859375, 0.068115234375, 0.09934234619140625, 0.1305694580078125, 0.16179656982421875, 0.193023681640625, 0.22425079345703125, 0.2554779052734375, 0.28670501708984375, 0.31793212890625, 0.34915924072265625, 0.3803863525390625, 0.41161346435546875, 0.442840576171875, 0.47406768798828125, 0.5052947998046875, 0.5365219116210938, 0.5677490234375, 0.5989761352539062, 0.6302032470703125, 0.6614303588867188, 0.692657470703125, 0.7238845825195312, 0.7551116943359375, 0.7863388061523438, 0.81756591796875, 0.8487930297851562, 0.8800201416015625, 0.9112472534179688, 0.942474365234375, 0.9737014770507812, 1.0049285888671875, 1.0361557006835938, 1.0673828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 8.0, 9.0, 12.0, 24.0, 22.0, 39.0, 64.0, 132.0, 321.0, 706.0, 1175.0, 828.0, 360.0, 152.0, 89.0, 40.0, 27.0, 26.0, 13.0, 4.0, 8.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.99658203125, -0.962890625, -0.92919921875, -0.8955078125, -0.86181640625, -0.828125, -0.79443359375, -0.7607421875, -0.72705078125, -0.693359375, -0.65966796875, -0.6259765625, -0.59228515625, -0.55859375, -0.52490234375, -0.4912109375, -0.45751953125, -0.423828125, -0.39013671875, -0.3564453125, -0.32275390625, -0.2890625, -0.25537109375, -0.2216796875, -0.18798828125, -0.154296875, -0.12060546875, -0.0869140625, -0.05322265625, -0.01953125, 0.01416015625, 0.0478515625, 0.08154296875, 0.115234375, 0.14892578125, 0.1826171875, 0.21630859375, 0.25, 0.28369140625, 0.3173828125, 0.35107421875, 0.384765625, 0.41845703125, 0.4521484375, 0.48583984375, 0.51953125, 0.55322265625, 0.5869140625, 0.62060546875, 0.654296875, 0.68798828125, 0.7216796875, 0.75537109375, 0.7890625, 0.82275390625, 0.8564453125, 0.89013671875, 0.923828125, 0.95751953125, 0.9912109375, 1.02490234375, 1.05859375, 1.09228515625, 1.1259765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 10.0, 21.0, 44.0, 119.0, 246.0, 252.0, 152.0, 63.0, 32.0, 16.0, 9.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.174121856689453, -7.919416427612305, -7.6647114753723145, -7.410006046295166, -7.155301094055176, -6.900595664978027, -6.645890235900879, -6.3911848068237305, -6.13647985458374, -5.881774425506592, -5.627069473266602, -5.372364044189453, -5.117658615112305, -4.8629536628723145, -4.608248233795166, -4.353543281555176, -4.098837852478027, -3.844132661819458, -3.5894274711608887, -3.3347220420837402, -3.080016851425171, -2.8253116607666016, -2.570606231689453, -2.315901041030884, -2.0611958503723145, -1.8064906597137451, -1.5517853498458862, -1.2970800399780273, -1.042374849319458, -0.7876696586608887, -0.5329643487930298, -0.2782590389251709, -0.023553848266601562, 0.23115140199661255, 0.48585665225982666, 0.7405619025230408, 0.9952671527862549, 1.2499723434448242, 1.504677653312683, 1.759382963180542, 2.0140881538391113, 2.2687933444976807, 2.52349853515625, 2.7782039642333984, 3.0329091548919678, 3.287614345550537, 3.5423197746276855, 3.797024965286255, 4.051730155944824, 4.306435585021973, 4.561140537261963, 4.815845966339111, 5.070550918579102, 5.32525634765625, 5.579961776733398, 5.834667205810547, 6.089372158050537, 6.3440775871276855, 6.598782539367676, 6.853487968444824, 7.108193397521973, 7.362898349761963, 7.617603778839111, 7.872308731079102, 8.12701416015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 11.0, 14.0, 10.0, 17.0, 24.0, 30.0, 35.0, 45.0, 44.0, 69.0, 56.0, 73.0, 105.0, 77.0, 66.0, 66.0, 58.0, 53.0, 39.0, 32.0, 29.0, 10.0, 16.0, 12.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.137676239013672, -5.969976425170898, -5.802276611328125, -5.634576797485352, -5.466876983642578, -5.299177169799805, -5.131477355957031, -4.963777542114258, -4.796077728271484, -4.628377914428711, -4.4606781005859375, -4.292978286743164, -4.125278472900391, -3.957578659057617, -3.7898788452148438, -3.6221790313720703, -3.454479455947876, -3.2867796421051025, -3.119079828262329, -2.9513800144195557, -2.7836802005767822, -2.615980386734009, -2.4482808113098145, -2.280580997467041, -2.1128811836242676, -1.9451813697814941, -1.7774815559387207, -1.6097817420959473, -1.4420819282531738, -1.2743821144104004, -1.1066824197769165, -0.9389826059341431, -0.7712826728820801, -0.6035828590393066, -0.4358830749988556, -0.26818329095840454, -0.1004834771156311, 0.06721633672714233, 0.234916090965271, 0.40261590480804443, 0.5703157186508179, 0.7380155324935913, 0.9057153463363647, 1.0734150409698486, 1.241114854812622, 1.4088146686553955, 1.576514482498169, 1.7442142963409424, 1.9119141101837158, 2.0796139240264893, 2.2473137378692627, 2.415013551712036, 2.5827133655548096, 2.750413179397583, 2.9181127548217773, 3.085812568664551, 3.253512382507324, 3.4212121963500977, 3.588912010192871, 3.7566118240356445, 3.924311637878418, 4.092011451721191, 4.259711265563965, 4.427411079406738, 4.595110893249512]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 8.0, 18.0, 27.0, 37.0, 85.0, 115.0, 265.0, 515.0, 1258.0, 3878.0, 15113.0, 86926.0, 505120.0, 366210.0, 53885.0, 10267.0, 2832.0, 1038.0, 459.0, 206.0, 111.0, 57.0, 33.0, 19.0, 11.0, 13.0, 11.0, 3.0, 9.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9921875, -0.960052490234375, -0.92791748046875, -0.895782470703125, -0.8636474609375, -0.831512451171875, -0.79937744140625, -0.767242431640625, -0.735107421875, -0.702972412109375, -0.67083740234375, -0.638702392578125, -0.6065673828125, -0.574432373046875, -0.54229736328125, -0.510162353515625, -0.47802734375, -0.445892333984375, -0.41375732421875, -0.381622314453125, -0.3494873046875, -0.317352294921875, -0.28521728515625, -0.253082275390625, -0.220947265625, -0.188812255859375, -0.15667724609375, -0.124542236328125, -0.0924072265625, -0.060272216796875, -0.02813720703125, 0.003997802734375, 0.0361328125, 0.068267822265625, 0.10040283203125, 0.132537841796875, 0.1646728515625, 0.196807861328125, 0.22894287109375, 0.261077880859375, 0.293212890625, 0.325347900390625, 0.35748291015625, 0.389617919921875, 0.4217529296875, 0.453887939453125, 0.48602294921875, 0.518157958984375, 0.55029296875, 0.582427978515625, 0.61456298828125, 0.646697998046875, 0.6788330078125, 0.710968017578125, 0.74310302734375, 0.775238037109375, 0.807373046875, 0.839508056640625, 0.87164306640625, 0.903778076171875, 0.9359130859375, 0.968048095703125, 1.00018310546875, 1.032318115234375, 1.064453125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 4.0, 5.0, 11.0, 25.0, 24.0, 33.0, 49.0, 58.0, 84.0, 106.0, 77.0, 77.0, 88.0, 85.0, 66.0, 56.0, 36.0, 34.0, 24.0, 13.0, 14.0, 10.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85986328125, -0.8354644775390625, -0.811065673828125, -0.7866668701171875, -0.76226806640625, -0.7378692626953125, -0.713470458984375, -0.6890716552734375, -0.6646728515625, -0.6402740478515625, -0.615875244140625, -0.5914764404296875, -0.56707763671875, -0.5426788330078125, -0.518280029296875, -0.4938812255859375, -0.469482421875, -0.4450836181640625, -0.420684814453125, -0.3962860107421875, -0.37188720703125, -0.3474884033203125, -0.323089599609375, -0.2986907958984375, -0.2742919921875, -0.2498931884765625, -0.225494384765625, -0.2010955810546875, -0.17669677734375, -0.1522979736328125, -0.127899169921875, -0.1035003662109375, -0.0791015625, -0.0547027587890625, -0.030303955078125, -0.0059051513671875, 0.01849365234375, 0.0428924560546875, 0.067291259765625, 0.0916900634765625, 0.1160888671875, 0.1404876708984375, 0.164886474609375, 0.1892852783203125, 0.21368408203125, 0.2380828857421875, 0.262481689453125, 0.2868804931640625, 0.311279296875, 0.3356781005859375, 0.360076904296875, 0.3844757080078125, 0.40887451171875, 0.4332733154296875, 0.457672119140625, 0.4820709228515625, 0.5064697265625, 0.5308685302734375, 0.555267333984375, 0.5796661376953125, 0.60406494140625, 0.6284637451171875, 0.652862548828125, 0.6772613525390625, 0.70166015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 2.0, 5.0, 15.0, 18.0, 25.0, 22.0, 32.0, 43.0, 73.0, 143.0, 239.0, 594.0, 2396.0, 17745.0, 288439.0, 696987.0, 36315.0, 3806.0, 906.0, 308.0, 150.0, 74.0, 54.0, 37.0, 35.0, 22.0, 19.0, 15.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2724609375, -1.2218475341796875, -1.171234130859375, -1.1206207275390625, -1.07000732421875, -1.0193939208984375, -0.968780517578125, -0.9181671142578125, -0.8675537109375, -0.8169403076171875, -0.766326904296875, -0.7157135009765625, -0.66510009765625, -0.6144866943359375, -0.563873291015625, -0.5132598876953125, -0.462646484375, -0.4120330810546875, -0.361419677734375, -0.3108062744140625, -0.26019287109375, -0.2095794677734375, -0.158966064453125, -0.1083526611328125, -0.0577392578125, -0.0071258544921875, 0.043487548828125, 0.0941009521484375, 0.14471435546875, 0.1953277587890625, 0.245941162109375, 0.2965545654296875, 0.34716796875, 0.3977813720703125, 0.448394775390625, 0.4990081787109375, 0.54962158203125, 0.6002349853515625, 0.650848388671875, 0.7014617919921875, 0.7520751953125, 0.8026885986328125, 0.853302001953125, 0.9039154052734375, 0.95452880859375, 1.0051422119140625, 1.055755615234375, 1.1063690185546875, 1.156982421875, 1.2075958251953125, 1.258209228515625, 1.3088226318359375, 1.35943603515625, 1.4100494384765625, 1.460662841796875, 1.5112762451171875, 1.5618896484375, 1.6125030517578125, 1.663116455078125, 1.7137298583984375, 1.76434326171875, 1.8149566650390625, 1.865570068359375, 1.9161834716796875, 1.966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 9.0, 16.0, 15.0, 19.0, 18.0, 38.0, 32.0, 41.0, 37.0, 44.0, 55.0, 48.0, 55.0, 59.0, 49.0, 48.0, 53.0, 58.0, 34.0, 34.0, 41.0, 33.0, 33.0, 24.0, 13.0, 11.0, 16.0, 9.0, 7.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.64453125, -1.588623046875, -1.53271484375, -1.476806640625, -1.4208984375, -1.364990234375, -1.30908203125, -1.253173828125, -1.197265625, -1.141357421875, -1.08544921875, -1.029541015625, -0.9736328125, -0.917724609375, -0.86181640625, -0.805908203125, -0.75, -0.694091796875, -0.63818359375, -0.582275390625, -0.5263671875, -0.470458984375, -0.41455078125, -0.358642578125, -0.302734375, -0.246826171875, -0.19091796875, -0.135009765625, -0.0791015625, -0.023193359375, 0.03271484375, 0.088623046875, 0.14453125, 0.200439453125, 0.25634765625, 0.312255859375, 0.3681640625, 0.424072265625, 0.47998046875, 0.535888671875, 0.591796875, 0.647705078125, 0.70361328125, 0.759521484375, 0.8154296875, 0.871337890625, 0.92724609375, 0.983154296875, 1.0390625, 1.094970703125, 1.15087890625, 1.206787109375, 1.2626953125, 1.318603515625, 1.37451171875, 1.430419921875, 1.486328125, 1.542236328125, 1.59814453125, 1.654052734375, 1.7099609375, 1.765869140625, 1.82177734375, 1.877685546875, 1.93359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 12.0, 13.0, 23.0, 27.0, 57.0, 95.0, 205.0, 458.0, 1018.0, 2797.0, 10517.0, 58005.0, 695990.0, 241905.0, 28067.0, 6076.0, 1884.0, 710.0, 308.0, 169.0, 102.0, 49.0, 27.0, 16.0, 9.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.2593803405761719, -0.24800872802734375, -0.23663711547851562, -0.2252655029296875, -0.21389389038085938, -0.20252227783203125, -0.19115066528320312, -0.179779052734375, -0.16840744018554688, -0.15703582763671875, -0.14566421508789062, -0.1342926025390625, -0.12292098999023438, -0.11154937744140625, -0.10017776489257812, -0.08880615234375, -0.07743453979492188, -0.06606292724609375, -0.054691314697265625, -0.0433197021484375, -0.031948089599609375, -0.02057647705078125, -0.009204864501953125, 0.002166748046875, 0.013538360595703125, 0.02490997314453125, 0.036281585693359375, 0.0476531982421875, 0.059024810791015625, 0.07039642333984375, 0.08176803588867188, 0.0931396484375, 0.10451126098632812, 0.11588287353515625, 0.12725448608398438, 0.1386260986328125, 0.14999771118164062, 0.16136932373046875, 0.17274093627929688, 0.184112548828125, 0.19548416137695312, 0.20685577392578125, 0.21822738647460938, 0.2295989990234375, 0.24097061157226562, 0.25234222412109375, 0.2637138366699219, 0.27508544921875, 0.2864570617675781, 0.29782867431640625, 0.3092002868652344, 0.3205718994140625, 0.3319435119628906, 0.34331512451171875, 0.3546867370605469, 0.366058349609375, 0.3774299621582031, 0.38880157470703125, 0.4001731872558594, 0.4115447998046875, 0.4229164123535156, 0.43428802490234375, 0.4456596374511719, 0.45703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 8.0, 4.0, 6.0, 13.0, 26.0, 30.0, 45.0, 55.0, 76.0, 88.0, 111.0, 115.0, 91.0, 70.0, 53.0, 51.0, 25.0, 23.0, 28.0, 22.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.798173904418945e-05, -4.59868460893631e-05, -4.399195313453674e-05, -4.199706017971039e-05, -4.000216722488403e-05, -3.800727427005768e-05, -3.601238131523132e-05, -3.401748836040497e-05, -3.202259540557861e-05, -3.0027702450752258e-05, -2.8032809495925903e-05, -2.603791654109955e-05, -2.4043023586273193e-05, -2.204813063144684e-05, -2.0053237676620483e-05, -1.805834472179413e-05, -1.6063451766967773e-05, -1.4068558812141418e-05, -1.2073665857315063e-05, -1.0078772902488708e-05, -8.083879947662354e-06, -6.0889869928359985e-06, -4.0940940380096436e-06, -2.0992010831832886e-06, -1.043081283569336e-07, 1.8905848264694214e-06, 3.885477781295776e-06, 5.880370736122131e-06, 7.875263690948486e-06, 9.870156645774841e-06, 1.1865049600601196e-05, 1.3859942555427551e-05, 1.5854835510253906e-05, 1.784972846508026e-05, 1.9844621419906616e-05, 2.183951437473297e-05, 2.3834407329559326e-05, 2.582930028438568e-05, 2.7824193239212036e-05, 2.981908619403839e-05, 3.1813979148864746e-05, 3.38088721036911e-05, 3.5803765058517456e-05, 3.779865801334381e-05, 3.9793550968170166e-05, 4.178844392299652e-05, 4.3783336877822876e-05, 4.577822983264923e-05, 4.7773122787475586e-05, 4.976801574230194e-05, 5.1762908697128296e-05, 5.375780165195465e-05, 5.5752694606781006e-05, 5.774758756160736e-05, 5.9742480516433716e-05, 6.173737347126007e-05, 6.373226642608643e-05, 6.572715938091278e-05, 6.772205233573914e-05, 6.971694529056549e-05, 7.171183824539185e-05, 7.37067312002182e-05, 7.570162415504456e-05, 7.769651710987091e-05, 7.969141006469727e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 20.0, 24.0, 39.0, 88.0, 143.0, 306.0, 921.0, 4756.0, 51691.0, 842038.0, 137009.0, 9243.0, 1438.0, 418.0, 166.0, 106.0, 45.0, 39.0, 14.0, 11.0, 11.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.3490943908691406, -0.33368682861328125, -0.3182792663574219, -0.3028717041015625, -0.2874641418457031, -0.27205657958984375, -0.2566490173339844, -0.241241455078125, -0.22583389282226562, -0.21042633056640625, -0.19501876831054688, -0.1796112060546875, -0.16420364379882812, -0.14879608154296875, -0.13338851928710938, -0.11798095703125, -0.10257339477539062, -0.08716583251953125, -0.07175827026367188, -0.0563507080078125, -0.040943145751953125, -0.02553558349609375, -0.010128021240234375, 0.005279541015625, 0.020687103271484375, 0.03609466552734375, 0.051502227783203125, 0.0669097900390625, 0.08231735229492188, 0.09772491455078125, 0.11313247680664062, 0.1285400390625, 0.14394760131835938, 0.15935516357421875, 0.17476272583007812, 0.1901702880859375, 0.20557785034179688, 0.22098541259765625, 0.23639297485351562, 0.251800537109375, 0.2672080993652344, 0.28261566162109375, 0.2980232238769531, 0.3134307861328125, 0.3288383483886719, 0.34424591064453125, 0.3596534729003906, 0.37506103515625, 0.3904685974121094, 0.40587615966796875, 0.4212837219238281, 0.4366912841796875, 0.4520988464355469, 0.46750640869140625, 0.4829139709472656, 0.498321533203125, 0.5137290954589844, 0.5291366577148438, 0.5445442199707031, 0.5599517822265625, 0.5753593444824219, 0.5907669067382812, 0.6061744689941406, 0.62158203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 8.0, 9.0, 10.0, 20.0, 31.0, 32.0, 54.0, 76.0, 109.0, 127.0, 134.0, 106.0, 109.0, 69.0, 36.0, 27.0, 19.0, 15.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3505859375, -0.3341522216796875, -0.317718505859375, -0.3012847900390625, -0.28485107421875, -0.2684173583984375, -0.251983642578125, -0.2355499267578125, -0.2191162109375, -0.2026824951171875, -0.186248779296875, -0.1698150634765625, -0.15338134765625, -0.1369476318359375, -0.120513916015625, -0.1040802001953125, -0.087646484375, -0.0712127685546875, -0.054779052734375, -0.0383453369140625, -0.02191162109375, -0.0054779052734375, 0.010955810546875, 0.0273895263671875, 0.0438232421875, 0.0602569580078125, 0.076690673828125, 0.0931243896484375, 0.10955810546875, 0.1259918212890625, 0.142425537109375, 0.1588592529296875, 0.17529296875, 0.1917266845703125, 0.208160400390625, 0.2245941162109375, 0.24102783203125, 0.2574615478515625, 0.273895263671875, 0.2903289794921875, 0.3067626953125, 0.3231964111328125, 0.339630126953125, 0.3560638427734375, 0.37249755859375, 0.3889312744140625, 0.405364990234375, 0.4217987060546875, 0.438232421875, 0.4546661376953125, 0.471099853515625, 0.4875335693359375, 0.50396728515625, 0.5204010009765625, 0.536834716796875, 0.5532684326171875, 0.5697021484375, 0.5861358642578125, 0.602569580078125, 0.6190032958984375, 0.63543701171875, 0.6518707275390625, 0.668304443359375, 0.6847381591796875, 0.701171875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 7.0, 3.0, 16.0, 68.0, 171.0, 422.0, 187.0, 66.0, 30.0, 13.0, 8.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.818939208984375, -6.402278423309326, -5.985617637634277, -5.56895637512207, -5.1522955894470215, -4.735634803771973, -4.318974018096924, -3.902312994003296, -3.485652208328247, -3.0689914226531982, -2.6523303985595703, -2.2356696128845215, -1.819008708000183, -1.4023478031158447, -0.9856870174407959, -0.569025993347168, -0.15236520767211914, 0.26429566740989685, 0.6809565424919128, 1.0976173877716064, 1.5142782926559448, 1.9309391975402832, 2.347599983215332, 2.76426100730896, 3.180921792984009, 3.5975825786590576, 4.0142436027526855, 4.430904388427734, 4.847565174102783, 5.264225959777832, 5.680887222290039, 6.097548007965088, 6.514208793640137, 6.9308695793151855, 7.347530364990234, 7.764191627502441, 8.180851936340332, 8.597513198852539, 9.01417350769043, 9.430834770202637, 9.847496032714844, 10.26415729522705, 10.680817604064941, 11.097478866577148, 11.514139175415039, 11.930800437927246, 12.347461700439453, 12.764122009277344, 13.180782318115234, 13.597443580627441, 14.014103889465332, 14.430765151977539, 14.84742546081543, 15.264086723327637, 15.680747985839844, 16.097408294677734, 16.514070510864258, 16.93073081970215, 17.347393035888672, 17.764053344726562, 18.180713653564453, 18.597373962402344, 19.014036178588867, 19.430696487426758, 19.84735679626465]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 8.0, 8.0, 7.0, 9.0, 12.0, 13.0, 26.0, 12.0, 27.0, 26.0, 35.0, 39.0, 44.0, 34.0, 40.0, 55.0, 87.0, 94.0, 54.0, 43.0, 45.0, 35.0, 28.0, 34.0, 22.0, 22.0, 25.0, 19.0, 10.0, 20.0, 7.0, 6.0, 10.0, 5.0, 8.0, 8.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6862077713012695, -5.483908176422119, -5.281608581542969, -5.07930850982666, -4.87700891494751, -4.674709320068359, -4.472409725189209, -4.270110130310059, -4.06781005859375, -3.8655104637145996, -3.66321063041687, -3.4609110355377197, -3.2586112022399902, -3.05631160736084, -2.8540120124816895, -2.651712417602539, -2.4494128227233887, -2.2471132278442383, -2.044813394546509, -1.8425137996673584, -1.6402140855789185, -1.4379143714904785, -1.2356147766113281, -1.0333150625228882, -0.8310153484344482, -0.6287156343460083, -0.42641597986221313, -0.22411632537841797, -0.021816611289978027, 0.18048310279846191, 0.3827826976776123, 0.5850824117660522, 0.7873821258544922, 0.9896818399429321, 1.191981554031372, 1.3942811489105225, 1.5965808629989624, 1.7988805770874023, 2.0011801719665527, 2.203479766845703, 2.4057796001434326, 2.608079195022583, 2.8103790283203125, 3.012678623199463, 3.2149782180786133, 3.4172780513763428, 3.619577646255493, 3.8218774795532227, 4.024177074432373, 4.226476669311523, 4.428776264190674, 4.631075859069824, 4.833375930786133, 5.035675525665283, 5.237975120544434, 5.440274715423584, 5.642574310302734, 5.844873905181885, 6.047173500061035, 6.249473571777344, 6.451773166656494, 6.6540727615356445, 6.856372356414795, 7.058671951293945, 7.260972023010254]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 13.0, 23.0, 33.0, 53.0, 97.0, 152.0, 282.0, 552.0, 1400.0, 3717.0, 11287.0, 60842.0, 688798.0, 2938586.0, 433199.0, 41506.0, 8479.0, 2783.0, 1168.0, 562.0, 266.0, 162.0, 92.0, 67.0, 42.0, 25.0, 27.0, 15.0, 12.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4633216857910156, -0.44641876220703125, -0.4295158386230469, -0.4126129150390625, -0.3957099914550781, -0.37880706787109375, -0.3619041442871094, -0.345001220703125, -0.3280982971191406, -0.31119537353515625, -0.2942924499511719, -0.2773895263671875, -0.2604866027832031, -0.24358367919921875, -0.22668075561523438, -0.20977783203125, -0.19287490844726562, -0.17597198486328125, -0.15906906127929688, -0.1421661376953125, -0.12526321411132812, -0.10836029052734375, -0.09145736694335938, -0.074554443359375, -0.057651519775390625, -0.04074859619140625, -0.023845672607421875, -0.0069427490234375, 0.009960174560546875, 0.02686309814453125, 0.043766021728515625, 0.0606689453125, 0.07757186889648438, 0.09447479248046875, 0.11137771606445312, 0.1282806396484375, 0.14518356323242188, 0.16208648681640625, 0.17898941040039062, 0.195892333984375, 0.21279525756835938, 0.22969818115234375, 0.24660110473632812, 0.2635040283203125, 0.2804069519042969, 0.29730987548828125, 0.3142127990722656, 0.33111572265625, 0.3480186462402344, 0.36492156982421875, 0.3818244934082031, 0.3987274169921875, 0.4156303405761719, 0.43253326416015625, 0.4494361877441406, 0.466339111328125, 0.4832420349121094, 0.5001449584960938, 0.5170478820800781, 0.5339508056640625, 0.5508537292480469, 0.5677566528320312, 0.5846595764160156, 0.6015625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 10.0, 15.0, 16.0, 37.0, 32.0, 54.0, 59.0, 77.0, 90.0, 85.0, 99.0, 103.0, 78.0, 61.0, 52.0, 41.0, 31.0, 17.0, 11.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.904296875, -0.87921142578125, -0.8541259765625, -0.82904052734375, -0.803955078125, -0.77886962890625, -0.7537841796875, -0.72869873046875, -0.70361328125, -0.67852783203125, -0.6534423828125, -0.62835693359375, -0.603271484375, -0.57818603515625, -0.5531005859375, -0.52801513671875, -0.5029296875, -0.47784423828125, -0.4527587890625, -0.42767333984375, -0.402587890625, -0.37750244140625, -0.3524169921875, -0.32733154296875, -0.30224609375, -0.27716064453125, -0.2520751953125, -0.22698974609375, -0.201904296875, -0.17681884765625, -0.1517333984375, -0.12664794921875, -0.1015625, -0.07647705078125, -0.0513916015625, -0.02630615234375, -0.001220703125, 0.02386474609375, 0.0489501953125, 0.07403564453125, 0.09912109375, 0.12420654296875, 0.1492919921875, 0.17437744140625, 0.199462890625, 0.22454833984375, 0.2496337890625, 0.27471923828125, 0.2998046875, 0.32489013671875, 0.3499755859375, 0.37506103515625, 0.400146484375, 0.42523193359375, 0.4503173828125, 0.47540283203125, 0.50048828125, 0.52557373046875, 0.5506591796875, 0.57574462890625, 0.600830078125, 0.62591552734375, 0.6510009765625, 0.67608642578125, 0.701171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 11.0, 8.0, 9.0, 17.0, 26.0, 58.0, 85.0, 188.0, 403.0, 1202.0, 5193.0, 72500.0, 3958470.0, 146614.0, 7077.0, 1484.0, 469.0, 224.0, 97.0, 55.0, 26.0, 18.0, 10.0, 13.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.005157470703125, -0.96734619140625, -0.929534912109375, -0.8917236328125, -0.853912353515625, -0.81610107421875, -0.778289794921875, -0.740478515625, -0.702667236328125, -0.66485595703125, -0.627044677734375, -0.5892333984375, -0.551422119140625, -0.51361083984375, -0.475799560546875, -0.43798828125, -0.400177001953125, -0.36236572265625, -0.324554443359375, -0.2867431640625, -0.248931884765625, -0.21112060546875, -0.173309326171875, -0.135498046875, -0.097686767578125, -0.05987548828125, -0.022064208984375, 0.0157470703125, 0.053558349609375, 0.09136962890625, 0.129180908203125, 0.1669921875, 0.204803466796875, 0.24261474609375, 0.280426025390625, 0.3182373046875, 0.356048583984375, 0.39385986328125, 0.431671142578125, 0.469482421875, 0.507293701171875, 0.54510498046875, 0.582916259765625, 0.6207275390625, 0.658538818359375, 0.69635009765625, 0.734161376953125, 0.77197265625, 0.809783935546875, 0.84759521484375, 0.885406494140625, 0.9232177734375, 0.961029052734375, 0.99884033203125, 1.036651611328125, 1.074462890625, 1.112274169921875, 1.15008544921875, 1.187896728515625, 1.2257080078125, 1.263519287109375, 1.30133056640625, 1.339141845703125, 1.376953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 15.0, 14.0, 29.0, 43.0, 62.0, 150.0, 230.0, 440.0, 853.0, 889.0, 667.0, 301.0, 161.0, 72.0, 49.0, 25.0, 17.0, 18.0, 2.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6602020263671875, -0.632904052734375, -0.6056060791015625, -0.57830810546875, -0.5510101318359375, -0.523712158203125, -0.4964141845703125, -0.4691162109375, -0.4418182373046875, -0.414520263671875, -0.3872222900390625, -0.35992431640625, -0.3326263427734375, -0.305328369140625, -0.2780303955078125, -0.250732421875, -0.2234344482421875, -0.196136474609375, -0.1688385009765625, -0.14154052734375, -0.1142425537109375, -0.086944580078125, -0.0596466064453125, -0.0323486328125, -0.0050506591796875, 0.022247314453125, 0.0495452880859375, 0.07684326171875, 0.1041412353515625, 0.131439208984375, 0.1587371826171875, 0.18603515625, 0.2133331298828125, 0.240631103515625, 0.2679290771484375, 0.29522705078125, 0.3225250244140625, 0.349822998046875, 0.3771209716796875, 0.4044189453125, 0.4317169189453125, 0.459014892578125, 0.4863128662109375, 0.51361083984375, 0.5409088134765625, 0.568206787109375, 0.5955047607421875, 0.622802734375, 0.6501007080078125, 0.677398681640625, 0.7046966552734375, 0.73199462890625, 0.7592926025390625, 0.786590576171875, 0.8138885498046875, 0.8411865234375, 0.8684844970703125, 0.895782470703125, 0.9230804443359375, 0.95037841796875, 0.9776763916015625, 1.004974365234375, 1.0322723388671875, 1.0595703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 17.0, 81.0, 244.0, 354.0, 203.0, 72.0, 16.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-17.57353973388672, -17.244478225708008, -16.915416717529297, -16.586353302001953, -16.257291793823242, -15.928230285644531, -15.59916877746582, -15.27010726928711, -14.941044807434082, -14.611983299255371, -14.282920837402344, -13.953859329223633, -13.624797821044922, -13.295735359191895, -12.966673851013184, -12.637611389160156, -12.308549880981445, -11.979488372802734, -11.650425910949707, -11.321364402770996, -10.992302894592285, -10.663240432739258, -10.334178924560547, -10.005117416381836, -9.676055908203125, -9.346994400024414, -9.017931938171387, -8.688870429992676, -8.359808921813965, -8.030746459960938, -7.701684951782227, -7.372622966766357, -7.043560981750488, -6.714498996734619, -6.385437488555908, -6.056375503540039, -5.72731351852417, -5.398251533508301, -5.06919002532959, -4.740128040313721, -4.41106653213501, -4.082004547119141, -3.7529428005218506, -3.4238810539245605, -3.0948190689086914, -2.7657573223114014, -2.4366955757141113, -2.107633590698242, -1.7785718441009521, -1.4495099782943726, -1.120448112487793, -0.7913863658905029, -0.46232450008392334, -0.13326263427734375, 0.1957991123199463, 0.5248610973358154, 0.8539228439331055, 1.182984709739685, 1.5120465755462646, 1.8411083221435547, 2.170170307159424, 2.499232053756714, 2.828293800354004, 3.157355785369873, 3.486417531967163]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 6.0, 4.0, 9.0, 14.0, 9.0, 24.0, 19.0, 22.0, 22.0, 37.0, 30.0, 42.0, 49.0, 50.0, 56.0, 63.0, 58.0, 50.0, 82.0, 62.0, 49.0, 49.0, 37.0, 28.0, 20.0, 30.0, 22.0, 9.0, 12.0, 13.0, 10.0, 1.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4971179962158203, -3.3783347606658936, -3.2595512866973877, -3.140768051147461, -3.021984577178955, -2.9032013416290283, -2.7844181060791016, -2.6656346321105957, -2.546851396560669, -2.428068161010742, -2.3092846870422363, -2.1905014514923096, -2.071718215942383, -1.952934741973877, -1.8341515064239502, -1.7153681516647339, -1.5965847969055176, -1.4778014421463013, -1.359018087387085, -1.2402348518371582, -1.121451497077942, -1.0026681423187256, -0.883884847164154, -0.7651015520095825, -0.6463181972503662, -0.5275348424911499, -0.40875154733657837, -0.28996822237968445, -0.17118489742279053, -0.05240154266357422, 0.06638175249099731, 0.18516504764556885, 0.30394840240478516, 0.4227317273616791, 0.541515052318573, 0.6602983474731445, 0.7790817022323608, 0.8978650569915771, 1.016648292541504, 1.1354316473007202, 1.2542150020599365, 1.3729983568191528, 1.4917817115783691, 1.610564947128296, 1.7293483018875122, 1.8481316566467285, 1.9669148921966553, 2.085698127746582, 2.204481601715088, 2.3232648372650146, 2.4420483112335205, 2.5608315467834473, 2.679615020751953, 2.79839825630188, 2.9171814918518066, 3.0359649658203125, 3.1547482013702393, 3.273531436920166, 3.392314910888672, 3.5110981464385986, 3.6298813819885254, 3.7486648559570312, 3.867448091506958, 3.9862313270568848, 4.105014801025391]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 11.0, 13.0, 14.0, 35.0, 51.0, 94.0, 175.0, 310.0, 734.0, 1776.0, 5340.0, 21493.0, 122894.0, 582966.0, 258841.0, 40410.0, 8870.0, 2591.0, 1019.0, 416.0, 203.0, 111.0, 68.0, 54.0, 16.0, 15.0, 12.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7245635986328125, -0.695220947265625, -0.6658782958984375, -0.63653564453125, -0.6071929931640625, -0.577850341796875, -0.5485076904296875, -0.5191650390625, -0.4898223876953125, -0.460479736328125, -0.4311370849609375, -0.40179443359375, -0.3724517822265625, -0.343109130859375, -0.3137664794921875, -0.284423828125, -0.2550811767578125, -0.225738525390625, -0.1963958740234375, -0.16705322265625, -0.1377105712890625, -0.108367919921875, -0.0790252685546875, -0.0496826171875, -0.0203399658203125, 0.009002685546875, 0.0383453369140625, 0.06768798828125, 0.0970306396484375, 0.126373291015625, 0.1557159423828125, 0.18505859375, 0.2144012451171875, 0.243743896484375, 0.2730865478515625, 0.30242919921875, 0.3317718505859375, 0.361114501953125, 0.3904571533203125, 0.4197998046875, 0.4491424560546875, 0.478485107421875, 0.5078277587890625, 0.53717041015625, 0.5665130615234375, 0.595855712890625, 0.6251983642578125, 0.654541015625, 0.6838836669921875, 0.713226318359375, 0.7425689697265625, 0.77191162109375, 0.8012542724609375, 0.830596923828125, 0.8599395751953125, 0.8892822265625, 0.9186248779296875, 0.947967529296875, 0.9773101806640625, 1.00665283203125, 1.0359954833984375, 1.065338134765625, 1.0946807861328125, 1.1240234375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 15.0, 18.0, 27.0, 33.0, 33.0, 50.0, 82.0, 82.0, 97.0, 88.0, 83.0, 89.0, 69.0, 61.0, 48.0, 38.0, 27.0, 11.0, 20.0, 3.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8271484375, -0.8032150268554688, -0.7792816162109375, -0.7553482055664062, -0.731414794921875, -0.7074813842773438, -0.6835479736328125, -0.6596145629882812, -0.63568115234375, -0.6117477416992188, -0.5878143310546875, -0.5638809204101562, -0.539947509765625, -0.5160140991210938, -0.4920806884765625, -0.46814727783203125, -0.4442138671875, -0.42028045654296875, -0.3963470458984375, -0.37241363525390625, -0.348480224609375, -0.32454681396484375, -0.3006134033203125, -0.27667999267578125, -0.25274658203125, -0.22881317138671875, -0.2048797607421875, -0.18094635009765625, -0.157012939453125, -0.13307952880859375, -0.1091461181640625, -0.08521270751953125, -0.061279296875, -0.03734588623046875, -0.0134124755859375, 0.01052093505859375, 0.034454345703125, 0.05838775634765625, 0.0823211669921875, 0.10625457763671875, 0.13018798828125, 0.15412139892578125, 0.1780548095703125, 0.20198822021484375, 0.225921630859375, 0.24985504150390625, 0.2737884521484375, 0.29772186279296875, 0.3216552734375, 0.34558868408203125, 0.3695220947265625, 0.39345550537109375, 0.417388916015625, 0.44132232666015625, 0.4652557373046875, 0.48918914794921875, 0.51312255859375, 0.5370559692382812, 0.5609893798828125, 0.5849227905273438, 0.608856201171875, 0.6327896118164062, 0.6567230224609375, 0.6806564331054688, 0.70458984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 7.0, 5.0, 13.0, 14.0, 10.0, 19.0, 37.0, 42.0, 45.0, 70.0, 110.0, 152.0, 230.0, 374.0, 658.0, 1188.0, 3173.0, 13778.0, 111038.0, 766200.0, 129191.0, 15841.0, 3431.0, 1221.0, 617.0, 364.0, 215.0, 134.0, 97.0, 61.0, 58.0, 37.0, 24.0, 20.0, 27.0, 17.0, 7.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.12109375, -1.0876617431640625, -1.054229736328125, -1.0207977294921875, -0.98736572265625, -0.9539337158203125, -0.920501708984375, -0.8870697021484375, -0.8536376953125, -0.8202056884765625, -0.786773681640625, -0.7533416748046875, -0.71990966796875, -0.6864776611328125, -0.653045654296875, -0.6196136474609375, -0.586181640625, -0.5527496337890625, -0.519317626953125, -0.4858856201171875, -0.45245361328125, -0.4190216064453125, -0.385589599609375, -0.3521575927734375, -0.3187255859375, -0.2852935791015625, -0.251861572265625, -0.2184295654296875, -0.18499755859375, -0.1515655517578125, -0.118133544921875, -0.0847015380859375, -0.05126953125, -0.0178375244140625, 0.015594482421875, 0.0490264892578125, 0.08245849609375, 0.1158905029296875, 0.149322509765625, 0.1827545166015625, 0.2161865234375, 0.2496185302734375, 0.283050537109375, 0.3164825439453125, 0.34991455078125, 0.3833465576171875, 0.416778564453125, 0.4502105712890625, 0.483642578125, 0.5170745849609375, 0.550506591796875, 0.5839385986328125, 0.61737060546875, 0.6508026123046875, 0.684234619140625, 0.7176666259765625, 0.7510986328125, 0.7845306396484375, 0.817962646484375, 0.8513946533203125, 0.88482666015625, 0.9182586669921875, 0.951690673828125, 0.9851226806640625, 1.0185546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 10.0, 10.0, 10.0, 22.0, 24.0, 39.0, 41.0, 43.0, 48.0, 66.0, 63.0, 60.0, 80.0, 65.0, 65.0, 73.0, 54.0, 45.0, 46.0, 37.0, 19.0, 18.0, 13.0, 10.0, 8.0, 7.0, 7.0, 3.0, 8.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.0360107421875, -1.974365234375, -1.9127197265625, -1.85107421875, -1.7894287109375, -1.727783203125, -1.6661376953125, -1.6044921875, -1.5428466796875, -1.481201171875, -1.4195556640625, -1.35791015625, -1.2962646484375, -1.234619140625, -1.1729736328125, -1.111328125, -1.0496826171875, -0.988037109375, -0.9263916015625, -0.86474609375, -0.8031005859375, -0.741455078125, -0.6798095703125, -0.6181640625, -0.5565185546875, -0.494873046875, -0.4332275390625, -0.37158203125, -0.3099365234375, -0.248291015625, -0.1866455078125, -0.125, -0.0633544921875, -0.001708984375, 0.0599365234375, 0.12158203125, 0.1832275390625, 0.244873046875, 0.3065185546875, 0.3681640625, 0.4298095703125, 0.491455078125, 0.5531005859375, 0.61474609375, 0.6763916015625, 0.738037109375, 0.7996826171875, 0.861328125, 0.9229736328125, 0.984619140625, 1.0462646484375, 1.10791015625, 1.1695556640625, 1.231201171875, 1.2928466796875, 1.3544921875, 1.4161376953125, 1.477783203125, 1.5394287109375, 1.60107421875, 1.6627197265625, 1.724365234375, 1.7860107421875, 1.84765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 14.0, 11.0, 13.0, 20.0, 25.0, 41.0, 51.0, 94.0, 123.0, 183.0, 280.0, 486.0, 757.0, 1359.0, 2415.0, 4838.0, 10592.0, 26445.0, 79751.0, 581927.0, 242476.0, 58481.0, 20539.0, 8687.0, 4023.0, 1961.0, 1189.0, 616.0, 378.0, 263.0, 164.0, 92.0, 73.0, 53.0, 25.0, 22.0, 24.0, 13.0, 7.0, 6.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2156982421875, -0.20932960510253906, -0.20296096801757812, -0.1965923309326172, -0.19022369384765625, -0.1838550567626953, -0.17748641967773438, -0.17111778259277344, -0.1647491455078125, -0.15838050842285156, -0.15201187133789062, -0.1456432342529297, -0.13927459716796875, -0.1329059600830078, -0.12653732299804688, -0.12016868591308594, -0.113800048828125, -0.10743141174316406, -0.10106277465820312, -0.09469413757324219, -0.08832550048828125, -0.08195686340332031, -0.07558822631835938, -0.06921958923339844, -0.0628509521484375, -0.05648231506347656, -0.050113677978515625, -0.04374504089355469, -0.03737640380859375, -0.031007766723632812, -0.024639129638671875, -0.018270492553710938, -0.01190185546875, -0.0055332183837890625, 0.000835418701171875, 0.0072040557861328125, 0.01357269287109375, 0.019941329956054688, 0.026309967041015625, 0.03267860412597656, 0.0390472412109375, 0.04541587829589844, 0.051784515380859375, 0.05815315246582031, 0.06452178955078125, 0.07089042663574219, 0.07725906372070312, 0.08362770080566406, 0.089996337890625, 0.09636497497558594, 0.10273361206054688, 0.10910224914550781, 0.11547088623046875, 0.12183952331542969, 0.12820816040039062, 0.13457679748535156, 0.1409454345703125, 0.14731407165527344, 0.15368270874023438, 0.1600513458251953, 0.16641998291015625, 0.1727886199951172, 0.17915725708007812, 0.18552589416503906, 0.19189453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 9.0, 18.0, 18.0, 15.0, 32.0, 34.0, 60.0, 60.0, 89.0, 105.0, 122.0, 104.0, 74.0, 57.0, 39.0, 36.0, 22.0, 19.0, 14.0, 6.0, 7.0, 9.0, 11.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.508827209472656e-05, -6.323400884866714e-05, -6.137974560260773e-05, -5.952548235654831e-05, -5.767121911048889e-05, -5.5816955864429474e-05, -5.3962692618370056e-05, -5.210842937231064e-05, -5.025416612625122e-05, -4.83999028801918e-05, -4.6545639634132385e-05, -4.469137638807297e-05, -4.283711314201355e-05, -4.098284989595413e-05, -3.9128586649894714e-05, -3.72743234038353e-05, -3.542006015777588e-05, -3.356579691171646e-05, -3.1711533665657043e-05, -2.9857270419597626e-05, -2.8003007173538208e-05, -2.614874392747879e-05, -2.4294480681419373e-05, -2.2440217435359955e-05, -2.0585954189300537e-05, -1.873169094324112e-05, -1.68774276971817e-05, -1.5023164451122284e-05, -1.3168901205062866e-05, -1.1314637959003448e-05, -9.46037471294403e-06, -7.606111466884613e-06, -5.751848220825195e-06, -3.897584974765778e-06, -2.04332172870636e-06, -1.8905848264694214e-07, 1.6652047634124756e-06, 3.5194680094718933e-06, 5.373731255531311e-06, 7.227994501590729e-06, 9.082257747650146e-06, 1.0936520993709564e-05, 1.2790784239768982e-05, 1.46450474858284e-05, 1.6499310731887817e-05, 1.8353573977947235e-05, 2.0207837224006653e-05, 2.206210047006607e-05, 2.3916363716125488e-05, 2.5770626962184906e-05, 2.7624890208244324e-05, 2.947915345430374e-05, 3.133341670036316e-05, 3.318767994642258e-05, 3.5041943192481995e-05, 3.689620643854141e-05, 3.875046968460083e-05, 4.060473293066025e-05, 4.2458996176719666e-05, 4.431325942277908e-05, 4.61675226688385e-05, 4.802178591489792e-05, 4.9876049160957336e-05, 5.1730312407016754e-05, 5.358457565307617e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 14.0, 17.0, 45.0, 62.0, 147.0, 345.0, 1007.0, 6572.0, 122929.0, 886889.0, 26827.0, 2668.0, 602.0, 205.0, 90.0, 61.0, 24.0, 20.0, 12.0, 6.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.681640625, -0.6638298034667969, -0.6460189819335938, -0.6282081604003906, -0.6103973388671875, -0.5925865173339844, -0.5747756958007812, -0.5569648742675781, -0.539154052734375, -0.5213432312011719, -0.5035324096679688, -0.4857215881347656, -0.4679107666015625, -0.4500999450683594, -0.43228912353515625, -0.4144783020019531, -0.39666748046875, -0.3788566589355469, -0.36104583740234375, -0.3432350158691406, -0.3254241943359375, -0.3076133728027344, -0.28980255126953125, -0.2719917297363281, -0.254180908203125, -0.23637008666992188, -0.21855926513671875, -0.20074844360351562, -0.1829376220703125, -0.16512680053710938, -0.14731597900390625, -0.12950515747070312, -0.1116943359375, -0.09388351440429688, -0.07607269287109375, -0.058261871337890625, -0.0404510498046875, -0.022640228271484375, -0.00482940673828125, 0.012981414794921875, 0.030792236328125, 0.048603057861328125, 0.06641387939453125, 0.08422470092773438, 0.1020355224609375, 0.11984634399414062, 0.13765716552734375, 0.15546798706054688, 0.17327880859375, 0.19108963012695312, 0.20890045166015625, 0.22671127319335938, 0.2445220947265625, 0.2623329162597656, 0.28014373779296875, 0.2979545593261719, 0.315765380859375, 0.3335762023925781, 0.35138702392578125, 0.3691978454589844, 0.3870086669921875, 0.4048194885253906, 0.42263031005859375, 0.4404411315917969, 0.458251953125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 10.0, 5.0, 8.0, 15.0, 17.0, 18.0, 38.0, 48.0, 62.0, 59.0, 120.0, 133.0, 123.0, 93.0, 64.0, 54.0, 29.0, 33.0, 23.0, 19.0, 4.0, 10.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.463623046875, -0.4510002136230469, -0.43837738037109375, -0.4257545471191406, -0.4131317138671875, -0.4005088806152344, -0.38788604736328125, -0.3752632141113281, -0.362640380859375, -0.3500175476074219, -0.33739471435546875, -0.3247718811035156, -0.3121490478515625, -0.2995262145996094, -0.28690338134765625, -0.2742805480957031, -0.26165771484375, -0.24903488159179688, -0.23641204833984375, -0.22378921508789062, -0.2111663818359375, -0.19854354858398438, -0.18592071533203125, -0.17329788208007812, -0.160675048828125, -0.14805221557617188, -0.13542938232421875, -0.12280654907226562, -0.1101837158203125, -0.09756088256835938, -0.08493804931640625, -0.07231521606445312, -0.0596923828125, -0.047069549560546875, -0.03444671630859375, -0.021823883056640625, -0.0092010498046875, 0.003421783447265625, 0.01604461669921875, 0.028667449951171875, 0.041290283203125, 0.053913116455078125, 0.06653594970703125, 0.07915878295898438, 0.0917816162109375, 0.10440444946289062, 0.11702728271484375, 0.12965011596679688, 0.14227294921875, 0.15489578247070312, 0.16751861572265625, 0.18014144897460938, 0.1927642822265625, 0.20538711547851562, 0.21800994873046875, 0.23063278198242188, 0.243255615234375, 0.2558784484863281, 0.26850128173828125, 0.2811241149902344, 0.2937469482421875, 0.3063697814941406, 0.31899261474609375, 0.3316154479980469, 0.34423828125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 8.0, 34.0, 229.0, 538.0, 144.0, 34.0, 14.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.751058578491211, -11.136977195739746, -10.522895812988281, -9.908814430236816, -9.294733047485352, -8.68065071105957, -8.066569328308105, -7.452487945556641, -6.838406562805176, -6.224325180053711, -5.610243797302246, -4.996161937713623, -4.382080554962158, -3.7679991722106934, -3.1539175510406494, -2.5398359298706055, -1.9257545471191406, -1.3116730451583862, -0.6975915431976318, -0.08351004123687744, 0.530571460723877, 1.1446528434753418, 1.7587344646453857, 2.3728160858154297, 2.9868974685668945, 3.6009788513183594, 4.215060234069824, 4.829142093658447, 5.443223476409912, 6.057304859161377, 6.67138671875, 7.285468101501465, 7.899547576904297, 8.513628959655762, 9.127710342407227, 9.741791725158691, 10.355873107910156, 10.969955444335938, 11.584036827087402, 12.198118209838867, 12.812199592590332, 13.426280975341797, 14.040362358093262, 14.654443740844727, 15.268526077270508, 15.882606506347656, 16.496688842773438, 17.11077117919922, 17.724851608276367, 18.33893394470215, 18.953014373779297, 19.567096710205078, 20.181177139282227, 20.795259475708008, 21.409339904785156, 22.023422241210938, 22.63750457763672, 23.2515869140625, 23.86566734313965, 24.47974967956543, 25.093830108642578, 25.70791244506836, 26.321992874145508, 26.93607521057129, 27.550155639648438]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 4.0, 7.0, 1.0, 8.0, 16.0, 16.0, 12.0, 23.0, 21.0, 23.0, 16.0, 32.0, 33.0, 33.0, 39.0, 42.0, 73.0, 85.0, 94.0, 71.0, 45.0, 36.0, 38.0, 18.0, 19.0, 29.0, 18.0, 16.0, 18.0, 9.0, 11.0, 13.0, 15.0, 12.0, 4.0, 4.0, 9.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.552083969116211, -4.4005937576293945, -4.249103546142578, -4.097613334655762, -3.9461231231689453, -3.794632911682129, -3.6431427001953125, -3.491652488708496, -3.3401622772216797, -3.1886720657348633, -3.037181854248047, -2.8856916427612305, -2.734201431274414, -2.5827112197875977, -2.4312210083007812, -2.279730796813965, -2.1282408237457275, -1.9767506122589111, -1.8252604007720947, -1.6737701892852783, -1.522279977798462, -1.3707897663116455, -1.2192996740341187, -1.0678094625473022, -0.9163192510604858, -0.7648290395736694, -0.613338828086853, -0.4618486762046814, -0.310358464717865, -0.15886825323104858, -0.007378101348876953, 0.14411211013793945, 0.29560232162475586, 0.44709253311157227, 0.5985827445983887, 0.7500728964805603, 0.9015631079673767, 1.053053379058838, 1.2045434713363647, 1.3560336828231812, 1.5075238943099976, 1.659014105796814, 1.8105043172836304, 1.9619944095611572, 2.1134846210479736, 2.26497483253479, 2.4164650440216064, 2.567955255508423, 2.7194454669952393, 2.8709356784820557, 3.022425889968872, 3.1739161014556885, 3.325406312942505, 3.4768965244293213, 3.6283864974975586, 3.779876708984375, 3.9313669204711914, 4.082857131958008, 4.234347343444824, 4.385837554931641, 4.537327766418457, 4.688817977905273, 4.84030818939209, 4.991798400878906, 5.143288612365723]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 5.0, 17.0, 27.0, 39.0, 43.0, 104.0, 177.0, 317.0, 663.0, 2308.0, 10744.0, 129127.0, 2721995.0, 1273684.0, 46837.0, 5546.0, 1468.0, 501.0, 249.0, 137.0, 96.0, 68.0, 31.0, 20.0, 20.0, 13.0, 8.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8662109375, -0.842041015625, -0.81787109375, -0.793701171875, -0.76953125, -0.745361328125, -0.72119140625, -0.697021484375, -0.6728515625, -0.648681640625, -0.62451171875, -0.600341796875, -0.576171875, -0.552001953125, -0.52783203125, -0.503662109375, -0.4794921875, -0.455322265625, -0.43115234375, -0.406982421875, -0.3828125, -0.358642578125, -0.33447265625, -0.310302734375, -0.2861328125, -0.261962890625, -0.23779296875, -0.213623046875, -0.189453125, -0.165283203125, -0.14111328125, -0.116943359375, -0.0927734375, -0.068603515625, -0.04443359375, -0.020263671875, 0.00390625, 0.028076171875, 0.05224609375, 0.076416015625, 0.1005859375, 0.124755859375, 0.14892578125, 0.173095703125, 0.197265625, 0.221435546875, 0.24560546875, 0.269775390625, 0.2939453125, 0.318115234375, 0.34228515625, 0.366455078125, 0.390625, 0.414794921875, 0.43896484375, 0.463134765625, 0.4873046875, 0.511474609375, 0.53564453125, 0.559814453125, 0.583984375, 0.608154296875, 0.63232421875, 0.656494140625, 0.6806640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 11.0, 6.0, 10.0, 16.0, 24.0, 36.0, 40.0, 43.0, 66.0, 70.0, 82.0, 101.0, 93.0, 75.0, 75.0, 65.0, 52.0, 37.0, 34.0, 18.0, 17.0, 10.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75537109375, -0.7325439453125, -0.709716796875, -0.6868896484375, -0.6640625, -0.6412353515625, -0.618408203125, -0.5955810546875, -0.57275390625, -0.5499267578125, -0.527099609375, -0.5042724609375, -0.4814453125, -0.4586181640625, -0.435791015625, -0.4129638671875, -0.39013671875, -0.3673095703125, -0.344482421875, -0.3216552734375, -0.298828125, -0.2760009765625, -0.253173828125, -0.2303466796875, -0.20751953125, -0.1846923828125, -0.161865234375, -0.1390380859375, -0.1162109375, -0.0933837890625, -0.070556640625, -0.0477294921875, -0.02490234375, -0.0020751953125, 0.020751953125, 0.0435791015625, 0.06640625, 0.0892333984375, 0.112060546875, 0.1348876953125, 0.15771484375, 0.1805419921875, 0.203369140625, 0.2261962890625, 0.2490234375, 0.2718505859375, 0.294677734375, 0.3175048828125, 0.34033203125, 0.3631591796875, 0.385986328125, 0.4088134765625, 0.431640625, 0.4544677734375, 0.477294921875, 0.5001220703125, 0.52294921875, 0.5457763671875, 0.568603515625, 0.5914306640625, 0.6142578125, 0.6370849609375, 0.659912109375, 0.6827392578125, 0.70556640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 10.0, 10.0, 40.0, 83.0, 296.0, 1097.0, 17244.0, 4163471.0, 10814.0, 854.0, 270.0, 54.0, 25.0, 11.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8828125, -2.79400634765625, -2.7052001953125, -2.61639404296875, -2.527587890625, -2.43878173828125, -2.3499755859375, -2.26116943359375, -2.17236328125, -2.08355712890625, -1.9947509765625, -1.90594482421875, -1.817138671875, -1.72833251953125, -1.6395263671875, -1.55072021484375, -1.4619140625, -1.37310791015625, -1.2843017578125, -1.19549560546875, -1.106689453125, -1.01788330078125, -0.9290771484375, -0.84027099609375, -0.75146484375, -0.66265869140625, -0.5738525390625, -0.48504638671875, -0.396240234375, -0.30743408203125, -0.2186279296875, -0.12982177734375, -0.041015625, 0.04779052734375, 0.1365966796875, 0.22540283203125, 0.314208984375, 0.40301513671875, 0.4918212890625, 0.58062744140625, 0.66943359375, 0.75823974609375, 0.8470458984375, 0.93585205078125, 1.024658203125, 1.11346435546875, 1.2022705078125, 1.29107666015625, 1.3798828125, 1.46868896484375, 1.5574951171875, 1.64630126953125, 1.735107421875, 1.82391357421875, 1.9127197265625, 2.00152587890625, 2.09033203125, 2.17913818359375, 2.2679443359375, 2.35675048828125, 2.445556640625, 2.53436279296875, 2.6231689453125, 2.71197509765625, 2.80078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 10.0, 12.0, 19.0, 27.0, 51.0, 105.0, 201.0, 458.0, 889.0, 1069.0, 641.0, 318.0, 126.0, 52.0, 45.0, 19.0, 15.0, 3.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0], "bins": [-1.7548828125, -1.7192764282226562, -1.6836700439453125, -1.6480636596679688, -1.612457275390625, -1.5768508911132812, -1.5412445068359375, -1.5056381225585938, -1.47003173828125, -1.4344253540039062, -1.3988189697265625, -1.3632125854492188, -1.327606201171875, -1.2919998168945312, -1.2563934326171875, -1.2207870483398438, -1.1851806640625, -1.1495742797851562, -1.1139678955078125, -1.0783615112304688, -1.042755126953125, -1.0071487426757812, -0.9715423583984375, -0.9359359741210938, -0.90032958984375, -0.8647232055664062, -0.8291168212890625, -0.7935104370117188, -0.757904052734375, -0.7222976684570312, -0.6866912841796875, -0.6510848999023438, -0.615478515625, -0.5798721313476562, -0.5442657470703125, -0.5086593627929688, -0.473052978515625, -0.43744659423828125, -0.4018402099609375, -0.36623382568359375, -0.33062744140625, -0.29502105712890625, -0.2594146728515625, -0.22380828857421875, -0.188201904296875, -0.15259552001953125, -0.1169891357421875, -0.08138275146484375, -0.0457763671875, -0.01016998291015625, 0.0254364013671875, 0.06104278564453125, 0.096649169921875, 0.13225555419921875, 0.1678619384765625, 0.20346832275390625, 0.23907470703125, 0.27468109130859375, 0.3102874755859375, 0.34589385986328125, 0.381500244140625, 0.41710662841796875, 0.4527130126953125, 0.48831939697265625, 0.52392578125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 16.0, 23.0, 79.0, 253.0, 397.0, 166.0, 41.0, 14.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.131092071533203, -15.67730712890625, -15.22352123260498, -14.769736289978027, -14.315950393676758, -13.862165451049805, -13.408380508422852, -12.954595565795898, -12.500809669494629, -12.047024726867676, -11.593238830566406, -11.139453887939453, -10.6856689453125, -10.23188304901123, -9.778098106384277, -9.324312210083008, -8.870527267456055, -8.416742324829102, -7.962956428527832, -7.509171485900879, -7.055386066436768, -6.601600646972656, -6.147815704345703, -5.694030284881592, -5.2402448654174805, -4.786459445953369, -4.332674026489258, -3.8788890838623047, -3.4251036643981934, -2.971318244934082, -2.51753306388855, -2.0637478828430176, -1.6099634170532227, -1.1561781167984009, -0.7023928165435791, -0.24860751628875732, 0.20517778396606445, 0.6589632034301758, 1.112748384475708, 1.5665335655212402, 2.0203189849853516, 2.474104404449463, 2.927889585494995, 3.3816747665405273, 3.8354601860046387, 4.28924560546875, 4.743030548095703, 5.1968159675598145, 5.650601387023926, 6.104386806488037, 6.558172225952148, 7.011957168579102, 7.465742588043213, 7.919528007507324, 8.373312950134277, 8.827098846435547, 9.2808837890625, 9.734668731689453, 10.188454627990723, 10.642239570617676, 11.096025466918945, 11.549810409545898, 12.003595352172852, 12.457380294799805, 12.911166191101074]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 13.0, 18.0, 29.0, 14.0, 29.0, 17.0, 28.0, 30.0, 45.0, 35.0, 34.0, 45.0, 38.0, 41.0, 41.0, 43.0, 53.0, 38.0, 45.0, 41.0, 38.0, 33.0, 29.0, 33.0, 19.0, 21.0, 27.0, 18.0, 20.0, 11.0, 11.0, 2.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.32381010055542, -4.196715354919434, -4.0696210861206055, -3.9425265789031982, -3.815432071685791, -3.688337564468384, -3.5612430572509766, -3.4341483116149902, -3.307054042816162, -3.179959535598755, -3.0528650283813477, -2.9257705211639404, -2.798676013946533, -2.671581506729126, -2.5444869995117188, -2.4173922538757324, -2.290297746658325, -2.163203239440918, -2.0361087322235107, -1.9090142250061035, -1.7819197177886963, -1.654825210571289, -1.5277305841445923, -1.400636076927185, -1.2735415697097778, -1.1464470624923706, -1.0193525552749634, -0.8922579884529114, -0.7651634812355042, -0.6380689740180969, -0.5109744071960449, -0.3838798999786377, -0.25678539276123047, -0.12969087064266205, -0.002596348524093628, 0.12449818849563599, 0.2515926957130432, 0.37868720293045044, 0.5057817697525024, 0.6328762769699097, 0.7599707841873169, 0.8870652914047241, 1.0141597986221313, 1.1412544250488281, 1.2683489322662354, 1.3954434394836426, 1.5225379467010498, 1.649632453918457, 1.7767269611358643, 1.9038214683532715, 2.0309159755706787, 2.158010482788086, 2.285104990005493, 2.4121994972229004, 2.5392942428588867, 2.666388511657715, 2.793483257293701, 2.9205777645111084, 3.0476722717285156, 3.174766778945923, 3.30186128616333, 3.4289557933807373, 3.5560503005981445, 3.683145046234131, 3.810239315032959]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 11.0, 13.0, 14.0, 19.0, 48.0, 73.0, 140.0, 234.0, 464.0, 1098.0, 2729.0, 7690.0, 26089.0, 122783.0, 544165.0, 271925.0, 50661.0, 13130.0, 4256.0, 1589.0, 658.0, 339.0, 195.0, 89.0, 60.0, 25.0, 15.0, 19.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.134765625, -1.106903076171875, -1.07904052734375, -1.051177978515625, -1.0233154296875, -0.995452880859375, -0.96759033203125, -0.939727783203125, -0.911865234375, -0.884002685546875, -0.85614013671875, -0.828277587890625, -0.8004150390625, -0.772552490234375, -0.74468994140625, -0.716827392578125, -0.68896484375, -0.661102294921875, -0.63323974609375, -0.605377197265625, -0.5775146484375, -0.549652099609375, -0.52178955078125, -0.493927001953125, -0.466064453125, -0.438201904296875, -0.41033935546875, -0.382476806640625, -0.3546142578125, -0.326751708984375, -0.29888916015625, -0.271026611328125, -0.2431640625, -0.215301513671875, -0.18743896484375, -0.159576416015625, -0.1317138671875, -0.103851318359375, -0.07598876953125, -0.048126220703125, -0.020263671875, 0.007598876953125, 0.03546142578125, 0.063323974609375, 0.0911865234375, 0.119049072265625, 0.14691162109375, 0.174774169921875, 0.20263671875, 0.230499267578125, 0.25836181640625, 0.286224365234375, 0.3140869140625, 0.341949462890625, 0.36981201171875, 0.397674560546875, 0.425537109375, 0.453399658203125, 0.48126220703125, 0.509124755859375, 0.5369873046875, 0.564849853515625, 0.59271240234375, 0.620574951171875, 0.6484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 16.0, 16.0, 22.0, 36.0, 43.0, 62.0, 53.0, 79.0, 68.0, 90.0, 88.0, 75.0, 76.0, 61.0, 48.0, 51.0, 21.0, 29.0, 18.0, 12.0, 9.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75048828125, -0.7277145385742188, -0.7049407958984375, -0.6821670532226562, -0.659393310546875, -0.6366195678710938, -0.6138458251953125, -0.5910720825195312, -0.56829833984375, -0.5455245971679688, -0.5227508544921875, -0.49997711181640625, -0.477203369140625, -0.45442962646484375, -0.4316558837890625, -0.40888214111328125, -0.3861083984375, -0.36333465576171875, -0.3405609130859375, -0.31778717041015625, -0.295013427734375, -0.27223968505859375, -0.2494659423828125, -0.22669219970703125, -0.20391845703125, -0.18114471435546875, -0.1583709716796875, -0.13559722900390625, -0.112823486328125, -0.09004974365234375, -0.0672760009765625, -0.04450225830078125, -0.021728515625, 0.00104522705078125, 0.0238189697265625, 0.04659271240234375, 0.069366455078125, 0.09214019775390625, 0.1149139404296875, 0.13768768310546875, 0.16046142578125, 0.18323516845703125, 0.2060089111328125, 0.22878265380859375, 0.251556396484375, 0.27433013916015625, 0.2971038818359375, 0.31987762451171875, 0.3426513671875, 0.36542510986328125, 0.3881988525390625, 0.41097259521484375, 0.433746337890625, 0.45652008056640625, 0.4792938232421875, 0.5020675659179688, 0.52484130859375, 0.5476150512695312, 0.5703887939453125, 0.5931625366210938, 0.615936279296875, 0.6387100219726562, 0.6614837646484375, 0.6842575073242188, 0.70703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 6.0, 9.0, 8.0, 11.0, 19.0, 20.0, 26.0, 40.0, 63.0, 95.0, 114.0, 175.0, 272.0, 445.0, 748.0, 1544.0, 4413.0, 27706.0, 759643.0, 232671.0, 14419.0, 3064.0, 1191.0, 618.0, 381.0, 254.0, 154.0, 132.0, 91.0, 61.0, 41.0, 30.0, 14.0, 14.0, 10.0, 8.0, 3.0, 7.0, 2.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.4951171875, -1.450958251953125, -1.40679931640625, -1.362640380859375, -1.3184814453125, -1.274322509765625, -1.23016357421875, -1.186004638671875, -1.141845703125, -1.097686767578125, -1.05352783203125, -1.009368896484375, -0.9652099609375, -0.921051025390625, -0.87689208984375, -0.832733154296875, -0.78857421875, -0.744415283203125, -0.70025634765625, -0.656097412109375, -0.6119384765625, -0.567779541015625, -0.52362060546875, -0.479461669921875, -0.435302734375, -0.391143798828125, -0.34698486328125, -0.302825927734375, -0.2586669921875, -0.214508056640625, -0.17034912109375, -0.126190185546875, -0.08203125, -0.037872314453125, 0.00628662109375, 0.050445556640625, 0.0946044921875, 0.138763427734375, 0.18292236328125, 0.227081298828125, 0.271240234375, 0.315399169921875, 0.35955810546875, 0.403717041015625, 0.4478759765625, 0.492034912109375, 0.53619384765625, 0.580352783203125, 0.62451171875, 0.668670654296875, 0.71282958984375, 0.756988525390625, 0.8011474609375, 0.845306396484375, 0.88946533203125, 0.933624267578125, 0.977783203125, 1.021942138671875, 1.06610107421875, 1.110260009765625, 1.1544189453125, 1.198577880859375, 1.24273681640625, 1.286895751953125, 1.3310546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 12.0, 15.0, 15.0, 27.0, 37.0, 34.0, 47.0, 53.0, 72.0, 67.0, 63.0, 79.0, 77.0, 63.0, 55.0, 64.0, 38.0, 38.0, 34.0, 24.0, 14.0, 12.0, 16.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.207366943359375, -2.13934326171875, -2.071319580078125, -2.0032958984375, -1.935272216796875, -1.86724853515625, -1.799224853515625, -1.731201171875, -1.663177490234375, -1.59515380859375, -1.527130126953125, -1.4591064453125, -1.391082763671875, -1.32305908203125, -1.255035400390625, -1.18701171875, -1.118988037109375, -1.05096435546875, -0.982940673828125, -0.9149169921875, -0.846893310546875, -0.77886962890625, -0.710845947265625, -0.642822265625, -0.574798583984375, -0.50677490234375, -0.438751220703125, -0.3707275390625, -0.302703857421875, -0.23468017578125, -0.166656494140625, -0.0986328125, -0.030609130859375, 0.03741455078125, 0.105438232421875, 0.1734619140625, 0.241485595703125, 0.30950927734375, 0.377532958984375, 0.445556640625, 0.513580322265625, 0.58160400390625, 0.649627685546875, 0.7176513671875, 0.785675048828125, 0.85369873046875, 0.921722412109375, 0.98974609375, 1.057769775390625, 1.12579345703125, 1.193817138671875, 1.2618408203125, 1.329864501953125, 1.39788818359375, 1.465911865234375, 1.533935546875, 1.601959228515625, 1.66998291015625, 1.738006591796875, 1.8060302734375, 1.874053955078125, 1.94207763671875, 2.010101318359375, 2.078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 4.0, 4.0, 4.0, 4.0, 17.0, 11.0, 32.0, 29.0, 59.0, 113.0, 158.0, 304.0, 624.0, 1540.0, 4452.0, 20656.0, 234450.0, 744901.0, 31751.0, 5940.0, 1902.0, 721.0, 337.0, 170.0, 126.0, 67.0, 35.0, 27.0, 26.0, 19.0, 9.0, 5.0, 10.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.373291015625, -0.3626594543457031, -0.35202789306640625, -0.3413963317871094, -0.3307647705078125, -0.3201332092285156, -0.30950164794921875, -0.2988700866699219, -0.288238525390625, -0.2776069641113281, -0.26697540283203125, -0.2563438415527344, -0.2457122802734375, -0.23508071899414062, -0.22444915771484375, -0.21381759643554688, -0.20318603515625, -0.19255447387695312, -0.18192291259765625, -0.17129135131835938, -0.1606597900390625, -0.15002822875976562, -0.13939666748046875, -0.12876510620117188, -0.118133544921875, -0.10750198364257812, -0.09687042236328125, -0.08623886108398438, -0.0756072998046875, -0.06497573852539062, -0.05434417724609375, -0.043712615966796875, -0.0330810546875, -0.022449493408203125, -0.01181793212890625, -0.001186370849609375, 0.0094451904296875, 0.020076751708984375, 0.03070831298828125, 0.041339874267578125, 0.051971435546875, 0.06260299682617188, 0.07323455810546875, 0.08386611938476562, 0.0944976806640625, 0.10512924194335938, 0.11576080322265625, 0.12639236450195312, 0.13702392578125, 0.14765548706054688, 0.15828704833984375, 0.16891860961914062, 0.1795501708984375, 0.19018173217773438, 0.20081329345703125, 0.21144485473632812, 0.222076416015625, 0.23270797729492188, 0.24333953857421875, 0.2539710998535156, 0.2646026611328125, 0.2752342224121094, 0.28586578369140625, 0.2964973449707031, 0.30712890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 2.0, 2.0, 14.0, 12.0, 18.0, 30.0, 48.0, 61.0, 129.0, 185.0, 183.0, 102.0, 69.0, 50.0, 26.0, 17.0, 13.0, 7.0, 10.0, 11.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.249282836914062e-05, -7.973518222570419e-05, -7.697753608226776e-05, -7.421988993883133e-05, -7.14622437953949e-05, -6.870459765195847e-05, -6.594695150852203e-05, -6.31893053650856e-05, -6.043165922164917e-05, -5.767401307821274e-05, -5.4916366934776306e-05, -5.2158720791339874e-05, -4.940107464790344e-05, -4.664342850446701e-05, -4.388578236103058e-05, -4.112813621759415e-05, -3.8370490074157715e-05, -3.561284393072128e-05, -3.285519778728485e-05, -3.009755164384842e-05, -2.7339905500411987e-05, -2.4582259356975555e-05, -2.1824613213539124e-05, -1.906696707010269e-05, -1.630932092666626e-05, -1.3551674783229828e-05, -1.0794028639793396e-05, -8.036382496356964e-06, -5.278736352920532e-06, -2.5210902094841003e-06, 2.3655593395233154e-07, 2.9942020773887634e-06, 5.751848220825195e-06, 8.509494364261627e-06, 1.1267140507698059e-05, 1.4024786651134491e-05, 1.6782432794570923e-05, 1.9540078938007355e-05, 2.2297725081443787e-05, 2.505537122488022e-05, 2.781301736831665e-05, 3.057066351175308e-05, 3.3328309655189514e-05, 3.6085955798625946e-05, 3.884360194206238e-05, 4.160124808549881e-05, 4.435889422893524e-05, 4.7116540372371674e-05, 4.9874186515808105e-05, 5.263183265924454e-05, 5.538947880268097e-05, 5.81471249461174e-05, 6.090477108955383e-05, 6.366241723299026e-05, 6.64200633764267e-05, 6.917770951986313e-05, 7.193535566329956e-05, 7.469300180673599e-05, 7.745064795017242e-05, 8.020829409360886e-05, 8.296594023704529e-05, 8.572358638048172e-05, 8.848123252391815e-05, 9.123887866735458e-05, 9.399652481079102e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 7.0, 9.0, 12.0, 21.0, 27.0, 41.0, 80.0, 136.0, 294.0, 751.0, 2772.0, 17308.0, 780469.0, 232699.0, 10692.0, 2006.0, 634.0, 264.0, 115.0, 87.0, 36.0, 39.0, 18.0, 10.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.30831146240234375, -0.2948455810546875, -0.28137969970703125, -0.267913818359375, -0.25444793701171875, -0.2409820556640625, -0.22751617431640625, -0.21405029296875, -0.20058441162109375, -0.1871185302734375, -0.17365264892578125, -0.160186767578125, -0.14672088623046875, -0.1332550048828125, -0.11978912353515625, -0.1063232421875, -0.09285736083984375, -0.0793914794921875, -0.06592559814453125, -0.052459716796875, -0.03899383544921875, -0.0255279541015625, -0.01206207275390625, 0.00140380859375, 0.01486968994140625, 0.0283355712890625, 0.04180145263671875, 0.055267333984375, 0.06873321533203125, 0.0821990966796875, 0.09566497802734375, 0.109130859375, 0.12259674072265625, 0.1360626220703125, 0.14952850341796875, 0.162994384765625, 0.17646026611328125, 0.1899261474609375, 0.20339202880859375, 0.21685791015625, 0.23032379150390625, 0.2437896728515625, 0.25725555419921875, 0.270721435546875, 0.28418731689453125, 0.2976531982421875, 0.31111907958984375, 0.3245849609375, 0.33805084228515625, 0.3515167236328125, 0.36498260498046875, 0.378448486328125, 0.39191436767578125, 0.4053802490234375, 0.41884613037109375, 0.43231201171875, 0.44577789306640625, 0.4592437744140625, 0.47270965576171875, 0.486175537109375, 0.49964141845703125, 0.5131072998046875, 0.5265731811523438, 0.5400390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 12.0, 13.0, 17.0, 16.0, 35.0, 46.0, 33.0, 61.0, 86.0, 107.0, 153.0, 106.0, 92.0, 63.0, 41.0, 29.0, 19.0, 17.0, 11.0, 17.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2839775085449219, -0.27278900146484375, -0.2616004943847656, -0.2504119873046875, -0.23922348022460938, -0.22803497314453125, -0.21684646606445312, -0.205657958984375, -0.19446945190429688, -0.18328094482421875, -0.17209243774414062, -0.1609039306640625, -0.14971542358398438, -0.13852691650390625, -0.12733840942382812, -0.11614990234375, -0.10496139526367188, -0.09377288818359375, -0.08258438110351562, -0.0713958740234375, -0.060207366943359375, -0.04901885986328125, -0.037830352783203125, -0.026641845703125, -0.015453338623046875, -0.00426483154296875, 0.006923675537109375, 0.0181121826171875, 0.029300689697265625, 0.04048919677734375, 0.051677703857421875, 0.0628662109375, 0.07405471801757812, 0.08524322509765625, 0.09643173217773438, 0.1076202392578125, 0.11880874633789062, 0.12999725341796875, 0.14118576049804688, 0.152374267578125, 0.16356277465820312, 0.17475128173828125, 0.18593978881835938, 0.1971282958984375, 0.20831680297851562, 0.21950531005859375, 0.23069381713867188, 0.24188232421875, 0.2530708312988281, 0.26425933837890625, 0.2754478454589844, 0.2866363525390625, 0.2978248596191406, 0.30901336669921875, 0.3202018737792969, 0.331390380859375, 0.3425788879394531, 0.35376739501953125, 0.3649559020996094, 0.3761444091796875, 0.3873329162597656, 0.39852142333984375, 0.4097099304199219, 0.4208984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 20.0, 68.0, 363.0, 449.0, 67.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.502649307250977, -16.93880271911621, -16.374954223632812, -15.811107635498047, -15.247261047363281, -14.6834135055542, -14.119565963745117, -13.555719375610352, -12.99187183380127, -12.428024291992188, -11.864177703857422, -11.30033016204834, -10.736482620239258, -10.172636032104492, -9.60878849029541, -9.044940948486328, -8.481094360351562, -7.917247295379639, -7.353400230407715, -6.789552688598633, -6.225705623626709, -5.661858558654785, -5.098011016845703, -4.534163951873779, -3.9703168869018555, -3.4064698219299316, -2.8426225185394287, -2.278775215148926, -1.714928150177002, -1.1510810852050781, -0.5872337818145752, -0.023386478424072266, 0.5404605865478516, 1.104307770729065, 1.6681549549102783, 2.2320022583007812, 2.795849323272705, 3.359696388244629, 3.923543691635132, 4.487390995025635, 5.051238059997559, 5.615085124969482, 6.178932189941406, 6.742779731750488, 7.306626796722412, 7.870473861694336, 8.434321403503418, 8.9981689453125, 9.562015533447266, 10.125863075256348, 10.689709663391113, 11.253557205200195, 11.817403793334961, 12.381251335144043, 12.945098876953125, 13.50894546508789, 14.072793006896973, 14.636640548706055, 15.20048713684082, 15.764334678649902, 16.328182220458984, 16.89202880859375, 17.455875396728516, 18.019723892211914, 18.58357048034668]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 11.0, 8.0, 21.0, 12.0, 16.0, 21.0, 19.0, 29.0, 30.0, 27.0, 33.0, 34.0, 51.0, 111.0, 182.0, 74.0, 34.0, 36.0, 30.0, 35.0, 17.0, 18.0, 27.0, 21.0, 15.0, 8.0, 20.0, 13.0, 7.0, 5.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.206874847412109, -6.0015082359313965, -5.796141624450684, -5.5907745361328125, -5.3854079246521, -5.180041313171387, -4.974674701690674, -4.769308090209961, -4.56394100189209, -4.358574390411377, -4.153207778930664, -3.947840929031372, -3.74247407913208, -3.537107467651367, -3.3317408561706543, -3.1263740062713623, -2.9210073947906494, -2.7156407833099365, -2.5102739334106445, -2.3049073219299316, -2.0995404720306396, -1.8941738605499268, -1.6888071298599243, -1.4834403991699219, -1.2780736684799194, -1.072706937789917, -0.8673402070999146, -0.6619735360145569, -0.45660680532455444, -0.2512401342391968, -0.045873403549194336, 0.1594933271408081, 0.36486005783081055, 0.570226788520813, 0.7755935192108154, 0.9809601902961731, 1.1863269805908203, 1.3916935920715332, 1.5970603227615356, 1.802427053451538, 2.00779390335083, 2.213160514831543, 2.418527364730835, 2.623893976211548, 2.82926082611084, 3.0346274375915527, 3.2399940490722656, 3.4453608989715576, 3.6507275104522705, 3.8560941219329834, 4.061460971832275, 4.266827583312988, 4.472194194793701, 4.677560806274414, 4.882927894592285, 5.088294506072998, 5.293661117553711, 5.499027729034424, 5.704394340515137, 5.909761428833008, 6.115128040313721, 6.320494651794434, 6.5258612632751465, 6.731227874755859, 6.9365949630737305]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 12.0, 9.0, 14.0, 12.0, 29.0, 48.0, 77.0, 139.0, 274.0, 466.0, 921.0, 2229.0, 6480.0, 20959.0, 153581.0, 1384559.0, 2206382.0, 364843.0, 38547.0, 8830.0, 3125.0, 1254.0, 630.0, 340.0, 172.0, 116.0, 68.0, 53.0, 28.0, 20.0, 11.0, 12.0, 9.0, 5.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.646484375, -0.62432861328125, -0.6021728515625, -0.58001708984375, -0.557861328125, -0.53570556640625, -0.5135498046875, -0.49139404296875, -0.46923828125, -0.44708251953125, -0.4249267578125, -0.40277099609375, -0.380615234375, -0.35845947265625, -0.3363037109375, -0.31414794921875, -0.2919921875, -0.26983642578125, -0.2476806640625, -0.22552490234375, -0.203369140625, -0.18121337890625, -0.1590576171875, -0.13690185546875, -0.11474609375, -0.09259033203125, -0.0704345703125, -0.04827880859375, -0.026123046875, -0.00396728515625, 0.0181884765625, 0.04034423828125, 0.0625, 0.08465576171875, 0.1068115234375, 0.12896728515625, 0.151123046875, 0.17327880859375, 0.1954345703125, 0.21759033203125, 0.23974609375, 0.26190185546875, 0.2840576171875, 0.30621337890625, 0.328369140625, 0.35052490234375, 0.3726806640625, 0.39483642578125, 0.4169921875, 0.43914794921875, 0.4613037109375, 0.48345947265625, 0.505615234375, 0.52777099609375, 0.5499267578125, 0.57208251953125, 0.59423828125, 0.61639404296875, 0.6385498046875, 0.66070556640625, 0.682861328125, 0.70501708984375, 0.7271728515625, 0.74932861328125, 0.771484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 11.0, 12.0, 18.0, 14.0, 31.0, 37.0, 58.0, 69.0, 84.0, 63.0, 84.0, 91.0, 94.0, 78.0, 57.0, 47.0, 43.0, 31.0, 28.0, 11.0, 16.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.748046875, -0.7253799438476562, -0.7027130126953125, -0.6800460815429688, -0.657379150390625, -0.6347122192382812, -0.6120452880859375, -0.5893783569335938, -0.56671142578125, -0.5440444946289062, -0.5213775634765625, -0.49871063232421875, -0.476043701171875, -0.45337677001953125, -0.4307098388671875, -0.40804290771484375, -0.3853759765625, -0.36270904541015625, -0.3400421142578125, -0.31737518310546875, -0.294708251953125, -0.27204132080078125, -0.2493743896484375, -0.22670745849609375, -0.20404052734375, -0.18137359619140625, -0.1587066650390625, -0.13603973388671875, -0.113372802734375, -0.09070587158203125, -0.0680389404296875, -0.04537200927734375, -0.022705078125, -3.814697265625e-05, 0.0226287841796875, 0.04529571533203125, 0.067962646484375, 0.09062957763671875, 0.1132965087890625, 0.13596343994140625, 0.15863037109375, 0.18129730224609375, 0.2039642333984375, 0.22663116455078125, 0.249298095703125, 0.27196502685546875, 0.2946319580078125, 0.31729888916015625, 0.3399658203125, 0.36263275146484375, 0.3852996826171875, 0.40796661376953125, 0.430633544921875, 0.45330047607421875, 0.4759674072265625, 0.49863433837890625, 0.52130126953125, 0.5439682006835938, 0.5666351318359375, 0.5893020629882812, 0.611968994140625, 0.6346359252929688, 0.6573028564453125, 0.6799697875976562, 0.70263671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 10.0, 17.0, 27.0, 60.0, 115.0, 309.0, 923.0, 4326.0, 3665484.0, 518611.0, 3225.0, 715.0, 240.0, 98.0, 47.0, 29.0, 16.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.25689697265625, -4.1192626953125, -3.98162841796875, -3.843994140625, -3.70635986328125, -3.5687255859375, -3.43109130859375, -3.29345703125, -3.15582275390625, -3.0181884765625, -2.88055419921875, -2.742919921875, -2.60528564453125, -2.4676513671875, -2.33001708984375, -2.1923828125, -2.05474853515625, -1.9171142578125, -1.77947998046875, -1.641845703125, -1.50421142578125, -1.3665771484375, -1.22894287109375, -1.09130859375, -0.95367431640625, -0.8160400390625, -0.67840576171875, -0.540771484375, -0.40313720703125, -0.2655029296875, -0.12786865234375, 0.009765625, 0.14739990234375, 0.2850341796875, 0.42266845703125, 0.560302734375, 0.69793701171875, 0.8355712890625, 0.97320556640625, 1.11083984375, 1.24847412109375, 1.3861083984375, 1.52374267578125, 1.661376953125, 1.79901123046875, 1.9366455078125, 2.07427978515625, 2.2119140625, 2.34954833984375, 2.4871826171875, 2.62481689453125, 2.762451171875, 2.90008544921875, 3.0377197265625, 3.17535400390625, 3.31298828125, 3.45062255859375, 3.5882568359375, 3.72589111328125, 3.863525390625, 4.00115966796875, 4.1387939453125, 4.27642822265625, 4.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 12.0, 10.0, 31.0, 55.0, 108.0, 234.0, 573.0, 1168.0, 1000.0, 459.0, 212.0, 90.0, 43.0, 20.0, 21.0, 10.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.282989501953125, -3.20465087890625, -3.126312255859375, -3.0479736328125, -2.969635009765625, -2.89129638671875, -2.812957763671875, -2.734619140625, -2.656280517578125, -2.57794189453125, -2.499603271484375, -2.4212646484375, -2.342926025390625, -2.26458740234375, -2.186248779296875, -2.10791015625, -2.029571533203125, -1.95123291015625, -1.872894287109375, -1.7945556640625, -1.716217041015625, -1.63787841796875, -1.559539794921875, -1.481201171875, -1.402862548828125, -1.32452392578125, -1.246185302734375, -1.1678466796875, -1.089508056640625, -1.01116943359375, -0.932830810546875, -0.8544921875, -0.776153564453125, -0.69781494140625, -0.619476318359375, -0.5411376953125, -0.462799072265625, -0.38446044921875, -0.306121826171875, -0.227783203125, -0.149444580078125, -0.07110595703125, 0.007232666015625, 0.0855712890625, 0.163909912109375, 0.24224853515625, 0.320587158203125, 0.39892578125, 0.477264404296875, 0.55560302734375, 0.633941650390625, 0.7122802734375, 0.790618896484375, 0.86895751953125, 0.947296142578125, 1.025634765625, 1.103973388671875, 1.18231201171875, 1.260650634765625, 1.3389892578125, 1.417327880859375, 1.49566650390625, 1.574005126953125, 1.65234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 6.0, 10.0, 17.0, 19.0, 38.0, 71.0, 152.0, 225.0, 225.0, 123.0, 49.0, 27.0, 11.0, 4.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.177806854248047, -15.654191970825195, -15.130577087402344, -14.606961250305176, -14.083346366882324, -13.559731483459473, -13.036115646362305, -12.512500762939453, -11.988885879516602, -11.46527099609375, -10.941656112670898, -10.41804027557373, -9.894425392150879, -9.370810508728027, -8.84719467163086, -8.323579788208008, -7.799964904785156, -7.276350021362305, -6.752734661102295, -6.229119300842285, -5.705504417419434, -5.181889533996582, -4.658274173736572, -4.1346588134765625, -3.611043930053711, -3.0874288082122803, -2.5638136863708496, -2.040198564529419, -1.5165834426879883, -0.9929683208465576, -0.46935319900512695, 0.05426192283630371, 0.5778770446777344, 1.101492166519165, 1.6251072883605957, 2.1487224102020264, 2.672337532043457, 3.1959526538848877, 3.7195677757263184, 4.243183135986328, 4.76679801940918, 5.290412902832031, 5.814028263092041, 6.337643623352051, 6.861258506774902, 7.384873390197754, 7.908488750457764, 8.432104110717773, 8.955718994140625, 9.479333877563477, 10.002948760986328, 10.526564598083496, 11.050179481506348, 11.5737943649292, 12.097410202026367, 12.621025085449219, 13.14463996887207, 13.668254852294922, 14.191869735717773, 14.715485572814941, 15.239100456237793, 15.762715339660645, 16.286331176757812, 16.809946060180664, 17.333560943603516]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 5.0, 8.0, 20.0, 28.0, 32.0, 35.0, 47.0, 53.0, 52.0, 67.0, 90.0, 86.0, 73.0, 80.0, 69.0, 48.0, 48.0, 31.0, 22.0, 24.0, 14.0, 19.0, 15.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.463289260864258, -9.098551750183105, -8.73381519317627, -8.369077682495117, -8.004341125488281, -7.639603614807129, -7.274866580963135, -6.910129547119141, -6.5453925132751465, -6.180655479431152, -5.815918445587158, -5.451181411743164, -5.086443901062012, -4.721707344055176, -4.356969833374023, -3.9922327995300293, -3.627495765686035, -3.262758731842041, -2.898021697998047, -2.5332844257354736, -2.1685473918914795, -1.8038103580474854, -1.439073085784912, -1.074336051940918, -0.7095990180969238, -0.3448619246482849, 0.019875168800354004, 0.3846123218536377, 0.7493493556976318, 1.114086389541626, 1.4788236618041992, 1.8435606956481934, 2.208296775817871, 2.5730338096618652, 2.9377708435058594, 3.3025081157684326, 3.6672451496124268, 4.031982421875, 4.396719455718994, 4.761456489562988, 5.126193523406982, 5.490930557250977, 5.855667591094971, 6.220404624938965, 6.585142135620117, 6.949878692626953, 7.3146162033081055, 7.6793532371521, 8.044090270996094, 8.408827781677246, 8.773564338684082, 9.138301849365234, 9.50303840637207, 9.867775917053223, 10.232513427734375, 10.597249984741211, 10.961986541748047, 11.3267240524292, 11.691460609436035, 12.056198120117188, 12.420934677124023, 12.785672187805176, 13.150409698486328, 13.515146255493164, 13.879883766174316]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 9.0, 3.0, 10.0, 9.0, 23.0, 22.0, 18.0, 49.0, 78.0, 106.0, 217.0, 404.0, 816.0, 1871.0, 5164.0, 18007.0, 95168.0, 727433.0, 161653.0, 26094.0, 6909.0, 2380.0, 977.0, 467.0, 243.0, 133.0, 99.0, 59.0, 45.0, 31.0, 24.0, 20.0, 8.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9111328125, -0.88232421875, -0.853515625, -0.82470703125, -0.7958984375, -0.76708984375, -0.73828125, -0.70947265625, -0.6806640625, -0.65185546875, -0.623046875, -0.59423828125, -0.5654296875, -0.53662109375, -0.5078125, -0.47900390625, -0.4501953125, -0.42138671875, -0.392578125, -0.36376953125, -0.3349609375, -0.30615234375, -0.27734375, -0.24853515625, -0.2197265625, -0.19091796875, -0.162109375, -0.13330078125, -0.1044921875, -0.07568359375, -0.046875, -0.01806640625, 0.0107421875, 0.03955078125, 0.068359375, 0.09716796875, 0.1259765625, 0.15478515625, 0.18359375, 0.21240234375, 0.2412109375, 0.27001953125, 0.298828125, 0.32763671875, 0.3564453125, 0.38525390625, 0.4140625, 0.44287109375, 0.4716796875, 0.50048828125, 0.529296875, 0.55810546875, 0.5869140625, 0.61572265625, 0.64453125, 0.67333984375, 0.7021484375, 0.73095703125, 0.759765625, 0.78857421875, 0.8173828125, 0.84619140625, 0.875, 0.90380859375, 0.9326171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 3.0, 6.0, 7.0, 13.0, 27.0, 38.0, 47.0, 67.0, 84.0, 99.0, 100.0, 98.0, 97.0, 87.0, 78.0, 46.0, 37.0, 17.0, 17.0, 15.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.021484375, -0.9906158447265625, -0.959747314453125, -0.9288787841796875, -0.89801025390625, -0.8671417236328125, -0.836273193359375, -0.8054046630859375, -0.7745361328125, -0.7436676025390625, -0.712799072265625, -0.6819305419921875, -0.65106201171875, -0.6201934814453125, -0.589324951171875, -0.5584564208984375, -0.527587890625, -0.4967193603515625, -0.465850830078125, -0.4349822998046875, -0.40411376953125, -0.3732452392578125, -0.342376708984375, -0.3115081787109375, -0.2806396484375, -0.2497711181640625, -0.218902587890625, -0.1880340576171875, -0.15716552734375, -0.1262969970703125, -0.095428466796875, -0.0645599365234375, -0.03369140625, -0.0028228759765625, 0.028045654296875, 0.0589141845703125, 0.08978271484375, 0.1206512451171875, 0.151519775390625, 0.1823883056640625, 0.2132568359375, 0.2441253662109375, 0.274993896484375, 0.3058624267578125, 0.33673095703125, 0.3675994873046875, 0.398468017578125, 0.4293365478515625, 0.460205078125, 0.4910736083984375, 0.521942138671875, 0.5528106689453125, 0.58367919921875, 0.6145477294921875, 0.645416259765625, 0.6762847900390625, 0.7071533203125, 0.7380218505859375, 0.768890380859375, 0.7997589111328125, 0.83062744140625, 0.8614959716796875, 0.892364501953125, 0.9232330322265625, 0.9541015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 10.0, 14.0, 21.0, 33.0, 37.0, 63.0, 113.0, 158.0, 314.0, 549.0, 1394.0, 6492.0, 85829.0, 922179.0, 25746.0, 3343.0, 1031.0, 455.0, 259.0, 157.0, 95.0, 54.0, 58.0, 37.0, 25.0, 13.0, 13.0, 9.0, 7.0, 6.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.02734375, -0.98828125, -0.94921875, -0.91015625, -0.87109375, -0.83203125, -0.79296875, -0.75390625, -0.71484375, -0.67578125, -0.63671875, -0.59765625, -0.55859375, -0.51953125, -0.48046875, -0.44140625, -0.40234375, -0.36328125, -0.32421875, -0.28515625, -0.24609375, -0.20703125, -0.16796875, -0.12890625, -0.08984375, -0.05078125, -0.01171875, 0.02734375, 0.06640625, 0.10546875, 0.14453125, 0.18359375, 0.22265625, 0.26171875, 0.30078125, 0.33984375, 0.37890625, 0.41796875, 0.45703125, 0.49609375, 0.53515625, 0.57421875, 0.61328125, 0.65234375, 0.69140625, 0.73046875, 0.76953125, 0.80859375, 0.84765625, 0.88671875, 0.92578125, 0.96484375, 1.00390625, 1.04296875, 1.08203125, 1.12109375, 1.16015625, 1.19921875, 1.23828125, 1.27734375, 1.31640625, 1.35546875, 1.39453125, 1.43359375, 1.47265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 8.0, 4.0, 7.0, 7.0, 7.0, 21.0, 18.0, 23.0, 13.0, 32.0, 34.0, 44.0, 51.0, 66.0, 68.0, 64.0, 83.0, 72.0, 55.0, 47.0, 35.0, 41.0, 31.0, 23.0, 31.0, 22.0, 19.0, 13.0, 11.0, 11.0, 6.0, 5.0, 4.0, 5.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7902984619140625, -1.726104736328125, -1.6619110107421875, -1.59771728515625, -1.5335235595703125, -1.469329833984375, -1.4051361083984375, -1.3409423828125, -1.2767486572265625, -1.212554931640625, -1.1483612060546875, -1.08416748046875, -1.0199737548828125, -0.955780029296875, -0.8915863037109375, -0.827392578125, -0.7631988525390625, -0.699005126953125, -0.6348114013671875, -0.57061767578125, -0.5064239501953125, -0.442230224609375, -0.3780364990234375, -0.3138427734375, -0.2496490478515625, -0.185455322265625, -0.1212615966796875, -0.05706787109375, 0.0071258544921875, 0.071319580078125, 0.1355133056640625, 0.19970703125, 0.2639007568359375, 0.328094482421875, 0.3922882080078125, 0.45648193359375, 0.5206756591796875, 0.584869384765625, 0.6490631103515625, 0.7132568359375, 0.7774505615234375, 0.841644287109375, 0.9058380126953125, 0.97003173828125, 1.0342254638671875, 1.098419189453125, 1.1626129150390625, 1.226806640625, 1.2910003662109375, 1.355194091796875, 1.4193878173828125, 1.48358154296875, 1.5477752685546875, 1.611968994140625, 1.6761627197265625, 1.7403564453125, 1.8045501708984375, 1.868743896484375, 1.9329376220703125, 1.99713134765625, 2.0613250732421875, 2.125518798828125, 2.1897125244140625, 2.25390625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 3.0, 7.0, 4.0, 8.0, 11.0, 15.0, 17.0, 26.0, 48.0, 61.0, 87.0, 150.0, 289.0, 636.0, 1798.0, 7549.0, 87477.0, 922487.0, 22280.0, 3536.0, 1056.0, 412.0, 221.0, 132.0, 71.0, 45.0, 30.0, 16.0, 15.0, 11.0, 10.0, 12.0, 11.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2451171875, -0.2379627227783203, -0.23080825805664062, -0.22365379333496094, -0.21649932861328125, -0.20934486389160156, -0.20219039916992188, -0.1950359344482422, -0.1878814697265625, -0.1807270050048828, -0.17357254028320312, -0.16641807556152344, -0.15926361083984375, -0.15210914611816406, -0.14495468139648438, -0.1378002166748047, -0.130645751953125, -0.12349128723144531, -0.11633682250976562, -0.10918235778808594, -0.10202789306640625, -0.09487342834472656, -0.08771896362304688, -0.08056449890136719, -0.0734100341796875, -0.06625556945800781, -0.059101104736328125, -0.05194664001464844, -0.04479217529296875, -0.03763771057128906, -0.030483245849609375, -0.023328781127929688, -0.01617431640625, -0.009019851684570312, -0.001865386962890625, 0.0052890777587890625, 0.01244354248046875, 0.019598007202148438, 0.026752471923828125, 0.03390693664550781, 0.0410614013671875, 0.04821586608886719, 0.055370330810546875, 0.06252479553222656, 0.06967926025390625, 0.07683372497558594, 0.08398818969726562, 0.09114265441894531, 0.098297119140625, 0.10545158386230469, 0.11260604858398438, 0.11976051330566406, 0.12691497802734375, 0.13406944274902344, 0.14122390747070312, 0.1483783721923828, 0.1555328369140625, 0.1626873016357422, 0.16984176635742188, 0.17699623107910156, 0.18415069580078125, 0.19130516052246094, 0.19845962524414062, 0.2056140899658203, 0.2127685546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 14.0, 5.0, 5.0, 13.0, 16.0, 25.0, 31.0, 37.0, 52.0, 84.0, 102.0, 109.0, 124.0, 102.0, 69.0, 57.0, 44.0, 24.0, 17.0, 14.0, 10.0, 18.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737211227416992e-05, -3.620237112045288e-05, -3.503262996673584e-05, -3.38628888130188e-05, -3.269314765930176e-05, -3.152340650558472e-05, -3.0353665351867676e-05, -2.9183924198150635e-05, -2.8014183044433594e-05, -2.6844441890716553e-05, -2.5674700736999512e-05, -2.450495958328247e-05, -2.333521842956543e-05, -2.216547727584839e-05, -2.0995736122131348e-05, -1.9825994968414307e-05, -1.8656253814697266e-05, -1.7486512660980225e-05, -1.6316771507263184e-05, -1.5147030353546143e-05, -1.3977289199829102e-05, -1.280754804611206e-05, -1.163780689239502e-05, -1.0468065738677979e-05, -9.298324584960938e-06, -8.128583431243896e-06, -6.9588422775268555e-06, -5.7891011238098145e-06, -4.6193599700927734e-06, -3.4496188163757324e-06, -2.2798776626586914e-06, -1.1101365089416504e-06, 5.960464477539063e-08, 1.2293457984924316e-06, 2.3990869522094727e-06, 3.5688281059265137e-06, 4.738569259643555e-06, 5.908310413360596e-06, 7.078051567077637e-06, 8.247792720794678e-06, 9.417533874511719e-06, 1.058727502822876e-05, 1.17570161819458e-05, 1.2926757335662842e-05, 1.4096498489379883e-05, 1.5266239643096924e-05, 1.6435980796813965e-05, 1.7605721950531006e-05, 1.8775463104248047e-05, 1.9945204257965088e-05, 2.111494541168213e-05, 2.228468656539917e-05, 2.345442771911621e-05, 2.4624168872833252e-05, 2.5793910026550293e-05, 2.6963651180267334e-05, 2.8133392333984375e-05, 2.9303133487701416e-05, 3.0472874641418457e-05, 3.16426157951355e-05, 3.281235694885254e-05, 3.398209810256958e-05, 3.515183925628662e-05, 3.632158041000366e-05, 3.74913215637207e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 6.0, 6.0, 11.0, 27.0, 31.0, 43.0, 104.0, 188.0, 341.0, 747.0, 1772.0, 4962.0, 19621.0, 175400.0, 802643.0, 31693.0, 7015.0, 2152.0, 820.0, 401.0, 229.0, 114.0, 75.0, 40.0, 24.0, 17.0, 13.0, 6.0, 5.0, 8.0, 2.0, 3.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12384033203125, -0.11943912506103516, -0.11503791809082031, -0.11063671112060547, -0.10623550415039062, -0.10183429718017578, -0.09743309020996094, -0.0930318832397461, -0.08863067626953125, -0.0842294692993164, -0.07982826232910156, -0.07542705535888672, -0.07102584838867188, -0.06662464141845703, -0.06222343444824219, -0.057822227478027344, -0.0534210205078125, -0.049019813537597656, -0.04461860656738281, -0.04021739959716797, -0.035816192626953125, -0.03141498565673828, -0.027013778686523438, -0.022612571716308594, -0.01821136474609375, -0.013810157775878906, -0.009408950805664062, -0.005007743835449219, -0.000606536865234375, 0.0037946701049804688, 0.008195877075195312, 0.012597084045410156, 0.016998291015625, 0.021399497985839844, 0.025800704956054688, 0.03020191192626953, 0.034603118896484375, 0.03900432586669922, 0.04340553283691406, 0.047806739807128906, 0.05220794677734375, 0.056609153747558594, 0.06101036071777344, 0.06541156768798828, 0.06981277465820312, 0.07421398162841797, 0.07861518859863281, 0.08301639556884766, 0.0874176025390625, 0.09181880950927734, 0.09622001647949219, 0.10062122344970703, 0.10502243041992188, 0.10942363739013672, 0.11382484436035156, 0.1182260513305664, 0.12262725830078125, 0.1270284652709961, 0.13142967224121094, 0.13583087921142578, 0.14023208618164062, 0.14463329315185547, 0.1490345001220703, 0.15343570709228516, 0.1578369140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 6.0, 9.0, 8.0, 9.0, 17.0, 29.0, 38.0, 45.0, 81.0, 92.0, 122.0, 135.0, 99.0, 77.0, 62.0, 45.0, 26.0, 16.0, 11.0, 9.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.125, -0.119842529296875, -0.11468505859375, -0.109527587890625, -0.1043701171875, -0.099212646484375, -0.09405517578125, -0.088897705078125, -0.083740234375, -0.078582763671875, -0.07342529296875, -0.068267822265625, -0.0631103515625, -0.057952880859375, -0.05279541015625, -0.047637939453125, -0.04248046875, -0.037322998046875, -0.03216552734375, -0.027008056640625, -0.0218505859375, -0.016693115234375, -0.01153564453125, -0.006378173828125, -0.001220703125, 0.003936767578125, 0.00909423828125, 0.014251708984375, 0.0194091796875, 0.024566650390625, 0.02972412109375, 0.034881591796875, 0.0400390625, 0.045196533203125, 0.05035400390625, 0.055511474609375, 0.0606689453125, 0.065826416015625, 0.07098388671875, 0.076141357421875, 0.081298828125, 0.086456298828125, 0.09161376953125, 0.096771240234375, 0.1019287109375, 0.107086181640625, 0.11224365234375, 0.117401123046875, 0.12255859375, 0.127716064453125, 0.13287353515625, 0.138031005859375, 0.1431884765625, 0.148345947265625, 0.15350341796875, 0.158660888671875, 0.163818359375, 0.168975830078125, 0.17413330078125, 0.179290771484375, 0.1844482421875, 0.189605712890625, 0.19476318359375, 0.199920654296875, 0.205078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 18.0, 43.0, 121.0, 626.0, 110.0, 49.0, 23.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.510433197021484, -9.08431625366211, -8.658199310302734, -8.23208236694336, -7.805965423583984, -7.379848480224609, -6.953731060028076, -6.527614116668701, -6.101497173309326, -5.675380229949951, -5.249263286590576, -4.823145866394043, -4.397028923034668, -3.970912218093872, -3.544795036315918, -3.118678092956543, -2.692561149597168, -2.266444206237793, -1.8403271436691284, -1.4142100811004639, -0.9880931377410889, -0.5619761943817139, -0.13585901260375977, 0.29025793075561523, 0.7163748741149902, 1.1424918174743652, 1.5686088800430298, 1.9947259426116943, 2.4208428859710693, 2.8469598293304443, 3.2730770111083984, 3.6991939544677734, 4.125310897827148, 4.551427841186523, 4.977544784545898, 5.403661727905273, 5.829778671264648, 6.255895614624023, 6.682013034820557, 7.108129978179932, 7.534246921539307, 7.960363864898682, 8.386481285095215, 8.81259822845459, 9.238715171813965, 9.66483211517334, 10.090949058532715, 10.51706600189209, 10.943182945251465, 11.36929988861084, 11.795416831970215, 12.22153377532959, 12.647650718688965, 13.07376766204834, 13.499885559082031, 13.926002502441406, 14.352119445800781, 14.778236389160156, 15.204353332519531, 15.630470275878906, 16.05658721923828, 16.482704162597656, 16.90882110595703, 17.334938049316406, 17.76105499267578]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 14.0, 10.0, 11.0, 13.0, 19.0, 19.0, 32.0, 25.0, 29.0, 41.0, 61.0, 422.0, 76.0, 35.0, 38.0, 23.0, 28.0, 17.0, 18.0, 16.0, 10.0, 9.0, 5.0, 8.0, 12.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.549214363098145, -10.295380592346191, -10.041546821594238, -9.787712097167969, -9.533878326416016, -9.280044555664062, -9.02621078491211, -8.772377014160156, -8.518543243408203, -8.26470947265625, -8.010875701904297, -7.7570414543151855, -7.503207683563232, -7.249373435974121, -6.995539665222168, -6.741705894470215, -6.4878716468811035, -6.23403787612915, -5.980203628540039, -5.726369857788086, -5.472536087036133, -5.21870231628418, -4.964868068695068, -4.711034297943115, -4.457200050354004, -4.203366279602051, -3.9495322704315186, -3.6956982612609863, -3.441864490509033, -3.188030481338501, -2.9341964721679688, -2.6803627014160156, -2.4265289306640625, -2.1726949214935303, -1.9188611507415771, -1.665027141571045, -1.4111932516098022, -1.1573593616485596, -0.9035253524780273, -0.6496914625167847, -0.395857572555542, -0.14202365279197693, 0.11181026697158813, 0.3656442165374756, 0.6194781064987183, 0.8733119964599609, 1.1271460056304932, 1.3809798955917358, 1.6348137855529785, 1.8886476755142212, 2.142481565475464, 2.396315574645996, 2.650149345397949, 2.9039833545684814, 3.1578173637390137, 3.411651134490967, 3.665485143661499, 3.9193191528320312, 4.173152923583984, 4.4269866943359375, 4.680820941925049, 4.934654712677002, 5.188488960266113, 5.442322731018066, 5.6961565017700195]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 6.0, 16.0, 11.0, 16.0, 15.0, 23.0, 22.0, 33.0, 47.0, 36.0, 113.0, 280.0, 92.0, 43.0, 39.0, 23.0, 25.0, 32.0, 23.0, 15.0, 14.0, 8.0, 8.0, 9.0, 12.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.5631637573242188, -0.5462493896484375, -0.5293350219726562, -0.512420654296875, -0.49550628662109375, -0.4785919189453125, -0.46167755126953125, -0.44476318359375, -0.42784881591796875, -0.4109344482421875, -0.39402008056640625, -0.377105712890625, -0.36019134521484375, -0.3432769775390625, -0.32636260986328125, -0.3094482421875, -0.29253387451171875, -0.2756195068359375, -0.25870513916015625, -0.241790771484375, -0.22487640380859375, -0.2079620361328125, -0.19104766845703125, -0.17413330078125, -0.15721893310546875, -0.1403045654296875, -0.12339019775390625, -0.106475830078125, -0.08956146240234375, -0.0726470947265625, -0.05573272705078125, -0.038818359375, -0.02190399169921875, -0.0049896240234375, 0.01192474365234375, 0.028839111328125, 0.04575347900390625, 0.0626678466796875, 0.07958221435546875, 0.09649658203125, 0.11341094970703125, 0.1303253173828125, 0.14723968505859375, 0.164154052734375, 0.18106842041015625, 0.1979827880859375, 0.21489715576171875, 0.2318115234375, 0.24872589111328125, 0.2656402587890625, 0.28255462646484375, 0.299468994140625, 0.31638336181640625, 0.3332977294921875, 0.35021209716796875, 0.36712646484375, 0.38404083251953125, 0.4009552001953125, 0.41786956787109375, 0.434783935546875, 0.45169830322265625, 0.4686126708984375, 0.48552703857421875, 0.50244140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 12.0, 18.0, 21.0, 17.0, 38.0, 59.0, 108.0, 247.0, 567.0, 1998.0, 18255.0, 8357651.0, 7508.0, 1256.0, 401.0, 158.0, 89.0, 64.0, 27.0, 15.0, 5.0, 9.0, 15.0, 3.0, 0.0, 8.0, 1.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-5.078289985656738, -4.905268669128418, -4.732247829437256, -4.5592265129089355, -4.386205196380615, -4.213184356689453, -4.040163040161133, -3.8671417236328125, -3.6941206455230713, -3.52109956741333, -3.3480782508850098, -3.1750571727752686, -3.0020360946655273, -2.829014778137207, -2.655993700027466, -2.4829726219177246, -2.3099513053894043, -2.136930227279663, -1.9639089107513428, -1.7908878326416016, -1.6178666353225708, -1.44484543800354, -1.2718243598937988, -1.098803162574768, -0.9257819652557373, -0.7527607679367065, -0.5797396302223206, -0.40671849250793457, -0.2336972951889038, -0.06067609786987305, 0.11234498023986816, 0.2853661775588989, 0.4583878517150879, 0.6314090490341187, 0.8044301867485046, 0.9774513244628906, 1.1504725217819214, 1.3234937191009521, 1.4965147972106934, 1.6695359945297241, 1.8425571918487549, 2.015578269958496, 2.1885995864868164, 2.3616206645965576, 2.534641742706299, 2.707663059234619, 2.8806841373443604, 3.0537052154541016, 3.226726531982422, 3.399747610092163, 3.5727689266204834, 3.7457900047302246, 3.918811321258545, 4.091832160949707, 4.264853477478027, 4.437874794006348, 4.610896110534668, 4.783917427062988, 4.95693826675415, 5.129959583282471, 5.302980899810791, 5.476001739501953, 5.649023056030273, 5.822044372558594, 5.995065212249756]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.025946140289307, -6.829422950744629, -6.632899761199951, -6.436376571655273, -6.239853858947754, -6.043330669403076, -5.846807479858398, -5.650284290313721, -5.453761100769043, -5.257237911224365, -5.0607147216796875, -4.864192008972168, -4.66766881942749, -4.4711456298828125, -4.274622440338135, -4.078099250793457, -3.8815762996673584, -3.6850531101226807, -3.488530158996582, -3.2920069694519043, -3.0954837799072266, -2.898960590362549, -2.70243763923645, -2.5059144496917725, -2.309391498565674, -2.112868309020996, -1.916345238685608, -1.7198221683502197, -1.523298978805542, -1.3267759084701538, -1.1302528381347656, -0.9337296485900879, -0.7372064590454102, -0.5406833291053772, -0.3441602289676666, -0.14763712882995605, 0.048886001110076904, 0.24540913105010986, 0.44193220138549805, 0.6384553909301758, 0.834978461265564, 1.0315015316009521, 1.2280247211456299, 1.424547791481018, 1.6210708618164062, 1.817594051361084, 2.0141172409057617, 2.2106404304504395, 2.407163381576538, 2.603686571121216, 2.8002095222473145, 2.996732711791992, 3.19325590133667, 3.3897790908813477, 3.5863020420074463, 3.782825231552124, 3.9793481826782227, 4.1758713722229, 4.372394561767578, 4.568917274475098, 4.765440464019775, 4.961963653564453, 5.158486843109131, 5.355010032653809, 5.551533222198486]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 3.0, 10.0, 19.0, 19.0, 29.0, 39.0, 53.0, 81.0, 119.0, 215.0, 350.0, 618.0, 1250.0, 2799.0, 7178.0, 19828.0, 59519.0, 170968.0, 170874.0, 58794.0, 19134.0, 6916.0, 2712.0, 1214.0, 597.0, 336.0, 196.0, 118.0, 88.0, 41.0, 40.0, 26.0, 24.0, 17.0, 4.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.150390625, -3.062896728515625, -2.97540283203125, -2.887908935546875, -2.8004150390625, -2.712921142578125, -2.62542724609375, -2.537933349609375, -2.450439453125, -2.362945556640625, -2.27545166015625, -2.187957763671875, -2.1004638671875, -2.012969970703125, -1.92547607421875, -1.837982177734375, -1.75048828125, -1.662994384765625, -1.57550048828125, -1.488006591796875, -1.4005126953125, -1.313018798828125, -1.22552490234375, -1.138031005859375, -1.050537109375, -0.963043212890625, -0.87554931640625, -0.788055419921875, -0.7005615234375, -0.613067626953125, -0.52557373046875, -0.438079833984375, -0.3505859375, -0.263092041015625, -0.17559814453125, -0.088104248046875, -0.0006103515625, 0.086883544921875, 0.17437744140625, 0.261871337890625, 0.349365234375, 0.436859130859375, 0.52435302734375, 0.611846923828125, 0.6993408203125, 0.786834716796875, 0.87432861328125, 0.961822509765625, 1.04931640625, 1.136810302734375, 1.22430419921875, 1.311798095703125, 1.3992919921875, 1.486785888671875, 1.57427978515625, 1.661773681640625, 1.749267578125, 1.836761474609375, 1.92425537109375, 2.011749267578125, 2.0992431640625, 2.186737060546875, 2.27423095703125, 2.361724853515625, 2.44921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 9.0, 15.0, 21.0, 37.0, 38.0, 65.0, 94.0, 112.0, 157.0, 141.0, 112.0, 60.0, 52.0, 28.0, 23.0, 15.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1904296875, -1.155120849609375, -1.11981201171875, -1.084503173828125, -1.0491943359375, -1.013885498046875, -0.97857666015625, -0.943267822265625, -0.907958984375, -0.872650146484375, -0.83734130859375, -0.802032470703125, -0.7667236328125, -0.731414794921875, -0.69610595703125, -0.660797119140625, -0.62548828125, -0.590179443359375, -0.55487060546875, -0.519561767578125, -0.4842529296875, -0.448944091796875, -0.41363525390625, -0.378326416015625, -0.343017578125, -0.307708740234375, -0.27239990234375, -0.237091064453125, -0.2017822265625, -0.166473388671875, -0.13116455078125, -0.095855712890625, -0.060546875, -0.025238037109375, 0.01007080078125, 0.045379638671875, 0.0806884765625, 0.115997314453125, 0.15130615234375, 0.186614990234375, 0.221923828125, 0.257232666015625, 0.29254150390625, 0.327850341796875, 0.3631591796875, 0.398468017578125, 0.43377685546875, 0.469085693359375, 0.50439453125, 0.539703369140625, 0.57501220703125, 0.610321044921875, 0.6456298828125, 0.680938720703125, 0.71624755859375, 0.751556396484375, 0.786865234375, 0.822174072265625, 0.85748291015625, 0.892791748046875, 0.9281005859375, 0.963409423828125, 0.99871826171875, 1.034027099609375, 1.0693359375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 3.0, 11.0, 19.0, 33.0, 54.0, 101.0, 104.0, 69.0, 34.0, 13.0, 9.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.014385223388672, -2.877683162689209, -2.740981101989746, -2.604279041290283, -2.4675769805908203, -2.3308749198913574, -2.1941728591918945, -2.0574707984924316, -1.9207688570022583, -1.7840667963027954, -1.6473647356033325, -1.5106627941131592, -1.3739607334136963, -1.2372586727142334, -1.1005566120147705, -0.9638545513153076, -0.8271524906158447, -0.6904504299163818, -0.553748369216919, -0.41704636812210083, -0.28034430742263794, -0.14364224672317505, -0.006940245628356934, 0.12976181507110596, 0.26646387577056885, 0.40316593647003174, 0.5398679971694946, 0.6765699982643127, 0.8132720589637756, 0.9499741196632385, 1.0866761207580566, 1.2233781814575195, 1.3600802421569824, 1.4967823028564453, 1.6334843635559082, 1.770186424255371, 1.906888484954834, 2.043590545654297, 2.1802926063537598, 2.3169946670532227, 2.4536967277526855, 2.5903987884521484, 2.7271008491516113, 2.863802909851074, 3.000504970550537, 3.13720703125, 3.273909091949463, 3.410611152648926, 3.5473129749298096, 3.6840150356292725, 3.8207170963287354, 3.9574191570281982, 4.094120979309082, 4.230823040008545, 4.367525100708008, 4.504227161407471, 4.640929222106934, 4.7776312828063965, 4.914333343505859, 5.051035404205322, 5.187737464904785, 5.324439525604248, 5.461141586303711, 5.597843647003174, 5.734545707702637]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 3.0, 14.0, 26.0, 63.0, 133.0, 105.0, 51.0, 26.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.935749530792236, -5.798346042633057, -5.660942554473877, -5.5235395431518555, -5.386136054992676, -5.248732566833496, -5.111329078674316, -4.973925590515137, -4.836522579193115, -4.6991190910339355, -4.561715602874756, -4.424312591552734, -4.286909103393555, -4.149505615234375, -4.012102127075195, -3.8746988773345947, -3.737295389175415, -3.5998919010162354, -3.4624886512756348, -3.325085163116455, -3.1876819133758545, -3.050278425216675, -2.912875175476074, -2.7754716873168945, -2.638068199157715, -2.500664710998535, -2.3632614612579346, -2.225857973098755, -2.0884547233581543, -1.9510512351989746, -1.8136478662490845, -1.6762444972991943, -1.5388410091400146, -1.4014376401901245, -1.2640342712402344, -1.1266307830810547, -0.9892274737358093, -0.8518241047859192, -0.7144206762313843, -0.5770173072814941, -0.439613938331604, -0.30221056938171387, -0.16480717062950134, -0.02740377187728882, 0.10999959707260132, 0.24740296602249146, 0.38480639457702637, 0.5222097635269165, 0.6596131324768066, 0.7970165014266968, 0.9344198703765869, 1.0718233585357666, 1.2092266082763672, 1.3466300964355469, 1.484033465385437, 1.6214368343353271, 1.7588402032852173, 1.8962435722351074, 2.033647060394287, 2.1710503101348877, 2.3084537982940674, 2.445857048034668, 2.5832605361938477, 2.7206640243530273, 2.858067274093628]}, "train/train_runtime": 4795.9642, "train/train_samples_per_second": 5.95, "train/train_steps_per_second": 0.062, "train/total_flos": 0.0, "train/train_loss": 4.303745459225844} \ No newline at end of file