diff --git "a/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" "b/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" --- "a/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" +++ "b/wandb/run-20220312_150930-1rtl0j2u/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.0699, "train/learning_rate": 7.626484560570072e-05, "train/epoch": 5.61, "train/global_step": 5000, "_runtime": 31283, "_timestamp": 1647129053, "_step": 5001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 23.0, 63.0, 162.0, 249.0, 280.0, 120.0, 67.0, 28.0, 12.0, 5.0, 3.0], "bins": [-165.30477905273438, -162.4090576171875, -159.51333618164062, -156.61761474609375, -153.72189331054688, -150.826171875, -147.93045043945312, -145.03472900390625, -142.13900756835938, -139.2432861328125, -136.34756469726562, -133.45184326171875, -130.55612182617188, -127.660400390625, -124.76467895507812, -121.86895751953125, -118.97322845458984, -116.07750701904297, -113.1817855834961, -110.28606414794922, -107.39034271240234, -104.49462127685547, -101.59889221191406, -98.70317077636719, -95.80744934082031, -92.91172790527344, -90.01600646972656, -87.12028503417969, -84.22456359863281, -81.32884216308594, -78.43312072753906, -75.53739929199219, -72.64167022705078, -69.7459487915039, -66.85022735595703, -63.954505920410156, -61.05878448486328, -58.163063049316406, -55.267337799072266, -52.37161636352539, -49.475894927978516, -46.58017349243164, -43.684452056884766, -40.788726806640625, -37.89300537109375, -34.997283935546875, -32.1015625, -29.205841064453125, -26.31011962890625, -23.414398193359375, -20.5186767578125, -17.622953414916992, -14.727231979370117, -11.831510543823242, -8.935787200927734, -6.040065765380859, -3.1443443298339844, -0.24862241744995117, 2.647099494934082, 5.542821884155273, 8.438543319702148, 11.334264755249023, 14.229988098144531, 17.125709533691406, 20.02143096923828]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 5.0, 6.0, 10.0, 15.0, 15.0, 19.0, 22.0, 28.0, 37.0, 28.0, 34.0, 44.0, 60.0, 49.0, 59.0, 57.0, 54.0, 53.0, 48.0, 49.0, 40.0, 43.0, 39.0, 30.0, 34.0, 26.0, 24.0, 12.0, 13.0, 10.0, 6.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.71501350402832, -25.8629207611084, -25.010828018188477, -24.158733367919922, -23.306640625, -22.454547882080078, -21.602455139160156, -20.750362396240234, -19.898269653320312, -19.04617691040039, -18.19408416748047, -17.341991424560547, -16.489896774291992, -15.63780403137207, -14.785711288452148, -13.933618545532227, -13.081524848937988, -12.229432106018066, -11.377338409423828, -10.525245666503906, -9.673152923583984, -8.821060180664062, -7.968966484069824, -7.116873741149902, -6.264780521392822, -5.412687301635742, -4.56059455871582, -3.7085013389587402, -2.8564083576202393, -2.0043153762817383, -1.1522221565246582, -0.30012941360473633, 0.5519638061523438, 1.4040567874908447, 2.2561497688293457, 3.108242988586426, 3.9603359699249268, 4.812428951263428, 5.664522171020508, 6.51661491394043, 7.36870813369751, 8.22080135345459, 9.072894096374512, 9.92498779296875, 10.777080535888672, 11.629173278808594, 12.481266021728516, 13.333358764648438, 14.185452461242676, 15.037545204162598, 15.889638900756836, 16.741731643676758, 17.59382438659668, 18.4459171295166, 19.298011779785156, 20.150104522705078, 21.002197265625, 21.854290008544922, 22.706382751464844, 23.558475494384766, 24.41057014465332, 25.262662887573242, 26.114755630493164, 26.966848373413086, 27.818941116333008]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 10.0, 14.0, 20.0, 26.0, 30.0, 33.0, 33.0, 45.0, 54.0, 63.0, 69.0, 55.0, 75.0, 66.0, 62.0, 53.0, 58.0, 43.0, 39.0, 40.0, 31.0, 18.0, 17.0, 9.0, 13.0, 5.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.663421630859375, -2.55926513671875, -2.455108642578125, -2.3509521484375, -2.246795654296875, -2.14263916015625, -2.038482666015625, -1.934326171875, -1.830169677734375, -1.72601318359375, -1.621856689453125, -1.5177001953125, -1.413543701171875, -1.30938720703125, -1.205230712890625, -1.10107421875, -0.996917724609375, -0.89276123046875, -0.788604736328125, -0.6844482421875, -0.580291748046875, -0.47613525390625, -0.371978759765625, -0.267822265625, -0.163665771484375, -0.05950927734375, 0.044647216796875, 0.1488037109375, 0.252960205078125, 0.35711669921875, 0.461273193359375, 0.5654296875, 0.669586181640625, 0.77374267578125, 0.877899169921875, 0.9820556640625, 1.086212158203125, 1.19036865234375, 1.294525146484375, 1.398681640625, 1.502838134765625, 1.60699462890625, 1.711151123046875, 1.8153076171875, 1.919464111328125, 2.02362060546875, 2.127777099609375, 2.23193359375, 2.336090087890625, 2.44024658203125, 2.544403076171875, 2.6485595703125, 2.752716064453125, 2.85687255859375, 2.961029052734375, 3.065185546875, 3.169342041015625, 3.27349853515625, 3.377655029296875, 3.4818115234375, 3.585968017578125, 3.69012451171875, 3.794281005859375, 3.8984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 0.0, 12.0, 21.0, 15.0, 40.0, 57.0, 84.0, 138.0, 230.0, 448.0, 899.0, 2038.0, 6331.0, 34454.0, 631336.0, 3426262.0, 76012.0, 10492.0, 2950.0, 1158.0, 541.0, 289.0, 183.0, 94.0, 71.0, 35.0, 32.0, 17.0, 12.0, 6.0, 11.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.61865234375, -19.8310546875, -19.04345703125, -18.255859375, -17.46826171875, -16.6806640625, -15.89306640625, -15.10546875, -14.31787109375, -13.5302734375, -12.74267578125, -11.955078125, -11.16748046875, -10.3798828125, -9.59228515625, -8.8046875, -8.01708984375, -7.2294921875, -6.44189453125, -5.654296875, -4.86669921875, -4.0791015625, -3.29150390625, -2.50390625, -1.71630859375, -0.9287109375, -0.14111328125, 0.646484375, 1.43408203125, 2.2216796875, 3.00927734375, 3.796875, 4.58447265625, 5.3720703125, 6.15966796875, 6.947265625, 7.73486328125, 8.5224609375, 9.31005859375, 10.09765625, 10.88525390625, 11.6728515625, 12.46044921875, 13.248046875, 14.03564453125, 14.8232421875, 15.61083984375, 16.3984375, 17.18603515625, 17.9736328125, 18.76123046875, 19.548828125, 20.33642578125, 21.1240234375, 21.91162109375, 22.69921875, 23.48681640625, 24.2744140625, 25.06201171875, 25.849609375, 26.63720703125, 27.4248046875, 28.21240234375, 29.0]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 11.0, 4.0, 9.0, 15.0, 21.0, 44.0, 90.0, 158.0, 292.0, 476.0, 930.0, 920.0, 491.0, 276.0, 152.0, 85.0, 48.0, 20.0, 14.0, 13.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.4407958984375, -17.928466796875, -17.4161376953125, -16.90380859375, -16.3914794921875, -15.879150390625, -15.3668212890625, -14.8544921875, -14.3421630859375, -13.829833984375, -13.3175048828125, -12.80517578125, -12.2928466796875, -11.780517578125, -11.2681884765625, -10.755859375, -10.2435302734375, -9.731201171875, -9.2188720703125, -8.70654296875, -8.1942138671875, -7.681884765625, -7.1695556640625, -6.6572265625, -6.1448974609375, -5.632568359375, -5.1202392578125, -4.60791015625, -4.0955810546875, -3.583251953125, -3.0709228515625, -2.55859375, -2.0462646484375, -1.533935546875, -1.0216064453125, -0.50927734375, 0.0030517578125, 0.515380859375, 1.0277099609375, 1.5400390625, 2.0523681640625, 2.564697265625, 3.0770263671875, 3.58935546875, 4.1016845703125, 4.614013671875, 5.1263427734375, 5.638671875, 6.1510009765625, 6.663330078125, 7.1756591796875, 7.68798828125, 8.2003173828125, 8.712646484375, 9.2249755859375, 9.7373046875, 10.2496337890625, 10.761962890625, 11.2742919921875, 11.78662109375, 12.2989501953125, 12.811279296875, 13.3236083984375, 13.8359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 9.0, 18.0, 39.0, 59.0, 96.0, 172.0, 380.0, 819.0, 2290.0, 13717.0, 330158.0, 3745881.0, 91509.0, 6463.0, 1455.0, 582.0, 289.0, 140.0, 72.0, 54.0, 26.0, 11.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.03125, -56.43408203125, -54.8369140625, -53.23974609375, -51.642578125, -50.04541015625, -48.4482421875, -46.85107421875, -45.25390625, -43.65673828125, -42.0595703125, -40.46240234375, -38.865234375, -37.26806640625, -35.6708984375, -34.07373046875, -32.4765625, -30.87939453125, -29.2822265625, -27.68505859375, -26.087890625, -24.49072265625, -22.8935546875, -21.29638671875, -19.69921875, -18.10205078125, -16.5048828125, -14.90771484375, -13.310546875, -11.71337890625, -10.1162109375, -8.51904296875, -6.921875, -5.32470703125, -3.7275390625, -2.13037109375, -0.533203125, 1.06396484375, 2.6611328125, 4.25830078125, 5.85546875, 7.45263671875, 9.0498046875, 10.64697265625, 12.244140625, 13.84130859375, 15.4384765625, 17.03564453125, 18.6328125, 20.22998046875, 21.8271484375, 23.42431640625, 25.021484375, 26.61865234375, 28.2158203125, 29.81298828125, 31.41015625, 33.00732421875, 34.6044921875, 36.20166015625, 37.798828125, 39.39599609375, 40.9931640625, 42.59033203125, 44.1875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 20.0, 83.0, 260.0, 419.0, 184.0, 35.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-178.97796630859375, -174.0478057861328, -169.1176300048828, -164.18746948242188, -159.25729370117188, -154.32713317871094, -149.39697265625, -144.466796875, -139.53663635253906, -134.60647583007812, -129.67630004882812, -124.74613952636719, -119.81597137451172, -114.88580322265625, -109.95564270019531, -105.02547454833984, -100.09530639648438, -95.1651382446289, -90.23497009277344, -85.3048095703125, -80.37464141845703, -75.44447326660156, -70.51431274414062, -65.58414459228516, -60.65397644042969, -55.72380828857422, -50.793643951416016, -45.86347961425781, -40.933311462402344, -36.003143310546875, -31.072978973388672, -26.14281463623047, -21.212646484375, -16.282480239868164, -11.352313995361328, -6.422147750854492, -1.4919815063476562, 3.4381847381591797, 8.368350982666016, 13.298515319824219, 18.228683471679688, 23.158849716186523, 28.08901596069336, 33.01918029785156, 37.94934844970703, 42.8795166015625, 47.8096809387207, 52.739845275878906, 57.670013427734375, 62.600181579589844, 67.53034973144531, 72.46051025390625, 77.39067840576172, 82.32084655761719, 87.25100708007812, 92.1811752319336, 97.11134338378906, 102.04151153564453, 106.9716796875, 111.90184020996094, 116.8320083618164, 121.76217651367188, 126.69233703613281, 131.62249755859375, 136.55267333984375]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 11.0, 7.0, 17.0, 17.0, 19.0, 28.0, 16.0, 29.0, 31.0, 29.0, 32.0, 34.0, 34.0, 29.0, 26.0, 27.0, 32.0, 26.0, 30.0, 37.0, 35.0, 39.0, 23.0, 26.0, 41.0, 33.0, 28.0, 30.0, 25.0, 22.0, 19.0, 33.0, 14.0, 19.0, 9.0, 8.0, 13.0, 7.0, 6.0, 1.0, 5.0, 1.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-30.16293716430664, -29.280155181884766, -28.397371292114258, -27.514589309692383, -26.631805419921875, -25.7490234375, -24.866241455078125, -23.983457565307617, -23.100675582885742, -22.217893600463867, -21.33510971069336, -20.452327728271484, -19.569543838500977, -18.6867618560791, -17.803977966308594, -16.92119598388672, -16.038414001464844, -15.155631065368652, -14.272848129272461, -13.390066146850586, -12.507283210754395, -11.624500274658203, -10.741717338562012, -9.85893440246582, -8.976150512695312, -8.093367576599121, -7.210585117340088, -6.3278021812438965, -5.445019721984863, -4.562236785888672, -3.6794538497924805, -2.7966713905334473, -1.913888931274414, -1.0311062335968018, -0.1483234167098999, 0.734459400177002, 1.6172420978546143, 2.5000247955322266, 3.382807731628418, 4.265590190887451, 5.148373126983643, 6.031156063079834, 6.913938522338867, 7.796721458435059, 8.67950439453125, 9.562286376953125, 10.445070266723633, 11.327852249145508, 12.2106351852417, 13.09341812133789, 13.976201057434082, 14.858983993530273, 15.741765975952148, 16.624549865722656, 17.50733184814453, 18.390113830566406, 19.272897720336914, 20.15567970275879, 21.038463592529297, 21.921245574951172, 22.80402946472168, 23.686811447143555, 24.569595336914062, 25.452377319335938, 26.335159301757812]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 11.0, 10.0, 13.0, 14.0, 21.0, 16.0, 23.0, 21.0, 27.0, 35.0, 32.0, 33.0, 31.0, 47.0, 50.0, 54.0, 39.0, 60.0, 54.0, 36.0, 33.0, 32.0, 38.0, 35.0, 35.0, 28.0, 29.0, 26.0, 21.0, 18.0, 13.0, 10.0, 12.0, 9.0, 7.0, 4.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9404296875, -1.8642425537109375, -1.788055419921875, -1.7118682861328125, -1.63568115234375, -1.5594940185546875, -1.483306884765625, -1.4071197509765625, -1.3309326171875, -1.2547454833984375, -1.178558349609375, -1.1023712158203125, -1.02618408203125, -0.9499969482421875, -0.873809814453125, -0.7976226806640625, -0.721435546875, -0.6452484130859375, -0.569061279296875, -0.4928741455078125, -0.41668701171875, -0.3404998779296875, -0.264312744140625, -0.1881256103515625, -0.1119384765625, -0.0357513427734375, 0.040435791015625, 0.1166229248046875, 0.19281005859375, 0.2689971923828125, 0.345184326171875, 0.4213714599609375, 0.49755859375, 0.5737457275390625, 0.649932861328125, 0.7261199951171875, 0.80230712890625, 0.8784942626953125, 0.954681396484375, 1.0308685302734375, 1.1070556640625, 1.1832427978515625, 1.259429931640625, 1.3356170654296875, 1.41180419921875, 1.4879913330078125, 1.564178466796875, 1.6403656005859375, 1.716552734375, 1.7927398681640625, 1.868927001953125, 1.9451141357421875, 2.02130126953125, 2.0974884033203125, 2.173675537109375, 2.2498626708984375, 2.3260498046875, 2.4022369384765625, 2.478424072265625, 2.5546112060546875, 2.63079833984375, 2.7069854736328125, 2.783172607421875, 2.8593597412109375, 2.935546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 21.0, 18.0, 41.0, 43.0, 64.0, 100.0, 143.0, 212.0, 316.0, 443.0, 662.0, 900.0, 1369.0, 2201.0, 3176.0, 4739.0, 7082.0, 10488.0, 16453.0, 24021.0, 36042.0, 53674.0, 77454.0, 106690.0, 134984.0, 144562.0, 124562.0, 94323.0, 66215.0, 45624.0, 30439.0, 20425.0, 13637.0, 9026.0, 6083.0, 4006.0, 2645.0, 1788.0, 1319.0, 814.0, 569.0, 368.0, 264.0, 192.0, 101.0, 85.0, 48.0, 46.0, 18.0, 19.0, 14.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.8583984375, -1.79901123046875, -1.7396240234375, -1.68023681640625, -1.620849609375, -1.56146240234375, -1.5020751953125, -1.44268798828125, -1.38330078125, -1.32391357421875, -1.2645263671875, -1.20513916015625, -1.145751953125, -1.08636474609375, -1.0269775390625, -0.96759033203125, -0.908203125, -0.84881591796875, -0.7894287109375, -0.73004150390625, -0.670654296875, -0.61126708984375, -0.5518798828125, -0.49249267578125, -0.43310546875, -0.37371826171875, -0.3143310546875, -0.25494384765625, -0.195556640625, -0.13616943359375, -0.0767822265625, -0.01739501953125, 0.0419921875, 0.10137939453125, 0.1607666015625, 0.22015380859375, 0.279541015625, 0.33892822265625, 0.3983154296875, 0.45770263671875, 0.51708984375, 0.57647705078125, 0.6358642578125, 0.69525146484375, 0.754638671875, 0.81402587890625, 0.8734130859375, 0.93280029296875, 0.9921875, 1.05157470703125, 1.1109619140625, 1.17034912109375, 1.229736328125, 1.28912353515625, 1.3485107421875, 1.40789794921875, 1.46728515625, 1.52667236328125, 1.5860595703125, 1.64544677734375, 1.704833984375, 1.76422119140625, 1.8236083984375, 1.88299560546875, 1.9423828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 16.0, 10.0, 19.0, 15.0, 18.0, 16.0, 29.0, 29.0, 33.0, 38.0, 47.0, 40.0, 39.0, 43.0, 33.0, 1069.0, 51.0, 51.0, 47.0, 51.0, 44.0, 43.0, 22.0, 32.0, 37.0, 24.0, 15.0, 17.0, 21.0, 15.0, 11.0, 6.0, 16.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.380859375, -3.28411865234375, -3.1873779296875, -3.09063720703125, -2.993896484375, -2.89715576171875, -2.8004150390625, -2.70367431640625, -2.60693359375, -2.51019287109375, -2.4134521484375, -2.31671142578125, -2.219970703125, -2.12322998046875, -2.0264892578125, -1.92974853515625, -1.8330078125, -1.73626708984375, -1.6395263671875, -1.54278564453125, -1.446044921875, -1.34930419921875, -1.2525634765625, -1.15582275390625, -1.05908203125, -0.96234130859375, -0.8656005859375, -0.76885986328125, -0.672119140625, -0.57537841796875, -0.4786376953125, -0.38189697265625, -0.28515625, -0.18841552734375, -0.0916748046875, 0.00506591796875, 0.101806640625, 0.19854736328125, 0.2952880859375, 0.39202880859375, 0.48876953125, 0.58551025390625, 0.6822509765625, 0.77899169921875, 0.875732421875, 0.97247314453125, 1.0692138671875, 1.16595458984375, 1.2626953125, 1.35943603515625, 1.4561767578125, 1.55291748046875, 1.649658203125, 1.74639892578125, 1.8431396484375, 1.93988037109375, 2.03662109375, 2.13336181640625, 2.2301025390625, 2.32684326171875, 2.423583984375, 2.52032470703125, 2.6170654296875, 2.71380615234375, 2.810546875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 11.0, 12.0, 20.0, 20.0, 32.0, 33.0, 62.0, 103.0, 143.0, 211.0, 334.0, 495.0, 749.0, 1224.0, 1884.0, 3136.0, 5151.0, 8617.0, 15060.0, 27488.0, 59130.0, 1131318.0, 721840.0, 57004.0, 26510.0, 14847.0, 8413.0, 4892.0, 3058.0, 1940.0, 1108.0, 725.0, 498.0, 313.0, 227.0, 155.0, 95.0, 90.0, 49.0, 45.0, 27.0, 13.0, 10.0, 13.0, 2.0, 6.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.609375, -4.4696044921875, -4.329833984375, -4.1900634765625, -4.05029296875, -3.9105224609375, -3.770751953125, -3.6309814453125, -3.4912109375, -3.3514404296875, -3.211669921875, -3.0718994140625, -2.93212890625, -2.7923583984375, -2.652587890625, -2.5128173828125, -2.373046875, -2.2332763671875, -2.093505859375, -1.9537353515625, -1.81396484375, -1.6741943359375, -1.534423828125, -1.3946533203125, -1.2548828125, -1.1151123046875, -0.975341796875, -0.8355712890625, -0.69580078125, -0.5560302734375, -0.416259765625, -0.2764892578125, -0.13671875, 0.0030517578125, 0.142822265625, 0.2825927734375, 0.42236328125, 0.5621337890625, 0.701904296875, 0.8416748046875, 0.9814453125, 1.1212158203125, 1.260986328125, 1.4007568359375, 1.54052734375, 1.6802978515625, 1.820068359375, 1.9598388671875, 2.099609375, 2.2393798828125, 2.379150390625, 2.5189208984375, 2.65869140625, 2.7984619140625, 2.938232421875, 3.0780029296875, 3.2177734375, 3.3575439453125, 3.497314453125, 3.6370849609375, 3.77685546875, 3.9166259765625, 4.056396484375, 4.1961669921875, 4.3359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 5.0, 7.0, 11.0, 4.0, 14.0, 15.0, 15.0, 19.0, 21.0, 31.0, 32.0, 49.0, 59.0, 71.0, 66.0, 65.0, 67.0, 72.0, 73.0, 59.0, 52.0, 39.0, 39.0, 25.0, 16.0, 14.0, 12.0, 9.0, 4.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.783203125, -0.76025390625, -0.7373046875, -0.71435546875, -0.69140625, -0.66845703125, -0.6455078125, -0.62255859375, -0.599609375, -0.57666015625, -0.5537109375, -0.53076171875, -0.5078125, -0.48486328125, -0.4619140625, -0.43896484375, -0.416015625, -0.39306640625, -0.3701171875, -0.34716796875, -0.32421875, -0.30126953125, -0.2783203125, -0.25537109375, -0.232421875, -0.20947265625, -0.1865234375, -0.16357421875, -0.140625, -0.11767578125, -0.0947265625, -0.07177734375, -0.048828125, -0.02587890625, -0.0029296875, 0.02001953125, 0.04296875, 0.06591796875, 0.0888671875, 0.11181640625, 0.134765625, 0.15771484375, 0.1806640625, 0.20361328125, 0.2265625, 0.24951171875, 0.2724609375, 0.29541015625, 0.318359375, 0.34130859375, 0.3642578125, 0.38720703125, 0.41015625, 0.43310546875, 0.4560546875, 0.47900390625, 0.501953125, 0.52490234375, 0.5478515625, 0.57080078125, 0.59375, 0.61669921875, 0.6396484375, 0.66259765625, 0.685546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 5.0, 12.0, 15.0, 18.0, 28.0, 34.0, 39.0, 49.0, 62.0, 78.0, 112.0, 149.0, 294.0, 439.0, 1996.0, 58954.0, 971861.0, 12342.0, 927.0, 345.0, 226.0, 149.0, 105.0, 79.0, 61.0, 27.0, 33.0, 19.0, 19.0, 9.0, 11.0, 11.0, 5.0, 6.0, 5.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4765625, -13.0838623046875, -12.691162109375, -12.2984619140625, -11.90576171875, -11.5130615234375, -11.120361328125, -10.7276611328125, -10.3349609375, -9.9422607421875, -9.549560546875, -9.1568603515625, -8.76416015625, -8.3714599609375, -7.978759765625, -7.5860595703125, -7.193359375, -6.8006591796875, -6.407958984375, -6.0152587890625, -5.62255859375, -5.2298583984375, -4.837158203125, -4.4444580078125, -4.0517578125, -3.6590576171875, -3.266357421875, -2.8736572265625, -2.48095703125, -2.0882568359375, -1.695556640625, -1.3028564453125, -0.91015625, -0.5174560546875, -0.124755859375, 0.2679443359375, 0.66064453125, 1.0533447265625, 1.446044921875, 1.8387451171875, 2.2314453125, 2.6241455078125, 3.016845703125, 3.4095458984375, 3.80224609375, 4.1949462890625, 4.587646484375, 4.9803466796875, 5.373046875, 5.7657470703125, 6.158447265625, 6.5511474609375, 6.94384765625, 7.3365478515625, 7.729248046875, 8.1219482421875, 8.5146484375, 8.9073486328125, 9.300048828125, 9.6927490234375, 10.08544921875, 10.4781494140625, 10.870849609375, 11.2635498046875, 11.65625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 13.0, 14.0, 32.0, 86.0, 168.0, 329.0, 205.0, 81.0, 37.0, 27.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2261810302734375, -5.029883861541748, -4.833586692810059, -4.637290000915527, -4.440992832183838, -4.244695663452148, -4.048398494720459, -3.8521013259887695, -3.655804395675659, -3.4595072269439697, -3.2632102966308594, -3.06691312789917, -2.8706159591674805, -2.67431902885437, -2.4780218601226807, -2.2817249298095703, -2.085427761077881, -1.889130711555481, -1.692833662033081, -1.4965364933013916, -1.3002394437789917, -1.1039423942565918, -0.9076452255249023, -0.7113481760025024, -0.5150511264801025, -0.31875404715538025, -0.12245696783065796, 0.07384014129638672, 0.2701371908187866, 0.4664342403411865, 0.662731409072876, 0.8590284585952759, 1.0553255081176758, 1.2516225576400757, 1.4479196071624756, 1.644216775894165, 1.840513825416565, 2.036810874938965, 2.2331080436706543, 2.4294052124023438, 2.625702142715454, 2.8219993114471436, 3.018296241760254, 3.2145934104919434, 3.410890579223633, 3.607187509536743, 3.8034846782684326, 3.999781608581543, 4.196078777313232, 4.392375946044922, 4.588673114776611, 4.784970283508301, 4.981266975402832, 5.1775641441345215, 5.373861312866211, 5.5701584815979, 5.76645565032959, 5.962752819061279, 6.159049987792969, 6.3553466796875, 6.5516438484191895, 6.747941017150879, 6.944238185882568, 7.140535354614258, 7.336832046508789]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 12.0, 8.0, 10.0, 20.0, 25.0, 17.0, 35.0, 33.0, 32.0, 32.0, 38.0, 44.0, 39.0, 52.0, 35.0, 40.0, 55.0, 34.0, 36.0, 40.0, 24.0, 31.0, 47.0, 23.0, 31.0, 19.0, 25.0, 26.0, 17.0, 8.0, 11.0, 8.0, 14.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7738559246063232, -1.719215989112854, -1.6645760536193848, -1.609936237335205, -1.5552963018417358, -1.5006563663482666, -1.446016550064087, -1.3913766145706177, -1.3367366790771484, -1.2820967435836792, -1.22745680809021, -1.1728169918060303, -1.118177056312561, -1.0635371208190918, -1.008897304534912, -0.9542573690414429, -0.8996174335479736, -0.8449774980545044, -0.7903376221656799, -0.7356977462768555, -0.6810578107833862, -0.626417875289917, -0.5717779994010925, -0.5171381235122681, -0.46249818801879883, -0.407858282327652, -0.3532183766365051, -0.2985784709453583, -0.24393856525421143, -0.18929865956306458, -0.13465875387191772, -0.08001884818077087, -0.025378942489624023, 0.029260963201522827, 0.08390086889266968, 0.13854077458381653, 0.19318068027496338, 0.24782058596611023, 0.3024604916572571, 0.35710039734840393, 0.4117403030395508, 0.46638020873069763, 0.5210201144218445, 0.575659990310669, 0.6302999258041382, 0.6849398612976074, 0.7395797371864319, 0.7942196130752563, 0.8488595485687256, 0.9034994840621948, 0.9581393599510193, 1.0127792358398438, 1.067419171333313, 1.1220591068267822, 1.176698923110962, 1.2313388586044312, 1.2859787940979004, 1.3406187295913696, 1.3952586650848389, 1.4498984813690186, 1.5045384168624878, 1.559178352355957, 1.6138181686401367, 1.668458104133606, 1.7230980396270752]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 10.0, 11.0, 11.0, 11.0, 20.0, 23.0, 14.0, 24.0, 27.0, 34.0, 33.0, 32.0, 35.0, 41.0, 49.0, 52.0, 43.0, 52.0, 55.0, 48.0, 37.0, 24.0, 33.0, 36.0, 37.0, 29.0, 33.0, 21.0, 27.0, 16.0, 11.0, 17.0, 10.0, 6.0, 10.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.880828857421875, -1.80462646484375, -1.728424072265625, -1.6522216796875, -1.576019287109375, -1.49981689453125, -1.423614501953125, -1.347412109375, -1.271209716796875, -1.19500732421875, -1.118804931640625, -1.0426025390625, -0.966400146484375, -0.89019775390625, -0.813995361328125, -0.73779296875, -0.661590576171875, -0.58538818359375, -0.509185791015625, -0.4329833984375, -0.356781005859375, -0.28057861328125, -0.204376220703125, -0.128173828125, -0.051971435546875, 0.02423095703125, 0.100433349609375, 0.1766357421875, 0.252838134765625, 0.32904052734375, 0.405242919921875, 0.4814453125, 0.557647705078125, 0.63385009765625, 0.710052490234375, 0.7862548828125, 0.862457275390625, 0.93865966796875, 1.014862060546875, 1.091064453125, 1.167266845703125, 1.24346923828125, 1.319671630859375, 1.3958740234375, 1.472076416015625, 1.54827880859375, 1.624481201171875, 1.70068359375, 1.776885986328125, 1.85308837890625, 1.929290771484375, 2.0054931640625, 2.081695556640625, 2.15789794921875, 2.234100341796875, 2.310302734375, 2.386505126953125, 2.46270751953125, 2.538909912109375, 2.6151123046875, 2.691314697265625, 2.76751708984375, 2.843719482421875, 2.919921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 5.0, 5.0, 15.0, 22.0, 23.0, 37.0, 59.0, 93.0, 136.0, 215.0, 372.0, 601.0, 996.0, 1825.0, 3367.0, 6798.0, 16093.0, 47522.0, 177658.0, 504995.0, 202048.0, 52568.0, 17508.0, 7269.0, 3670.0, 1876.0, 1125.0, 605.0, 379.0, 234.0, 133.0, 103.0, 52.0, 51.0, 35.0, 23.0, 8.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.3515625, -10.99169921875, -10.6318359375, -10.27197265625, -9.912109375, -9.55224609375, -9.1923828125, -8.83251953125, -8.47265625, -8.11279296875, -7.7529296875, -7.39306640625, -7.033203125, -6.67333984375, -6.3134765625, -5.95361328125, -5.59375, -5.23388671875, -4.8740234375, -4.51416015625, -4.154296875, -3.79443359375, -3.4345703125, -3.07470703125, -2.71484375, -2.35498046875, -1.9951171875, -1.63525390625, -1.275390625, -0.91552734375, -0.5556640625, -0.19580078125, 0.1640625, 0.52392578125, 0.8837890625, 1.24365234375, 1.603515625, 1.96337890625, 2.3232421875, 2.68310546875, 3.04296875, 3.40283203125, 3.7626953125, 4.12255859375, 4.482421875, 4.84228515625, 5.2021484375, 5.56201171875, 5.921875, 6.28173828125, 6.6416015625, 7.00146484375, 7.361328125, 7.72119140625, 8.0810546875, 8.44091796875, 8.80078125, 9.16064453125, 9.5205078125, 9.88037109375, 10.240234375, 10.60009765625, 10.9599609375, 11.31982421875, 11.6796875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 2.0, 9.0, 8.0, 13.0, 12.0, 12.0, 24.0, 18.0, 33.0, 25.0, 30.0, 32.0, 43.0, 72.0, 69.0, 104.0, 142.0, 272.0, 1379.0, 181.0, 127.0, 76.0, 54.0, 50.0, 54.0, 47.0, 25.0, 22.0, 22.0, 23.0, 13.0, 10.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.671875, -9.3892822265625, -9.106689453125, -8.8240966796875, -8.54150390625, -8.2589111328125, -7.976318359375, -7.6937255859375, -7.4111328125, -7.1285400390625, -6.845947265625, -6.5633544921875, -6.28076171875, -5.9981689453125, -5.715576171875, -5.4329833984375, -5.150390625, -4.8677978515625, -4.585205078125, -4.3026123046875, -4.02001953125, -3.7374267578125, -3.454833984375, -3.1722412109375, -2.8896484375, -2.6070556640625, -2.324462890625, -2.0418701171875, -1.75927734375, -1.4766845703125, -1.194091796875, -0.9114990234375, -0.62890625, -0.3463134765625, -0.063720703125, 0.2188720703125, 0.50146484375, 0.7840576171875, 1.066650390625, 1.3492431640625, 1.6318359375, 1.9144287109375, 2.197021484375, 2.4796142578125, 2.76220703125, 3.0447998046875, 3.327392578125, 3.6099853515625, 3.892578125, 4.1751708984375, 4.457763671875, 4.7403564453125, 5.02294921875, 5.3055419921875, 5.588134765625, 5.8707275390625, 6.1533203125, 6.4359130859375, 6.718505859375, 7.0010986328125, 7.28369140625, 7.5662841796875, 7.848876953125, 8.1314697265625, 8.4140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 7.0, 8.0, 12.0, 12.0, 15.0, 22.0, 21.0, 24.0, 35.0, 53.0, 54.0, 99.0, 269.0, 863.0, 8522.0, 1078123.0, 2044017.0, 11825.0, 1000.0, 273.0, 131.0, 62.0, 49.0, 38.0, 26.0, 21.0, 22.0, 17.0, 14.0, 10.0, 11.0, 9.0, 7.0, 7.0, 4.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.625, -34.4775390625, -33.330078125, -32.1826171875, -31.03515625, -29.8876953125, -28.740234375, -27.5927734375, -26.4453125, -25.2978515625, -24.150390625, -23.0029296875, -21.85546875, -20.7080078125, -19.560546875, -18.4130859375, -17.265625, -16.1181640625, -14.970703125, -13.8232421875, -12.67578125, -11.5283203125, -10.380859375, -9.2333984375, -8.0859375, -6.9384765625, -5.791015625, -4.6435546875, -3.49609375, -2.3486328125, -1.201171875, -0.0537109375, 1.09375, 2.2412109375, 3.388671875, 4.5361328125, 5.68359375, 6.8310546875, 7.978515625, 9.1259765625, 10.2734375, 11.4208984375, 12.568359375, 13.7158203125, 14.86328125, 16.0107421875, 17.158203125, 18.3056640625, 19.453125, 20.6005859375, 21.748046875, 22.8955078125, 24.04296875, 25.1904296875, 26.337890625, 27.4853515625, 28.6328125, 29.7802734375, 30.927734375, 32.0751953125, 33.22265625, 34.3701171875, 35.517578125, 36.6650390625, 37.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 498.0, 510.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.7233657836914, -68.14322662353516, -60.563087463378906, -52.982948303222656, -45.402809143066406, -37.82266616821289, -30.24252700805664, -22.66238784790039, -15.08224868774414, -7.502109050750732, 0.07803058624267578, 7.658170700073242, 15.238309860229492, 22.818450927734375, 30.398590087890625, 37.978729248046875, 45.558868408203125, 53.139007568359375, 60.719146728515625, 68.29928588867188, 75.87942504882812, 83.45956420898438, 91.03970336914062, 98.61984252929688, 106.19998168945312, 113.78012084960938, 121.36026000976562, 128.94039916992188, 136.52053833007812, 144.10067749023438, 151.68081665039062, 159.26095581054688, 166.8411102294922, 174.42124938964844, 182.0013885498047, 189.58152770996094, 197.1616668701172, 204.74180603027344, 212.3219451904297, 219.90208435058594, 227.4822235107422, 235.06236267089844, 242.6425018310547, 250.22264099121094, 257.80279541015625, 265.3829345703125, 272.96307373046875, 280.543212890625, 288.12335205078125, 295.7034912109375, 303.28363037109375, 310.86376953125, 318.44390869140625, 326.0240478515625, 333.60418701171875, 341.184326171875, 348.76446533203125, 356.3446044921875, 363.92474365234375, 371.5048828125, 379.08502197265625, 386.6651611328125, 394.24530029296875, 401.825439453125, 409.40557861328125]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 8.0, 7.0, 16.0, 19.0, 17.0, 20.0, 14.0, 21.0, 31.0, 34.0, 29.0, 31.0, 27.0, 47.0, 30.0, 45.0, 34.0, 45.0, 50.0, 40.0, 44.0, 49.0, 38.0, 33.0, 37.0, 24.0, 30.0, 22.0, 23.0, 14.0, 19.0, 12.0, 13.0, 10.0, 7.0, 8.0, 11.0, 8.0, 2.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.11102294921875, -24.2674560546875, -23.423891067504883, -22.580324172973633, -21.736759185791016, -20.893192291259766, -20.049625396728516, -19.2060604095459, -18.36249351501465, -17.5189266204834, -16.67536163330078, -15.831794738769531, -14.988228797912598, -14.144662857055664, -13.30109691619873, -12.457530975341797, -11.613965034484863, -10.77039909362793, -9.926833152770996, -9.083267211914062, -8.239700317382812, -7.396134376525879, -6.552568435668945, -5.7090020179748535, -4.86543607711792, -4.021870136260986, -3.1783037185668945, -2.334737777709961, -1.4911715984344482, -0.6476054191589355, 0.19596052169799805, 1.0395269393920898, 1.8830928802490234, 2.726659059524536, 3.570225238800049, 4.413791179656982, 5.257357597351074, 6.100923538208008, 6.944489479064941, 7.788055896759033, 8.631622314453125, 9.475188255310059, 10.318754196166992, 11.162321090698242, 12.005887031555176, 12.84945297241211, 13.693018913269043, 14.536584854125977, 15.38015079498291, 16.223716735839844, 17.067283630371094, 17.91084861755371, 18.75441551208496, 19.597980499267578, 20.441547393798828, 21.285114288330078, 22.128679275512695, 22.972246170043945, 23.815811157226562, 24.659378051757812, 25.50294303894043, 26.34650993347168, 27.190074920654297, 28.033641815185547, 28.877208709716797]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 7.0, 8.0, 14.0, 14.0, 12.0, 21.0, 21.0, 24.0, 22.0, 39.0, 39.0, 47.0, 34.0, 44.0, 42.0, 53.0, 63.0, 57.0, 52.0, 37.0, 49.0, 25.0, 37.0, 30.0, 40.0, 24.0, 28.0, 25.0, 24.0, 13.0, 13.0, 9.0, 3.0, 9.0, 7.0, 4.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.101165771484375, -2.01092529296875, -1.920684814453125, -1.8304443359375, -1.740203857421875, -1.64996337890625, -1.559722900390625, -1.469482421875, -1.379241943359375, -1.28900146484375, -1.198760986328125, -1.1085205078125, -1.018280029296875, -0.92803955078125, -0.837799072265625, -0.74755859375, -0.657318115234375, -0.56707763671875, -0.476837158203125, -0.3865966796875, -0.296356201171875, -0.20611572265625, -0.115875244140625, -0.025634765625, 0.064605712890625, 0.15484619140625, 0.245086669921875, 0.3353271484375, 0.425567626953125, 0.51580810546875, 0.606048583984375, 0.6962890625, 0.786529541015625, 0.87677001953125, 0.967010498046875, 1.0572509765625, 1.147491455078125, 1.23773193359375, 1.327972412109375, 1.418212890625, 1.508453369140625, 1.59869384765625, 1.688934326171875, 1.7791748046875, 1.869415283203125, 1.95965576171875, 2.049896240234375, 2.14013671875, 2.230377197265625, 2.32061767578125, 2.410858154296875, 2.5010986328125, 2.591339111328125, 2.68157958984375, 2.771820068359375, 2.862060546875, 2.952301025390625, 3.04254150390625, 3.132781982421875, 3.2230224609375, 3.313262939453125, 3.40350341796875, 3.493743896484375, 3.583984375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 15.0, 25.0, 45.0, 62.0, 90.0, 154.0, 203.0, 395.0, 775.0, 1509.0, 3985.0, 11739.0, 42574.0, 213823.0, 2628633.0, 1138855.0, 112331.0, 26033.0, 7573.0, 2777.0, 1157.0, 582.0, 335.0, 213.0, 134.0, 89.0, 51.0, 35.0, 28.0, 17.0, 13.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.09375, -10.7218017578125, -10.349853515625, -9.9779052734375, -9.60595703125, -9.2340087890625, -8.862060546875, -8.4901123046875, -8.1181640625, -7.7462158203125, -7.374267578125, -7.0023193359375, -6.63037109375, -6.2584228515625, -5.886474609375, -5.5145263671875, -5.142578125, -4.7706298828125, -4.398681640625, -4.0267333984375, -3.65478515625, -3.2828369140625, -2.910888671875, -2.5389404296875, -2.1669921875, -1.7950439453125, -1.423095703125, -1.0511474609375, -0.67919921875, -0.3072509765625, 0.064697265625, 0.4366455078125, 0.80859375, 1.1805419921875, 1.552490234375, 1.9244384765625, 2.29638671875, 2.6683349609375, 3.040283203125, 3.4122314453125, 3.7841796875, 4.1561279296875, 4.528076171875, 4.9000244140625, 5.27197265625, 5.6439208984375, 6.015869140625, 6.3878173828125, 6.759765625, 7.1317138671875, 7.503662109375, 7.8756103515625, 8.24755859375, 8.6195068359375, 8.991455078125, 9.3634033203125, 9.7353515625, 10.1072998046875, 10.479248046875, 10.8511962890625, 11.22314453125, 11.5950927734375, 11.967041015625, 12.3389892578125, 12.7109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 8.0, 21.0, 41.0, 99.0, 149.0, 315.0, 644.0, 1143.0, 794.0, 421.0, 215.0, 101.0, 65.0, 26.0, 16.0, 4.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -9.797119140625, -9.17236328125, -8.547607421875, -7.9228515625, -7.298095703125, -6.67333984375, -6.048583984375, -5.423828125, -4.799072265625, -4.17431640625, -3.549560546875, -2.9248046875, -2.300048828125, -1.67529296875, -1.050537109375, -0.42578125, 0.198974609375, 0.82373046875, 1.448486328125, 2.0732421875, 2.697998046875, 3.32275390625, 3.947509765625, 4.572265625, 5.197021484375, 5.82177734375, 6.446533203125, 7.0712890625, 7.696044921875, 8.32080078125, 8.945556640625, 9.5703125, 10.195068359375, 10.81982421875, 11.444580078125, 12.0693359375, 12.694091796875, 13.31884765625, 13.943603515625, 14.568359375, 15.193115234375, 15.81787109375, 16.442626953125, 17.0673828125, 17.692138671875, 18.31689453125, 18.941650390625, 19.56640625, 20.191162109375, 20.81591796875, 21.440673828125, 22.0654296875, 22.690185546875, 23.31494140625, 23.939697265625, 24.564453125, 25.189208984375, 25.81396484375, 26.438720703125, 27.0634765625, 27.688232421875, 28.31298828125, 28.937744140625, 29.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 12.0, 12.0, 5.0, 12.0, 28.0, 45.0, 68.0, 69.0, 138.0, 243.0, 635.0, 2606.0, 30477.0, 2592564.0, 1541468.0, 22778.0, 2096.0, 523.0, 182.0, 110.0, 64.0, 38.0, 29.0, 20.0, 25.0, 13.0, 10.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.8125, -38.33544921875, -36.8583984375, -35.38134765625, -33.904296875, -32.42724609375, -30.9501953125, -29.47314453125, -27.99609375, -26.51904296875, -25.0419921875, -23.56494140625, -22.087890625, -20.61083984375, -19.1337890625, -17.65673828125, -16.1796875, -14.70263671875, -13.2255859375, -11.74853515625, -10.271484375, -8.79443359375, -7.3173828125, -5.84033203125, -4.36328125, -2.88623046875, -1.4091796875, 0.06787109375, 1.544921875, 3.02197265625, 4.4990234375, 5.97607421875, 7.453125, 8.93017578125, 10.4072265625, 11.88427734375, 13.361328125, 14.83837890625, 16.3154296875, 17.79248046875, 19.26953125, 20.74658203125, 22.2236328125, 23.70068359375, 25.177734375, 26.65478515625, 28.1318359375, 29.60888671875, 31.0859375, 32.56298828125, 34.0400390625, 35.51708984375, 36.994140625, 38.47119140625, 39.9482421875, 41.42529296875, 42.90234375, 44.37939453125, 45.8564453125, 47.33349609375, 48.810546875, 50.28759765625, 51.7646484375, 53.24169921875, 54.71875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [9.0, 99.0, 500.0, 361.0, 46.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.929244995117188, -12.961709022521973, -5.994173049926758, 0.9733619689941406, 7.940898895263672, 14.908435821533203, 21.87596893310547, 28.843505859375, 35.81104278564453, 42.77857971191406, 49.746116638183594, 56.71364974975586, 63.68118667602539, 70.64872741699219, 77.61625671386719, 84.58379364013672, 91.55133056640625, 98.51886749267578, 105.48640441894531, 112.45393371582031, 119.42147827148438, 126.38900756835938, 133.35653686523438, 140.32408142089844, 147.2916259765625, 154.2591552734375, 161.22669982910156, 168.19422912597656, 175.16177368164062, 182.12930297851562, 189.09683227539062, 196.0643768310547, 203.03189086914062, 209.99942016601562, 216.9669647216797, 223.9344940185547, 230.90203857421875, 237.86956787109375, 244.83709716796875, 251.8046417236328, 258.7721862792969, 265.7397155761719, 272.7072448730469, 279.6748046875, 286.642333984375, 293.60986328125, 300.577392578125, 307.544921875, 314.512451171875, 321.47998046875, 328.447509765625, 335.4150695800781, 342.3825988769531, 349.3501281738281, 356.3176574707031, 363.28521728515625, 370.25274658203125, 377.22027587890625, 384.18780517578125, 391.1553649902344, 398.1228942871094, 405.0904235839844, 412.0579528808594, 419.0255126953125, 425.9930419921875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 13.0, 9.0, 10.0, 11.0, 15.0, 15.0, 19.0, 18.0, 29.0, 20.0, 28.0, 31.0, 31.0, 26.0, 31.0, 36.0, 43.0, 22.0, 48.0, 48.0, 36.0, 42.0, 41.0, 41.0, 43.0, 35.0, 30.0, 28.0, 31.0, 29.0, 28.0, 16.0, 13.0, 18.0, 8.0, 11.0, 8.0, 7.0, 5.0, 2.0, 1.0, 8.0, 2.0, 0.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.342430114746094, -25.440038681030273, -24.537647247314453, -23.635255813598633, -22.732864379882812, -21.830474853515625, -20.928083419799805, -20.025691986083984, -19.123300552368164, -18.220909118652344, -17.318517684936523, -16.416126251220703, -15.5137357711792, -14.611344337463379, -13.708953857421875, -12.806562423706055, -11.904170989990234, -11.001779556274414, -10.099388122558594, -9.19699764251709, -8.29460620880127, -7.392214775085449, -6.489823818206787, -5.587432861328125, -4.685041427612305, -3.7826502323150635, -2.8802590370178223, -1.977867841720581, -1.0754766464233398, -0.17308521270751953, 0.7293057441711426, 1.6316967010498047, 2.534090042114258, 3.436481237411499, 4.33887243270874, 5.241263389587402, 6.143654823303223, 7.046046257019043, 7.948437213897705, 8.850828170776367, 9.753219604492188, 10.655611038208008, 11.558002471923828, 12.460392951965332, 13.362784385681152, 14.265175819396973, 15.167566299438477, 16.069957733154297, 16.972349166870117, 17.874740600585938, 18.777132034301758, 19.679523468017578, 20.581912994384766, 21.48430633544922, 22.386695861816406, 23.289087295532227, 24.191478729248047, 25.093870162963867, 25.996261596679688, 26.898653030395508, 27.801044464111328, 28.703433990478516, 29.605825424194336, 30.508216857910156, 31.410608291625977]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 11.0, 5.0, 11.0, 13.0, 13.0, 17.0, 20.0, 21.0, 20.0, 30.0, 31.0, 31.0, 28.0, 45.0, 39.0, 33.0, 44.0, 43.0, 49.0, 51.0, 30.0, 40.0, 40.0, 26.0, 34.0, 29.0, 32.0, 30.0, 20.0, 20.0, 28.0, 20.0, 12.0, 14.0, 17.0, 10.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.498046875, -2.420318603515625, -2.34259033203125, -2.264862060546875, -2.1871337890625, -2.109405517578125, -2.03167724609375, -1.953948974609375, -1.876220703125, -1.798492431640625, -1.72076416015625, -1.643035888671875, -1.5653076171875, -1.487579345703125, -1.40985107421875, -1.332122802734375, -1.25439453125, -1.176666259765625, -1.09893798828125, -1.021209716796875, -0.9434814453125, -0.865753173828125, -0.78802490234375, -0.710296630859375, -0.632568359375, -0.554840087890625, -0.47711181640625, -0.399383544921875, -0.3216552734375, -0.243927001953125, -0.16619873046875, -0.088470458984375, -0.0107421875, 0.066986083984375, 0.14471435546875, 0.222442626953125, 0.3001708984375, 0.377899169921875, 0.45562744140625, 0.533355712890625, 0.611083984375, 0.688812255859375, 0.76654052734375, 0.844268798828125, 0.9219970703125, 0.999725341796875, 1.07745361328125, 1.155181884765625, 1.23291015625, 1.310638427734375, 1.38836669921875, 1.466094970703125, 1.5438232421875, 1.621551513671875, 1.69927978515625, 1.777008056640625, 1.854736328125, 1.932464599609375, 2.01019287109375, 2.087921142578125, 2.1656494140625, 2.243377685546875, 2.32110595703125, 2.398834228515625, 2.4765625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 12.0, 17.0, 27.0, 27.0, 62.0, 80.0, 113.0, 201.0, 274.0, 480.0, 716.0, 1059.0, 1566.0, 2351.0, 3685.0, 5290.0, 8185.0, 11996.0, 18249.0, 26951.0, 38445.0, 54546.0, 75197.0, 95909.0, 114203.0, 124284.0, 115346.0, 96993.0, 75390.0, 55284.0, 39436.0, 27119.0, 18297.0, 12340.0, 8199.0, 5472.0, 3625.0, 2472.0, 1540.0, 1068.0, 694.0, 441.0, 288.0, 220.0, 147.0, 89.0, 59.0, 46.0, 28.0, 15.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.041015625, -1.97625732421875, -1.9114990234375, -1.84674072265625, -1.781982421875, -1.71722412109375, -1.6524658203125, -1.58770751953125, -1.52294921875, -1.45819091796875, -1.3934326171875, -1.32867431640625, -1.263916015625, -1.19915771484375, -1.1343994140625, -1.06964111328125, -1.0048828125, -0.94012451171875, -0.8753662109375, -0.81060791015625, -0.745849609375, -0.68109130859375, -0.6163330078125, -0.55157470703125, -0.48681640625, -0.42205810546875, -0.3572998046875, -0.29254150390625, -0.227783203125, -0.16302490234375, -0.0982666015625, -0.03350830078125, 0.03125, 0.09600830078125, 0.1607666015625, 0.22552490234375, 0.290283203125, 0.35504150390625, 0.4197998046875, 0.48455810546875, 0.54931640625, 0.61407470703125, 0.6788330078125, 0.74359130859375, 0.808349609375, 0.87310791015625, 0.9378662109375, 1.00262451171875, 1.0673828125, 1.13214111328125, 1.1968994140625, 1.26165771484375, 1.326416015625, 1.39117431640625, 1.4559326171875, 1.52069091796875, 1.58544921875, 1.65020751953125, 1.7149658203125, 1.77972412109375, 1.844482421875, 1.90924072265625, 1.9739990234375, 2.03875732421875, 2.103515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 3.0, 7.0, 4.0, 10.0, 14.0, 19.0, 16.0, 24.0, 23.0, 25.0, 29.0, 32.0, 43.0, 43.0, 37.0, 46.0, 50.0, 38.0, 42.0, 1071.0, 28.0, 59.0, 42.0, 37.0, 37.0, 27.0, 35.0, 27.0, 25.0, 21.0, 22.0, 8.0, 15.0, 11.0, 5.0, 10.0, 9.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.88671875, -2.7879638671875, -2.689208984375, -2.5904541015625, -2.49169921875, -2.3929443359375, -2.294189453125, -2.1954345703125, -2.0966796875, -1.9979248046875, -1.899169921875, -1.8004150390625, -1.70166015625, -1.6029052734375, -1.504150390625, -1.4053955078125, -1.306640625, -1.2078857421875, -1.109130859375, -1.0103759765625, -0.91162109375, -0.8128662109375, -0.714111328125, -0.6153564453125, -0.5166015625, -0.4178466796875, -0.319091796875, -0.2203369140625, -0.12158203125, -0.0228271484375, 0.075927734375, 0.1746826171875, 0.2734375, 0.3721923828125, 0.470947265625, 0.5697021484375, 0.66845703125, 0.7672119140625, 0.865966796875, 0.9647216796875, 1.0634765625, 1.1622314453125, 1.260986328125, 1.3597412109375, 1.45849609375, 1.5572509765625, 1.656005859375, 1.7547607421875, 1.853515625, 1.9522705078125, 2.051025390625, 2.1497802734375, 2.24853515625, 2.3472900390625, 2.446044921875, 2.5447998046875, 2.6435546875, 2.7423095703125, 2.841064453125, 2.9398193359375, 3.03857421875, 3.1373291015625, 3.236083984375, 3.3348388671875, 3.43359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 12.0, 17.0, 10.0, 17.0, 28.0, 49.0, 51.0, 60.0, 65.0, 123.0, 145.0, 169.0, 301.0, 416.0, 657.0, 1100.0, 2061.0, 4127.0, 8608.0, 19976.0, 53844.0, 1185496.0, 731366.0, 51830.0, 19053.0, 8291.0, 3895.0, 2059.0, 1073.0, 694.0, 430.0, 313.0, 222.0, 149.0, 102.0, 97.0, 36.0, 42.0, 32.0, 23.0, 21.0, 11.0, 9.0, 7.0, 11.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-9.09375, -8.84100341796875, -8.5882568359375, -8.33551025390625, -8.082763671875, -7.83001708984375, -7.5772705078125, -7.32452392578125, -7.07177734375, -6.81903076171875, -6.5662841796875, -6.31353759765625, -6.060791015625, -5.80804443359375, -5.5552978515625, -5.30255126953125, -5.0498046875, -4.79705810546875, -4.5443115234375, -4.29156494140625, -4.038818359375, -3.78607177734375, -3.5333251953125, -3.28057861328125, -3.02783203125, -2.77508544921875, -2.5223388671875, -2.26959228515625, -2.016845703125, -1.76409912109375, -1.5113525390625, -1.25860595703125, -1.005859375, -0.75311279296875, -0.5003662109375, -0.24761962890625, 0.005126953125, 0.25787353515625, 0.5106201171875, 0.76336669921875, 1.01611328125, 1.26885986328125, 1.5216064453125, 1.77435302734375, 2.027099609375, 2.27984619140625, 2.5325927734375, 2.78533935546875, 3.0380859375, 3.29083251953125, 3.5435791015625, 3.79632568359375, 4.049072265625, 4.30181884765625, 4.5545654296875, 4.80731201171875, 5.06005859375, 5.31280517578125, 5.5655517578125, 5.81829833984375, 6.071044921875, 6.32379150390625, 6.5765380859375, 6.82928466796875, 7.08203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 8.0, 10.0, 8.0, 6.0, 7.0, 11.0, 13.0, 20.0, 27.0, 24.0, 49.0, 62.0, 65.0, 102.0, 100.0, 90.0, 90.0, 64.0, 56.0, 37.0, 24.0, 20.0, 14.0, 13.0, 9.0, 9.0, 8.0, 2.0, 10.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.306640625, -1.2656707763671875, -1.224700927734375, -1.1837310791015625, -1.14276123046875, -1.1017913818359375, -1.060821533203125, -1.0198516845703125, -0.9788818359375, -0.9379119873046875, -0.896942138671875, -0.8559722900390625, -0.81500244140625, -0.7740325927734375, -0.733062744140625, -0.6920928955078125, -0.651123046875, -0.6101531982421875, -0.569183349609375, -0.5282135009765625, -0.48724365234375, -0.4462738037109375, -0.405303955078125, -0.3643341064453125, -0.3233642578125, -0.2823944091796875, -0.241424560546875, -0.2004547119140625, -0.15948486328125, -0.1185150146484375, -0.077545166015625, -0.0365753173828125, 0.00439453125, 0.0453643798828125, 0.086334228515625, 0.1273040771484375, 0.16827392578125, 0.2092437744140625, 0.250213623046875, 0.2911834716796875, 0.3321533203125, 0.3731231689453125, 0.414093017578125, 0.4550628662109375, 0.49603271484375, 0.5370025634765625, 0.577972412109375, 0.6189422607421875, 0.659912109375, 0.7008819580078125, 0.741851806640625, 0.7828216552734375, 0.82379150390625, 0.8647613525390625, 0.905731201171875, 0.9467010498046875, 0.9876708984375, 1.0286407470703125, 1.069610595703125, 1.1105804443359375, 1.15155029296875, 1.1925201416015625, 1.233489990234375, 1.2744598388671875, 1.3154296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 5.0, 11.0, 10.0, 7.0, 11.0, 18.0, 19.0, 20.0, 27.0, 18.0, 20.0, 45.0, 40.0, 52.0, 79.0, 112.0, 179.0, 337.0, 828.0, 8251.0, 840578.0, 191895.0, 4497.0, 602.0, 293.0, 152.0, 90.0, 72.0, 45.0, 36.0, 33.0, 25.0, 17.0, 26.0, 15.0, 11.0, 8.0, 14.0, 12.0, 12.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.40625, -20.73486328125, -20.0634765625, -19.39208984375, -18.720703125, -18.04931640625, -17.3779296875, -16.70654296875, -16.03515625, -15.36376953125, -14.6923828125, -14.02099609375, -13.349609375, -12.67822265625, -12.0068359375, -11.33544921875, -10.6640625, -9.99267578125, -9.3212890625, -8.64990234375, -7.978515625, -7.30712890625, -6.6357421875, -5.96435546875, -5.29296875, -4.62158203125, -3.9501953125, -3.27880859375, -2.607421875, -1.93603515625, -1.2646484375, -0.59326171875, 0.078125, 0.74951171875, 1.4208984375, 2.09228515625, 2.763671875, 3.43505859375, 4.1064453125, 4.77783203125, 5.44921875, 6.12060546875, 6.7919921875, 7.46337890625, 8.134765625, 8.80615234375, 9.4775390625, 10.14892578125, 10.8203125, 11.49169921875, 12.1630859375, 12.83447265625, 13.505859375, 14.17724609375, 14.8486328125, 15.52001953125, 16.19140625, 16.86279296875, 17.5341796875, 18.20556640625, 18.876953125, 19.54833984375, 20.2197265625, 20.89111328125, 21.5625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 22.0, 92.0, 331.0, 445.0, 80.0, 21.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.939538955688477, -7.224195957183838, -6.508852958679199, -5.793509483337402, -5.078166484832764, -4.362823486328125, -3.647480010986328, -2.9321370124816895, -2.216794013977051, -1.5014508962631226, -0.7861077785491943, -0.07076454162597656, 0.6445784568786621, 1.3599214553833008, 2.0752649307250977, 2.7906079292297363, 3.505950927734375, 4.221293926239014, 4.936636924743652, 5.651980400085449, 6.367323398590088, 7.082666397094727, 7.798009872436523, 8.51335334777832, 9.2286958694458, 9.944039344787598, 10.659381866455078, 11.374725341796875, 12.090068817138672, 12.805411338806152, 13.52075481414795, 14.23609733581543, 14.951438903808594, 15.66678237915039, 16.382125854492188, 17.097469329833984, 17.81281089782715, 18.528154373168945, 19.243497848510742, 19.95884132385254, 20.674182891845703, 21.3895263671875, 22.104869842529297, 22.820213317871094, 23.535554885864258, 24.250898361206055, 24.96624183654785, 25.68158531188965, 26.396928787231445, 27.112272262573242, 27.82761573791504, 28.542957305908203, 29.25830078125, 29.973644256591797, 30.688987731933594, 31.40433120727539, 32.11967468261719, 32.835018157958984, 33.55036163330078, 34.26570510864258, 34.981048583984375, 35.696388244628906, 36.41173553466797, 37.1270751953125, 37.8424186706543]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 14.0, 5.0, 10.0, 6.0, 17.0, 25.0, 25.0, 30.0, 25.0, 40.0, 40.0, 43.0, 46.0, 46.0, 60.0, 37.0, 45.0, 45.0, 49.0, 33.0, 46.0, 37.0, 44.0, 25.0, 31.0, 36.0, 22.0, 31.0, 13.0, 12.0, 9.0, 14.0, 5.0, 10.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0843329429626465, -3.943326950073242, -3.802320718765259, -3.6613147258758545, -3.520308494567871, -3.379302501678467, -3.2382965087890625, -3.097290515899658, -2.956284284591675, -2.8152782917022705, -2.674272060394287, -2.533266067504883, -2.3922600746154785, -2.251253843307495, -2.110247850418091, -1.969241738319397, -1.8282356262207031, -1.6872295141220093, -1.5462234020233154, -1.4052174091339111, -1.2642112970352173, -1.1232051849365234, -0.9821991324424744, -0.8411930799484253, -0.7001869678497314, -0.5591808557510376, -0.4181748032569885, -0.27716872096061707, -0.1361626386642456, 0.004843473434448242, 0.14584952592849731, 0.2868555784225464, 0.42786216735839844, 0.5688682794570923, 0.7098743319511414, 0.8508803844451904, 0.9918864965438843, 1.1328926086425781, 1.2738986015319824, 1.4149047136306763, 1.5559108257293701, 1.696916937828064, 1.8379230499267578, 1.978929042816162, 2.1199350357055664, 2.26094126701355, 2.401947259902954, 2.5429534912109375, 2.683959484100342, 2.824965476989746, 2.9659717082977295, 3.106977701187134, 3.247983932495117, 3.3889899253845215, 3.529995918273926, 3.67100191116333, 3.8120081424713135, 3.9530141353607178, 4.094020366668701, 4.2350263595581055, 4.37603235244751, 4.517038345336914, 4.658044815063477, 4.799050807952881, 4.940056800842285]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 10.0, 10.0, 13.0, 16.0, 8.0, 17.0, 23.0, 25.0, 25.0, 31.0, 37.0, 22.0, 42.0, 45.0, 45.0, 27.0, 47.0, 54.0, 46.0, 45.0, 35.0, 38.0, 33.0, 29.0, 34.0, 33.0, 26.0, 19.0, 31.0, 17.0, 22.0, 13.0, 15.0, 12.0, 8.0, 15.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.533203125, -2.4522705078125, -2.371337890625, -2.2904052734375, -2.20947265625, -2.1285400390625, -2.047607421875, -1.9666748046875, -1.8857421875, -1.8048095703125, -1.723876953125, -1.6429443359375, -1.56201171875, -1.4810791015625, -1.400146484375, -1.3192138671875, -1.23828125, -1.1573486328125, -1.076416015625, -0.9954833984375, -0.91455078125, -0.8336181640625, -0.752685546875, -0.6717529296875, -0.5908203125, -0.5098876953125, -0.428955078125, -0.3480224609375, -0.26708984375, -0.1861572265625, -0.105224609375, -0.0242919921875, 0.056640625, 0.1375732421875, 0.218505859375, 0.2994384765625, 0.38037109375, 0.4613037109375, 0.542236328125, 0.6231689453125, 0.7041015625, 0.7850341796875, 0.865966796875, 0.9468994140625, 1.02783203125, 1.1087646484375, 1.189697265625, 1.2706298828125, 1.3515625, 1.4324951171875, 1.513427734375, 1.5943603515625, 1.67529296875, 1.7562255859375, 1.837158203125, 1.9180908203125, 1.9990234375, 2.0799560546875, 2.160888671875, 2.2418212890625, 2.32275390625, 2.4036865234375, 2.484619140625, 2.5655517578125, 2.646484375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 6.0, 8.0, 12.0, 9.0, 16.0, 18.0, 21.0, 26.0, 41.0, 65.0, 88.0, 109.0, 178.0, 235.0, 378.0, 559.0, 794.0, 1316.0, 2091.0, 3702.0, 6673.0, 12748.0, 27750.0, 62954.0, 150788.0, 294797.0, 262540.0, 121757.0, 51095.0, 22659.0, 10995.0, 5589.0, 3177.0, 1934.0, 1115.0, 705.0, 476.0, 331.0, 213.0, 165.0, 124.0, 94.0, 59.0, 42.0, 24.0, 21.0, 12.0, 20.0, 14.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0], "bins": [-3.9140625, -3.79852294921875, -3.6829833984375, -3.56744384765625, -3.451904296875, -3.33636474609375, -3.2208251953125, -3.10528564453125, -2.98974609375, -2.87420654296875, -2.7586669921875, -2.64312744140625, -2.527587890625, -2.41204833984375, -2.2965087890625, -2.18096923828125, -2.0654296875, -1.94989013671875, -1.8343505859375, -1.71881103515625, -1.603271484375, -1.48773193359375, -1.3721923828125, -1.25665283203125, -1.14111328125, -1.02557373046875, -0.9100341796875, -0.79449462890625, -0.678955078125, -0.56341552734375, -0.4478759765625, -0.33233642578125, -0.216796875, -0.10125732421875, 0.0142822265625, 0.12982177734375, 0.245361328125, 0.36090087890625, 0.4764404296875, 0.59197998046875, 0.70751953125, 0.82305908203125, 0.9385986328125, 1.05413818359375, 1.169677734375, 1.28521728515625, 1.4007568359375, 1.51629638671875, 1.6318359375, 1.74737548828125, 1.8629150390625, 1.97845458984375, 2.093994140625, 2.20953369140625, 2.3250732421875, 2.44061279296875, 2.55615234375, 2.67169189453125, 2.7872314453125, 2.90277099609375, 3.018310546875, 3.13385009765625, 3.2493896484375, 3.36492919921875, 3.48046875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 5.0, 2.0, 6.0, 13.0, 18.0, 21.0, 12.0, 19.0, 15.0, 16.0, 32.0, 30.0, 27.0, 30.0, 55.0, 43.0, 60.0, 83.0, 130.0, 244.0, 1374.0, 207.0, 128.0, 73.0, 63.0, 50.0, 43.0, 38.0, 31.0, 26.0, 14.0, 18.0, 30.0, 9.0, 16.0, 9.0, 16.0, 8.0, 3.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.125, -8.8427734375, -8.560546875, -8.2783203125, -7.99609375, -7.7138671875, -7.431640625, -7.1494140625, -6.8671875, -6.5849609375, -6.302734375, -6.0205078125, -5.73828125, -5.4560546875, -5.173828125, -4.8916015625, -4.609375, -4.3271484375, -4.044921875, -3.7626953125, -3.48046875, -3.1982421875, -2.916015625, -2.6337890625, -2.3515625, -2.0693359375, -1.787109375, -1.5048828125, -1.22265625, -0.9404296875, -0.658203125, -0.3759765625, -0.09375, 0.1884765625, 0.470703125, 0.7529296875, 1.03515625, 1.3173828125, 1.599609375, 1.8818359375, 2.1640625, 2.4462890625, 2.728515625, 3.0107421875, 3.29296875, 3.5751953125, 3.857421875, 4.1396484375, 4.421875, 4.7041015625, 4.986328125, 5.2685546875, 5.55078125, 5.8330078125, 6.115234375, 6.3974609375, 6.6796875, 6.9619140625, 7.244140625, 7.5263671875, 7.80859375, 8.0908203125, 8.373046875, 8.6552734375, 8.9375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 6.0, 16.0, 11.0, 22.0, 15.0, 21.0, 31.0, 40.0, 50.0, 76.0, 172.0, 334.0, 820.0, 2664.0, 11696.0, 83716.0, 2034666.0, 952971.0, 47311.0, 7693.0, 2019.0, 626.0, 265.0, 136.0, 61.0, 56.0, 35.0, 21.0, 27.0, 12.0, 17.0, 12.0, 16.0, 14.0, 10.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.890625, -15.39208984375, -14.8935546875, -14.39501953125, -13.896484375, -13.39794921875, -12.8994140625, -12.40087890625, -11.90234375, -11.40380859375, -10.9052734375, -10.40673828125, -9.908203125, -9.40966796875, -8.9111328125, -8.41259765625, -7.9140625, -7.41552734375, -6.9169921875, -6.41845703125, -5.919921875, -5.42138671875, -4.9228515625, -4.42431640625, -3.92578125, -3.42724609375, -2.9287109375, -2.43017578125, -1.931640625, -1.43310546875, -0.9345703125, -0.43603515625, 0.0625, 0.56103515625, 1.0595703125, 1.55810546875, 2.056640625, 2.55517578125, 3.0537109375, 3.55224609375, 4.05078125, 4.54931640625, 5.0478515625, 5.54638671875, 6.044921875, 6.54345703125, 7.0419921875, 7.54052734375, 8.0390625, 8.53759765625, 9.0361328125, 9.53466796875, 10.033203125, 10.53173828125, 11.0302734375, 11.52880859375, 12.02734375, 12.52587890625, 13.0244140625, 13.52294921875, 14.021484375, 14.52001953125, 15.0185546875, 15.51708984375, 16.015625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 8.0, 424.0, 577.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.516944885253906, -12.425996780395508, -6.335047721862793, -0.24409866333007812, 5.84684944152832, 11.937797546386719, 18.02874755859375, 24.119693756103516, 30.210643768310547, 36.30159378051758, 42.392539978027344, 48.483489990234375, 54.574440002441406, 60.66538619995117, 66.75633239746094, 72.84728240966797, 78.938232421875, 85.02918243408203, 91.12013244628906, 97.21107482910156, 103.3020248413086, 109.39297485351562, 115.48392486572266, 121.57487487792969, 127.66581726074219, 133.7567596435547, 139.84771728515625, 145.93865966796875, 152.0296173095703, 158.1205596923828, 164.21151733398438, 170.30245971679688, 176.39341735839844, 182.48435974121094, 188.5753173828125, 194.666259765625, 200.75721740722656, 206.84815979003906, 212.93911743164062, 219.03005981445312, 225.12100219726562, 231.21194458007812, 237.3029022216797, 243.3938446044922, 249.48480224609375, 255.57574462890625, 261.66668701171875, 267.75762939453125, 273.8486022949219, 279.9395446777344, 286.0304870605469, 292.1214599609375, 298.21240234375, 304.3033447265625, 310.394287109375, 316.4852294921875, 322.576171875, 328.6671142578125, 334.758056640625, 340.8490295410156, 346.9399719238281, 353.0309143066406, 359.1218566894531, 365.2127990722656, 371.30377197265625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 5.0, 11.0, 5.0, 12.0, 10.0, 12.0, 14.0, 14.0, 30.0, 29.0, 20.0, 24.0, 39.0, 32.0, 28.0, 35.0, 31.0, 34.0, 29.0, 38.0, 42.0, 30.0, 32.0, 34.0, 40.0, 44.0, 31.0, 36.0, 23.0, 26.0, 25.0, 28.0, 17.0, 29.0, 23.0, 13.0, 11.0, 10.0, 6.0, 8.0, 5.0, 5.0, 7.0, 2.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.158645629882812, -25.31238555908203, -24.46612548828125, -23.61986541748047, -22.773605346679688, -21.927345275878906, -21.081085205078125, -20.234827041625977, -19.388566970825195, -18.542306900024414, -17.696046829223633, -16.84978675842285, -16.00352668762207, -15.157267570495605, -14.311007499694824, -13.46474838256836, -12.618487358093262, -11.77222728729248, -10.9259672164917, -10.079708099365234, -9.233448028564453, -8.387187957763672, -7.540927886962891, -6.694668292999268, -5.848408222198486, -5.002148151397705, -4.155888557434082, -3.309628486633301, -2.4633686542510986, -1.6171088218688965, -0.7708487510681152, 0.07541084289550781, 0.9216709136962891, 1.7679307460784912, 2.6141905784606934, 3.4604506492614746, 4.306710243225098, 5.152970314025879, 5.99923038482666, 6.845489978790283, 7.6917500495910645, 8.538009643554688, 9.384269714355469, 10.23052978515625, 11.076789855957031, 11.923049926757812, 12.769309997558594, 13.615569114685059, 14.46182918548584, 15.308089256286621, 16.154348373413086, 17.000608444213867, 17.84686851501465, 18.69312858581543, 19.53938865661621, 20.385648727416992, 21.231908798217773, 22.078168869018555, 22.924428939819336, 23.770689010620117, 24.6169490814209, 25.463207244873047, 26.309467315673828, 27.15572738647461, 28.00198745727539]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 10.0, 19.0, 15.0, 17.0, 28.0, 21.0, 21.0, 26.0, 32.0, 37.0, 41.0, 51.0, 38.0, 34.0, 37.0, 50.0, 40.0, 40.0, 35.0, 50.0, 37.0, 39.0, 26.0, 28.0, 23.0, 26.0, 27.0, 21.0, 20.0, 19.0, 13.0, 11.0, 16.0, 4.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.78125, -2.695404052734375, -2.60955810546875, -2.523712158203125, -2.4378662109375, -2.352020263671875, -2.26617431640625, -2.180328369140625, -2.094482421875, -2.008636474609375, -1.92279052734375, -1.836944580078125, -1.7510986328125, -1.665252685546875, -1.57940673828125, -1.493560791015625, -1.40771484375, -1.321868896484375, -1.23602294921875, -1.150177001953125, -1.0643310546875, -0.978485107421875, -0.89263916015625, -0.806793212890625, -0.720947265625, -0.635101318359375, -0.54925537109375, -0.463409423828125, -0.3775634765625, -0.291717529296875, -0.20587158203125, -0.120025634765625, -0.0341796875, 0.051666259765625, 0.13751220703125, 0.223358154296875, 0.3092041015625, 0.395050048828125, 0.48089599609375, 0.566741943359375, 0.652587890625, 0.738433837890625, 0.82427978515625, 0.910125732421875, 0.9959716796875, 1.081817626953125, 1.16766357421875, 1.253509521484375, 1.33935546875, 1.425201416015625, 1.51104736328125, 1.596893310546875, 1.6827392578125, 1.768585205078125, 1.85443115234375, 1.940277099609375, 2.026123046875, 2.111968994140625, 2.19781494140625, 2.283660888671875, 2.3695068359375, 2.455352783203125, 2.54119873046875, 2.627044677734375, 2.712890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 10.0, 15.0, 7.0, 17.0, 38.0, 33.0, 29.0, 48.0, 43.0, 60.0, 94.0, 132.0, 204.0, 421.0, 1023.0, 2772.0, 9518.0, 38583.0, 227573.0, 2919458.0, 884661.0, 82702.0, 18365.0, 5091.0, 1707.0, 656.0, 351.0, 155.0, 114.0, 86.0, 44.0, 41.0, 47.0, 23.0, 27.0, 34.0, 11.0, 18.0, 4.0, 8.0, 11.0, 10.0, 9.0, 2.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.26025390625, -9.9033203125, -9.54638671875, -9.189453125, -8.83251953125, -8.4755859375, -8.11865234375, -7.76171875, -7.40478515625, -7.0478515625, -6.69091796875, -6.333984375, -5.97705078125, -5.6201171875, -5.26318359375, -4.90625, -4.54931640625, -4.1923828125, -3.83544921875, -3.478515625, -3.12158203125, -2.7646484375, -2.40771484375, -2.05078125, -1.69384765625, -1.3369140625, -0.97998046875, -0.623046875, -0.26611328125, 0.0908203125, 0.44775390625, 0.8046875, 1.16162109375, 1.5185546875, 1.87548828125, 2.232421875, 2.58935546875, 2.9462890625, 3.30322265625, 3.66015625, 4.01708984375, 4.3740234375, 4.73095703125, 5.087890625, 5.44482421875, 5.8017578125, 6.15869140625, 6.515625, 6.87255859375, 7.2294921875, 7.58642578125, 7.943359375, 8.30029296875, 8.6572265625, 9.01416015625, 9.37109375, 9.72802734375, 10.0849609375, 10.44189453125, 10.798828125, 11.15576171875, 11.5126953125, 11.86962890625, 12.2265625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 6.0, 11.0, 17.0, 13.0, 19.0, 15.0, 25.0, 29.0, 48.0, 64.0, 90.0, 128.0, 165.0, 205.0, 229.0, 314.0, 372.0, 433.0, 404.0, 347.0, 243.0, 226.0, 168.0, 125.0, 86.0, 67.0, 46.0, 41.0, 32.0, 20.0, 18.0, 17.0, 8.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.7890625, -7.56353759765625, -7.3380126953125, -7.11248779296875, -6.886962890625, -6.66143798828125, -6.4359130859375, -6.21038818359375, -5.98486328125, -5.75933837890625, -5.5338134765625, -5.30828857421875, -5.082763671875, -4.85723876953125, -4.6317138671875, -4.40618896484375, -4.1806640625, -3.95513916015625, -3.7296142578125, -3.50408935546875, -3.278564453125, -3.05303955078125, -2.8275146484375, -2.60198974609375, -2.37646484375, -2.15093994140625, -1.9254150390625, -1.69989013671875, -1.474365234375, -1.24884033203125, -1.0233154296875, -0.79779052734375, -0.572265625, -0.34674072265625, -0.1212158203125, 0.10430908203125, 0.329833984375, 0.55535888671875, 0.7808837890625, 1.00640869140625, 1.23193359375, 1.45745849609375, 1.6829833984375, 1.90850830078125, 2.134033203125, 2.35955810546875, 2.5850830078125, 2.81060791015625, 3.0361328125, 3.26165771484375, 3.4871826171875, 3.71270751953125, 3.938232421875, 4.16375732421875, 4.3892822265625, 4.61480712890625, 4.84033203125, 5.06585693359375, 5.2913818359375, 5.51690673828125, 5.742431640625, 5.96795654296875, 6.1934814453125, 6.41900634765625, 6.64453125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 12.0, 13.0, 15.0, 33.0, 48.0, 69.0, 102.0, 172.0, 290.0, 467.0, 745.0, 1473.0, 3048.0, 7035.0, 17382.0, 49184.0, 167608.0, 788918.0, 2393631.0, 567793.0, 130285.0, 39893.0, 14473.0, 5943.0, 2607.0, 1324.0, 674.0, 363.0, 238.0, 160.0, 87.0, 68.0, 44.0, 30.0, 17.0, 14.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.4560546875, -11.052734375, -10.6494140625, -10.24609375, -9.8427734375, -9.439453125, -9.0361328125, -8.6328125, -8.2294921875, -7.826171875, -7.4228515625, -7.01953125, -6.6162109375, -6.212890625, -5.8095703125, -5.40625, -5.0029296875, -4.599609375, -4.1962890625, -3.79296875, -3.3896484375, -2.986328125, -2.5830078125, -2.1796875, -1.7763671875, -1.373046875, -0.9697265625, -0.56640625, -0.1630859375, 0.240234375, 0.6435546875, 1.046875, 1.4501953125, 1.853515625, 2.2568359375, 2.66015625, 3.0634765625, 3.466796875, 3.8701171875, 4.2734375, 4.6767578125, 5.080078125, 5.4833984375, 5.88671875, 6.2900390625, 6.693359375, 7.0966796875, 7.5, 7.9033203125, 8.306640625, 8.7099609375, 9.11328125, 9.5166015625, 9.919921875, 10.3232421875, 10.7265625, 11.1298828125, 11.533203125, 11.9365234375, 12.33984375, 12.7431640625, 13.146484375, 13.5498046875, 13.953125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 34.0, 116.0, 287.0, 305.0, 172.0, 67.0, 22.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-224.4994354248047, -220.2763214111328, -216.05319213867188, -211.830078125, -207.60696411132812, -203.38385009765625, -199.1607208251953, -194.93760681152344, -190.7144775390625, -186.49136352539062, -182.2682342529297, -178.0451202392578, -173.82200622558594, -169.598876953125, -165.37576293945312, -161.15264892578125, -156.92953491210938, -152.7064208984375, -148.48329162597656, -144.2601776123047, -140.0370635986328, -135.81393432617188, -131.5908203125, -127.36770629882812, -123.14458465576172, -118.92146301269531, -114.69834899902344, -110.47522735595703, -106.25210571289062, -102.02899169921875, -97.80587005615234, -93.58274841308594, -89.35963439941406, -85.13651275634766, -80.91339874267578, -76.69027709960938, -72.4671630859375, -68.2440414428711, -64.02091979980469, -59.79780197143555, -55.574684143066406, -51.351566314697266, -47.128448486328125, -42.90532684326172, -38.68220901489258, -34.45909118652344, -30.235971450805664, -26.01285171508789, -21.78973388671875, -17.56661605834961, -13.343496322631836, -9.120377540588379, -4.897258758544922, -0.6741409301757812, 3.548978805541992, 7.772098541259766, 11.995216369628906, 16.218334197998047, 20.44145393371582, 24.664573669433594, 28.887691497802734, 33.110809326171875, 37.33393096923828, 41.55704879760742, 45.78016662597656]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 14.0, 5.0, 17.0, 19.0, 13.0, 25.0, 25.0, 26.0, 41.0, 17.0, 31.0, 37.0, 38.0, 44.0, 40.0, 42.0, 38.0, 41.0, 42.0, 36.0, 38.0, 40.0, 32.0, 32.0, 27.0, 25.0, 25.0, 22.0, 22.0, 21.0, 21.0, 23.0, 9.0, 9.0, 5.0, 4.0, 10.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.811885833740234, -26.935426712036133, -26.0589656829834, -25.182506561279297, -24.306047439575195, -23.429588317871094, -22.55312728881836, -21.676668167114258, -20.800209045410156, -19.923749923706055, -19.04728889465332, -18.17082977294922, -17.294370651245117, -16.417911529541016, -15.541450500488281, -14.66499137878418, -13.788530349731445, -12.912070274353027, -12.035611152648926, -11.159151077270508, -10.282691955566406, -9.406231880187988, -8.52977180480957, -7.6533122062683105, -6.776852607727051, -5.900393009185791, -5.023933410644531, -4.147473335266113, -3.2710137367248535, -2.3945541381835938, -1.5180940628051758, -0.641634464263916, 0.23482322692871094, 1.1112829446792603, 1.9877426624298096, 2.8642024993896484, 3.740662097930908, 4.617121696472168, 5.493581771850586, 6.370041370391846, 7.2465009689331055, 8.122961044311523, 8.999420166015625, 9.875880241394043, 10.752340316772461, 11.628799438476562, 12.50525951385498, 13.381719589233398, 14.2581787109375, 15.134638786315918, 16.011098861694336, 16.887557983398438, 17.76401710510254, 18.64047622680664, 19.516937255859375, 20.393396377563477, 21.269855499267578, 22.14631462097168, 23.022775650024414, 23.899234771728516, 24.775693893432617, 25.65215301513672, 26.528614044189453, 27.405073165893555, 28.28153419494629]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 5.0, 3.0, 9.0, 8.0, 13.0, 14.0, 17.0, 19.0, 20.0, 32.0, 31.0, 20.0, 35.0, 32.0, 32.0, 37.0, 35.0, 38.0, 44.0, 53.0, 35.0, 51.0, 35.0, 40.0, 34.0, 33.0, 31.0, 19.0, 32.0, 34.0, 27.0, 28.0, 16.0, 14.0, 11.0, 10.0, 7.0, 9.0, 8.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.659698486328125, -2.57135009765625, -2.483001708984375, -2.3946533203125, -2.306304931640625, -2.21795654296875, -2.129608154296875, -2.041259765625, -1.952911376953125, -1.86456298828125, -1.776214599609375, -1.6878662109375, -1.599517822265625, -1.51116943359375, -1.422821044921875, -1.33447265625, -1.246124267578125, -1.15777587890625, -1.069427490234375, -0.9810791015625, -0.892730712890625, -0.80438232421875, -0.716033935546875, -0.627685546875, -0.539337158203125, -0.45098876953125, -0.362640380859375, -0.2742919921875, -0.185943603515625, -0.09759521484375, -0.009246826171875, 0.0791015625, 0.167449951171875, 0.25579833984375, 0.344146728515625, 0.4324951171875, 0.520843505859375, 0.60919189453125, 0.697540283203125, 0.785888671875, 0.874237060546875, 0.96258544921875, 1.050933837890625, 1.1392822265625, 1.227630615234375, 1.31597900390625, 1.404327392578125, 1.49267578125, 1.581024169921875, 1.66937255859375, 1.757720947265625, 1.8460693359375, 1.934417724609375, 2.02276611328125, 2.111114501953125, 2.199462890625, 2.287811279296875, 2.37615966796875, 2.464508056640625, 2.5528564453125, 2.641204833984375, 2.72955322265625, 2.817901611328125, 2.90625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 14.0, 13.0, 19.0, 24.0, 43.0, 73.0, 88.0, 145.0, 220.0, 320.0, 470.0, 765.0, 1047.0, 1719.0, 2673.0, 3926.0, 6043.0, 9004.0, 13778.0, 20622.0, 30457.0, 44382.0, 61310.0, 82464.0, 105717.0, 143381.0, 140764.0, 104644.0, 81129.0, 60781.0, 43291.0, 29808.0, 20205.0, 13311.0, 8987.0, 5640.0, 3894.0, 2482.0, 1607.0, 1109.0, 741.0, 517.0, 328.0, 179.0, 150.0, 103.0, 58.0, 40.0, 33.0, 16.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.232421875, -2.155364990234375, -2.07830810546875, -2.001251220703125, -1.9241943359375, -1.847137451171875, -1.77008056640625, -1.693023681640625, -1.615966796875, -1.538909912109375, -1.46185302734375, -1.384796142578125, -1.3077392578125, -1.230682373046875, -1.15362548828125, -1.076568603515625, -0.99951171875, -0.922454833984375, -0.84539794921875, -0.768341064453125, -0.6912841796875, -0.614227294921875, -0.53717041015625, -0.460113525390625, -0.383056640625, -0.305999755859375, -0.22894287109375, -0.151885986328125, -0.0748291015625, 0.002227783203125, 0.07928466796875, 0.156341552734375, 0.2333984375, 0.310455322265625, 0.38751220703125, 0.464569091796875, 0.5416259765625, 0.618682861328125, 0.69573974609375, 0.772796630859375, 0.849853515625, 0.926910400390625, 1.00396728515625, 1.081024169921875, 1.1580810546875, 1.235137939453125, 1.31219482421875, 1.389251708984375, 1.46630859375, 1.543365478515625, 1.62042236328125, 1.697479248046875, 1.7745361328125, 1.851593017578125, 1.92864990234375, 2.005706787109375, 2.082763671875, 2.159820556640625, 2.23687744140625, 2.313934326171875, 2.3909912109375, 2.468048095703125, 2.54510498046875, 2.622161865234375, 2.69921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 3.0, 4.0, 15.0, 7.0, 5.0, 11.0, 8.0, 16.0, 22.0, 17.0, 15.0, 21.0, 17.0, 26.0, 14.0, 32.0, 29.0, 39.0, 29.0, 24.0, 35.0, 49.0, 28.0, 1063.0, 52.0, 46.0, 28.0, 25.0, 39.0, 34.0, 30.0, 27.0, 24.0, 20.0, 24.0, 25.0, 13.0, 22.0, 7.0, 12.0, 7.0, 11.0, 7.0, 9.0, 12.0, 8.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.099609375, -3.005401611328125, -2.91119384765625, -2.816986083984375, -2.7227783203125, -2.628570556640625, -2.53436279296875, -2.440155029296875, -2.345947265625, -2.251739501953125, -2.15753173828125, -2.063323974609375, -1.9691162109375, -1.874908447265625, -1.78070068359375, -1.686492919921875, -1.59228515625, -1.498077392578125, -1.40386962890625, -1.309661865234375, -1.2154541015625, -1.121246337890625, -1.02703857421875, -0.932830810546875, -0.838623046875, -0.744415283203125, -0.65020751953125, -0.555999755859375, -0.4617919921875, -0.367584228515625, -0.27337646484375, -0.179168701171875, -0.0849609375, 0.009246826171875, 0.10345458984375, 0.197662353515625, 0.2918701171875, 0.386077880859375, 0.48028564453125, 0.574493408203125, 0.668701171875, 0.762908935546875, 0.85711669921875, 0.951324462890625, 1.0455322265625, 1.139739990234375, 1.23394775390625, 1.328155517578125, 1.42236328125, 1.516571044921875, 1.61077880859375, 1.704986572265625, 1.7991943359375, 1.893402099609375, 1.98760986328125, 2.081817626953125, 2.176025390625, 2.270233154296875, 2.36444091796875, 2.458648681640625, 2.5528564453125, 2.647064208984375, 2.74127197265625, 2.835479736328125, 2.9296875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 12.0, 20.0, 33.0, 41.0, 54.0, 71.0, 116.0, 177.0, 237.0, 414.0, 607.0, 979.0, 1550.0, 2545.0, 4379.0, 7408.0, 12737.0, 23685.0, 48614.0, 242270.0, 1601506.0, 76836.0, 32441.0, 16917.0, 9402.0, 5495.0, 3173.0, 2045.0, 1185.0, 725.0, 509.0, 292.0, 180.0, 145.0, 76.0, 65.0, 54.0, 36.0, 20.0, 17.0, 11.0, 13.0, 7.0, 7.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.6484375, -6.4483642578125, -6.248291015625, -6.0482177734375, -5.84814453125, -5.6480712890625, -5.447998046875, -5.2479248046875, -5.0478515625, -4.8477783203125, -4.647705078125, -4.4476318359375, -4.24755859375, -4.0474853515625, -3.847412109375, -3.6473388671875, -3.447265625, -3.2471923828125, -3.047119140625, -2.8470458984375, -2.64697265625, -2.4468994140625, -2.246826171875, -2.0467529296875, -1.8466796875, -1.6466064453125, -1.446533203125, -1.2464599609375, -1.04638671875, -0.8463134765625, -0.646240234375, -0.4461669921875, -0.24609375, -0.0460205078125, 0.154052734375, 0.3541259765625, 0.55419921875, 0.7542724609375, 0.954345703125, 1.1544189453125, 1.3544921875, 1.5545654296875, 1.754638671875, 1.9547119140625, 2.15478515625, 2.3548583984375, 2.554931640625, 2.7550048828125, 2.955078125, 3.1551513671875, 3.355224609375, 3.5552978515625, 3.75537109375, 3.9554443359375, 4.155517578125, 4.3555908203125, 4.5556640625, 4.7557373046875, 4.955810546875, 5.1558837890625, 5.35595703125, 5.5560302734375, 5.756103515625, 5.9561767578125, 6.15625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 8.0, 10.0, 18.0, 18.0, 17.0, 19.0, 37.0, 21.0, 45.0, 47.0, 50.0, 51.0, 72.0, 110.0, 96.0, 58.0, 54.0, 55.0, 31.0, 30.0, 33.0, 15.0, 18.0, 15.0, 17.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7626953125, -0.7331085205078125, -0.703521728515625, -0.6739349365234375, -0.64434814453125, -0.6147613525390625, -0.585174560546875, -0.5555877685546875, -0.5260009765625, -0.4964141845703125, -0.466827392578125, -0.4372406005859375, -0.40765380859375, -0.3780670166015625, -0.348480224609375, -0.3188934326171875, -0.289306640625, -0.2597198486328125, -0.230133056640625, -0.2005462646484375, -0.17095947265625, -0.1413726806640625, -0.111785888671875, -0.0821990966796875, -0.0526123046875, -0.0230255126953125, 0.006561279296875, 0.0361480712890625, 0.06573486328125, 0.0953216552734375, 0.124908447265625, 0.1544952392578125, 0.18408203125, 0.2136688232421875, 0.243255615234375, 0.2728424072265625, 0.30242919921875, 0.3320159912109375, 0.361602783203125, 0.3911895751953125, 0.4207763671875, 0.4503631591796875, 0.479949951171875, 0.5095367431640625, 0.53912353515625, 0.5687103271484375, 0.598297119140625, 0.6278839111328125, 0.657470703125, 0.6870574951171875, 0.716644287109375, 0.7462310791015625, 0.77581787109375, 0.8054046630859375, 0.834991455078125, 0.8645782470703125, 0.8941650390625, 0.9237518310546875, 0.953338623046875, 0.9829254150390625, 1.01251220703125, 1.0420989990234375, 1.071685791015625, 1.1012725830078125, 1.130859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 8.0, 13.0, 18.0, 9.0, 25.0, 31.0, 39.0, 62.0, 69.0, 103.0, 116.0, 206.0, 304.0, 983.0, 9243.0, 336655.0, 683523.0, 14773.0, 1316.0, 360.0, 189.0, 112.0, 89.0, 83.0, 54.0, 42.0, 28.0, 17.0, 13.0, 16.0, 12.0, 16.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.06982421875, -14.5849609375, -14.10009765625, -13.615234375, -13.13037109375, -12.6455078125, -12.16064453125, -11.67578125, -11.19091796875, -10.7060546875, -10.22119140625, -9.736328125, -9.25146484375, -8.7666015625, -8.28173828125, -7.796875, -7.31201171875, -6.8271484375, -6.34228515625, -5.857421875, -5.37255859375, -4.8876953125, -4.40283203125, -3.91796875, -3.43310546875, -2.9482421875, -2.46337890625, -1.978515625, -1.49365234375, -1.0087890625, -0.52392578125, -0.0390625, 0.44580078125, 0.9306640625, 1.41552734375, 1.900390625, 2.38525390625, 2.8701171875, 3.35498046875, 3.83984375, 4.32470703125, 4.8095703125, 5.29443359375, 5.779296875, 6.26416015625, 6.7490234375, 7.23388671875, 7.71875, 8.20361328125, 8.6884765625, 9.17333984375, 9.658203125, 10.14306640625, 10.6279296875, 11.11279296875, 11.59765625, 12.08251953125, 12.5673828125, 13.05224609375, 13.537109375, 14.02197265625, 14.5068359375, 14.99169921875, 15.4765625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 11.0, 35.0, 97.0, 340.0, 406.0, 84.0, 19.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.7659854888916, -29.0228214263916, -28.279659271240234, -27.536495208740234, -26.793331146240234, -26.050167083740234, -25.307004928588867, -24.563840866088867, -23.8206787109375, -23.0775146484375, -22.334352493286133, -21.591188430786133, -20.848024368286133, -20.104862213134766, -19.361698150634766, -18.618534088134766, -17.875370025634766, -17.132205963134766, -16.3890438079834, -15.645879745483398, -14.902715682983398, -14.159552574157715, -13.416389465332031, -12.673225402832031, -11.930062294006348, -11.186899185180664, -10.443735122680664, -9.70057201385498, -8.957408905029297, -8.214244842529297, -7.471081733703613, -6.7279181480407715, -5.9847564697265625, -5.241592884063721, -4.498429298400879, -3.7552661895751953, -3.0121026039123535, -2.2689390182495117, -1.5257759094238281, -0.7826123237609863, -0.03944873809814453, 0.7037147283554077, 1.44687819480896, 2.1900415420532227, 2.9332051277160645, 3.6763687133789062, 4.41953182220459, 5.162695407867432, 5.905858993530273, 6.649022579193115, 7.392186164855957, 8.13534927368164, 8.87851333618164, 9.621676445007324, 10.364839553833008, 11.108003616333008, 11.851166725158691, 12.594329833984375, 13.337493896484375, 14.080657005310059, 14.823820114135742, 15.566984176635742, 16.31014633178711, 17.05331039428711, 17.79647445678711]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 8.0, 10.0, 9.0, 16.0, 19.0, 23.0, 19.0, 30.0, 32.0, 38.0, 31.0, 54.0, 48.0, 53.0, 48.0, 47.0, 72.0, 49.0, 39.0, 46.0, 32.0, 48.0, 31.0, 35.0, 27.0, 24.0, 12.0, 20.0, 14.0, 13.0, 13.0, 7.0, 13.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.764403820037842, -2.6582677364349365, -2.5521318912506104, -2.445995807647705, -2.339859962463379, -2.2337238788604736, -2.1275877952575684, -2.021451950073242, -1.9153159856796265, -1.8091800212860107, -1.703044056892395, -1.5969080924987793, -1.490772008895874, -1.3846361637115479, -1.2785000801086426, -1.1723641157150269, -1.0662281513214111, -0.9600921869277954, -0.8539562225341797, -0.7478201985359192, -0.6416842341423035, -0.5355482697486877, -0.42941224575042725, -0.3232762813568115, -0.2171403169631958, -0.11100433766841888, -0.004868358373641968, 0.10126763582229614, 0.20740360021591187, 0.3135395646095276, 0.4196755886077881, 0.5258115530014038, 0.6319475173950195, 0.7380834817886353, 0.844219446182251, 0.9503554701805115, 1.0564913749694824, 1.1626274585723877, 1.2687634229660034, 1.3748993873596191, 1.4810353517532349, 1.5871713161468506, 1.6933072805404663, 1.799443244934082, 1.9055793285369873, 2.0117151737213135, 2.1178512573242188, 2.223987102508545, 2.33012318611145, 2.4362592697143555, 2.5423951148986816, 2.648531198501587, 2.754667043685913, 2.8608031272888184, 2.9669389724731445, 3.07307505607605, 3.179211139678955, 3.2853472232818604, 3.3914830684661865, 3.497619152069092, 3.603754997253418, 3.7098910808563232, 3.8160271644592285, 3.9221630096435547, 4.028298854827881]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 7.0, 9.0, 10.0, 11.0, 15.0, 20.0, 27.0, 33.0, 17.0, 28.0, 28.0, 35.0, 30.0, 38.0, 40.0, 36.0, 34.0, 54.0, 42.0, 47.0, 36.0, 37.0, 35.0, 31.0, 33.0, 34.0, 24.0, 29.0, 24.0, 31.0, 25.0, 13.0, 14.0, 6.0, 11.0, 7.0, 11.0, 8.0, 2.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.81640625, -2.727081298828125, -2.63775634765625, -2.548431396484375, -2.4591064453125, -2.369781494140625, -2.28045654296875, -2.191131591796875, -2.101806640625, -2.012481689453125, -1.92315673828125, -1.833831787109375, -1.7445068359375, -1.655181884765625, -1.56585693359375, -1.476531982421875, -1.38720703125, -1.297882080078125, -1.20855712890625, -1.119232177734375, -1.0299072265625, -0.940582275390625, -0.85125732421875, -0.761932373046875, -0.672607421875, -0.583282470703125, -0.49395751953125, -0.404632568359375, -0.3153076171875, -0.225982666015625, -0.13665771484375, -0.047332763671875, 0.0419921875, 0.131317138671875, 0.22064208984375, 0.309967041015625, 0.3992919921875, 0.488616943359375, 0.57794189453125, 0.667266845703125, 0.756591796875, 0.845916748046875, 0.93524169921875, 1.024566650390625, 1.1138916015625, 1.203216552734375, 1.29254150390625, 1.381866455078125, 1.47119140625, 1.560516357421875, 1.64984130859375, 1.739166259765625, 1.8284912109375, 1.917816162109375, 2.00714111328125, 2.096466064453125, 2.185791015625, 2.275115966796875, 2.36444091796875, 2.453765869140625, 2.5430908203125, 2.632415771484375, 2.72174072265625, 2.811065673828125, 2.900390625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 15.0, 20.0, 7.0, 24.0, 54.0, 86.0, 91.0, 130.0, 172.0, 274.0, 387.0, 588.0, 765.0, 1059.0, 1514.0, 2237.0, 3154.0, 4961.0, 7245.0, 12312.0, 24762.0, 60940.0, 190285.0, 418272.0, 195883.0, 62335.0, 25642.0, 12499.0, 7465.0, 4679.0, 3253.0, 2246.0, 1518.0, 1097.0, 762.0, 566.0, 371.0, 261.0, 176.0, 147.0, 96.0, 62.0, 42.0, 33.0, 22.0, 17.0, 10.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.28515625, -5.117431640625, -4.94970703125, -4.781982421875, -4.6142578125, -4.446533203125, -4.27880859375, -4.111083984375, -3.943359375, -3.775634765625, -3.60791015625, -3.440185546875, -3.2724609375, -3.104736328125, -2.93701171875, -2.769287109375, -2.6015625, -2.433837890625, -2.26611328125, -2.098388671875, -1.9306640625, -1.762939453125, -1.59521484375, -1.427490234375, -1.259765625, -1.092041015625, -0.92431640625, -0.756591796875, -0.5888671875, -0.421142578125, -0.25341796875, -0.085693359375, 0.08203125, 0.249755859375, 0.41748046875, 0.585205078125, 0.7529296875, 0.920654296875, 1.08837890625, 1.256103515625, 1.423828125, 1.591552734375, 1.75927734375, 1.927001953125, 2.0947265625, 2.262451171875, 2.43017578125, 2.597900390625, 2.765625, 2.933349609375, 3.10107421875, 3.268798828125, 3.4365234375, 3.604248046875, 3.77197265625, 3.939697265625, 4.107421875, 4.275146484375, 4.44287109375, 4.610595703125, 4.7783203125, 4.946044921875, 5.11376953125, 5.281494140625, 5.44921875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 6.0, 10.0, 17.0, 15.0, 23.0, 17.0, 23.0, 28.0, 40.0, 42.0, 46.0, 52.0, 80.0, 88.0, 110.0, 208.0, 1393.0, 226.0, 132.0, 72.0, 56.0, 59.0, 56.0, 42.0, 33.0, 19.0, 33.0, 19.0, 19.0, 13.0, 12.0, 8.0, 1.0, 11.0, 7.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.4764404296875, -9.132568359375, -8.7886962890625, -8.44482421875, -8.1009521484375, -7.757080078125, -7.4132080078125, -7.0693359375, -6.7254638671875, -6.381591796875, -6.0377197265625, -5.69384765625, -5.3499755859375, -5.006103515625, -4.6622314453125, -4.318359375, -3.9744873046875, -3.630615234375, -3.2867431640625, -2.94287109375, -2.5989990234375, -2.255126953125, -1.9112548828125, -1.5673828125, -1.2235107421875, -0.879638671875, -0.5357666015625, -0.19189453125, 0.1519775390625, 0.495849609375, 0.8397216796875, 1.18359375, 1.5274658203125, 1.871337890625, 2.2152099609375, 2.55908203125, 2.9029541015625, 3.246826171875, 3.5906982421875, 3.9345703125, 4.2784423828125, 4.622314453125, 4.9661865234375, 5.31005859375, 5.6539306640625, 5.997802734375, 6.3416748046875, 6.685546875, 7.0294189453125, 7.373291015625, 7.7171630859375, 8.06103515625, 8.4049072265625, 8.748779296875, 9.0926513671875, 9.4365234375, 9.7803955078125, 10.124267578125, 10.4681396484375, 10.81201171875, 11.1558837890625, 11.499755859375, 11.8436279296875, 12.1875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 7.0, 11.0, 16.0, 15.0, 30.0, 32.0, 66.0, 121.0, 197.0, 449.0, 1164.0, 3917.0, 16824.0, 108397.0, 2427026.0, 535046.0, 40831.0, 8081.0, 2076.0, 675.0, 294.0, 168.0, 91.0, 50.0, 31.0, 27.0, 18.0, 13.0, 12.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.41845703125, -15.7275390625, -15.03662109375, -14.345703125, -13.65478515625, -12.9638671875, -12.27294921875, -11.58203125, -10.89111328125, -10.2001953125, -9.50927734375, -8.818359375, -8.12744140625, -7.4365234375, -6.74560546875, -6.0546875, -5.36376953125, -4.6728515625, -3.98193359375, -3.291015625, -2.60009765625, -1.9091796875, -1.21826171875, -0.52734375, 0.16357421875, 0.8544921875, 1.54541015625, 2.236328125, 2.92724609375, 3.6181640625, 4.30908203125, 5.0, 5.69091796875, 6.3818359375, 7.07275390625, 7.763671875, 8.45458984375, 9.1455078125, 9.83642578125, 10.52734375, 11.21826171875, 11.9091796875, 12.60009765625, 13.291015625, 13.98193359375, 14.6728515625, 15.36376953125, 16.0546875, 16.74560546875, 17.4365234375, 18.12744140625, 18.818359375, 19.50927734375, 20.2001953125, 20.89111328125, 21.58203125, 22.27294921875, 22.9638671875, 23.65478515625, 24.345703125, 25.03662109375, 25.7275390625, 26.41845703125, 27.109375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 104.0, 888.0, 25.0], "bins": [-812.82177734375, -799.7821044921875, -786.742431640625, -773.7027587890625, -760.6630859375, -747.6234130859375, -734.5838012695312, -721.5441284179688, -708.5044555664062, -695.4647827148438, -682.4251098632812, -669.3854370117188, -656.3457641601562, -643.30615234375, -630.2664794921875, -617.226806640625, -604.1871337890625, -591.1474609375, -578.1077880859375, -565.068115234375, -552.0284423828125, -538.98876953125, -525.9491577148438, -512.9094848632812, -499.8697814941406, -486.8301086425781, -473.7904357910156, -460.75079345703125, -447.71112060546875, -434.67144775390625, -421.63177490234375, -408.59210205078125, -395.5524597167969, -382.5127868652344, -369.4731140136719, -356.4334716796875, -343.393798828125, -330.3541259765625, -317.314453125, -304.2747802734375, -291.2351379394531, -278.1954650878906, -265.1557922363281, -252.1161346435547, -239.07647705078125, -226.03680419921875, -212.99713134765625, -199.9574737548828, -186.91781616210938, -173.87814331054688, -160.83848571777344, -147.79881286621094, -134.7591552734375, -121.719482421875, -108.67981719970703, -95.64015197753906, -82.60047912597656, -69.5608139038086, -56.521148681640625, -43.48147964477539, -30.441814422607422, -17.402145385742188, -4.362480163574219, 8.67718505859375, 21.716846466064453]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 11.0, 12.0, 13.0, 19.0, 20.0, 29.0, 25.0, 20.0, 44.0, 28.0, 33.0, 46.0, 43.0, 37.0, 37.0, 49.0, 47.0, 41.0, 48.0, 39.0, 35.0, 33.0, 34.0, 31.0, 26.0, 24.0, 36.0, 24.0, 16.0, 14.0, 23.0, 14.0, 6.0, 6.0, 12.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.899436950683594, -34.70469284057617, -33.509952545166016, -32.315208435058594, -31.120468139648438, -29.925724029541016, -28.730981826782227, -27.536239624023438, -26.34149742126465, -25.14675521850586, -23.95201301574707, -22.75727081298828, -21.56252670288086, -20.367786407470703, -19.17304229736328, -17.978300094604492, -16.783557891845703, -15.588815689086914, -14.394073486328125, -13.19933032989502, -12.00458812713623, -10.809845924377441, -9.615102767944336, -8.420360565185547, -7.225618362426758, -6.030876159667969, -4.8361334800720215, -3.6413910388946533, -2.446648597717285, -1.251906394958496, -0.05716371536254883, 1.1375789642333984, 2.3323211669921875, 3.5270636081695557, 4.721806049346924, 5.916548728942871, 7.11129093170166, 8.30603313446045, 9.500776290893555, 10.695518493652344, 11.890260696411133, 13.085002899169922, 14.279745101928711, 15.474488258361816, 16.669231414794922, 17.863971710205078, 19.0587158203125, 20.25345802307129, 21.448200225830078, 22.642942428588867, 23.837684631347656, 25.032426834106445, 26.227169036865234, 27.421913146972656, 28.616655349731445, 29.811397552490234, 31.006139755249023, 32.20088195800781, 33.395626068115234, 34.59036636352539, 35.78511047363281, 36.97985076904297, 38.17459487915039, 39.36933898925781, 40.56407928466797]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 7.0, 3.0, 5.0, 3.0, 16.0, 8.0, 22.0, 14.0, 19.0, 20.0, 28.0, 21.0, 26.0, 31.0, 26.0, 27.0, 41.0, 35.0, 44.0, 37.0, 46.0, 35.0, 35.0, 46.0, 42.0, 34.0, 40.0, 33.0, 38.0, 26.0, 25.0, 29.0, 11.0, 16.0, 25.0, 14.0, 14.0, 11.0, 9.0, 7.0, 7.0, 8.0, 5.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.8203125, -2.728607177734375, -2.63690185546875, -2.545196533203125, -2.4534912109375, -2.361785888671875, -2.27008056640625, -2.178375244140625, -2.086669921875, -1.994964599609375, -1.90325927734375, -1.811553955078125, -1.7198486328125, -1.628143310546875, -1.53643798828125, -1.444732666015625, -1.35302734375, -1.261322021484375, -1.16961669921875, -1.077911376953125, -0.9862060546875, -0.894500732421875, -0.80279541015625, -0.711090087890625, -0.619384765625, -0.527679443359375, -0.43597412109375, -0.344268798828125, -0.2525634765625, -0.160858154296875, -0.06915283203125, 0.022552490234375, 0.1142578125, 0.205963134765625, 0.29766845703125, 0.389373779296875, 0.4810791015625, 0.572784423828125, 0.66448974609375, 0.756195068359375, 0.847900390625, 0.939605712890625, 1.03131103515625, 1.123016357421875, 1.2147216796875, 1.306427001953125, 1.39813232421875, 1.489837646484375, 1.58154296875, 1.673248291015625, 1.76495361328125, 1.856658935546875, 1.9483642578125, 2.040069580078125, 2.13177490234375, 2.223480224609375, 2.315185546875, 2.406890869140625, 2.49859619140625, 2.590301513671875, 2.6820068359375, 2.773712158203125, 2.86541748046875, 2.957122802734375, 3.048828125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 13.0, 9.0, 12.0, 9.0, 16.0, 20.0, 38.0, 43.0, 54.0, 70.0, 91.0, 173.0, 333.0, 636.0, 1500.0, 4051.0, 13611.0, 62340.0, 788813.0, 3075064.0, 203993.0, 30200.0, 7869.0, 2847.0, 1205.0, 517.0, 241.0, 142.0, 89.0, 78.0, 47.0, 35.0, 23.0, 14.0, 20.0, 9.0, 8.0, 10.0, 5.0, 4.0, 4.0, 4.0, 7.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.301513671875, -10.91552734375, -10.529541015625, -10.1435546875, -9.757568359375, -9.37158203125, -8.985595703125, -8.599609375, -8.213623046875, -7.82763671875, -7.441650390625, -7.0556640625, -6.669677734375, -6.28369140625, -5.897705078125, -5.51171875, -5.125732421875, -4.73974609375, -4.353759765625, -3.9677734375, -3.581787109375, -3.19580078125, -2.809814453125, -2.423828125, -2.037841796875, -1.65185546875, -1.265869140625, -0.8798828125, -0.493896484375, -0.10791015625, 0.278076171875, 0.6640625, 1.050048828125, 1.43603515625, 1.822021484375, 2.2080078125, 2.593994140625, 2.97998046875, 3.365966796875, 3.751953125, 4.137939453125, 4.52392578125, 4.909912109375, 5.2958984375, 5.681884765625, 6.06787109375, 6.453857421875, 6.83984375, 7.225830078125, 7.61181640625, 7.997802734375, 8.3837890625, 8.769775390625, 9.15576171875, 9.541748046875, 9.927734375, 10.313720703125, 10.69970703125, 11.085693359375, 11.4716796875, 11.857666015625, 12.24365234375, 12.629638671875, 13.015625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 11.0, 13.0, 29.0, 27.0, 56.0, 91.0, 113.0, 198.0, 348.0, 534.0, 766.0, 688.0, 433.0, 296.0, 178.0, 92.0, 67.0, 39.0, 37.0, 25.0, 11.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.65625, -15.2720947265625, -14.887939453125, -14.5037841796875, -14.11962890625, -13.7354736328125, -13.351318359375, -12.9671630859375, -12.5830078125, -12.1988525390625, -11.814697265625, -11.4305419921875, -11.04638671875, -10.6622314453125, -10.278076171875, -9.8939208984375, -9.509765625, -9.1256103515625, -8.741455078125, -8.3572998046875, -7.97314453125, -7.5889892578125, -7.204833984375, -6.8206787109375, -6.4365234375, -6.0523681640625, -5.668212890625, -5.2840576171875, -4.89990234375, -4.5157470703125, -4.131591796875, -3.7474365234375, -3.36328125, -2.9791259765625, -2.594970703125, -2.2108154296875, -1.82666015625, -1.4425048828125, -1.058349609375, -0.6741943359375, -0.2900390625, 0.0941162109375, 0.478271484375, 0.8624267578125, 1.24658203125, 1.6307373046875, 2.014892578125, 2.3990478515625, 2.783203125, 3.1673583984375, 3.551513671875, 3.9356689453125, 4.31982421875, 4.7039794921875, 5.088134765625, 5.4722900390625, 5.8564453125, 6.2406005859375, 6.624755859375, 7.0089111328125, 7.39306640625, 7.7772216796875, 8.161376953125, 8.5455322265625, 8.9296875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 5.0, 12.0, 15.0, 30.0, 49.0, 85.0, 127.0, 230.0, 413.0, 935.0, 2408.0, 8260.0, 37792.0, 331947.0, 3270103.0, 478835.0, 48447.0, 9805.0, 2762.0, 1000.0, 463.0, 247.0, 114.0, 74.0, 40.0, 30.0, 15.0, 15.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25, -17.507080078125, -16.76416015625, -16.021240234375, -15.2783203125, -14.535400390625, -13.79248046875, -13.049560546875, -12.306640625, -11.563720703125, -10.82080078125, -10.077880859375, -9.3349609375, -8.592041015625, -7.84912109375, -7.106201171875, -6.36328125, -5.620361328125, -4.87744140625, -4.134521484375, -3.3916015625, -2.648681640625, -1.90576171875, -1.162841796875, -0.419921875, 0.322998046875, 1.06591796875, 1.808837890625, 2.5517578125, 3.294677734375, 4.03759765625, 4.780517578125, 5.5234375, 6.266357421875, 7.00927734375, 7.752197265625, 8.4951171875, 9.238037109375, 9.98095703125, 10.723876953125, 11.466796875, 12.209716796875, 12.95263671875, 13.695556640625, 14.4384765625, 15.181396484375, 15.92431640625, 16.667236328125, 17.41015625, 18.153076171875, 18.89599609375, 19.638916015625, 20.3818359375, 21.124755859375, 21.86767578125, 22.610595703125, 23.353515625, 24.096435546875, 24.83935546875, 25.582275390625, 26.3251953125, 27.068115234375, 27.81103515625, 28.553955078125, 29.296875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 13.0, 21.0, 20.0, 31.0, 42.0, 86.0, 117.0, 94.0, 112.0, 99.0, 98.0, 64.0, 63.0, 48.0, 27.0, 26.0, 11.0, 12.0, 5.0, 6.0, 3.0, 3.0, 1.0], "bins": [-77.65921783447266, -76.09965515136719, -74.54010009765625, -72.98053741455078, -71.42097473144531, -69.86141967773438, -68.3018569946289, -66.74229431152344, -65.18273162841797, -63.623172760009766, -62.0636100769043, -60.504051208496094, -58.944488525390625, -57.38492965698242, -55.82537078857422, -54.26580810546875, -52.70625305175781, -51.14669418334961, -49.58713150024414, -48.02757263183594, -46.46800994873047, -44.908451080322266, -43.34889221191406, -41.789329528808594, -40.229766845703125, -38.67020797729492, -37.11064529418945, -35.55108642578125, -33.99152374267578, -32.43196487426758, -30.872404098510742, -29.312843322753906, -27.75328254699707, -26.193721771240234, -24.6341609954834, -23.074600219726562, -21.51504135131836, -19.955480575561523, -18.395919799804688, -16.836360931396484, -15.276799201965332, -13.717238426208496, -12.157678604125977, -10.59811782836914, -9.038557052612305, -7.478997230529785, -5.919436454772949, -4.35987663269043, -2.8003158569335938, -1.2407554388046265, 0.3188049793243408, 1.8783655166625977, 3.4379258155822754, 4.997486114501953, 6.557046890258789, 8.116606712341309, 9.676167488098145, 11.23572826385498, 12.7952880859375, 14.354848861694336, 15.914409637451172, 17.473968505859375, 19.033531188964844, 20.593090057373047, 22.152650833129883]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 6.0, 4.0, 11.0, 13.0, 12.0, 12.0, 11.0, 28.0, 17.0, 27.0, 19.0, 29.0, 38.0, 45.0, 34.0, 41.0, 34.0, 32.0, 40.0, 60.0, 31.0, 52.0, 42.0, 35.0, 32.0, 36.0, 23.0, 28.0, 30.0, 24.0, 20.0, 12.0, 20.0, 15.0, 17.0, 8.0, 11.0, 9.0, 11.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.793928146362305, -22.9865779876709, -22.179227828979492, -21.371877670288086, -20.56452751159668, -19.757177352905273, -18.9498291015625, -18.142478942871094, -17.335128784179688, -16.52777862548828, -15.720428466796875, -14.913078308105469, -14.105728149414062, -13.298377990722656, -12.491028785705566, -11.68367862701416, -10.876327514648438, -10.068977355957031, -9.261627197265625, -8.454277038574219, -7.646927356719971, -6.8395771980285645, -6.032227516174316, -5.22487735748291, -4.417527198791504, -3.6101770401000977, -2.8028271198272705, -1.9954771995544434, -1.188127040863037, -0.38077688217163086, 0.4265727996826172, 1.2339229583740234, 2.0412731170654297, 2.848623275756836, 3.655973196029663, 4.46332311630249, 5.2706732749938965, 6.078023433685303, 6.885373115539551, 7.692723274230957, 8.500073432922363, 9.30742359161377, 10.114773750305176, 10.922122955322266, 11.729473114013672, 12.536823272705078, 13.344173431396484, 14.15152359008789, 14.958873748779297, 15.766223907470703, 16.57357406616211, 17.380924224853516, 18.188274383544922, 18.995624542236328, 19.802974700927734, 20.61032485961914, 21.417675018310547, 22.225025177001953, 23.03237533569336, 23.839725494384766, 24.647075653076172, 25.454425811767578, 26.261775970458984, 27.06912612915039, 27.876474380493164]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 5.0, 16.0, 10.0, 22.0, 22.0, 17.0, 26.0, 29.0, 30.0, 46.0, 27.0, 25.0, 37.0, 48.0, 41.0, 28.0, 42.0, 57.0, 42.0, 43.0, 46.0, 43.0, 42.0, 39.0, 34.0, 17.0, 26.0, 20.0, 16.0, 8.0, 17.0, 15.0, 7.0, 11.0, 8.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.728515625, -2.623138427734375, -2.51776123046875, -2.412384033203125, -2.3070068359375, -2.201629638671875, -2.09625244140625, -1.990875244140625, -1.885498046875, -1.780120849609375, -1.67474365234375, -1.569366455078125, -1.4639892578125, -1.358612060546875, -1.25323486328125, -1.147857666015625, -1.04248046875, -0.937103271484375, -0.83172607421875, -0.726348876953125, -0.6209716796875, -0.515594482421875, -0.41021728515625, -0.304840087890625, -0.199462890625, -0.094085693359375, 0.01129150390625, 0.116668701171875, 0.2220458984375, 0.327423095703125, 0.43280029296875, 0.538177490234375, 0.6435546875, 0.748931884765625, 0.85430908203125, 0.959686279296875, 1.0650634765625, 1.170440673828125, 1.27581787109375, 1.381195068359375, 1.486572265625, 1.591949462890625, 1.69732666015625, 1.802703857421875, 1.9080810546875, 2.013458251953125, 2.11883544921875, 2.224212646484375, 2.32958984375, 2.434967041015625, 2.54034423828125, 2.645721435546875, 2.7510986328125, 2.856475830078125, 2.96185302734375, 3.067230224609375, 3.172607421875, 3.277984619140625, 3.38336181640625, 3.488739013671875, 3.5941162109375, 3.699493408203125, 3.80487060546875, 3.910247802734375, 4.015625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 7.0, 7.0, 7.0, 15.0, 30.0, 29.0, 40.0, 84.0, 140.0, 166.0, 267.0, 395.0, 680.0, 958.0, 1454.0, 2409.0, 3625.0, 5455.0, 8698.0, 13478.0, 20562.0, 31042.0, 45146.0, 63717.0, 85202.0, 105119.0, 119806.0, 121705.0, 109327.0, 90185.0, 69218.0, 49628.0, 34114.0, 22920.0, 15019.0, 9882.0, 6286.0, 4110.0, 2663.0, 1765.0, 1114.0, 793.0, 452.0, 281.0, 180.0, 131.0, 80.0, 66.0, 50.0, 22.0, 12.0, 8.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.61328125, -2.531951904296875, -2.45062255859375, -2.369293212890625, -2.2879638671875, -2.206634521484375, -2.12530517578125, -2.043975830078125, -1.962646484375, -1.881317138671875, -1.79998779296875, -1.718658447265625, -1.6373291015625, -1.555999755859375, -1.47467041015625, -1.393341064453125, -1.31201171875, -1.230682373046875, -1.14935302734375, -1.068023681640625, -0.9866943359375, -0.905364990234375, -0.82403564453125, -0.742706298828125, -0.661376953125, -0.580047607421875, -0.49871826171875, -0.417388916015625, -0.3360595703125, -0.254730224609375, -0.17340087890625, -0.092071533203125, -0.0107421875, 0.070587158203125, 0.15191650390625, 0.233245849609375, 0.3145751953125, 0.395904541015625, 0.47723388671875, 0.558563232421875, 0.639892578125, 0.721221923828125, 0.80255126953125, 0.883880615234375, 0.9652099609375, 1.046539306640625, 1.12786865234375, 1.209197998046875, 1.29052734375, 1.371856689453125, 1.45318603515625, 1.534515380859375, 1.6158447265625, 1.697174072265625, 1.77850341796875, 1.859832763671875, 1.941162109375, 2.022491455078125, 2.10382080078125, 2.185150146484375, 2.2664794921875, 2.347808837890625, 2.42913818359375, 2.510467529296875, 2.591796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 7.0, 7.0, 9.0, 12.0, 16.0, 12.0, 26.0, 18.0, 18.0, 15.0, 24.0, 38.0, 31.0, 33.0, 35.0, 33.0, 38.0, 43.0, 31.0, 41.0, 1059.0, 34.0, 35.0, 44.0, 23.0, 32.0, 37.0, 37.0, 18.0, 27.0, 27.0, 22.0, 14.0, 23.0, 19.0, 10.0, 13.0, 8.0, 4.0, 7.0, 5.0, 5.0, 8.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-3.708984375, -3.5977783203125, -3.486572265625, -3.3753662109375, -3.26416015625, -3.1529541015625, -3.041748046875, -2.9305419921875, -2.8193359375, -2.7081298828125, -2.596923828125, -2.4857177734375, -2.37451171875, -2.2633056640625, -2.152099609375, -2.0408935546875, -1.9296875, -1.8184814453125, -1.707275390625, -1.5960693359375, -1.48486328125, -1.3736572265625, -1.262451171875, -1.1512451171875, -1.0400390625, -0.9288330078125, -0.817626953125, -0.7064208984375, -0.59521484375, -0.4840087890625, -0.372802734375, -0.2615966796875, -0.150390625, -0.0391845703125, 0.072021484375, 0.1832275390625, 0.29443359375, 0.4056396484375, 0.516845703125, 0.6280517578125, 0.7392578125, 0.8504638671875, 0.961669921875, 1.0728759765625, 1.18408203125, 1.2952880859375, 1.406494140625, 1.5177001953125, 1.62890625, 1.7401123046875, 1.851318359375, 1.9625244140625, 2.07373046875, 2.1849365234375, 2.296142578125, 2.4073486328125, 2.5185546875, 2.6297607421875, 2.740966796875, 2.8521728515625, 2.96337890625, 3.0745849609375, 3.185791015625, 3.2969970703125, 3.408203125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 6.0, 15.0, 13.0, 17.0, 26.0, 37.0, 37.0, 33.0, 72.0, 99.0, 131.0, 197.0, 363.0, 582.0, 855.0, 1417.0, 2740.0, 5337.0, 11752.0, 29008.0, 85404.0, 1743253.0, 146661.0, 38723.0, 15449.0, 7003.0, 3372.0, 1777.0, 1016.0, 606.0, 364.0, 216.0, 144.0, 103.0, 86.0, 44.0, 33.0, 28.0, 20.0, 13.0, 14.0, 16.0, 11.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.8984375, -9.552978515625, -9.20751953125, -8.862060546875, -8.5166015625, -8.171142578125, -7.82568359375, -7.480224609375, -7.134765625, -6.789306640625, -6.44384765625, -6.098388671875, -5.7529296875, -5.407470703125, -5.06201171875, -4.716552734375, -4.37109375, -4.025634765625, -3.68017578125, -3.334716796875, -2.9892578125, -2.643798828125, -2.29833984375, -1.952880859375, -1.607421875, -1.261962890625, -0.91650390625, -0.571044921875, -0.2255859375, 0.119873046875, 0.46533203125, 0.810791015625, 1.15625, 1.501708984375, 1.84716796875, 2.192626953125, 2.5380859375, 2.883544921875, 3.22900390625, 3.574462890625, 3.919921875, 4.265380859375, 4.61083984375, 4.956298828125, 5.3017578125, 5.647216796875, 5.99267578125, 6.338134765625, 6.68359375, 7.029052734375, 7.37451171875, 7.719970703125, 8.0654296875, 8.410888671875, 8.75634765625, 9.101806640625, 9.447265625, 9.792724609375, 10.13818359375, 10.483642578125, 10.8291015625, 11.174560546875, 11.52001953125, 11.865478515625, 12.2109375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 12.0, 14.0, 15.0, 18.0, 24.0, 26.0, 39.0, 48.0, 62.0, 87.0, 76.0, 74.0, 80.0, 80.0, 89.0, 49.0, 40.0, 46.0, 21.0, 21.0, 16.0, 8.0, 2.0, 11.0, 1.0, 3.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.419342041015625, -1.37481689453125, -1.330291748046875, -1.2857666015625, -1.241241455078125, -1.19671630859375, -1.152191162109375, -1.107666015625, -1.063140869140625, -1.01861572265625, -0.974090576171875, -0.9295654296875, -0.885040283203125, -0.84051513671875, -0.795989990234375, -0.75146484375, -0.706939697265625, -0.66241455078125, -0.617889404296875, -0.5733642578125, -0.528839111328125, -0.48431396484375, -0.439788818359375, -0.395263671875, -0.350738525390625, -0.30621337890625, -0.261688232421875, -0.2171630859375, -0.172637939453125, -0.12811279296875, -0.083587646484375, -0.0390625, 0.005462646484375, 0.04998779296875, 0.094512939453125, 0.1390380859375, 0.183563232421875, 0.22808837890625, 0.272613525390625, 0.317138671875, 0.361663818359375, 0.40618896484375, 0.450714111328125, 0.4952392578125, 0.539764404296875, 0.58428955078125, 0.628814697265625, 0.67333984375, 0.717864990234375, 0.76239013671875, 0.806915283203125, 0.8514404296875, 0.895965576171875, 0.94049072265625, 0.985015869140625, 1.029541015625, 1.074066162109375, 1.11859130859375, 1.163116455078125, 1.2076416015625, 1.252166748046875, 1.29669189453125, 1.341217041015625, 1.3857421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 9.0, 8.0, 9.0, 12.0, 16.0, 16.0, 18.0, 31.0, 57.0, 67.0, 113.0, 157.0, 263.0, 669.0, 2710.0, 18691.0, 540429.0, 463899.0, 17384.0, 2612.0, 648.0, 259.0, 129.0, 80.0, 76.0, 35.0, 39.0, 31.0, 19.0, 14.0, 14.0, 7.0, 7.0, 0.0, 4.0, 5.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5625, -16.99560546875, -16.4287109375, -15.86181640625, -15.294921875, -14.72802734375, -14.1611328125, -13.59423828125, -13.02734375, -12.46044921875, -11.8935546875, -11.32666015625, -10.759765625, -10.19287109375, -9.6259765625, -9.05908203125, -8.4921875, -7.92529296875, -7.3583984375, -6.79150390625, -6.224609375, -5.65771484375, -5.0908203125, -4.52392578125, -3.95703125, -3.39013671875, -2.8232421875, -2.25634765625, -1.689453125, -1.12255859375, -0.5556640625, 0.01123046875, 0.578125, 1.14501953125, 1.7119140625, 2.27880859375, 2.845703125, 3.41259765625, 3.9794921875, 4.54638671875, 5.11328125, 5.68017578125, 6.2470703125, 6.81396484375, 7.380859375, 7.94775390625, 8.5146484375, 9.08154296875, 9.6484375, 10.21533203125, 10.7822265625, 11.34912109375, 11.916015625, 12.48291015625, 13.0498046875, 13.61669921875, 14.18359375, 14.75048828125, 15.3173828125, 15.88427734375, 16.451171875, 17.01806640625, 17.5849609375, 18.15185546875, 18.71875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 13.0, 45.0, 109.0, 255.0, 364.0, 130.0, 45.0, 18.0, 11.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484811782836914, -20.69284439086914, -19.900876998901367, -19.108909606933594, -18.316944122314453, -17.52497673034668, -16.733009338378906, -15.941041946411133, -15.149075508117676, -14.357108116149902, -13.565141677856445, -12.773174285888672, -11.981206893920898, -11.189240455627441, -10.397273063659668, -9.605306625366211, -8.813339233398438, -8.021371841430664, -7.229405403137207, -6.437438011169434, -5.645471096038818, -4.853504180908203, -4.06153678894043, -3.2695698738098145, -2.477602958679199, -1.6856359243392944, -0.8936688899993896, -0.10170173645019531, 0.6902651786804199, 1.4822320938110352, 2.2741994857788086, 3.066166400909424, 3.858135223388672, 4.650102138519287, 5.442069053649902, 6.234036445617676, 7.026003360748291, 7.817970275878906, 8.60993766784668, 9.401905059814453, 10.19387149810791, 10.985838890075684, 11.77780532836914, 12.569772720336914, 13.361740112304688, 14.153706550598145, 14.945673942565918, 15.737640380859375, 16.52960777282715, 17.321575164794922, 18.113542556762695, 18.90550994873047, 19.69747543334961, 20.489442825317383, 21.281410217285156, 22.07337760925293, 22.865345001220703, 23.657312393188477, 24.44927978515625, 25.24124526977539, 26.033212661743164, 26.825180053710938, 27.61714744567871, 28.409114837646484, 29.201080322265625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 9.0, 6.0, 17.0, 16.0, 20.0, 12.0, 23.0, 30.0, 39.0, 22.0, 23.0, 28.0, 40.0, 33.0, 31.0, 57.0, 41.0, 38.0, 38.0, 43.0, 40.0, 34.0, 37.0, 34.0, 31.0, 42.0, 35.0, 25.0, 22.0, 25.0, 20.0, 13.0, 15.0, 12.0, 11.0, 10.0, 7.0, 8.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.685756683349609, -4.528868675231934, -4.371981143951416, -4.21509313583374, -4.058205604553223, -3.901317596435547, -3.74442982673645, -3.5875420570373535, -3.4306540489196777, -3.273766279220581, -3.1168785095214844, -2.9599905014038086, -2.803102731704712, -2.6462149620056152, -2.4893271923065186, -2.332439422607422, -2.175551652908325, -2.0186638832092285, -1.8617759943008423, -1.7048882246017456, -1.5480003356933594, -1.3911125659942627, -1.234224796295166, -1.0773369073867798, -0.9204491376876831, -0.7635613083839417, -0.6066734790802002, -0.4497857093811035, -0.29289788007736206, -0.1360100507736206, 0.020877718925476074, 0.1777656078338623, 0.334653377532959, 0.49154120683670044, 0.6484290361404419, 0.8053168058395386, 0.96220463514328, 1.1190924644470215, 1.2759802341461182, 1.4328681230545044, 1.589755892753601, 1.7466436624526978, 1.903531551361084, 2.0604193210601807, 2.2173070907592773, 2.374195098876953, 2.5310826301574707, 2.6879706382751465, 2.844858407974243, 3.00174617767334, 3.1586339473724365, 3.315521717071533, 3.472409725189209, 3.6292974948883057, 3.7861852645874023, 3.943073272705078, 4.099960803985596, 4.2568488121032715, 4.413736343383789, 4.570624351501465, 4.727511882781982, 4.884399890899658, 5.041287422180176, 5.198175430297852, 5.355063438415527]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 11.0, 11.0, 14.0, 18.0, 21.0, 22.0, 23.0, 26.0, 34.0, 23.0, 40.0, 36.0, 35.0, 35.0, 37.0, 47.0, 30.0, 42.0, 44.0, 48.0, 46.0, 40.0, 51.0, 27.0, 39.0, 21.0, 26.0, 17.0, 21.0, 15.0, 13.0, 13.0, 8.0, 15.0, 6.0, 8.0, 4.0, 4.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.667724609375, -2.56201171875, -2.456298828125, -2.3505859375, -2.244873046875, -2.13916015625, -2.033447265625, -1.927734375, -1.822021484375, -1.71630859375, -1.610595703125, -1.5048828125, -1.399169921875, -1.29345703125, -1.187744140625, -1.08203125, -0.976318359375, -0.87060546875, -0.764892578125, -0.6591796875, -0.553466796875, -0.44775390625, -0.342041015625, -0.236328125, -0.130615234375, -0.02490234375, 0.080810546875, 0.1865234375, 0.292236328125, 0.39794921875, 0.503662109375, 0.609375, 0.715087890625, 0.82080078125, 0.926513671875, 1.0322265625, 1.137939453125, 1.24365234375, 1.349365234375, 1.455078125, 1.560791015625, 1.66650390625, 1.772216796875, 1.8779296875, 1.983642578125, 2.08935546875, 2.195068359375, 2.30078125, 2.406494140625, 2.51220703125, 2.617919921875, 2.7236328125, 2.829345703125, 2.93505859375, 3.040771484375, 3.146484375, 3.252197265625, 3.35791015625, 3.463623046875, 3.5693359375, 3.675048828125, 3.78076171875, 3.886474609375, 3.9921875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 8.0, 12.0, 23.0, 25.0, 37.0, 69.0, 96.0, 170.0, 265.0, 409.0, 647.0, 1045.0, 1656.0, 2850.0, 4936.0, 9562.0, 20708.0, 54315.0, 168335.0, 420738.0, 236569.0, 73614.0, 26701.0, 11763.0, 5776.0, 3209.0, 1825.0, 1228.0, 717.0, 442.0, 286.0, 164.0, 123.0, 79.0, 50.0, 29.0, 20.0, 21.0, 8.0, 7.0, 4.0, 6.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.7896728515625, -5.606689453125, -5.4237060546875, -5.24072265625, -5.0577392578125, -4.874755859375, -4.6917724609375, -4.5087890625, -4.3258056640625, -4.142822265625, -3.9598388671875, -3.77685546875, -3.5938720703125, -3.410888671875, -3.2279052734375, -3.044921875, -2.8619384765625, -2.678955078125, -2.4959716796875, -2.31298828125, -2.1300048828125, -1.947021484375, -1.7640380859375, -1.5810546875, -1.3980712890625, -1.215087890625, -1.0321044921875, -0.84912109375, -0.6661376953125, -0.483154296875, -0.3001708984375, -0.1171875, 0.0657958984375, 0.248779296875, 0.4317626953125, 0.61474609375, 0.7977294921875, 0.980712890625, 1.1636962890625, 1.3466796875, 1.5296630859375, 1.712646484375, 1.8956298828125, 2.07861328125, 2.2615966796875, 2.444580078125, 2.6275634765625, 2.810546875, 2.9935302734375, 3.176513671875, 3.3594970703125, 3.54248046875, 3.7254638671875, 3.908447265625, 4.0914306640625, 4.2744140625, 4.4573974609375, 4.640380859375, 4.8233642578125, 5.00634765625, 5.1893310546875, 5.372314453125, 5.5552978515625, 5.73828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 7.0, 9.0, 9.0, 13.0, 14.0, 17.0, 13.0, 31.0, 33.0, 35.0, 33.0, 36.0, 53.0, 68.0, 112.0, 190.0, 1433.0, 303.0, 167.0, 86.0, 60.0, 48.0, 51.0, 37.0, 28.0, 42.0, 31.0, 20.0, 15.0, 14.0, 15.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.5177001953125, -12.066650390625, -11.6156005859375, -11.16455078125, -10.7135009765625, -10.262451171875, -9.8114013671875, -9.3603515625, -8.9093017578125, -8.458251953125, -8.0072021484375, -7.55615234375, -7.1051025390625, -6.654052734375, -6.2030029296875, -5.751953125, -5.3009033203125, -4.849853515625, -4.3988037109375, -3.94775390625, -3.4967041015625, -3.045654296875, -2.5946044921875, -2.1435546875, -1.6925048828125, -1.241455078125, -0.7904052734375, -0.33935546875, 0.1116943359375, 0.562744140625, 1.0137939453125, 1.46484375, 1.9158935546875, 2.366943359375, 2.8179931640625, 3.26904296875, 3.7200927734375, 4.171142578125, 4.6221923828125, 5.0732421875, 5.5242919921875, 5.975341796875, 6.4263916015625, 6.87744140625, 7.3284912109375, 7.779541015625, 8.2305908203125, 8.681640625, 9.1326904296875, 9.583740234375, 10.0347900390625, 10.48583984375, 10.9368896484375, 11.387939453125, 11.8389892578125, 12.2900390625, 12.7410888671875, 13.192138671875, 13.6431884765625, 14.09423828125, 14.5452880859375, 14.996337890625, 15.4473876953125, 15.8984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 9.0, 14.0, 14.0, 27.0, 35.0, 48.0, 82.0, 100.0, 148.0, 259.0, 490.0, 972.0, 2092.0, 5091.0, 14062.0, 55406.0, 561239.0, 2259020.0, 199382.0, 31181.0, 9190.0, 3564.0, 1594.0, 701.0, 366.0, 197.0, 150.0, 75.0, 57.0, 28.0, 25.0, 19.0, 15.0, 11.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0], "bins": [-17.25, -16.7877197265625, -16.325439453125, -15.8631591796875, -15.40087890625, -14.9385986328125, -14.476318359375, -14.0140380859375, -13.5517578125, -13.0894775390625, -12.627197265625, -12.1649169921875, -11.70263671875, -11.2403564453125, -10.778076171875, -10.3157958984375, -9.853515625, -9.3912353515625, -8.928955078125, -8.4666748046875, -8.00439453125, -7.5421142578125, -7.079833984375, -6.6175537109375, -6.1552734375, -5.6929931640625, -5.230712890625, -4.7684326171875, -4.30615234375, -3.8438720703125, -3.381591796875, -2.9193115234375, -2.45703125, -1.9947509765625, -1.532470703125, -1.0701904296875, -0.60791015625, -0.1456298828125, 0.316650390625, 0.7789306640625, 1.2412109375, 1.7034912109375, 2.165771484375, 2.6280517578125, 3.09033203125, 3.5526123046875, 4.014892578125, 4.4771728515625, 4.939453125, 5.4017333984375, 5.864013671875, 6.3262939453125, 6.78857421875, 7.2508544921875, 7.713134765625, 8.1754150390625, 8.6376953125, 9.0999755859375, 9.562255859375, 10.0245361328125, 10.48681640625, 10.9490966796875, 11.411376953125, 11.8736572265625, 12.3359375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 36.0, 354.0, 532.0, 89.0, 4.0, 1.0, 0.0, 1.0], "bins": [-315.1501159667969, -309.726806640625, -304.30352783203125, -298.8802185058594, -293.4569396972656, -288.03363037109375, -282.6103515625, -277.1870422363281, -271.76373291015625, -266.3404235839844, -260.9171447753906, -255.4938507080078, -250.070556640625, -244.64724731445312, -239.2239532470703, -233.8006591796875, -228.37738037109375, -222.95408630371094, -217.53079223632812, -212.1074981689453, -206.6842041015625, -201.26089477539062, -195.8376007080078, -190.414306640625, -184.9910125732422, -179.56771850585938, -174.14442443847656, -168.72113037109375, -163.29782104492188, -157.87452697753906, -152.45123291015625, -147.02793884277344, -141.60464477539062, -136.1813507080078, -130.758056640625, -125.33475494384766, -119.91146087646484, -114.48816680908203, -109.06486511230469, -103.64157104492188, -98.21826934814453, -92.79497528076172, -87.37167358398438, -81.94837951660156, -76.52508544921875, -71.10179138183594, -65.67849731445312, -60.25519561767578, -54.83190155029297, -49.408607482910156, -43.98530960083008, -38.56201171875, -33.13871765136719, -27.715421676635742, -22.292125701904297, -16.86882781982422, -11.445533752441406, -6.022237777709961, -0.5989418029785156, 4.82435417175293, 10.247650146484375, 15.67094612121582, 21.094242095947266, 26.517539978027344, 31.940834045410156]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 10.0, 9.0, 6.0, 10.0, 10.0, 24.0, 13.0, 21.0, 25.0, 25.0, 25.0, 31.0, 26.0, 39.0, 39.0, 35.0, 35.0, 32.0, 53.0, 43.0, 39.0, 44.0, 38.0, 42.0, 27.0, 23.0, 24.0, 35.0, 26.0, 22.0, 33.0, 20.0, 27.0, 13.0, 19.0, 11.0, 8.0, 10.0, 8.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.94978332519531, -36.749515533447266, -35.54924774169922, -34.34898376464844, -33.14871597290039, -31.948448181152344, -30.748180389404297, -29.54791259765625, -28.347646713256836, -27.14737892150879, -25.947113037109375, -24.746845245361328, -23.54657745361328, -22.346311569213867, -21.14604377746582, -19.945777893066406, -18.74551010131836, -17.545242309570312, -16.3449764251709, -15.144708633422852, -13.944441795349121, -12.74417495727539, -11.543907165527344, -10.343640327453613, -9.143373489379883, -7.943106651306152, -6.742839336395264, -5.542572021484375, -4.3423051834106445, -3.142038345336914, -1.9417710304260254, -0.7415037155151367, 0.45876312255859375, 1.6590301990509033, 2.859297275543213, 4.059564590454102, 5.259831428527832, 6.4600982666015625, 7.660365581512451, 8.86063289642334, 10.06089973449707, 11.2611665725708, 12.461433410644531, 13.661701202392578, 14.861968040466309, 16.06223487854004, 17.262502670288086, 18.4627685546875, 19.663036346435547, 20.863304138183594, 22.063570022583008, 23.263837814331055, 24.46410369873047, 25.664371490478516, 26.864639282226562, 28.06490707397461, 29.265172958374023, 30.46544075012207, 31.665706634521484, 32.86597442626953, 34.06624221801758, 35.266510009765625, 36.466773986816406, 37.66704177856445, 38.8673095703125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 18.0, 17.0, 18.0, 18.0, 17.0, 28.0, 26.0, 40.0, 30.0, 36.0, 40.0, 29.0, 46.0, 39.0, 53.0, 44.0, 58.0, 51.0, 41.0, 47.0, 36.0, 25.0, 27.0, 38.0, 23.0, 20.0, 20.0, 13.0, 7.0, 12.0, 14.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.953948974609375, -2.83563232421875, -2.717315673828125, -2.5989990234375, -2.480682373046875, -2.36236572265625, -2.244049072265625, -2.125732421875, -2.007415771484375, -1.88909912109375, -1.770782470703125, -1.6524658203125, -1.534149169921875, -1.41583251953125, -1.297515869140625, -1.17919921875, -1.060882568359375, -0.94256591796875, -0.824249267578125, -0.7059326171875, -0.587615966796875, -0.46929931640625, -0.350982666015625, -0.232666015625, -0.114349365234375, 0.00396728515625, 0.122283935546875, 0.2406005859375, 0.358917236328125, 0.47723388671875, 0.595550537109375, 0.7138671875, 0.832183837890625, 0.95050048828125, 1.068817138671875, 1.1871337890625, 1.305450439453125, 1.42376708984375, 1.542083740234375, 1.660400390625, 1.778717041015625, 1.89703369140625, 2.015350341796875, 2.1336669921875, 2.251983642578125, 2.37030029296875, 2.488616943359375, 2.60693359375, 2.725250244140625, 2.84356689453125, 2.961883544921875, 3.0802001953125, 3.198516845703125, 3.31683349609375, 3.435150146484375, 3.553466796875, 3.671783447265625, 3.79010009765625, 3.908416748046875, 4.0267333984375, 4.145050048828125, 4.26336669921875, 4.381683349609375, 4.5]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 15.0, 36.0, 35.0, 42.0, 66.0, 96.0, 126.0, 173.0, 315.0, 450.0, 733.0, 1245.0, 2124.0, 3730.0, 6850.0, 14197.0, 31472.0, 81506.0, 304826.0, 1584182.0, 1687004.0, 323774.0, 86250.0, 32602.0, 14885.0, 7360.0, 3939.0, 2402.0, 1377.0, 832.0, 555.0, 343.0, 227.0, 154.0, 96.0, 77.0, 51.0, 27.0, 29.0, 24.0, 11.0, 12.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.257080078125, -6.04150390625, -5.825927734375, -5.6103515625, -5.394775390625, -5.17919921875, -4.963623046875, -4.748046875, -4.532470703125, -4.31689453125, -4.101318359375, -3.8857421875, -3.670166015625, -3.45458984375, -3.239013671875, -3.0234375, -2.807861328125, -2.59228515625, -2.376708984375, -2.1611328125, -1.945556640625, -1.72998046875, -1.514404296875, -1.298828125, -1.083251953125, -0.86767578125, -0.652099609375, -0.4365234375, -0.220947265625, -0.00537109375, 0.210205078125, 0.42578125, 0.641357421875, 0.85693359375, 1.072509765625, 1.2880859375, 1.503662109375, 1.71923828125, 1.934814453125, 2.150390625, 2.365966796875, 2.58154296875, 2.797119140625, 3.0126953125, 3.228271484375, 3.44384765625, 3.659423828125, 3.875, 4.090576171875, 4.30615234375, 4.521728515625, 4.7373046875, 4.952880859375, 5.16845703125, 5.384033203125, 5.599609375, 5.815185546875, 6.03076171875, 6.246337890625, 6.4619140625, 6.677490234375, 6.89306640625, 7.108642578125, 7.32421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 7.0, 6.0, 4.0, 13.0, 11.0, 17.0, 20.0, 18.0, 35.0, 43.0, 69.0, 92.0, 114.0, 152.0, 249.0, 338.0, 442.0, 528.0, 477.0, 406.0, 269.0, 184.0, 138.0, 123.0, 92.0, 54.0, 45.0, 38.0, 14.0, 22.0, 11.0, 13.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.6875, -10.3883056640625, -10.089111328125, -9.7899169921875, -9.49072265625, -9.1915283203125, -8.892333984375, -8.5931396484375, -8.2939453125, -7.9947509765625, -7.695556640625, -7.3963623046875, -7.09716796875, -6.7979736328125, -6.498779296875, -6.1995849609375, -5.900390625, -5.6011962890625, -5.302001953125, -5.0028076171875, -4.70361328125, -4.4044189453125, -4.105224609375, -3.8060302734375, -3.5068359375, -3.2076416015625, -2.908447265625, -2.6092529296875, -2.31005859375, -2.0108642578125, -1.711669921875, -1.4124755859375, -1.11328125, -0.8140869140625, -0.514892578125, -0.2156982421875, 0.08349609375, 0.3826904296875, 0.681884765625, 0.9810791015625, 1.2802734375, 1.5794677734375, 1.878662109375, 2.1778564453125, 2.47705078125, 2.7762451171875, 3.075439453125, 3.3746337890625, 3.673828125, 3.9730224609375, 4.272216796875, 4.5714111328125, 4.87060546875, 5.1697998046875, 5.468994140625, 5.7681884765625, 6.0673828125, 6.3665771484375, 6.665771484375, 6.9649658203125, 7.26416015625, 7.5633544921875, 7.862548828125, 8.1617431640625, 8.4609375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 4.0, 6.0, 6.0, 23.0, 29.0, 56.0, 81.0, 111.0, 177.0, 289.0, 488.0, 897.0, 1728.0, 3427.0, 7562.0, 19205.0, 55849.0, 219232.0, 1553858.0, 1960667.0, 268138.0, 64630.0, 21453.0, 8430.0, 3674.0, 1851.0, 986.0, 536.0, 322.0, 197.0, 148.0, 77.0, 48.0, 39.0, 20.0, 18.0, 7.0, 6.0, 2.0, 4.0, 2.0], "bins": [-20.609375, -20.119384765625, -19.62939453125, -19.139404296875, -18.6494140625, -18.159423828125, -17.66943359375, -17.179443359375, -16.689453125, -16.199462890625, -15.70947265625, -15.219482421875, -14.7294921875, -14.239501953125, -13.74951171875, -13.259521484375, -12.76953125, -12.279541015625, -11.78955078125, -11.299560546875, -10.8095703125, -10.319580078125, -9.82958984375, -9.339599609375, -8.849609375, -8.359619140625, -7.86962890625, -7.379638671875, -6.8896484375, -6.399658203125, -5.90966796875, -5.419677734375, -4.9296875, -4.439697265625, -3.94970703125, -3.459716796875, -2.9697265625, -2.479736328125, -1.98974609375, -1.499755859375, -1.009765625, -0.519775390625, -0.02978515625, 0.460205078125, 0.9501953125, 1.440185546875, 1.93017578125, 2.420166015625, 2.91015625, 3.400146484375, 3.89013671875, 4.380126953125, 4.8701171875, 5.360107421875, 5.85009765625, 6.340087890625, 6.830078125, 7.320068359375, 7.81005859375, 8.300048828125, 8.7900390625, 9.280029296875, 9.77001953125, 10.260009765625, 10.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 22.0, 37.0, 106.0, 209.0, 252.0, 217.0, 104.0, 45.0, 10.0, 7.0, 0.0, 1.0], "bins": [-236.332763671875, -232.1504364013672, -227.96812438964844, -223.78579711914062, -219.60348510742188, -215.42115783691406, -211.2388458251953, -207.0565185546875, -202.87420654296875, -198.69187927246094, -194.5095672607422, -190.32723999023438, -186.14492797851562, -181.9626007080078, -177.78028869628906, -173.59796142578125, -169.41563415527344, -165.23330688476562, -161.05099487304688, -156.86866760253906, -152.6863555908203, -148.5040283203125, -144.32171630859375, -140.13938903808594, -135.95706176757812, -131.7747344970703, -127.59242248535156, -123.41010284423828, -119.227783203125, -115.04545593261719, -110.8631362915039, -106.68081665039062, -102.49850463867188, -98.3161849975586, -94.13386535644531, -89.95154571533203, -85.76922607421875, -81.58689880371094, -77.40457916259766, -73.22225952148438, -69.0399398803711, -64.85762023925781, -60.67530059814453, -56.492977142333984, -52.3106575012207, -48.12833786010742, -43.946014404296875, -39.763694763183594, -35.58137512207031, -31.39905548095703, -27.216733932495117, -23.034412384033203, -18.852092742919922, -14.66977310180664, -10.487451553344727, -6.3051300048828125, -2.122812271118164, 2.0595083236694336, 6.241828918457031, 10.424149513244629, 14.606470108032227, 18.788789749145508, 22.971111297607422, 27.153432846069336, 31.335752487182617]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 9.0, 10.0, 16.0, 13.0, 17.0, 15.0, 18.0, 25.0, 28.0, 27.0, 41.0, 30.0, 35.0, 44.0, 41.0, 43.0, 46.0, 42.0, 44.0, 43.0, 47.0, 42.0, 36.0, 35.0, 31.0, 27.0, 29.0, 21.0, 22.0, 24.0, 17.0, 17.0, 6.0, 7.0, 11.0, 5.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-35.92610168457031, -34.8918571472168, -33.85761260986328, -32.82337188720703, -31.789127349853516, -30.7548828125, -29.720638275146484, -28.6863956451416, -27.65215301513672, -26.617908477783203, -25.58366584777832, -24.549421310424805, -23.515178680419922, -22.480934143066406, -21.44668960571289, -20.412446975708008, -19.378202438354492, -18.343957901000977, -17.309715270996094, -16.275470733642578, -15.241228103637695, -14.20698356628418, -13.17273998260498, -12.138496398925781, -11.104252815246582, -10.070009231567383, -9.035765647888184, -8.001522064208984, -6.967278003692627, -5.933034420013428, -4.89879035949707, -3.864546775817871, -2.830301284790039, -1.7960575819015503, -0.7618138790130615, 0.2724299430847168, 1.306673526763916, 2.3409171104431152, 3.3751611709594727, 4.409404754638672, 5.443648338317871, 6.47789192199707, 7.5121355056762695, 8.546379089355469, 9.580623626708984, 10.614866256713867, 11.649110794067383, 12.683354377746582, 13.717597961425781, 14.75184154510498, 15.78608512878418, 16.820329666137695, 17.854572296142578, 18.888816833496094, 19.92306137084961, 20.957304000854492, 21.991546630859375, 23.02579116821289, 24.060033798217773, 25.09427833557129, 26.128520965576172, 27.162765502929688, 28.197010040283203, 29.231252670288086, 30.2654972076416]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 6.0, 10.0, 4.0, 10.0, 11.0, 8.0, 16.0, 16.0, 15.0, 15.0, 29.0, 27.0, 34.0, 27.0, 44.0, 29.0, 39.0, 40.0, 46.0, 45.0, 53.0, 64.0, 45.0, 35.0, 37.0, 22.0, 35.0, 36.0, 29.0, 30.0, 22.0, 30.0, 13.0, 14.0, 14.0, 14.0, 6.0, 7.0, 11.0, 5.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.19921875, -3.078125, -2.95703125, -2.8359375, -2.71484375, -2.59375, -2.47265625, -2.3515625, -2.23046875, -2.109375, -1.98828125, -1.8671875, -1.74609375, -1.625, -1.50390625, -1.3828125, -1.26171875, -1.140625, -1.01953125, -0.8984375, -0.77734375, -0.65625, -0.53515625, -0.4140625, -0.29296875, -0.171875, -0.05078125, 0.0703125, 0.19140625, 0.3125, 0.43359375, 0.5546875, 0.67578125, 0.796875, 0.91796875, 1.0390625, 1.16015625, 1.28125, 1.40234375, 1.5234375, 1.64453125, 1.765625, 1.88671875, 2.0078125, 2.12890625, 2.25, 2.37109375, 2.4921875, 2.61328125, 2.734375, 2.85546875, 2.9765625, 3.09765625, 3.21875, 3.33984375, 3.4609375, 3.58203125, 3.703125, 3.82421875, 3.9453125, 4.06640625, 4.1875, 4.30859375, 4.4296875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 12.0, 12.0, 24.0, 38.0, 50.0, 91.0, 118.0, 248.0, 388.0, 707.0, 1205.0, 2232.0, 4153.0, 7529.0, 14172.0, 26121.0, 47167.0, 78693.0, 121997.0, 161898.0, 176141.0, 148874.0, 106374.0, 66025.0, 38257.0, 21096.0, 11452.0, 6130.0, 3254.0, 1761.0, 998.0, 529.0, 326.0, 198.0, 98.0, 71.0, 35.0, 20.0, 19.0, 15.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.329315185546875, -3.20745849609375, -3.085601806640625, -2.9637451171875, -2.841888427734375, -2.72003173828125, -2.598175048828125, -2.476318359375, -2.354461669921875, -2.23260498046875, -2.110748291015625, -1.9888916015625, -1.867034912109375, -1.74517822265625, -1.623321533203125, -1.50146484375, -1.379608154296875, -1.25775146484375, -1.135894775390625, -1.0140380859375, -0.892181396484375, -0.77032470703125, -0.648468017578125, -0.526611328125, -0.404754638671875, -0.28289794921875, -0.161041259765625, -0.0391845703125, 0.082672119140625, 0.20452880859375, 0.326385498046875, 0.4482421875, 0.570098876953125, 0.69195556640625, 0.813812255859375, 0.9356689453125, 1.057525634765625, 1.17938232421875, 1.301239013671875, 1.423095703125, 1.544952392578125, 1.66680908203125, 1.788665771484375, 1.9105224609375, 2.032379150390625, 2.15423583984375, 2.276092529296875, 2.39794921875, 2.519805908203125, 2.64166259765625, 2.763519287109375, 2.8853759765625, 3.007232666015625, 3.12908935546875, 3.250946044921875, 3.372802734375, 3.494659423828125, 3.61651611328125, 3.738372802734375, 3.8602294921875, 3.982086181640625, 4.10394287109375, 4.225799560546875, 4.34765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 1.0, 6.0, 7.0, 10.0, 9.0, 11.0, 19.0, 18.0, 23.0, 24.0, 32.0, 28.0, 34.0, 35.0, 35.0, 29.0, 40.0, 47.0, 46.0, 1066.0, 39.0, 40.0, 42.0, 36.0, 46.0, 30.0, 29.0, 19.0, 39.0, 26.0, 25.0, 16.0, 18.0, 19.0, 16.0, 6.0, 13.0, 7.0, 7.0, 1.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0], "bins": [-4.5234375, -4.403564453125, -4.28369140625, -4.163818359375, -4.0439453125, -3.924072265625, -3.80419921875, -3.684326171875, -3.564453125, -3.444580078125, -3.32470703125, -3.204833984375, -3.0849609375, -2.965087890625, -2.84521484375, -2.725341796875, -2.60546875, -2.485595703125, -2.36572265625, -2.245849609375, -2.1259765625, -2.006103515625, -1.88623046875, -1.766357421875, -1.646484375, -1.526611328125, -1.40673828125, -1.286865234375, -1.1669921875, -1.047119140625, -0.92724609375, -0.807373046875, -0.6875, -0.567626953125, -0.44775390625, -0.327880859375, -0.2080078125, -0.088134765625, 0.03173828125, 0.151611328125, 0.271484375, 0.391357421875, 0.51123046875, 0.631103515625, 0.7509765625, 0.870849609375, 0.99072265625, 1.110595703125, 1.23046875, 1.350341796875, 1.47021484375, 1.590087890625, 1.7099609375, 1.829833984375, 1.94970703125, 2.069580078125, 2.189453125, 2.309326171875, 2.42919921875, 2.549072265625, 2.6689453125, 2.788818359375, 2.90869140625, 3.028564453125, 3.1484375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 0.0, 10.0, 8.0, 18.0, 11.0, 12.0, 21.0, 19.0, 39.0, 32.0, 43.0, 87.0, 102.0, 114.0, 189.0, 259.0, 374.0, 478.0, 819.0, 1233.0, 1875.0, 3198.0, 5537.0, 9798.0, 18529.0, 39040.0, 129634.0, 1711962.0, 99481.0, 35202.0, 16871.0, 8935.0, 4971.0, 2872.0, 1772.0, 1042.0, 719.0, 496.0, 388.0, 236.0, 176.0, 142.0, 95.0, 72.0, 65.0, 39.0, 31.0, 28.0, 12.0, 14.0, 11.0, 8.0, 6.0, 5.0, 2.0, 2.0], "bins": [-8.8203125, -8.57135009765625, -8.3223876953125, -8.07342529296875, -7.824462890625, -7.57550048828125, -7.3265380859375, -7.07757568359375, -6.82861328125, -6.57965087890625, -6.3306884765625, -6.08172607421875, -5.832763671875, -5.58380126953125, -5.3348388671875, -5.08587646484375, -4.8369140625, -4.58795166015625, -4.3389892578125, -4.09002685546875, -3.841064453125, -3.59210205078125, -3.3431396484375, -3.09417724609375, -2.84521484375, -2.59625244140625, -2.3472900390625, -2.09832763671875, -1.849365234375, -1.60040283203125, -1.3514404296875, -1.10247802734375, -0.853515625, -0.60455322265625, -0.3555908203125, -0.10662841796875, 0.142333984375, 0.39129638671875, 0.6402587890625, 0.88922119140625, 1.13818359375, 1.38714599609375, 1.6361083984375, 1.88507080078125, 2.134033203125, 2.38299560546875, 2.6319580078125, 2.88092041015625, 3.1298828125, 3.37884521484375, 3.6278076171875, 3.87677001953125, 4.125732421875, 4.37469482421875, 4.6236572265625, 4.87261962890625, 5.12158203125, 5.37054443359375, 5.6195068359375, 5.86846923828125, 6.117431640625, 6.36639404296875, 6.6153564453125, 6.86431884765625, 7.11328125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 5.0, 4.0, 10.0, 9.0, 4.0, 15.0, 16.0, 11.0, 17.0, 15.0, 24.0, 26.0, 38.0, 51.0, 54.0, 58.0, 64.0, 81.0, 62.0, 79.0, 65.0, 41.0, 42.0, 33.0, 19.0, 14.0, 23.0, 16.0, 14.0, 13.0, 7.0, 9.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9140625, -0.8852615356445312, -0.8564605712890625, -0.8276596069335938, -0.798858642578125, -0.7700576782226562, -0.7412567138671875, -0.7124557495117188, -0.68365478515625, -0.6548538208007812, -0.6260528564453125, -0.5972518920898438, -0.568450927734375, -0.5396499633789062, -0.5108489990234375, -0.48204803466796875, -0.4532470703125, -0.42444610595703125, -0.3956451416015625, -0.36684417724609375, -0.338043212890625, -0.30924224853515625, -0.2804412841796875, -0.25164031982421875, -0.22283935546875, -0.19403839111328125, -0.1652374267578125, -0.13643646240234375, -0.107635498046875, -0.07883453369140625, -0.0500335693359375, -0.02123260498046875, 0.007568359375, 0.03636932373046875, 0.0651702880859375, 0.09397125244140625, 0.122772216796875, 0.15157318115234375, 0.1803741455078125, 0.20917510986328125, 0.23797607421875, 0.26677703857421875, 0.2955780029296875, 0.32437896728515625, 0.353179931640625, 0.38198089599609375, 0.4107818603515625, 0.43958282470703125, 0.4683837890625, 0.49718475341796875, 0.5259857177734375, 0.5547866821289062, 0.583587646484375, 0.6123886108398438, 0.6411895751953125, 0.6699905395507812, 0.69879150390625, 0.7275924682617188, 0.7563934326171875, 0.7851943969726562, 0.813995361328125, 0.8427963256835938, 0.8715972900390625, 0.9003982543945312, 0.92919921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 2.0, 6.0, 7.0, 8.0, 20.0, 15.0, 18.0, 25.0, 36.0, 37.0, 52.0, 58.0, 90.0, 102.0, 137.0, 267.0, 526.0, 1913.0, 9421.0, 71430.0, 834793.0, 112710.0, 12867.0, 2393.0, 679.0, 267.0, 151.0, 116.0, 66.0, 65.0, 52.0, 41.0, 42.0, 22.0, 19.0, 21.0, 8.0, 11.0, 9.0, 15.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-12.1875, -11.8134765625, -11.439453125, -11.0654296875, -10.69140625, -10.3173828125, -9.943359375, -9.5693359375, -9.1953125, -8.8212890625, -8.447265625, -8.0732421875, -7.69921875, -7.3251953125, -6.951171875, -6.5771484375, -6.203125, -5.8291015625, -5.455078125, -5.0810546875, -4.70703125, -4.3330078125, -3.958984375, -3.5849609375, -3.2109375, -2.8369140625, -2.462890625, -2.0888671875, -1.71484375, -1.3408203125, -0.966796875, -0.5927734375, -0.21875, 0.1552734375, 0.529296875, 0.9033203125, 1.27734375, 1.6513671875, 2.025390625, 2.3994140625, 2.7734375, 3.1474609375, 3.521484375, 3.8955078125, 4.26953125, 4.6435546875, 5.017578125, 5.3916015625, 5.765625, 6.1396484375, 6.513671875, 6.8876953125, 7.26171875, 7.6357421875, 8.009765625, 8.3837890625, 8.7578125, 9.1318359375, 9.505859375, 9.8798828125, 10.25390625, 10.6279296875, 11.001953125, 11.3759765625, 11.75]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 19.0, 28.0, 71.0, 151.0, 311.0, 240.0, 95.0, 34.0, 23.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.079212188720703, -10.631657600402832, -10.184102058410645, -9.736547470092773, -9.288992881774902, -8.841438293457031, -8.393882751464844, -7.946328163146973, -7.498773097991943, -7.051218032836914, -6.603663444519043, -6.156108379364014, -5.708553314208984, -5.260998725891113, -4.813443660736084, -4.365888595581055, -3.9183340072631836, -3.4707791805267334, -3.023224353790283, -2.575669288635254, -2.1281144618988037, -1.6805596351623535, -1.2330045700073242, -0.785449743270874, -0.33789491653442383, 0.10965996980667114, 0.5572148561477661, 1.0047698020935059, 1.452324628829956, 1.8998794555664062, 2.3474345207214355, 2.7949893474578857, 3.242544174194336, 3.690099000930786, 4.137653827667236, 4.585208892822266, 5.032763481140137, 5.480318546295166, 5.927873611450195, 6.375428199768066, 6.822983264923096, 7.270538330078125, 7.718092918395996, 8.165647506713867, 8.613203048706055, 9.060757637023926, 9.508312225341797, 9.955867767333984, 10.403422355651855, 10.850976943969727, 11.298532485961914, 11.746087074279785, 12.193641662597656, 12.641197204589844, 13.088751792907715, 13.536306381225586, 13.983861923217773, 14.431416511535645, 14.878972053527832, 15.326526641845703, 15.774081230163574, 16.221635818481445, 16.669191360473633, 17.11674690246582, 17.564300537109375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 11.0, 12.0, 23.0, 22.0, 17.0, 24.0, 20.0, 19.0, 30.0, 22.0, 34.0, 34.0, 43.0, 32.0, 41.0, 32.0, 56.0, 42.0, 49.0, 36.0, 36.0, 50.0, 35.0, 29.0, 33.0, 32.0, 30.0, 20.0, 20.0, 23.0, 20.0, 16.0, 14.0, 7.0, 8.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.07973313331604, -2.9771764278411865, -2.874619722366333, -2.7720632553100586, -2.669506549835205, -2.5669498443603516, -2.464393138885498, -2.3618364334106445, -2.259279727935791, -2.1567230224609375, -2.054166316986084, -1.95160973072052, -1.8490530252456665, -1.7464964389801025, -1.643939733505249, -1.5413830280303955, -1.4388264417648315, -1.336269736289978, -1.233713150024414, -1.1311564445495605, -1.028599739074707, -0.9260430932044983, -0.8234864473342896, -0.720929741859436, -0.6183730959892273, -0.5158164501190186, -0.41325974464416504, -0.3107030987739563, -0.20814642310142517, -0.10558974742889404, -0.0030331015586853027, 0.09952360391616821, 0.20208024978637695, 0.3046369254589081, 0.4071936011314392, 0.509750247001648, 0.6123069524765015, 0.7148635983467102, 0.817420244216919, 0.9199769496917725, 1.022533655166626, 1.1250903606414795, 1.2276469469070435, 1.330203652381897, 1.4327603578567505, 1.5353169441223145, 1.637873649597168, 1.7404303550720215, 1.8429869413375854, 1.945543646812439, 2.048100233078003, 2.1506569385528564, 2.25321364402771, 2.3557703495025635, 2.458326816558838, 2.5608835220336914, 2.663440227508545, 2.7659969329833984, 2.868553638458252, 2.9711103439331055, 3.07366681098938, 3.1762235164642334, 3.278780221939087, 3.3813369274139404, 3.483893632888794]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 5.0, 7.0, 10.0, 9.0, 9.0, 8.0, 13.0, 16.0, 20.0, 14.0, 26.0, 29.0, 36.0, 19.0, 40.0, 38.0, 38.0, 43.0, 38.0, 48.0, 56.0, 46.0, 57.0, 40.0, 30.0, 37.0, 21.0, 38.0, 33.0, 23.0, 25.0, 31.0, 19.0, 12.0, 16.0, 10.0, 9.0, 8.0, 9.0, 8.0, 1.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.541015625, -3.417205810546875, -3.29339599609375, -3.169586181640625, -3.0457763671875, -2.921966552734375, -2.79815673828125, -2.674346923828125, -2.550537109375, -2.426727294921875, -2.30291748046875, -2.179107666015625, -2.0552978515625, -1.931488037109375, -1.80767822265625, -1.683868408203125, -1.56005859375, -1.436248779296875, -1.31243896484375, -1.188629150390625, -1.0648193359375, -0.941009521484375, -0.81719970703125, -0.693389892578125, -0.569580078125, -0.445770263671875, -0.32196044921875, -0.198150634765625, -0.0743408203125, 0.049468994140625, 0.17327880859375, 0.297088623046875, 0.4208984375, 0.544708251953125, 0.66851806640625, 0.792327880859375, 0.9161376953125, 1.039947509765625, 1.16375732421875, 1.287567138671875, 1.411376953125, 1.535186767578125, 1.65899658203125, 1.782806396484375, 1.9066162109375, 2.030426025390625, 2.15423583984375, 2.278045654296875, 2.40185546875, 2.525665283203125, 2.64947509765625, 2.773284912109375, 2.8970947265625, 3.020904541015625, 3.14471435546875, 3.268524169921875, 3.392333984375, 3.516143798828125, 3.63995361328125, 3.763763427734375, 3.8875732421875, 4.011383056640625, 4.13519287109375, 4.259002685546875, 4.3828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 9.0, 10.0, 10.0, 18.0, 25.0, 29.0, 47.0, 93.0, 105.0, 180.0, 292.0, 423.0, 631.0, 925.0, 1389.0, 2413.0, 4677.0, 12578.0, 50146.0, 265120.0, 521013.0, 142226.0, 28630.0, 8407.0, 3622.0, 1969.0, 1222.0, 807.0, 512.0, 331.0, 219.0, 154.0, 87.0, 64.0, 55.0, 26.0, 30.0, 17.0, 13.0, 14.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.87109375, -6.676513671875, -6.48193359375, -6.287353515625, -6.0927734375, -5.898193359375, -5.70361328125, -5.509033203125, -5.314453125, -5.119873046875, -4.92529296875, -4.730712890625, -4.5361328125, -4.341552734375, -4.14697265625, -3.952392578125, -3.7578125, -3.563232421875, -3.36865234375, -3.174072265625, -2.9794921875, -2.784912109375, -2.59033203125, -2.395751953125, -2.201171875, -2.006591796875, -1.81201171875, -1.617431640625, -1.4228515625, -1.228271484375, -1.03369140625, -0.839111328125, -0.64453125, -0.449951171875, -0.25537109375, -0.060791015625, 0.1337890625, 0.328369140625, 0.52294921875, 0.717529296875, 0.912109375, 1.106689453125, 1.30126953125, 1.495849609375, 1.6904296875, 1.885009765625, 2.07958984375, 2.274169921875, 2.46875, 2.663330078125, 2.85791015625, 3.052490234375, 3.2470703125, 3.441650390625, 3.63623046875, 3.830810546875, 4.025390625, 4.219970703125, 4.41455078125, 4.609130859375, 4.8037109375, 4.998291015625, 5.19287109375, 5.387451171875, 5.58203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 1.0, 2.0, 7.0, 9.0, 9.0, 16.0, 18.0, 11.0, 23.0, 21.0, 15.0, 22.0, 24.0, 34.0, 31.0, 34.0, 37.0, 47.0, 69.0, 92.0, 222.0, 1332.0, 271.0, 155.0, 91.0, 52.0, 48.0, 43.0, 35.0, 34.0, 31.0, 22.0, 25.0, 20.0, 17.0, 27.0, 16.0, 9.0, 9.0, 13.0, 9.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.859375, -10.494873046875, -10.13037109375, -9.765869140625, -9.4013671875, -9.036865234375, -8.67236328125, -8.307861328125, -7.943359375, -7.578857421875, -7.21435546875, -6.849853515625, -6.4853515625, -6.120849609375, -5.75634765625, -5.391845703125, -5.02734375, -4.662841796875, -4.29833984375, -3.933837890625, -3.5693359375, -3.204833984375, -2.84033203125, -2.475830078125, -2.111328125, -1.746826171875, -1.38232421875, -1.017822265625, -0.6533203125, -0.288818359375, 0.07568359375, 0.440185546875, 0.8046875, 1.169189453125, 1.53369140625, 1.898193359375, 2.2626953125, 2.627197265625, 2.99169921875, 3.356201171875, 3.720703125, 4.085205078125, 4.44970703125, 4.814208984375, 5.1787109375, 5.543212890625, 5.90771484375, 6.272216796875, 6.63671875, 7.001220703125, 7.36572265625, 7.730224609375, 8.0947265625, 8.459228515625, 8.82373046875, 9.188232421875, 9.552734375, 9.917236328125, 10.28173828125, 10.646240234375, 11.0107421875, 11.375244140625, 11.73974609375, 12.104248046875, 12.46875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 4.0, 10.0, 14.0, 13.0, 12.0, 17.0, 26.0, 39.0, 35.0, 51.0, 58.0, 106.0, 165.0, 255.0, 485.0, 926.0, 2159.0, 6331.0, 22363.0, 126748.0, 2263315.0, 654173.0, 49513.0, 11900.0, 3817.0, 1526.0, 644.0, 346.0, 175.0, 120.0, 99.0, 53.0, 42.0, 36.0, 34.0, 18.0, 15.0, 13.0, 5.0, 8.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-16.140625, -15.66259765625, -15.1845703125, -14.70654296875, -14.228515625, -13.75048828125, -13.2724609375, -12.79443359375, -12.31640625, -11.83837890625, -11.3603515625, -10.88232421875, -10.404296875, -9.92626953125, -9.4482421875, -8.97021484375, -8.4921875, -8.01416015625, -7.5361328125, -7.05810546875, -6.580078125, -6.10205078125, -5.6240234375, -5.14599609375, -4.66796875, -4.18994140625, -3.7119140625, -3.23388671875, -2.755859375, -2.27783203125, -1.7998046875, -1.32177734375, -0.84375, -0.36572265625, 0.1123046875, 0.59033203125, 1.068359375, 1.54638671875, 2.0244140625, 2.50244140625, 2.98046875, 3.45849609375, 3.9365234375, 4.41455078125, 4.892578125, 5.37060546875, 5.8486328125, 6.32666015625, 6.8046875, 7.28271484375, 7.7607421875, 8.23876953125, 8.716796875, 9.19482421875, 9.6728515625, 10.15087890625, 10.62890625, 11.10693359375, 11.5849609375, 12.06298828125, 12.541015625, 13.01904296875, 13.4970703125, 13.97509765625, 14.453125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [8.0, 21.0, 127.0, 323.0, 364.0, 138.0, 33.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.937607765197754, -8.976861000061035, -6.016114711761475, -3.055368423461914, -0.09462165832519531, 2.8661251068115234, 5.826870918273926, 8.787617683410645, 11.748364448547363, 14.709111213684082, 17.669857025146484, 20.630603790283203, 23.591350555419922, 26.55209732055664, 29.51284408569336, 32.47359085083008, 35.4343376159668, 38.395084381103516, 41.355831146240234, 44.31657791137695, 47.27732467651367, 50.23807144165039, 53.198814392089844, 56.15956115722656, 59.12030792236328, 62.0810546875, 65.04180145263672, 68.00254821777344, 70.96329498291016, 73.92404174804688, 76.8847885131836, 79.84553527832031, 82.80628204345703, 85.76702880859375, 88.72777557373047, 91.68852233886719, 94.6492691040039, 97.61001586914062, 100.57076263427734, 103.53150939941406, 106.49225616455078, 109.4530029296875, 112.41374969482422, 115.37449645996094, 118.33524322509766, 121.29598999023438, 124.2567367553711, 127.21748352050781, 130.17822265625, 133.1389617919922, 136.09971618652344, 139.06045532226562, 142.02120971679688, 144.98194885253906, 147.9427032470703, 150.9034423828125, 153.86419677734375, 156.82493591308594, 159.7856903076172, 162.74642944335938, 165.70718383789062, 168.6679229736328, 171.62867736816406, 174.58941650390625, 177.5501708984375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 5.0, 8.0, 6.0, 13.0, 13.0, 14.0, 16.0, 10.0, 24.0, 27.0, 24.0, 21.0, 29.0, 34.0, 38.0, 35.0, 35.0, 34.0, 43.0, 23.0, 36.0, 33.0, 43.0, 32.0, 38.0, 46.0, 50.0, 32.0, 30.0, 30.0, 23.0, 18.0, 15.0, 21.0, 12.0, 8.0, 20.0, 9.0, 7.0, 9.0, 5.0, 6.0, 7.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.215946197509766, -36.07471466064453, -34.93347930908203, -33.7922477722168, -32.65101623535156, -31.509780883789062, -30.368549346923828, -29.22731590270996, -28.086082458496094, -26.944849014282227, -25.80361557006836, -24.662384033203125, -23.521150588989258, -22.37991714477539, -21.238685607910156, -20.09745216369629, -18.956218719482422, -17.814985275268555, -16.673751831054688, -15.532520294189453, -14.391286849975586, -13.250053405761719, -12.108820915222168, -10.967588424682617, -9.82635498046875, -8.685121536254883, -7.543889045715332, -6.402656078338623, -5.261423110961914, -4.120190143585205, -2.978957176208496, -1.837724208831787, -0.6964950561523438, 0.44473791122436523, 1.5859708786010742, 2.727203845977783, 3.868436813354492, 5.009669780731201, 6.15090274810791, 7.292135715484619, 8.433368682861328, 9.574602127075195, 10.715834617614746, 11.857067108154297, 12.998300552368164, 14.139533996582031, 15.280766487121582, 16.421998977661133, 17.563232421875, 18.704465866088867, 19.845699310302734, 20.98693084716797, 22.128164291381836, 23.269397735595703, 24.410629272460938, 25.551862716674805, 26.693096160888672, 27.83432960510254, 28.975563049316406, 30.11679458618164, 31.258028030395508, 32.399261474609375, 33.54049301147461, 34.68172836303711, 35.822959899902344]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 7.0, 11.0, 9.0, 13.0, 14.0, 19.0, 13.0, 18.0, 20.0, 21.0, 36.0, 35.0, 34.0, 23.0, 39.0, 58.0, 34.0, 48.0, 43.0, 44.0, 51.0, 43.0, 40.0, 39.0, 24.0, 26.0, 28.0, 27.0, 30.0, 20.0, 22.0, 17.0, 22.0, 11.0, 7.0, 7.0, 7.0, 10.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.533203125, -3.410614013671875, -3.28802490234375, -3.165435791015625, -3.0428466796875, -2.920257568359375, -2.79766845703125, -2.675079345703125, -2.552490234375, -2.429901123046875, -2.30731201171875, -2.184722900390625, -2.0621337890625, -1.939544677734375, -1.81695556640625, -1.694366455078125, -1.57177734375, -1.449188232421875, -1.32659912109375, -1.204010009765625, -1.0814208984375, -0.958831787109375, -0.83624267578125, -0.713653564453125, -0.591064453125, -0.468475341796875, -0.34588623046875, -0.223297119140625, -0.1007080078125, 0.021881103515625, 0.14447021484375, 0.267059326171875, 0.3896484375, 0.512237548828125, 0.63482666015625, 0.757415771484375, 0.8800048828125, 1.002593994140625, 1.12518310546875, 1.247772216796875, 1.370361328125, 1.492950439453125, 1.61553955078125, 1.738128662109375, 1.8607177734375, 1.983306884765625, 2.10589599609375, 2.228485107421875, 2.35107421875, 2.473663330078125, 2.59625244140625, 2.718841552734375, 2.8414306640625, 2.964019775390625, 3.08660888671875, 3.209197998046875, 3.331787109375, 3.454376220703125, 3.57696533203125, 3.699554443359375, 3.8221435546875, 3.944732666015625, 4.06732177734375, 4.189910888671875, 4.3125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 14.0, 18.0, 35.0, 45.0, 52.0, 68.0, 88.0, 146.0, 219.0, 293.0, 400.0, 620.0, 978.0, 1495.0, 2587.0, 4424.0, 8641.0, 17619.0, 43636.0, 138338.0, 723617.0, 2300075.0, 729054.0, 138791.0, 43745.0, 18205.0, 8735.0, 4655.0, 2690.0, 1621.0, 1088.0, 721.0, 485.0, 326.0, 229.0, 151.0, 96.0, 89.0, 43.0, 40.0, 22.0, 16.0, 14.0, 11.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-7.9296875, -7.677978515625, -7.42626953125, -7.174560546875, -6.9228515625, -6.671142578125, -6.41943359375, -6.167724609375, -5.916015625, -5.664306640625, -5.41259765625, -5.160888671875, -4.9091796875, -4.657470703125, -4.40576171875, -4.154052734375, -3.90234375, -3.650634765625, -3.39892578125, -3.147216796875, -2.8955078125, -2.643798828125, -2.39208984375, -2.140380859375, -1.888671875, -1.636962890625, -1.38525390625, -1.133544921875, -0.8818359375, -0.630126953125, -0.37841796875, -0.126708984375, 0.125, 0.376708984375, 0.62841796875, 0.880126953125, 1.1318359375, 1.383544921875, 1.63525390625, 1.886962890625, 2.138671875, 2.390380859375, 2.64208984375, 2.893798828125, 3.1455078125, 3.397216796875, 3.64892578125, 3.900634765625, 4.15234375, 4.404052734375, 4.65576171875, 4.907470703125, 5.1591796875, 5.410888671875, 5.66259765625, 5.914306640625, 6.166015625, 6.417724609375, 6.66943359375, 6.921142578125, 7.1728515625, 7.424560546875, 7.67626953125, 7.927978515625, 8.1796875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 1.0, 10.0, 9.0, 9.0, 16.0, 11.0, 25.0, 32.0, 40.0, 67.0, 123.0, 182.0, 254.0, 403.0, 572.0, 642.0, 526.0, 374.0, 253.0, 145.0, 116.0, 81.0, 57.0, 37.0, 15.0, 13.0, 10.0, 7.0, 11.0, 5.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.0703125, -8.6832275390625, -8.296142578125, -7.9090576171875, -7.52197265625, -7.1348876953125, -6.747802734375, -6.3607177734375, -5.9736328125, -5.5865478515625, -5.199462890625, -4.8123779296875, -4.42529296875, -4.0382080078125, -3.651123046875, -3.2640380859375, -2.876953125, -2.4898681640625, -2.102783203125, -1.7156982421875, -1.32861328125, -0.9415283203125, -0.554443359375, -0.1673583984375, 0.2197265625, 0.6068115234375, 0.993896484375, 1.3809814453125, 1.76806640625, 2.1551513671875, 2.542236328125, 2.9293212890625, 3.31640625, 3.7034912109375, 4.090576171875, 4.4776611328125, 4.86474609375, 5.2518310546875, 5.638916015625, 6.0260009765625, 6.4130859375, 6.8001708984375, 7.187255859375, 7.5743408203125, 7.96142578125, 8.3485107421875, 8.735595703125, 9.1226806640625, 9.509765625, 9.8968505859375, 10.283935546875, 10.6710205078125, 11.05810546875, 11.4451904296875, 11.832275390625, 12.2193603515625, 12.6064453125, 12.9935302734375, 13.380615234375, 13.7677001953125, 14.15478515625, 14.5418701171875, 14.928955078125, 15.3160400390625, 15.703125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 13.0, 8.0, 16.0, 17.0, 29.0, 26.0, 51.0, 53.0, 85.0, 129.0, 168.0, 225.0, 423.0, 621.0, 1109.0, 1999.0, 4141.0, 9317.0, 26683.0, 102804.0, 709389.0, 2802727.0, 425095.0, 73265.0, 20485.0, 7517.0, 3416.0, 1706.0, 962.0, 569.0, 394.0, 253.0, 162.0, 132.0, 78.0, 57.0, 45.0, 31.0, 26.0, 19.0, 12.0, 5.0, 5.0, 7.0, 3.0, 1.0, 3.0], "bins": [-22.46875, -21.8834228515625, -21.298095703125, -20.7127685546875, -20.12744140625, -19.5421142578125, -18.956787109375, -18.3714599609375, -17.7861328125, -17.2008056640625, -16.615478515625, -16.0301513671875, -15.44482421875, -14.8594970703125, -14.274169921875, -13.6888427734375, -13.103515625, -12.5181884765625, -11.932861328125, -11.3475341796875, -10.76220703125, -10.1768798828125, -9.591552734375, -9.0062255859375, -8.4208984375, -7.8355712890625, -7.250244140625, -6.6649169921875, -6.07958984375, -5.4942626953125, -4.908935546875, -4.3236083984375, -3.73828125, -3.1529541015625, -2.567626953125, -1.9822998046875, -1.39697265625, -0.8116455078125, -0.226318359375, 0.3590087890625, 0.9443359375, 1.5296630859375, 2.114990234375, 2.7003173828125, 3.28564453125, 3.8709716796875, 4.456298828125, 5.0416259765625, 5.626953125, 6.2122802734375, 6.797607421875, 7.3829345703125, 7.96826171875, 8.5535888671875, 9.138916015625, 9.7242431640625, 10.3095703125, 10.8948974609375, 11.480224609375, 12.0655517578125, 12.65087890625, 13.2362060546875, 13.821533203125, 14.4068603515625, 14.9921875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 19.0, 24.0, 106.0, 228.0, 283.0, 221.0, 84.0, 26.0, 12.0, 3.0, 2.0, 0.0, 1.0], "bins": [-278.4163818359375, -273.3913269042969, -268.36627197265625, -263.3412170410156, -258.3161315917969, -253.2910919189453, -248.26602172851562, -243.240966796875, -238.21591186523438, -233.19085693359375, -228.16578674316406, -223.14073181152344, -218.1156768798828, -213.0906219482422, -208.0655517578125, -203.04049682617188, -198.01544189453125, -192.99038696289062, -187.96531677246094, -182.9402618408203, -177.9152069091797, -172.89015197753906, -167.86508178710938, -162.84002685546875, -157.81495666503906, -152.78990173339844, -147.76483154296875, -142.73977661132812, -137.7147216796875, -132.68966674804688, -127.66459655761719, -122.63954162597656, -117.61448669433594, -112.58942413330078, -107.56436920166016, -102.539306640625, -97.51425170898438, -92.48918914794922, -87.46412658691406, -82.43907165527344, -77.41401672363281, -72.38895416259766, -67.36389923095703, -62.338836669921875, -57.31378173828125, -52.288719177246094, -47.2636604309082, -42.23860168457031, -37.213539123535156, -32.188480377197266, -27.163421630859375, -22.13836097717285, -17.11330223083496, -12.08824348449707, -7.063182830810547, -2.0381240844726562, 2.9869346618652344, 8.011993408203125, 13.037053108215332, 18.06211280822754, 23.08717155456543, 28.11223030090332, 33.137290954589844, 38.162349700927734, 43.187408447265625]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 9.0, 7.0, 6.0, 7.0, 9.0, 15.0, 15.0, 21.0, 19.0, 27.0, 15.0, 35.0, 34.0, 38.0, 47.0, 41.0, 39.0, 48.0, 40.0, 41.0, 43.0, 43.0, 43.0, 40.0, 36.0, 28.0, 24.0, 35.0, 28.0, 27.0, 15.0, 19.0, 11.0, 17.0, 17.0, 11.0, 10.0, 10.0, 5.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-33.288055419921875, -32.23106384277344, -31.174070358276367, -30.117076873779297, -29.06008529663086, -28.003093719482422, -26.94610023498535, -25.88910675048828, -24.832115173339844, -23.775123596191406, -22.718130111694336, -21.661136627197266, -20.604145050048828, -19.54715347290039, -18.49015998840332, -17.43316650390625, -16.376174926757812, -15.319182395935059, -14.262189865112305, -13.20519733428955, -12.148204803466797, -11.091212272644043, -10.034219741821289, -8.977227210998535, -7.920234680175781, -6.863242149353027, -5.806249618530273, -4.7492570877075195, -3.6922645568847656, -2.6352720260620117, -1.5782794952392578, -0.5212869644165039, 0.53570556640625, 1.592698097229004, 2.649690628051758, 3.7066831588745117, 4.763675689697266, 5.8206682205200195, 6.877660751342773, 7.934653282165527, 8.991645812988281, 10.048638343811035, 11.105630874633789, 12.162623405456543, 13.219615936279297, 14.27660846710205, 15.333600997924805, 16.390594482421875, 17.447586059570312, 18.50457763671875, 19.56157112121582, 20.61856460571289, 21.675556182861328, 22.732547760009766, 23.789541244506836, 24.846534729003906, 25.903526306152344, 26.96051788330078, 28.01751136779785, 29.074504852294922, 30.13149642944336, 31.188488006591797, 32.2454833984375, 33.30247497558594, 34.359466552734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 5.0, 9.0, 5.0, 10.0, 12.0, 9.0, 15.0, 20.0, 28.0, 14.0, 19.0, 20.0, 33.0, 41.0, 41.0, 52.0, 33.0, 43.0, 37.0, 43.0, 56.0, 52.0, 54.0, 48.0, 34.0, 22.0, 28.0, 21.0, 23.0, 28.0, 19.0, 20.0, 21.0, 16.0, 14.0, 12.0, 11.0, 7.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.59808349609375, -3.4735107421875, -3.34893798828125, -3.224365234375, -3.09979248046875, -2.9752197265625, -2.85064697265625, -2.72607421875, -2.60150146484375, -2.4769287109375, -2.35235595703125, -2.227783203125, -2.10321044921875, -1.9786376953125, -1.85406494140625, -1.7294921875, -1.60491943359375, -1.4803466796875, -1.35577392578125, -1.231201171875, -1.10662841796875, -0.9820556640625, -0.85748291015625, -0.73291015625, -0.60833740234375, -0.4837646484375, -0.35919189453125, -0.234619140625, -0.11004638671875, 0.0145263671875, 0.13909912109375, 0.263671875, 0.38824462890625, 0.5128173828125, 0.63739013671875, 0.761962890625, 0.88653564453125, 1.0111083984375, 1.13568115234375, 1.26025390625, 1.38482666015625, 1.5093994140625, 1.63397216796875, 1.758544921875, 1.88311767578125, 2.0076904296875, 2.13226318359375, 2.2568359375, 2.38140869140625, 2.5059814453125, 2.63055419921875, 2.755126953125, 2.87969970703125, 3.0042724609375, 3.12884521484375, 3.25341796875, 3.37799072265625, 3.5025634765625, 3.62713623046875, 3.751708984375, 3.87628173828125, 4.0008544921875, 4.12542724609375, 4.25]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 4.0, 14.0, 11.0, 37.0, 34.0, 51.0, 108.0, 131.0, 273.0, 456.0, 853.0, 1646.0, 3354.0, 6808.0, 14118.0, 28561.0, 56534.0, 100800.0, 158032.0, 196798.0, 184224.0, 132334.0, 79422.0, 42116.0, 21255.0, 10384.0, 5019.0, 2439.0, 1210.0, 648.0, 319.0, 189.0, 112.0, 79.0, 53.0, 30.0, 25.0, 11.0, 15.0, 13.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.67578125, -4.53314208984375, -4.3905029296875, -4.24786376953125, -4.105224609375, -3.96258544921875, -3.8199462890625, -3.67730712890625, -3.53466796875, -3.39202880859375, -3.2493896484375, -3.10675048828125, -2.964111328125, -2.82147216796875, -2.6788330078125, -2.53619384765625, -2.3935546875, -2.25091552734375, -2.1082763671875, -1.96563720703125, -1.822998046875, -1.68035888671875, -1.5377197265625, -1.39508056640625, -1.25244140625, -1.10980224609375, -0.9671630859375, -0.82452392578125, -0.681884765625, -0.53924560546875, -0.3966064453125, -0.25396728515625, -0.111328125, 0.03131103515625, 0.1739501953125, 0.31658935546875, 0.459228515625, 0.60186767578125, 0.7445068359375, 0.88714599609375, 1.02978515625, 1.17242431640625, 1.3150634765625, 1.45770263671875, 1.600341796875, 1.74298095703125, 1.8856201171875, 2.02825927734375, 2.1708984375, 2.31353759765625, 2.4561767578125, 2.59881591796875, 2.741455078125, 2.88409423828125, 3.0267333984375, 3.16937255859375, 3.31201171875, 3.45465087890625, 3.5972900390625, 3.73992919921875, 3.882568359375, 4.02520751953125, 4.1678466796875, 4.31048583984375, 4.453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 6.0, 14.0, 8.0, 11.0, 10.0, 20.0, 15.0, 25.0, 21.0, 24.0, 25.0, 31.0, 34.0, 33.0, 37.0, 44.0, 27.0, 35.0, 28.0, 1065.0, 40.0, 41.0, 37.0, 30.0, 28.0, 34.0, 31.0, 33.0, 19.0, 26.0, 26.0, 19.0, 18.0, 18.0, 13.0, 12.0, 17.0, 7.0, 11.0, 3.0, 4.0, 4.0, 4.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.15234375, -3.045166015625, -2.93798828125, -2.830810546875, -2.7236328125, -2.616455078125, -2.50927734375, -2.402099609375, -2.294921875, -2.187744140625, -2.08056640625, -1.973388671875, -1.8662109375, -1.759033203125, -1.65185546875, -1.544677734375, -1.4375, -1.330322265625, -1.22314453125, -1.115966796875, -1.0087890625, -0.901611328125, -0.79443359375, -0.687255859375, -0.580078125, -0.472900390625, -0.36572265625, -0.258544921875, -0.1513671875, -0.044189453125, 0.06298828125, 0.170166015625, 0.27734375, 0.384521484375, 0.49169921875, 0.598876953125, 0.7060546875, 0.813232421875, 0.92041015625, 1.027587890625, 1.134765625, 1.241943359375, 1.34912109375, 1.456298828125, 1.5634765625, 1.670654296875, 1.77783203125, 1.885009765625, 1.9921875, 2.099365234375, 2.20654296875, 2.313720703125, 2.4208984375, 2.528076171875, 2.63525390625, 2.742431640625, 2.849609375, 2.956787109375, 3.06396484375, 3.171142578125, 3.2783203125, 3.385498046875, 3.49267578125, 3.599853515625, 3.70703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 2.0, 8.0, 10.0, 14.0, 17.0, 22.0, 39.0, 58.0, 71.0, 116.0, 130.0, 230.0, 311.0, 416.0, 651.0, 921.0, 1353.0, 2098.0, 3109.0, 4686.0, 7813.0, 12651.0, 21343.0, 39821.0, 105311.0, 1627236.0, 161037.0, 45570.0, 24057.0, 13791.0, 8524.0, 5466.0, 3337.0, 2192.0, 1524.0, 1026.0, 652.0, 454.0, 303.0, 211.0, 155.0, 103.0, 71.0, 65.0, 46.0, 32.0, 26.0, 19.0, 15.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.7890625, -5.593505859375, -5.39794921875, -5.202392578125, -5.0068359375, -4.811279296875, -4.61572265625, -4.420166015625, -4.224609375, -4.029052734375, -3.83349609375, -3.637939453125, -3.4423828125, -3.246826171875, -3.05126953125, -2.855712890625, -2.66015625, -2.464599609375, -2.26904296875, -2.073486328125, -1.8779296875, -1.682373046875, -1.48681640625, -1.291259765625, -1.095703125, -0.900146484375, -0.70458984375, -0.509033203125, -0.3134765625, -0.117919921875, 0.07763671875, 0.273193359375, 0.46875, 0.664306640625, 0.85986328125, 1.055419921875, 1.2509765625, 1.446533203125, 1.64208984375, 1.837646484375, 2.033203125, 2.228759765625, 2.42431640625, 2.619873046875, 2.8154296875, 3.010986328125, 3.20654296875, 3.402099609375, 3.59765625, 3.793212890625, 3.98876953125, 4.184326171875, 4.3798828125, 4.575439453125, 4.77099609375, 4.966552734375, 5.162109375, 5.357666015625, 5.55322265625, 5.748779296875, 5.9443359375, 6.139892578125, 6.33544921875, 6.531005859375, 6.7265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 7.0, 10.0, 10.0, 11.0, 8.0, 11.0, 18.0, 26.0, 29.0, 39.0, 41.0, 52.0, 62.0, 67.0, 91.0, 70.0, 75.0, 68.0, 50.0, 37.0, 37.0, 25.0, 25.0, 24.0, 15.0, 9.0, 13.0, 15.0, 12.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0576934814453125, -1.024566650390625, -0.9914398193359375, -0.95831298828125, -0.9251861572265625, -0.892059326171875, -0.8589324951171875, -0.8258056640625, -0.7926788330078125, -0.759552001953125, -0.7264251708984375, -0.69329833984375, -0.6601715087890625, -0.627044677734375, -0.5939178466796875, -0.560791015625, -0.5276641845703125, -0.494537353515625, -0.4614105224609375, -0.42828369140625, -0.3951568603515625, -0.362030029296875, -0.3289031982421875, -0.2957763671875, -0.2626495361328125, -0.229522705078125, -0.1963958740234375, -0.16326904296875, -0.1301422119140625, -0.097015380859375, -0.0638885498046875, -0.03076171875, 0.0023651123046875, 0.035491943359375, 0.0686187744140625, 0.10174560546875, 0.1348724365234375, 0.167999267578125, 0.2011260986328125, 0.2342529296875, 0.2673797607421875, 0.300506591796875, 0.3336334228515625, 0.36676025390625, 0.3998870849609375, 0.433013916015625, 0.4661407470703125, 0.499267578125, 0.5323944091796875, 0.565521240234375, 0.5986480712890625, 0.63177490234375, 0.6649017333984375, 0.698028564453125, 0.7311553955078125, 0.7642822265625, 0.7974090576171875, 0.830535888671875, 0.8636627197265625, 0.89678955078125, 0.9299163818359375, 0.963043212890625, 0.9961700439453125, 1.029296875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 9.0, 9.0, 16.0, 24.0, 25.0, 25.0, 45.0, 35.0, 57.0, 92.0, 120.0, 207.0, 387.0, 1022.0, 4887.0, 36388.0, 764151.0, 221353.0, 15641.0, 2491.0, 685.0, 288.0, 172.0, 127.0, 74.0, 40.0, 49.0, 26.0, 13.0, 23.0, 16.0, 15.0, 6.0, 12.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.515625, -13.076904296875, -12.63818359375, -12.199462890625, -11.7607421875, -11.322021484375, -10.88330078125, -10.444580078125, -10.005859375, -9.567138671875, -9.12841796875, -8.689697265625, -8.2509765625, -7.812255859375, -7.37353515625, -6.934814453125, -6.49609375, -6.057373046875, -5.61865234375, -5.179931640625, -4.7412109375, -4.302490234375, -3.86376953125, -3.425048828125, -2.986328125, -2.547607421875, -2.10888671875, -1.670166015625, -1.2314453125, -0.792724609375, -0.35400390625, 0.084716796875, 0.5234375, 0.962158203125, 1.40087890625, 1.839599609375, 2.2783203125, 2.717041015625, 3.15576171875, 3.594482421875, 4.033203125, 4.471923828125, 4.91064453125, 5.349365234375, 5.7880859375, 6.226806640625, 6.66552734375, 7.104248046875, 7.54296875, 7.981689453125, 8.42041015625, 8.859130859375, 9.2978515625, 9.736572265625, 10.17529296875, 10.614013671875, 11.052734375, 11.491455078125, 11.93017578125, 12.368896484375, 12.8076171875, 13.246337890625, 13.68505859375, 14.123779296875, 14.5625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 10.0, 27.0, 52.0, 71.0, 197.0, 309.0, 183.0, 73.0, 33.0, 19.0, 13.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.560818672180176, -9.134309768676758, -8.707801818847656, -8.281292915344238, -7.854784965515137, -7.428276062011719, -7.001767635345459, -6.575259208679199, -6.1487507820129395, -5.72224235534668, -5.29573392868042, -4.86922550201416, -4.442716598510742, -4.016208648681641, -3.5896997451782227, -3.163191318511963, -2.736682891845703, -2.3101744651794434, -1.883665919303894, -1.4571573734283447, -1.030648946762085, -0.6041405200958252, -0.17763185501098633, 0.24887657165527344, 0.6753849983215332, 1.101893424987793, 1.5284019708633423, 1.9549105167388916, 2.3814189434051514, 2.807927370071411, 3.23443603515625, 3.6609444618225098, 4.087451934814453, 4.513960361480713, 4.940468788146973, 5.366977691650391, 5.793485641479492, 6.21999454498291, 6.64650297164917, 7.07301139831543, 7.4995198249816895, 7.926028251647949, 8.352537155151367, 8.779045104980469, 9.205554008483887, 9.632061958312988, 10.058570861816406, 10.485078811645508, 10.911587715148926, 11.338096618652344, 11.764604568481445, 12.191113471984863, 12.617621421813965, 13.044130325317383, 13.470638275146484, 13.897147178649902, 14.32365608215332, 14.750164985656738, 15.17667293548584, 15.603181838989258, 16.02968978881836, 16.45619773864746, 16.882707595825195, 17.309215545654297, 17.7357234954834]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 12.0, 19.0, 15.0, 14.0, 28.0, 24.0, 18.0, 30.0, 18.0, 23.0, 33.0, 51.0, 47.0, 46.0, 45.0, 39.0, 34.0, 43.0, 39.0, 50.0, 41.0, 44.0, 34.0, 44.0, 34.0, 31.0, 27.0, 24.0, 16.0, 14.0, 16.0, 15.0, 15.0, 4.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2397148609161377, -3.1242477893829346, -3.0087807178497314, -2.893313407897949, -2.777846336364746, -2.662379264831543, -2.54691219329834, -2.4314451217651367, -2.3159780502319336, -2.2005109786987305, -2.0850439071655273, -1.9695767164230347, -1.854109525680542, -1.7386424541473389, -1.6231753826141357, -1.5077083110809326, -1.3922410011291504, -1.2767739295959473, -1.1613067388534546, -1.0458396673202515, -0.9303725361824036, -0.8149054050445557, -0.6994383335113525, -0.5839712023735046, -0.46850407123565674, -0.35303694009780884, -0.23756983876228333, -0.12210273742675781, -0.006635606288909912, 0.10883152484893799, 0.2242985963821411, 0.339765727519989, 0.4552326202392578, 0.5706997513771057, 0.6861668825149536, 0.8016339540481567, 0.9171010851860046, 1.0325682163238525, 1.1480352878570557, 1.2635023593902588, 1.3789695501327515, 1.4944366216659546, 1.6099038124084473, 1.7253708839416504, 1.8408379554748535, 1.9563051462173462, 2.0717720985412598, 2.187239408493042, 2.302706480026245, 2.4181735515594482, 2.5336406230926514, 2.6491079330444336, 2.7645750045776367, 2.88004207611084, 2.995509147644043, 3.110976219177246, 3.226443290710449, 3.3419103622436523, 3.4573774337768555, 3.5728445053100586, 3.688311815261841, 3.803778886795044, 3.919245958328247, 4.034713268280029, 4.150180339813232]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 5.0, 4.0, 12.0, 13.0, 10.0, 21.0, 29.0, 15.0, 15.0, 24.0, 26.0, 33.0, 43.0, 44.0, 47.0, 39.0, 43.0, 36.0, 48.0, 51.0, 56.0, 45.0, 50.0, 25.0, 27.0, 26.0, 16.0, 33.0, 22.0, 20.0, 21.0, 18.0, 10.0, 16.0, 9.0, 10.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.9178466796875, -3.788818359375, -3.6597900390625, -3.53076171875, -3.4017333984375, -3.272705078125, -3.1436767578125, -3.0146484375, -2.8856201171875, -2.756591796875, -2.6275634765625, -2.49853515625, -2.3695068359375, -2.240478515625, -2.1114501953125, -1.982421875, -1.8533935546875, -1.724365234375, -1.5953369140625, -1.46630859375, -1.3372802734375, -1.208251953125, -1.0792236328125, -0.9501953125, -0.8211669921875, -0.692138671875, -0.5631103515625, -0.43408203125, -0.3050537109375, -0.176025390625, -0.0469970703125, 0.08203125, 0.2110595703125, 0.340087890625, 0.4691162109375, 0.59814453125, 0.7271728515625, 0.856201171875, 0.9852294921875, 1.1142578125, 1.2432861328125, 1.372314453125, 1.5013427734375, 1.63037109375, 1.7593994140625, 1.888427734375, 2.0174560546875, 2.146484375, 2.2755126953125, 2.404541015625, 2.5335693359375, 2.66259765625, 2.7916259765625, 2.920654296875, 3.0496826171875, 3.1787109375, 3.3077392578125, 3.436767578125, 3.5657958984375, 3.69482421875, 3.8238525390625, 3.952880859375, 4.0819091796875, 4.2109375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 7.0, 9.0, 14.0, 31.0, 35.0, 47.0, 73.0, 95.0, 156.0, 267.0, 389.0, 679.0, 1165.0, 2117.0, 3671.0, 6596.0, 12864.0, 27493.0, 77628.0, 561917.0, 258891.0, 50807.0, 20915.0, 10320.0, 5352.0, 2890.0, 1608.0, 895.0, 579.0, 368.0, 223.0, 150.0, 90.0, 59.0, 54.0, 29.0, 16.0, 14.0, 12.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.00244140625, -10.6455078125, -10.28857421875, -9.931640625, -9.57470703125, -9.2177734375, -8.86083984375, -8.50390625, -8.14697265625, -7.7900390625, -7.43310546875, -7.076171875, -6.71923828125, -6.3623046875, -6.00537109375, -5.6484375, -5.29150390625, -4.9345703125, -4.57763671875, -4.220703125, -3.86376953125, -3.5068359375, -3.14990234375, -2.79296875, -2.43603515625, -2.0791015625, -1.72216796875, -1.365234375, -1.00830078125, -0.6513671875, -0.29443359375, 0.0625, 0.41943359375, 0.7763671875, 1.13330078125, 1.490234375, 1.84716796875, 2.2041015625, 2.56103515625, 2.91796875, 3.27490234375, 3.6318359375, 3.98876953125, 4.345703125, 4.70263671875, 5.0595703125, 5.41650390625, 5.7734375, 6.13037109375, 6.4873046875, 6.84423828125, 7.201171875, 7.55810546875, 7.9150390625, 8.27197265625, 8.62890625, 8.98583984375, 9.3427734375, 9.69970703125, 10.056640625, 10.41357421875, 10.7705078125, 11.12744140625, 11.484375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 6.0, 5.0, 13.0, 16.0, 21.0, 19.0, 41.0, 31.0, 43.0, 62.0, 56.0, 67.0, 96.0, 143.0, 291.0, 1432.0, 154.0, 100.0, 101.0, 69.0, 46.0, 47.0, 47.0, 27.0, 23.0, 28.0, 15.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.333984375, -17.74609375, -17.158203125, -16.5703125, -15.982421875, -15.39453125, -14.806640625, -14.21875, -13.630859375, -13.04296875, -12.455078125, -11.8671875, -11.279296875, -10.69140625, -10.103515625, -9.515625, -8.927734375, -8.33984375, -7.751953125, -7.1640625, -6.576171875, -5.98828125, -5.400390625, -4.8125, -4.224609375, -3.63671875, -3.048828125, -2.4609375, -1.873046875, -1.28515625, -0.697265625, -0.109375, 0.478515625, 1.06640625, 1.654296875, 2.2421875, 2.830078125, 3.41796875, 4.005859375, 4.59375, 5.181640625, 5.76953125, 6.357421875, 6.9453125, 7.533203125, 8.12109375, 8.708984375, 9.296875, 9.884765625, 10.47265625, 11.060546875, 11.6484375, 12.236328125, 12.82421875, 13.412109375, 14.0, 14.587890625, 15.17578125, 15.763671875, 16.3515625, 16.939453125, 17.52734375, 18.115234375, 18.703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 19.0, 32.0, 63.0, 95.0, 180.0, 294.0, 707.0, 1646.0, 4871.0, 20280.0, 190272.0, 2822464.0, 85718.0, 13196.0, 3434.0, 1276.0, 549.0, 266.0, 108.0, 80.0, 49.0, 26.0, 16.0, 10.0, 9.0, 6.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -45.06298828125, -43.6259765625, -42.18896484375, -40.751953125, -39.31494140625, -37.8779296875, -36.44091796875, -35.00390625, -33.56689453125, -32.1298828125, -30.69287109375, -29.255859375, -27.81884765625, -26.3818359375, -24.94482421875, -23.5078125, -22.07080078125, -20.6337890625, -19.19677734375, -17.759765625, -16.32275390625, -14.8857421875, -13.44873046875, -12.01171875, -10.57470703125, -9.1376953125, -7.70068359375, -6.263671875, -4.82666015625, -3.3896484375, -1.95263671875, -0.515625, 0.92138671875, 2.3583984375, 3.79541015625, 5.232421875, 6.66943359375, 8.1064453125, 9.54345703125, 10.98046875, 12.41748046875, 13.8544921875, 15.29150390625, 16.728515625, 18.16552734375, 19.6025390625, 21.03955078125, 22.4765625, 23.91357421875, 25.3505859375, 26.78759765625, 28.224609375, 29.66162109375, 31.0986328125, 32.53564453125, 33.97265625, 35.40966796875, 36.8466796875, 38.28369140625, 39.720703125, 41.15771484375, 42.5947265625, 44.03173828125, 45.46875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [8.0, 81.0, 782.0, 141.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.82672882080078, -24.411945343017578, -8.997161865234375, 6.417621612548828, 21.83240509033203, 37.24718475341797, 52.66197204589844, 68.0767593383789, 83.49153900146484, 98.90632629394531, 114.32110595703125, 129.7358856201172, 145.15066528320312, 160.56546020507812, 175.98023986816406, 191.39501953125, 206.809814453125, 222.22459411621094, 237.63937377929688, 253.05416870117188, 268.46893310546875, 283.88372802734375, 299.29852294921875, 314.71331787109375, 330.1280822753906, 345.5428771972656, 360.9576416015625, 376.3724365234375, 391.7872314453125, 407.2019958496094, 422.6167907714844, 438.03155517578125, 453.44635009765625, 468.86114501953125, 484.2759094238281, 499.6907043457031, 515.10546875, 530.520263671875, 545.93505859375, 561.349853515625, 576.7646484375, 592.179443359375, 607.59423828125, 623.0089721679688, 638.4237670898438, 653.8385620117188, 669.2533569335938, 684.6681518554688, 700.0828857421875, 715.4976806640625, 730.9124755859375, 746.3272094726562, 761.7420043945312, 777.1567993164062, 792.5715942382812, 807.9863891601562, 823.401123046875, 838.81591796875, 854.230712890625, 869.6454467773438, 885.0602416992188, 900.4750366210938, 915.8898315429688, 931.3046264648438, 946.7194213867188]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 9.0, 12.0, 10.0, 20.0, 17.0, 15.0, 22.0, 33.0, 29.0, 24.0, 35.0, 34.0, 45.0, 42.0, 42.0, 44.0, 41.0, 52.0, 39.0, 42.0, 41.0, 37.0, 29.0, 33.0, 29.0, 21.0, 28.0, 25.0, 17.0, 23.0, 16.0, 15.0, 15.0, 8.0, 10.0, 2.0, 8.0, 3.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.09623718261719, -42.63670349121094, -41.17716979980469, -39.71763610839844, -38.25810241699219, -36.7985725402832, -35.33903884887695, -33.8795051574707, -32.41997146606445, -30.960437774658203, -29.500904083251953, -28.041372299194336, -26.581838607788086, -25.122304916381836, -23.66277313232422, -22.20323944091797, -20.74370574951172, -19.28417205810547, -17.82463836669922, -16.3651065826416, -14.905572891235352, -13.446039199829102, -11.986506462097168, -10.526973724365234, -9.067440032958984, -7.607906818389893, -6.148373603820801, -4.688840389251709, -3.229307174682617, -1.7697739601135254, -0.3102407455444336, 1.1492919921875, 2.6088294982910156, 4.068362712860107, 5.527895927429199, 6.987429141998291, 8.446962356567383, 9.906496047973633, 11.366028785705566, 12.8255615234375, 14.28509521484375, 15.74462890625, 17.20416259765625, 18.663694381713867, 20.123228073120117, 21.582761764526367, 23.042293548583984, 24.501827239990234, 25.961360931396484, 27.420894622802734, 28.880428314208984, 30.3399600982666, 31.79949378967285, 33.25902557373047, 34.71855926513672, 36.17809295654297, 37.63762664794922, 39.09716033935547, 40.55669403076172, 42.01622772216797, 43.47576141357422, 44.9352912902832, 46.39482498168945, 47.8543586730957, 49.31389236450195]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 6.0, 12.0, 11.0, 6.0, 13.0, 10.0, 13.0, 18.0, 20.0, 24.0, 23.0, 29.0, 34.0, 35.0, 36.0, 29.0, 36.0, 29.0, 42.0, 44.0, 44.0, 37.0, 44.0, 47.0, 34.0, 34.0, 25.0, 37.0, 26.0, 21.0, 22.0, 19.0, 14.0, 16.0, 21.0, 12.0, 11.0, 11.0, 6.0, 8.0, 6.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.623046875, -3.499237060546875, -3.37542724609375, -3.251617431640625, -3.1278076171875, -3.003997802734375, -2.88018798828125, -2.756378173828125, -2.632568359375, -2.508758544921875, -2.38494873046875, -2.261138916015625, -2.1373291015625, -2.013519287109375, -1.88970947265625, -1.765899658203125, -1.64208984375, -1.518280029296875, -1.39447021484375, -1.270660400390625, -1.1468505859375, -1.023040771484375, -0.89923095703125, -0.775421142578125, -0.651611328125, -0.527801513671875, -0.40399169921875, -0.280181884765625, -0.1563720703125, -0.032562255859375, 0.09124755859375, 0.215057373046875, 0.3388671875, 0.462677001953125, 0.58648681640625, 0.710296630859375, 0.8341064453125, 0.957916259765625, 1.08172607421875, 1.205535888671875, 1.329345703125, 1.453155517578125, 1.57696533203125, 1.700775146484375, 1.8245849609375, 1.948394775390625, 2.07220458984375, 2.196014404296875, 2.31982421875, 2.443634033203125, 2.56744384765625, 2.691253662109375, 2.8150634765625, 2.938873291015625, 3.06268310546875, 3.186492919921875, 3.310302734375, 3.434112548828125, 3.55792236328125, 3.681732177734375, 3.8055419921875, 3.929351806640625, 4.05316162109375, 4.176971435546875, 4.30078125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 16.0, 13.0, 17.0, 34.0, 51.0, 75.0, 129.0, 187.0, 319.0, 535.0, 1020.0, 1850.0, 3959.0, 9066.0, 23810.0, 80320.0, 441555.0, 2453965.0, 978577.0, 139157.0, 36286.0, 12384.0, 5170.0, 2457.0, 1295.0, 733.0, 418.0, 321.0, 163.0, 127.0, 73.0, 51.0, 26.0, 34.0, 26.0, 14.0, 8.0, 12.0, 5.0, 3.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0859375, -9.7462158203125, -9.406494140625, -9.0667724609375, -8.72705078125, -8.3873291015625, -8.047607421875, -7.7078857421875, -7.3681640625, -7.0284423828125, -6.688720703125, -6.3489990234375, -6.00927734375, -5.6695556640625, -5.329833984375, -4.9901123046875, -4.650390625, -4.3106689453125, -3.970947265625, -3.6312255859375, -3.29150390625, -2.9517822265625, -2.612060546875, -2.2723388671875, -1.9326171875, -1.5928955078125, -1.253173828125, -0.9134521484375, -0.57373046875, -0.2340087890625, 0.105712890625, 0.4454345703125, 0.78515625, 1.1248779296875, 1.464599609375, 1.8043212890625, 2.14404296875, 2.4837646484375, 2.823486328125, 3.1632080078125, 3.5029296875, 3.8426513671875, 4.182373046875, 4.5220947265625, 4.86181640625, 5.2015380859375, 5.541259765625, 5.8809814453125, 6.220703125, 6.5604248046875, 6.900146484375, 7.2398681640625, 7.57958984375, 7.9193115234375, 8.259033203125, 8.5987548828125, 8.9384765625, 9.2781982421875, 9.617919921875, 9.9576416015625, 10.29736328125, 10.6370849609375, 10.976806640625, 11.3165283203125, 11.65625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 5.0, 2.0, 3.0, 12.0, 13.0, 12.0, 17.0, 21.0, 35.0, 46.0, 63.0, 106.0, 127.0, 186.0, 240.0, 411.0, 527.0, 581.0, 493.0, 359.0, 229.0, 149.0, 136.0, 93.0, 40.0, 45.0, 28.0, 25.0, 17.0, 11.0, 6.0, 7.0, 6.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.26171875, -10.890625, -10.51953125, -10.1484375, -9.77734375, -9.40625, -9.03515625, -8.6640625, -8.29296875, -7.921875, -7.55078125, -7.1796875, -6.80859375, -6.4375, -6.06640625, -5.6953125, -5.32421875, -4.953125, -4.58203125, -4.2109375, -3.83984375, -3.46875, -3.09765625, -2.7265625, -2.35546875, -1.984375, -1.61328125, -1.2421875, -0.87109375, -0.5, -0.12890625, 0.2421875, 0.61328125, 0.984375, 1.35546875, 1.7265625, 2.09765625, 2.46875, 2.83984375, 3.2109375, 3.58203125, 3.953125, 4.32421875, 4.6953125, 5.06640625, 5.4375, 5.80859375, 6.1796875, 6.55078125, 6.921875, 7.29296875, 7.6640625, 8.03515625, 8.40625, 8.77734375, 9.1484375, 9.51953125, 9.890625, 10.26171875, 10.6328125, 11.00390625, 11.375, 11.74609375, 12.1171875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 13.0, 16.0, 25.0, 31.0, 43.0, 67.0, 87.0, 130.0, 206.0, 279.0, 450.0, 672.0, 1001.0, 1775.0, 3236.0, 6284.0, 12700.0, 29851.0, 85270.0, 331118.0, 1869077.0, 1470107.0, 260294.0, 71238.0, 25965.0, 11099.0, 5470.0, 3046.0, 1712.0, 1075.0, 613.0, 453.0, 285.0, 182.0, 119.0, 77.0, 57.0, 44.0, 35.0, 26.0, 13.0, 13.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -12.943115234375, -12.49560546875, -12.048095703125, -11.6005859375, -11.153076171875, -10.70556640625, -10.258056640625, -9.810546875, -9.363037109375, -8.91552734375, -8.468017578125, -8.0205078125, -7.572998046875, -7.12548828125, -6.677978515625, -6.23046875, -5.782958984375, -5.33544921875, -4.887939453125, -4.4404296875, -3.992919921875, -3.54541015625, -3.097900390625, -2.650390625, -2.202880859375, -1.75537109375, -1.307861328125, -0.8603515625, -0.412841796875, 0.03466796875, 0.482177734375, 0.9296875, 1.377197265625, 1.82470703125, 2.272216796875, 2.7197265625, 3.167236328125, 3.61474609375, 4.062255859375, 4.509765625, 4.957275390625, 5.40478515625, 5.852294921875, 6.2998046875, 6.747314453125, 7.19482421875, 7.642333984375, 8.08984375, 8.537353515625, 8.98486328125, 9.432373046875, 9.8798828125, 10.327392578125, 10.77490234375, 11.222412109375, 11.669921875, 12.117431640625, 12.56494140625, 13.012451171875, 13.4599609375, 13.907470703125, 14.35498046875, 14.802490234375, 15.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 23.0, 76.0, 190.0, 288.0, 269.0, 103.0, 40.0, 13.0, 2.0, 2.0, 2.0, 1.0], "bins": [-321.8177185058594, -316.0428161621094, -310.2679443359375, -304.4930419921875, -298.7181701660156, -292.9432678222656, -287.16839599609375, -281.39349365234375, -275.61859130859375, -269.84368896484375, -264.0688171386719, -258.2939147949219, -252.51902770996094, -246.744140625, -240.96925354003906, -235.19436645507812, -229.4194793701172, -223.64459228515625, -217.8697052001953, -212.09481811523438, -206.31991577148438, -200.54502868652344, -194.7701416015625, -188.99525451660156, -183.22036743164062, -177.4454803466797, -171.67059326171875, -165.89569091796875, -160.1208038330078, -154.34591674804688, -148.57102966308594, -142.796142578125, -137.021240234375, -131.24635314941406, -125.4714584350586, -119.69657135009766, -113.92167663574219, -108.14678955078125, -102.37190246582031, -96.59701538085938, -90.82211303710938, -85.04722595214844, -79.27233123779297, -73.49744415283203, -67.72254943847656, -61.947662353515625, -56.17277526855469, -50.397884368896484, -44.62299346923828, -38.84810256958008, -33.073211669921875, -27.298324584960938, -21.523433685302734, -15.748542785644531, -9.973655700683594, -4.198764801025391, 1.5761260986328125, 7.351016044616699, 13.125905990600586, 18.900794982910156, 24.67568588256836, 30.450576782226562, 36.2254638671875, 42.0003547668457, 47.775245666503906]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 13.0, 6.0, 11.0, 18.0, 22.0, 17.0, 15.0, 26.0, 36.0, 29.0, 36.0, 42.0, 43.0, 51.0, 50.0, 45.0, 53.0, 61.0, 49.0, 44.0, 43.0, 39.0, 44.0, 32.0, 27.0, 20.0, 23.0, 19.0, 17.0, 6.0, 14.0, 7.0, 9.0, 7.0, 4.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.22642517089844, -39.92996597290039, -38.63350296020508, -37.33704376220703, -36.040584564208984, -34.74412536621094, -33.447662353515625, -32.15120315551758, -30.8547420501709, -29.55828094482422, -28.261821746826172, -26.965360641479492, -25.668899536132812, -24.372440338134766, -23.075979232788086, -21.779518127441406, -20.48305892944336, -19.18659782409668, -17.890138626098633, -16.593677520751953, -15.29721736907959, -14.000757217407227, -12.704296112060547, -11.407835960388184, -10.11137580871582, -8.814915657043457, -7.5184550285339355, -6.221994400024414, -4.925534248352051, -3.6290740966796875, -2.332613468170166, -1.0361528396606445, 0.2603034973144531, 1.5567638874053955, 2.853224277496338, 4.149684906005859, 5.446145057678223, 6.742605209350586, 8.039066314697266, 9.335526466369629, 10.631986618041992, 11.928446769714355, 13.224906921386719, 14.521368026733398, 15.817828178405762, 17.114288330078125, 18.410749435424805, 19.707210540771484, 21.00366973876953, 22.30013084411621, 23.596590042114258, 24.893051147460938, 26.189510345458984, 27.485971450805664, 28.782432556152344, 30.07889175415039, 31.37535285949707, 32.67181396484375, 33.9682731628418, 35.264732360839844, 36.561195373535156, 37.8576545715332, 39.15411376953125, 40.45057678222656, 41.74703598022461]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 12.0, 16.0, 10.0, 16.0, 15.0, 20.0, 20.0, 16.0, 18.0, 36.0, 28.0, 33.0, 33.0, 35.0, 26.0, 37.0, 43.0, 45.0, 28.0, 46.0, 43.0, 29.0, 40.0, 41.0, 26.0, 33.0, 27.0, 28.0, 24.0, 22.0, 23.0, 12.0, 21.0, 16.0, 12.0, 12.0, 13.0, 6.0, 9.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.58984375, -3.4649658203125, -3.340087890625, -3.2152099609375, -3.09033203125, -2.9654541015625, -2.840576171875, -2.7156982421875, -2.5908203125, -2.4659423828125, -2.341064453125, -2.2161865234375, -2.09130859375, -1.9664306640625, -1.841552734375, -1.7166748046875, -1.591796875, -1.4669189453125, -1.342041015625, -1.2171630859375, -1.09228515625, -0.9674072265625, -0.842529296875, -0.7176513671875, -0.5927734375, -0.4678955078125, -0.343017578125, -0.2181396484375, -0.09326171875, 0.0316162109375, 0.156494140625, 0.2813720703125, 0.40625, 0.5311279296875, 0.656005859375, 0.7808837890625, 0.90576171875, 1.0306396484375, 1.155517578125, 1.2803955078125, 1.4052734375, 1.5301513671875, 1.655029296875, 1.7799072265625, 1.90478515625, 2.0296630859375, 2.154541015625, 2.2794189453125, 2.404296875, 2.5291748046875, 2.654052734375, 2.7789306640625, 2.90380859375, 3.0286865234375, 3.153564453125, 3.2784423828125, 3.4033203125, 3.5281982421875, 3.653076171875, 3.7779541015625, 3.90283203125, 4.0277099609375, 4.152587890625, 4.2774658203125, 4.40234375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 3.0, 7.0, 12.0, 17.0, 25.0, 38.0, 59.0, 99.0, 168.0, 289.0, 469.0, 861.0, 1738.0, 3502.0, 7454.0, 16128.0, 34001.0, 69705.0, 127922.0, 194353.0, 216261.0, 169801.0, 103007.0, 53665.0, 25687.0, 11974.0, 5595.0, 2638.0, 1347.0, 693.0, 383.0, 237.0, 156.0, 82.0, 59.0, 35.0, 23.0, 21.0, 8.0, 10.0, 5.0, 9.0, 5.0, 1.0, 1.0, 2.0], "bins": [-6.55859375, -6.38739013671875, -6.2161865234375, -6.04498291015625, -5.873779296875, -5.70257568359375, -5.5313720703125, -5.36016845703125, -5.18896484375, -5.01776123046875, -4.8465576171875, -4.67535400390625, -4.504150390625, -4.33294677734375, -4.1617431640625, -3.99053955078125, -3.8193359375, -3.64813232421875, -3.4769287109375, -3.30572509765625, -3.134521484375, -2.96331787109375, -2.7921142578125, -2.62091064453125, -2.44970703125, -2.27850341796875, -2.1072998046875, -1.93609619140625, -1.764892578125, -1.59368896484375, -1.4224853515625, -1.25128173828125, -1.080078125, -0.90887451171875, -0.7376708984375, -0.56646728515625, -0.395263671875, -0.22406005859375, -0.0528564453125, 0.11834716796875, 0.28955078125, 0.46075439453125, 0.6319580078125, 0.80316162109375, 0.974365234375, 1.14556884765625, 1.3167724609375, 1.48797607421875, 1.6591796875, 1.83038330078125, 2.0015869140625, 2.17279052734375, 2.343994140625, 2.51519775390625, 2.6864013671875, 2.85760498046875, 3.02880859375, 3.20001220703125, 3.3712158203125, 3.54241943359375, 3.713623046875, 3.88482666015625, 4.0560302734375, 4.22723388671875, 4.3984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 10.0, 8.0, 8.0, 13.0, 16.0, 15.0, 26.0, 20.0, 26.0, 31.0, 22.0, 35.0, 30.0, 32.0, 35.0, 23.0, 32.0, 34.0, 41.0, 1066.0, 31.0, 28.0, 27.0, 42.0, 34.0, 28.0, 23.0, 28.0, 35.0, 26.0, 24.0, 18.0, 19.0, 14.0, 16.0, 13.0, 18.0, 11.0, 12.0, 4.0, 7.0, 10.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.287109375, -3.184173583984375, -3.08123779296875, -2.978302001953125, -2.8753662109375, -2.772430419921875, -2.66949462890625, -2.566558837890625, -2.463623046875, -2.360687255859375, -2.25775146484375, -2.154815673828125, -2.0518798828125, -1.948944091796875, -1.84600830078125, -1.743072509765625, -1.64013671875, -1.537200927734375, -1.43426513671875, -1.331329345703125, -1.2283935546875, -1.125457763671875, -1.02252197265625, -0.919586181640625, -0.816650390625, -0.713714599609375, -0.61077880859375, -0.507843017578125, -0.4049072265625, -0.301971435546875, -0.19903564453125, -0.096099853515625, 0.0068359375, 0.109771728515625, 0.21270751953125, 0.315643310546875, 0.4185791015625, 0.521514892578125, 0.62445068359375, 0.727386474609375, 0.830322265625, 0.933258056640625, 1.03619384765625, 1.139129638671875, 1.2420654296875, 1.345001220703125, 1.44793701171875, 1.550872802734375, 1.65380859375, 1.756744384765625, 1.85968017578125, 1.962615966796875, 2.0655517578125, 2.168487548828125, 2.27142333984375, 2.374359130859375, 2.477294921875, 2.580230712890625, 2.68316650390625, 2.786102294921875, 2.8890380859375, 2.991973876953125, 3.09490966796875, 3.197845458984375, 3.30078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 6.0, 15.0, 15.0, 35.0, 44.0, 70.0, 76.0, 133.0, 215.0, 293.0, 431.0, 603.0, 978.0, 1393.0, 2042.0, 3036.0, 4669.0, 7029.0, 10836.0, 17287.0, 29723.0, 63029.0, 928453.0, 885396.0, 62822.0, 29816.0, 17309.0, 10714.0, 6906.0, 4532.0, 3069.0, 2005.0, 1306.0, 951.0, 593.0, 386.0, 280.0, 189.0, 143.0, 97.0, 66.0, 43.0, 24.0, 26.0, 21.0, 14.0, 4.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5859375, -4.42779541015625, -4.2696533203125, -4.11151123046875, -3.953369140625, -3.79522705078125, -3.6370849609375, -3.47894287109375, -3.32080078125, -3.16265869140625, -3.0045166015625, -2.84637451171875, -2.688232421875, -2.53009033203125, -2.3719482421875, -2.21380615234375, -2.0556640625, -1.89752197265625, -1.7393798828125, -1.58123779296875, -1.423095703125, -1.26495361328125, -1.1068115234375, -0.94866943359375, -0.79052734375, -0.63238525390625, -0.4742431640625, -0.31610107421875, -0.157958984375, 0.00018310546875, 0.1583251953125, 0.31646728515625, 0.474609375, 0.63275146484375, 0.7908935546875, 0.94903564453125, 1.107177734375, 1.26531982421875, 1.4234619140625, 1.58160400390625, 1.73974609375, 1.89788818359375, 2.0560302734375, 2.21417236328125, 2.372314453125, 2.53045654296875, 2.6885986328125, 2.84674072265625, 3.0048828125, 3.16302490234375, 3.3211669921875, 3.47930908203125, 3.637451171875, 3.79559326171875, 3.9537353515625, 4.11187744140625, 4.27001953125, 4.42816162109375, 4.5863037109375, 4.74444580078125, 4.902587890625, 5.06072998046875, 5.2188720703125, 5.37701416015625, 5.53515625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 13.0, 19.0, 20.0, 35.0, 32.0, 48.0, 55.0, 59.0, 82.0, 65.0, 67.0, 66.0, 85.0, 60.0, 77.0, 47.0, 44.0, 24.0, 14.0, 17.0, 18.0, 8.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9231719970703125, -0.896636962890625, -0.8701019287109375, -0.84356689453125, -0.8170318603515625, -0.790496826171875, -0.7639617919921875, -0.7374267578125, -0.7108917236328125, -0.684356689453125, -0.6578216552734375, -0.63128662109375, -0.6047515869140625, -0.578216552734375, -0.5516815185546875, -0.525146484375, -0.4986114501953125, -0.472076416015625, -0.4455413818359375, -0.41900634765625, -0.3924713134765625, -0.365936279296875, -0.3394012451171875, -0.3128662109375, -0.2863311767578125, -0.259796142578125, -0.2332611083984375, -0.20672607421875, -0.1801910400390625, -0.153656005859375, -0.1271209716796875, -0.1005859375, -0.0740509033203125, -0.047515869140625, -0.0209808349609375, 0.00555419921875, 0.0320892333984375, 0.058624267578125, 0.0851593017578125, 0.1116943359375, 0.1382293701171875, 0.164764404296875, 0.1912994384765625, 0.21783447265625, 0.2443695068359375, 0.270904541015625, 0.2974395751953125, 0.323974609375, 0.3505096435546875, 0.377044677734375, 0.4035797119140625, 0.43011474609375, 0.4566497802734375, 0.483184814453125, 0.5097198486328125, 0.5362548828125, 0.5627899169921875, 0.589324951171875, 0.6158599853515625, 0.64239501953125, 0.6689300537109375, 0.695465087890625, 0.7220001220703125, 0.74853515625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 11.0, 8.0, 9.0, 21.0, 26.0, 41.0, 50.0, 101.0, 196.0, 359.0, 986.0, 4213.0, 64307.0, 935826.0, 37552.0, 3258.0, 830.0, 305.0, 156.0, 85.0, 59.0, 50.0, 26.0, 19.0, 10.0, 14.0, 9.0, 4.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.4095458984375, -10.030029296875, -9.6505126953125, -9.27099609375, -8.8914794921875, -8.511962890625, -8.1324462890625, -7.7529296875, -7.3734130859375, -6.993896484375, -6.6143798828125, -6.23486328125, -5.8553466796875, -5.475830078125, -5.0963134765625, -4.716796875, -4.3372802734375, -3.957763671875, -3.5782470703125, -3.19873046875, -2.8192138671875, -2.439697265625, -2.0601806640625, -1.6806640625, -1.3011474609375, -0.921630859375, -0.5421142578125, -0.16259765625, 0.2169189453125, 0.596435546875, 0.9759521484375, 1.35546875, 1.7349853515625, 2.114501953125, 2.4940185546875, 2.87353515625, 3.2530517578125, 3.632568359375, 4.0120849609375, 4.3916015625, 4.7711181640625, 5.150634765625, 5.5301513671875, 5.90966796875, 6.2891845703125, 6.668701171875, 7.0482177734375, 7.427734375, 7.8072509765625, 8.186767578125, 8.5662841796875, 8.94580078125, 9.3253173828125, 9.704833984375, 10.0843505859375, 10.4638671875, 10.8433837890625, 11.222900390625, 11.6024169921875, 11.98193359375, 12.3614501953125, 12.740966796875, 13.1204833984375, 13.5]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 17.0, 74.0, 277.0, 423.0, 146.0, 54.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.753621101379395, -9.29594612121582, -8.838272094726562, -8.380597114562988, -7.922922611236572, -7.465248107910156, -7.007573127746582, -6.549898624420166, -6.09222412109375, -5.634549617767334, -5.176875114440918, -4.719200134277344, -4.261525630950928, -3.8038511276245117, -3.3461763858795166, -2.8885016441345215, -2.4308271408081055, -1.9731525182724, -1.5154778957366943, -1.0578032732009888, -0.6001286506652832, -0.1424541473388672, 0.31522059440612793, 0.772895336151123, 1.230569839477539, 1.6882444620132446, 2.14591908454895, 2.6035938262939453, 3.0612683296203613, 3.5189428329467773, 3.9766175746917725, 4.434292316436768, 4.891965866088867, 5.349640369415283, 5.807314872741699, 6.264989852905273, 6.7226643562316895, 7.1803388595581055, 7.63801383972168, 8.095687866210938, 8.553362846374512, 9.011037826538086, 9.468711853027344, 9.926386833190918, 10.384061813354492, 10.84173583984375, 11.299410820007324, 11.757085800170898, 12.214759826660156, 12.67243480682373, 13.130108833312988, 13.587783813476562, 14.04545783996582, 14.503132820129395, 14.960807800292969, 15.418481826782227, 15.8761568069458, 16.333831787109375, 16.791505813598633, 17.24917984008789, 17.70685577392578, 18.16452980041504, 18.622203826904297, 19.079879760742188, 19.537553787231445]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 10.0, 12.0, 9.0, 20.0, 16.0, 31.0, 34.0, 31.0, 34.0, 35.0, 28.0, 51.0, 46.0, 42.0, 48.0, 54.0, 45.0, 40.0, 36.0, 50.0, 43.0, 44.0, 25.0, 45.0, 30.0, 24.0, 24.0, 20.0, 21.0, 10.0, 12.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2022948265075684, -2.127028465270996, -2.051762104034424, -1.9764959812164307, -1.9012296199798584, -1.8259632587432861, -1.7506970167160034, -1.6754307746887207, -1.6001644134521484, -1.5248980522155762, -1.4496318101882935, -1.3743655681610107, -1.2990992069244385, -1.2238328456878662, -1.1485666036605835, -1.0733003616333008, -0.9980340003967285, -0.922767698764801, -0.8475013971328735, -0.772235095500946, -0.6969687938690186, -0.6217024922370911, -0.5464361906051636, -0.4711698889732361, -0.3959035873413086, -0.3206372857093811, -0.2453709840774536, -0.17010468244552612, -0.09483838081359863, -0.019572079181671143, 0.05569422245025635, 0.13096052408218384, 0.20622682571411133, 0.2814931273460388, 0.3567594289779663, 0.4320257306098938, 0.5072920322418213, 0.5825583338737488, 0.6578246355056763, 0.7330909371376038, 0.8083572387695312, 0.8836235404014587, 0.9588898420333862, 1.034156084060669, 1.1094224452972412, 1.1846888065338135, 1.2599550485610962, 1.335221290588379, 1.4104876518249512, 1.4857540130615234, 1.5610202550888062, 1.6362864971160889, 1.7115528583526611, 1.7868192195892334, 1.8620854616165161, 1.9373517036437988, 2.012618064880371, 2.0878844261169434, 2.1631507873535156, 2.238416910171509, 2.313683271408081, 2.3889496326446533, 2.4642157554626465, 2.5394821166992188, 2.614748477935791]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 2.0, 4.0, 10.0, 15.0, 10.0, 19.0, 14.0, 19.0, 14.0, 19.0, 22.0, 27.0, 33.0, 30.0, 34.0, 32.0, 32.0, 32.0, 49.0, 34.0, 36.0, 39.0, 41.0, 36.0, 32.0, 42.0, 35.0, 30.0, 34.0, 20.0, 23.0, 27.0, 22.0, 17.0, 17.0, 18.0, 11.0, 13.0, 14.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.650390625, -3.524810791015625, -3.39923095703125, -3.273651123046875, -3.1480712890625, -3.022491455078125, -2.89691162109375, -2.771331787109375, -2.645751953125, -2.520172119140625, -2.39459228515625, -2.269012451171875, -2.1434326171875, -2.017852783203125, -1.89227294921875, -1.766693115234375, -1.64111328125, -1.515533447265625, -1.38995361328125, -1.264373779296875, -1.1387939453125, -1.013214111328125, -0.88763427734375, -0.762054443359375, -0.636474609375, -0.510894775390625, -0.38531494140625, -0.259735107421875, -0.1341552734375, -0.008575439453125, 0.11700439453125, 0.242584228515625, 0.3681640625, 0.493743896484375, 0.61932373046875, 0.744903564453125, 0.8704833984375, 0.996063232421875, 1.12164306640625, 1.247222900390625, 1.372802734375, 1.498382568359375, 1.62396240234375, 1.749542236328125, 1.8751220703125, 2.000701904296875, 2.12628173828125, 2.251861572265625, 2.37744140625, 2.503021240234375, 2.62860107421875, 2.754180908203125, 2.8797607421875, 3.005340576171875, 3.13092041015625, 3.256500244140625, 3.382080078125, 3.507659912109375, 3.63323974609375, 3.758819580078125, 3.8843994140625, 4.009979248046875, 4.13555908203125, 4.261138916015625, 4.38671875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 6.0, 8.0, 9.0, 9.0, 22.0, 26.0, 29.0, 36.0, 55.0, 63.0, 120.0, 181.0, 332.0, 619.0, 1274.0, 2818.0, 6832.0, 19233.0, 64022.0, 288844.0, 488411.0, 124397.0, 32552.0, 10701.0, 4183.0, 1794.0, 853.0, 438.0, 211.0, 145.0, 99.0, 43.0, 40.0, 15.0, 29.0, 20.0, 10.0, 8.0, 16.0, 6.0, 14.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0], "bins": [-9.3515625, -9.08612060546875, -8.8206787109375, -8.55523681640625, -8.289794921875, -8.02435302734375, -7.7589111328125, -7.49346923828125, -7.22802734375, -6.96258544921875, -6.6971435546875, -6.43170166015625, -6.166259765625, -5.90081787109375, -5.6353759765625, -5.36993408203125, -5.1044921875, -4.83905029296875, -4.5736083984375, -4.30816650390625, -4.042724609375, -3.77728271484375, -3.5118408203125, -3.24639892578125, -2.98095703125, -2.71551513671875, -2.4500732421875, -2.18463134765625, -1.919189453125, -1.65374755859375, -1.3883056640625, -1.12286376953125, -0.857421875, -0.59197998046875, -0.3265380859375, -0.06109619140625, 0.204345703125, 0.46978759765625, 0.7352294921875, 1.00067138671875, 1.26611328125, 1.53155517578125, 1.7969970703125, 2.06243896484375, 2.327880859375, 2.59332275390625, 2.8587646484375, 3.12420654296875, 3.3896484375, 3.65509033203125, 3.9205322265625, 4.18597412109375, 4.451416015625, 4.71685791015625, 4.9822998046875, 5.24774169921875, 5.51318359375, 5.77862548828125, 6.0440673828125, 6.30950927734375, 6.574951171875, 6.84039306640625, 7.1058349609375, 7.37127685546875, 7.63671875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 9.0, 12.0, 14.0, 10.0, 18.0, 23.0, 34.0, 31.0, 53.0, 58.0, 71.0, 77.0, 139.0, 367.0, 1498.0, 218.0, 85.0, 59.0, 48.0, 48.0, 35.0, 33.0, 30.0, 18.0, 17.0, 12.0, 8.0, 9.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.35009765625, -17.7001953125, -17.05029296875, -16.400390625, -15.75048828125, -15.1005859375, -14.45068359375, -13.80078125, -13.15087890625, -12.5009765625, -11.85107421875, -11.201171875, -10.55126953125, -9.9013671875, -9.25146484375, -8.6015625, -7.95166015625, -7.3017578125, -6.65185546875, -6.001953125, -5.35205078125, -4.7021484375, -4.05224609375, -3.40234375, -2.75244140625, -2.1025390625, -1.45263671875, -0.802734375, -0.15283203125, 0.4970703125, 1.14697265625, 1.796875, 2.44677734375, 3.0966796875, 3.74658203125, 4.396484375, 5.04638671875, 5.6962890625, 6.34619140625, 6.99609375, 7.64599609375, 8.2958984375, 8.94580078125, 9.595703125, 10.24560546875, 10.8955078125, 11.54541015625, 12.1953125, 12.84521484375, 13.4951171875, 14.14501953125, 14.794921875, 15.44482421875, 16.0947265625, 16.74462890625, 17.39453125, 18.04443359375, 18.6943359375, 19.34423828125, 19.994140625, 20.64404296875, 21.2939453125, 21.94384765625, 22.59375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 4.0, 9.0, 9.0, 28.0, 25.0, 36.0, 43.0, 87.0, 106.0, 205.0, 380.0, 1221.0, 6370.0, 141122.0, 2896469.0, 92542.0, 5090.0, 963.0, 406.0, 197.0, 130.0, 65.0, 59.0, 32.0, 22.0, 16.0, 14.0, 19.0, 11.0, 4.0, 5.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-33.03125, -32.043701171875, -31.05615234375, -30.068603515625, -29.0810546875, -28.093505859375, -27.10595703125, -26.118408203125, -25.130859375, -24.143310546875, -23.15576171875, -22.168212890625, -21.1806640625, -20.193115234375, -19.20556640625, -18.218017578125, -17.23046875, -16.242919921875, -15.25537109375, -14.267822265625, -13.2802734375, -12.292724609375, -11.30517578125, -10.317626953125, -9.330078125, -8.342529296875, -7.35498046875, -6.367431640625, -5.3798828125, -4.392333984375, -3.40478515625, -2.417236328125, -1.4296875, -0.442138671875, 0.54541015625, 1.532958984375, 2.5205078125, 3.508056640625, 4.49560546875, 5.483154296875, 6.470703125, 7.458251953125, 8.44580078125, 9.433349609375, 10.4208984375, 11.408447265625, 12.39599609375, 13.383544921875, 14.37109375, 15.358642578125, 16.34619140625, 17.333740234375, 18.3212890625, 19.308837890625, 20.29638671875, 21.283935546875, 22.271484375, 23.259033203125, 24.24658203125, 25.234130859375, 26.2216796875, 27.209228515625, 28.19677734375, 29.184326171875, 30.171875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [61.0, 816.0, 144.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.651171684265137, -5.941215515136719, 3.768740653991699, 13.4786958694458, 23.18865203857422, 32.89860916137695, 42.60856246948242, 52.31852340698242, 62.02847671508789, 71.73843383789062, 81.4483871459961, 91.15834045410156, 100.86830139160156, 110.57826232910156, 120.2882080078125, 129.9981689453125, 139.7081298828125, 149.4180908203125, 159.12803649902344, 168.83799743652344, 178.54795837402344, 188.25790405273438, 197.96786499023438, 207.67782592773438, 217.3877716064453, 227.0977325439453, 236.80767822265625, 246.51763916015625, 256.22760009765625, 265.93756103515625, 275.64752197265625, 285.35748291015625, 295.0674133300781, 304.7773742675781, 314.4873352050781, 324.197265625, 333.9072265625, 343.6171875, 353.3271484375, 363.037109375, 372.7470703125, 382.45703125, 392.1669921875, 401.876953125, 411.5868835449219, 421.2968444824219, 431.0068054199219, 440.7167663574219, 450.42669677734375, 460.13665771484375, 469.84661865234375, 479.55657958984375, 489.2665100097656, 498.9764709472656, 508.6864318847656, 518.3963623046875, 528.1063842773438, 537.8163452148438, 547.5263061523438, 557.2362670898438, 566.9462280273438, 576.6561889648438, 586.3660888671875, 596.0760498046875, 605.7860107421875]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 12.0, 4.0, 11.0, 12.0, 10.0, 17.0, 24.0, 23.0, 32.0, 23.0, 25.0, 35.0, 41.0, 37.0, 28.0, 27.0, 42.0, 35.0, 50.0, 47.0, 38.0, 35.0, 33.0, 40.0, 39.0, 28.0, 25.0, 28.0, 26.0, 20.0, 18.0, 13.0, 15.0, 21.0, 15.0, 12.0, 8.0, 11.0, 6.0, 5.0, 7.0, 4.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.436378479003906, -34.323089599609375, -33.20979690551758, -32.09650802612305, -30.983217239379883, -29.86992645263672, -28.756637573242188, -27.643346786499023, -26.53005599975586, -25.416765213012695, -24.30347442626953, -23.190185546875, -22.076894760131836, -20.963603973388672, -19.85031509399414, -18.737024307250977, -17.623733520507812, -16.51044273376465, -15.3971529006958, -14.283863067626953, -13.170572280883789, -12.057281494140625, -10.943991661071777, -9.83070182800293, -8.717411041259766, -7.60412073135376, -6.490830421447754, -5.377540111541748, -4.264249801635742, -3.1509594917297363, -2.0376691818237305, -0.9243788719177246, 0.18891525268554688, 1.3022055625915527, 2.4154958724975586, 3.5287861824035645, 4.64207649230957, 5.755366802215576, 6.868657112121582, 7.981947422027588, 9.095237731933594, 10.208528518676758, 11.321818351745605, 12.435108184814453, 13.548398971557617, 14.661689758300781, 15.774979591369629, 16.888269424438477, 18.00156021118164, 19.114850997924805, 20.22814178466797, 21.3414306640625, 22.454721450805664, 23.568012237548828, 24.68130111694336, 25.794591903686523, 26.907882690429688, 28.02117347717285, 29.134464263916016, 30.247753143310547, 31.36104393005371, 32.474334716796875, 33.587623596191406, 34.7009162902832, 35.814205169677734]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 2.0, 3.0, 9.0, 10.0, 13.0, 16.0, 18.0, 15.0, 19.0, 16.0, 18.0, 31.0, 31.0, 24.0, 39.0, 34.0, 28.0, 44.0, 38.0, 39.0, 51.0, 37.0, 48.0, 31.0, 36.0, 35.0, 39.0, 35.0, 24.0, 16.0, 31.0, 25.0, 34.0, 13.0, 20.0, 13.0, 15.0, 12.0, 9.0, 11.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.88983154296875, -3.7523193359375, -3.61480712890625, -3.477294921875, -3.33978271484375, -3.2022705078125, -3.06475830078125, -2.92724609375, -2.78973388671875, -2.6522216796875, -2.51470947265625, -2.377197265625, -2.23968505859375, -2.1021728515625, -1.96466064453125, -1.8271484375, -1.68963623046875, -1.5521240234375, -1.41461181640625, -1.277099609375, -1.13958740234375, -1.0020751953125, -0.86456298828125, -0.72705078125, -0.58953857421875, -0.4520263671875, -0.31451416015625, -0.177001953125, -0.03948974609375, 0.0980224609375, 0.23553466796875, 0.373046875, 0.51055908203125, 0.6480712890625, 0.78558349609375, 0.923095703125, 1.06060791015625, 1.1981201171875, 1.33563232421875, 1.47314453125, 1.61065673828125, 1.7481689453125, 1.88568115234375, 2.023193359375, 2.16070556640625, 2.2982177734375, 2.43572998046875, 2.5732421875, 2.71075439453125, 2.8482666015625, 2.98577880859375, 3.123291015625, 3.26080322265625, 3.3983154296875, 3.53582763671875, 3.67333984375, 3.81085205078125, 3.9483642578125, 4.08587646484375, 4.223388671875, 4.36090087890625, 4.4984130859375, 4.63592529296875, 4.7734375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 14.0, 19.0, 30.0, 31.0, 32.0, 55.0, 76.0, 93.0, 146.0, 221.0, 350.0, 494.0, 840.0, 1349.0, 2416.0, 4593.0, 10051.0, 25926.0, 84566.0, 488928.0, 2530887.0, 859975.0, 123948.0, 33210.0, 12653.0, 5779.0, 2972.0, 1668.0, 1023.0, 660.0, 402.0, 264.0, 201.0, 120.0, 87.0, 62.0, 51.0, 22.0, 16.0, 13.0, 11.0, 8.0, 3.0, 1.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.1875, -10.822265625, -10.45703125, -10.091796875, -9.7265625, -9.361328125, -8.99609375, -8.630859375, -8.265625, -7.900390625, -7.53515625, -7.169921875, -6.8046875, -6.439453125, -6.07421875, -5.708984375, -5.34375, -4.978515625, -4.61328125, -4.248046875, -3.8828125, -3.517578125, -3.15234375, -2.787109375, -2.421875, -2.056640625, -1.69140625, -1.326171875, -0.9609375, -0.595703125, -0.23046875, 0.134765625, 0.5, 0.865234375, 1.23046875, 1.595703125, 1.9609375, 2.326171875, 2.69140625, 3.056640625, 3.421875, 3.787109375, 4.15234375, 4.517578125, 4.8828125, 5.248046875, 5.61328125, 5.978515625, 6.34375, 6.708984375, 7.07421875, 7.439453125, 7.8046875, 8.169921875, 8.53515625, 8.900390625, 9.265625, 9.630859375, 9.99609375, 10.361328125, 10.7265625, 11.091796875, 11.45703125, 11.822265625, 12.1875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 16.0, 16.0, 23.0, 36.0, 48.0, 78.0, 143.0, 248.0, 382.0, 713.0, 858.0, 589.0, 359.0, 212.0, 111.0, 84.0, 41.0, 25.0, 20.0, 23.0, 13.0, 16.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.484375, -16.943359375, -16.40234375, -15.861328125, -15.3203125, -14.779296875, -14.23828125, -13.697265625, -13.15625, -12.615234375, -12.07421875, -11.533203125, -10.9921875, -10.451171875, -9.91015625, -9.369140625, -8.828125, -8.287109375, -7.74609375, -7.205078125, -6.6640625, -6.123046875, -5.58203125, -5.041015625, -4.5, -3.958984375, -3.41796875, -2.876953125, -2.3359375, -1.794921875, -1.25390625, -0.712890625, -0.171875, 0.369140625, 0.91015625, 1.451171875, 1.9921875, 2.533203125, 3.07421875, 3.615234375, 4.15625, 4.697265625, 5.23828125, 5.779296875, 6.3203125, 6.861328125, 7.40234375, 7.943359375, 8.484375, 9.025390625, 9.56640625, 10.107421875, 10.6484375, 11.189453125, 11.73046875, 12.271484375, 12.8125, 13.353515625, 13.89453125, 14.435546875, 14.9765625, 15.517578125, 16.05859375, 16.599609375, 17.140625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 10.0, 5.0, 21.0, 31.0, 44.0, 65.0, 115.0, 270.0, 641.0, 2097.0, 8450.0, 57760.0, 2115703.0, 1942334.0, 55342.0, 8248.0, 2005.0, 636.0, 229.0, 124.0, 74.0, 33.0, 21.0, 9.0, 5.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.37353515625, -34.1533203125, -32.93310546875, -31.712890625, -30.49267578125, -29.2724609375, -28.05224609375, -26.83203125, -25.61181640625, -24.3916015625, -23.17138671875, -21.951171875, -20.73095703125, -19.5107421875, -18.29052734375, -17.0703125, -15.85009765625, -14.6298828125, -13.40966796875, -12.189453125, -10.96923828125, -9.7490234375, -8.52880859375, -7.30859375, -6.08837890625, -4.8681640625, -3.64794921875, -2.427734375, -1.20751953125, 0.0126953125, 1.23291015625, 2.453125, 3.67333984375, 4.8935546875, 6.11376953125, 7.333984375, 8.55419921875, 9.7744140625, 10.99462890625, 12.21484375, 13.43505859375, 14.6552734375, 15.87548828125, 17.095703125, 18.31591796875, 19.5361328125, 20.75634765625, 21.9765625, 23.19677734375, 24.4169921875, 25.63720703125, 26.857421875, 28.07763671875, 29.2978515625, 30.51806640625, 31.73828125, 32.95849609375, 34.1787109375, 35.39892578125, 36.619140625, 37.83935546875, 39.0595703125, 40.27978515625, 41.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 16.0, 42.0, 135.0, 234.0, 301.0, 172.0, 72.0, 30.0, 4.0, 4.0], "bins": [-351.56719970703125, -345.52203369140625, -339.4768981933594, -333.4317321777344, -327.3865661621094, -321.3414306640625, -315.2962646484375, -309.2510986328125, -303.2059326171875, -297.1607666015625, -291.1156311035156, -285.0704650878906, -279.0252990722656, -272.98016357421875, -266.93499755859375, -260.88983154296875, -254.84469604492188, -248.79954528808594, -242.75437927246094, -236.709228515625, -230.6640625, -224.61891174316406, -218.57376098632812, -212.52859497070312, -206.4834442138672, -200.43829345703125, -194.39312744140625, -188.3479766845703, -182.30282592773438, -176.25765991210938, -170.21250915527344, -164.1673583984375, -158.12217712402344, -152.0770263671875, -146.0318603515625, -139.98670959472656, -133.94155883789062, -127.89639282226562, -121.85124206542969, -115.80608367919922, -109.76092529296875, -103.71576690673828, -97.67060852050781, -91.62545776367188, -85.5802993774414, -79.53514099121094, -73.489990234375, -67.44483184814453, -61.39967346191406, -55.354515075683594, -49.30936050415039, -43.26420593261719, -37.21904754638672, -31.173891067504883, -25.128734588623047, -19.083580017089844, -13.038421630859375, -6.993265151977539, -0.9481086730957031, 5.097047805786133, 11.142204284667969, 17.187360763549805, 23.23251724243164, 29.277671813964844, 35.32283020019531]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 11.0, 6.0, 13.0, 12.0, 12.0, 20.0, 19.0, 16.0, 21.0, 36.0, 29.0, 38.0, 29.0, 35.0, 30.0, 37.0, 35.0, 37.0, 37.0, 44.0, 41.0, 35.0, 42.0, 43.0, 31.0, 30.0, 37.0, 24.0, 22.0, 30.0, 21.0, 11.0, 11.0, 11.0, 12.0, 11.0, 8.0, 10.0, 5.0, 7.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-38.842124938964844, -37.6963005065918, -36.550479888916016, -35.40465545654297, -34.25883483886719, -33.11301040649414, -31.967187881469727, -30.821365356445312, -29.675540924072266, -28.52971839904785, -27.383895874023438, -26.23807144165039, -25.092248916625977, -23.946426391601562, -22.80060386657715, -21.654781341552734, -20.50895881652832, -19.363136291503906, -18.217313766479492, -17.071491241455078, -15.925666809082031, -14.779844284057617, -13.634021759033203, -12.488198280334473, -11.342375755310059, -10.196553230285645, -9.050729751586914, -7.9049072265625, -6.759084224700928, -5.6132612228393555, -4.467438697814941, -3.321615219116211, -2.175792694091797, -1.0299698114395142, 0.11585307121276855, 1.2616758346557617, 2.407498836517334, 3.5533218383789062, 4.69914436340332, 5.844967842102051, 6.990790367126465, 8.136612892150879, 9.28243637084961, 10.428258895874023, 11.574081420898438, 12.719904899597168, 13.865727424621582, 15.011550903320312, 16.157373428344727, 17.30319595336914, 18.449018478393555, 19.59484100341797, 20.740665435791016, 21.88648796081543, 23.032310485839844, 24.17813491821289, 25.323955535888672, 26.469778060913086, 27.6156005859375, 28.761425018310547, 29.90724754333496, 31.053070068359375, 32.198890686035156, 33.3447151184082, 34.49053955078125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 3.0, 6.0, 16.0, 11.0, 15.0, 22.0, 22.0, 28.0, 16.0, 27.0, 35.0, 35.0, 32.0, 42.0, 29.0, 43.0, 41.0, 39.0, 48.0, 31.0, 42.0, 46.0, 31.0, 37.0, 30.0, 26.0, 27.0, 20.0, 35.0, 27.0, 14.0, 22.0, 20.0, 12.0, 14.0, 8.0, 4.0, 8.0, 7.0, 4.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.71875, -3.58331298828125, -3.4478759765625, -3.31243896484375, -3.177001953125, -3.04156494140625, -2.9061279296875, -2.77069091796875, -2.63525390625, -2.49981689453125, -2.3643798828125, -2.22894287109375, -2.093505859375, -1.95806884765625, -1.8226318359375, -1.68719482421875, -1.5517578125, -1.41632080078125, -1.2808837890625, -1.14544677734375, -1.010009765625, -0.87457275390625, -0.7391357421875, -0.60369873046875, -0.46826171875, -0.33282470703125, -0.1973876953125, -0.06195068359375, 0.073486328125, 0.20892333984375, 0.3443603515625, 0.47979736328125, 0.615234375, 0.75067138671875, 0.8861083984375, 1.02154541015625, 1.156982421875, 1.29241943359375, 1.4278564453125, 1.56329345703125, 1.69873046875, 1.83416748046875, 1.9696044921875, 2.10504150390625, 2.240478515625, 2.37591552734375, 2.5113525390625, 2.64678955078125, 2.7822265625, 2.91766357421875, 3.0531005859375, 3.18853759765625, 3.323974609375, 3.45941162109375, 3.5948486328125, 3.73028564453125, 3.86572265625, 4.00115966796875, 4.1365966796875, 4.27203369140625, 4.407470703125, 4.54290771484375, 4.6783447265625, 4.81378173828125, 4.94921875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 4.0, 5.0, 11.0, 19.0, 14.0, 21.0, 39.0, 60.0, 85.0, 153.0, 221.0, 384.0, 642.0, 1148.0, 2078.0, 3905.0, 7281.0, 13976.0, 25877.0, 46902.0, 81657.0, 161360.0, 335635.0, 173600.0, 85764.0, 49279.0, 27119.0, 14494.0, 7608.0, 4067.0, 2216.0, 1166.0, 678.0, 383.0, 256.0, 159.0, 72.0, 71.0, 34.0, 36.0, 20.0, 10.0, 11.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.693511962890625, -3.57257080078125, -3.451629638671875, -3.3306884765625, -3.209747314453125, -3.08880615234375, -2.967864990234375, -2.846923828125, -2.725982666015625, -2.60504150390625, -2.484100341796875, -2.3631591796875, -2.242218017578125, -2.12127685546875, -2.000335693359375, -1.87939453125, -1.758453369140625, -1.63751220703125, -1.516571044921875, -1.3956298828125, -1.274688720703125, -1.15374755859375, -1.032806396484375, -0.911865234375, -0.790924072265625, -0.66998291015625, -0.549041748046875, -0.4281005859375, -0.307159423828125, -0.18621826171875, -0.065277099609375, 0.0556640625, 0.176605224609375, 0.29754638671875, 0.418487548828125, 0.5394287109375, 0.660369873046875, 0.78131103515625, 0.902252197265625, 1.023193359375, 1.144134521484375, 1.26507568359375, 1.386016845703125, 1.5069580078125, 1.627899169921875, 1.74884033203125, 1.869781494140625, 1.99072265625, 2.111663818359375, 2.23260498046875, 2.353546142578125, 2.4744873046875, 2.595428466796875, 2.71636962890625, 2.837310791015625, 2.958251953125, 3.079193115234375, 3.20013427734375, 3.321075439453125, 3.4420166015625, 3.562957763671875, 3.68389892578125, 3.804840087890625, 3.92578125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 2.0, 7.0, 11.0, 13.0, 8.0, 16.0, 21.0, 25.0, 24.0, 22.0, 26.0, 28.0, 29.0, 32.0, 44.0, 40.0, 50.0, 42.0, 41.0, 1073.0, 47.0, 35.0, 30.0, 35.0, 39.0, 40.0, 32.0, 24.0, 30.0, 19.0, 26.0, 26.0, 13.0, 11.0, 14.0, 6.0, 9.0, 6.0, 5.0, 6.0, 3.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.57318115234375, -3.4510498046875, -3.32891845703125, -3.206787109375, -3.08465576171875, -2.9625244140625, -2.84039306640625, -2.71826171875, -2.59613037109375, -2.4739990234375, -2.35186767578125, -2.229736328125, -2.10760498046875, -1.9854736328125, -1.86334228515625, -1.7412109375, -1.61907958984375, -1.4969482421875, -1.37481689453125, -1.252685546875, -1.13055419921875, -1.0084228515625, -0.88629150390625, -0.76416015625, -0.64202880859375, -0.5198974609375, -0.39776611328125, -0.275634765625, -0.15350341796875, -0.0313720703125, 0.09075927734375, 0.212890625, 0.33502197265625, 0.4571533203125, 0.57928466796875, 0.701416015625, 0.82354736328125, 0.9456787109375, 1.06781005859375, 1.18994140625, 1.31207275390625, 1.4342041015625, 1.55633544921875, 1.678466796875, 1.80059814453125, 1.9227294921875, 2.04486083984375, 2.1669921875, 2.28912353515625, 2.4112548828125, 2.53338623046875, 2.655517578125, 2.77764892578125, 2.8997802734375, 3.02191162109375, 3.14404296875, 3.26617431640625, 3.3883056640625, 3.51043701171875, 3.632568359375, 3.75469970703125, 3.8768310546875, 3.99896240234375, 4.12109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 10.0, 2.0, 12.0, 11.0, 14.0, 20.0, 24.0, 29.0, 40.0, 41.0, 66.0, 112.0, 156.0, 180.0, 252.0, 374.0, 506.0, 726.0, 1130.0, 1485.0, 2134.0, 3227.0, 4721.0, 7136.0, 11197.0, 18527.0, 39730.0, 278060.0, 1605165.0, 60395.0, 23166.0, 13088.0, 8004.0, 5284.0, 3620.0, 2554.0, 1710.0, 1221.0, 799.0, 559.0, 478.0, 324.0, 212.0, 183.0, 107.0, 96.0, 76.0, 43.0, 34.0, 38.0, 24.0, 8.0, 9.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.37890625, -4.2427978515625, -4.106689453125, -3.9705810546875, -3.83447265625, -3.6983642578125, -3.562255859375, -3.4261474609375, -3.2900390625, -3.1539306640625, -3.017822265625, -2.8817138671875, -2.74560546875, -2.6094970703125, -2.473388671875, -2.3372802734375, -2.201171875, -2.0650634765625, -1.928955078125, -1.7928466796875, -1.65673828125, -1.5206298828125, -1.384521484375, -1.2484130859375, -1.1123046875, -0.9761962890625, -0.840087890625, -0.7039794921875, -0.56787109375, -0.4317626953125, -0.295654296875, -0.1595458984375, -0.0234375, 0.1126708984375, 0.248779296875, 0.3848876953125, 0.52099609375, 0.6571044921875, 0.793212890625, 0.9293212890625, 1.0654296875, 1.2015380859375, 1.337646484375, 1.4737548828125, 1.60986328125, 1.7459716796875, 1.882080078125, 2.0181884765625, 2.154296875, 2.2904052734375, 2.426513671875, 2.5626220703125, 2.69873046875, 2.8348388671875, 2.970947265625, 3.1070556640625, 3.2431640625, 3.3792724609375, 3.515380859375, 3.6514892578125, 3.78759765625, 3.9237060546875, 4.059814453125, 4.1959228515625, 4.33203125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 13.0, 13.0, 10.0, 15.0, 22.0, 33.0, 44.0, 92.0, 118.0, 151.0, 131.0, 105.0, 64.0, 36.0, 27.0, 12.0, 15.0, 13.0, 16.0, 9.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6262893676757812, -0.6070709228515625, -0.5878524780273438, -0.568634033203125, -0.5494155883789062, -0.5301971435546875, -0.5109786987304688, -0.49176025390625, -0.47254180908203125, -0.4533233642578125, -0.43410491943359375, -0.414886474609375, -0.39566802978515625, -0.3764495849609375, -0.35723114013671875, -0.3380126953125, -0.31879425048828125, -0.2995758056640625, -0.28035736083984375, -0.261138916015625, -0.24192047119140625, -0.2227020263671875, -0.20348358154296875, -0.18426513671875, -0.16504669189453125, -0.1458282470703125, -0.12660980224609375, -0.107391357421875, -0.08817291259765625, -0.0689544677734375, -0.04973602294921875, -0.030517578125, -0.01129913330078125, 0.0079193115234375, 0.02713775634765625, 0.046356201171875, 0.06557464599609375, 0.0847930908203125, 0.10401153564453125, 0.12322998046875, 0.14244842529296875, 0.1616668701171875, 0.18088531494140625, 0.200103759765625, 0.21932220458984375, 0.2385406494140625, 0.25775909423828125, 0.2769775390625, 0.29619598388671875, 0.3154144287109375, 0.33463287353515625, 0.353851318359375, 0.37306976318359375, 0.3922882080078125, 0.41150665283203125, 0.43072509765625, 0.44994354248046875, 0.4691619873046875, 0.48838043212890625, 0.507598876953125, 0.5268173217773438, 0.5460357666015625, 0.5652542114257812, 0.58447265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 6.0, 5.0, 4.0, 8.0, 13.0, 21.0, 21.0, 27.0, 39.0, 57.0, 90.0, 179.0, 550.0, 2360.0, 16202.0, 819911.0, 197354.0, 9326.0, 1540.0, 419.0, 142.0, 97.0, 53.0, 28.0, 27.0, 16.0, 16.0, 11.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.262451171875, -7.98583984375, -7.709228515625, -7.4326171875, -7.156005859375, -6.87939453125, -6.602783203125, -6.326171875, -6.049560546875, -5.77294921875, -5.496337890625, -5.2197265625, -4.943115234375, -4.66650390625, -4.389892578125, -4.11328125, -3.836669921875, -3.56005859375, -3.283447265625, -3.0068359375, -2.730224609375, -2.45361328125, -2.177001953125, -1.900390625, -1.623779296875, -1.34716796875, -1.070556640625, -0.7939453125, -0.517333984375, -0.24072265625, 0.035888671875, 0.3125, 0.589111328125, 0.86572265625, 1.142333984375, 1.4189453125, 1.695556640625, 1.97216796875, 2.248779296875, 2.525390625, 2.802001953125, 3.07861328125, 3.355224609375, 3.6318359375, 3.908447265625, 4.18505859375, 4.461669921875, 4.73828125, 5.014892578125, 5.29150390625, 5.568115234375, 5.8447265625, 6.121337890625, 6.39794921875, 6.674560546875, 6.951171875, 7.227783203125, 7.50439453125, 7.781005859375, 8.0576171875, 8.334228515625, 8.61083984375, 8.887451171875, 9.1640625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 11.0, 27.0, 58.0, 127.0, 316.0, 279.0, 96.0, 47.0, 21.0, 10.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.545872211456299, -6.3406758308410645, -6.135479927062988, -5.930283546447754, -5.725087642669678, -5.519891262054443, -5.314695358276367, -5.109498977661133, -4.904302597045898, -4.699106216430664, -4.493910312652588, -4.2887139320373535, -4.083518028259277, -3.878321647644043, -3.6731255054473877, -3.4679293632507324, -3.2627334594726562, -3.057537317276001, -2.8523411750793457, -2.6471447944641113, -2.441948890686035, -2.236752510070801, -2.0315563678741455, -1.8263602256774902, -1.621164083480835, -1.4159679412841797, -1.2107717990875244, -1.0055755376815796, -0.8003793954849243, -0.595183253288269, -0.3899869918823242, -0.18479084968566895, 0.02040576934814453, 0.2256019413471222, 0.43079811334609985, 0.6359943151473999, 0.8411904573440552, 1.0463865995407104, 1.2515828609466553, 1.4567790031433105, 1.6619751453399658, 1.867171287536621, 2.0723674297332764, 2.2775635719299316, 2.482759952545166, 2.687955856323242, 2.8931522369384766, 3.098348379135132, 3.303544521331787, 3.5087406635284424, 3.7139368057250977, 3.919133186340332, 4.124329090118408, 4.329525470733643, 4.534721374511719, 4.739917755126953, 4.9451141357421875, 5.150310516357422, 5.355506420135498, 5.560702800750732, 5.765898704528809, 5.971095085144043, 6.176291465759277, 6.3814873695373535, 6.58668327331543]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 11.0, 11.0, 9.0, 15.0, 16.0, 25.0, 14.0, 29.0, 24.0, 25.0, 32.0, 39.0, 38.0, 35.0, 44.0, 43.0, 47.0, 42.0, 39.0, 45.0, 41.0, 57.0, 38.0, 29.0, 29.0, 29.0, 28.0, 34.0, 27.0, 26.0, 15.0, 11.0, 11.0, 7.0, 9.0, 4.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3711695671081543, -1.3273911476135254, -1.283612608909607, -1.2398340702056885, -1.1960556507110596, -1.1522772312164307, -1.1084986925125122, -1.0647201538085938, -1.0209417343139648, -0.9771632552146912, -0.9333847761154175, -0.8896062970161438, -0.8458278179168701, -0.8020493388175964, -0.7582708597183228, -0.7144923806190491, -0.6707139015197754, -0.6269354224205017, -0.583156943321228, -0.5393784642219543, -0.49559998512268066, -0.451821506023407, -0.4080430269241333, -0.3642645478248596, -0.32048606872558594, -0.27670758962631226, -0.23292911052703857, -0.1891506314277649, -0.1453721523284912, -0.10159367322921753, -0.05781519412994385, -0.014036715030670166, 0.029741644859313965, 0.07352012395858765, 0.11729860305786133, 0.161077082157135, 0.2048555612564087, 0.24863404035568237, 0.29241251945495605, 0.33619099855422974, 0.3799694776535034, 0.4237479567527771, 0.4675264358520508, 0.5113049149513245, 0.5550833940505981, 0.5988618731498718, 0.6426403522491455, 0.6864188313484192, 0.7301973104476929, 0.7739757895469666, 0.8177542686462402, 0.8615327477455139, 0.9053112268447876, 0.9490897059440613, 0.992868185043335, 1.0366466045379639, 1.0804251432418823, 1.1242036819458008, 1.1679821014404297, 1.2117605209350586, 1.255539059638977, 1.2993175983428955, 1.3430960178375244, 1.3868744373321533, 1.4306529760360718]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 4.0, 6.0, 17.0, 8.0, 17.0, 20.0, 23.0, 27.0, 15.0, 26.0, 32.0, 43.0, 32.0, 30.0, 41.0, 39.0, 39.0, 40.0, 50.0, 28.0, 39.0, 44.0, 37.0, 39.0, 26.0, 28.0, 25.0, 29.0, 26.0, 29.0, 17.0, 26.0, 15.0, 13.0, 13.0, 8.0, 6.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.76171875, -3.62530517578125, -3.4888916015625, -3.35247802734375, -3.216064453125, -3.07965087890625, -2.9432373046875, -2.80682373046875, -2.67041015625, -2.53399658203125, -2.3975830078125, -2.26116943359375, -2.124755859375, -1.98834228515625, -1.8519287109375, -1.71551513671875, -1.5791015625, -1.44268798828125, -1.3062744140625, -1.16986083984375, -1.033447265625, -0.89703369140625, -0.7606201171875, -0.62420654296875, -0.48779296875, -0.35137939453125, -0.2149658203125, -0.07855224609375, 0.057861328125, 0.19427490234375, 0.3306884765625, 0.46710205078125, 0.603515625, 0.73992919921875, 0.8763427734375, 1.01275634765625, 1.149169921875, 1.28558349609375, 1.4219970703125, 1.55841064453125, 1.69482421875, 1.83123779296875, 1.9676513671875, 2.10406494140625, 2.240478515625, 2.37689208984375, 2.5133056640625, 2.64971923828125, 2.7861328125, 2.92254638671875, 3.0589599609375, 3.19537353515625, 3.331787109375, 3.46820068359375, 3.6046142578125, 3.74102783203125, 3.87744140625, 4.01385498046875, 4.1502685546875, 4.28668212890625, 4.423095703125, 4.55950927734375, 4.6959228515625, 4.83233642578125, 4.96875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 2.0, 14.0, 11.0, 19.0, 26.0, 54.0, 72.0, 124.0, 180.0, 339.0, 562.0, 1031.0, 1805.0, 3240.0, 5459.0, 10086.0, 18955.0, 35936.0, 72883.0, 185033.0, 394922.0, 172675.0, 69727.0, 34704.0, 18388.0, 9725.0, 5568.0, 3015.0, 1694.0, 945.0, 508.0, 313.0, 214.0, 128.0, 64.0, 48.0, 28.0, 16.0, 14.0, 6.0, 5.0, 2.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.99505615234375, -5.8104248046875, -5.62579345703125, -5.441162109375, -5.25653076171875, -5.0718994140625, -4.88726806640625, -4.70263671875, -4.51800537109375, -4.3333740234375, -4.14874267578125, -3.964111328125, -3.77947998046875, -3.5948486328125, -3.41021728515625, -3.2255859375, -3.04095458984375, -2.8563232421875, -2.67169189453125, -2.487060546875, -2.30242919921875, -2.1177978515625, -1.93316650390625, -1.74853515625, -1.56390380859375, -1.3792724609375, -1.19464111328125, -1.010009765625, -0.82537841796875, -0.6407470703125, -0.45611572265625, -0.271484375, -0.08685302734375, 0.0977783203125, 0.28240966796875, 0.467041015625, 0.65167236328125, 0.8363037109375, 1.02093505859375, 1.20556640625, 1.39019775390625, 1.5748291015625, 1.75946044921875, 1.944091796875, 2.12872314453125, 2.3133544921875, 2.49798583984375, 2.6826171875, 2.86724853515625, 3.0518798828125, 3.23651123046875, 3.421142578125, 3.60577392578125, 3.7904052734375, 3.97503662109375, 4.15966796875, 4.34429931640625, 4.5289306640625, 4.71356201171875, 4.898193359375, 5.08282470703125, 5.2674560546875, 5.45208740234375, 5.63671875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 5.0, 8.0, 6.0, 11.0, 14.0, 8.0, 5.0, 12.0, 20.0, 24.0, 24.0, 25.0, 25.0, 36.0, 34.0, 38.0, 56.0, 52.0, 81.0, 135.0, 260.0, 1371.0, 189.0, 94.0, 73.0, 59.0, 40.0, 35.0, 39.0, 39.0, 33.0, 34.0, 27.0, 13.0, 21.0, 15.0, 14.0, 12.0, 11.0, 10.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.375, -12.9473876953125, -12.519775390625, -12.0921630859375, -11.66455078125, -11.2369384765625, -10.809326171875, -10.3817138671875, -9.9541015625, -9.5264892578125, -9.098876953125, -8.6712646484375, -8.24365234375, -7.8160400390625, -7.388427734375, -6.9608154296875, -6.533203125, -6.1055908203125, -5.677978515625, -5.2503662109375, -4.82275390625, -4.3951416015625, -3.967529296875, -3.5399169921875, -3.1123046875, -2.6846923828125, -2.257080078125, -1.8294677734375, -1.40185546875, -0.9742431640625, -0.546630859375, -0.1190185546875, 0.30859375, 0.7362060546875, 1.163818359375, 1.5914306640625, 2.01904296875, 2.4466552734375, 2.874267578125, 3.3018798828125, 3.7294921875, 4.1571044921875, 4.584716796875, 5.0123291015625, 5.43994140625, 5.8675537109375, 6.295166015625, 6.7227783203125, 7.150390625, 7.5780029296875, 8.005615234375, 8.4332275390625, 8.86083984375, 9.2884521484375, 9.716064453125, 10.1436767578125, 10.5712890625, 10.9989013671875, 11.426513671875, 11.8541259765625, 12.28173828125, 12.7093505859375, 13.136962890625, 13.5645751953125, 13.9921875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 10.0, 12.0, 9.0, 15.0, 36.0, 56.0, 74.0, 113.0, 205.0, 383.0, 919.0, 3106.0, 26059.0, 2556749.0, 542296.0, 12169.0, 2044.0, 680.0, 293.0, 187.0, 85.0, 63.0, 42.0, 25.0, 18.0, 14.0, 10.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.15625, -39.8642578125, -38.572265625, -37.2802734375, -35.98828125, -34.6962890625, -33.404296875, -32.1123046875, -30.8203125, -29.5283203125, -28.236328125, -26.9443359375, -25.65234375, -24.3603515625, -23.068359375, -21.7763671875, -20.484375, -19.1923828125, -17.900390625, -16.6083984375, -15.31640625, -14.0244140625, -12.732421875, -11.4404296875, -10.1484375, -8.8564453125, -7.564453125, -6.2724609375, -4.98046875, -3.6884765625, -2.396484375, -1.1044921875, 0.1875, 1.4794921875, 2.771484375, 4.0634765625, 5.35546875, 6.6474609375, 7.939453125, 9.2314453125, 10.5234375, 11.8154296875, 13.107421875, 14.3994140625, 15.69140625, 16.9833984375, 18.275390625, 19.5673828125, 20.859375, 22.1513671875, 23.443359375, 24.7353515625, 26.02734375, 27.3193359375, 28.611328125, 29.9033203125, 31.1953125, 32.4873046875, 33.779296875, 35.0712890625, 36.36328125, 37.6552734375, 38.947265625, 40.2392578125, 41.53125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 13.0, 138.0, 473.0, 328.0, 53.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.17153930664062, -74.7376937866211, -69.3038558959961, -63.87001037597656, -58.43617248535156, -53.00232696533203, -47.568485260009766, -42.1346435546875, -36.700801849365234, -31.26696014404297, -25.833118438720703, -20.399274826049805, -14.965433120727539, -9.531591415405273, -4.097747802734375, 1.3360939025878906, 6.769935607910156, 12.203777313232422, 17.637619018554688, 23.071462631225586, 28.50530433654785, 33.93914794921875, 39.372989654541016, 44.80683135986328, 50.24067306518555, 55.67451477050781, 61.10835647583008, 66.54219818115234, 71.97604370117188, 77.40988159179688, 82.8437271118164, 88.27757263183594, 93.71141052246094, 99.14525604248047, 104.57909393310547, 110.012939453125, 115.44677734375, 120.88062286376953, 126.31446838378906, 131.74830627441406, 137.18214416503906, 142.61598205566406, 148.04983520507812, 153.48367309570312, 158.91751098632812, 164.35134887695312, 169.7852020263672, 175.2190399169922, 180.65289306640625, 186.08673095703125, 191.5205841064453, 196.9544219970703, 202.3882598876953, 207.8220977783203, 213.25595092773438, 218.68978881835938, 224.12362670898438, 229.55746459960938, 234.99131774902344, 240.42515563964844, 245.85899353027344, 251.29283142089844, 256.7266845703125, 262.1605224609375, 267.5943603515625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 3.0, 9.0, 8.0, 11.0, 8.0, 16.0, 17.0, 23.0, 13.0, 18.0, 20.0, 24.0, 32.0, 33.0, 41.0, 26.0, 39.0, 39.0, 36.0, 34.0, 41.0, 45.0, 29.0, 45.0, 29.0, 47.0, 33.0, 44.0, 25.0, 31.0, 30.0, 20.0, 18.0, 9.0, 18.0, 16.0, 11.0, 10.0, 8.0, 7.0, 5.0, 8.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-44.41162872314453, -43.09401321411133, -41.776397705078125, -40.45878601074219, -39.141170501708984, -37.82355499267578, -36.50593948364258, -35.188323974609375, -33.87071228027344, -32.553096771240234, -31.235483169555664, -29.91786766052246, -28.60025405883789, -27.282638549804688, -25.965023040771484, -24.64740753173828, -23.329792022705078, -22.012176513671875, -20.694562911987305, -19.3769474029541, -18.05933380126953, -16.741718292236328, -15.424102783203125, -14.106488227844238, -12.788873672485352, -11.471259117126465, -10.153644561767578, -8.836029052734375, -7.518414497375488, -6.200799942016602, -4.883184909820557, -3.5655698776245117, -2.2479515075683594, -0.9303367137908936, 0.38727807998657227, 1.704892873764038, 3.022507667541504, 4.340122222900391, 5.6577372550964355, 6.9753522872924805, 8.292966842651367, 9.610581398010254, 10.92819595336914, 12.245811462402344, 13.56342601776123, 14.881040573120117, 16.19865608215332, 17.51626968383789, 18.833885192871094, 20.151500701904297, 21.469114303588867, 22.78672981262207, 24.10434341430664, 25.421958923339844, 26.739574432373047, 28.05718994140625, 29.37480354309082, 30.692419052124023, 32.010032653808594, 33.3276481628418, 34.645263671875, 35.96287536621094, 37.28049087524414, 38.598106384277344, 39.91572189331055]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 10.0, 10.0, 16.0, 21.0, 17.0, 20.0, 22.0, 21.0, 28.0, 31.0, 36.0, 37.0, 42.0, 30.0, 36.0, 42.0, 37.0, 50.0, 43.0, 38.0, 39.0, 32.0, 27.0, 32.0, 26.0, 23.0, 24.0, 23.0, 25.0, 20.0, 29.0, 21.0, 16.0, 9.0, 8.0, 10.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.861328125, -3.721038818359375, -3.58074951171875, -3.440460205078125, -3.3001708984375, -3.159881591796875, -3.01959228515625, -2.879302978515625, -2.739013671875, -2.598724365234375, -2.45843505859375, -2.318145751953125, -2.1778564453125, -2.037567138671875, -1.89727783203125, -1.756988525390625, -1.61669921875, -1.476409912109375, -1.33612060546875, -1.195831298828125, -1.0555419921875, -0.915252685546875, -0.77496337890625, -0.634674072265625, -0.494384765625, -0.354095458984375, -0.21380615234375, -0.073516845703125, 0.0667724609375, 0.207061767578125, 0.34735107421875, 0.487640380859375, 0.6279296875, 0.768218994140625, 0.90850830078125, 1.048797607421875, 1.1890869140625, 1.329376220703125, 1.46966552734375, 1.609954833984375, 1.750244140625, 1.890533447265625, 2.03082275390625, 2.171112060546875, 2.3114013671875, 2.451690673828125, 2.59197998046875, 2.732269287109375, 2.87255859375, 3.012847900390625, 3.15313720703125, 3.293426513671875, 3.4337158203125, 3.574005126953125, 3.71429443359375, 3.854583740234375, 3.994873046875, 4.135162353515625, 4.27545166015625, 4.415740966796875, 4.5560302734375, 4.696319580078125, 4.83660888671875, 4.976898193359375, 5.1171875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 6.0, 12.0, 12.0, 25.0, 33.0, 32.0, 62.0, 84.0, 139.0, 211.0, 311.0, 502.0, 777.0, 1309.0, 2224.0, 3961.0, 8013.0, 18269.0, 52318.0, 229853.0, 1665734.0, 1862428.0, 253959.0, 55552.0, 19592.0, 8304.0, 4255.0, 2294.0, 1392.0, 870.0, 560.0, 386.0, 275.0, 164.0, 108.0, 82.0, 46.0, 47.0, 25.0, 16.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.3587646484375, -10.967529296875, -10.5762939453125, -10.18505859375, -9.7938232421875, -9.402587890625, -9.0113525390625, -8.6201171875, -8.2288818359375, -7.837646484375, -7.4464111328125, -7.05517578125, -6.6639404296875, -6.272705078125, -5.8814697265625, -5.490234375, -5.0989990234375, -4.707763671875, -4.3165283203125, -3.92529296875, -3.5340576171875, -3.142822265625, -2.7515869140625, -2.3603515625, -1.9691162109375, -1.577880859375, -1.1866455078125, -0.79541015625, -0.4041748046875, -0.012939453125, 0.3782958984375, 0.76953125, 1.1607666015625, 1.552001953125, 1.9432373046875, 2.33447265625, 2.7257080078125, 3.116943359375, 3.5081787109375, 3.8994140625, 4.2906494140625, 4.681884765625, 5.0731201171875, 5.46435546875, 5.8555908203125, 6.246826171875, 6.6380615234375, 7.029296875, 7.4205322265625, 7.811767578125, 8.2030029296875, 8.59423828125, 8.9854736328125, 9.376708984375, 9.7679443359375, 10.1591796875, 10.5504150390625, 10.941650390625, 11.3328857421875, 11.72412109375, 12.1153564453125, 12.506591796875, 12.8978271484375, 13.2890625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 12.0, 8.0, 14.0, 21.0, 29.0, 39.0, 71.0, 73.0, 90.0, 130.0, 192.0, 268.0, 380.0, 499.0, 569.0, 437.0, 325.0, 274.0, 169.0, 121.0, 89.0, 54.0, 42.0, 33.0, 22.0, 21.0, 20.0, 10.0, 11.0, 2.0, 10.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.4453125, -12.0712890625, -11.697265625, -11.3232421875, -10.94921875, -10.5751953125, -10.201171875, -9.8271484375, -9.453125, -9.0791015625, -8.705078125, -8.3310546875, -7.95703125, -7.5830078125, -7.208984375, -6.8349609375, -6.4609375, -6.0869140625, -5.712890625, -5.3388671875, -4.96484375, -4.5908203125, -4.216796875, -3.8427734375, -3.46875, -3.0947265625, -2.720703125, -2.3466796875, -1.97265625, -1.5986328125, -1.224609375, -0.8505859375, -0.4765625, -0.1025390625, 0.271484375, 0.6455078125, 1.01953125, 1.3935546875, 1.767578125, 2.1416015625, 2.515625, 2.8896484375, 3.263671875, 3.6376953125, 4.01171875, 4.3857421875, 4.759765625, 5.1337890625, 5.5078125, 5.8818359375, 6.255859375, 6.6298828125, 7.00390625, 7.3779296875, 7.751953125, 8.1259765625, 8.5, 8.8740234375, 9.248046875, 9.6220703125, 9.99609375, 10.3701171875, 10.744140625, 11.1181640625, 11.4921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 10.0, 10.0, 24.0, 24.0, 42.0, 59.0, 73.0, 101.0, 152.0, 271.0, 418.0, 680.0, 1124.0, 2074.0, 3929.0, 7636.0, 16636.0, 43617.0, 153247.0, 827686.0, 2439025.0, 525574.0, 109872.0, 34007.0, 13566.0, 6552.0, 3252.0, 1775.0, 1096.0, 577.0, 409.0, 222.0, 163.0, 93.0, 84.0, 57.0, 39.0, 28.0, 21.0, 15.0, 8.0, 8.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-15.828125, -15.32373046875, -14.8193359375, -14.31494140625, -13.810546875, -13.30615234375, -12.8017578125, -12.29736328125, -11.79296875, -11.28857421875, -10.7841796875, -10.27978515625, -9.775390625, -9.27099609375, -8.7666015625, -8.26220703125, -7.7578125, -7.25341796875, -6.7490234375, -6.24462890625, -5.740234375, -5.23583984375, -4.7314453125, -4.22705078125, -3.72265625, -3.21826171875, -2.7138671875, -2.20947265625, -1.705078125, -1.20068359375, -0.6962890625, -0.19189453125, 0.3125, 0.81689453125, 1.3212890625, 1.82568359375, 2.330078125, 2.83447265625, 3.3388671875, 3.84326171875, 4.34765625, 4.85205078125, 5.3564453125, 5.86083984375, 6.365234375, 6.86962890625, 7.3740234375, 7.87841796875, 8.3828125, 8.88720703125, 9.3916015625, 9.89599609375, 10.400390625, 10.90478515625, 11.4091796875, 11.91357421875, 12.41796875, 12.92236328125, 13.4267578125, 13.93115234375, 14.435546875, 14.93994140625, 15.4443359375, 15.94873046875, 16.453125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 11.0, 25.0, 32.0, 33.0, 47.0, 84.0, 84.0, 118.0, 109.0, 95.0, 92.0, 72.0, 65.0, 35.0, 28.0, 22.0, 17.0, 6.0, 3.0, 3.0, 7.0, 4.0, 0.0, 1.0], "bins": [-101.47373962402344, -99.38347625732422, -97.293212890625, -95.20294952392578, -93.11268615722656, -91.02242279052734, -88.93215942382812, -86.84188842773438, -84.75163269042969, -82.66136932373047, -80.57110595703125, -78.48084259033203, -76.39057922363281, -74.3003158569336, -72.21005249023438, -70.11978149414062, -68.0295181274414, -65.93925476074219, -63.84899139404297, -61.75872802734375, -59.66846466064453, -57.57820129394531, -55.48793411254883, -53.39767074584961, -51.30740737915039, -49.21714401245117, -47.12688064575195, -45.036617279052734, -42.94635009765625, -40.85608673095703, -38.76582336425781, -36.675559997558594, -34.585289001464844, -32.495025634765625, -30.404762268066406, -28.314496994018555, -26.224233627319336, -24.133970260620117, -22.043704986572266, -19.953441619873047, -17.863178253173828, -15.77291488647461, -13.682650566101074, -11.592386245727539, -9.50212287902832, -7.411859512329102, -5.321595191955566, -3.2313308715820312, -1.1410675048828125, 0.9491963386535645, 3.0394601821899414, 5.129724025726318, 7.219987869262695, 9.310251235961914, 11.40051555633545, 13.490779876708984, 15.581043243408203, 17.671306610107422, 19.76156997680664, 21.851835250854492, 23.94209861755371, 26.03236198425293, 28.12262725830078, 30.212890625, 32.30315399169922]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 20.0, 10.0, 16.0, 16.0, 21.0, 18.0, 30.0, 22.0, 34.0, 30.0, 40.0, 32.0, 36.0, 33.0, 43.0, 49.0, 47.0, 44.0, 40.0, 38.0, 41.0, 47.0, 24.0, 25.0, 35.0, 39.0, 22.0, 17.0, 22.0, 14.0, 13.0, 14.0, 7.0, 11.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.13240432739258, -36.945465087890625, -35.75852584838867, -34.57158660888672, -33.3846435546875, -32.19770431518555, -31.010765075683594, -29.82382583618164, -28.636886596679688, -27.449947357177734, -26.26300811767578, -25.076066970825195, -23.889127731323242, -22.70218849182129, -21.515247344970703, -20.32830810546875, -19.141368865966797, -17.954429626464844, -16.76749038696289, -15.580549240112305, -14.393610000610352, -13.206670761108398, -12.019730567932129, -10.83279037475586, -9.645851135253906, -8.458911895751953, -7.271971702575684, -6.085031986236572, -4.898092269897461, -3.7111525535583496, -2.5242128372192383, -1.3372726440429688, -0.15032958984375, 1.0366101264953613, 2.2235498428344727, 3.410489559173584, 4.597429275512695, 5.784368991851807, 6.971308708190918, 8.158248901367188, 9.34518814086914, 10.532127380371094, 11.719067573547363, 12.906007766723633, 14.092947006225586, 15.279886245727539, 16.466827392578125, 17.653766632080078, 18.84070587158203, 20.027645111083984, 21.214584350585938, 22.401525497436523, 23.588464736938477, 24.77540397644043, 25.962345123291016, 27.14928436279297, 28.336223602294922, 29.523162841796875, 30.710102081298828, 31.897043228149414, 33.083984375, 34.27092361450195, 35.457862854003906, 36.64480209350586, 37.83174133300781]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 9.0, 15.0, 20.0, 19.0, 30.0, 31.0, 29.0, 22.0, 43.0, 33.0, 29.0, 46.0, 39.0, 35.0, 45.0, 55.0, 52.0, 32.0, 40.0, 43.0, 48.0, 33.0, 26.0, 27.0, 20.0, 24.0, 22.0, 23.0, 17.0, 10.0, 14.0, 11.0, 8.0, 3.0, 6.0, 3.0, 3.0, 7.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.2628173828125, -4.107666015625, -3.9525146484375, -3.79736328125, -3.6422119140625, -3.487060546875, -3.3319091796875, -3.1767578125, -3.0216064453125, -2.866455078125, -2.7113037109375, -2.55615234375, -2.4010009765625, -2.245849609375, -2.0906982421875, -1.935546875, -1.7803955078125, -1.625244140625, -1.4700927734375, -1.31494140625, -1.1597900390625, -1.004638671875, -0.8494873046875, -0.6943359375, -0.5391845703125, -0.384033203125, -0.2288818359375, -0.07373046875, 0.0814208984375, 0.236572265625, 0.3917236328125, 0.546875, 0.7020263671875, 0.857177734375, 1.0123291015625, 1.16748046875, 1.3226318359375, 1.477783203125, 1.6329345703125, 1.7880859375, 1.9432373046875, 2.098388671875, 2.2535400390625, 2.40869140625, 2.5638427734375, 2.718994140625, 2.8741455078125, 3.029296875, 3.1844482421875, 3.339599609375, 3.4947509765625, 3.64990234375, 3.8050537109375, 3.960205078125, 4.1153564453125, 4.2705078125, 4.4256591796875, 4.580810546875, 4.7359619140625, 4.89111328125, 5.0462646484375, 5.201416015625, 5.3565673828125, 5.51171875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 12.0, 16.0, 25.0, 39.0, 51.0, 95.0, 121.0, 175.0, 238.0, 417.0, 678.0, 1147.0, 1852.0, 3169.0, 5217.0, 9083.0, 16090.0, 28241.0, 49029.0, 82679.0, 125284.0, 165587.0, 173546.0, 143114.0, 98883.0, 60687.0, 35261.0, 20153.0, 11281.0, 6535.0, 3786.0, 2271.0, 1339.0, 907.0, 530.0, 356.0, 187.0, 143.0, 100.0, 71.0, 40.0, 33.0, 24.0, 16.0, 6.0, 18.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.490234375, -3.3818359375, -3.2734375, -3.1650390625, -3.056640625, -2.9482421875, -2.83984375, -2.7314453125, -2.623046875, -2.5146484375, -2.40625, -2.2978515625, -2.189453125, -2.0810546875, -1.97265625, -1.8642578125, -1.755859375, -1.6474609375, -1.5390625, -1.4306640625, -1.322265625, -1.2138671875, -1.10546875, -0.9970703125, -0.888671875, -0.7802734375, -0.671875, -0.5634765625, -0.455078125, -0.3466796875, -0.23828125, -0.1298828125, -0.021484375, 0.0869140625, 0.1953125, 0.3037109375, 0.412109375, 0.5205078125, 0.62890625, 0.7373046875, 0.845703125, 0.9541015625, 1.0625, 1.1708984375, 1.279296875, 1.3876953125, 1.49609375, 1.6044921875, 1.712890625, 1.8212890625, 1.9296875, 2.0380859375, 2.146484375, 2.2548828125, 2.36328125, 2.4716796875, 2.580078125, 2.6884765625, 2.796875, 2.9052734375, 3.013671875, 3.1220703125, 3.23046875, 3.3388671875, 3.447265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 2.0, 6.0, 10.0, 9.0, 14.0, 17.0, 18.0, 23.0, 16.0, 21.0, 24.0, 24.0, 37.0, 37.0, 35.0, 24.0, 35.0, 46.0, 39.0, 42.0, 1065.0, 40.0, 28.0, 39.0, 35.0, 30.0, 46.0, 42.0, 31.0, 27.0, 22.0, 16.0, 23.0, 18.0, 16.0, 9.0, 10.0, 7.0, 11.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.852325439453125, -3.72613525390625, -3.599945068359375, -3.4737548828125, -3.347564697265625, -3.22137451171875, -3.095184326171875, -2.968994140625, -2.842803955078125, -2.71661376953125, -2.590423583984375, -2.4642333984375, -2.338043212890625, -2.21185302734375, -2.085662841796875, -1.95947265625, -1.833282470703125, -1.70709228515625, -1.580902099609375, -1.4547119140625, -1.328521728515625, -1.20233154296875, -1.076141357421875, -0.949951171875, -0.823760986328125, -0.69757080078125, -0.571380615234375, -0.4451904296875, -0.319000244140625, -0.19281005859375, -0.066619873046875, 0.0595703125, 0.185760498046875, 0.31195068359375, 0.438140869140625, 0.5643310546875, 0.690521240234375, 0.81671142578125, 0.942901611328125, 1.069091796875, 1.195281982421875, 1.32147216796875, 1.447662353515625, 1.5738525390625, 1.700042724609375, 1.82623291015625, 1.952423095703125, 2.07861328125, 2.204803466796875, 2.33099365234375, 2.457183837890625, 2.5833740234375, 2.709564208984375, 2.83575439453125, 2.961944580078125, 3.088134765625, 3.214324951171875, 3.34051513671875, 3.466705322265625, 3.5928955078125, 3.719085693359375, 3.84527587890625, 3.971466064453125, 4.09765625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 6.0, 8.0, 13.0, 19.0, 24.0, 45.0, 68.0, 108.0, 108.0, 228.0, 337.0, 518.0, 875.0, 1386.0, 2261.0, 3670.0, 6066.0, 10477.0, 18265.0, 36929.0, 163460.0, 1712255.0, 74964.0, 28380.0, 14958.0, 8535.0, 5106.0, 3011.0, 1786.0, 1195.0, 743.0, 448.0, 343.0, 180.0, 127.0, 85.0, 53.0, 25.0, 20.0, 13.0, 9.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.669921875, -5.4765625, -5.283203125, -5.08984375, -4.896484375, -4.703125, -4.509765625, -4.31640625, -4.123046875, -3.9296875, -3.736328125, -3.54296875, -3.349609375, -3.15625, -2.962890625, -2.76953125, -2.576171875, -2.3828125, -2.189453125, -1.99609375, -1.802734375, -1.609375, -1.416015625, -1.22265625, -1.029296875, -0.8359375, -0.642578125, -0.44921875, -0.255859375, -0.0625, 0.130859375, 0.32421875, 0.517578125, 0.7109375, 0.904296875, 1.09765625, 1.291015625, 1.484375, 1.677734375, 1.87109375, 2.064453125, 2.2578125, 2.451171875, 2.64453125, 2.837890625, 3.03125, 3.224609375, 3.41796875, 3.611328125, 3.8046875, 3.998046875, 4.19140625, 4.384765625, 4.578125, 4.771484375, 4.96484375, 5.158203125, 5.3515625, 5.544921875, 5.73828125, 5.931640625, 6.125, 6.318359375, 6.51171875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 11.0, 11.0, 9.0, 10.0, 13.0, 20.0, 16.0, 35.0, 26.0, 44.0, 59.0, 56.0, 74.0, 67.0, 77.0, 90.0, 78.0, 49.0, 55.0, 38.0, 32.0, 20.0, 20.0, 12.0, 15.0, 12.0, 7.0, 1.0, 6.0, 2.0, 5.0, 12.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.418212890625, -0.4033470153808594, -0.38848114013671875, -0.3736152648925781, -0.3587493896484375, -0.3438835144042969, -0.32901763916015625, -0.3141517639160156, -0.299285888671875, -0.2844200134277344, -0.26955413818359375, -0.2546882629394531, -0.2398223876953125, -0.22495651245117188, -0.21009063720703125, -0.19522476196289062, -0.18035888671875, -0.16549301147460938, -0.15062713623046875, -0.13576126098632812, -0.1208953857421875, -0.10602951049804688, -0.09116363525390625, -0.07629776000976562, -0.061431884765625, -0.046566009521484375, -0.03170013427734375, -0.016834259033203125, -0.0019683837890625, 0.012897491455078125, 0.02776336669921875, 0.042629241943359375, 0.0574951171875, 0.07236099243164062, 0.08722686767578125, 0.10209274291992188, 0.1169586181640625, 0.13182449340820312, 0.14669036865234375, 0.16155624389648438, 0.176422119140625, 0.19128799438476562, 0.20615386962890625, 0.22101974487304688, 0.2358856201171875, 0.2507514953613281, 0.26561737060546875, 0.2804832458496094, 0.29534912109375, 0.3102149963378906, 0.32508087158203125, 0.3399467468261719, 0.3548126220703125, 0.3696784973144531, 0.38454437255859375, 0.3994102478027344, 0.414276123046875, 0.4291419982910156, 0.44400787353515625, 0.4588737487792969, 0.4737396240234375, 0.4886054992675781, 0.5034713745117188, 0.5183372497558594, 0.533203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 3.0, 6.0, 4.0, 8.0, 3.0, 11.0, 16.0, 17.0, 17.0, 23.0, 30.0, 64.0, 72.0, 146.0, 242.0, 636.0, 1785.0, 7372.0, 52922.0, 871036.0, 99728.0, 10511.0, 2352.0, 759.0, 299.0, 159.0, 87.0, 66.0, 44.0, 30.0, 29.0, 19.0, 14.0, 10.0, 9.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.03515625, -6.83758544921875, -6.6400146484375, -6.44244384765625, -6.244873046875, -6.04730224609375, -5.8497314453125, -5.65216064453125, -5.45458984375, -5.25701904296875, -5.0594482421875, -4.86187744140625, -4.664306640625, -4.46673583984375, -4.2691650390625, -4.07159423828125, -3.8740234375, -3.67645263671875, -3.4788818359375, -3.28131103515625, -3.083740234375, -2.88616943359375, -2.6885986328125, -2.49102783203125, -2.29345703125, -2.09588623046875, -1.8983154296875, -1.70074462890625, -1.503173828125, -1.30560302734375, -1.1080322265625, -0.91046142578125, -0.712890625, -0.51531982421875, -0.3177490234375, -0.12017822265625, 0.077392578125, 0.27496337890625, 0.4725341796875, 0.67010498046875, 0.86767578125, 1.06524658203125, 1.2628173828125, 1.46038818359375, 1.657958984375, 1.85552978515625, 2.0531005859375, 2.25067138671875, 2.4482421875, 2.64581298828125, 2.8433837890625, 3.04095458984375, 3.238525390625, 3.43609619140625, 3.6336669921875, 3.83123779296875, 4.02880859375, 4.22637939453125, 4.4239501953125, 4.62152099609375, 4.819091796875, 5.01666259765625, 5.2142333984375, 5.41180419921875, 5.609375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 12.0, 15.0, 49.0, 144.0, 522.0, 190.0, 49.0, 19.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.115744590759277, -8.77298355102539, -8.430222511291504, -8.087461471557617, -7.744701385498047, -7.40194034576416, -7.059179306030273, -6.716418266296387, -6.373657703399658, -6.0308966636657715, -5.688136100769043, -5.345375061035156, -5.0026140213012695, -4.659853458404541, -4.317092418670654, -3.9743316173553467, -3.631570816040039, -3.2888100147247314, -2.946049213409424, -2.603288173675537, -2.2605273723602295, -1.9177665710449219, -1.5750055313110352, -1.2322447299957275, -0.8894839286804199, -0.5467230677604675, -0.20396220684051514, 0.13879871368408203, 0.48155951499938965, 0.8243203163146973, 1.167081356048584, 1.5098421573638916, 1.8526029586791992, 2.195363759994507, 2.5381245613098145, 2.880885601043701, 3.223646402359009, 3.5664072036743164, 3.909168243408203, 4.25192928314209, 4.594689846038818, 4.937450885772705, 5.280211448669434, 5.62297248840332, 5.965733528137207, 6.3084940910339355, 6.651255130767822, 6.994015693664551, 7.3367767333984375, 7.679537773132324, 8.022298812866211, 8.365058898925781, 8.707819938659668, 9.050580978393555, 9.393342018127441, 9.736103057861328, 10.078863143920898, 10.421624183654785, 10.764385223388672, 11.107145309448242, 11.449906349182129, 11.792667388916016, 12.135428428649902, 12.478189468383789, 12.820950508117676]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 7.0, 10.0, 14.0, 17.0, 30.0, 18.0, 23.0, 36.0, 41.0, 41.0, 50.0, 46.0, 44.0, 67.0, 49.0, 54.0, 54.0, 59.0, 61.0, 43.0, 35.0, 40.0, 39.0, 31.0, 26.0, 16.0, 13.0, 13.0, 4.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1572608947753906, -2.0928618907928467, -2.0284628868103027, -1.9640638828277588, -1.8996648788452148, -1.835265874862671, -1.770866870880127, -1.706467866897583, -1.642068862915039, -1.5776698589324951, -1.5132708549499512, -1.4488718509674072, -1.3844728469848633, -1.3200738430023193, -1.2556748390197754, -1.1912758350372314, -1.1268768310546875, -1.0624778270721436, -0.9980788230895996, -0.9336798191070557, -0.8692808151245117, -0.8048818111419678, -0.7404828071594238, -0.6760838031768799, -0.6116847991943359, -0.547285795211792, -0.48288679122924805, -0.4184877872467041, -0.35408878326416016, -0.2896897792816162, -0.22529077529907227, -0.16089177131652832, -0.09649252891540527, -0.03209352493286133, 0.03230547904968262, 0.09670448303222656, 0.1611034870147705, 0.22550249099731445, 0.2899014949798584, 0.35430049896240234, 0.4186995029449463, 0.48309850692749023, 0.5474975109100342, 0.6118965148925781, 0.6762955188751221, 0.740694522857666, 0.80509352684021, 0.8694925308227539, 0.9338915348052979, 0.9982905387878418, 1.0626895427703857, 1.1270885467529297, 1.1914875507354736, 1.2558865547180176, 1.3202855587005615, 1.3846845626831055, 1.4490835666656494, 1.5134825706481934, 1.5778815746307373, 1.6422805786132812, 1.7066795825958252, 1.7710785865783691, 1.835477590560913, 1.899876594543457, 1.964275598526001]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 10.0, 7.0, 15.0, 22.0, 19.0, 27.0, 28.0, 30.0, 22.0, 42.0, 37.0, 24.0, 48.0, 39.0, 39.0, 39.0, 53.0, 49.0, 38.0, 31.0, 47.0, 53.0, 33.0, 27.0, 25.0, 23.0, 25.0, 21.0, 25.0, 15.0, 13.0, 13.0, 12.0, 7.0, 3.0, 7.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.33148193359375, -4.1746826171875, -4.01788330078125, -3.861083984375, -3.70428466796875, -3.5474853515625, -3.39068603515625, -3.23388671875, -3.07708740234375, -2.9202880859375, -2.76348876953125, -2.606689453125, -2.44989013671875, -2.2930908203125, -2.13629150390625, -1.9794921875, -1.82269287109375, -1.6658935546875, -1.50909423828125, -1.352294921875, -1.19549560546875, -1.0386962890625, -0.88189697265625, -0.72509765625, -0.56829833984375, -0.4114990234375, -0.25469970703125, -0.097900390625, 0.05889892578125, 0.2156982421875, 0.37249755859375, 0.529296875, 0.68609619140625, 0.8428955078125, 0.99969482421875, 1.156494140625, 1.31329345703125, 1.4700927734375, 1.62689208984375, 1.78369140625, 1.94049072265625, 2.0972900390625, 2.25408935546875, 2.410888671875, 2.56768798828125, 2.7244873046875, 2.88128662109375, 3.0380859375, 3.19488525390625, 3.3516845703125, 3.50848388671875, 3.665283203125, 3.82208251953125, 3.9788818359375, 4.13568115234375, 4.29248046875, 4.44927978515625, 4.6060791015625, 4.76287841796875, 4.919677734375, 5.07647705078125, 5.2332763671875, 5.39007568359375, 5.546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 11.0, 17.0, 19.0, 29.0, 34.0, 41.0, 66.0, 112.0, 131.0, 209.0, 333.0, 507.0, 785.0, 1131.0, 1889.0, 3139.0, 5292.0, 9122.0, 17800.0, 40366.0, 113642.0, 327529.0, 330138.0, 114424.0, 40884.0, 17830.0, 9281.0, 5162.0, 3084.0, 1910.0, 1260.0, 759.0, 514.0, 337.0, 251.0, 137.0, 111.0, 81.0, 43.0, 36.0, 32.0, 23.0, 14.0, 16.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-10.875, -10.5643310546875, -10.253662109375, -9.9429931640625, -9.63232421875, -9.3216552734375, -9.010986328125, -8.7003173828125, -8.3896484375, -8.0789794921875, -7.768310546875, -7.4576416015625, -7.14697265625, -6.8363037109375, -6.525634765625, -6.2149658203125, -5.904296875, -5.5936279296875, -5.282958984375, -4.9722900390625, -4.66162109375, -4.3509521484375, -4.040283203125, -3.7296142578125, -3.4189453125, -3.1082763671875, -2.797607421875, -2.4869384765625, -2.17626953125, -1.8656005859375, -1.554931640625, -1.2442626953125, -0.93359375, -0.6229248046875, -0.312255859375, -0.0015869140625, 0.30908203125, 0.6197509765625, 0.930419921875, 1.2410888671875, 1.5517578125, 1.8624267578125, 2.173095703125, 2.4837646484375, 2.79443359375, 3.1051025390625, 3.415771484375, 3.7264404296875, 4.037109375, 4.3477783203125, 4.658447265625, 4.9691162109375, 5.27978515625, 5.5904541015625, 5.901123046875, 6.2117919921875, 6.5224609375, 6.8331298828125, 7.143798828125, 7.4544677734375, 7.76513671875, 8.0758056640625, 8.386474609375, 8.6971435546875, 9.0078125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 6.0, 6.0, 10.0, 14.0, 16.0, 16.0, 23.0, 25.0, 32.0, 41.0, 41.0, 46.0, 44.0, 63.0, 70.0, 113.0, 167.0, 230.0, 1276.0, 162.0, 124.0, 79.0, 81.0, 55.0, 46.0, 38.0, 45.0, 31.0, 23.0, 16.0, 14.0, 14.0, 8.0, 13.0, 7.0, 10.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.1796875, -14.6409912109375, -14.102294921875, -13.5635986328125, -13.02490234375, -12.4862060546875, -11.947509765625, -11.4088134765625, -10.8701171875, -10.3314208984375, -9.792724609375, -9.2540283203125, -8.71533203125, -8.1766357421875, -7.637939453125, -7.0992431640625, -6.560546875, -6.0218505859375, -5.483154296875, -4.9444580078125, -4.40576171875, -3.8670654296875, -3.328369140625, -2.7896728515625, -2.2509765625, -1.7122802734375, -1.173583984375, -0.6348876953125, -0.09619140625, 0.4425048828125, 0.981201171875, 1.5198974609375, 2.05859375, 2.5972900390625, 3.135986328125, 3.6746826171875, 4.21337890625, 4.7520751953125, 5.290771484375, 5.8294677734375, 6.3681640625, 6.9068603515625, 7.445556640625, 7.9842529296875, 8.52294921875, 9.0616455078125, 9.600341796875, 10.1390380859375, 10.677734375, 11.2164306640625, 11.755126953125, 12.2938232421875, 12.83251953125, 13.3712158203125, 13.909912109375, 14.4486083984375, 14.9873046875, 15.5260009765625, 16.064697265625, 16.6033935546875, 17.14208984375, 17.6807861328125, 18.219482421875, 18.7581787109375, 19.296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 10.0, 10.0, 23.0, 33.0, 31.0, 66.0, 71.0, 134.0, 216.0, 413.0, 1051.0, 3209.0, 14239.0, 98632.0, 2448872.0, 532354.0, 36320.0, 6752.0, 1821.0, 632.0, 323.0, 165.0, 108.0, 69.0, 44.0, 27.0, 20.0, 14.0, 17.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.34375, -44.03955078125, -42.7353515625, -41.43115234375, -40.126953125, -38.82275390625, -37.5185546875, -36.21435546875, -34.91015625, -33.60595703125, -32.3017578125, -30.99755859375, -29.693359375, -28.38916015625, -27.0849609375, -25.78076171875, -24.4765625, -23.17236328125, -21.8681640625, -20.56396484375, -19.259765625, -17.95556640625, -16.6513671875, -15.34716796875, -14.04296875, -12.73876953125, -11.4345703125, -10.13037109375, -8.826171875, -7.52197265625, -6.2177734375, -4.91357421875, -3.609375, -2.30517578125, -1.0009765625, 0.30322265625, 1.607421875, 2.91162109375, 4.2158203125, 5.52001953125, 6.82421875, 8.12841796875, 9.4326171875, 10.73681640625, 12.041015625, 13.34521484375, 14.6494140625, 15.95361328125, 17.2578125, 18.56201171875, 19.8662109375, 21.17041015625, 22.474609375, 23.77880859375, 25.0830078125, 26.38720703125, 27.69140625, 28.99560546875, 30.2998046875, 31.60400390625, 32.908203125, 34.21240234375, 35.5166015625, 36.82080078125, 38.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 17.0, 345.0, 616.0, 37.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.37284088134766, -64.06053161621094, -48.74822235107422, -33.4359130859375, -18.12360382080078, -2.8112945556640625, 12.501014709472656, 27.813323974609375, 43.125633239746094, 58.43794250488281, 73.75025177001953, 89.06256103515625, 104.37487030029297, 119.68717956542969, 134.99948120117188, 150.31179809570312, 165.62411499023438, 180.93643188476562, 196.2487335205078, 211.56103515625, 226.87335205078125, 242.1856689453125, 257.49798583984375, 272.8102722167969, 288.1225891113281, 303.4349060058594, 318.7471923828125, 334.05950927734375, 349.371826171875, 364.68414306640625, 379.9964599609375, 395.3087463378906, 410.62103271484375, 425.933349609375, 441.24566650390625, 456.5579528808594, 471.8702697753906, 487.1825866699219, 502.494873046875, 517.8071899414062, 533.1195068359375, 548.4318237304688, 563.744140625, 579.0564575195312, 594.3687744140625, 609.6810302734375, 624.9933471679688, 640.3056640625, 655.6179809570312, 670.9302978515625, 686.2426147460938, 701.554931640625, 716.8671875, 732.1795043945312, 747.4918212890625, 762.8041381835938, 778.116455078125, 793.4287719726562, 808.7410888671875, 824.0534057617188, 839.36572265625, 854.677978515625, 869.9902954101562, 885.3026123046875, 900.6149291992188]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 4.0, 1.0, 7.0, 3.0, 6.0, 6.0, 6.0, 8.0, 15.0, 14.0, 13.0, 19.0, 23.0, 23.0, 23.0, 27.0, 31.0, 25.0, 18.0, 29.0, 31.0, 32.0, 32.0, 33.0, 44.0, 52.0, 25.0, 44.0, 33.0, 34.0, 36.0, 23.0, 16.0, 29.0, 31.0, 34.0, 23.0, 21.0, 23.0, 19.0, 9.0, 12.0, 19.0, 6.0, 8.0, 7.0, 7.0, 4.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-44.023338317871094, -42.7347526550293, -41.446163177490234, -40.15757751464844, -38.868988037109375, -37.58040237426758, -36.29181671142578, -35.00322723388672, -33.71464157104492, -32.426055908203125, -31.137466430664062, -29.848880767822266, -28.560293197631836, -27.271705627441406, -25.983118057250977, -24.694530487060547, -23.405942916870117, -22.117355346679688, -20.828767776489258, -19.540180206298828, -18.25159454345703, -16.9630069732666, -15.674419403076172, -14.385832786560059, -13.097245216369629, -11.8086576461792, -10.520071029663086, -9.231483459472656, -7.942896366119385, -6.654309272766113, -5.365721702575684, -4.07713508605957, -2.7885475158691406, -1.4999603033065796, -0.21137309074401855, 1.077214241027832, 2.3658013343811035, 3.654388427734375, 4.942975997924805, 6.231562614440918, 7.520150184631348, 8.808737754821777, 10.09732437133789, 11.38591194152832, 12.67449951171875, 13.963086128234863, 15.251673698425293, 16.540260314941406, 17.828847885131836, 19.117435455322266, 20.406023025512695, 21.694610595703125, 22.983196258544922, 24.27178382873535, 25.56037139892578, 26.848957061767578, 28.13754653930664, 29.42613410949707, 30.7147216796875, 32.0033073425293, 33.29189682006836, 34.580482482910156, 35.86907196044922, 37.157657623291016, 38.44624328613281]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 7.0, 5.0, 5.0, 9.0, 8.0, 24.0, 11.0, 9.0, 17.0, 28.0, 27.0, 20.0, 31.0, 38.0, 25.0, 37.0, 32.0, 33.0, 56.0, 43.0, 49.0, 41.0, 35.0, 42.0, 39.0, 37.0, 33.0, 37.0, 29.0, 21.0, 19.0, 29.0, 22.0, 19.0, 15.0, 12.0, 12.0, 8.0, 7.0, 9.0, 10.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.71527099609375, -4.5477294921875, -4.38018798828125, -4.212646484375, -4.04510498046875, -3.8775634765625, -3.71002197265625, -3.54248046875, -3.37493896484375, -3.2073974609375, -3.03985595703125, -2.872314453125, -2.70477294921875, -2.5372314453125, -2.36968994140625, -2.2021484375, -2.03460693359375, -1.8670654296875, -1.69952392578125, -1.531982421875, -1.36444091796875, -1.1968994140625, -1.02935791015625, -0.86181640625, -0.69427490234375, -0.5267333984375, -0.35919189453125, -0.191650390625, -0.02410888671875, 0.1434326171875, 0.31097412109375, 0.478515625, 0.64605712890625, 0.8135986328125, 0.98114013671875, 1.148681640625, 1.31622314453125, 1.4837646484375, 1.65130615234375, 1.81884765625, 1.98638916015625, 2.1539306640625, 2.32147216796875, 2.489013671875, 2.65655517578125, 2.8240966796875, 2.99163818359375, 3.1591796875, 3.32672119140625, 3.4942626953125, 3.66180419921875, 3.829345703125, 3.99688720703125, 4.1644287109375, 4.33197021484375, 4.49951171875, 4.66705322265625, 4.8345947265625, 5.00213623046875, 5.169677734375, 5.33721923828125, 5.5047607421875, 5.67230224609375, 5.83984375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 6.0, 10.0, 17.0, 23.0, 30.0, 35.0, 62.0, 68.0, 109.0, 151.0, 188.0, 351.0, 478.0, 778.0, 1403.0, 2294.0, 4343.0, 9030.0, 21441.0, 67026.0, 318175.0, 1866284.0, 1564445.0, 244058.0, 56058.0, 18700.0, 8274.0, 4225.0, 2294.0, 1377.0, 850.0, 529.0, 344.0, 251.0, 138.0, 119.0, 74.0, 68.0, 32.0, 41.0, 23.0, 17.0, 15.0, 12.0, 9.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.5, -11.1025390625, -10.705078125, -10.3076171875, -9.91015625, -9.5126953125, -9.115234375, -8.7177734375, -8.3203125, -7.9228515625, -7.525390625, -7.1279296875, -6.73046875, -6.3330078125, -5.935546875, -5.5380859375, -5.140625, -4.7431640625, -4.345703125, -3.9482421875, -3.55078125, -3.1533203125, -2.755859375, -2.3583984375, -1.9609375, -1.5634765625, -1.166015625, -0.7685546875, -0.37109375, 0.0263671875, 0.423828125, 0.8212890625, 1.21875, 1.6162109375, 2.013671875, 2.4111328125, 2.80859375, 3.2060546875, 3.603515625, 4.0009765625, 4.3984375, 4.7958984375, 5.193359375, 5.5908203125, 5.98828125, 6.3857421875, 6.783203125, 7.1806640625, 7.578125, 7.9755859375, 8.373046875, 8.7705078125, 9.16796875, 9.5654296875, 9.962890625, 10.3603515625, 10.7578125, 11.1552734375, 11.552734375, 11.9501953125, 12.34765625, 12.7451171875, 13.142578125, 13.5400390625, 13.9375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 3.0, 3.0, 11.0, 16.0, 25.0, 29.0, 25.0, 53.0, 69.0, 97.0, 136.0, 247.0, 361.0, 540.0, 620.0, 564.0, 424.0, 239.0, 180.0, 120.0, 90.0, 50.0, 36.0, 34.0, 18.0, 18.0, 10.0, 13.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.265625, -14.79736328125, -14.3291015625, -13.86083984375, -13.392578125, -12.92431640625, -12.4560546875, -11.98779296875, -11.51953125, -11.05126953125, -10.5830078125, -10.11474609375, -9.646484375, -9.17822265625, -8.7099609375, -8.24169921875, -7.7734375, -7.30517578125, -6.8369140625, -6.36865234375, -5.900390625, -5.43212890625, -4.9638671875, -4.49560546875, -4.02734375, -3.55908203125, -3.0908203125, -2.62255859375, -2.154296875, -1.68603515625, -1.2177734375, -0.74951171875, -0.28125, 0.18701171875, 0.6552734375, 1.12353515625, 1.591796875, 2.06005859375, 2.5283203125, 2.99658203125, 3.46484375, 3.93310546875, 4.4013671875, 4.86962890625, 5.337890625, 5.80615234375, 6.2744140625, 6.74267578125, 7.2109375, 7.67919921875, 8.1474609375, 8.61572265625, 9.083984375, 9.55224609375, 10.0205078125, 10.48876953125, 10.95703125, 11.42529296875, 11.8935546875, 12.36181640625, 12.830078125, 13.29833984375, 13.7666015625, 14.23486328125, 14.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 19.0, 19.0, 21.0, 38.0, 57.0, 104.0, 173.0, 284.0, 494.0, 807.0, 1584.0, 3269.0, 7432.0, 20294.0, 80064.0, 686326.0, 2960177.0, 353056.0, 53331.0, 15215.0, 5843.0, 2559.0, 1340.0, 715.0, 403.0, 238.0, 157.0, 91.0, 54.0, 40.0, 23.0, 12.0, 15.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.495849609375, -20.71044921875, -19.925048828125, -19.1396484375, -18.354248046875, -17.56884765625, -16.783447265625, -15.998046875, -15.212646484375, -14.42724609375, -13.641845703125, -12.8564453125, -12.071044921875, -11.28564453125, -10.500244140625, -9.71484375, -8.929443359375, -8.14404296875, -7.358642578125, -6.5732421875, -5.787841796875, -5.00244140625, -4.217041015625, -3.431640625, -2.646240234375, -1.86083984375, -1.075439453125, -0.2900390625, 0.495361328125, 1.28076171875, 2.066162109375, 2.8515625, 3.636962890625, 4.42236328125, 5.207763671875, 5.9931640625, 6.778564453125, 7.56396484375, 8.349365234375, 9.134765625, 9.920166015625, 10.70556640625, 11.490966796875, 12.2763671875, 13.061767578125, 13.84716796875, 14.632568359375, 15.41796875, 16.203369140625, 16.98876953125, 17.774169921875, 18.5595703125, 19.344970703125, 20.13037109375, 20.915771484375, 21.701171875, 22.486572265625, 23.27197265625, 24.057373046875, 24.8427734375, 25.628173828125, 26.41357421875, 27.198974609375, 27.984375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 20.0, 27.0, 36.0, 82.0, 121.0, 128.0, 157.0, 148.0, 103.0, 75.0, 42.0, 31.0, 17.0, 7.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.61260986328125, -169.1876220703125, -165.76263427734375, -162.337646484375, -158.91265869140625, -155.4876708984375, -152.06268310546875, -148.6376953125, -145.21270751953125, -141.7877197265625, -138.36273193359375, -134.937744140625, -131.51275634765625, -128.0877685546875, -124.66278839111328, -121.23780059814453, -117.81282043457031, -114.38783264160156, -110.96284484863281, -107.53785705566406, -104.11286926269531, -100.68788146972656, -97.26290130615234, -93.8379135131836, -90.41292572021484, -86.9879379272461, -83.56295013427734, -80.1379623413086, -76.71298217773438, -73.28799438476562, -69.86300659179688, -66.43801879882812, -63.013023376464844, -59.588035583496094, -56.163047790527344, -52.73806381225586, -49.31307601928711, -45.88808822631836, -42.463104248046875, -39.038116455078125, -35.613128662109375, -32.188140869140625, -28.763154983520508, -25.33816909790039, -21.91318130493164, -18.48819351196289, -15.063207626342773, -11.638221740722656, -8.213233947753906, -4.788247108459473, -1.363260269165039, 2.0617265701293945, 5.486713409423828, 8.911701202392578, 12.336687088012695, 15.761672973632812, 19.186660766601562, 22.611648559570312, 26.03663444519043, 29.461620330810547, 32.8866081237793, 36.31159591674805, 39.73657989501953, 43.16156768798828, 46.58655548095703]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 11.0, 11.0, 16.0, 16.0, 17.0, 22.0, 20.0, 27.0, 30.0, 37.0, 25.0, 37.0, 32.0, 37.0, 32.0, 37.0, 43.0, 47.0, 39.0, 43.0, 41.0, 36.0, 23.0, 31.0, 25.0, 33.0, 27.0, 26.0, 24.0, 27.0, 17.0, 22.0, 13.0, 11.0, 10.0, 7.0, 3.0, 6.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-40.66231918334961, -39.40364456176758, -38.14497375488281, -36.88629913330078, -35.627628326416016, -34.368953704833984, -33.11028289794922, -31.851608276367188, -30.592937469482422, -29.334264755249023, -28.075592041015625, -26.816919326782227, -25.558246612548828, -24.29957389831543, -23.04090118408203, -21.7822265625, -20.5235538482666, -19.264881134033203, -18.006208419799805, -16.747535705566406, -15.488862991333008, -14.23019027709961, -12.971516609191895, -11.712843894958496, -10.454171180725098, -9.1954984664917, -7.936825752258301, -6.678152561187744, -5.419479846954346, -4.160807132720947, -2.9021339416503906, -1.6434612274169922, -0.38478851318359375, 0.8738843202590942, 2.1325571537017822, 3.3912301063537598, 4.649902820587158, 5.908575534820557, 7.167248725891113, 8.425921440124512, 9.68459415435791, 10.943266868591309, 12.201939582824707, 13.460613250732422, 14.71928596496582, 15.977958679199219, 17.236631393432617, 18.495304107666016, 19.753976821899414, 21.012649536132812, 22.27132225036621, 23.52999496459961, 24.788667678833008, 26.047340393066406, 27.306015014648438, 28.564685821533203, 29.823360443115234, 31.082033157348633, 32.34070587158203, 33.59938049316406, 34.85805130004883, 36.11672592163086, 37.375396728515625, 38.634071350097656, 39.89274215698242]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 8.0, 10.0, 10.0, 11.0, 14.0, 17.0, 20.0, 27.0, 34.0, 28.0, 33.0, 35.0, 32.0, 43.0, 38.0, 27.0, 45.0, 44.0, 46.0, 39.0, 41.0, 34.0, 43.0, 43.0, 19.0, 35.0, 27.0, 30.0, 24.0, 17.0, 22.0, 12.0, 14.0, 13.0, 7.0, 11.0, 8.0, 5.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.5045166015625, -4.341064453125, -4.1776123046875, -4.01416015625, -3.8507080078125, -3.687255859375, -3.5238037109375, -3.3603515625, -3.1968994140625, -3.033447265625, -2.8699951171875, -2.70654296875, -2.5430908203125, -2.379638671875, -2.2161865234375, -2.052734375, -1.8892822265625, -1.725830078125, -1.5623779296875, -1.39892578125, -1.2354736328125, -1.072021484375, -0.9085693359375, -0.7451171875, -0.5816650390625, -0.418212890625, -0.2547607421875, -0.09130859375, 0.0721435546875, 0.235595703125, 0.3990478515625, 0.5625, 0.7259521484375, 0.889404296875, 1.0528564453125, 1.21630859375, 1.3797607421875, 1.543212890625, 1.7066650390625, 1.8701171875, 2.0335693359375, 2.197021484375, 2.3604736328125, 2.52392578125, 2.6873779296875, 2.850830078125, 3.0142822265625, 3.177734375, 3.3411865234375, 3.504638671875, 3.6680908203125, 3.83154296875, 3.9949951171875, 4.158447265625, 4.3218994140625, 4.4853515625, 4.6488037109375, 4.812255859375, 4.9757080078125, 5.13916015625, 5.3026123046875, 5.466064453125, 5.6295166015625, 5.79296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 11.0, 12.0, 16.0, 36.0, 53.0, 71.0, 124.0, 182.0, 266.0, 498.0, 722.0, 1316.0, 2312.0, 4041.0, 7321.0, 13337.0, 24317.0, 46838.0, 96183.0, 213675.0, 305722.0, 169547.0, 77133.0, 38987.0, 20559.0, 11034.0, 6079.0, 3400.0, 2006.0, 1079.0, 602.0, 382.0, 251.0, 156.0, 91.0, 60.0, 42.0, 35.0, 21.0, 11.0, 6.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.193359375, -3.10040283203125, -3.0074462890625, -2.91448974609375, -2.821533203125, -2.72857666015625, -2.6356201171875, -2.54266357421875, -2.44970703125, -2.35675048828125, -2.2637939453125, -2.17083740234375, -2.077880859375, -1.98492431640625, -1.8919677734375, -1.79901123046875, -1.7060546875, -1.61309814453125, -1.5201416015625, -1.42718505859375, -1.334228515625, -1.24127197265625, -1.1483154296875, -1.05535888671875, -0.96240234375, -0.86944580078125, -0.7764892578125, -0.68353271484375, -0.590576171875, -0.49761962890625, -0.4046630859375, -0.31170654296875, -0.21875, -0.12579345703125, -0.0328369140625, 0.06011962890625, 0.153076171875, 0.24603271484375, 0.3389892578125, 0.43194580078125, 0.52490234375, 0.61785888671875, 0.7108154296875, 0.80377197265625, 0.896728515625, 0.98968505859375, 1.0826416015625, 1.17559814453125, 1.2685546875, 1.36151123046875, 1.4544677734375, 1.54742431640625, 1.640380859375, 1.73333740234375, 1.8262939453125, 1.91925048828125, 2.01220703125, 2.10516357421875, 2.1981201171875, 2.29107666015625, 2.384033203125, 2.47698974609375, 2.5699462890625, 2.66290283203125, 2.755859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 10.0, 9.0, 11.0, 9.0, 16.0, 19.0, 18.0, 21.0, 20.0, 24.0, 28.0, 37.0, 25.0, 35.0, 28.0, 27.0, 45.0, 36.0, 42.0, 1060.0, 46.0, 37.0, 31.0, 43.0, 21.0, 31.0, 34.0, 37.0, 26.0, 25.0, 20.0, 22.0, 25.0, 29.0, 9.0, 9.0, 9.0, 12.0, 4.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.59375, -3.47723388671875, -3.3607177734375, -3.24420166015625, -3.127685546875, -3.01116943359375, -2.8946533203125, -2.77813720703125, -2.66162109375, -2.54510498046875, -2.4285888671875, -2.31207275390625, -2.195556640625, -2.07904052734375, -1.9625244140625, -1.84600830078125, -1.7294921875, -1.61297607421875, -1.4964599609375, -1.37994384765625, -1.263427734375, -1.14691162109375, -1.0303955078125, -0.91387939453125, -0.79736328125, -0.68084716796875, -0.5643310546875, -0.44781494140625, -0.331298828125, -0.21478271484375, -0.0982666015625, 0.01824951171875, 0.134765625, 0.25128173828125, 0.3677978515625, 0.48431396484375, 0.600830078125, 0.71734619140625, 0.8338623046875, 0.95037841796875, 1.06689453125, 1.18341064453125, 1.2999267578125, 1.41644287109375, 1.532958984375, 1.64947509765625, 1.7659912109375, 1.88250732421875, 1.9990234375, 2.11553955078125, 2.2320556640625, 2.34857177734375, 2.465087890625, 2.58160400390625, 2.6981201171875, 2.81463623046875, 2.93115234375, 3.04766845703125, 3.1641845703125, 3.28070068359375, 3.397216796875, 3.51373291015625, 3.6302490234375, 3.74676513671875, 3.86328125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 6.0, 12.0, 21.0, 32.0, 30.0, 49.0, 63.0, 93.0, 153.0, 205.0, 333.0, 475.0, 804.0, 1251.0, 1956.0, 3269.0, 5765.0, 10423.0, 22710.0, 101022.0, 1841931.0, 64865.0, 19197.0, 9092.0, 5128.0, 3104.0, 1848.0, 1168.0, 746.0, 464.0, 290.0, 213.0, 136.0, 77.0, 65.0, 37.0, 30.0, 18.0, 11.0, 14.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.26953125, -4.11920166015625, -3.9688720703125, -3.81854248046875, -3.668212890625, -3.51788330078125, -3.3675537109375, -3.21722412109375, -3.06689453125, -2.91656494140625, -2.7662353515625, -2.61590576171875, -2.465576171875, -2.31524658203125, -2.1649169921875, -2.01458740234375, -1.8642578125, -1.71392822265625, -1.5635986328125, -1.41326904296875, -1.262939453125, -1.11260986328125, -0.9622802734375, -0.81195068359375, -0.66162109375, -0.51129150390625, -0.3609619140625, -0.21063232421875, -0.060302734375, 0.09002685546875, 0.2403564453125, 0.39068603515625, 0.541015625, 0.69134521484375, 0.8416748046875, 0.99200439453125, 1.142333984375, 1.29266357421875, 1.4429931640625, 1.59332275390625, 1.74365234375, 1.89398193359375, 2.0443115234375, 2.19464111328125, 2.344970703125, 2.49530029296875, 2.6456298828125, 2.79595947265625, 2.9462890625, 3.09661865234375, 3.2469482421875, 3.39727783203125, 3.547607421875, 3.69793701171875, 3.8482666015625, 3.99859619140625, 4.14892578125, 4.29925537109375, 4.4495849609375, 4.59991455078125, 4.750244140625, 4.90057373046875, 5.0509033203125, 5.20123291015625, 5.3515625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 7.0, 7.0, 8.0, 7.0, 8.0, 11.0, 21.0, 13.0, 21.0, 29.0, 38.0, 40.0, 54.0, 85.0, 80.0, 98.0, 96.0, 71.0, 60.0, 47.0, 48.0, 35.0, 21.0, 16.0, 9.0, 13.0, 9.0, 15.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1568603515625, -0.15100479125976562, -0.14514923095703125, -0.13929367065429688, -0.1334381103515625, -0.12758255004882812, -0.12172698974609375, -0.11587142944335938, -0.110015869140625, -0.10416030883789062, -0.09830474853515625, -0.09244918823242188, -0.0865936279296875, -0.08073806762695312, -0.07488250732421875, -0.06902694702148438, -0.06317138671875, -0.057315826416015625, -0.05146026611328125, -0.045604705810546875, -0.0397491455078125, -0.033893585205078125, -0.02803802490234375, -0.022182464599609375, -0.016326904296875, -0.010471343994140625, -0.00461578369140625, 0.001239776611328125, 0.0070953369140625, 0.012950897216796875, 0.01880645751953125, 0.024662017822265625, 0.030517578125, 0.036373138427734375, 0.04222869873046875, 0.048084259033203125, 0.0539398193359375, 0.059795379638671875, 0.06565093994140625, 0.07150650024414062, 0.077362060546875, 0.08321762084960938, 0.08907318115234375, 0.09492874145507812, 0.1007843017578125, 0.10663986206054688, 0.11249542236328125, 0.11835098266601562, 0.12420654296875, 0.13006210327148438, 0.13591766357421875, 0.14177322387695312, 0.1476287841796875, 0.15348434448242188, 0.15933990478515625, 0.16519546508789062, 0.171051025390625, 0.17690658569335938, 0.18276214599609375, 0.18861770629882812, 0.1944732666015625, 0.20032882690429688, 0.20618438720703125, 0.21203994750976562, 0.2178955078125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 5.0, 12.0, 5.0, 13.0, 10.0, 17.0, 20.0, 17.0, 53.0, 58.0, 123.0, 236.0, 517.0, 3213.0, 200202.0, 830854.0, 11718.0, 735.0, 262.0, 166.0, 85.0, 61.0, 26.0, 21.0, 23.0, 15.0, 16.0, 10.0, 12.0, 7.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.59375, -3.4996337890625, -3.405517578125, -3.3114013671875, -3.21728515625, -3.1231689453125, -3.029052734375, -2.9349365234375, -2.8408203125, -2.7467041015625, -2.652587890625, -2.5584716796875, -2.46435546875, -2.3702392578125, -2.276123046875, -2.1820068359375, -2.087890625, -1.9937744140625, -1.899658203125, -1.8055419921875, -1.71142578125, -1.6173095703125, -1.523193359375, -1.4290771484375, -1.3349609375, -1.2408447265625, -1.146728515625, -1.0526123046875, -0.95849609375, -0.8643798828125, -0.770263671875, -0.6761474609375, -0.58203125, -0.4879150390625, -0.393798828125, -0.2996826171875, -0.20556640625, -0.1114501953125, -0.017333984375, 0.0767822265625, 0.1708984375, 0.2650146484375, 0.359130859375, 0.4532470703125, 0.54736328125, 0.6414794921875, 0.735595703125, 0.8297119140625, 0.923828125, 1.0179443359375, 1.112060546875, 1.2061767578125, 1.30029296875, 1.3944091796875, 1.488525390625, 1.5826416015625, 1.6767578125, 1.7708740234375, 1.864990234375, 1.9591064453125, 2.05322265625, 2.1473388671875, 2.241455078125, 2.3355712890625, 2.4296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 27.0, 33.0, 78.0, 105.0, 141.0, 165.0, 157.0, 112.0, 76.0, 47.0, 20.0, 11.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.683811366558075, -0.6621345281600952, -0.6404576301574707, -0.6187807321548462, -0.5971038937568665, -0.5754270553588867, -0.5537501573562622, -0.5320732593536377, -0.510396420955658, -0.48871955275535583, -0.4670426845550537, -0.4453658163547516, -0.42368894815444946, -0.40201207995414734, -0.3803352117538452, -0.3586583435535431, -0.33698147535324097, -0.31530460715293884, -0.2936277389526367, -0.2719508707523346, -0.25027400255203247, -0.22859713435173035, -0.20692026615142822, -0.1852433979511261, -0.16356652975082397, -0.14188966155052185, -0.12021279335021973, -0.0985359251499176, -0.07685905694961548, -0.055182188749313354, -0.03350532054901123, -0.011828452348709106, 0.009848475456237793, 0.03152534365653992, 0.05320221185684204, 0.07487908005714417, 0.09655594825744629, 0.11823281645774841, 0.13990968465805054, 0.16158655285835266, 0.18326342105865479, 0.2049402892589569, 0.22661715745925903, 0.24829402565956116, 0.2699708938598633, 0.2916477620601654, 0.31332463026046753, 0.33500149846076965, 0.3566783666610718, 0.3783552348613739, 0.400032103061676, 0.42170897126197815, 0.4433858394622803, 0.4650627076625824, 0.4867395758628845, 0.5084164142608643, 0.5300933122634888, 0.5517702102661133, 0.573447048664093, 0.5951238870620728, 0.6168007850646973, 0.6384776830673218, 0.6601545214653015, 0.6818313598632812, 0.7035082578659058]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 5.0, 3.0, 6.0, 5.0, 7.0, 12.0, 8.0, 17.0, 18.0, 18.0, 33.0, 27.0, 34.0, 39.0, 40.0, 41.0, 39.0, 46.0, 43.0, 33.0, 53.0, 58.0, 39.0, 40.0, 25.0, 49.0, 34.0, 32.0, 32.0, 26.0, 22.0, 18.0, 18.0, 24.0, 15.0, 9.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1987743377685547, -0.19270861148834229, -0.1866428703069687, -0.1805771440267563, -0.1745114028453827, -0.1684456765651703, -0.16237995028495789, -0.15631422400474548, -0.1502484828233719, -0.14418275654315948, -0.1381170153617859, -0.1320512890815735, -0.12598556280136108, -0.11991982161998749, -0.11385409533977509, -0.10778836160898209, -0.10172262787818909, -0.09565689414739609, -0.08959116041660309, -0.08352543413639069, -0.07745970040559769, -0.07139396667480469, -0.06532824039459229, -0.059262506663799286, -0.05319677293300629, -0.04713103920221329, -0.04106530919671059, -0.034999579191207886, -0.028933845460414886, -0.022868113592267036, -0.016802381724119186, -0.010736651718616486, -0.004670917987823486, 0.0013948138803243637, 0.007460545748472214, 0.013526277616620064, 0.019592009484767914, 0.025657741352915764, 0.031723473221063614, 0.037789203226566315, 0.043854936957359314, 0.04992067068815231, 0.055986400693655014, 0.062052130699157715, 0.06811786442995071, 0.07418359816074371, 0.08024932444095612, 0.08631505817174911, 0.09238079190254211, 0.09844652563333511, 0.10451225936412811, 0.11057798564434052, 0.11664371937513351, 0.12270945310592651, 0.12877517938613892, 0.13484090566635132, 0.14090664684772491, 0.14697237312793732, 0.1530381143093109, 0.15910384058952332, 0.16516956686973572, 0.17123530805110931, 0.17730103433132172, 0.1833667755126953, 0.18943250179290771]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 8.0, 10.0, 9.0, 13.0, 14.0, 16.0, 20.0, 27.0, 33.0, 29.0, 32.0, 36.0, 32.0, 41.0, 39.0, 30.0, 43.0, 45.0, 46.0, 38.0, 41.0, 33.0, 44.0, 41.0, 20.0, 35.0, 29.0, 26.0, 27.0, 18.0, 21.0, 12.0, 14.0, 13.0, 8.0, 10.0, 7.0, 7.0, 7.0, 7.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.50830078125, -4.3447265625, -4.18115234375, -4.017578125, -3.85400390625, -3.6904296875, -3.52685546875, -3.36328125, -3.19970703125, -3.0361328125, -2.87255859375, -2.708984375, -2.54541015625, -2.3818359375, -2.21826171875, -2.0546875, -1.89111328125, -1.7275390625, -1.56396484375, -1.400390625, -1.23681640625, -1.0732421875, -0.90966796875, -0.74609375, -0.58251953125, -0.4189453125, -0.25537109375, -0.091796875, 0.07177734375, 0.2353515625, 0.39892578125, 0.5625, 0.72607421875, 0.8896484375, 1.05322265625, 1.216796875, 1.38037109375, 1.5439453125, 1.70751953125, 1.87109375, 2.03466796875, 2.1982421875, 2.36181640625, 2.525390625, 2.68896484375, 2.8525390625, 3.01611328125, 3.1796875, 3.34326171875, 3.5068359375, 3.67041015625, 3.833984375, 3.99755859375, 4.1611328125, 4.32470703125, 4.48828125, 4.65185546875, 4.8154296875, 4.97900390625, 5.142578125, 5.30615234375, 5.4697265625, 5.63330078125, 5.796875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 7.0, 11.0, 22.0, 29.0, 25.0, 41.0, 45.0, 65.0, 109.0, 138.0, 236.0, 347.0, 545.0, 873.0, 1616.0, 2854.0, 5472.0, 11572.0, 28988.0, 94532.0, 385532.0, 370845.0, 92591.0, 28367.0, 11325.0, 5451.0, 2778.0, 1568.0, 936.0, 541.0, 350.0, 213.0, 125.0, 97.0, 75.0, 46.0, 38.0, 20.0, 25.0, 21.0, 16.0, 10.0, 14.0, 3.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-13.078125, -12.6693115234375, -12.260498046875, -11.8516845703125, -11.44287109375, -11.0340576171875, -10.625244140625, -10.2164306640625, -9.8076171875, -9.3988037109375, -8.989990234375, -8.5811767578125, -8.17236328125, -7.7635498046875, -7.354736328125, -6.9459228515625, -6.537109375, -6.1282958984375, -5.719482421875, -5.3106689453125, -4.90185546875, -4.4930419921875, -4.084228515625, -3.6754150390625, -3.2666015625, -2.8577880859375, -2.448974609375, -2.0401611328125, -1.63134765625, -1.2225341796875, -0.813720703125, -0.4049072265625, 0.00390625, 0.4127197265625, 0.821533203125, 1.2303466796875, 1.63916015625, 2.0479736328125, 2.456787109375, 2.8656005859375, 3.2744140625, 3.6832275390625, 4.092041015625, 4.5008544921875, 4.90966796875, 5.3184814453125, 5.727294921875, 6.1361083984375, 6.544921875, 6.9537353515625, 7.362548828125, 7.7713623046875, 8.18017578125, 8.5889892578125, 8.997802734375, 9.4066162109375, 9.8154296875, 10.2242431640625, 10.633056640625, 11.0418701171875, 11.45068359375, 11.8594970703125, 12.268310546875, 12.6771240234375, 13.0859375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 9.0, 7.0, 10.0, 22.0, 15.0, 24.0, 18.0, 28.0, 27.0, 25.0, 33.0, 46.0, 52.0, 54.0, 61.0, 93.0, 198.0, 1428.0, 254.0, 153.0, 81.0, 71.0, 49.0, 42.0, 44.0, 32.0, 29.0, 20.0, 14.0, 12.0, 19.0, 17.0, 9.0, 4.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.110595703125, -15.54931640625, -14.988037109375, -14.4267578125, -13.865478515625, -13.30419921875, -12.742919921875, -12.181640625, -11.620361328125, -11.05908203125, -10.497802734375, -9.9365234375, -9.375244140625, -8.81396484375, -8.252685546875, -7.69140625, -7.130126953125, -6.56884765625, -6.007568359375, -5.4462890625, -4.885009765625, -4.32373046875, -3.762451171875, -3.201171875, -2.639892578125, -2.07861328125, -1.517333984375, -0.9560546875, -0.394775390625, 0.16650390625, 0.727783203125, 1.2890625, 1.850341796875, 2.41162109375, 2.972900390625, 3.5341796875, 4.095458984375, 4.65673828125, 5.218017578125, 5.779296875, 6.340576171875, 6.90185546875, 7.463134765625, 8.0244140625, 8.585693359375, 9.14697265625, 9.708251953125, 10.26953125, 10.830810546875, 11.39208984375, 11.953369140625, 12.5146484375, 13.075927734375, 13.63720703125, 14.198486328125, 14.759765625, 15.321044921875, 15.88232421875, 16.443603515625, 17.0048828125, 17.566162109375, 18.12744140625, 18.688720703125, 19.25]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 4.0, 10.0, 12.0, 26.0, 17.0, 27.0, 30.0, 41.0, 44.0, 60.0, 122.0, 157.0, 239.0, 478.0, 1493.0, 5834.0, 41338.0, 1866752.0, 1186870.0, 34361.0, 5209.0, 1288.0, 442.0, 236.0, 165.0, 111.0, 81.0, 64.0, 40.0, 36.0, 28.0, 17.0, 23.0, 9.0, 13.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.875, -34.71630859375, -33.5576171875, -32.39892578125, -31.240234375, -30.08154296875, -28.9228515625, -27.76416015625, -26.60546875, -25.44677734375, -24.2880859375, -23.12939453125, -21.970703125, -20.81201171875, -19.6533203125, -18.49462890625, -17.3359375, -16.17724609375, -15.0185546875, -13.85986328125, -12.701171875, -11.54248046875, -10.3837890625, -9.22509765625, -8.06640625, -6.90771484375, -5.7490234375, -4.59033203125, -3.431640625, -2.27294921875, -1.1142578125, 0.04443359375, 1.203125, 2.36181640625, 3.5205078125, 4.67919921875, 5.837890625, 6.99658203125, 8.1552734375, 9.31396484375, 10.47265625, 11.63134765625, 12.7900390625, 13.94873046875, 15.107421875, 16.26611328125, 17.4248046875, 18.58349609375, 19.7421875, 20.90087890625, 22.0595703125, 23.21826171875, 24.376953125, 25.53564453125, 26.6943359375, 27.85302734375, 29.01171875, 30.17041015625, 31.3291015625, 32.48779296875, 33.646484375, 34.80517578125, 35.9638671875, 37.12255859375, 38.28125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 115.0, 588.0, 282.0, 20.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.159912109375, -60.217926025390625, -51.275943756103516, -42.333961486816406, -33.39197540283203, -24.449989318847656, -15.508007049560547, -6.5660247802734375, 2.3759613037109375, 11.31794548034668, 20.259929656982422, 29.201913833618164, 38.143898010253906, 47.08588409423828, 56.02786636352539, 64.9698486328125, 73.91183471679688, 82.85382080078125, 91.79580688476562, 100.73778533935547, 109.67977142333984, 118.62175750732422, 127.56373596191406, 136.50572204589844, 145.4477081298828, 154.3896942138672, 163.33168029785156, 172.27366638183594, 181.21563720703125, 190.15762329101562, 199.099609375, 208.04159545898438, 216.98355102539062, 225.925537109375, 234.86752319335938, 243.80950927734375, 252.75149536132812, 261.6934814453125, 270.6354675292969, 279.57745361328125, 288.5194091796875, 297.4613952636719, 306.40338134765625, 315.3453674316406, 324.287353515625, 333.2293395996094, 342.17132568359375, 351.11328125, 360.0552978515625, 368.9972839355469, 377.93927001953125, 386.8812561035156, 395.8232421875, 404.7652282714844, 413.70721435546875, 422.649169921875, 431.5911865234375, 440.5331726074219, 449.47515869140625, 458.4171447753906, 467.359130859375, 476.3011169433594, 485.24310302734375, 494.18505859375, 503.1270446777344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 3.0, 8.0, 6.0, 8.0, 8.0, 17.0, 17.0, 23.0, 24.0, 20.0, 17.0, 39.0, 24.0, 47.0, 34.0, 35.0, 39.0, 35.0, 45.0, 36.0, 46.0, 45.0, 29.0, 35.0, 32.0, 29.0, 35.0, 29.0, 34.0, 27.0, 28.0, 28.0, 13.0, 24.0, 10.0, 11.0, 11.0, 8.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.300865173339844, -48.71402359008789, -47.1271858215332, -45.54034423828125, -43.9535026550293, -42.366661071777344, -40.779823303222656, -39.1929817199707, -37.60614013671875, -36.0192985534668, -34.43246078491211, -32.845619201660156, -31.258777618408203, -29.671937942504883, -28.085098266601562, -26.49825668334961, -24.91141700744629, -23.32457733154297, -21.737735748291016, -20.150896072387695, -18.564054489135742, -16.977214813232422, -15.390374183654785, -13.803533554077148, -12.216692924499512, -10.629852294921875, -9.043011665344238, -7.45617151260376, -5.869330883026123, -4.282490253448486, -2.695650100708008, -1.108809471130371, 0.4780311584472656, 2.0648717880249023, 3.65171217918396, 5.238552570343018, 6.825393199920654, 8.412233352661133, 9.99907398223877, 11.585914611816406, 13.172755241394043, 14.75959587097168, 16.346435546875, 17.933277130126953, 19.520116806030273, 21.106958389282227, 22.693798065185547, 24.2806396484375, 25.86747932434082, 27.45431900024414, 29.041160583496094, 30.628000259399414, 32.214839935302734, 33.80168151855469, 35.38852310180664, 36.975364685058594, 38.56220245361328, 40.149044036865234, 41.73588180541992, 43.322723388671875, 44.90956497192383, 46.49640655517578, 48.08324432373047, 49.67008590698242, 51.256927490234375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 15.0, 7.0, 6.0, 12.0, 22.0, 22.0, 12.0, 28.0, 32.0, 31.0, 36.0, 31.0, 44.0, 31.0, 51.0, 49.0, 55.0, 51.0, 29.0, 28.0, 40.0, 36.0, 50.0, 25.0, 36.0, 28.0, 23.0, 24.0, 19.0, 24.0, 16.0, 13.0, 14.0, 7.0, 7.0, 10.0, 6.0, 10.0, 3.0, 4.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.78515625, -5.6036376953125, -5.422119140625, -5.2406005859375, -5.05908203125, -4.8775634765625, -4.696044921875, -4.5145263671875, -4.3330078125, -4.1514892578125, -3.969970703125, -3.7884521484375, -3.60693359375, -3.4254150390625, -3.243896484375, -3.0623779296875, -2.880859375, -2.6993408203125, -2.517822265625, -2.3363037109375, -2.15478515625, -1.9732666015625, -1.791748046875, -1.6102294921875, -1.4287109375, -1.2471923828125, -1.065673828125, -0.8841552734375, -0.70263671875, -0.5211181640625, -0.339599609375, -0.1580810546875, 0.0234375, 0.2049560546875, 0.386474609375, 0.5679931640625, 0.74951171875, 0.9310302734375, 1.112548828125, 1.2940673828125, 1.4755859375, 1.6571044921875, 1.838623046875, 2.0201416015625, 2.20166015625, 2.3831787109375, 2.564697265625, 2.7462158203125, 2.927734375, 3.1092529296875, 3.290771484375, 3.4722900390625, 3.65380859375, 3.8353271484375, 4.016845703125, 4.1983642578125, 4.3798828125, 4.5614013671875, 4.742919921875, 4.9244384765625, 5.10595703125, 5.2874755859375, 5.468994140625, 5.6505126953125, 5.83203125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 7.0, 6.0, 4.0, 17.0, 14.0, 18.0, 29.0, 37.0, 62.0, 91.0, 142.0, 241.0, 343.0, 598.0, 874.0, 1516.0, 2765.0, 4871.0, 9589.0, 21199.0, 59543.0, 245838.0, 1400733.0, 1944668.0, 368687.0, 80482.0, 26756.0, 11501.0, 5808.0, 3111.0, 1754.0, 1084.0, 675.0, 437.0, 263.0, 159.0, 109.0, 83.0, 55.0, 31.0, 25.0, 17.0, 11.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.0234375, -11.610595703125, -11.19775390625, -10.784912109375, -10.3720703125, -9.959228515625, -9.54638671875, -9.133544921875, -8.720703125, -8.307861328125, -7.89501953125, -7.482177734375, -7.0693359375, -6.656494140625, -6.24365234375, -5.830810546875, -5.41796875, -5.005126953125, -4.59228515625, -4.179443359375, -3.7666015625, -3.353759765625, -2.94091796875, -2.528076171875, -2.115234375, -1.702392578125, -1.28955078125, -0.876708984375, -0.4638671875, -0.051025390625, 0.36181640625, 0.774658203125, 1.1875, 1.600341796875, 2.01318359375, 2.426025390625, 2.8388671875, 3.251708984375, 3.66455078125, 4.077392578125, 4.490234375, 4.903076171875, 5.31591796875, 5.728759765625, 6.1416015625, 6.554443359375, 6.96728515625, 7.380126953125, 7.79296875, 8.205810546875, 8.61865234375, 9.031494140625, 9.4443359375, 9.857177734375, 10.27001953125, 10.682861328125, 11.095703125, 11.508544921875, 11.92138671875, 12.334228515625, 12.7470703125, 13.159912109375, 13.57275390625, 13.985595703125, 14.3984375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 11.0, 17.0, 18.0, 33.0, 35.0, 53.0, 98.0, 144.0, 268.0, 422.0, 668.0, 756.0, 549.0, 352.0, 229.0, 126.0, 87.0, 60.0, 32.0, 33.0, 14.0, 15.0, 12.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.511474609375, -14.89794921875, -14.284423828125, -13.6708984375, -13.057373046875, -12.44384765625, -11.830322265625, -11.216796875, -10.603271484375, -9.98974609375, -9.376220703125, -8.7626953125, -8.149169921875, -7.53564453125, -6.922119140625, -6.30859375, -5.695068359375, -5.08154296875, -4.468017578125, -3.8544921875, -3.240966796875, -2.62744140625, -2.013916015625, -1.400390625, -0.786865234375, -0.17333984375, 0.440185546875, 1.0537109375, 1.667236328125, 2.28076171875, 2.894287109375, 3.5078125, 4.121337890625, 4.73486328125, 5.348388671875, 5.9619140625, 6.575439453125, 7.18896484375, 7.802490234375, 8.416015625, 9.029541015625, 9.64306640625, 10.256591796875, 10.8701171875, 11.483642578125, 12.09716796875, 12.710693359375, 13.32421875, 13.937744140625, 14.55126953125, 15.164794921875, 15.7783203125, 16.391845703125, 17.00537109375, 17.618896484375, 18.232421875, 18.845947265625, 19.45947265625, 20.072998046875, 20.6865234375, 21.300048828125, 21.91357421875, 22.527099609375, 23.140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 2.0, 6.0, 6.0, 8.0, 26.0, 39.0, 56.0, 107.0, 196.0, 414.0, 965.0, 2183.0, 6603.0, 28921.0, 368870.0, 3592437.0, 165736.0, 19517.0, 4957.0, 1755.0, 765.0, 321.0, 170.0, 97.0, 42.0, 32.0, 13.0, 13.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-55.125, -53.650390625, -52.17578125, -50.701171875, -49.2265625, -47.751953125, -46.27734375, -44.802734375, -43.328125, -41.853515625, -40.37890625, -38.904296875, -37.4296875, -35.955078125, -34.48046875, -33.005859375, -31.53125, -30.056640625, -28.58203125, -27.107421875, -25.6328125, -24.158203125, -22.68359375, -21.208984375, -19.734375, -18.259765625, -16.78515625, -15.310546875, -13.8359375, -12.361328125, -10.88671875, -9.412109375, -7.9375, -6.462890625, -4.98828125, -3.513671875, -2.0390625, -0.564453125, 0.91015625, 2.384765625, 3.859375, 5.333984375, 6.80859375, 8.283203125, 9.7578125, 11.232421875, 12.70703125, 14.181640625, 15.65625, 17.130859375, 18.60546875, 20.080078125, 21.5546875, 23.029296875, 24.50390625, 25.978515625, 27.453125, 28.927734375, 30.40234375, 31.876953125, 33.3515625, 34.826171875, 36.30078125, 37.775390625, 39.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 18.0, 75.0, 215.0, 354.0, 219.0, 85.0, 17.0, 12.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-356.1386413574219, -347.74432373046875, -339.35003662109375, -330.9557189941406, -322.5614318847656, -314.1671142578125, -305.7728271484375, -297.3785095214844, -288.98419189453125, -280.5898742675781, -272.1955871582031, -263.80126953125, -255.406982421875, -247.01266479492188, -238.6183624267578, -230.22406005859375, -221.82977294921875, -213.4354705810547, -205.04116821289062, -196.64686584472656, -188.2525634765625, -179.85824584960938, -171.4639434814453, -163.06964111328125, -154.6753387451172, -146.28103637695312, -137.88673400878906, -129.492431640625, -121.0981216430664, -112.70381927490234, -104.30950927734375, -95.91520690917969, -87.52088928222656, -79.1265869140625, -70.73228454589844, -62.337974548339844, -53.94367218017578, -45.54936981201172, -37.15506362915039, -28.760757446289062, -20.366455078125, -11.972150802612305, -3.5778465270996094, 4.816457748413086, 13.210762023925781, 21.605064392089844, 29.999370574951172, 38.3936767578125, 46.78797912597656, 55.182281494140625, 63.57658767700195, 71.97089385986328, 80.36519622802734, 88.7594985961914, 97.15380859375, 105.54811096191406, 113.94241333007812, 122.33671569824219, 130.73101806640625, 139.1253204345703, 147.51962280273438, 155.9139404296875, 164.30824279785156, 172.70254516601562, 181.0968475341797]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 7.0, 8.0, 6.0, 9.0, 12.0, 17.0, 20.0, 20.0, 26.0, 16.0, 26.0, 27.0, 32.0, 38.0, 43.0, 36.0, 38.0, 42.0, 29.0, 33.0, 32.0, 41.0, 38.0, 41.0, 49.0, 39.0, 32.0, 24.0, 35.0, 26.0, 16.0, 22.0, 23.0, 18.0, 13.0, 9.0, 12.0, 8.0, 5.0, 5.0, 4.0, 4.0, 6.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-45.35698318481445, -43.886024475097656, -42.41506576538086, -40.94410705566406, -39.47314453125, -38.0021858215332, -36.531227111816406, -35.06026840209961, -33.58930969238281, -32.118350982666016, -30.647390365600586, -29.17643165588379, -27.70547103881836, -26.234512329101562, -24.763553619384766, -23.29259490966797, -21.821632385253906, -20.35067367553711, -18.87971305847168, -17.408754348754883, -15.93779468536377, -14.466835021972656, -12.99587631225586, -11.524916648864746, -10.053956985473633, -8.58299732208252, -7.1120381355285645, -5.641078948974609, -4.170119285583496, -2.699159622192383, -1.228200912475586, 0.24275875091552734, 1.713714599609375, 3.184674024581909, 4.655633449554443, 6.126592636108398, 7.597552299499512, 9.068511962890625, 10.539470672607422, 12.010430335998535, 13.481389999389648, 14.952349662780762, 16.423309326171875, 17.894268035888672, 19.36522674560547, 20.8361873626709, 22.307146072387695, 23.778106689453125, 25.249065399169922, 26.72002410888672, 28.19098472595215, 29.661943435668945, 31.132904052734375, 32.60386276245117, 34.07482147216797, 35.545780181884766, 37.01673889160156, 38.48769760131836, 39.958656311035156, 41.42961883544922, 42.900577545166016, 44.37153625488281, 45.84249496459961, 47.313453674316406, 48.78441619873047]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 9.0, 19.0, 9.0, 17.0, 17.0, 19.0, 20.0, 28.0, 19.0, 29.0, 22.0, 31.0, 29.0, 32.0, 35.0, 44.0, 42.0, 42.0, 33.0, 46.0, 40.0, 44.0, 40.0, 40.0, 38.0, 28.0, 23.0, 28.0, 23.0, 19.0, 21.0, 20.0, 16.0, 11.0, 10.0, 9.0, 8.0, 8.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.38671875, -5.2161865234375, -5.045654296875, -4.8751220703125, -4.70458984375, -4.5340576171875, -4.363525390625, -4.1929931640625, -4.0224609375, -3.8519287109375, -3.681396484375, -3.5108642578125, -3.34033203125, -3.1697998046875, -2.999267578125, -2.8287353515625, -2.658203125, -2.4876708984375, -2.317138671875, -2.1466064453125, -1.97607421875, -1.8055419921875, -1.635009765625, -1.4644775390625, -1.2939453125, -1.1234130859375, -0.952880859375, -0.7823486328125, -0.61181640625, -0.4412841796875, -0.270751953125, -0.1002197265625, 0.0703125, 0.2408447265625, 0.411376953125, 0.5819091796875, 0.75244140625, 0.9229736328125, 1.093505859375, 1.2640380859375, 1.4345703125, 1.6051025390625, 1.775634765625, 1.9461669921875, 2.11669921875, 2.2872314453125, 2.457763671875, 2.6282958984375, 2.798828125, 2.9693603515625, 3.139892578125, 3.3104248046875, 3.48095703125, 3.6514892578125, 3.822021484375, 3.9925537109375, 4.1630859375, 4.3336181640625, 4.504150390625, 4.6746826171875, 4.84521484375, 5.0157470703125, 5.186279296875, 5.3568115234375, 5.52734375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 11.0, 14.0, 10.0, 23.0, 31.0, 45.0, 67.0, 104.0, 110.0, 208.0, 296.0, 490.0, 870.0, 1518.0, 2780.0, 5383.0, 11617.0, 26118.0, 61096.0, 140460.0, 275678.0, 274261.0, 137874.0, 60290.0, 25973.0, 11286.0, 5468.0, 2713.0, 1484.0, 819.0, 494.0, 301.0, 203.0, 137.0, 88.0, 71.0, 47.0, 29.0, 15.0, 19.0, 10.0, 6.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.398681640625, -2.31298828125, -2.227294921875, -2.1416015625, -2.055908203125, -1.97021484375, -1.884521484375, -1.798828125, -1.713134765625, -1.62744140625, -1.541748046875, -1.4560546875, -1.370361328125, -1.28466796875, -1.198974609375, -1.11328125, -1.027587890625, -0.94189453125, -0.856201171875, -0.7705078125, -0.684814453125, -0.59912109375, -0.513427734375, -0.427734375, -0.342041015625, -0.25634765625, -0.170654296875, -0.0849609375, 0.000732421875, 0.08642578125, 0.172119140625, 0.2578125, 0.343505859375, 0.42919921875, 0.514892578125, 0.6005859375, 0.686279296875, 0.77197265625, 0.857666015625, 0.943359375, 1.029052734375, 1.11474609375, 1.200439453125, 1.2861328125, 1.371826171875, 1.45751953125, 1.543212890625, 1.62890625, 1.714599609375, 1.80029296875, 1.885986328125, 1.9716796875, 2.057373046875, 2.14306640625, 2.228759765625, 2.314453125, 2.400146484375, 2.48583984375, 2.571533203125, 2.6572265625, 2.742919921875, 2.82861328125, 2.914306640625, 3.0]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 3.0, 7.0, 7.0, 7.0, 8.0, 5.0, 7.0, 16.0, 16.0, 28.0, 17.0, 15.0, 22.0, 24.0, 36.0, 30.0, 25.0, 38.0, 35.0, 48.0, 42.0, 31.0, 1067.0, 46.0, 42.0, 40.0, 49.0, 42.0, 35.0, 29.0, 31.0, 24.0, 32.0, 16.0, 19.0, 14.0, 17.0, 8.0, 13.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.4453125, -4.309326171875, -4.17333984375, -4.037353515625, -3.9013671875, -3.765380859375, -3.62939453125, -3.493408203125, -3.357421875, -3.221435546875, -3.08544921875, -2.949462890625, -2.8134765625, -2.677490234375, -2.54150390625, -2.405517578125, -2.26953125, -2.133544921875, -1.99755859375, -1.861572265625, -1.7255859375, -1.589599609375, -1.45361328125, -1.317626953125, -1.181640625, -1.045654296875, -0.90966796875, -0.773681640625, -0.6376953125, -0.501708984375, -0.36572265625, -0.229736328125, -0.09375, 0.042236328125, 0.17822265625, 0.314208984375, 0.4501953125, 0.586181640625, 0.72216796875, 0.858154296875, 0.994140625, 1.130126953125, 1.26611328125, 1.402099609375, 1.5380859375, 1.674072265625, 1.81005859375, 1.946044921875, 2.08203125, 2.218017578125, 2.35400390625, 2.489990234375, 2.6259765625, 2.761962890625, 2.89794921875, 3.033935546875, 3.169921875, 3.305908203125, 3.44189453125, 3.577880859375, 3.7138671875, 3.849853515625, 3.98583984375, 4.121826171875, 4.2578125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 14.0, 20.0, 24.0, 35.0, 59.0, 96.0, 196.0, 417.0, 972.0, 2589.0, 7324.0, 25095.0, 731978.0, 1290961.0, 25456.0, 7398.0, 2638.0, 982.0, 420.0, 201.0, 107.0, 56.0, 33.0, 26.0, 9.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0078125, -6.7662353515625, -6.524658203125, -6.2830810546875, -6.04150390625, -5.7999267578125, -5.558349609375, -5.3167724609375, -5.0751953125, -4.8336181640625, -4.592041015625, -4.3504638671875, -4.10888671875, -3.8673095703125, -3.625732421875, -3.3841552734375, -3.142578125, -2.9010009765625, -2.659423828125, -2.4178466796875, -2.17626953125, -1.9346923828125, -1.693115234375, -1.4515380859375, -1.2099609375, -0.9683837890625, -0.726806640625, -0.4852294921875, -0.24365234375, -0.0020751953125, 0.239501953125, 0.4810791015625, 0.72265625, 0.9642333984375, 1.205810546875, 1.4473876953125, 1.68896484375, 1.9305419921875, 2.172119140625, 2.4136962890625, 2.6552734375, 2.8968505859375, 3.138427734375, 3.3800048828125, 3.62158203125, 3.8631591796875, 4.104736328125, 4.3463134765625, 4.587890625, 4.8294677734375, 5.071044921875, 5.3126220703125, 5.55419921875, 5.7957763671875, 6.037353515625, 6.2789306640625, 6.5205078125, 6.7620849609375, 7.003662109375, 7.2452392578125, 7.48681640625, 7.7283935546875, 7.969970703125, 8.2115478515625, 8.453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 7.0, 4.0, 6.0, 7.0, 11.0, 10.0, 13.0, 16.0, 21.0, 19.0, 20.0, 27.0, 40.0, 43.0, 45.0, 59.0, 71.0, 60.0, 51.0, 71.0, 44.0, 44.0, 57.0, 38.0, 43.0, 24.0, 22.0, 17.0, 18.0, 16.0, 16.0, 14.0, 7.0, 11.0, 4.0, 4.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.166015625, -0.1614398956298828, -0.15686416625976562, -0.15228843688964844, -0.14771270751953125, -0.14313697814941406, -0.13856124877929688, -0.1339855194091797, -0.1294097900390625, -0.12483406066894531, -0.12025833129882812, -0.11568260192871094, -0.11110687255859375, -0.10653114318847656, -0.10195541381835938, -0.09737968444824219, -0.092803955078125, -0.08822822570800781, -0.08365249633789062, -0.07907676696777344, -0.07450103759765625, -0.06992530822753906, -0.06534957885742188, -0.06077384948730469, -0.0561981201171875, -0.05162239074707031, -0.047046661376953125, -0.04247093200683594, -0.03789520263671875, -0.03331947326660156, -0.028743743896484375, -0.024168014526367188, -0.01959228515625, -0.015016555786132812, -0.010440826416015625, -0.0058650970458984375, -0.00128936767578125, 0.0032863616943359375, 0.007862091064453125, 0.012437820434570312, 0.0170135498046875, 0.021589279174804688, 0.026165008544921875, 0.030740737915039062, 0.03531646728515625, 0.03989219665527344, 0.044467926025390625, 0.04904365539550781, 0.053619384765625, 0.05819511413574219, 0.06277084350585938, 0.06734657287597656, 0.07192230224609375, 0.07649803161621094, 0.08107376098632812, 0.08564949035644531, 0.0902252197265625, 0.09480094909667969, 0.09937667846679688, 0.10395240783691406, 0.10852813720703125, 0.11310386657714844, 0.11767959594726562, 0.12225532531738281, 0.1268310546875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 5.0, 14.0, 8.0, 12.0, 15.0, 24.0, 32.0, 33.0, 57.0, 45.0, 94.0, 127.0, 191.0, 374.0, 954.0, 5435.0, 66001.0, 829115.0, 134353.0, 9116.0, 1345.0, 427.0, 216.0, 152.0, 96.0, 67.0, 53.0, 42.0, 25.0, 28.0, 17.0, 13.0, 10.0, 8.0, 9.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.85546875, -1.792816162109375, -1.73016357421875, -1.667510986328125, -1.6048583984375, -1.542205810546875, -1.47955322265625, -1.416900634765625, -1.354248046875, -1.291595458984375, -1.22894287109375, -1.166290283203125, -1.1036376953125, -1.040985107421875, -0.97833251953125, -0.915679931640625, -0.85302734375, -0.790374755859375, -0.72772216796875, -0.665069580078125, -0.6024169921875, -0.539764404296875, -0.47711181640625, -0.414459228515625, -0.351806640625, -0.289154052734375, -0.22650146484375, -0.163848876953125, -0.1011962890625, -0.038543701171875, 0.02410888671875, 0.086761474609375, 0.1494140625, 0.212066650390625, 0.27471923828125, 0.337371826171875, 0.4000244140625, 0.462677001953125, 0.52532958984375, 0.587982177734375, 0.650634765625, 0.713287353515625, 0.77593994140625, 0.838592529296875, 0.9012451171875, 0.963897705078125, 1.02655029296875, 1.089202880859375, 1.15185546875, 1.214508056640625, 1.27716064453125, 1.339813232421875, 1.4024658203125, 1.465118408203125, 1.52777099609375, 1.590423583984375, 1.653076171875, 1.715728759765625, 1.77838134765625, 1.841033935546875, 1.9036865234375, 1.966339111328125, 2.02899169921875, 2.091644287109375, 2.154296875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 34.0, 328.0, 512.0, 122.0, 18.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669957160949707, -1.8858271837234497, -1.8046586513519287, -1.7234902381896973, -1.6423217058181763, -1.5611531734466553, -1.4799846410751343, -1.3988161087036133, -1.3176476955413818, -1.2364791631698608, -1.1553106307983398, -1.0741422176361084, -0.9929736852645874, -0.9118051528930664, -0.8306366205215454, -0.7494681477546692, -0.6682995557785034, -0.5871310234069824, -0.5059625506401062, -0.4247940182685852, -0.3436255156993866, -0.262457013130188, -0.181288480758667, -0.10012000799179077, -0.018951475620269775, 0.06221703439950943, 0.14338554441928864, 0.22455406188964844, 0.30572256445884705, 0.38689106702804565, 0.46805959939956665, 0.5492280721664429, 0.6303966045379639, 0.7115651369094849, 0.7927336096763611, 0.8739021420478821, 0.9550706148147583, 1.0362391471862793, 1.1174076795578003, 1.1985762119293213, 1.2797446250915527, 1.3609131574630737, 1.4420816898345947, 1.5232501029968262, 1.6044186353683472, 1.6855871677398682, 1.7667557001113892, 1.8479242324829102, 1.9290927648544312, 2.010261297225952, 2.0914297103881836, 2.172598361968994, 2.2537667751312256, 2.334935188293457, 2.4161038398742676, 2.497272253036499, 2.5784409046173096, 2.659609317779541, 2.7407779693603516, 2.821946382522583, 2.9031150341033936, 2.984283447265625, 3.0654520988464355, 3.146620512008667, 3.2277889251708984]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 5.0, 13.0, 10.0, 10.0, 17.0, 19.0, 20.0, 21.0, 26.0, 27.0, 21.0, 27.0, 37.0, 38.0, 26.0, 38.0, 31.0, 40.0, 55.0, 43.0, 49.0, 41.0, 49.0, 37.0, 34.0, 32.0, 36.0, 26.0, 20.0, 22.0, 22.0, 17.0, 15.0, 15.0, 17.0, 10.0, 5.0, 7.0, 2.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2727521061897278, -0.26455652713775635, -0.2563609480857849, -0.2481653392314911, -0.23996976017951965, -0.23177418112754822, -0.2235785871744156, -0.21538299322128296, -0.20718741416931152, -0.1989918351173401, -0.19079624116420746, -0.18260064721107483, -0.1744050681591034, -0.16620948910713196, -0.15801389515399933, -0.1498183012008667, -0.14162272214889526, -0.13342714309692383, -0.1252315491437912, -0.11703596264123917, -0.10884037613868713, -0.1006447896361351, -0.09244920313358307, -0.08425361663103104, -0.076058030128479, -0.06786244362592697, -0.05966685712337494, -0.051471270620822906, -0.043275684118270874, -0.03508009761571884, -0.02688451111316681, -0.018688924610614777, -0.010493338108062744, -0.0022977516055107117, 0.005897834897041321, 0.014093421399593353, 0.022289007902145386, 0.030484594404697418, 0.03868018090724945, 0.04687576740980148, 0.055071353912353516, 0.06326694041490555, 0.07146252691745758, 0.07965811342000961, 0.08785369992256165, 0.09604928642511368, 0.10424487292766571, 0.11244045943021774, 0.12063604593276978, 0.1288316249847412, 0.13702721893787384, 0.14522281289100647, 0.1534183919429779, 0.16161397099494934, 0.16980956494808197, 0.1780051589012146, 0.18620073795318604, 0.19439631700515747, 0.2025919109582901, 0.21078750491142273, 0.21898308396339417, 0.2271786630153656, 0.23537425696849823, 0.24356985092163086, 0.2517654299736023]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 10.0, 20.0, 7.0, 17.0, 18.0, 18.0, 24.0, 28.0, 17.0, 29.0, 22.0, 34.0, 27.0, 28.0, 38.0, 43.0, 40.0, 46.0, 33.0, 46.0, 40.0, 42.0, 40.0, 43.0, 35.0, 29.0, 24.0, 26.0, 23.0, 20.0, 20.0, 20.0, 15.0, 12.0, 10.0, 9.0, 7.0, 9.0, 2.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.3828125, -5.2120361328125, -5.041259765625, -4.8704833984375, -4.69970703125, -4.5289306640625, -4.358154296875, -4.1873779296875, -4.0166015625, -3.8458251953125, -3.675048828125, -3.5042724609375, -3.33349609375, -3.1627197265625, -2.991943359375, -2.8211669921875, -2.650390625, -2.4796142578125, -2.308837890625, -2.1380615234375, -1.96728515625, -1.7965087890625, -1.625732421875, -1.4549560546875, -1.2841796875, -1.1134033203125, -0.942626953125, -0.7718505859375, -0.60107421875, -0.4302978515625, -0.259521484375, -0.0887451171875, 0.08203125, 0.2528076171875, 0.423583984375, 0.5943603515625, 0.76513671875, 0.9359130859375, 1.106689453125, 1.2774658203125, 1.4482421875, 1.6190185546875, 1.789794921875, 1.9605712890625, 2.13134765625, 2.3021240234375, 2.472900390625, 2.6436767578125, 2.814453125, 2.9852294921875, 3.156005859375, 3.3267822265625, 3.49755859375, 3.6683349609375, 3.839111328125, 4.0098876953125, 4.1806640625, 4.3514404296875, 4.522216796875, 4.6929931640625, 4.86376953125, 5.0345458984375, 5.205322265625, 5.3760986328125, 5.546875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 11.0, 13.0, 9.0, 20.0, 27.0, 27.0, 37.0, 64.0, 82.0, 109.0, 174.0, 265.0, 364.0, 507.0, 848.0, 1303.0, 2055.0, 3453.0, 5843.0, 10986.0, 22724.0, 55215.0, 149862.0, 381960.0, 247658.0, 93215.0, 35775.0, 15852.0, 8076.0, 4403.0, 2737.0, 1650.0, 1085.0, 716.0, 465.0, 291.0, 203.0, 122.0, 95.0, 68.0, 47.0, 39.0, 28.0, 22.0, 13.0, 19.0, 7.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.213623046875, -10.84912109375, -10.484619140625, -10.1201171875, -9.755615234375, -9.39111328125, -9.026611328125, -8.662109375, -8.297607421875, -7.93310546875, -7.568603515625, -7.2041015625, -6.839599609375, -6.47509765625, -6.110595703125, -5.74609375, -5.381591796875, -5.01708984375, -4.652587890625, -4.2880859375, -3.923583984375, -3.55908203125, -3.194580078125, -2.830078125, -2.465576171875, -2.10107421875, -1.736572265625, -1.3720703125, -1.007568359375, -0.64306640625, -0.278564453125, 0.0859375, 0.450439453125, 0.81494140625, 1.179443359375, 1.5439453125, 1.908447265625, 2.27294921875, 2.637451171875, 3.001953125, 3.366455078125, 3.73095703125, 4.095458984375, 4.4599609375, 4.824462890625, 5.18896484375, 5.553466796875, 5.91796875, 6.282470703125, 6.64697265625, 7.011474609375, 7.3759765625, 7.740478515625, 8.10498046875, 8.469482421875, 8.833984375, 9.198486328125, 9.56298828125, 9.927490234375, 10.2919921875, 10.656494140625, 11.02099609375, 11.385498046875, 11.75]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 5.0, 2.0, 19.0, 17.0, 19.0, 22.0, 26.0, 30.0, 37.0, 41.0, 56.0, 87.0, 124.0, 207.0, 1362.0, 303.0, 202.0, 112.0, 73.0, 53.0, 51.0, 33.0, 34.0, 23.0, 31.0, 13.0, 15.0, 14.0, 11.0, 3.0, 3.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.33154296875, -18.5224609375, -17.71337890625, -16.904296875, -16.09521484375, -15.2861328125, -14.47705078125, -13.66796875, -12.85888671875, -12.0498046875, -11.24072265625, -10.431640625, -9.62255859375, -8.8134765625, -8.00439453125, -7.1953125, -6.38623046875, -5.5771484375, -4.76806640625, -3.958984375, -3.14990234375, -2.3408203125, -1.53173828125, -0.72265625, 0.08642578125, 0.8955078125, 1.70458984375, 2.513671875, 3.32275390625, 4.1318359375, 4.94091796875, 5.75, 6.55908203125, 7.3681640625, 8.17724609375, 8.986328125, 9.79541015625, 10.6044921875, 11.41357421875, 12.22265625, 13.03173828125, 13.8408203125, 14.64990234375, 15.458984375, 16.26806640625, 17.0771484375, 17.88623046875, 18.6953125, 19.50439453125, 20.3134765625, 21.12255859375, 21.931640625, 22.74072265625, 23.5498046875, 24.35888671875, 25.16796875, 25.97705078125, 26.7861328125, 27.59521484375, 28.404296875, 29.21337890625, 30.0224609375, 30.83154296875, 31.640625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 17.0, 15.0, 28.0, 56.0, 94.0, 195.0, 455.0, 1353.0, 9415.0, 2044532.0, 1079621.0, 7901.0, 1246.0, 382.0, 194.0, 75.0, 44.0, 23.0, 7.0, 8.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.9375, -96.0244140625, -93.111328125, -90.1982421875, -87.28515625, -84.3720703125, -81.458984375, -78.5458984375, -75.6328125, -72.7197265625, -69.806640625, -66.8935546875, -63.98046875, -61.0673828125, -58.154296875, -55.2412109375, -52.328125, -49.4150390625, -46.501953125, -43.5888671875, -40.67578125, -37.7626953125, -34.849609375, -31.9365234375, -29.0234375, -26.1103515625, -23.197265625, -20.2841796875, -17.37109375, -14.4580078125, -11.544921875, -8.6318359375, -5.71875, -2.8056640625, 0.107421875, 3.0205078125, 5.93359375, 8.8466796875, 11.759765625, 14.6728515625, 17.5859375, 20.4990234375, 23.412109375, 26.3251953125, 29.23828125, 32.1513671875, 35.064453125, 37.9775390625, 40.890625, 43.8037109375, 46.716796875, 49.6298828125, 52.54296875, 55.4560546875, 58.369140625, 61.2822265625, 64.1953125, 67.1083984375, 70.021484375, 72.9345703125, 75.84765625, 78.7607421875, 81.673828125, 84.5869140625, 87.5]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [7.0, 202.0, 755.0, 52.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71675109863281, -19.81415557861328, -4.91156005859375, 9.991035461425781, 24.893630981445312, 39.796226501464844, 54.698822021484375, 69.6014175415039, 84.50401306152344, 99.40660858154297, 114.3092041015625, 129.2117919921875, 144.11439514160156, 159.01699829101562, 173.91958618164062, 188.82217407226562, 203.7247772216797, 218.62738037109375, 233.52996826171875, 248.43255615234375, 263.33514404296875, 278.2377624511719, 293.1403503417969, 308.0429382324219, 322.945556640625, 337.84814453125, 352.750732421875, 367.6533508300781, 382.5559387207031, 397.4585266113281, 412.36114501953125, 427.26373291015625, 442.16632080078125, 457.06890869140625, 471.97149658203125, 486.8741149902344, 501.7767028808594, 516.6793212890625, 531.5819091796875, 546.4844970703125, 561.3870849609375, 576.2896728515625, 591.1922607421875, 606.0948486328125, 620.9974365234375, 635.9000854492188, 650.8026733398438, 665.7052612304688, 680.6078491210938, 695.5104370117188, 710.4130249023438, 725.3156127929688, 740.21826171875, 755.120849609375, 770.0234375, 784.926025390625, 799.82861328125, 814.731201171875, 829.6337890625, 844.536376953125, 859.43896484375, 874.3416137695312, 889.2442016601562, 904.1467895507812, 919.0493774414062]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 5.0, 10.0, 8.0, 9.0, 14.0, 15.0, 20.0, 15.0, 21.0, 26.0, 23.0, 22.0, 35.0, 31.0, 35.0, 31.0, 37.0, 36.0, 34.0, 35.0, 38.0, 28.0, 40.0, 52.0, 41.0, 45.0, 34.0, 34.0, 36.0, 22.0, 14.0, 17.0, 24.0, 21.0, 17.0, 12.0, 9.0, 15.0, 14.0, 5.0, 9.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-55.6558723449707, -53.93042755126953, -52.20498275756836, -50.47953796386719, -48.75409698486328, -47.02865219116211, -45.30320739746094, -43.577762603759766, -41.852317810058594, -40.12687301635742, -38.40142822265625, -36.675987243652344, -34.95054244995117, -33.22509765625, -31.499652862548828, -29.774208068847656, -28.048765182495117, -26.323320388793945, -24.597877502441406, -22.872432708740234, -21.146987915039062, -19.42154312133789, -17.69610023498535, -15.97065544128418, -14.245211601257324, -12.519767761230469, -10.794322967529297, -9.068879127502441, -7.343434810638428, -5.617990493774414, -3.8925466537475586, -2.1671018600463867, -0.44165802001953125, 1.2837861776351929, 3.009230375289917, 4.734674453735352, 6.460118770599365, 8.185563087463379, 9.911006927490234, 11.636451721191406, 13.361895561218262, 15.087339401245117, 16.81278419494629, 18.538227081298828, 20.263671875, 21.989116668701172, 23.714561462402344, 25.440006256103516, 27.165449142456055, 28.890893936157227, 30.616336822509766, 32.34178161621094, 34.06722640991211, 35.79267120361328, 37.51811218261719, 39.243560791015625, 40.96900177001953, 42.6944465637207, 44.419891357421875, 46.14533233642578, 47.87077713012695, 49.596221923828125, 51.3216667175293, 53.04711151123047, 54.77255630493164]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 16.0, 6.0, 13.0, 17.0, 20.0, 15.0, 17.0, 25.0, 31.0, 21.0, 33.0, 41.0, 38.0, 36.0, 40.0, 39.0, 47.0, 51.0, 37.0, 47.0, 44.0, 49.0, 46.0, 20.0, 34.0, 37.0, 23.0, 23.0, 19.0, 17.0, 12.0, 13.0, 12.0, 14.0, 9.0, 5.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.73516845703125, -5.5289306640625, -5.32269287109375, -5.116455078125, -4.91021728515625, -4.7039794921875, -4.49774169921875, -4.29150390625, -4.08526611328125, -3.8790283203125, -3.67279052734375, -3.466552734375, -3.26031494140625, -3.0540771484375, -2.84783935546875, -2.6416015625, -2.43536376953125, -2.2291259765625, -2.02288818359375, -1.816650390625, -1.61041259765625, -1.4041748046875, -1.19793701171875, -0.99169921875, -0.78546142578125, -0.5792236328125, -0.37298583984375, -0.166748046875, 0.03948974609375, 0.2457275390625, 0.45196533203125, 0.658203125, 0.86444091796875, 1.0706787109375, 1.27691650390625, 1.483154296875, 1.68939208984375, 1.8956298828125, 2.10186767578125, 2.30810546875, 2.51434326171875, 2.7205810546875, 2.92681884765625, 3.133056640625, 3.33929443359375, 3.5455322265625, 3.75177001953125, 3.9580078125, 4.16424560546875, 4.3704833984375, 4.57672119140625, 4.782958984375, 4.98919677734375, 5.1954345703125, 5.40167236328125, 5.60791015625, 5.81414794921875, 6.0203857421875, 6.22662353515625, 6.432861328125, 6.63909912109375, 6.8453369140625, 7.05157470703125, 7.2578125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 12.0, 24.0, 20.0, 22.0, 39.0, 38.0, 71.0, 118.0, 111.0, 211.0, 288.0, 414.0, 570.0, 894.0, 1154.0, 1805.0, 2624.0, 4321.0, 6865.0, 11792.0, 23693.0, 58015.0, 192704.0, 801885.0, 1979623.0, 805856.0, 187839.0, 57606.0, 23850.0, 11994.0, 6969.0, 4240.0, 2752.0, 1873.0, 1262.0, 863.0, 589.0, 359.0, 266.0, 185.0, 117.0, 95.0, 66.0, 49.0, 52.0, 32.0, 17.0, 13.0, 11.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.796875, -10.4541015625, -10.111328125, -9.7685546875, -9.42578125, -9.0830078125, -8.740234375, -8.3974609375, -8.0546875, -7.7119140625, -7.369140625, -7.0263671875, -6.68359375, -6.3408203125, -5.998046875, -5.6552734375, -5.3125, -4.9697265625, -4.626953125, -4.2841796875, -3.94140625, -3.5986328125, -3.255859375, -2.9130859375, -2.5703125, -2.2275390625, -1.884765625, -1.5419921875, -1.19921875, -0.8564453125, -0.513671875, -0.1708984375, 0.171875, 0.5146484375, 0.857421875, 1.2001953125, 1.54296875, 1.8857421875, 2.228515625, 2.5712890625, 2.9140625, 3.2568359375, 3.599609375, 3.9423828125, 4.28515625, 4.6279296875, 4.970703125, 5.3134765625, 5.65625, 5.9990234375, 6.341796875, 6.6845703125, 7.02734375, 7.3701171875, 7.712890625, 8.0556640625, 8.3984375, 8.7412109375, 9.083984375, 9.4267578125, 9.76953125, 10.1123046875, 10.455078125, 10.7978515625, 11.140625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 8.0, 15.0, 16.0, 19.0, 34.0, 56.0, 54.0, 82.0, 125.0, 209.0, 298.0, 456.0, 616.0, 625.0, 490.0, 264.0, 212.0, 124.0, 85.0, 69.0, 47.0, 39.0, 29.0, 23.0, 19.0, 10.0, 4.0, 6.0, 7.0, 7.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.2724609375, -14.748046875, -14.2236328125, -13.69921875, -13.1748046875, -12.650390625, -12.1259765625, -11.6015625, -11.0771484375, -10.552734375, -10.0283203125, -9.50390625, -8.9794921875, -8.455078125, -7.9306640625, -7.40625, -6.8818359375, -6.357421875, -5.8330078125, -5.30859375, -4.7841796875, -4.259765625, -3.7353515625, -3.2109375, -2.6865234375, -2.162109375, -1.6376953125, -1.11328125, -0.5888671875, -0.064453125, 0.4599609375, 0.984375, 1.5087890625, 2.033203125, 2.5576171875, 3.08203125, 3.6064453125, 4.130859375, 4.6552734375, 5.1796875, 5.7041015625, 6.228515625, 6.7529296875, 7.27734375, 7.8017578125, 8.326171875, 8.8505859375, 9.375, 9.8994140625, 10.423828125, 10.9482421875, 11.47265625, 11.9970703125, 12.521484375, 13.0458984375, 13.5703125, 14.0947265625, 14.619140625, 15.1435546875, 15.66796875, 16.1923828125, 16.716796875, 17.2412109375, 17.765625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 10.0, 4.0, 15.0, 18.0, 36.0, 53.0, 75.0, 112.0, 202.0, 411.0, 935.0, 2075.0, 6156.0, 21447.0, 136459.0, 2893363.0, 1047379.0, 64646.0, 13596.0, 4325.0, 1593.0, 611.0, 305.0, 163.0, 88.0, 57.0, 41.0, 30.0, 24.0, 13.0, 6.0, 2.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.03125, -39.818359375, -38.60546875, -37.392578125, -36.1796875, -34.966796875, -33.75390625, -32.541015625, -31.328125, -30.115234375, -28.90234375, -27.689453125, -26.4765625, -25.263671875, -24.05078125, -22.837890625, -21.625, -20.412109375, -19.19921875, -17.986328125, -16.7734375, -15.560546875, -14.34765625, -13.134765625, -11.921875, -10.708984375, -9.49609375, -8.283203125, -7.0703125, -5.857421875, -4.64453125, -3.431640625, -2.21875, -1.005859375, 0.20703125, 1.419921875, 2.6328125, 3.845703125, 5.05859375, 6.271484375, 7.484375, 8.697265625, 9.91015625, 11.123046875, 12.3359375, 13.548828125, 14.76171875, 15.974609375, 17.1875, 18.400390625, 19.61328125, 20.826171875, 22.0390625, 23.251953125, 24.46484375, 25.677734375, 26.890625, 28.103515625, 29.31640625, 30.529296875, 31.7421875, 32.955078125, 34.16796875, 35.380859375, 36.59375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 16.0, 84.0, 213.0, 341.0, 241.0, 85.0, 27.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-318.90814208984375, -310.41888427734375, -301.9295959472656, -293.4403381347656, -284.9510803222656, -276.4618225097656, -267.9725341796875, -259.4832763671875, -250.9940185546875, -242.50474548339844, -234.01548767089844, -225.52621459960938, -217.03695678710938, -208.5476837158203, -200.05841064453125, -191.56915283203125, -183.0798797607422, -174.59060668945312, -166.10134887695312, -157.61207580566406, -149.12281799316406, -140.633544921875, -132.144287109375, -123.65501403808594, -115.1657485961914, -106.67648315429688, -98.18721771240234, -89.69795227050781, -81.20867919921875, -72.71942138671875, -64.23014831542969, -55.740882873535156, -47.25160217285156, -38.76233673095703, -30.273069381713867, -21.783802032470703, -13.294536590576172, -4.805271148681641, 3.6839981079101562, 12.173263549804688, 20.66252899169922, 29.15179443359375, 37.64105987548828, 46.13032913208008, 54.61959457397461, 63.10886001586914, 71.59812927246094, 80.08739471435547, 88.57666015625, 97.06592559814453, 105.55519104003906, 114.04446411132812, 122.53372192382812, 131.0229949951172, 139.51226806640625, 148.00152587890625, 156.49078369140625, 164.9800567626953, 173.4693145751953, 181.95858764648438, 190.44784545898438, 198.93711853027344, 207.4263916015625, 215.9156494140625, 224.40492248535156]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 3.0, 10.0, 13.0, 10.0, 17.0, 11.0, 22.0, 27.0, 23.0, 29.0, 26.0, 32.0, 25.0, 43.0, 40.0, 32.0, 39.0, 34.0, 41.0, 34.0, 54.0, 38.0, 37.0, 33.0, 45.0, 26.0, 27.0, 26.0, 29.0, 21.0, 25.0, 21.0, 22.0, 15.0, 12.0, 15.0, 8.0, 9.0, 11.0, 5.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.80941390991211, -47.3341064453125, -45.85879898071289, -44.38349151611328, -42.90818786621094, -41.43288040161133, -39.95757293701172, -38.48226547241211, -37.0069580078125, -35.53165054321289, -34.05634307861328, -32.58103561401367, -31.105730056762695, -29.630422592163086, -28.15511703491211, -26.6798095703125, -25.20450210571289, -23.72919464111328, -22.253887176513672, -20.778581619262695, -19.303274154663086, -17.827966690063477, -16.3526611328125, -14.87735366821289, -13.402046203613281, -11.926738739013672, -10.451432228088379, -8.976125717163086, -7.500818252563477, -6.025511264801025, -4.550204277038574, -3.0748977661132812, -1.5995941162109375, -0.12428712844848633, 1.3510198593139648, 2.826326847076416, 4.301633834838867, 5.776940822601318, 7.2522478103637695, 8.727554321289062, 10.202861785888672, 11.678169250488281, 13.153475761413574, 14.628782272338867, 16.104089736938477, 17.579397201538086, 19.054702758789062, 20.530010223388672, 22.00531768798828, 23.48062515258789, 24.9559326171875, 26.431238174438477, 27.906545639038086, 29.381853103637695, 30.857158660888672, 32.33246612548828, 33.80777359008789, 35.2830810546875, 36.75838851928711, 38.23369598388672, 39.70899963378906, 41.18430709838867, 42.65961456298828, 44.13492202758789, 45.6102294921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 1.0, 4.0, 5.0, 8.0, 9.0, 9.0, 15.0, 16.0, 9.0, 9.0, 22.0, 24.0, 22.0, 23.0, 32.0, 33.0, 31.0, 41.0, 40.0, 47.0, 44.0, 42.0, 44.0, 46.0, 39.0, 44.0, 25.0, 30.0, 33.0, 28.0, 33.0, 30.0, 23.0, 26.0, 18.0, 8.0, 18.0, 14.0, 9.0, 10.0, 10.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-6.45703125, -6.26373291015625, -6.0704345703125, -5.87713623046875, -5.683837890625, -5.49053955078125, -5.2972412109375, -5.10394287109375, -4.91064453125, -4.71734619140625, -4.5240478515625, -4.33074951171875, -4.137451171875, -3.94415283203125, -3.7508544921875, -3.55755615234375, -3.3642578125, -3.17095947265625, -2.9776611328125, -2.78436279296875, -2.591064453125, -2.39776611328125, -2.2044677734375, -2.01116943359375, -1.81787109375, -1.62457275390625, -1.4312744140625, -1.23797607421875, -1.044677734375, -0.85137939453125, -0.6580810546875, -0.46478271484375, -0.271484375, -0.07818603515625, 0.1151123046875, 0.30841064453125, 0.501708984375, 0.69500732421875, 0.8883056640625, 1.08160400390625, 1.27490234375, 1.46820068359375, 1.6614990234375, 1.85479736328125, 2.048095703125, 2.24139404296875, 2.4346923828125, 2.62799072265625, 2.8212890625, 3.01458740234375, 3.2078857421875, 3.40118408203125, 3.594482421875, 3.78778076171875, 3.9810791015625, 4.17437744140625, 4.36767578125, 4.56097412109375, 4.7542724609375, 4.94757080078125, 5.140869140625, 5.33416748046875, 5.5274658203125, 5.72076416015625, 5.9140625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 13.0, 20.0, 30.0, 44.0, 54.0, 78.0, 119.0, 148.0, 236.0, 322.0, 450.0, 723.0, 1107.0, 1779.0, 2852.0, 5037.0, 9218.0, 17859.0, 35896.0, 73993.0, 148553.0, 244380.0, 234147.0, 135675.0, 66409.0, 32446.0, 16211.0, 8519.0, 4676.0, 2654.0, 1663.0, 1051.0, 741.0, 429.0, 306.0, 195.0, 159.0, 95.0, 81.0, 64.0, 41.0, 24.0, 16.0, 15.0, 2.0, 3.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.9228515625, -1.866180419921875, -1.80950927734375, -1.752838134765625, -1.6961669921875, -1.639495849609375, -1.58282470703125, -1.526153564453125, -1.469482421875, -1.412811279296875, -1.35614013671875, -1.299468994140625, -1.2427978515625, -1.186126708984375, -1.12945556640625, -1.072784423828125, -1.01611328125, -0.959442138671875, -0.90277099609375, -0.846099853515625, -0.7894287109375, -0.732757568359375, -0.67608642578125, -0.619415283203125, -0.562744140625, -0.506072998046875, -0.44940185546875, -0.392730712890625, -0.3360595703125, -0.279388427734375, -0.22271728515625, -0.166046142578125, -0.109375, -0.052703857421875, 0.00396728515625, 0.060638427734375, 0.1173095703125, 0.173980712890625, 0.23065185546875, 0.287322998046875, 0.343994140625, 0.400665283203125, 0.45733642578125, 0.514007568359375, 0.5706787109375, 0.627349853515625, 0.68402099609375, 0.740692138671875, 0.79736328125, 0.854034423828125, 0.91070556640625, 0.967376708984375, 1.0240478515625, 1.080718994140625, 1.13739013671875, 1.194061279296875, 1.250732421875, 1.307403564453125, 1.36407470703125, 1.420745849609375, 1.4774169921875, 1.534088134765625, 1.59075927734375, 1.647430419921875, 1.7041015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 2.0, 7.0, 12.0, 15.0, 19.0, 22.0, 17.0, 34.0, 24.0, 35.0, 37.0, 41.0, 37.0, 45.0, 42.0, 44.0, 50.0, 1064.0, 52.0, 35.0, 48.0, 37.0, 36.0, 45.0, 35.0, 30.0, 28.0, 20.0, 26.0, 18.0, 9.0, 12.0, 5.0, 9.0, 7.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.0, -5.82562255859375, -5.6512451171875, -5.47686767578125, -5.302490234375, -5.12811279296875, -4.9537353515625, -4.77935791015625, -4.60498046875, -4.43060302734375, -4.2562255859375, -4.08184814453125, -3.907470703125, -3.73309326171875, -3.5587158203125, -3.38433837890625, -3.2099609375, -3.03558349609375, -2.8612060546875, -2.68682861328125, -2.512451171875, -2.33807373046875, -2.1636962890625, -1.98931884765625, -1.81494140625, -1.64056396484375, -1.4661865234375, -1.29180908203125, -1.117431640625, -0.94305419921875, -0.7686767578125, -0.59429931640625, -0.419921875, -0.24554443359375, -0.0711669921875, 0.10321044921875, 0.277587890625, 0.45196533203125, 0.6263427734375, 0.80072021484375, 0.97509765625, 1.14947509765625, 1.3238525390625, 1.49822998046875, 1.672607421875, 1.84698486328125, 2.0213623046875, 2.19573974609375, 2.3701171875, 2.54449462890625, 2.7188720703125, 2.89324951171875, 3.067626953125, 3.24200439453125, 3.4163818359375, 3.59075927734375, 3.76513671875, 3.93951416015625, 4.1138916015625, 4.28826904296875, 4.462646484375, 4.63702392578125, 4.8114013671875, 4.98577880859375, 5.16015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 13.0, 21.0, 36.0, 43.0, 87.0, 145.0, 238.0, 418.0, 757.0, 1474.0, 3301.0, 7638.0, 20434.0, 98327.0, 1889580.0, 49542.0, 14169.0, 5659.0, 2515.0, 1212.0, 631.0, 346.0, 200.0, 114.0, 66.0, 52.0, 27.0, 19.0, 11.0, 9.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.87109375, -4.720458984375, -4.56982421875, -4.419189453125, -4.2685546875, -4.117919921875, -3.96728515625, -3.816650390625, -3.666015625, -3.515380859375, -3.36474609375, -3.214111328125, -3.0634765625, -2.912841796875, -2.76220703125, -2.611572265625, -2.4609375, -2.310302734375, -2.15966796875, -2.009033203125, -1.8583984375, -1.707763671875, -1.55712890625, -1.406494140625, -1.255859375, -1.105224609375, -0.95458984375, -0.803955078125, -0.6533203125, -0.502685546875, -0.35205078125, -0.201416015625, -0.05078125, 0.099853515625, 0.25048828125, 0.401123046875, 0.5517578125, 0.702392578125, 0.85302734375, 1.003662109375, 1.154296875, 1.304931640625, 1.45556640625, 1.606201171875, 1.7568359375, 1.907470703125, 2.05810546875, 2.208740234375, 2.359375, 2.510009765625, 2.66064453125, 2.811279296875, 2.9619140625, 3.112548828125, 3.26318359375, 3.413818359375, 3.564453125, 3.715087890625, 3.86572265625, 4.016357421875, 4.1669921875, 4.317626953125, 4.46826171875, 4.618896484375, 4.76953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 11.0, 8.0, 9.0, 8.0, 13.0, 14.0, 12.0, 18.0, 21.0, 23.0, 25.0, 39.0, 33.0, 49.0, 66.0, 66.0, 67.0, 69.0, 69.0, 47.0, 52.0, 38.0, 36.0, 36.0, 39.0, 20.0, 24.0, 13.0, 14.0, 23.0, 7.0, 8.0, 4.0, 4.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1031494140625, -0.1000375747680664, -0.09692573547363281, -0.09381389617919922, -0.09070205688476562, -0.08759021759033203, -0.08447837829589844, -0.08136653900146484, -0.07825469970703125, -0.07514286041259766, -0.07203102111816406, -0.06891918182373047, -0.06580734252929688, -0.06269550323486328, -0.05958366394042969, -0.056471824645996094, -0.0533599853515625, -0.050248146057128906, -0.04713630676269531, -0.04402446746826172, -0.040912628173828125, -0.03780078887939453, -0.03468894958496094, -0.031577110290527344, -0.02846527099609375, -0.025353431701660156, -0.022241592407226562, -0.01912975311279297, -0.016017913818359375, -0.012906074523925781, -0.009794235229492188, -0.006682395935058594, -0.003570556640625, -0.00045871734619140625, 0.0026531219482421875, 0.005764961242675781, 0.008876800537109375, 0.011988639831542969, 0.015100479125976562, 0.018212318420410156, 0.02132415771484375, 0.024435997009277344, 0.027547836303710938, 0.03065967559814453, 0.033771514892578125, 0.03688335418701172, 0.03999519348144531, 0.043107032775878906, 0.0462188720703125, 0.049330711364746094, 0.05244255065917969, 0.05555438995361328, 0.058666229248046875, 0.06177806854248047, 0.06488990783691406, 0.06800174713134766, 0.07111358642578125, 0.07422542572021484, 0.07733726501464844, 0.08044910430908203, 0.08356094360351562, 0.08667278289794922, 0.08978462219238281, 0.0928964614868164, 0.09600830078125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 14.0, 13.0, 18.0, 32.0, 28.0, 49.0, 62.0, 101.0, 128.0, 207.0, 583.0, 1974.0, 16554.0, 484580.0, 523322.0, 17643.0, 1973.0, 566.0, 225.0, 119.0, 84.0, 54.0, 43.0, 34.0, 28.0, 17.0, 12.0, 10.0, 15.0, 9.0, 7.0, 7.0, 6.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4228515625, -1.3754425048828125, -1.328033447265625, -1.2806243896484375, -1.23321533203125, -1.1858062744140625, -1.138397216796875, -1.0909881591796875, -1.0435791015625, -0.9961700439453125, -0.948760986328125, -0.9013519287109375, -0.85394287109375, -0.8065338134765625, -0.759124755859375, -0.7117156982421875, -0.664306640625, -0.6168975830078125, -0.569488525390625, -0.5220794677734375, -0.47467041015625, -0.4272613525390625, -0.379852294921875, -0.3324432373046875, -0.2850341796875, -0.2376251220703125, -0.190216064453125, -0.1428070068359375, -0.09539794921875, -0.0479888916015625, -0.000579833984375, 0.0468292236328125, 0.09423828125, 0.1416473388671875, 0.189056396484375, 0.2364654541015625, 0.28387451171875, 0.3312835693359375, 0.378692626953125, 0.4261016845703125, 0.4735107421875, 0.5209197998046875, 0.568328857421875, 0.6157379150390625, 0.66314697265625, 0.7105560302734375, 0.757965087890625, 0.8053741455078125, 0.852783203125, 0.9001922607421875, 0.947601318359375, 0.9950103759765625, 1.04241943359375, 1.0898284912109375, 1.137237548828125, 1.1846466064453125, 1.2320556640625, 1.2794647216796875, 1.326873779296875, 1.3742828369140625, 1.42169189453125, 1.4691009521484375, 1.516510009765625, 1.5639190673828125, 1.611328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 15.0, 19.0, 48.0, 105.0, 169.0, 220.0, 175.0, 115.0, 70.0, 26.0, 15.0, 9.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46360036730766296, -0.4484054744243622, -0.4332105815410614, -0.4180156886577606, -0.40282079577445984, -0.38762590289115906, -0.37243103981018066, -0.3572361469268799, -0.3420412540435791, -0.3268463611602783, -0.31165146827697754, -0.29645657539367676, -0.281261682510376, -0.2660667896270752, -0.2508718967437744, -0.23567701876163483, -0.22048211097717285, -0.20528721809387207, -0.1900923252105713, -0.1748974323272705, -0.15970253944396973, -0.14450764656066895, -0.12931276857852936, -0.11411787569522858, -0.0989229828119278, -0.08372808992862701, -0.06853319704532623, -0.05333831161260605, -0.03814341872930527, -0.022948525846004486, -0.007753640413284302, 0.0074412524700164795, 0.022636115550994873, 0.037831008434295654, 0.05302589759230614, 0.06822078675031662, 0.0834156796336174, 0.09861057251691818, 0.11380545794963837, 0.12900035083293915, 0.14419524371623993, 0.1593901365995407, 0.1745850294828415, 0.18977990746498108, 0.20497480034828186, 0.22016969323158264, 0.23536458611488342, 0.2505594789981842, 0.265754371881485, 0.28094926476478577, 0.29614415764808655, 0.31133905053138733, 0.3265339434146881, 0.3417288362979889, 0.3569236993789673, 0.37211859226226807, 0.38731348514556885, 0.40250837802886963, 0.4177032709121704, 0.4328981637954712, 0.448093056678772, 0.46328794956207275, 0.47848284244537354, 0.4936777353286743, 0.5088726282119751]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 5.0, 10.0, 16.0, 11.0, 14.0, 20.0, 28.0, 27.0, 25.0, 32.0, 47.0, 47.0, 43.0, 43.0, 60.0, 51.0, 59.0, 43.0, 50.0, 42.0, 49.0, 44.0, 41.0, 30.0, 28.0, 25.0, 22.0, 10.0, 17.0, 18.0, 9.0, 11.0, 3.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1427396535873413, -0.13844697177410126, -0.1341542750597, -0.12986159324645996, -0.12556889653205872, -0.12127621471881866, -0.11698353290557861, -0.11269084364175797, -0.10839815437793732, -0.10410546511411667, -0.09981277585029602, -0.09552009403705597, -0.09122740477323532, -0.08693471550941467, -0.08264203369617462, -0.07834934443235397, -0.07405665516853333, -0.06976396590471268, -0.06547127664089203, -0.06117859482765198, -0.05688590556383133, -0.05259321630001068, -0.04830053076148033, -0.04400784522294998, -0.039715155959129333, -0.035422466695308685, -0.031129781156778336, -0.026837093755602837, -0.022544406354427338, -0.01825171895325184, -0.01395903155207634, -0.00966634415090084, -0.005373656749725342, -0.0010809693485498428, 0.003211718052625656, 0.007504405453801155, 0.011797092854976654, 0.016089780256152153, 0.020382467657327652, 0.02467515505850315, 0.02896784245967865, 0.0332605317234993, 0.03755321726202965, 0.04184590280056, 0.046138592064380646, 0.050431281328201294, 0.054723966866731644, 0.05901665240526199, 0.06330934166908264, 0.06760203093290329, 0.07189472019672394, 0.07618740200996399, 0.08048009127378464, 0.08477278053760529, 0.08906546235084534, 0.09335815161466599, 0.09765084087848663, 0.10194353014230728, 0.10623621940612793, 0.11052890121936798, 0.11482159048318863, 0.11911427974700928, 0.12340696156024933, 0.12769965827465057, 0.13199234008789062]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 4.0, 3.0, 9.0, 10.0, 9.0, 14.0, 16.0, 10.0, 9.0, 22.0, 22.0, 21.0, 26.0, 31.0, 32.0, 32.0, 39.0, 40.0, 46.0, 48.0, 39.0, 45.0, 45.0, 41.0, 42.0, 26.0, 31.0, 33.0, 28.0, 32.0, 31.0, 23.0, 27.0, 16.0, 8.0, 18.0, 16.0, 9.0, 10.0, 10.0, 4.0, 2.0, 8.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.46875, -6.275390625, -6.08203125, -5.888671875, -5.6953125, -5.501953125, -5.30859375, -5.115234375, -4.921875, -4.728515625, -4.53515625, -4.341796875, -4.1484375, -3.955078125, -3.76171875, -3.568359375, -3.375, -3.181640625, -2.98828125, -2.794921875, -2.6015625, -2.408203125, -2.21484375, -2.021484375, -1.828125, -1.634765625, -1.44140625, -1.248046875, -1.0546875, -0.861328125, -0.66796875, -0.474609375, -0.28125, -0.087890625, 0.10546875, 0.298828125, 0.4921875, 0.685546875, 0.87890625, 1.072265625, 1.265625, 1.458984375, 1.65234375, 1.845703125, 2.0390625, 2.232421875, 2.42578125, 2.619140625, 2.8125, 3.005859375, 3.19921875, 3.392578125, 3.5859375, 3.779296875, 3.97265625, 4.166015625, 4.359375, 4.552734375, 4.74609375, 4.939453125, 5.1328125, 5.326171875, 5.51953125, 5.712890625, 5.90625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 15.0, 17.0, 29.0, 37.0, 55.0, 97.0, 127.0, 170.0, 280.0, 370.0, 613.0, 854.0, 1458.0, 2359.0, 4129.0, 7662.0, 14898.0, 31789.0, 71110.0, 176390.0, 418100.0, 179820.0, 72658.0, 31685.0, 15362.0, 7697.0, 4292.0, 2422.0, 1376.0, 895.0, 549.0, 377.0, 245.0, 173.0, 131.0, 101.0, 55.0, 36.0, 21.0, 21.0, 15.0, 7.0, 8.0, 5.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.015625, -8.7294921875, -8.443359375, -8.1572265625, -7.87109375, -7.5849609375, -7.298828125, -7.0126953125, -6.7265625, -6.4404296875, -6.154296875, -5.8681640625, -5.58203125, -5.2958984375, -5.009765625, -4.7236328125, -4.4375, -4.1513671875, -3.865234375, -3.5791015625, -3.29296875, -3.0068359375, -2.720703125, -2.4345703125, -2.1484375, -1.8623046875, -1.576171875, -1.2900390625, -1.00390625, -0.7177734375, -0.431640625, -0.1455078125, 0.140625, 0.4267578125, 0.712890625, 0.9990234375, 1.28515625, 1.5712890625, 1.857421875, 2.1435546875, 2.4296875, 2.7158203125, 3.001953125, 3.2880859375, 3.57421875, 3.8603515625, 4.146484375, 4.4326171875, 4.71875, 5.0048828125, 5.291015625, 5.5771484375, 5.86328125, 6.1494140625, 6.435546875, 6.7216796875, 7.0078125, 7.2939453125, 7.580078125, 7.8662109375, 8.15234375, 8.4384765625, 8.724609375, 9.0107421875, 9.296875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 10.0, 4.0, 16.0, 22.0, 19.0, 25.0, 25.0, 27.0, 37.0, 30.0, 49.0, 50.0, 56.0, 72.0, 126.0, 204.0, 1446.0, 250.0, 119.0, 96.0, 47.0, 44.0, 31.0, 34.0, 31.0, 37.0, 32.0, 20.0, 20.0, 12.0, 7.0, 8.0, 7.0, 6.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.0, -25.177978515625, -24.35595703125, -23.533935546875, -22.7119140625, -21.889892578125, -21.06787109375, -20.245849609375, -19.423828125, -18.601806640625, -17.77978515625, -16.957763671875, -16.1357421875, -15.313720703125, -14.49169921875, -13.669677734375, -12.84765625, -12.025634765625, -11.20361328125, -10.381591796875, -9.5595703125, -8.737548828125, -7.91552734375, -7.093505859375, -6.271484375, -5.449462890625, -4.62744140625, -3.805419921875, -2.9833984375, -2.161376953125, -1.33935546875, -0.517333984375, 0.3046875, 1.126708984375, 1.94873046875, 2.770751953125, 3.5927734375, 4.414794921875, 5.23681640625, 6.058837890625, 6.880859375, 7.702880859375, 8.52490234375, 9.346923828125, 10.1689453125, 10.990966796875, 11.81298828125, 12.635009765625, 13.45703125, 14.279052734375, 15.10107421875, 15.923095703125, 16.7451171875, 17.567138671875, 18.38916015625, 19.211181640625, 20.033203125, 20.855224609375, 21.67724609375, 22.499267578125, 23.3212890625, 24.143310546875, 24.96533203125, 25.787353515625, 26.609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 5.0, 18.0, 30.0, 52.0, 79.0, 169.0, 379.0, 971.0, 3616.0, 499818.0, 2632770.0, 5652.0, 1248.0, 446.0, 199.0, 103.0, 66.0, 23.0, 20.0, 11.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.0625, -91.7958984375, -88.529296875, -85.2626953125, -81.99609375, -78.7294921875, -75.462890625, -72.1962890625, -68.9296875, -65.6630859375, -62.396484375, -59.1298828125, -55.86328125, -52.5966796875, -49.330078125, -46.0634765625, -42.796875, -39.5302734375, -36.263671875, -32.9970703125, -29.73046875, -26.4638671875, -23.197265625, -19.9306640625, -16.6640625, -13.3974609375, -10.130859375, -6.8642578125, -3.59765625, -0.3310546875, 2.935546875, 6.2021484375, 9.46875, 12.7353515625, 16.001953125, 19.2685546875, 22.53515625, 25.8017578125, 29.068359375, 32.3349609375, 35.6015625, 38.8681640625, 42.134765625, 45.4013671875, 48.66796875, 51.9345703125, 55.201171875, 58.4677734375, 61.734375, 65.0009765625, 68.267578125, 71.5341796875, 74.80078125, 78.0673828125, 81.333984375, 84.6005859375, 87.8671875, 91.1337890625, 94.400390625, 97.6669921875, 100.93359375, 104.2001953125, 107.466796875, 110.7333984375, 114.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 617.0, 393.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.677799224853516, -38.732452392578125, -18.78710174560547, 1.1582450866699219, 21.103595733642578, 41.048946380615234, 60.99428939819336, 80.93965148925781, 100.88499450683594, 120.8303451538086, 140.77569580078125, 160.72103881835938, 180.6663818359375, 200.6117401123047, 220.5570831298828, 240.50244140625, 260.4477844238281, 280.39312744140625, 300.3384704589844, 320.2838134765625, 340.22918701171875, 360.1745300292969, 380.119873046875, 400.06524658203125, 420.01055908203125, 439.9559020996094, 459.9012451171875, 479.84661865234375, 499.7919616699219, 519.7373046875, 539.6826171875, 559.6279907226562, 579.5733032226562, 599.5186767578125, 619.4639892578125, 639.4093627929688, 659.3546752929688, 679.300048828125, 699.245361328125, 719.1907348632812, 739.1361083984375, 759.0814819335938, 779.0267944335938, 798.97216796875, 818.91748046875, 838.8628540039062, 858.8082275390625, 878.7535400390625, 898.6988525390625, 918.6442260742188, 938.5895385742188, 958.534912109375, 978.480224609375, 998.4255981445312, 1018.3709716796875, 1038.3162841796875, 1058.26171875, 1078.20703125, 1098.1524658203125, 1118.0977783203125, 1138.0430908203125, 1157.988525390625, 1177.933837890625, 1197.879150390625, 1217.824462890625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 8.0, 5.0, 8.0, 18.0, 12.0, 16.0, 20.0, 30.0, 23.0, 20.0, 20.0, 26.0, 34.0, 25.0, 29.0, 37.0, 28.0, 53.0, 46.0, 36.0, 43.0, 31.0, 38.0, 31.0, 41.0, 24.0, 27.0, 37.0, 28.0, 33.0, 25.0, 24.0, 26.0, 16.0, 11.0, 14.0, 12.0, 10.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0], "bins": [-73.3570785522461, -71.42996215820312, -69.50284576416016, -67.57572937011719, -65.64861297607422, -63.72149658203125, -61.79438018798828, -59.86726379394531, -57.940147399902344, -56.013031005859375, -54.085914611816406, -52.15879821777344, -50.23168182373047, -48.3045654296875, -46.37744903564453, -44.45033264160156, -42.523216247558594, -40.596099853515625, -38.668983459472656, -36.74186706542969, -34.81475067138672, -32.88763427734375, -30.96051788330078, -29.033401489257812, -27.106285095214844, -25.179168701171875, -23.252052307128906, -21.324935913085938, -19.39781951904297, -17.470703125, -15.543586730957031, -13.616470336914062, -11.689350128173828, -9.76223373413086, -7.835117340087891, -5.908000946044922, -3.980884552001953, -2.0537681579589844, -0.12665176391601562, 1.8004646301269531, 3.727581024169922, 5.654697418212891, 7.581813812255859, 9.508930206298828, 11.436046600341797, 13.363162994384766, 15.290279388427734, 17.217395782470703, 19.144512176513672, 21.07162857055664, 22.99874496459961, 24.925861358642578, 26.852977752685547, 28.780094146728516, 30.707210540771484, 32.63432693481445, 34.56144332885742, 36.48855972290039, 38.41567611694336, 40.34279251098633, 42.2699089050293, 44.197025299072266, 46.124141693115234, 48.0512580871582, 49.97837448120117]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 7.0, 9.0, 13.0, 5.0, 12.0, 12.0, 18.0, 17.0, 19.0, 22.0, 24.0, 27.0, 29.0, 41.0, 44.0, 32.0, 38.0, 45.0, 48.0, 41.0, 42.0, 35.0, 41.0, 40.0, 32.0, 30.0, 41.0, 31.0, 23.0, 24.0, 16.0, 16.0, 14.0, 22.0, 14.0, 11.0, 15.0, 5.0, 2.0, 9.0, 7.0, 6.0, 7.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.0234375, -6.81634521484375, -6.6092529296875, -6.40216064453125, -6.195068359375, -5.98797607421875, -5.7808837890625, -5.57379150390625, -5.36669921875, -5.15960693359375, -4.9525146484375, -4.74542236328125, -4.538330078125, -4.33123779296875, -4.1241455078125, -3.91705322265625, -3.7099609375, -3.50286865234375, -3.2957763671875, -3.08868408203125, -2.881591796875, -2.67449951171875, -2.4674072265625, -2.26031494140625, -2.05322265625, -1.84613037109375, -1.6390380859375, -1.43194580078125, -1.224853515625, -1.01776123046875, -0.8106689453125, -0.60357666015625, -0.396484375, -0.18939208984375, 0.0177001953125, 0.22479248046875, 0.431884765625, 0.63897705078125, 0.8460693359375, 1.05316162109375, 1.26025390625, 1.46734619140625, 1.6744384765625, 1.88153076171875, 2.088623046875, 2.29571533203125, 2.5028076171875, 2.70989990234375, 2.9169921875, 3.12408447265625, 3.3311767578125, 3.53826904296875, 3.745361328125, 3.95245361328125, 4.1595458984375, 4.36663818359375, 4.57373046875, 4.78082275390625, 4.9879150390625, 5.19500732421875, 5.402099609375, 5.60919189453125, 5.8162841796875, 6.02337646484375, 6.23046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 18.0, 11.0, 23.0, 27.0, 37.0, 67.0, 73.0, 83.0, 139.0, 216.0, 319.0, 464.0, 799.0, 1337.0, 2217.0, 3897.0, 7806.0, 17802.0, 54716.0, 258683.0, 1478199.0, 1893304.0, 360925.0, 71681.0, 21659.0, 8841.0, 4387.0, 2434.0, 1442.0, 899.0, 543.0, 346.0, 270.0, 157.0, 110.0, 86.0, 66.0, 59.0, 31.0, 29.0, 21.0, 14.0, 11.0, 4.0, 7.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-14.296875, -13.8514404296875, -13.406005859375, -12.9605712890625, -12.51513671875, -12.0697021484375, -11.624267578125, -11.1788330078125, -10.7333984375, -10.2879638671875, -9.842529296875, -9.3970947265625, -8.95166015625, -8.5062255859375, -8.060791015625, -7.6153564453125, -7.169921875, -6.7244873046875, -6.279052734375, -5.8336181640625, -5.38818359375, -4.9427490234375, -4.497314453125, -4.0518798828125, -3.6064453125, -3.1610107421875, -2.715576171875, -2.2701416015625, -1.82470703125, -1.3792724609375, -0.933837890625, -0.4884033203125, -0.04296875, 0.4024658203125, 0.847900390625, 1.2933349609375, 1.73876953125, 2.1842041015625, 2.629638671875, 3.0750732421875, 3.5205078125, 3.9659423828125, 4.411376953125, 4.8568115234375, 5.30224609375, 5.7476806640625, 6.193115234375, 6.6385498046875, 7.083984375, 7.5294189453125, 7.974853515625, 8.4202880859375, 8.86572265625, 9.3111572265625, 9.756591796875, 10.2020263671875, 10.6474609375, 11.0928955078125, 11.538330078125, 11.9837646484375, 12.42919921875, 12.8746337890625, 13.320068359375, 13.7655029296875, 14.2109375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 11.0, 17.0, 23.0, 13.0, 30.0, 47.0, 46.0, 88.0, 116.0, 156.0, 301.0, 455.0, 612.0, 602.0, 457.0, 325.0, 227.0, 147.0, 87.0, 63.0, 49.0, 42.0, 41.0, 24.0, 17.0, 11.0, 12.0, 7.0, 7.0, 3.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.171875, -14.649658203125, -14.12744140625, -13.605224609375, -13.0830078125, -12.560791015625, -12.03857421875, -11.516357421875, -10.994140625, -10.471923828125, -9.94970703125, -9.427490234375, -8.9052734375, -8.383056640625, -7.86083984375, -7.338623046875, -6.81640625, -6.294189453125, -5.77197265625, -5.249755859375, -4.7275390625, -4.205322265625, -3.68310546875, -3.160888671875, -2.638671875, -2.116455078125, -1.59423828125, -1.072021484375, -0.5498046875, -0.027587890625, 0.49462890625, 1.016845703125, 1.5390625, 2.061279296875, 2.58349609375, 3.105712890625, 3.6279296875, 4.150146484375, 4.67236328125, 5.194580078125, 5.716796875, 6.239013671875, 6.76123046875, 7.283447265625, 7.8056640625, 8.327880859375, 8.85009765625, 9.372314453125, 9.89453125, 10.416748046875, 10.93896484375, 11.461181640625, 11.9833984375, 12.505615234375, 13.02783203125, 13.550048828125, 14.072265625, 14.594482421875, 15.11669921875, 15.638916015625, 16.1611328125, 16.683349609375, 17.20556640625, 17.727783203125, 18.25]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 10.0, 10.0, 13.0, 17.0, 22.0, 36.0, 42.0, 53.0, 65.0, 132.0, 259.0, 636.0, 1705.0, 5608.0, 29351.0, 509226.0, 3506785.0, 120888.0, 14162.0, 3342.0, 1012.0, 381.0, 191.0, 100.0, 60.0, 38.0, 20.0, 26.0, 16.0, 12.0, 15.0, 9.0, 3.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-54.1875, -52.56005859375, -50.9326171875, -49.30517578125, -47.677734375, -46.05029296875, -44.4228515625, -42.79541015625, -41.16796875, -39.54052734375, -37.9130859375, -36.28564453125, -34.658203125, -33.03076171875, -31.4033203125, -29.77587890625, -28.1484375, -26.52099609375, -24.8935546875, -23.26611328125, -21.638671875, -20.01123046875, -18.3837890625, -16.75634765625, -15.12890625, -13.50146484375, -11.8740234375, -10.24658203125, -8.619140625, -6.99169921875, -5.3642578125, -3.73681640625, -2.109375, -0.48193359375, 1.1455078125, 2.77294921875, 4.400390625, 6.02783203125, 7.6552734375, 9.28271484375, 10.91015625, 12.53759765625, 14.1650390625, 15.79248046875, 17.419921875, 19.04736328125, 20.6748046875, 22.30224609375, 23.9296875, 25.55712890625, 27.1845703125, 28.81201171875, 30.439453125, 32.06689453125, 33.6943359375, 35.32177734375, 36.94921875, 38.57666015625, 40.2041015625, 41.83154296875, 43.458984375, 45.08642578125, 46.7138671875, 48.34130859375, 49.96875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 19.0, 62.0, 149.0, 324.0, 285.0, 120.0, 31.0, 15.0, 6.0, 2.0, 2.0], "bins": [-447.4607238769531, -439.5749206542969, -431.6891174316406, -423.8033142089844, -415.9175109863281, -408.0317077636719, -400.14593505859375, -392.2601318359375, -384.37432861328125, -376.488525390625, -368.60272216796875, -360.7169189453125, -352.83111572265625, -344.9453125, -337.05950927734375, -329.1737060546875, -321.28790283203125, -313.402099609375, -305.51629638671875, -297.6304931640625, -289.74468994140625, -281.85888671875, -273.97308349609375, -266.0872802734375, -258.2015075683594, -250.31570434570312, -242.42990112304688, -234.54409790039062, -226.65830993652344, -218.7725067138672, -210.88670349121094, -203.0009002685547, -195.11509704589844, -187.2292938232422, -179.34349060058594, -171.45770263671875, -163.5718994140625, -155.68609619140625, -147.80029296875, -139.91448974609375, -132.0286865234375, -124.14288330078125, -116.25708770751953, -108.37128448486328, -100.48548126220703, -92.59968566894531, -84.71388244628906, -76.82807922363281, -68.94229125976562, -61.05649185180664, -53.17068862915039, -45.284889221191406, -37.399085998535156, -29.513286590576172, -21.627487182617188, -13.741683959960938, -5.8558807373046875, 2.0299201011657715, 9.91572093963623, 17.80152130126953, 25.68732261657715, 33.573123931884766, 41.45892333984375, 49.3447265625, 57.230525970458984]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 14.0, 6.0, 3.0, 13.0, 8.0, 12.0, 20.0, 20.0, 19.0, 47.0, 26.0, 35.0, 26.0, 44.0, 46.0, 43.0, 41.0, 51.0, 39.0, 45.0, 35.0, 38.0, 37.0, 40.0, 27.0, 35.0, 32.0, 29.0, 27.0, 23.0, 27.0, 18.0, 20.0, 12.0, 7.0, 8.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.81034469604492, -55.06266784667969, -53.31499481201172, -51.567317962646484, -49.81964111328125, -48.07196807861328, -46.32429122924805, -44.57661437988281, -42.828941345214844, -41.08126449584961, -39.33359146118164, -37.585914611816406, -35.83824157714844, -34.0905647277832, -32.34288787841797, -30.595212936401367, -28.847537994384766, -27.099863052368164, -25.352188110351562, -23.604511260986328, -21.856836318969727, -20.109161376953125, -18.36148452758789, -16.61380958557129, -14.866134643554688, -13.118459701538086, -11.370783805847168, -9.62310791015625, -7.875432968139648, -6.127758026123047, -4.380082130432129, -2.632406234741211, -0.884735107421875, 0.8629403114318848, 2.6106157302856445, 4.358291149139404, 6.105966567993164, 7.853641510009766, 9.601317405700684, 11.348993301391602, 13.096668243408203, 14.844343185424805, 16.592018127441406, 18.33969497680664, 20.087369918823242, 21.835044860839844, 23.582721710205078, 25.33039665222168, 27.07807159423828, 28.825746536254883, 30.573421478271484, 32.32109832763672, 34.06877136230469, 35.81644821166992, 37.564125061035156, 39.311798095703125, 41.05947494506836, 42.807151794433594, 44.55482482910156, 46.3025016784668, 48.05017852783203, 49.7978515625, 51.545528411865234, 53.29320526123047, 55.04087829589844]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 10.0, 10.0, 15.0, 14.0, 17.0, 27.0, 27.0, 21.0, 36.0, 33.0, 32.0, 33.0, 37.0, 34.0, 42.0, 49.0, 37.0, 35.0, 45.0, 45.0, 47.0, 35.0, 14.0, 39.0, 32.0, 19.0, 27.0, 29.0, 27.0, 19.0, 15.0, 13.0, 15.0, 12.0, 6.0, 8.0, 4.0, 6.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.6953125, -5.49853515625, -5.3017578125, -5.10498046875, -4.908203125, -4.71142578125, -4.5146484375, -4.31787109375, -4.12109375, -3.92431640625, -3.7275390625, -3.53076171875, -3.333984375, -3.13720703125, -2.9404296875, -2.74365234375, -2.546875, -2.35009765625, -2.1533203125, -1.95654296875, -1.759765625, -1.56298828125, -1.3662109375, -1.16943359375, -0.97265625, -0.77587890625, -0.5791015625, -0.38232421875, -0.185546875, 0.01123046875, 0.2080078125, 0.40478515625, 0.6015625, 0.79833984375, 0.9951171875, 1.19189453125, 1.388671875, 1.58544921875, 1.7822265625, 1.97900390625, 2.17578125, 2.37255859375, 2.5693359375, 2.76611328125, 2.962890625, 3.15966796875, 3.3564453125, 3.55322265625, 3.75, 3.94677734375, 4.1435546875, 4.34033203125, 4.537109375, 4.73388671875, 4.9306640625, 5.12744140625, 5.32421875, 5.52099609375, 5.7177734375, 5.91455078125, 6.111328125, 6.30810546875, 6.5048828125, 6.70166015625, 6.8984375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 3.0, 8.0, 7.0, 13.0, 11.0, 24.0, 35.0, 49.0, 84.0, 107.0, 140.0, 260.0, 346.0, 486.0, 781.0, 1164.0, 1730.0, 2501.0, 3881.0, 5876.0, 9193.0, 13932.0, 21167.0, 31770.0, 46979.0, 68541.0, 93839.0, 121038.0, 137623.0, 131218.0, 107041.0, 80028.0, 55960.0, 38077.0, 25807.0, 16717.0, 10941.0, 7156.0, 4727.0, 3091.0, 1948.0, 1376.0, 925.0, 622.0, 427.0, 295.0, 181.0, 136.0, 80.0, 80.0, 50.0, 28.0, 27.0, 13.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.79931640625, -0.7741241455078125, -0.748931884765625, -0.7237396240234375, -0.69854736328125, -0.6733551025390625, -0.648162841796875, -0.6229705810546875, -0.5977783203125, -0.5725860595703125, -0.547393798828125, -0.5222015380859375, -0.49700927734375, -0.4718170166015625, -0.446624755859375, -0.4214324951171875, -0.396240234375, -0.3710479736328125, -0.345855712890625, -0.3206634521484375, -0.29547119140625, -0.2702789306640625, -0.245086669921875, -0.2198944091796875, -0.1947021484375, -0.1695098876953125, -0.144317626953125, -0.1191253662109375, -0.09393310546875, -0.0687408447265625, -0.043548583984375, -0.0183563232421875, 0.0068359375, 0.0320281982421875, 0.057220458984375, 0.0824127197265625, 0.10760498046875, 0.1327972412109375, 0.157989501953125, 0.1831817626953125, 0.2083740234375, 0.2335662841796875, 0.258758544921875, 0.2839508056640625, 0.30914306640625, 0.3343353271484375, 0.359527587890625, 0.3847198486328125, 0.409912109375, 0.4351043701171875, 0.460296630859375, 0.4854888916015625, 0.51068115234375, 0.5358734130859375, 0.561065673828125, 0.5862579345703125, 0.6114501953125, 0.6366424560546875, 0.661834716796875, 0.6870269775390625, 0.71221923828125, 0.7374114990234375, 0.762603759765625, 0.7877960205078125, 0.81298828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 6.0, 7.0, 10.0, 13.0, 13.0, 13.0, 13.0, 24.0, 30.0, 29.0, 28.0, 29.0, 32.0, 31.0, 40.0, 50.0, 39.0, 31.0, 1068.0, 40.0, 36.0, 49.0, 42.0, 47.0, 41.0, 42.0, 35.0, 28.0, 26.0, 23.0, 20.0, 14.0, 9.0, 13.0, 10.0, 10.0, 3.0, 4.0, 7.0, 0.0, 2.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.60137939453125, -4.4449462890625, -4.28851318359375, -4.132080078125, -3.97564697265625, -3.8192138671875, -3.66278076171875, -3.50634765625, -3.34991455078125, -3.1934814453125, -3.03704833984375, -2.880615234375, -2.72418212890625, -2.5677490234375, -2.41131591796875, -2.2548828125, -2.09844970703125, -1.9420166015625, -1.78558349609375, -1.629150390625, -1.47271728515625, -1.3162841796875, -1.15985107421875, -1.00341796875, -0.84698486328125, -0.6905517578125, -0.53411865234375, -0.377685546875, -0.22125244140625, -0.0648193359375, 0.09161376953125, 0.248046875, 0.40447998046875, 0.5609130859375, 0.71734619140625, 0.873779296875, 1.03021240234375, 1.1866455078125, 1.34307861328125, 1.49951171875, 1.65594482421875, 1.8123779296875, 1.96881103515625, 2.125244140625, 2.28167724609375, 2.4381103515625, 2.59454345703125, 2.7509765625, 2.90740966796875, 3.0638427734375, 3.22027587890625, 3.376708984375, 3.53314208984375, 3.6895751953125, 3.84600830078125, 4.00244140625, 4.15887451171875, 4.3153076171875, 4.47174072265625, 4.628173828125, 4.78460693359375, 4.9410400390625, 5.09747314453125, 5.25390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 13.0, 14.0, 12.0, 26.0, 32.0, 63.0, 113.0, 217.0, 315.0, 576.0, 1033.0, 1962.0, 3823.0, 7904.0, 17597.0, 47568.0, 1735013.0, 222062.0, 32415.0, 13559.0, 6168.0, 3119.0, 1567.0, 803.0, 453.0, 259.0, 149.0, 89.0, 63.0, 35.0, 23.0, 16.0, 13.0, 6.0, 3.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0], "bins": [-3.4609375, -3.371795654296875, -3.28265380859375, -3.193511962890625, -3.1043701171875, -3.015228271484375, -2.92608642578125, -2.836944580078125, -2.747802734375, -2.658660888671875, -2.56951904296875, -2.480377197265625, -2.3912353515625, -2.302093505859375, -2.21295166015625, -2.123809814453125, -2.03466796875, -1.945526123046875, -1.85638427734375, -1.767242431640625, -1.6781005859375, -1.588958740234375, -1.49981689453125, -1.410675048828125, -1.321533203125, -1.232391357421875, -1.14324951171875, -1.054107666015625, -0.9649658203125, -0.875823974609375, -0.78668212890625, -0.697540283203125, -0.6083984375, -0.519256591796875, -0.43011474609375, -0.340972900390625, -0.2518310546875, -0.162689208984375, -0.07354736328125, 0.015594482421875, 0.104736328125, 0.193878173828125, 0.28302001953125, 0.372161865234375, 0.4613037109375, 0.550445556640625, 0.63958740234375, 0.728729248046875, 0.81787109375, 0.907012939453125, 0.99615478515625, 1.085296630859375, 1.1744384765625, 1.263580322265625, 1.35272216796875, 1.441864013671875, 1.531005859375, 1.620147705078125, 1.70928955078125, 1.798431396484375, 1.8875732421875, 1.976715087890625, 2.06585693359375, 2.154998779296875, 2.244140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 4.0, 4.0, 7.0, 17.0, 16.0, 25.0, 21.0, 29.0, 28.0, 40.0, 46.0, 45.0, 65.0, 67.0, 64.0, 85.0, 68.0, 63.0, 47.0, 47.0, 42.0, 32.0, 26.0, 26.0, 20.0, 13.0, 13.0, 8.0, 12.0, 4.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09478759765625, -0.09154605865478516, -0.08830451965332031, -0.08506298065185547, -0.08182144165039062, -0.07857990264892578, -0.07533836364746094, -0.0720968246459961, -0.06885528564453125, -0.0656137466430664, -0.06237220764160156, -0.05913066864013672, -0.055889129638671875, -0.05264759063720703, -0.04940605163574219, -0.046164512634277344, -0.0429229736328125, -0.039681434631347656, -0.03643989562988281, -0.03319835662841797, -0.029956817626953125, -0.02671527862548828, -0.023473739624023438, -0.020232200622558594, -0.01699066162109375, -0.013749122619628906, -0.010507583618164062, -0.007266044616699219, -0.004024505615234375, -0.0007829666137695312, 0.0024585723876953125, 0.005700111389160156, 0.008941650390625, 0.012183189392089844, 0.015424728393554688, 0.01866626739501953, 0.021907806396484375, 0.02514934539794922, 0.028390884399414062, 0.031632423400878906, 0.03487396240234375, 0.038115501403808594, 0.04135704040527344, 0.04459857940673828, 0.047840118408203125, 0.05108165740966797, 0.05432319641113281, 0.057564735412597656, 0.0608062744140625, 0.06404781341552734, 0.06728935241699219, 0.07053089141845703, 0.07377243041992188, 0.07701396942138672, 0.08025550842285156, 0.0834970474243164, 0.08673858642578125, 0.0899801254272461, 0.09322166442871094, 0.09646320343017578, 0.09970474243164062, 0.10294628143310547, 0.10618782043457031, 0.10942935943603516, 0.1126708984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 8.0, 17.0, 16.0, 28.0, 39.0, 59.0, 41.0, 95.0, 141.0, 313.0, 921.0, 7715.0, 385351.0, 640355.0, 11418.0, 1145.0, 303.0, 187.0, 100.0, 64.0, 58.0, 42.0, 25.0, 19.0, 16.0, 23.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.66015625, -1.6083831787109375, -1.556610107421875, -1.5048370361328125, -1.45306396484375, -1.4012908935546875, -1.349517822265625, -1.2977447509765625, -1.2459716796875, -1.1941986083984375, -1.142425537109375, -1.0906524658203125, -1.03887939453125, -0.9871063232421875, -0.935333251953125, -0.8835601806640625, -0.831787109375, -0.7800140380859375, -0.728240966796875, -0.6764678955078125, -0.62469482421875, -0.5729217529296875, -0.521148681640625, -0.4693756103515625, -0.4176025390625, -0.3658294677734375, -0.314056396484375, -0.2622833251953125, -0.21051025390625, -0.1587371826171875, -0.106964111328125, -0.0551910400390625, -0.00341796875, 0.0483551025390625, 0.100128173828125, 0.1519012451171875, 0.20367431640625, 0.2554473876953125, 0.307220458984375, 0.3589935302734375, 0.4107666015625, 0.4625396728515625, 0.514312744140625, 0.5660858154296875, 0.61785888671875, 0.6696319580078125, 0.721405029296875, 0.7731781005859375, 0.824951171875, 0.8767242431640625, 0.928497314453125, 0.9802703857421875, 1.03204345703125, 1.0838165283203125, 1.135589599609375, 1.1873626708984375, 1.2391357421875, 1.2909088134765625, 1.342681884765625, 1.3944549560546875, 1.44622802734375, 1.4980010986328125, 1.549774169921875, 1.6015472412109375, 1.6533203125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 36.0, 86.0, 212.0, 370.0, 184.0, 71.0, 21.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7023066282272339, -0.6812922954559326, -0.6602779626846313, -0.6392636299133301, -0.6182492971420288, -0.5972350239753723, -0.576220691204071, -0.5552063584327698, -0.5341920256614685, -0.5131776928901672, -0.49216336011886597, -0.4711490571498871, -0.4501347243785858, -0.42912039160728455, -0.40810608863830566, -0.3870917558670044, -0.3660774230957031, -0.34506309032440186, -0.3240487575531006, -0.3030344545841217, -0.28202012181282043, -0.26100578904151917, -0.2399914711713791, -0.218977153301239, -0.19796282052993774, -0.17694848775863647, -0.1559341698884964, -0.13491985201835632, -0.11390551924705505, -0.09289119392633438, -0.07187686860561371, -0.05086255073547363, -0.02984827756881714, -0.008833952248096466, 0.012180373072624207, 0.03319469839334488, 0.05420902371406555, 0.07522334903478622, 0.0962376743555069, 0.11725199222564697, 0.13826632499694824, 0.1592806577682495, 0.1802949756383896, 0.20130929350852966, 0.22232362627983093, 0.2433379590511322, 0.2643522620201111, 0.28536659479141235, 0.3063809275627136, 0.3273952603340149, 0.34840959310531616, 0.36942389607429504, 0.3904382288455963, 0.4114525616168976, 0.43246686458587646, 0.45348119735717773, 0.474495530128479, 0.4955098628997803, 0.5165241956710815, 0.5375385284423828, 0.5585528612136841, 0.5795671343803406, 0.6005814671516418, 0.6215957999229431, 0.6426101326942444]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 6.0, 3.0, 8.0, 12.0, 10.0, 24.0, 20.0, 25.0, 33.0, 33.0, 33.0, 41.0, 56.0, 50.0, 61.0, 56.0, 60.0, 55.0, 52.0, 49.0, 60.0, 42.0, 37.0, 25.0, 27.0, 31.0, 22.0, 20.0, 17.0, 15.0, 9.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21556872129440308, -0.2084161937236786, -0.2012636810541153, -0.1941111534833908, -0.18695864081382751, -0.17980611324310303, -0.17265358567237854, -0.16550107300281525, -0.15834856033325195, -0.15119603276252747, -0.14404352009296417, -0.13689099252223969, -0.1297384798526764, -0.1225859522819519, -0.11543343216180801, -0.10828091204166412, -0.10112838447093964, -0.09397586435079575, -0.08682334423065186, -0.07967081665992737, -0.07251830399036407, -0.06536577641963959, -0.0582132562994957, -0.05106073617935181, -0.043908216059207916, -0.036755695939064026, -0.029603173956274986, -0.022450651973485947, -0.015298131853342056, -0.008145611733198166, -0.000993087887763977, 0.006159432232379913, 0.013311952352523804, 0.020464472472667694, 0.027616994455456734, 0.03476951643824577, 0.041922036558389664, 0.049074556678533554, 0.05622708052396774, 0.06337960064411163, 0.07053212076425552, 0.07768464088439941, 0.0848371610045433, 0.0919896811246872, 0.09914220869541168, 0.10629472136497498, 0.11344724893569946, 0.12059976905584335, 0.12775228917598724, 0.13490481674671173, 0.14205732941627502, 0.1492098569869995, 0.1563623696565628, 0.1635148972272873, 0.17066740989685059, 0.17781993746757507, 0.18497246503829956, 0.19212499260902405, 0.19927750527858734, 0.20643003284931183, 0.21358254551887512, 0.2207350730895996, 0.2278876006603241, 0.2350401133298874, 0.24219262599945068]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 10.0, 10.0, 15.0, 13.0, 18.0, 27.0, 26.0, 21.0, 35.0, 34.0, 32.0, 32.0, 40.0, 33.0, 40.0, 50.0, 34.0, 39.0, 44.0, 41.0, 48.0, 38.0, 15.0, 37.0, 34.0, 19.0, 26.0, 30.0, 26.0, 18.0, 17.0, 13.0, 15.0, 12.0, 6.0, 7.0, 5.0, 7.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.50634765625, -5.3095703125, -5.11279296875, -4.916015625, -4.71923828125, -4.5224609375, -4.32568359375, -4.12890625, -3.93212890625, -3.7353515625, -3.53857421875, -3.341796875, -3.14501953125, -2.9482421875, -2.75146484375, -2.5546875, -2.35791015625, -2.1611328125, -1.96435546875, -1.767578125, -1.57080078125, -1.3740234375, -1.17724609375, -0.98046875, -0.78369140625, -0.5869140625, -0.39013671875, -0.193359375, 0.00341796875, 0.2001953125, 0.39697265625, 0.59375, 0.79052734375, 0.9873046875, 1.18408203125, 1.380859375, 1.57763671875, 1.7744140625, 1.97119140625, 2.16796875, 2.36474609375, 2.5615234375, 2.75830078125, 2.955078125, 3.15185546875, 3.3486328125, 3.54541015625, 3.7421875, 3.93896484375, 4.1357421875, 4.33251953125, 4.529296875, 4.72607421875, 4.9228515625, 5.11962890625, 5.31640625, 5.51318359375, 5.7099609375, 5.90673828125, 6.103515625, 6.30029296875, 6.4970703125, 6.69384765625, 6.890625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 8.0, 11.0, 24.0, 26.0, 26.0, 46.0, 57.0, 67.0, 117.0, 171.0, 251.0, 326.0, 498.0, 777.0, 1333.0, 2177.0, 3939.0, 7264.0, 14332.0, 28481.0, 62317.0, 148671.0, 387726.0, 222829.0, 87608.0, 38729.0, 18805.0, 9733.0, 4921.0, 2738.0, 1602.0, 951.0, 656.0, 431.0, 267.0, 194.0, 118.0, 88.0, 62.0, 39.0, 39.0, 25.0, 13.0, 16.0, 12.0, 12.0, 4.0, 4.0, 3.0, 5.0, 1.0, 3.0], "bins": [-8.5234375, -8.27783203125, -8.0322265625, -7.78662109375, -7.541015625, -7.29541015625, -7.0498046875, -6.80419921875, -6.55859375, -6.31298828125, -6.0673828125, -5.82177734375, -5.576171875, -5.33056640625, -5.0849609375, -4.83935546875, -4.59375, -4.34814453125, -4.1025390625, -3.85693359375, -3.611328125, -3.36572265625, -3.1201171875, -2.87451171875, -2.62890625, -2.38330078125, -2.1376953125, -1.89208984375, -1.646484375, -1.40087890625, -1.1552734375, -0.90966796875, -0.6640625, -0.41845703125, -0.1728515625, 0.07275390625, 0.318359375, 0.56396484375, 0.8095703125, 1.05517578125, 1.30078125, 1.54638671875, 1.7919921875, 2.03759765625, 2.283203125, 2.52880859375, 2.7744140625, 3.02001953125, 3.265625, 3.51123046875, 3.7568359375, 4.00244140625, 4.248046875, 4.49365234375, 4.7392578125, 4.98486328125, 5.23046875, 5.47607421875, 5.7216796875, 5.96728515625, 6.212890625, 6.45849609375, 6.7041015625, 6.94970703125, 7.1953125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 5.0, 9.0, 21.0, 18.0, 11.0, 23.0, 18.0, 22.0, 18.0, 23.0, 33.0, 33.0, 44.0, 48.0, 63.0, 115.0, 226.0, 1462.0, 265.0, 122.0, 67.0, 48.0, 37.0, 47.0, 36.0, 40.0, 29.0, 23.0, 18.0, 10.0, 26.0, 10.0, 13.0, 12.0, 14.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.390625, -25.648681640625, -24.90673828125, -24.164794921875, -23.4228515625, -22.680908203125, -21.93896484375, -21.197021484375, -20.455078125, -19.713134765625, -18.97119140625, -18.229248046875, -17.4873046875, -16.745361328125, -16.00341796875, -15.261474609375, -14.51953125, -13.777587890625, -13.03564453125, -12.293701171875, -11.5517578125, -10.809814453125, -10.06787109375, -9.325927734375, -8.583984375, -7.842041015625, -7.10009765625, -6.358154296875, -5.6162109375, -4.874267578125, -4.13232421875, -3.390380859375, -2.6484375, -1.906494140625, -1.16455078125, -0.422607421875, 0.3193359375, 1.061279296875, 1.80322265625, 2.545166015625, 3.287109375, 4.029052734375, 4.77099609375, 5.512939453125, 6.2548828125, 6.996826171875, 7.73876953125, 8.480712890625, 9.22265625, 9.964599609375, 10.70654296875, 11.448486328125, 12.1904296875, 12.932373046875, 13.67431640625, 14.416259765625, 15.158203125, 15.900146484375, 16.64208984375, 17.384033203125, 18.1259765625, 18.867919921875, 19.60986328125, 20.351806640625, 21.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 13.0, 15.0, 13.0, 22.0, 16.0, 9.0, 31.0, 40.0, 52.0, 72.0, 75.0, 119.0, 189.0, 267.0, 629.0, 1644.0, 6470.0, 84850.0, 2889682.0, 149479.0, 8501.0, 1861.0, 681.0, 297.0, 184.0, 124.0, 69.0, 61.0, 44.0, 39.0, 28.0, 26.0, 16.0, 15.0, 17.0, 15.0, 8.0, 4.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.125, -39.685546875, -38.24609375, -36.806640625, -35.3671875, -33.927734375, -32.48828125, -31.048828125, -29.609375, -28.169921875, -26.73046875, -25.291015625, -23.8515625, -22.412109375, -20.97265625, -19.533203125, -18.09375, -16.654296875, -15.21484375, -13.775390625, -12.3359375, -10.896484375, -9.45703125, -8.017578125, -6.578125, -5.138671875, -3.69921875, -2.259765625, -0.8203125, 0.619140625, 2.05859375, 3.498046875, 4.9375, 6.376953125, 7.81640625, 9.255859375, 10.6953125, 12.134765625, 13.57421875, 15.013671875, 16.453125, 17.892578125, 19.33203125, 20.771484375, 22.2109375, 23.650390625, 25.08984375, 26.529296875, 27.96875, 29.408203125, 30.84765625, 32.287109375, 33.7265625, 35.166015625, 36.60546875, 38.044921875, 39.484375, 40.923828125, 42.36328125, 43.802734375, 45.2421875, 46.681640625, 48.12109375, 49.560546875, 51.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 35.0, 183.0, 386.0, 295.0, 88.0, 15.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-272.6480407714844, -267.7535095214844, -262.8590087890625, -257.9644775390625, -253.06997680664062, -248.17544555664062, -243.2809295654297, -238.38641357421875, -233.4918975830078, -228.59738159179688, -223.70286560058594, -218.808349609375, -213.913818359375, -209.01930236816406, -204.12478637695312, -199.2302703857422, -194.33575439453125, -189.4412384033203, -184.54672241210938, -179.65220642089844, -174.7576904296875, -169.8631591796875, -164.96864318847656, -160.07412719726562, -155.1796112060547, -150.28509521484375, -145.3905792236328, -140.49606323242188, -135.60153198242188, -130.70701599121094, -125.8125, -120.91798400878906, -116.02348327636719, -111.12896728515625, -106.23445129394531, -101.33992767333984, -96.4454116821289, -91.55089569091797, -86.6563720703125, -81.76185607910156, -76.86734008789062, -71.97282409667969, -67.07830810546875, -62.18378448486328, -57.289268493652344, -52.394752502441406, -47.5002326965332, -42.605712890625, -37.71119689941406, -32.816680908203125, -27.922161102294922, -23.02764320373535, -18.13312530517578, -13.238607406616211, -8.34408950805664, -3.4495697021484375, 1.4449462890625, 6.33946418762207, 11.23398208618164, 16.12849998474121, 21.02301788330078, 25.91753578186035, 30.812053680419922, 35.706573486328125, 40.60108947753906]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 8.0, 3.0, 9.0, 11.0, 9.0, 23.0, 12.0, 21.0, 18.0, 22.0, 28.0, 35.0, 25.0, 30.0, 37.0, 41.0, 46.0, 41.0, 34.0, 38.0, 33.0, 46.0, 47.0, 46.0, 37.0, 34.0, 40.0, 35.0, 22.0, 25.0, 18.0, 14.0, 12.0, 20.0, 18.0, 10.0, 10.0, 6.0, 6.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.35573196411133, -53.49592590332031, -51.63611602783203, -49.77630615234375, -47.916500091552734, -46.05669403076172, -44.19688415527344, -42.337074279785156, -40.47726821899414, -38.617462158203125, -36.757652282714844, -34.89784240722656, -33.03803634643555, -31.1782283782959, -29.31842041015625, -27.4586124420166, -25.598804473876953, -23.738996505737305, -21.879188537597656, -20.019380569458008, -18.15957260131836, -16.29976463317871, -14.439956665039062, -12.580148696899414, -10.720340728759766, -8.860532760620117, -7.000724792480469, -5.14091682434082, -3.281108856201172, -1.4213008880615234, 0.438507080078125, 2.2983150482177734, 4.1581268310546875, 6.017934799194336, 7.877742767333984, 9.737550735473633, 11.597358703613281, 13.45716667175293, 15.316974639892578, 17.176782608032227, 19.036590576171875, 20.896398544311523, 22.756206512451172, 24.61601448059082, 26.47582244873047, 28.335630416870117, 30.195438385009766, 32.05524444580078, 33.91505432128906, 35.774864196777344, 37.63467025756836, 39.494476318359375, 41.354286193847656, 43.21409606933594, 45.07390213012695, 46.93370819091797, 48.79351806640625, 50.65332794189453, 52.51313400268555, 54.37294006347656, 56.232749938964844, 58.092559814453125, 59.95236587524414, 61.812171936035156, 63.67198181152344]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 7.0, 12.0, 11.0, 17.0, 20.0, 17.0, 27.0, 20.0, 22.0, 35.0, 35.0, 43.0, 30.0, 38.0, 42.0, 45.0, 45.0, 36.0, 46.0, 43.0, 44.0, 44.0, 41.0, 32.0, 28.0, 26.0, 20.0, 26.0, 26.0, 22.0, 20.0, 13.0, 14.0, 12.0, 9.0, 6.0, 1.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.317138671875, -6.08740234375, -5.857666015625, -5.6279296875, -5.398193359375, -5.16845703125, -4.938720703125, -4.708984375, -4.479248046875, -4.24951171875, -4.019775390625, -3.7900390625, -3.560302734375, -3.33056640625, -3.100830078125, -2.87109375, -2.641357421875, -2.41162109375, -2.181884765625, -1.9521484375, -1.722412109375, -1.49267578125, -1.262939453125, -1.033203125, -0.803466796875, -0.57373046875, -0.343994140625, -0.1142578125, 0.115478515625, 0.34521484375, 0.574951171875, 0.8046875, 1.034423828125, 1.26416015625, 1.493896484375, 1.7236328125, 1.953369140625, 2.18310546875, 2.412841796875, 2.642578125, 2.872314453125, 3.10205078125, 3.331787109375, 3.5615234375, 3.791259765625, 4.02099609375, 4.250732421875, 4.48046875, 4.710205078125, 4.93994140625, 5.169677734375, 5.3994140625, 5.629150390625, 5.85888671875, 6.088623046875, 6.318359375, 6.548095703125, 6.77783203125, 7.007568359375, 7.2373046875, 7.467041015625, 7.69677734375, 7.926513671875, 8.15625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 1.0, 10.0, 2.0, 15.0, 10.0, 14.0, 33.0, 37.0, 37.0, 65.0, 95.0, 113.0, 172.0, 276.0, 327.0, 455.0, 766.0, 1080.0, 1827.0, 2974.0, 5274.0, 10369.0, 23283.0, 68095.0, 284730.0, 1367454.0, 1846115.0, 429415.0, 94105.0, 29308.0, 12318.0, 6142.0, 3386.0, 2030.0, 1246.0, 844.0, 577.0, 358.0, 267.0, 165.0, 133.0, 100.0, 73.0, 58.0, 33.0, 26.0, 18.0, 13.0, 15.0, 7.0, 9.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-13.890625, -13.4713134765625, -13.052001953125, -12.6326904296875, -12.21337890625, -11.7940673828125, -11.374755859375, -10.9554443359375, -10.5361328125, -10.1168212890625, -9.697509765625, -9.2781982421875, -8.85888671875, -8.4395751953125, -8.020263671875, -7.6009521484375, -7.181640625, -6.7623291015625, -6.343017578125, -5.9237060546875, -5.50439453125, -5.0850830078125, -4.665771484375, -4.2464599609375, -3.8271484375, -3.4078369140625, -2.988525390625, -2.5692138671875, -2.14990234375, -1.7305908203125, -1.311279296875, -0.8919677734375, -0.47265625, -0.0533447265625, 0.365966796875, 0.7852783203125, 1.20458984375, 1.6239013671875, 2.043212890625, 2.4625244140625, 2.8818359375, 3.3011474609375, 3.720458984375, 4.1397705078125, 4.55908203125, 4.9783935546875, 5.397705078125, 5.8170166015625, 6.236328125, 6.6556396484375, 7.074951171875, 7.4942626953125, 7.91357421875, 8.3328857421875, 8.752197265625, 9.1715087890625, 9.5908203125, 10.0101318359375, 10.429443359375, 10.8487548828125, 11.26806640625, 11.6873779296875, 12.106689453125, 12.5260009765625, 12.9453125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 13.0, 11.0, 15.0, 25.0, 34.0, 46.0, 72.0, 101.0, 199.0, 324.0, 625.0, 897.0, 658.0, 417.0, 218.0, 127.0, 89.0, 64.0, 33.0, 35.0, 15.0, 11.0, 12.0, 6.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.9375, -22.212158203125, -21.48681640625, -20.761474609375, -20.0361328125, -19.310791015625, -18.58544921875, -17.860107421875, -17.134765625, -16.409423828125, -15.68408203125, -14.958740234375, -14.2333984375, -13.508056640625, -12.78271484375, -12.057373046875, -11.33203125, -10.606689453125, -9.88134765625, -9.156005859375, -8.4306640625, -7.705322265625, -6.97998046875, -6.254638671875, -5.529296875, -4.803955078125, -4.07861328125, -3.353271484375, -2.6279296875, -1.902587890625, -1.17724609375, -0.451904296875, 0.2734375, 0.998779296875, 1.72412109375, 2.449462890625, 3.1748046875, 3.900146484375, 4.62548828125, 5.350830078125, 6.076171875, 6.801513671875, 7.52685546875, 8.252197265625, 8.9775390625, 9.702880859375, 10.42822265625, 11.153564453125, 11.87890625, 12.604248046875, 13.32958984375, 14.054931640625, 14.7802734375, 15.505615234375, 16.23095703125, 16.956298828125, 17.681640625, 18.406982421875, 19.13232421875, 19.857666015625, 20.5830078125, 21.308349609375, 22.03369140625, 22.759033203125, 23.484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 8.0, 11.0, 9.0, 19.0, 26.0, 41.0, 100.0, 156.0, 305.0, 763.0, 2643.0, 16438.0, 529518.0, 3591889.0, 45273.0, 5008.0, 1126.0, 449.0, 222.0, 109.0, 55.0, 31.0, 23.0, 16.0, 12.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.3125, -77.818359375, -75.32421875, -72.830078125, -70.3359375, -67.841796875, -65.34765625, -62.853515625, -60.359375, -57.865234375, -55.37109375, -52.876953125, -50.3828125, -47.888671875, -45.39453125, -42.900390625, -40.40625, -37.912109375, -35.41796875, -32.923828125, -30.4296875, -27.935546875, -25.44140625, -22.947265625, -20.453125, -17.958984375, -15.46484375, -12.970703125, -10.4765625, -7.982421875, -5.48828125, -2.994140625, -0.5, 1.994140625, 4.48828125, 6.982421875, 9.4765625, 11.970703125, 14.46484375, 16.958984375, 19.453125, 21.947265625, 24.44140625, 26.935546875, 29.4296875, 31.923828125, 34.41796875, 36.912109375, 39.40625, 41.900390625, 44.39453125, 46.888671875, 49.3828125, 51.876953125, 54.37109375, 56.865234375, 59.359375, 61.853515625, 64.34765625, 66.841796875, 69.3359375, 71.830078125, 74.32421875, 76.818359375, 79.3125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 8.0, 7.0, 19.0, 47.0, 60.0, 125.0, 208.0, 182.0, 143.0, 108.0, 46.0, 25.0, 16.0, 10.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.23312377929688, -143.7524871826172, -139.2718505859375, -134.7912139892578, -130.31057739257812, -125.82994079589844, -121.34929656982422, -116.86865997314453, -112.38802337646484, -107.90738677978516, -103.42675018310547, -98.94611358642578, -94.46546936035156, -89.98483276367188, -85.50419616699219, -81.0235595703125, -76.54292297363281, -72.06228637695312, -67.58164978027344, -63.101009368896484, -58.6203727722168, -54.13973617553711, -49.659095764160156, -45.17845916748047, -40.69782257080078, -36.217185974121094, -31.736547470092773, -27.255908966064453, -22.775272369384766, -18.294635772705078, -13.813997268676758, -9.333358764648438, -4.85272216796875, -0.3720846176147461, 4.108552932739258, 8.589190483093262, 13.069828033447266, 17.550464630126953, 22.031103134155273, 26.511741638183594, 30.99237823486328, 35.47301483154297, 39.953651428222656, 44.43429183959961, 48.9149284362793, 53.395565032958984, 57.87620544433594, 62.356842041015625, 66.83747863769531, 71.318115234375, 75.79875183105469, 80.27938842773438, 84.76002502441406, 89.24066162109375, 93.72130584716797, 98.20194244384766, 102.68257904052734, 107.16321563720703, 111.64385223388672, 116.1244888305664, 120.60513305664062, 125.08576965332031, 129.56640625, 134.0470428466797, 138.52767944335938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 7.0, 7.0, 4.0, 4.0, 9.0, 9.0, 11.0, 14.0, 14.0, 19.0, 25.0, 22.0, 31.0, 36.0, 31.0, 30.0, 31.0, 47.0, 41.0, 42.0, 48.0, 48.0, 43.0, 41.0, 43.0, 42.0, 30.0, 31.0, 28.0, 29.0, 30.0, 24.0, 15.0, 18.0, 12.0, 17.0, 15.0, 11.0, 7.0, 8.0, 2.0, 7.0, 6.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.69192123413086, -50.99960708618164, -49.30729675292969, -47.61498260498047, -45.92266845703125, -44.2303581237793, -42.53804397583008, -40.845733642578125, -39.153419494628906, -37.46110534667969, -35.768795013427734, -34.076480865478516, -32.3841667175293, -30.691856384277344, -28.999542236328125, -27.30722999572754, -25.61491584777832, -23.922603607177734, -22.230289459228516, -20.53797721862793, -18.845664978027344, -17.153350830078125, -15.461038589477539, -13.768726348876953, -12.07641315460205, -10.384099960327148, -8.691787719726562, -6.99947452545166, -5.307161808013916, -3.614849090576172, -1.9225358963012695, -0.2302236557006836, 1.4620895385742188, 3.154402256011963, 4.846714973449707, 6.539028167724609, 8.231340408325195, 9.923653602600098, 11.615966796875, 13.308279037475586, 15.000592231750488, 16.69290542602539, 18.385217666625977, 20.077529907226562, 21.76984405517578, 23.462156295776367, 25.154468536376953, 26.846782684326172, 28.539094924926758, 30.231407165527344, 31.923721313476562, 33.61603546142578, 35.308345794677734, 37.00065994262695, 38.692970275878906, 40.385284423828125, 42.077598571777344, 43.76991271972656, 45.462223052978516, 47.154537200927734, 48.84685134887695, 50.539161682128906, 52.231475830078125, 53.923789978027344, 55.6161003112793]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 3.0, 10.0, 10.0, 8.0, 12.0, 16.0, 16.0, 19.0, 16.0, 26.0, 26.0, 32.0, 28.0, 29.0, 32.0, 46.0, 40.0, 42.0, 34.0, 43.0, 36.0, 61.0, 39.0, 37.0, 43.0, 31.0, 37.0, 28.0, 26.0, 17.0, 26.0, 22.0, 25.0, 8.0, 13.0, 13.0, 9.0, 8.0, 6.0, 8.0, 2.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.12109375, -5.90203857421875, -5.6829833984375, -5.46392822265625, -5.244873046875, -5.02581787109375, -4.8067626953125, -4.58770751953125, -4.36865234375, -4.14959716796875, -3.9305419921875, -3.71148681640625, -3.492431640625, -3.27337646484375, -3.0543212890625, -2.83526611328125, -2.6162109375, -2.39715576171875, -2.1781005859375, -1.95904541015625, -1.739990234375, -1.52093505859375, -1.3018798828125, -1.08282470703125, -0.86376953125, -0.64471435546875, -0.4256591796875, -0.20660400390625, 0.012451171875, 0.23150634765625, 0.4505615234375, 0.66961669921875, 0.888671875, 1.10772705078125, 1.3267822265625, 1.54583740234375, 1.764892578125, 1.98394775390625, 2.2030029296875, 2.42205810546875, 2.64111328125, 2.86016845703125, 3.0792236328125, 3.29827880859375, 3.517333984375, 3.73638916015625, 3.9554443359375, 4.17449951171875, 4.3935546875, 4.61260986328125, 4.8316650390625, 5.05072021484375, 5.269775390625, 5.48883056640625, 5.7078857421875, 5.92694091796875, 6.14599609375, 6.36505126953125, 6.5841064453125, 6.80316162109375, 7.022216796875, 7.24127197265625, 7.4603271484375, 7.67938232421875, 7.8984375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 11.0, 17.0, 14.0, 33.0, 41.0, 59.0, 80.0, 147.0, 192.0, 285.0, 390.0, 623.0, 1062.0, 1570.0, 2488.0, 4009.0, 6587.0, 10868.0, 17999.0, 29310.0, 48678.0, 78163.0, 118287.0, 158446.0, 170882.0, 140132.0, 97436.0, 62580.0, 38285.0, 23031.0, 14027.0, 8732.0, 5125.0, 3198.0, 2039.0, 1288.0, 817.0, 521.0, 378.0, 229.0, 163.0, 99.0, 80.0, 42.0, 34.0, 26.0, 18.0, 12.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.91357421875, -0.88525390625, -0.85693359375, -0.82861328125, -0.80029296875, -0.77197265625, -0.74365234375, -0.71533203125, -0.68701171875, -0.65869140625, -0.63037109375, -0.60205078125, -0.57373046875, -0.54541015625, -0.51708984375, -0.48876953125, -0.46044921875, -0.43212890625, -0.40380859375, -0.37548828125, -0.34716796875, -0.31884765625, -0.29052734375, -0.26220703125, -0.23388671875, -0.20556640625, -0.17724609375, -0.14892578125, -0.12060546875, -0.09228515625, -0.06396484375, -0.03564453125, -0.00732421875, 0.02099609375, 0.04931640625, 0.07763671875, 0.10595703125, 0.13427734375, 0.16259765625, 0.19091796875, 0.21923828125, 0.24755859375, 0.27587890625, 0.30419921875, 0.33251953125, 0.36083984375, 0.38916015625, 0.41748046875, 0.44580078125, 0.47412109375, 0.50244140625, 0.53076171875, 0.55908203125, 0.58740234375, 0.61572265625, 0.64404296875, 0.67236328125, 0.70068359375, 0.72900390625, 0.75732421875, 0.78564453125, 0.81396484375, 0.84228515625, 0.87060546875, 0.89892578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 11.0, 11.0, 11.0, 19.0, 24.0, 22.0, 24.0, 26.0, 24.0, 39.0, 30.0, 41.0, 34.0, 59.0, 29.0, 46.0, 1069.0, 43.0, 48.0, 46.0, 39.0, 39.0, 31.0, 24.0, 30.0, 24.0, 21.0, 27.0, 21.0, 15.0, 17.0, 15.0, 12.0, 10.0, 3.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.55859375, -5.39337158203125, -5.2281494140625, -5.06292724609375, -4.897705078125, -4.73248291015625, -4.5672607421875, -4.40203857421875, -4.23681640625, -4.07159423828125, -3.9063720703125, -3.74114990234375, -3.575927734375, -3.41070556640625, -3.2454833984375, -3.08026123046875, -2.9150390625, -2.74981689453125, -2.5845947265625, -2.41937255859375, -2.254150390625, -2.08892822265625, -1.9237060546875, -1.75848388671875, -1.59326171875, -1.42803955078125, -1.2628173828125, -1.09759521484375, -0.932373046875, -0.76715087890625, -0.6019287109375, -0.43670654296875, -0.271484375, -0.10626220703125, 0.0589599609375, 0.22418212890625, 0.389404296875, 0.55462646484375, 0.7198486328125, 0.88507080078125, 1.05029296875, 1.21551513671875, 1.3807373046875, 1.54595947265625, 1.711181640625, 1.87640380859375, 2.0416259765625, 2.20684814453125, 2.3720703125, 2.53729248046875, 2.7025146484375, 2.86773681640625, 3.032958984375, 3.19818115234375, 3.3634033203125, 3.52862548828125, 3.69384765625, 3.85906982421875, 4.0242919921875, 4.18951416015625, 4.354736328125, 4.51995849609375, 4.6851806640625, 4.85040283203125, 5.015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 11.0, 17.0, 19.0, 27.0, 39.0, 54.0, 94.0, 150.0, 250.0, 447.0, 766.0, 1445.0, 2820.0, 5908.0, 12957.0, 33430.0, 388387.0, 1583671.0, 38815.0, 14548.0, 6425.0, 3203.0, 1599.0, 860.0, 487.0, 281.0, 144.0, 72.0, 76.0, 50.0, 23.0, 16.0, 8.0, 9.0, 2.0, 4.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.740234375, -2.65478515625, -2.5693359375, -2.48388671875, -2.3984375, -2.31298828125, -2.2275390625, -2.14208984375, -2.056640625, -1.97119140625, -1.8857421875, -1.80029296875, -1.71484375, -1.62939453125, -1.5439453125, -1.45849609375, -1.373046875, -1.28759765625, -1.2021484375, -1.11669921875, -1.03125, -0.94580078125, -0.8603515625, -0.77490234375, -0.689453125, -0.60400390625, -0.5185546875, -0.43310546875, -0.34765625, -0.26220703125, -0.1767578125, -0.09130859375, -0.005859375, 0.07958984375, 0.1650390625, 0.25048828125, 0.3359375, 0.42138671875, 0.5068359375, 0.59228515625, 0.677734375, 0.76318359375, 0.8486328125, 0.93408203125, 1.01953125, 1.10498046875, 1.1904296875, 1.27587890625, 1.361328125, 1.44677734375, 1.5322265625, 1.61767578125, 1.703125, 1.78857421875, 1.8740234375, 1.95947265625, 2.044921875, 2.13037109375, 2.2158203125, 2.30126953125, 2.38671875, 2.47216796875, 2.5576171875, 2.64306640625, 2.728515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 10.0, 17.0, 17.0, 29.0, 27.0, 33.0, 34.0, 43.0, 40.0, 59.0, 62.0, 70.0, 54.0, 78.0, 57.0, 47.0, 55.0, 50.0, 30.0, 35.0, 20.0, 25.0, 12.0, 15.0, 13.0, 11.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0948486328125, -0.09192180633544922, -0.08899497985839844, -0.08606815338134766, -0.08314132690429688, -0.0802145004272461, -0.07728767395019531, -0.07436084747314453, -0.07143402099609375, -0.06850719451904297, -0.06558036804199219, -0.0626535415649414, -0.059726715087890625, -0.056799888610839844, -0.05387306213378906, -0.05094623565673828, -0.0480194091796875, -0.04509258270263672, -0.04216575622558594, -0.039238929748535156, -0.036312103271484375, -0.033385276794433594, -0.030458450317382812, -0.02753162384033203, -0.02460479736328125, -0.02167797088623047, -0.018751144409179688, -0.015824317932128906, -0.012897491455078125, -0.009970664978027344, -0.0070438385009765625, -0.004117012023925781, -0.001190185546875, 0.0017366409301757812, 0.0046634674072265625, 0.007590293884277344, 0.010517120361328125, 0.013443946838378906, 0.016370773315429688, 0.01929759979248047, 0.02222442626953125, 0.02515125274658203, 0.028078079223632812, 0.031004905700683594, 0.033931732177734375, 0.036858558654785156, 0.03978538513183594, 0.04271221160888672, 0.0456390380859375, 0.04856586456298828, 0.05149269104003906, 0.054419517517089844, 0.057346343994140625, 0.060273170471191406, 0.06319999694824219, 0.06612682342529297, 0.06905364990234375, 0.07198047637939453, 0.07490730285644531, 0.0778341293334961, 0.08076095581054688, 0.08368778228759766, 0.08661460876464844, 0.08954143524169922, 0.09246826171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 10.0, 16.0, 21.0, 18.0, 35.0, 39.0, 74.0, 83.0, 117.0, 156.0, 339.0, 1166.0, 13888.0, 807064.0, 219137.0, 4918.0, 684.0, 238.0, 146.0, 105.0, 72.0, 56.0, 45.0, 31.0, 22.0, 13.0, 7.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.552734375, -1.50543212890625, -1.4581298828125, -1.41082763671875, -1.363525390625, -1.31622314453125, -1.2689208984375, -1.22161865234375, -1.17431640625, -1.12701416015625, -1.0797119140625, -1.03240966796875, -0.985107421875, -0.93780517578125, -0.8905029296875, -0.84320068359375, -0.7958984375, -0.74859619140625, -0.7012939453125, -0.65399169921875, -0.606689453125, -0.55938720703125, -0.5120849609375, -0.46478271484375, -0.41748046875, -0.37017822265625, -0.3228759765625, -0.27557373046875, -0.228271484375, -0.18096923828125, -0.1336669921875, -0.08636474609375, -0.0390625, 0.00823974609375, 0.0555419921875, 0.10284423828125, 0.150146484375, 0.19744873046875, 0.2447509765625, 0.29205322265625, 0.33935546875, 0.38665771484375, 0.4339599609375, 0.48126220703125, 0.528564453125, 0.57586669921875, 0.6231689453125, 0.67047119140625, 0.7177734375, 0.76507568359375, 0.8123779296875, 0.85968017578125, 0.906982421875, 0.95428466796875, 1.0015869140625, 1.04888916015625, 1.09619140625, 1.14349365234375, 1.1907958984375, 1.23809814453125, 1.285400390625, 1.33270263671875, 1.3800048828125, 1.42730712890625, 1.474609375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 27.0, 110.0, 555.0, 258.0, 42.0, 16.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2537088096141815, -0.22078925371170044, -0.18786969780921936, -0.15495015680789948, -0.1220306009054184, -0.08911104500293732, -0.05619150400161743, -0.023271948099136353, 0.009647607803344727, 0.04256715998053551, 0.07548671215772629, 0.10840626060962677, 0.14132581651210785, 0.17424537241458893, 0.2071649134159088, 0.2400844693183899, 0.27300402522087097, 0.30592358112335205, 0.33884313702583313, 0.3717626929283142, 0.4046822190284729, 0.43760180473327637, 0.47052133083343506, 0.5034408569335938, 0.5363604426383972, 0.5692799687385559, 0.6021995544433594, 0.6351190805435181, 0.6680386662483215, 0.7009581923484802, 0.7338777780532837, 0.7667973041534424, 0.7997168302536011, 0.8326363563537598, 0.8655559420585632, 0.8984754681587219, 0.9313950538635254, 0.9643145799636841, 0.9972341060638428, 1.030153751373291, 1.0630732774734497, 1.0959928035736084, 1.128912329673767, 1.1618319749832153, 1.194751501083374, 1.2276710271835327, 1.2605905532836914, 1.2935101985931396, 1.3264296054840088, 1.3593491315841675, 1.3922686576843262, 1.4251883029937744, 1.458107829093933, 1.4910273551940918, 1.5239468812942505, 1.5568664073944092, 1.5897860527038574, 1.6227055788040161, 1.6556251049041748, 1.688544750213623, 1.7214642763137817, 1.7543838024139404, 1.7873033285140991, 1.8202228546142578, 1.853142499923706]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 3.0, 9.0, 15.0, 22.0, 15.0, 20.0, 35.0, 45.0, 33.0, 47.0, 45.0, 52.0, 58.0, 55.0, 59.0, 45.0, 52.0, 60.0, 55.0, 44.0, 36.0, 36.0, 45.0, 26.0, 24.0, 14.0, 9.0, 9.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18377423286437988, -0.178400456905365, -0.1730266958475113, -0.1676529198884964, -0.1622791439294815, -0.1569053828716278, -0.15153160691261292, -0.14615783095359802, -0.14078405499458313, -0.13541027903556824, -0.13003651797771454, -0.12466274201869965, -0.11928896605968475, -0.11391519755125046, -0.10854142904281616, -0.10316765308380127, -0.09779389202594757, -0.09242012351751328, -0.08704634755849838, -0.08167257905006409, -0.0762988030910492, -0.0709250345826149, -0.0655512660741806, -0.06017749384045601, -0.054803721606731415, -0.04942994937300682, -0.04405617713928223, -0.03868240863084793, -0.03330863639712334, -0.027934864163398743, -0.022561095654964447, -0.017187323421239853, -0.011813551187515259, -0.006439779885113239, -0.0010660085827112198, 0.004307761788368225, 0.00968153402209282, 0.015055306255817413, 0.02042907476425171, 0.025802846997976303, 0.031176619231700897, 0.03655039146542549, 0.041924163699150085, 0.04729793220758438, 0.052671704441308975, 0.05804547667503357, 0.06341924518346786, 0.06879301369190216, 0.07416678965091705, 0.07954055815935135, 0.08491433411836624, 0.09028810262680054, 0.09566187858581543, 0.10103564709424973, 0.10640941560268402, 0.11178319156169891, 0.11715696007013321, 0.1225307285785675, 0.1279045045375824, 0.1332782804965973, 0.138652041554451, 0.14402581751346588, 0.14939957857131958, 0.15477335453033447, 0.16014713048934937]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 5.0, 3.0, 10.0, 10.0, 8.0, 12.0, 16.0, 16.0, 18.0, 17.0, 26.0, 27.0, 30.0, 29.0, 29.0, 32.0, 44.0, 40.0, 45.0, 33.0, 42.0, 37.0, 58.0, 41.0, 36.0, 45.0, 30.0, 37.0, 28.0, 27.0, 17.0, 26.0, 21.0, 26.0, 6.0, 15.0, 13.0, 9.0, 8.0, 6.0, 8.0, 3.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.12109375, -5.9022216796875, -5.683349609375, -5.4644775390625, -5.24560546875, -5.0267333984375, -4.807861328125, -4.5889892578125, -4.3701171875, -4.1512451171875, -3.932373046875, -3.7135009765625, -3.49462890625, -3.2757568359375, -3.056884765625, -2.8380126953125, -2.619140625, -2.4002685546875, -2.181396484375, -1.9625244140625, -1.74365234375, -1.5247802734375, -1.305908203125, -1.0870361328125, -0.8681640625, -0.6492919921875, -0.430419921875, -0.2115478515625, 0.00732421875, 0.2261962890625, 0.445068359375, 0.6639404296875, 0.8828125, 1.1016845703125, 1.320556640625, 1.5394287109375, 1.75830078125, 1.9771728515625, 2.196044921875, 2.4149169921875, 2.6337890625, 2.8526611328125, 3.071533203125, 3.2904052734375, 3.50927734375, 3.7281494140625, 3.947021484375, 4.1658935546875, 4.384765625, 4.6036376953125, 4.822509765625, 5.0413818359375, 5.26025390625, 5.4791259765625, 5.697998046875, 5.9168701171875, 6.1357421875, 6.3546142578125, 6.573486328125, 6.7923583984375, 7.01123046875, 7.2301025390625, 7.448974609375, 7.6678466796875, 7.88671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 9.0, 18.0, 23.0, 36.0, 37.0, 57.0, 83.0, 98.0, 131.0, 230.0, 295.0, 464.0, 661.0, 1061.0, 1680.0, 2832.0, 5240.0, 9853.0, 19036.0, 37801.0, 73590.0, 137465.0, 293174.0, 218567.0, 117736.0, 61751.0, 31274.0, 16081.0, 8163.0, 4358.0, 2383.0, 1466.0, 890.0, 624.0, 418.0, 256.0, 221.0, 152.0, 100.0, 65.0, 60.0, 31.0, 22.0, 23.0, 11.0, 11.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.640625, -6.41827392578125, -6.1959228515625, -5.97357177734375, -5.751220703125, -5.52886962890625, -5.3065185546875, -5.08416748046875, -4.86181640625, -4.63946533203125, -4.4171142578125, -4.19476318359375, -3.972412109375, -3.75006103515625, -3.5277099609375, -3.30535888671875, -3.0830078125, -2.86065673828125, -2.6383056640625, -2.41595458984375, -2.193603515625, -1.97125244140625, -1.7489013671875, -1.52655029296875, -1.30419921875, -1.08184814453125, -0.8594970703125, -0.63714599609375, -0.414794921875, -0.19244384765625, 0.0299072265625, 0.25225830078125, 0.474609375, 0.69696044921875, 0.9193115234375, 1.14166259765625, 1.364013671875, 1.58636474609375, 1.8087158203125, 2.03106689453125, 2.25341796875, 2.47576904296875, 2.6981201171875, 2.92047119140625, 3.142822265625, 3.36517333984375, 3.5875244140625, 3.80987548828125, 4.0322265625, 4.25457763671875, 4.4769287109375, 4.69927978515625, 4.921630859375, 5.14398193359375, 5.3663330078125, 5.58868408203125, 5.81103515625, 6.03338623046875, 6.2557373046875, 6.47808837890625, 6.700439453125, 6.92279052734375, 7.1451416015625, 7.36749267578125, 7.58984375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 9.0, 6.0, 7.0, 18.0, 23.0, 19.0, 23.0, 27.0, 40.0, 43.0, 44.0, 59.0, 53.0, 105.0, 191.0, 1566.0, 276.0, 132.0, 50.0, 56.0, 47.0, 41.0, 22.0, 31.0, 23.0, 28.0, 26.0, 13.0, 17.0, 11.0, 15.0, 10.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.28125, -30.404541015625, -29.52783203125, -28.651123046875, -27.7744140625, -26.897705078125, -26.02099609375, -25.144287109375, -24.267578125, -23.390869140625, -22.51416015625, -21.637451171875, -20.7607421875, -19.884033203125, -19.00732421875, -18.130615234375, -17.25390625, -16.377197265625, -15.50048828125, -14.623779296875, -13.7470703125, -12.870361328125, -11.99365234375, -11.116943359375, -10.240234375, -9.363525390625, -8.48681640625, -7.610107421875, -6.7333984375, -5.856689453125, -4.97998046875, -4.103271484375, -3.2265625, -2.349853515625, -1.47314453125, -0.596435546875, 0.2802734375, 1.156982421875, 2.03369140625, 2.910400390625, 3.787109375, 4.663818359375, 5.54052734375, 6.417236328125, 7.2939453125, 8.170654296875, 9.04736328125, 9.924072265625, 10.80078125, 11.677490234375, 12.55419921875, 13.430908203125, 14.3076171875, 15.184326171875, 16.06103515625, 16.937744140625, 17.814453125, 18.691162109375, 19.56787109375, 20.444580078125, 21.3212890625, 22.197998046875, 23.07470703125, 23.951416015625, 24.828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 10.0, 12.0, 16.0, 15.0, 24.0, 24.0, 31.0, 36.0, 65.0, 74.0, 92.0, 126.0, 169.0, 256.0, 479.0, 890.0, 3902.0, 61236.0, 2808646.0, 258838.0, 7733.0, 1431.0, 547.0, 297.0, 197.0, 143.0, 97.0, 74.0, 58.0, 56.0, 35.0, 25.0, 15.0, 11.0, 7.0, 14.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -38.99658203125, -37.5869140625, -36.17724609375, -34.767578125, -33.35791015625, -31.9482421875, -30.53857421875, -29.12890625, -27.71923828125, -26.3095703125, -24.89990234375, -23.490234375, -22.08056640625, -20.6708984375, -19.26123046875, -17.8515625, -16.44189453125, -15.0322265625, -13.62255859375, -12.212890625, -10.80322265625, -9.3935546875, -7.98388671875, -6.57421875, -5.16455078125, -3.7548828125, -2.34521484375, -0.935546875, 0.47412109375, 1.8837890625, 3.29345703125, 4.703125, 6.11279296875, 7.5224609375, 8.93212890625, 10.341796875, 11.75146484375, 13.1611328125, 14.57080078125, 15.98046875, 17.39013671875, 18.7998046875, 20.20947265625, 21.619140625, 23.02880859375, 24.4384765625, 25.84814453125, 27.2578125, 28.66748046875, 30.0771484375, 31.48681640625, 32.896484375, 34.30615234375, 35.7158203125, 37.12548828125, 38.53515625, 39.94482421875, 41.3544921875, 42.76416015625, 44.173828125, 45.58349609375, 46.9931640625, 48.40283203125, 49.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 6.0, 121.0, 637.0, 244.0, 11.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.849346160888672, -22.330114364624023, -13.810882568359375, -5.291650772094727, 3.227581024169922, 11.746814727783203, 20.26604461669922, 28.785274505615234, 37.304508209228516, 45.82373809814453, 54.34297180175781, 62.862205505371094, 71.38143920898438, 79.90066528320312, 88.4198989868164, 96.93913269042969, 105.45835876464844, 113.97759246826172, 122.496826171875, 131.01605224609375, 139.5352783203125, 148.0545196533203, 156.57374572753906, 165.09298706054688, 173.61221313476562, 182.13143920898438, 190.6506805419922, 199.16990661621094, 207.68914794921875, 216.2083740234375, 224.72760009765625, 233.246826171875, 241.76605224609375, 250.2852783203125, 258.80450439453125, 267.3237609863281, 275.8429870605469, 284.3622131347656, 292.8814392089844, 301.4006652832031, 309.919921875, 318.43914794921875, 326.9583740234375, 335.4776306152344, 343.9968566894531, 352.5160827636719, 361.0353088378906, 369.5545349121094, 378.0737609863281, 386.5929870605469, 395.1122131347656, 403.6314697265625, 412.15069580078125, 420.669921875, 429.18914794921875, 437.7083740234375, 446.22760009765625, 454.746826171875, 463.26605224609375, 471.7853088378906, 480.3045349121094, 488.8237609863281, 497.3429870605469, 505.8622131347656, 514.3814697265625]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0, 11.0, 12.0, 12.0, 14.0, 9.0, 18.0, 20.0, 28.0, 22.0, 25.0, 33.0, 41.0, 28.0, 33.0, 51.0, 34.0, 35.0, 41.0, 36.0, 30.0, 27.0, 30.0, 46.0, 39.0, 40.0, 29.0, 32.0, 37.0, 10.0, 20.0, 23.0, 17.0, 21.0, 18.0, 13.0, 11.0, 6.0, 4.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-61.23611831665039, -59.284576416015625, -57.333038330078125, -55.38149642944336, -53.42995834350586, -51.478416442871094, -49.526878356933594, -47.57533645629883, -45.62379455566406, -43.6722526550293, -41.7207145690918, -39.76917266845703, -37.81763458251953, -35.866092681884766, -33.91455078125, -31.9630126953125, -30.011474609375, -28.059934616088867, -26.108394622802734, -24.15685272216797, -22.20531463623047, -20.253772735595703, -18.30223274230957, -16.350692749023438, -14.399152755737305, -12.447612762451172, -10.496072769165039, -8.54453182220459, -6.592991828918457, -4.641451835632324, -2.689910888671875, -0.7383708953857422, 1.2131729125976562, 3.164713144302368, 5.11625337600708, 7.067793846130371, 9.019333839416504, 10.970873832702637, 12.922414779663086, 14.873954772949219, 16.82549476623535, 18.777034759521484, 20.728574752807617, 22.68011474609375, 24.631656646728516, 26.583194732666016, 28.53473663330078, 30.486276626586914, 32.43781661987305, 34.38935852050781, 36.34089660644531, 38.29243850708008, 40.24397659301758, 42.195518493652344, 44.147056579589844, 46.09859848022461, 48.050140380859375, 50.00168228149414, 51.95322036743164, 53.904762268066406, 55.856300354003906, 57.80784225463867, 59.75938415527344, 61.71092224121094, 63.66246032714844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 10.0, 9.0, 16.0, 9.0, 9.0, 20.0, 15.0, 23.0, 31.0, 14.0, 30.0, 34.0, 32.0, 33.0, 29.0, 48.0, 63.0, 35.0, 49.0, 50.0, 37.0, 42.0, 37.0, 59.0, 33.0, 37.0, 25.0, 26.0, 21.0, 22.0, 17.0, 19.0, 13.0, 10.0, 7.0, 8.0, 4.0, 4.0, 9.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.21185302734375, -6.9666748046875, -6.72149658203125, -6.476318359375, -6.23114013671875, -5.9859619140625, -5.74078369140625, -5.49560546875, -5.25042724609375, -5.0052490234375, -4.76007080078125, -4.514892578125, -4.26971435546875, -4.0245361328125, -3.77935791015625, -3.5341796875, -3.28900146484375, -3.0438232421875, -2.79864501953125, -2.553466796875, -2.30828857421875, -2.0631103515625, -1.81793212890625, -1.57275390625, -1.32757568359375, -1.0823974609375, -0.83721923828125, -0.592041015625, -0.34686279296875, -0.1016845703125, 0.14349365234375, 0.388671875, 0.63385009765625, 0.8790283203125, 1.12420654296875, 1.369384765625, 1.61456298828125, 1.8597412109375, 2.10491943359375, 2.35009765625, 2.59527587890625, 2.8404541015625, 3.08563232421875, 3.330810546875, 3.57598876953125, 3.8211669921875, 4.06634521484375, 4.3115234375, 4.55670166015625, 4.8018798828125, 5.04705810546875, 5.292236328125, 5.53741455078125, 5.7825927734375, 6.02777099609375, 6.27294921875, 6.51812744140625, 6.7633056640625, 7.00848388671875, 7.253662109375, 7.49884033203125, 7.7440185546875, 7.98919677734375, 8.234375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 6.0, 10.0, 10.0, 16.0, 27.0, 26.0, 42.0, 52.0, 68.0, 93.0, 136.0, 184.0, 267.0, 313.0, 545.0, 814.0, 1279.0, 2214.0, 3987.0, 7863.0, 17707.0, 52995.0, 243990.0, 1391119.0, 1962760.0, 387558.0, 76752.0, 22770.0, 9350.0, 4606.0, 2478.0, 1461.0, 848.0, 594.0, 366.0, 260.0, 202.0, 128.0, 85.0, 79.0, 51.0, 47.0, 31.0, 24.0, 21.0, 12.0, 8.0, 8.0, 9.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0], "bins": [-15.1015625, -14.645751953125, -14.18994140625, -13.734130859375, -13.2783203125, -12.822509765625, -12.36669921875, -11.910888671875, -11.455078125, -10.999267578125, -10.54345703125, -10.087646484375, -9.6318359375, -9.176025390625, -8.72021484375, -8.264404296875, -7.80859375, -7.352783203125, -6.89697265625, -6.441162109375, -5.9853515625, -5.529541015625, -5.07373046875, -4.617919921875, -4.162109375, -3.706298828125, -3.25048828125, -2.794677734375, -2.3388671875, -1.883056640625, -1.42724609375, -0.971435546875, -0.515625, -0.059814453125, 0.39599609375, 0.851806640625, 1.3076171875, 1.763427734375, 2.21923828125, 2.675048828125, 3.130859375, 3.586669921875, 4.04248046875, 4.498291015625, 4.9541015625, 5.409912109375, 5.86572265625, 6.321533203125, 6.77734375, 7.233154296875, 7.68896484375, 8.144775390625, 8.6005859375, 9.056396484375, 9.51220703125, 9.968017578125, 10.423828125, 10.879638671875, 11.33544921875, 11.791259765625, 12.2470703125, 12.702880859375, 13.15869140625, 13.614501953125, 14.0703125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 13.0, 10.0, 27.0, 29.0, 36.0, 86.0, 117.0, 227.0, 398.0, 768.0, 892.0, 616.0, 337.0, 170.0, 125.0, 65.0, 45.0, 32.0, 21.0, 14.0, 9.0, 10.0, 10.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.561279296875, -22.81005859375, -22.058837890625, -21.3076171875, -20.556396484375, -19.80517578125, -19.053955078125, -18.302734375, -17.551513671875, -16.80029296875, -16.049072265625, -15.2978515625, -14.546630859375, -13.79541015625, -13.044189453125, -12.29296875, -11.541748046875, -10.79052734375, -10.039306640625, -9.2880859375, -8.536865234375, -7.78564453125, -7.034423828125, -6.283203125, -5.531982421875, -4.78076171875, -4.029541015625, -3.2783203125, -2.527099609375, -1.77587890625, -1.024658203125, -0.2734375, 0.477783203125, 1.22900390625, 1.980224609375, 2.7314453125, 3.482666015625, 4.23388671875, 4.985107421875, 5.736328125, 6.487548828125, 7.23876953125, 7.989990234375, 8.7412109375, 9.492431640625, 10.24365234375, 10.994873046875, 11.74609375, 12.497314453125, 13.24853515625, 13.999755859375, 14.7509765625, 15.502197265625, 16.25341796875, 17.004638671875, 17.755859375, 18.507080078125, 19.25830078125, 20.009521484375, 20.7607421875, 21.511962890625, 22.26318359375, 23.014404296875, 23.765625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 12.0, 3.0, 22.0, 22.0, 31.0, 52.0, 101.0, 179.0, 489.0, 1485.0, 9494.0, 447433.0, 3707261.0, 23849.0, 2654.0, 699.0, 221.0, 106.0, 55.0, 34.0, 25.0, 17.0, 13.0, 5.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.0625, -100.828125, -97.59375, -94.359375, -91.125, -87.890625, -84.65625, -81.421875, -78.1875, -74.953125, -71.71875, -68.484375, -65.25, -62.015625, -58.78125, -55.546875, -52.3125, -49.078125, -45.84375, -42.609375, -39.375, -36.140625, -32.90625, -29.671875, -26.4375, -23.203125, -19.96875, -16.734375, -13.5, -10.265625, -7.03125, -3.796875, -0.5625, 2.671875, 5.90625, 9.140625, 12.375, 15.609375, 18.84375, 22.078125, 25.3125, 28.546875, 31.78125, 35.015625, 38.25, 41.484375, 44.71875, 47.953125, 51.1875, 54.421875, 57.65625, 60.890625, 64.125, 67.359375, 70.59375, 73.828125, 77.0625, 80.296875, 83.53125, 86.765625, 90.0, 93.234375, 96.46875, 99.703125, 102.9375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 16.0, 27.0, 67.0, 159.0, 251.0, 217.0, 148.0, 66.0, 34.0, 13.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.2138977050781, -285.6064758300781, -279.9990539550781, -274.3916320800781, -268.7842102050781, -263.1767883300781, -257.5693664550781, -251.96194458007812, -246.35452270507812, -240.74710083007812, -235.13967895507812, -229.53225708007812, -223.92483520507812, -218.31741333007812, -212.70999145507812, -207.10256958007812, -201.49514770507812, -195.88772583007812, -190.28030395507812, -184.67288208007812, -179.06546020507812, -173.45803833007812, -167.85061645507812, -162.24319458007812, -156.63577270507812, -151.02835083007812, -145.42092895507812, -139.81350708007812, -134.20608520507812, -128.59866333007812, -122.99124145507812, -117.38381958007812, -111.7763900756836, -106.1689682006836, -100.5615463256836, -94.9541244506836, -89.3467025756836, -83.7392807006836, -78.1318588256836, -72.5244369506836, -66.9170150756836, -61.309593200683594, -55.702171325683594, -50.094749450683594, -44.487327575683594, -38.879905700683594, -33.272483825683594, -27.665061950683594, -22.057640075683594, -16.450218200683594, -10.842796325683594, -5.235374450683594, 0.37204742431640625, 5.979469299316406, 11.586891174316406, 17.194313049316406, 22.801734924316406, 28.409156799316406, 34.016578674316406, 39.624000549316406, 45.231422424316406, 50.838844299316406, 56.446266174316406, 62.053688049316406, 67.6611099243164]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 10.0, 3.0, 14.0, 10.0, 12.0, 18.0, 13.0, 20.0, 18.0, 23.0, 21.0, 29.0, 38.0, 30.0, 44.0, 44.0, 33.0, 56.0, 28.0, 38.0, 43.0, 51.0, 33.0, 33.0, 37.0, 28.0, 34.0, 28.0, 23.0, 20.0, 32.0, 19.0, 17.0, 23.0, 14.0, 20.0, 13.0, 10.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.881858825683594, -51.30610656738281, -49.730350494384766, -48.154598236083984, -46.57884216308594, -45.003089904785156, -43.427337646484375, -41.851585388183594, -40.27582931518555, -38.700077056884766, -37.12432098388672, -35.54856872558594, -33.972816467285156, -32.39706039428711, -30.821308135986328, -29.245553970336914, -27.6697998046875, -26.094045639038086, -24.518291473388672, -22.94253921508789, -21.366785049438477, -19.791030883789062, -18.21527862548828, -16.639524459838867, -15.063770294189453, -13.488016128540039, -11.912262916564941, -10.336509704589844, -8.76075553894043, -7.185001850128174, -5.609248161315918, -4.03349494934082, -2.4577407836914062, -0.8819870948791504, 0.6937665939331055, 2.2695202827453613, 3.845273971557617, 5.421027660369873, 6.996781349182129, 8.572534561157227, 10.14828872680664, 11.724042892456055, 13.299796104431152, 14.87554931640625, 16.451303482055664, 18.027057647705078, 19.60280990600586, 21.178564071655273, 22.754318237304688, 24.3300724029541, 25.905826568603516, 27.481578826904297, 29.05733299255371, 30.633087158203125, 32.208839416503906, 33.78459167480469, 35.360347747802734, 36.936100006103516, 38.51185607910156, 40.087608337402344, 41.663360595703125, 43.23911666870117, 44.81486892700195, 46.390625, 47.96637725830078]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 12.0, 4.0, 6.0, 15.0, 13.0, 16.0, 10.0, 25.0, 25.0, 19.0, 34.0, 34.0, 31.0, 51.0, 45.0, 55.0, 56.0, 51.0, 40.0, 38.0, 40.0, 37.0, 52.0, 42.0, 44.0, 32.0, 29.0, 22.0, 24.0, 25.0, 18.0, 21.0, 6.0, 10.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.00732421875, -7.7333984375, -7.45947265625, -7.185546875, -6.91162109375, -6.6376953125, -6.36376953125, -6.08984375, -5.81591796875, -5.5419921875, -5.26806640625, -4.994140625, -4.72021484375, -4.4462890625, -4.17236328125, -3.8984375, -3.62451171875, -3.3505859375, -3.07666015625, -2.802734375, -2.52880859375, -2.2548828125, -1.98095703125, -1.70703125, -1.43310546875, -1.1591796875, -0.88525390625, -0.611328125, -0.33740234375, -0.0634765625, 0.21044921875, 0.484375, 0.75830078125, 1.0322265625, 1.30615234375, 1.580078125, 1.85400390625, 2.1279296875, 2.40185546875, 2.67578125, 2.94970703125, 3.2236328125, 3.49755859375, 3.771484375, 4.04541015625, 4.3193359375, 4.59326171875, 4.8671875, 5.14111328125, 5.4150390625, 5.68896484375, 5.962890625, 6.23681640625, 6.5107421875, 6.78466796875, 7.05859375, 7.33251953125, 7.6064453125, 7.88037109375, 8.154296875, 8.42822265625, 8.7021484375, 8.97607421875, 9.25]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 10.0, 9.0, 18.0, 18.0, 31.0, 39.0, 79.0, 98.0, 165.0, 272.0, 430.0, 581.0, 925.0, 1437.0, 2165.0, 3515.0, 5796.0, 9586.0, 15858.0, 26691.0, 46114.0, 78436.0, 128092.0, 181425.0, 189075.0, 140597.0, 88370.0, 52153.0, 30480.0, 17947.0, 10620.0, 6595.0, 4120.0, 2410.0, 1511.0, 1038.0, 624.0, 423.0, 268.0, 184.0, 104.0, 94.0, 56.0, 30.0, 33.0, 11.0, 10.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9962158203125, -0.963134765625, -0.9300537109375, -0.89697265625, -0.8638916015625, -0.830810546875, -0.7977294921875, -0.7646484375, -0.7315673828125, -0.698486328125, -0.6654052734375, -0.63232421875, -0.5992431640625, -0.566162109375, -0.5330810546875, -0.5, -0.4669189453125, -0.433837890625, -0.4007568359375, -0.36767578125, -0.3345947265625, -0.301513671875, -0.2684326171875, -0.2353515625, -0.2022705078125, -0.169189453125, -0.1361083984375, -0.10302734375, -0.0699462890625, -0.036865234375, -0.0037841796875, 0.029296875, 0.0623779296875, 0.095458984375, 0.1285400390625, 0.16162109375, 0.1947021484375, 0.227783203125, 0.2608642578125, 0.2939453125, 0.3270263671875, 0.360107421875, 0.3931884765625, 0.42626953125, 0.4593505859375, 0.492431640625, 0.5255126953125, 0.55859375, 0.5916748046875, 0.624755859375, 0.6578369140625, 0.69091796875, 0.7239990234375, 0.757080078125, 0.7901611328125, 0.8232421875, 0.8563232421875, 0.889404296875, 0.9224853515625, 0.95556640625, 0.9886474609375, 1.021728515625, 1.0548095703125, 1.087890625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 4.0, 3.0, 6.0, 16.0, 9.0, 11.0, 13.0, 10.0, 13.0, 13.0, 22.0, 17.0, 26.0, 16.0, 30.0, 29.0, 29.0, 33.0, 26.0, 36.0, 25.0, 29.0, 34.0, 1060.0, 50.0, 34.0, 48.0, 32.0, 33.0, 36.0, 35.0, 33.0, 31.0, 21.0, 23.0, 27.0, 14.0, 13.0, 15.0, 18.0, 10.0, 8.0, 6.0, 7.0, 8.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.890625, -4.74102783203125, -4.5914306640625, -4.44183349609375, -4.292236328125, -4.14263916015625, -3.9930419921875, -3.84344482421875, -3.69384765625, -3.54425048828125, -3.3946533203125, -3.24505615234375, -3.095458984375, -2.94586181640625, -2.7962646484375, -2.64666748046875, -2.4970703125, -2.34747314453125, -2.1978759765625, -2.04827880859375, -1.898681640625, -1.74908447265625, -1.5994873046875, -1.44989013671875, -1.30029296875, -1.15069580078125, -1.0010986328125, -0.85150146484375, -0.701904296875, -0.55230712890625, -0.4027099609375, -0.25311279296875, -0.103515625, 0.04608154296875, 0.1956787109375, 0.34527587890625, 0.494873046875, 0.64447021484375, 0.7940673828125, 0.94366455078125, 1.09326171875, 1.24285888671875, 1.3924560546875, 1.54205322265625, 1.691650390625, 1.84124755859375, 1.9908447265625, 2.14044189453125, 2.2900390625, 2.43963623046875, 2.5892333984375, 2.73883056640625, 2.888427734375, 3.03802490234375, 3.1876220703125, 3.33721923828125, 3.48681640625, 3.63641357421875, 3.7860107421875, 3.93560791015625, 4.085205078125, 4.23480224609375, 4.3843994140625, 4.53399658203125, 4.68359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 14.0, 12.0, 21.0, 20.0, 31.0, 35.0, 42.0, 62.0, 105.0, 110.0, 178.0, 229.0, 344.0, 472.0, 692.0, 1011.0, 1470.0, 2202.0, 3320.0, 5525.0, 9103.0, 15243.0, 29444.0, 124621.0, 1754176.0, 85470.0, 25982.0, 14160.0, 8179.0, 5070.0, 3278.0, 2102.0, 1337.0, 937.0, 641.0, 430.0, 283.0, 223.0, 159.0, 105.0, 68.0, 69.0, 46.0, 26.0, 20.0, 16.0, 12.0, 12.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-1.732421875, -1.678985595703125, -1.62554931640625, -1.572113037109375, -1.5186767578125, -1.465240478515625, -1.41180419921875, -1.358367919921875, -1.304931640625, -1.251495361328125, -1.19805908203125, -1.144622802734375, -1.0911865234375, -1.037750244140625, -0.98431396484375, -0.930877685546875, -0.87744140625, -0.824005126953125, -0.77056884765625, -0.717132568359375, -0.6636962890625, -0.610260009765625, -0.55682373046875, -0.503387451171875, -0.449951171875, -0.396514892578125, -0.34307861328125, -0.289642333984375, -0.2362060546875, -0.182769775390625, -0.12933349609375, -0.075897216796875, -0.0224609375, 0.030975341796875, 0.08441162109375, 0.137847900390625, 0.1912841796875, 0.244720458984375, 0.29815673828125, 0.351593017578125, 0.405029296875, 0.458465576171875, 0.51190185546875, 0.565338134765625, 0.6187744140625, 0.672210693359375, 0.72564697265625, 0.779083251953125, 0.83251953125, 0.885955810546875, 0.93939208984375, 0.992828369140625, 1.0462646484375, 1.099700927734375, 1.15313720703125, 1.206573486328125, 1.260009765625, 1.313446044921875, 1.36688232421875, 1.420318603515625, 1.4737548828125, 1.527191162109375, 1.58062744140625, 1.634063720703125, 1.6875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 3.0, 16.0, 17.0, 15.0, 21.0, 15.0, 26.0, 37.0, 36.0, 40.0, 56.0, 70.0, 50.0, 70.0, 66.0, 67.0, 57.0, 43.0, 40.0, 53.0, 38.0, 29.0, 23.0, 17.0, 19.0, 16.0, 7.0, 8.0, 6.0, 8.0, 7.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08026123046875, -0.07768058776855469, -0.07509994506835938, -0.07251930236816406, -0.06993865966796875, -0.06735801696777344, -0.06477737426757812, -0.06219673156738281, -0.0596160888671875, -0.05703544616699219, -0.054454803466796875, -0.05187416076660156, -0.04929351806640625, -0.04671287536621094, -0.044132232666015625, -0.04155158996582031, -0.038970947265625, -0.03639030456542969, -0.033809661865234375, -0.031229019165039062, -0.02864837646484375, -0.026067733764648438, -0.023487091064453125, -0.020906448364257812, -0.0183258056640625, -0.015745162963867188, -0.013164520263671875, -0.010583877563476562, -0.00800323486328125, -0.0054225921630859375, -0.002841949462890625, -0.0002613067626953125, 0.0023193359375, 0.0048999786376953125, 0.007480621337890625, 0.010061264038085938, 0.01264190673828125, 0.015222549438476562, 0.017803192138671875, 0.020383834838867188, 0.0229644775390625, 0.025545120239257812, 0.028125762939453125, 0.030706405639648438, 0.03328704833984375, 0.03586769104003906, 0.038448333740234375, 0.04102897644042969, 0.043609619140625, 0.04619026184082031, 0.048770904541015625, 0.05135154724121094, 0.05393218994140625, 0.05651283264160156, 0.059093475341796875, 0.06167411804199219, 0.0642547607421875, 0.06683540344238281, 0.06941604614257812, 0.07199668884277344, 0.07457733154296875, 0.07715797424316406, 0.07973861694335938, 0.08231925964355469, 0.08489990234375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 5.0, 17.0, 14.0, 21.0, 23.0, 33.0, 47.0, 87.0, 87.0, 163.0, 267.0, 892.0, 20978.0, 969129.0, 54514.0, 1421.0, 322.0, 152.0, 102.0, 72.0, 50.0, 35.0, 23.0, 21.0, 15.0, 13.0, 9.0, 7.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6259765625, -1.5760955810546875, -1.526214599609375, -1.4763336181640625, -1.42645263671875, -1.3765716552734375, -1.326690673828125, -1.2768096923828125, -1.2269287109375, -1.1770477294921875, -1.127166748046875, -1.0772857666015625, -1.02740478515625, -0.9775238037109375, -0.927642822265625, -0.8777618408203125, -0.827880859375, -0.7779998779296875, -0.728118896484375, -0.6782379150390625, -0.62835693359375, -0.5784759521484375, -0.528594970703125, -0.4787139892578125, -0.4288330078125, -0.3789520263671875, -0.329071044921875, -0.2791900634765625, -0.22930908203125, -0.1794281005859375, -0.129547119140625, -0.0796661376953125, -0.02978515625, 0.0200958251953125, 0.069976806640625, 0.1198577880859375, 0.16973876953125, 0.2196197509765625, 0.269500732421875, 0.3193817138671875, 0.3692626953125, 0.4191436767578125, 0.469024658203125, 0.5189056396484375, 0.56878662109375, 0.6186676025390625, 0.668548583984375, 0.7184295654296875, 0.768310546875, 0.8181915283203125, 0.868072509765625, 0.9179534912109375, 0.96783447265625, 1.0177154541015625, 1.067596435546875, 1.1174774169921875, 1.1673583984375, 1.2172393798828125, 1.267120361328125, 1.3170013427734375, 1.36688232421875, 1.4167633056640625, 1.466644287109375, 1.5165252685546875, 1.56640625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 12.0, 59.0, 302.0, 446.0, 158.0, 29.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08715160191059113, -0.06665345281362534, -0.046155307441949844, -0.025657162070274353, -0.005159012973308563, 0.015339136123657227, 0.03583727777004242, 0.056335434317588806, 0.076833575963974, 0.09733172506093979, 0.11782987415790558, 0.13832801580429077, 0.15882617235183716, 0.17932431399822235, 0.19982245564460754, 0.22032061219215393, 0.24081875383853912, 0.2613168954849243, 0.2818150520324707, 0.3023132085800171, 0.3228113353252411, 0.3433094918727875, 0.3638076186180115, 0.38430577516555786, 0.40480393171310425, 0.42530208826065063, 0.44580021500587463, 0.466298371553421, 0.4867965281009674, 0.5072946548461914, 0.5277928113937378, 0.5482909679412842, 0.5687890648841858, 0.5892872214317322, 0.6097853779792786, 0.6302834749221802, 0.6507816314697266, 0.671279788017273, 0.6917779445648193, 0.7122761011123657, 0.7327742576599121, 0.7532724142074585, 0.7737705707550049, 0.7942687273025513, 0.8147668242454529, 0.8352649807929993, 0.8557631373405457, 0.876261293888092, 0.8967593908309937, 0.91725754737854, 0.9377557039260864, 0.9582538604736328, 0.9787519574165344, 0.9992501139640808, 1.0197482109069824, 1.0402464866638184, 1.0607446432113647, 1.0812427997589111, 1.1017409563064575, 1.122239112854004, 1.1427372694015503, 1.1632354259490967, 1.1837334632873535, 1.2042317390441895, 1.2247297763824463]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 14.0, 15.0, 11.0, 27.0, 32.0, 37.0, 47.0, 59.0, 64.0, 78.0, 90.0, 67.0, 76.0, 77.0, 46.0, 54.0, 56.0, 35.0, 35.0, 26.0, 16.0, 14.0, 6.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.16948360204696655, -0.16351115703582764, -0.15753872692584991, -0.1515662968158722, -0.14559385180473328, -0.13962140679359436, -0.13364897668361664, -0.12767654657363892, -0.1217041015625, -0.11573166400194168, -0.10975922644138336, -0.10378678888082504, -0.09781435132026672, -0.0918419137597084, -0.08586947619915009, -0.07989703863859177, -0.07392460107803345, -0.06795216351747513, -0.06197972595691681, -0.05600728839635849, -0.05003485083580017, -0.04406241327524185, -0.03808997571468353, -0.032117538154125214, -0.026145100593566895, -0.020172663033008575, -0.014200225472450256, -0.008227787911891937, -0.002255350351333618, 0.003717087209224701, 0.00968952476978302, 0.01566196233034134, 0.021634399890899658, 0.027606837451457977, 0.033579275012016296, 0.039551712572574615, 0.045524150133132935, 0.051496587693691254, 0.05746902525424957, 0.06344146281480789, 0.06941390037536621, 0.07538633793592453, 0.08135877549648285, 0.08733121305704117, 0.09330365061759949, 0.0992760881781578, 0.10524852573871613, 0.11122096329927444, 0.11719340085983276, 0.12316583842039108, 0.1291382759809494, 0.13511070609092712, 0.14108315110206604, 0.14705559611320496, 0.15302802622318268, 0.1590004563331604, 0.16497290134429932, 0.17094534635543823, 0.17691777646541595, 0.18289020657539368, 0.1888626515865326, 0.1948350965976715, 0.20080752670764923, 0.20677995681762695, 0.21275240182876587]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 11.0, 5.0, 6.0, 15.0, 13.0, 16.0, 10.0, 25.0, 24.0, 20.0, 34.0, 34.0, 31.0, 50.0, 45.0, 55.0, 55.0, 52.0, 41.0, 38.0, 39.0, 36.0, 52.0, 42.0, 44.0, 34.0, 25.0, 25.0, 25.0, 24.0, 18.0, 20.0, 8.0, 10.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.007568359375, -7.73388671875, -7.460205078125, -7.1865234375, -6.912841796875, -6.63916015625, -6.365478515625, -6.091796875, -5.818115234375, -5.54443359375, -5.270751953125, -4.9970703125, -4.723388671875, -4.44970703125, -4.176025390625, -3.90234375, -3.628662109375, -3.35498046875, -3.081298828125, -2.8076171875, -2.533935546875, -2.26025390625, -1.986572265625, -1.712890625, -1.439208984375, -1.16552734375, -0.891845703125, -0.6181640625, -0.344482421875, -0.07080078125, 0.202880859375, 0.4765625, 0.750244140625, 1.02392578125, 1.297607421875, 1.5712890625, 1.844970703125, 2.11865234375, 2.392333984375, 2.666015625, 2.939697265625, 3.21337890625, 3.487060546875, 3.7607421875, 4.034423828125, 4.30810546875, 4.581787109375, 4.85546875, 5.129150390625, 5.40283203125, 5.676513671875, 5.9501953125, 6.223876953125, 6.49755859375, 6.771240234375, 7.044921875, 7.318603515625, 7.59228515625, 7.865966796875, 8.1396484375, 8.413330078125, 8.68701171875, 8.960693359375, 9.234375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 8.0, 10.0, 15.0, 27.0, 26.0, 29.0, 48.0, 66.0, 104.0, 150.0, 272.0, 527.0, 993.0, 2157.0, 5424.0, 14649.0, 40377.0, 121046.0, 446938.0, 289720.0, 80062.0, 28154.0, 10376.0, 3949.0, 1562.0, 763.0, 393.0, 232.0, 139.0, 105.0, 59.0, 57.0, 25.0, 26.0, 18.0, 13.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.1058349609375, -8.766357421875, -8.4268798828125, -8.08740234375, -7.7479248046875, -7.408447265625, -7.0689697265625, -6.7294921875, -6.3900146484375, -6.050537109375, -5.7110595703125, -5.37158203125, -5.0321044921875, -4.692626953125, -4.3531494140625, -4.013671875, -3.6741943359375, -3.334716796875, -2.9952392578125, -2.65576171875, -2.3162841796875, -1.976806640625, -1.6373291015625, -1.2978515625, -0.9583740234375, -0.618896484375, -0.2794189453125, 0.06005859375, 0.3995361328125, 0.739013671875, 1.0784912109375, 1.41796875, 1.7574462890625, 2.096923828125, 2.4364013671875, 2.77587890625, 3.1153564453125, 3.454833984375, 3.7943115234375, 4.1337890625, 4.4732666015625, 4.812744140625, 5.1522216796875, 5.49169921875, 5.8311767578125, 6.170654296875, 6.5101318359375, 6.849609375, 7.1890869140625, 7.528564453125, 7.8680419921875, 8.20751953125, 8.5469970703125, 8.886474609375, 9.2259521484375, 9.5654296875, 9.9049072265625, 10.244384765625, 10.5838623046875, 10.92333984375, 11.2628173828125, 11.602294921875, 11.9417724609375, 12.28125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 12.0, 7.0, 18.0, 27.0, 35.0, 24.0, 21.0, 38.0, 41.0, 51.0, 52.0, 81.0, 114.0, 331.0, 1474.0, 168.0, 89.0, 61.0, 57.0, 44.0, 45.0, 35.0, 32.0, 34.0, 24.0, 21.0, 21.0, 12.0, 14.0, 10.0, 3.0, 11.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.296875, -25.453857421875, -24.61083984375, -23.767822265625, -22.9248046875, -22.081787109375, -21.23876953125, -20.395751953125, -19.552734375, -18.709716796875, -17.86669921875, -17.023681640625, -16.1806640625, -15.337646484375, -14.49462890625, -13.651611328125, -12.80859375, -11.965576171875, -11.12255859375, -10.279541015625, -9.4365234375, -8.593505859375, -7.75048828125, -6.907470703125, -6.064453125, -5.221435546875, -4.37841796875, -3.535400390625, -2.6923828125, -1.849365234375, -1.00634765625, -0.163330078125, 0.6796875, 1.522705078125, 2.36572265625, 3.208740234375, 4.0517578125, 4.894775390625, 5.73779296875, 6.580810546875, 7.423828125, 8.266845703125, 9.10986328125, 9.952880859375, 10.7958984375, 11.638916015625, 12.48193359375, 13.324951171875, 14.16796875, 15.010986328125, 15.85400390625, 16.697021484375, 17.5400390625, 18.383056640625, 19.22607421875, 20.069091796875, 20.912109375, 21.755126953125, 22.59814453125, 23.441162109375, 24.2841796875, 25.127197265625, 25.97021484375, 26.813232421875, 27.65625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 12.0, 16.0, 14.0, 18.0, 22.0, 28.0, 36.0, 39.0, 60.0, 93.0, 128.0, 254.0, 553.0, 1540.0, 14576.0, 2553993.0, 564720.0, 7491.0, 1080.0, 409.0, 183.0, 123.0, 68.0, 45.0, 33.0, 34.0, 32.0, 21.0, 11.0, 10.0, 12.0, 6.0, 8.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.4765625, -62.515625, -60.5546875, -58.59375, -56.6328125, -54.671875, -52.7109375, -50.75, -48.7890625, -46.828125, -44.8671875, -42.90625, -40.9453125, -38.984375, -37.0234375, -35.0625, -33.1015625, -31.140625, -29.1796875, -27.21875, -25.2578125, -23.296875, -21.3359375, -19.375, -17.4140625, -15.453125, -13.4921875, -11.53125, -9.5703125, -7.609375, -5.6484375, -3.6875, -1.7265625, 0.234375, 2.1953125, 4.15625, 6.1171875, 8.078125, 10.0390625, 12.0, 13.9609375, 15.921875, 17.8828125, 19.84375, 21.8046875, 23.765625, 25.7265625, 27.6875, 29.6484375, 31.609375, 33.5703125, 35.53125, 37.4921875, 39.453125, 41.4140625, 43.375, 45.3359375, 47.296875, 49.2578125, 51.21875, 53.1796875, 55.140625, 57.1015625, 59.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 110.0, 747.0, 160.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.42375946044922, -61.06727600097656, -51.71078872680664, -42.35430145263672, -32.99781799316406, -23.641334533691406, -14.284847259521484, -4.9283599853515625, 4.428123474121094, 13.784608840942383, 23.141094207763672, 32.497581481933594, 41.85406494140625, 51.210548400878906, 60.56703567504883, 69.92352294921875, 79.2800064086914, 88.63648986816406, 97.99298095703125, 107.3494644165039, 116.70594787597656, 126.06243133544922, 135.41891479492188, 144.77540588378906, 154.13189697265625, 163.48838806152344, 172.84486389160156, 182.20135498046875, 191.55783081054688, 200.91432189941406, 210.27081298828125, 219.62728881835938, 228.9837646484375, 238.3402557373047, 247.6967315673828, 257.05322265625, 266.4096984863281, 275.76617431640625, 285.1226806640625, 294.4791564941406, 303.83563232421875, 313.1921081542969, 322.5486145019531, 331.90509033203125, 341.2615661621094, 350.6180419921875, 359.97454833984375, 369.3310241699219, 378.6875305175781, 388.04400634765625, 397.4005126953125, 406.7569885253906, 416.11346435546875, 425.469970703125, 434.8264465332031, 444.18292236328125, 453.5394287109375, 462.8959045410156, 472.2524108886719, 481.60888671875, 490.9653625488281, 500.32183837890625, 509.6783447265625, 519.0348510742188, 528.3912963867188]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 5.0, 6.0, 5.0, 13.0, 12.0, 12.0, 13.0, 20.0, 17.0, 25.0, 24.0, 26.0, 35.0, 37.0, 36.0, 39.0, 38.0, 48.0, 35.0, 47.0, 44.0, 41.0, 41.0, 49.0, 37.0, 33.0, 31.0, 39.0, 29.0, 20.0, 19.0, 19.0, 20.0, 12.0, 10.0, 8.0, 9.0, 8.0, 6.0, 3.0, 11.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-74.2867202758789, -72.10053253173828, -69.91433715820312, -67.7281494140625, -65.54195404052734, -63.35576629638672, -61.16957473754883, -58.98338317871094, -56.79719161987305, -54.611000061035156, -52.424808502197266, -50.238616943359375, -48.05242919921875, -45.866233825683594, -43.68004608154297, -41.49385452270508, -39.30766296386719, -37.1214714050293, -34.935279846191406, -32.749088287353516, -30.562898635864258, -28.376707077026367, -26.19051742553711, -24.00432586669922, -21.818134307861328, -19.631942749023438, -17.445751190185547, -15.259561538696289, -13.073369979858398, -10.887178421020508, -8.700987815856934, -6.514797210693359, -4.3285980224609375, -2.142406940460205, 0.043784141540527344, 2.2299752235412598, 4.416166305541992, 6.602357864379883, 8.788548469543457, 10.974739074707031, 13.160930633544922, 15.347122192382812, 17.533313751220703, 19.71950340270996, 21.90569496154785, 24.091886520385742, 26.278076171875, 28.46426773071289, 30.65045928955078, 32.83665084838867, 35.02284240722656, 37.20903396606445, 39.395225524902344, 41.58141326904297, 43.76760482788086, 45.95379638671875, 48.13998794555664, 50.32617950439453, 52.51237106323242, 54.69856262207031, 56.88475036621094, 59.070945739746094, 61.25713348388672, 63.44332504272461, 65.6295166015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 10.0, 5.0, 12.0, 12.0, 13.0, 5.0, 12.0, 20.0, 17.0, 24.0, 24.0, 27.0, 40.0, 34.0, 37.0, 40.0, 48.0, 52.0, 40.0, 41.0, 48.0, 34.0, 43.0, 51.0, 30.0, 47.0, 27.0, 32.0, 31.0, 25.0, 18.0, 18.0, 21.0, 17.0, 15.0, 15.0, 10.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.88671875, -7.61322021484375, -7.3397216796875, -7.06622314453125, -6.792724609375, -6.51922607421875, -6.2457275390625, -5.97222900390625, -5.69873046875, -5.42523193359375, -5.1517333984375, -4.87823486328125, -4.604736328125, -4.33123779296875, -4.0577392578125, -3.78424072265625, -3.5107421875, -3.23724365234375, -2.9637451171875, -2.69024658203125, -2.416748046875, -2.14324951171875, -1.8697509765625, -1.59625244140625, -1.32275390625, -1.04925537109375, -0.7757568359375, -0.50225830078125, -0.228759765625, 0.04473876953125, 0.3182373046875, 0.59173583984375, 0.865234375, 1.13873291015625, 1.4122314453125, 1.68572998046875, 1.959228515625, 2.23272705078125, 2.5062255859375, 2.77972412109375, 3.05322265625, 3.32672119140625, 3.6002197265625, 3.87371826171875, 4.147216796875, 4.42071533203125, 4.6942138671875, 4.96771240234375, 5.2412109375, 5.51470947265625, 5.7882080078125, 6.06170654296875, 6.335205078125, 6.60870361328125, 6.8822021484375, 7.15570068359375, 7.42919921875, 7.70269775390625, 7.9761962890625, 8.24969482421875, 8.523193359375, 8.79669189453125, 9.0701904296875, 9.34368896484375, 9.6171875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 5.0, 12.0, 9.0, 21.0, 41.0, 53.0, 68.0, 106.0, 181.0, 321.0, 651.0, 1225.0, 2614.0, 6325.0, 20317.0, 130145.0, 2117659.0, 1776099.0, 108833.0, 18770.0, 6000.0, 2432.0, 1140.0, 529.0, 296.0, 175.0, 95.0, 50.0, 33.0, 26.0, 14.0, 12.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0], "bins": [-37.9375, -37.054443359375, -36.17138671875, -35.288330078125, -34.4052734375, -33.522216796875, -32.63916015625, -31.756103515625, -30.873046875, -29.989990234375, -29.10693359375, -28.223876953125, -27.3408203125, -26.457763671875, -25.57470703125, -24.691650390625, -23.80859375, -22.925537109375, -22.04248046875, -21.159423828125, -20.2763671875, -19.393310546875, -18.51025390625, -17.627197265625, -16.744140625, -15.861083984375, -14.97802734375, -14.094970703125, -13.2119140625, -12.328857421875, -11.44580078125, -10.562744140625, -9.6796875, -8.796630859375, -7.91357421875, -7.030517578125, -6.1474609375, -5.264404296875, -4.38134765625, -3.498291015625, -2.615234375, -1.732177734375, -0.84912109375, 0.033935546875, 0.9169921875, 1.800048828125, 2.68310546875, 3.566162109375, 4.44921875, 5.332275390625, 6.21533203125, 7.098388671875, 7.9814453125, 8.864501953125, 9.74755859375, 10.630615234375, 11.513671875, 12.396728515625, 13.27978515625, 14.162841796875, 15.0458984375, 15.928955078125, 16.81201171875, 17.695068359375, 18.578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 8.0, 4.0, 8.0, 9.0, 18.0, 31.0, 28.0, 38.0, 60.0, 73.0, 114.0, 135.0, 240.0, 369.0, 502.0, 635.0, 579.0, 418.0, 274.0, 155.0, 95.0, 55.0, 58.0, 39.0, 28.0, 21.0, 14.0, 11.0, 9.0, 9.0, 12.0, 6.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.71875, -22.1165771484375, -21.514404296875, -20.9122314453125, -20.31005859375, -19.7078857421875, -19.105712890625, -18.5035400390625, -17.9013671875, -17.2991943359375, -16.697021484375, -16.0948486328125, -15.49267578125, -14.8905029296875, -14.288330078125, -13.6861572265625, -13.083984375, -12.4818115234375, -11.879638671875, -11.2774658203125, -10.67529296875, -10.0731201171875, -9.470947265625, -8.8687744140625, -8.2666015625, -7.6644287109375, -7.062255859375, -6.4600830078125, -5.85791015625, -5.2557373046875, -4.653564453125, -4.0513916015625, -3.44921875, -2.8470458984375, -2.244873046875, -1.6427001953125, -1.04052734375, -0.4383544921875, 0.163818359375, 0.7659912109375, 1.3681640625, 1.9703369140625, 2.572509765625, 3.1746826171875, 3.77685546875, 4.3790283203125, 4.981201171875, 5.5833740234375, 6.185546875, 6.7877197265625, 7.389892578125, 7.9920654296875, 8.59423828125, 9.1964111328125, 9.798583984375, 10.4007568359375, 11.0029296875, 11.6051025390625, 12.207275390625, 12.8094482421875, 13.41162109375, 14.0137939453125, 14.615966796875, 15.2181396484375, 15.8203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 2.0, 7.0, 4.0, 2.0, 12.0, 16.0, 11.0, 15.0, 24.0, 37.0, 47.0, 103.0, 160.0, 300.0, 785.0, 2264.0, 8281.0, 46988.0, 1614891.0, 2449768.0, 56643.0, 9668.0, 2592.0, 785.0, 364.0, 174.0, 114.0, 65.0, 54.0, 32.0, 24.0, 12.0, 10.0, 8.0, 7.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0625, -52.134765625, -50.20703125, -48.279296875, -46.3515625, -44.423828125, -42.49609375, -40.568359375, -38.640625, -36.712890625, -34.78515625, -32.857421875, -30.9296875, -29.001953125, -27.07421875, -25.146484375, -23.21875, -21.291015625, -19.36328125, -17.435546875, -15.5078125, -13.580078125, -11.65234375, -9.724609375, -7.796875, -5.869140625, -3.94140625, -2.013671875, -0.0859375, 1.841796875, 3.76953125, 5.697265625, 7.625, 9.552734375, 11.48046875, 13.408203125, 15.3359375, 17.263671875, 19.19140625, 21.119140625, 23.046875, 24.974609375, 26.90234375, 28.830078125, 30.7578125, 32.685546875, 34.61328125, 36.541015625, 38.46875, 40.396484375, 42.32421875, 44.251953125, 46.1796875, 48.107421875, 50.03515625, 51.962890625, 53.890625, 55.818359375, 57.74609375, 59.673828125, 61.6015625, 63.529296875, 65.45703125, 67.384765625, 69.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 46.0, 409.0, 471.0, 80.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-403.4555969238281, -387.406494140625, -371.357421875, -355.3083190917969, -339.25921630859375, -323.2101135253906, -307.1610107421875, -291.1119384765625, -275.0628356933594, -259.01373291015625, -242.9646453857422, -226.91555786132812, -210.866455078125, -194.81735229492188, -178.7682647705078, -162.71917724609375, -146.67007446289062, -130.6209716796875, -114.57188415527344, -98.52278900146484, -82.47369384765625, -66.42459869384766, -50.37550354003906, -34.32640838623047, -18.277313232421875, -2.2282180786132812, 13.820877075195312, 29.869972229003906, 45.9190673828125, 61.968162536621094, 78.01725769042969, 94.06635284423828, 110.115478515625, 126.1645736694336, 142.2136688232422, 158.26275634765625, 174.31185913085938, 190.3609619140625, 206.41004943847656, 222.45913696289062, 238.50823974609375, 254.55734252929688, 270.6064453125, 286.655517578125, 302.7046203613281, 318.75372314453125, 334.80279541015625, 350.8518981933594, 366.9010009765625, 382.9501037597656, 398.99920654296875, 415.04827880859375, 431.0973815917969, 447.146484375, 463.195556640625, 479.2446594238281, 495.29376220703125, 511.3428649902344, 527.3919677734375, 543.4410400390625, 559.4901123046875, 575.5392456054688, 591.5883178710938, 607.637451171875, 623.6865234375]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 3.0, 7.0, 12.0, 7.0, 13.0, 10.0, 15.0, 13.0, 18.0, 14.0, 19.0, 19.0, 23.0, 28.0, 23.0, 22.0, 30.0, 37.0, 34.0, 41.0, 30.0, 45.0, 34.0, 40.0, 33.0, 36.0, 34.0, 34.0, 41.0, 27.0, 25.0, 33.0, 21.0, 23.0, 25.0, 24.0, 15.0, 15.0, 12.0, 5.0, 7.0, 13.0, 3.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0], "bins": [-55.256431579589844, -53.6898078918457, -52.1231803894043, -50.556556701660156, -48.989933013916016, -47.42330551147461, -45.85668182373047, -44.29005432128906, -42.72343063354492, -41.15680694580078, -39.590179443359375, -38.023555755615234, -36.456932067871094, -34.89030456542969, -33.32368087768555, -31.757055282592773, -30.190431594848633, -28.62380599975586, -27.05718231201172, -25.490556716918945, -23.923931121826172, -22.35730743408203, -20.790681838989258, -19.224056243896484, -17.657432556152344, -16.09080696105957, -14.524182319641113, -12.957557678222656, -11.390932083129883, -9.824307441711426, -8.257682800292969, -6.691057205200195, -5.124431610107422, -3.5578064918518066, -1.9911816120147705, -0.4245567321777344, 1.1420683860778809, 2.708693504333496, 4.275318145751953, 5.841943740844727, 7.408568382263184, 8.97519302368164, 10.541818618774414, 12.108443260192871, 13.675067901611328, 15.241693496704102, 16.808319091796875, 18.374942779541016, 19.94156837463379, 21.508193969726562, 23.074817657470703, 24.641443252563477, 26.20806884765625, 27.77469253540039, 29.341318130493164, 30.907943725585938, 32.47456741333008, 34.04119110107422, 35.607818603515625, 37.174442291259766, 38.741065979003906, 40.30769348144531, 41.87431716918945, 43.440940856933594, 45.007568359375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 6.0, 15.0, 16.0, 17.0, 19.0, 33.0, 27.0, 37.0, 24.0, 56.0, 67.0, 59.0, 64.0, 62.0, 51.0, 57.0, 58.0, 48.0, 40.0, 40.0, 39.0, 37.0, 27.0, 24.0, 18.0, 10.0, 8.0, 14.0, 7.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.3203125, -12.97998046875, -12.6396484375, -12.29931640625, -11.958984375, -11.61865234375, -11.2783203125, -10.93798828125, -10.59765625, -10.25732421875, -9.9169921875, -9.57666015625, -9.236328125, -8.89599609375, -8.5556640625, -8.21533203125, -7.875, -7.53466796875, -7.1943359375, -6.85400390625, -6.513671875, -6.17333984375, -5.8330078125, -5.49267578125, -5.15234375, -4.81201171875, -4.4716796875, -4.13134765625, -3.791015625, -3.45068359375, -3.1103515625, -2.77001953125, -2.4296875, -2.08935546875, -1.7490234375, -1.40869140625, -1.068359375, -0.72802734375, -0.3876953125, -0.04736328125, 0.29296875, 0.63330078125, 0.9736328125, 1.31396484375, 1.654296875, 1.99462890625, 2.3349609375, 2.67529296875, 3.015625, 3.35595703125, 3.6962890625, 4.03662109375, 4.376953125, 4.71728515625, 5.0576171875, 5.39794921875, 5.73828125, 6.07861328125, 6.4189453125, 6.75927734375, 7.099609375, 7.43994140625, 7.7802734375, 8.12060546875, 8.4609375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 2.0, 5.0, 13.0, 21.0, 20.0, 43.0, 72.0, 119.0, 160.0, 216.0, 363.0, 615.0, 1000.0, 1617.0, 2853.0, 4778.0, 8124.0, 14521.0, 27110.0, 51865.0, 98489.0, 173455.0, 235347.0, 189244.0, 110789.0, 58458.0, 30577.0, 16536.0, 9191.0, 5221.0, 3088.0, 1767.0, 1081.0, 672.0, 406.0, 253.0, 145.0, 109.0, 74.0, 27.0, 25.0, 20.0, 19.0, 11.0, 12.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-1.2314453125, -1.19366455078125, -1.1558837890625, -1.11810302734375, -1.080322265625, -1.04254150390625, -1.0047607421875, -0.96697998046875, -0.92919921875, -0.89141845703125, -0.8536376953125, -0.81585693359375, -0.778076171875, -0.74029541015625, -0.7025146484375, -0.66473388671875, -0.626953125, -0.58917236328125, -0.5513916015625, -0.51361083984375, -0.475830078125, -0.43804931640625, -0.4002685546875, -0.36248779296875, -0.32470703125, -0.28692626953125, -0.2491455078125, -0.21136474609375, -0.173583984375, -0.13580322265625, -0.0980224609375, -0.06024169921875, -0.0224609375, 0.01531982421875, 0.0531005859375, 0.09088134765625, 0.128662109375, 0.16644287109375, 0.2042236328125, 0.24200439453125, 0.27978515625, 0.31756591796875, 0.3553466796875, 0.39312744140625, 0.430908203125, 0.46868896484375, 0.5064697265625, 0.54425048828125, 0.58203125, 0.61981201171875, 0.6575927734375, 0.69537353515625, 0.733154296875, 0.77093505859375, 0.8087158203125, 0.84649658203125, 0.88427734375, 0.92205810546875, 0.9598388671875, 0.99761962890625, 1.035400390625, 1.07318115234375, 1.1109619140625, 1.14874267578125, 1.1865234375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 4.0, 6.0, 11.0, 12.0, 8.0, 15.0, 18.0, 16.0, 21.0, 25.0, 33.0, 35.0, 30.0, 41.0, 45.0, 44.0, 57.0, 42.0, 1059.0, 53.0, 40.0, 38.0, 50.0, 38.0, 38.0, 36.0, 34.0, 27.0, 22.0, 21.0, 16.0, 16.0, 15.0, 10.0, 13.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.26171875, -6.065185546875, -5.86865234375, -5.672119140625, -5.4755859375, -5.279052734375, -5.08251953125, -4.885986328125, -4.689453125, -4.492919921875, -4.29638671875, -4.099853515625, -3.9033203125, -3.706787109375, -3.51025390625, -3.313720703125, -3.1171875, -2.920654296875, -2.72412109375, -2.527587890625, -2.3310546875, -2.134521484375, -1.93798828125, -1.741455078125, -1.544921875, -1.348388671875, -1.15185546875, -0.955322265625, -0.7587890625, -0.562255859375, -0.36572265625, -0.169189453125, 0.02734375, 0.223876953125, 0.42041015625, 0.616943359375, 0.8134765625, 1.010009765625, 1.20654296875, 1.403076171875, 1.599609375, 1.796142578125, 1.99267578125, 2.189208984375, 2.3857421875, 2.582275390625, 2.77880859375, 2.975341796875, 3.171875, 3.368408203125, 3.56494140625, 3.761474609375, 3.9580078125, 4.154541015625, 4.35107421875, 4.547607421875, 4.744140625, 4.940673828125, 5.13720703125, 5.333740234375, 5.5302734375, 5.726806640625, 5.92333984375, 6.119873046875, 6.31640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 15.0, 28.0, 23.0, 29.0, 56.0, 70.0, 91.0, 150.0, 227.0, 307.0, 453.0, 681.0, 930.0, 1418.0, 2123.0, 3549.0, 5780.0, 9497.0, 16974.0, 35945.0, 298676.0, 1620349.0, 50225.0, 20472.0, 11256.0, 6416.0, 3981.0, 2462.0, 1599.0, 1023.0, 766.0, 456.0, 334.0, 237.0, 157.0, 105.0, 77.0, 53.0, 32.0, 31.0, 23.0, 18.0, 13.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7509765625, -1.6947479248046875, -1.638519287109375, -1.5822906494140625, -1.52606201171875, -1.4698333740234375, -1.413604736328125, -1.3573760986328125, -1.3011474609375, -1.2449188232421875, -1.188690185546875, -1.1324615478515625, -1.07623291015625, -1.0200042724609375, -0.963775634765625, -0.9075469970703125, -0.851318359375, -0.7950897216796875, -0.738861083984375, -0.6826324462890625, -0.62640380859375, -0.5701751708984375, -0.513946533203125, -0.4577178955078125, -0.4014892578125, -0.3452606201171875, -0.289031982421875, -0.2328033447265625, -0.17657470703125, -0.1203460693359375, -0.064117431640625, -0.0078887939453125, 0.04833984375, 0.1045684814453125, 0.160797119140625, 0.2170257568359375, 0.27325439453125, 0.3294830322265625, 0.385711669921875, 0.4419403076171875, 0.4981689453125, 0.5543975830078125, 0.610626220703125, 0.6668548583984375, 0.72308349609375, 0.7793121337890625, 0.835540771484375, 0.8917694091796875, 0.947998046875, 1.0042266845703125, 1.060455322265625, 1.1166839599609375, 1.17291259765625, 1.2291412353515625, 1.285369873046875, 1.3415985107421875, 1.3978271484375, 1.4540557861328125, 1.510284423828125, 1.5665130615234375, 1.62274169921875, 1.6789703369140625, 1.735198974609375, 1.7914276123046875, 1.84765625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 11.0, 7.0, 15.0, 15.0, 23.0, 23.0, 39.0, 42.0, 46.0, 41.0, 51.0, 69.0, 80.0, 86.0, 73.0, 71.0, 52.0, 57.0, 50.0, 27.0, 21.0, 21.0, 17.0, 18.0, 12.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09726810455322266, -0.09443855285644531, -0.09160900115966797, -0.08877944946289062, -0.08594989776611328, -0.08312034606933594, -0.0802907943725586, -0.07746124267578125, -0.0746316909790039, -0.07180213928222656, -0.06897258758544922, -0.06614303588867188, -0.06331348419189453, -0.06048393249511719, -0.057654380798339844, -0.0548248291015625, -0.051995277404785156, -0.04916572570800781, -0.04633617401123047, -0.043506622314453125, -0.04067707061767578, -0.03784751892089844, -0.035017967224121094, -0.03218841552734375, -0.029358863830566406, -0.026529312133789062, -0.02369976043701172, -0.020870208740234375, -0.01804065704345703, -0.015211105346679688, -0.012381553649902344, -0.009552001953125, -0.006722450256347656, -0.0038928985595703125, -0.0010633468627929688, 0.001766204833984375, 0.004595756530761719, 0.0074253082275390625, 0.010254859924316406, 0.01308441162109375, 0.015913963317871094, 0.018743515014648438, 0.02157306671142578, 0.024402618408203125, 0.02723217010498047, 0.030061721801757812, 0.032891273498535156, 0.0357208251953125, 0.038550376892089844, 0.04137992858886719, 0.04420948028564453, 0.047039031982421875, 0.04986858367919922, 0.05269813537597656, 0.055527687072753906, 0.05835723876953125, 0.061186790466308594, 0.06401634216308594, 0.06684589385986328, 0.06967544555664062, 0.07250499725341797, 0.07533454895019531, 0.07816410064697266, 0.08099365234375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 7.0, 11.0, 11.0, 11.0, 22.0, 29.0, 31.0, 44.0, 89.0, 133.0, 208.0, 439.0, 6458.0, 821598.0, 216413.0, 2146.0, 335.0, 170.0, 125.0, 80.0, 57.0, 35.0, 21.0, 17.0, 21.0, 10.0, 10.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.447998046875, -1.39599609375, -1.343994140625, -1.2919921875, -1.239990234375, -1.18798828125, -1.135986328125, -1.083984375, -1.031982421875, -0.97998046875, -0.927978515625, -0.8759765625, -0.823974609375, -0.77197265625, -0.719970703125, -0.66796875, -0.615966796875, -0.56396484375, -0.511962890625, -0.4599609375, -0.407958984375, -0.35595703125, -0.303955078125, -0.251953125, -0.199951171875, -0.14794921875, -0.095947265625, -0.0439453125, 0.008056640625, 0.06005859375, 0.112060546875, 0.1640625, 0.216064453125, 0.26806640625, 0.320068359375, 0.3720703125, 0.424072265625, 0.47607421875, 0.528076171875, 0.580078125, 0.632080078125, 0.68408203125, 0.736083984375, 0.7880859375, 0.840087890625, 0.89208984375, 0.944091796875, 0.99609375, 1.048095703125, 1.10009765625, 1.152099609375, 1.2041015625, 1.256103515625, 1.30810546875, 1.360107421875, 1.412109375, 1.464111328125, 1.51611328125, 1.568115234375, 1.6201171875, 1.672119140625, 1.72412109375, 1.776123046875, 1.828125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 17.0, 31.0, 108.0, 365.0, 349.0, 86.0, 35.0, 12.0, 3.0, 4.0, 3.0], "bins": [-1.0827451944351196, -1.0637441873550415, -1.044743299484253, -1.0257422924041748, -1.0067412853240967, -0.9877403974533081, -0.96873939037323, -0.9497384428977966, -0.9307374954223633, -0.9117365479469299, -0.8927355408668518, -0.8737345933914185, -0.8547336459159851, -0.8357326984405518, -0.8167316913604736, -0.7977307438850403, -0.7787297964096069, -0.7597288489341736, -0.7407278418540955, -0.7217268943786621, -0.7027259469032288, -0.6837249994277954, -0.6647239923477173, -0.6457230448722839, -0.6267220377922058, -0.6077210903167725, -0.5887200832366943, -0.569719135761261, -0.5507181882858276, -0.5317172408103943, -0.5127162337303162, -0.4937152862548828, -0.47471436858177185, -0.4557133913040161, -0.43671244382858276, -0.417711466550827, -0.3987105190753937, -0.37970954179763794, -0.3607085943222046, -0.34170761704444885, -0.3227066397666931, -0.3037056624889374, -0.28470471501350403, -0.2657037377357483, -0.24670279026031494, -0.2277018129825592, -0.20870085060596466, -0.18969988822937012, -0.17069894075393677, -0.15169797837734222, -0.13269701600074768, -0.11369604617357254, -0.094695083796978, -0.07569412142038345, -0.05669315159320831, -0.03769218921661377, -0.018691226840019226, 0.0003097373992204666, 0.01931070163846016, 0.038311667740345, 0.057312630116939545, 0.07631359249353409, 0.09531456232070923, 0.11431552469730377, 0.13331648707389832]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 11.0, 10.0, 8.0, 22.0, 18.0, 18.0, 21.0, 20.0, 22.0, 37.0, 36.0, 47.0, 41.0, 46.0, 50.0, 52.0, 44.0, 60.0, 55.0, 38.0, 31.0, 44.0, 26.0, 43.0, 36.0, 26.0, 19.0, 19.0, 15.0, 13.0, 10.0, 12.0, 11.0, 4.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08637356758117676, -0.08362570405006409, -0.08087784051895142, -0.07812998443841934, -0.07538212090730667, -0.072634257376194, -0.06988640129566193, -0.06713853776454926, -0.06439067423343658, -0.061642810702323914, -0.05889495089650154, -0.05614709109067917, -0.0533992275595665, -0.05065136402845383, -0.047903504222631454, -0.04515564441680908, -0.04240778088569641, -0.03965991735458374, -0.03691205754876137, -0.034164197742938995, -0.031416334211826324, -0.028668472543358803, -0.02592061087489128, -0.02317274920642376, -0.020424887537956238, -0.017677025869488716, -0.014929164201021194, -0.012181302532553673, -0.009433440864086151, -0.0066855791956186295, -0.003937717527151108, -0.0011898558586835861, 0.0015580058097839355, 0.004305867478251457, 0.007053729146718979, 0.0098015908151865, 0.012549452483654022, 0.015297314152121544, 0.018045175820589066, 0.020793037489056587, 0.02354089915752411, 0.02628876082599163, 0.029036622494459152, 0.031784482300281525, 0.034532345831394196, 0.037280209362506866, 0.04002806916832924, 0.04277592897415161, 0.04552379250526428, 0.04827165603637695, 0.051019515842199326, 0.0537673756480217, 0.05651523917913437, 0.05926310271024704, 0.06201096251606941, 0.06475882232189178, 0.06750668585300446, 0.07025454938411713, 0.0730024129152298, 0.07575026899576187, 0.07849813252687454, 0.08124599605798721, 0.08399385213851929, 0.08674171566963196, 0.08948957920074463]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 6.0, 15.0, 17.0, 16.0, 20.0, 32.0, 27.0, 37.0, 24.0, 57.0, 66.0, 61.0, 63.0, 61.0, 51.0, 57.0, 58.0, 48.0, 42.0, 38.0, 39.0, 38.0, 28.0, 22.0, 18.0, 10.0, 8.0, 14.0, 10.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.3203125, -12.9798583984375, -12.639404296875, -12.2989501953125, -11.95849609375, -11.6180419921875, -11.277587890625, -10.9371337890625, -10.5966796875, -10.2562255859375, -9.915771484375, -9.5753173828125, -9.23486328125, -8.8944091796875, -8.553955078125, -8.2135009765625, -7.873046875, -7.5325927734375, -7.192138671875, -6.8516845703125, -6.51123046875, -6.1707763671875, -5.830322265625, -5.4898681640625, -5.1494140625, -4.8089599609375, -4.468505859375, -4.1280517578125, -3.78759765625, -3.4471435546875, -3.106689453125, -2.7662353515625, -2.42578125, -2.0853271484375, -1.744873046875, -1.4044189453125, -1.06396484375, -0.7235107421875, -0.383056640625, -0.0426025390625, 0.2978515625, 0.6383056640625, 0.978759765625, 1.3192138671875, 1.65966796875, 2.0001220703125, 2.340576171875, 2.6810302734375, 3.021484375, 3.3619384765625, 3.702392578125, 4.0428466796875, 4.38330078125, 4.7237548828125, 5.064208984375, 5.4046630859375, 5.7451171875, 6.0855712890625, 6.426025390625, 6.7664794921875, 7.10693359375, 7.4473876953125, 7.787841796875, 8.1282958984375, 8.46875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 12.0, 15.0, 33.0, 74.0, 109.0, 281.0, 466.0, 1013.0, 2016.0, 4369.0, 10548.0, 31295.0, 131141.0, 575216.0, 222347.0, 45003.0, 14219.0, 5484.0, 2464.0, 1209.0, 581.0, 301.0, 132.0, 81.0, 45.0, 29.0, 14.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.078125, -23.4384765625, -22.798828125, -22.1591796875, -21.51953125, -20.8798828125, -20.240234375, -19.6005859375, -18.9609375, -18.3212890625, -17.681640625, -17.0419921875, -16.40234375, -15.7626953125, -15.123046875, -14.4833984375, -13.84375, -13.2041015625, -12.564453125, -11.9248046875, -11.28515625, -10.6455078125, -10.005859375, -9.3662109375, -8.7265625, -8.0869140625, -7.447265625, -6.8076171875, -6.16796875, -5.5283203125, -4.888671875, -4.2490234375, -3.609375, -2.9697265625, -2.330078125, -1.6904296875, -1.05078125, -0.4111328125, 0.228515625, 0.8681640625, 1.5078125, 2.1474609375, 2.787109375, 3.4267578125, 4.06640625, 4.7060546875, 5.345703125, 5.9853515625, 6.625, 7.2646484375, 7.904296875, 8.5439453125, 9.18359375, 9.8232421875, 10.462890625, 11.1025390625, 11.7421875, 12.3818359375, 13.021484375, 13.6611328125, 14.30078125, 14.9404296875, 15.580078125, 16.2197265625, 16.859375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 7.0, 14.0, 9.0, 6.0, 23.0, 13.0, 17.0, 28.0, 32.0, 41.0, 42.0, 63.0, 62.0, 80.0, 142.0, 294.0, 1456.0, 203.0, 106.0, 61.0, 51.0, 35.0, 35.0, 39.0, 29.0, 16.0, 20.0, 21.0, 19.0, 11.0, 8.0, 11.0, 7.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.203125, -26.333251953125, -25.46337890625, -24.593505859375, -23.7236328125, -22.853759765625, -21.98388671875, -21.114013671875, -20.244140625, -19.374267578125, -18.50439453125, -17.634521484375, -16.7646484375, -15.894775390625, -15.02490234375, -14.155029296875, -13.28515625, -12.415283203125, -11.54541015625, -10.675537109375, -9.8056640625, -8.935791015625, -8.06591796875, -7.196044921875, -6.326171875, -5.456298828125, -4.58642578125, -3.716552734375, -2.8466796875, -1.976806640625, -1.10693359375, -0.237060546875, 0.6328125, 1.502685546875, 2.37255859375, 3.242431640625, 4.1123046875, 4.982177734375, 5.85205078125, 6.721923828125, 7.591796875, 8.461669921875, 9.33154296875, 10.201416015625, 11.0712890625, 11.941162109375, 12.81103515625, 13.680908203125, 14.55078125, 15.420654296875, 16.29052734375, 17.160400390625, 18.0302734375, 18.900146484375, 19.77001953125, 20.639892578125, 21.509765625, 22.379638671875, 23.24951171875, 24.119384765625, 24.9892578125, 25.859130859375, 26.72900390625, 27.598876953125, 28.46875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 5.0, 6.0, 6.0, 10.0, 15.0, 9.0, 7.0, 18.0, 27.0, 28.0, 36.0, 46.0, 78.0, 121.0, 188.0, 304.0, 706.0, 1867.0, 6989.0, 40946.0, 961357.0, 2052586.0, 66353.0, 9702.0, 2414.0, 857.0, 347.0, 224.0, 123.0, 83.0, 60.0, 41.0, 34.0, 22.0, 15.0, 14.0, 8.0, 11.0, 9.0, 8.0, 6.0, 6.0, 1.0, 1.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.90625, -34.751953125, -33.59765625, -32.443359375, -31.2890625, -30.134765625, -28.98046875, -27.826171875, -26.671875, -25.517578125, -24.36328125, -23.208984375, -22.0546875, -20.900390625, -19.74609375, -18.591796875, -17.4375, -16.283203125, -15.12890625, -13.974609375, -12.8203125, -11.666015625, -10.51171875, -9.357421875, -8.203125, -7.048828125, -5.89453125, -4.740234375, -3.5859375, -2.431640625, -1.27734375, -0.123046875, 1.03125, 2.185546875, 3.33984375, 4.494140625, 5.6484375, 6.802734375, 7.95703125, 9.111328125, 10.265625, 11.419921875, 12.57421875, 13.728515625, 14.8828125, 16.037109375, 17.19140625, 18.345703125, 19.5, 20.654296875, 21.80859375, 22.962890625, 24.1171875, 25.271484375, 26.42578125, 27.580078125, 28.734375, 29.888671875, 31.04296875, 32.197265625, 33.3515625, 34.505859375, 35.66015625, 36.814453125, 37.96875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 26.0, 481.0, 495.0, 15.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.3052520751953, -124.83965301513672, -112.37405395507812, -99.90846252441406, -87.44286346435547, -74.97726440429688, -62.51167297363281, -50.04607391357422, -37.580474853515625, -25.114877700805664, -12.649280548095703, -0.183685302734375, 12.281913757324219, 24.747512817382812, 37.213104248046875, 49.67870330810547, 62.14430236816406, 74.60990142822266, 87.07550048828125, 99.54109191894531, 112.0066909790039, 124.4722900390625, 136.93788146972656, 149.40347290039062, 161.86907958984375, 174.3346710205078, 186.80027770996094, 199.265869140625, 211.73147583007812, 224.1970672607422, 236.66265869140625, 249.12826538085938, 261.5938720703125, 274.0594787597656, 286.5250549316406, 298.99066162109375, 311.4562683105469, 323.921875, 336.387451171875, 348.8530578613281, 361.31866455078125, 373.7842712402344, 386.2498474121094, 398.7154541015625, 411.1810607910156, 423.64666748046875, 436.11224365234375, 448.5778503417969, 461.0434265136719, 473.509033203125, 485.974609375, 498.4402160644531, 510.90582275390625, 523.3713989257812, 535.8370361328125, 548.3026123046875, 560.7681884765625, 573.2337646484375, 585.6994018554688, 598.1649780273438, 610.6305541992188, 623.09619140625, 635.561767578125, 648.02734375, 660.4929809570312]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 11.0, 6.0, 12.0, 28.0, 25.0, 23.0, 25.0, 27.0, 25.0, 31.0, 32.0, 43.0, 46.0, 36.0, 42.0, 46.0, 40.0, 61.0, 34.0, 49.0, 39.0, 35.0, 39.0, 35.0, 29.0, 33.0, 17.0, 17.0, 16.0, 16.0, 14.0, 15.0, 7.0, 9.0, 9.0, 5.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.49227142333984, -73.33744812011719, -71.18263244628906, -69.0278091430664, -66.87299346923828, -64.71817016601562, -62.563350677490234, -60.408531188964844, -58.25371170043945, -56.09889221191406, -53.94407272338867, -51.78925323486328, -49.634429931640625, -47.4796142578125, -45.324790954589844, -43.16997146606445, -41.01515197753906, -38.86033248901367, -36.70551300048828, -34.55069351196289, -32.3958740234375, -30.241052627563477, -28.086231231689453, -25.931411743164062, -23.776592254638672, -21.62177276611328, -19.46695327758789, -17.312131881713867, -15.157312393188477, -13.002492904663086, -10.847672462463379, -8.692852020263672, -6.538028717041016, -4.383208751678467, -2.228388786315918, -0.07356882095336914, 2.0812511444091797, 4.23607063293457, 6.390891075134277, 8.545711517333984, 10.700531005859375, 12.855350494384766, 15.010170936584473, 17.16499137878418, 19.31981086730957, 21.47463035583496, 23.629451751708984, 25.784271240234375, 27.939090728759766, 30.093910217285156, 32.24872970581055, 34.40354919433594, 36.558372497558594, 38.71318817138672, 40.868011474609375, 43.022830963134766, 45.177650451660156, 47.33246994018555, 49.48728942871094, 51.64210891723633, 53.79692840576172, 55.951751708984375, 58.106571197509766, 60.261390686035156, 62.41621017456055]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 3.0, 6.0, 5.0, 11.0, 7.0, 17.0, 14.0, 18.0, 17.0, 33.0, 32.0, 40.0, 35.0, 53.0, 42.0, 66.0, 55.0, 46.0, 57.0, 52.0, 45.0, 45.0, 34.0, 49.0, 43.0, 23.0, 33.0, 20.0, 24.0, 22.0, 14.0, 9.0, 9.0, 12.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.1796875, -11.860595703125, -11.54150390625, -11.222412109375, -10.9033203125, -10.584228515625, -10.26513671875, -9.946044921875, -9.626953125, -9.307861328125, -8.98876953125, -8.669677734375, -8.3505859375, -8.031494140625, -7.71240234375, -7.393310546875, -7.07421875, -6.755126953125, -6.43603515625, -6.116943359375, -5.7978515625, -5.478759765625, -5.15966796875, -4.840576171875, -4.521484375, -4.202392578125, -3.88330078125, -3.564208984375, -3.2451171875, -2.926025390625, -2.60693359375, -2.287841796875, -1.96875, -1.649658203125, -1.33056640625, -1.011474609375, -0.6923828125, -0.373291015625, -0.05419921875, 0.264892578125, 0.583984375, 0.903076171875, 1.22216796875, 1.541259765625, 1.8603515625, 2.179443359375, 2.49853515625, 2.817626953125, 3.13671875, 3.455810546875, 3.77490234375, 4.093994140625, 4.4130859375, 4.732177734375, 5.05126953125, 5.370361328125, 5.689453125, 6.008544921875, 6.32763671875, 6.646728515625, 6.9658203125, 7.284912109375, 7.60400390625, 7.923095703125, 8.2421875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 14.0, 22.0, 26.0, 29.0, 58.0, 82.0, 133.0, 239.0, 487.0, 1100.0, 2671.0, 7135.0, 28649.0, 387615.0, 3413556.0, 315404.0, 26131.0, 6504.0, 2370.0, 1005.0, 449.0, 243.0, 121.0, 77.0, 47.0, 42.0, 23.0, 13.0, 8.0, 8.0, 4.0, 1.0, 5.0, 4.0], "bins": [-43.1875, -42.21630859375, -41.2451171875, -40.27392578125, -39.302734375, -38.33154296875, -37.3603515625, -36.38916015625, -35.41796875, -34.44677734375, -33.4755859375, -32.50439453125, -31.533203125, -30.56201171875, -29.5908203125, -28.61962890625, -27.6484375, -26.67724609375, -25.7060546875, -24.73486328125, -23.763671875, -22.79248046875, -21.8212890625, -20.85009765625, -19.87890625, -18.90771484375, -17.9365234375, -16.96533203125, -15.994140625, -15.02294921875, -14.0517578125, -13.08056640625, -12.109375, -11.13818359375, -10.1669921875, -9.19580078125, -8.224609375, -7.25341796875, -6.2822265625, -5.31103515625, -4.33984375, -3.36865234375, -2.3974609375, -1.42626953125, -0.455078125, 0.51611328125, 1.4873046875, 2.45849609375, 3.4296875, 4.40087890625, 5.3720703125, 6.34326171875, 7.314453125, 8.28564453125, 9.2568359375, 10.22802734375, 11.19921875, 12.17041015625, 13.1416015625, 14.11279296875, 15.083984375, 16.05517578125, 17.0263671875, 17.99755859375, 18.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 7.0, 14.0, 13.0, 19.0, 29.0, 45.0, 59.0, 100.0, 176.0, 244.0, 395.0, 632.0, 740.0, 586.0, 327.0, 208.0, 125.0, 82.0, 69.0, 48.0, 28.0, 27.0, 21.0, 16.0, 16.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.78125, -19.188720703125, -18.59619140625, -18.003662109375, -17.4111328125, -16.818603515625, -16.22607421875, -15.633544921875, -15.041015625, -14.448486328125, -13.85595703125, -13.263427734375, -12.6708984375, -12.078369140625, -11.48583984375, -10.893310546875, -10.30078125, -9.708251953125, -9.11572265625, -8.523193359375, -7.9306640625, -7.338134765625, -6.74560546875, -6.153076171875, -5.560546875, -4.968017578125, -4.37548828125, -3.782958984375, -3.1904296875, -2.597900390625, -2.00537109375, -1.412841796875, -0.8203125, -0.227783203125, 0.36474609375, 0.957275390625, 1.5498046875, 2.142333984375, 2.73486328125, 3.327392578125, 3.919921875, 4.512451171875, 5.10498046875, 5.697509765625, 6.2900390625, 6.882568359375, 7.47509765625, 8.067626953125, 8.66015625, 9.252685546875, 9.84521484375, 10.437744140625, 11.0302734375, 11.622802734375, 12.21533203125, 12.807861328125, 13.400390625, 13.992919921875, 14.58544921875, 15.177978515625, 15.7705078125, 16.363037109375, 16.95556640625, 17.548095703125, 18.140625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 12.0, 13.0, 17.0, 16.0, 23.0, 30.0, 55.0, 97.0, 168.0, 317.0, 784.0, 2356.0, 8704.0, 60392.0, 2987493.0, 1087734.0, 36613.0, 6443.0, 1766.0, 640.0, 258.0, 136.0, 93.0, 39.0, 18.0, 25.0, 6.0, 8.0, 7.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.40625, -54.51904296875, -52.6318359375, -50.74462890625, -48.857421875, -46.97021484375, -45.0830078125, -43.19580078125, -41.30859375, -39.42138671875, -37.5341796875, -35.64697265625, -33.759765625, -31.87255859375, -29.9853515625, -28.09814453125, -26.2109375, -24.32373046875, -22.4365234375, -20.54931640625, -18.662109375, -16.77490234375, -14.8876953125, -13.00048828125, -11.11328125, -9.22607421875, -7.3388671875, -5.45166015625, -3.564453125, -1.67724609375, 0.2099609375, 2.09716796875, 3.984375, 5.87158203125, 7.7587890625, 9.64599609375, 11.533203125, 13.42041015625, 15.3076171875, 17.19482421875, 19.08203125, 20.96923828125, 22.8564453125, 24.74365234375, 26.630859375, 28.51806640625, 30.4052734375, 32.29248046875, 34.1796875, 36.06689453125, 37.9541015625, 39.84130859375, 41.728515625, 43.61572265625, 45.5029296875, 47.39013671875, 49.27734375, 51.16455078125, 53.0517578125, 54.93896484375, 56.826171875, 58.71337890625, 60.6005859375, 62.48779296875, 64.375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 17.0, 29.0, 85.0, 232.0, 317.0, 205.0, 88.0, 24.0, 14.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.62684631347656, -117.24624633789062, -110.86564636230469, -104.48504638671875, -98.10444641113281, -91.72384643554688, -85.34325408935547, -78.96265411376953, -72.5820541381836, -66.20145416259766, -59.82085418701172, -53.44025802612305, -47.05965805053711, -40.67905807495117, -34.2984619140625, -27.917861938476562, -21.537261962890625, -15.156662940979004, -8.776063919067383, -2.395465850830078, 3.9851341247558594, 10.365734100341797, 16.74633026123047, 23.126930236816406, 29.507530212402344, 35.88813018798828, 42.26873016357422, 48.64932632446289, 55.02992630004883, 61.410526275634766, 67.79112243652344, 74.17172241210938, 80.55230712890625, 86.93290710449219, 93.31350708007812, 99.69410705566406, 106.07470703125, 112.45530700683594, 118.83589935302734, 125.21649932861328, 131.59710693359375, 137.9777069091797, 144.35830688476562, 150.73890686035156, 157.1195068359375, 163.50010681152344, 169.88070678710938, 176.26129150390625, 182.6418914794922, 189.02249145507812, 195.40309143066406, 201.78369140625, 208.16429138183594, 214.54489135742188, 220.92547607421875, 227.30609130859375, 233.68667602539062, 240.06727600097656, 246.4478759765625, 252.82847595214844, 259.2090759277344, 265.58966064453125, 271.97027587890625, 278.3508605957031, 284.7314758300781]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 4.0, 12.0, 8.0, 10.0, 19.0, 11.0, 20.0, 15.0, 30.0, 21.0, 27.0, 55.0, 41.0, 41.0, 41.0, 40.0, 44.0, 38.0, 41.0, 43.0, 46.0, 38.0, 45.0, 38.0, 35.0, 40.0, 33.0, 22.0, 16.0, 15.0, 21.0, 11.0, 22.0, 19.0, 4.0, 12.0, 6.0, 6.0, 3.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.41863250732422, -56.53989028930664, -54.66114807128906, -52.78240966796875, -50.90366744995117, -49.024925231933594, -47.146183013916016, -45.26744079589844, -43.388702392578125, -41.50996017456055, -39.63121795654297, -37.752479553222656, -35.87373733520508, -33.9949951171875, -32.11625289916992, -30.237510681152344, -28.358768463134766, -26.480026245117188, -24.601285934448242, -22.722543716430664, -20.84380340576172, -18.96506118774414, -17.086318969726562, -15.2075777053833, -13.328836441040039, -11.450095176696777, -9.571353912353516, -7.6926116943359375, -5.813870429992676, -3.935129165649414, -2.056386947631836, -0.17764568328857422, 1.7010917663574219, 3.5798332691192627, 5.4585747718811035, 7.337316513061523, 9.216057777404785, 11.094799041748047, 12.973541259765625, 14.852282524108887, 16.73102378845215, 18.609766006469727, 20.488506317138672, 22.36724853515625, 24.245990753173828, 26.124731063842773, 28.00347328186035, 29.882213592529297, 31.760955810546875, 33.63969802856445, 35.51844024658203, 37.397178649902344, 39.27592086791992, 41.1546630859375, 43.03340530395508, 44.912147521972656, 46.79088592529297, 48.66962814331055, 50.548370361328125, 52.42710876464844, 54.305850982666016, 56.184593200683594, 58.06333541870117, 59.94207763671875, 61.82081985473633]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 6.0, 9.0, 6.0, 15.0, 4.0, 14.0, 7.0, 15.0, 17.0, 18.0, 26.0, 17.0, 27.0, 25.0, 38.0, 41.0, 27.0, 36.0, 40.0, 46.0, 40.0, 36.0, 39.0, 41.0, 29.0, 29.0, 32.0, 37.0, 25.0, 27.0, 22.0, 19.0, 32.0, 25.0, 17.0, 20.0, 10.0, 17.0, 8.0, 10.0, 10.0, 7.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5, -7.2652587890625, -7.030517578125, -6.7957763671875, -6.56103515625, -6.3262939453125, -6.091552734375, -5.8568115234375, -5.6220703125, -5.3873291015625, -5.152587890625, -4.9178466796875, -4.68310546875, -4.4483642578125, -4.213623046875, -3.9788818359375, -3.744140625, -3.5093994140625, -3.274658203125, -3.0399169921875, -2.80517578125, -2.5704345703125, -2.335693359375, -2.1009521484375, -1.8662109375, -1.6314697265625, -1.396728515625, -1.1619873046875, -0.92724609375, -0.6925048828125, -0.457763671875, -0.2230224609375, 0.01171875, 0.2464599609375, 0.481201171875, 0.7159423828125, 0.95068359375, 1.1854248046875, 1.420166015625, 1.6549072265625, 1.8896484375, 2.1243896484375, 2.359130859375, 2.5938720703125, 2.82861328125, 3.0633544921875, 3.298095703125, 3.5328369140625, 3.767578125, 4.0023193359375, 4.237060546875, 4.4718017578125, 4.70654296875, 4.9412841796875, 5.176025390625, 5.4107666015625, 5.6455078125, 5.8802490234375, 6.114990234375, 6.3497314453125, 6.58447265625, 6.8192138671875, 7.053955078125, 7.2886962890625, 7.5234375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 14.0, 11.0, 28.0, 30.0, 61.0, 89.0, 157.0, 250.0, 358.0, 557.0, 807.0, 1296.0, 2137.0, 3233.0, 5115.0, 8352.0, 13259.0, 22286.0, 37698.0, 64539.0, 110641.0, 174428.0, 205040.0, 158506.0, 98160.0, 56971.0, 33096.0, 19616.0, 12032.0, 7367.0, 4386.0, 2873.0, 1790.0, 1162.0, 778.0, 496.0, 340.0, 199.0, 131.0, 93.0, 53.0, 30.0, 23.0, 21.0, 18.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0], "bins": [-1.1962890625, -1.1624755859375, -1.128662109375, -1.0948486328125, -1.06103515625, -1.0272216796875, -0.993408203125, -0.9595947265625, -0.92578125, -0.8919677734375, -0.858154296875, -0.8243408203125, -0.79052734375, -0.7567138671875, -0.722900390625, -0.6890869140625, -0.6552734375, -0.6214599609375, -0.587646484375, -0.5538330078125, -0.52001953125, -0.4862060546875, -0.452392578125, -0.4185791015625, -0.384765625, -0.3509521484375, -0.317138671875, -0.2833251953125, -0.24951171875, -0.2156982421875, -0.181884765625, -0.1480712890625, -0.1142578125, -0.0804443359375, -0.046630859375, -0.0128173828125, 0.02099609375, 0.0548095703125, 0.088623046875, 0.1224365234375, 0.15625, 0.1900634765625, 0.223876953125, 0.2576904296875, 0.29150390625, 0.3253173828125, 0.359130859375, 0.3929443359375, 0.4267578125, 0.4605712890625, 0.494384765625, 0.5281982421875, 0.56201171875, 0.5958251953125, 0.629638671875, 0.6634521484375, 0.697265625, 0.7310791015625, 0.764892578125, 0.7987060546875, 0.83251953125, 0.8663330078125, 0.900146484375, 0.9339599609375, 0.9677734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 13.0, 12.0, 12.0, 19.0, 20.0, 22.0, 19.0, 24.0, 32.0, 19.0, 31.0, 43.0, 45.0, 40.0, 46.0, 40.0, 62.0, 1078.0, 42.0, 36.0, 42.0, 41.0, 33.0, 35.0, 34.0, 24.0, 36.0, 27.0, 18.0, 18.0, 11.0, 11.0, 6.0, 7.0, 5.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.58758544921875, -5.3822021484375, -5.17681884765625, -4.971435546875, -4.76605224609375, -4.5606689453125, -4.35528564453125, -4.14990234375, -3.94451904296875, -3.7391357421875, -3.53375244140625, -3.328369140625, -3.12298583984375, -2.9176025390625, -2.71221923828125, -2.5068359375, -2.30145263671875, -2.0960693359375, -1.89068603515625, -1.685302734375, -1.47991943359375, -1.2745361328125, -1.06915283203125, -0.86376953125, -0.65838623046875, -0.4530029296875, -0.24761962890625, -0.042236328125, 0.16314697265625, 0.3685302734375, 0.57391357421875, 0.779296875, 0.98468017578125, 1.1900634765625, 1.39544677734375, 1.600830078125, 1.80621337890625, 2.0115966796875, 2.21697998046875, 2.42236328125, 2.62774658203125, 2.8331298828125, 3.03851318359375, 3.243896484375, 3.44927978515625, 3.6546630859375, 3.86004638671875, 4.0654296875, 4.27081298828125, 4.4761962890625, 4.68157958984375, 4.886962890625, 5.09234619140625, 5.2977294921875, 5.50311279296875, 5.70849609375, 5.91387939453125, 6.1192626953125, 6.32464599609375, 6.530029296875, 6.73541259765625, 6.9407958984375, 7.14617919921875, 7.3515625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 10.0, 13.0, 14.0, 28.0, 47.0, 51.0, 88.0, 143.0, 221.0, 305.0, 480.0, 707.0, 1103.0, 1839.0, 3146.0, 5225.0, 9808.0, 19448.0, 53585.0, 1789737.0, 153115.0, 27824.0, 13278.0, 6963.0, 3757.0, 2346.0, 1423.0, 911.0, 506.0, 335.0, 244.0, 140.0, 105.0, 50.0, 43.0, 30.0, 24.0, 11.0, 12.0, 9.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.181640625, -2.110626220703125, -2.03961181640625, -1.968597412109375, -1.8975830078125, -1.826568603515625, -1.75555419921875, -1.684539794921875, -1.613525390625, -1.542510986328125, -1.47149658203125, -1.400482177734375, -1.3294677734375, -1.258453369140625, -1.18743896484375, -1.116424560546875, -1.04541015625, -0.974395751953125, -0.90338134765625, -0.832366943359375, -0.7613525390625, -0.690338134765625, -0.61932373046875, -0.548309326171875, -0.477294921875, -0.406280517578125, -0.33526611328125, -0.264251708984375, -0.1932373046875, -0.122222900390625, -0.05120849609375, 0.019805908203125, 0.0908203125, 0.161834716796875, 0.23284912109375, 0.303863525390625, 0.3748779296875, 0.445892333984375, 0.51690673828125, 0.587921142578125, 0.658935546875, 0.729949951171875, 0.80096435546875, 0.871978759765625, 0.9429931640625, 1.014007568359375, 1.08502197265625, 1.156036376953125, 1.22705078125, 1.298065185546875, 1.36907958984375, 1.440093994140625, 1.5111083984375, 1.582122802734375, 1.65313720703125, 1.724151611328125, 1.795166015625, 1.866180419921875, 1.93719482421875, 2.008209228515625, 2.0792236328125, 2.150238037109375, 2.22125244140625, 2.292266845703125, 2.36328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 15.0, 17.0, 8.0, 15.0, 22.0, 15.0, 21.0, 33.0, 32.0, 26.0, 30.0, 31.0, 38.0, 53.0, 42.0, 51.0, 42.0, 46.0, 47.0, 40.0, 43.0, 37.0, 32.0, 35.0, 37.0, 27.0, 20.0, 22.0, 14.0, 12.0, 10.0, 17.0, 9.0, 9.0, 7.0, 5.0, 5.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0513916015625, -0.04978513717651367, -0.048178672790527344, -0.046572208404541016, -0.04496574401855469, -0.04335927963256836, -0.04175281524658203, -0.0401463508605957, -0.038539886474609375, -0.03693342208862305, -0.03532695770263672, -0.03372049331665039, -0.03211402893066406, -0.030507564544677734, -0.028901100158691406, -0.027294635772705078, -0.02568817138671875, -0.024081707000732422, -0.022475242614746094, -0.020868778228759766, -0.019262313842773438, -0.01765584945678711, -0.01604938507080078, -0.014442920684814453, -0.012836456298828125, -0.011229991912841797, -0.009623527526855469, -0.00801706314086914, -0.0064105987548828125, -0.004804134368896484, -0.0031976699829101562, -0.0015912055969238281, 1.52587890625e-05, 0.0016217231750488281, 0.0032281875610351562, 0.004834651947021484, 0.0064411163330078125, 0.00804758071899414, 0.009654045104980469, 0.011260509490966797, 0.012866973876953125, 0.014473438262939453, 0.01607990264892578, 0.01768636703491211, 0.019292831420898438, 0.020899295806884766, 0.022505760192871094, 0.024112224578857422, 0.02571868896484375, 0.027325153350830078, 0.028931617736816406, 0.030538082122802734, 0.03214454650878906, 0.03375101089477539, 0.03535747528076172, 0.03696393966674805, 0.038570404052734375, 0.0401768684387207, 0.04178333282470703, 0.04338979721069336, 0.04499626159667969, 0.046602725982666016, 0.048209190368652344, 0.04981565475463867, 0.051422119140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 4.0, 6.0, 6.0, 12.0, 8.0, 9.0, 13.0, 15.0, 13.0, 27.0, 31.0, 39.0, 47.0, 70.0, 77.0, 112.0, 157.0, 256.0, 611.0, 4494.0, 171584.0, 839611.0, 28777.0, 1520.0, 327.0, 199.0, 116.0, 79.0, 73.0, 49.0, 42.0, 36.0, 24.0, 17.0, 13.0, 20.0, 10.0, 15.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.01953125, -0.987945556640625, -0.95635986328125, -0.924774169921875, -0.8931884765625, -0.861602783203125, -0.83001708984375, -0.798431396484375, -0.766845703125, -0.735260009765625, -0.70367431640625, -0.672088623046875, -0.6405029296875, -0.608917236328125, -0.57733154296875, -0.545745849609375, -0.51416015625, -0.482574462890625, -0.45098876953125, -0.419403076171875, -0.3878173828125, -0.356231689453125, -0.32464599609375, -0.293060302734375, -0.261474609375, -0.229888916015625, -0.19830322265625, -0.166717529296875, -0.1351318359375, -0.103546142578125, -0.07196044921875, -0.040374755859375, -0.0087890625, 0.022796630859375, 0.05438232421875, 0.085968017578125, 0.1175537109375, 0.149139404296875, 0.18072509765625, 0.212310791015625, 0.243896484375, 0.275482177734375, 0.30706787109375, 0.338653564453125, 0.3702392578125, 0.401824951171875, 0.43341064453125, 0.464996337890625, 0.49658203125, 0.528167724609375, 0.55975341796875, 0.591339111328125, 0.6229248046875, 0.654510498046875, 0.68609619140625, 0.717681884765625, 0.749267578125, 0.780853271484375, 0.81243896484375, 0.844024658203125, 0.8756103515625, 0.907196044921875, 0.93878173828125, 0.970367431640625, 1.001953125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 13.0, 29.0, 91.0, 252.0, 371.0, 174.0, 49.0, 25.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4961630403995514, -0.4854554831981659, -0.4747479259967804, -0.4640403985977173, -0.4533328413963318, -0.4426252841949463, -0.4319177269935608, -0.4212101697921753, -0.4105026125907898, -0.3997950553894043, -0.3890874981880188, -0.3783799409866333, -0.3676724135875702, -0.3569648563861847, -0.3462572991847992, -0.3355497419834137, -0.3248422145843506, -0.3141346573829651, -0.3034271001815796, -0.2927195429801941, -0.282012015581131, -0.2713044583797455, -0.26059690117836, -0.2498893439769745, -0.23918180167675018, -0.22847424447536469, -0.21776670217514038, -0.20705914497375488, -0.19635158777236938, -0.18564404547214508, -0.17493648827075958, -0.16422894597053528, -0.15352141857147217, -0.14281386137008667, -0.13210631906986237, -0.12139876186847687, -0.11069121211767197, -0.09998366236686707, -0.08927610516548157, -0.07856855541467667, -0.06786100566387177, -0.057153455913066864, -0.046445902436971664, -0.035738348960876465, -0.025030799210071564, -0.014323249459266663, -0.0036156922578811646, 0.007091857492923737, 0.017799407243728638, 0.028506958857178688, 0.03921451047062874, 0.04992206394672394, 0.06062961369752884, 0.07133716344833374, 0.08204472064971924, 0.09275227040052414, 0.10345982015132904, 0.11416736990213394, 0.12487491965293884, 0.13558247685432434, 0.14629003405570984, 0.15699757635593414, 0.16770513355731964, 0.17841267585754395, 0.18912023305892944]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 4.0, 11.0, 9.0, 9.0, 17.0, 11.0, 22.0, 33.0, 31.0, 25.0, 35.0, 34.0, 33.0, 38.0, 49.0, 45.0, 38.0, 49.0, 37.0, 44.0, 43.0, 54.0, 45.0, 30.0, 40.0, 35.0, 42.0, 18.0, 21.0, 15.0, 13.0, 11.0, 6.0, 11.0, 9.0, 5.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04856717586517334, -0.04692624509334564, -0.045285314321517944, -0.04364438354969025, -0.04200345277786255, -0.04036252200603485, -0.03872159123420715, -0.037080660462379456, -0.03543972969055176, -0.03379879891872406, -0.03215786814689636, -0.030516937375068665, -0.028876006603240967, -0.02723507583141327, -0.02559414505958557, -0.023953214287757874, -0.022312283515930176, -0.020671352744102478, -0.01903042197227478, -0.017389491200447083, -0.015748560428619385, -0.014107629656791687, -0.01246669888496399, -0.010825768113136292, -0.009184837341308594, -0.007543906569480896, -0.005902975797653198, -0.0042620450258255005, -0.0026211142539978027, -0.000980183482170105, 0.0006607472896575928, 0.0023016780614852905, 0.003942608833312988, 0.005583539605140686, 0.007224470376968384, 0.008865401148796082, 0.01050633192062378, 0.012147262692451477, 0.013788193464279175, 0.015429124236106873, 0.01707005500793457, 0.018710985779762268, 0.020351916551589966, 0.021992847323417664, 0.02363377809524536, 0.02527470886707306, 0.026915639638900757, 0.028556570410728455, 0.030197501182556152, 0.03183843195438385, 0.03347936272621155, 0.035120293498039246, 0.03676122426986694, 0.03840215504169464, 0.04004308581352234, 0.04168401658535004, 0.043324947357177734, 0.04496587812900543, 0.04660680890083313, 0.04824773967266083, 0.049888670444488525, 0.05152960121631622, 0.05317053198814392, 0.05481146275997162, 0.056452393531799316]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 6.0, 9.0, 6.0, 15.0, 4.0, 14.0, 6.0, 17.0, 16.0, 17.0, 27.0, 17.0, 27.0, 25.0, 38.0, 40.0, 28.0, 36.0, 39.0, 47.0, 40.0, 36.0, 39.0, 42.0, 28.0, 29.0, 32.0, 37.0, 25.0, 27.0, 22.0, 20.0, 29.0, 27.0, 17.0, 20.0, 10.0, 17.0, 8.0, 11.0, 9.0, 7.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.5, -7.2652587890625, -7.030517578125, -6.7957763671875, -6.56103515625, -6.3262939453125, -6.091552734375, -5.8568115234375, -5.6220703125, -5.3873291015625, -5.152587890625, -4.9178466796875, -4.68310546875, -4.4483642578125, -4.213623046875, -3.9788818359375, -3.744140625, -3.5093994140625, -3.274658203125, -3.0399169921875, -2.80517578125, -2.5704345703125, -2.335693359375, -2.1009521484375, -1.8662109375, -1.6314697265625, -1.396728515625, -1.1619873046875, -0.92724609375, -0.6925048828125, -0.457763671875, -0.2230224609375, 0.01171875, 0.2464599609375, 0.481201171875, 0.7159423828125, 0.95068359375, 1.1854248046875, 1.420166015625, 1.6549072265625, 1.8896484375, 2.1243896484375, 2.359130859375, 2.5938720703125, 2.82861328125, 3.0633544921875, 3.298095703125, 3.5328369140625, 3.767578125, 4.0023193359375, 4.237060546875, 4.4718017578125, 4.70654296875, 4.9412841796875, 5.176025390625, 5.4107666015625, 5.6455078125, 5.8802490234375, 6.114990234375, 6.3497314453125, 6.58447265625, 6.8192138671875, 7.053955078125, 7.2886962890625, 7.5234375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 8.0, 3.0, 11.0, 15.0, 13.0, 20.0, 31.0, 24.0, 46.0, 55.0, 105.0, 133.0, 295.0, 598.0, 1384.0, 3183.0, 7769.0, 19459.0, 60499.0, 236300.0, 495005.0, 155973.0, 42488.0, 14598.0, 5787.0, 2468.0, 1062.0, 509.0, 259.0, 147.0, 75.0, 55.0, 44.0, 28.0, 20.0, 14.0, 13.0, 12.0, 8.0, 14.0, 9.0, 4.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.176513671875, -13.75146484375, -13.326416015625, -12.9013671875, -12.476318359375, -12.05126953125, -11.626220703125, -11.201171875, -10.776123046875, -10.35107421875, -9.926025390625, -9.5009765625, -9.075927734375, -8.65087890625, -8.225830078125, -7.80078125, -7.375732421875, -6.95068359375, -6.525634765625, -6.1005859375, -5.675537109375, -5.25048828125, -4.825439453125, -4.400390625, -3.975341796875, -3.55029296875, -3.125244140625, -2.7001953125, -2.275146484375, -1.85009765625, -1.425048828125, -1.0, -0.574951171875, -0.14990234375, 0.275146484375, 0.7001953125, 1.125244140625, 1.55029296875, 1.975341796875, 2.400390625, 2.825439453125, 3.25048828125, 3.675537109375, 4.1005859375, 4.525634765625, 4.95068359375, 5.375732421875, 5.80078125, 6.225830078125, 6.65087890625, 7.075927734375, 7.5009765625, 7.926025390625, 8.35107421875, 8.776123046875, 9.201171875, 9.626220703125, 10.05126953125, 10.476318359375, 10.9013671875, 11.326416015625, 11.75146484375, 12.176513671875, 12.6015625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 7.0, 5.0, 10.0, 22.0, 19.0, 29.0, 24.0, 32.0, 31.0, 37.0, 44.0, 43.0, 53.0, 102.0, 155.0, 1408.0, 364.0, 168.0, 79.0, 43.0, 41.0, 31.0, 42.0, 41.0, 32.0, 23.0, 26.0, 21.0, 13.0, 13.0, 12.0, 5.0, 8.0, 12.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.359130859375, -22.57763671875, -21.796142578125, -21.0146484375, -20.233154296875, -19.45166015625, -18.670166015625, -17.888671875, -17.107177734375, -16.32568359375, -15.544189453125, -14.7626953125, -13.981201171875, -13.19970703125, -12.418212890625, -11.63671875, -10.855224609375, -10.07373046875, -9.292236328125, -8.5107421875, -7.729248046875, -6.94775390625, -6.166259765625, -5.384765625, -4.603271484375, -3.82177734375, -3.040283203125, -2.2587890625, -1.477294921875, -0.69580078125, 0.085693359375, 0.8671875, 1.648681640625, 2.43017578125, 3.211669921875, 3.9931640625, 4.774658203125, 5.55615234375, 6.337646484375, 7.119140625, 7.900634765625, 8.68212890625, 9.463623046875, 10.2451171875, 11.026611328125, 11.80810546875, 12.589599609375, 13.37109375, 14.152587890625, 14.93408203125, 15.715576171875, 16.4970703125, 17.278564453125, 18.06005859375, 18.841552734375, 19.623046875, 20.404541015625, 21.18603515625, 21.967529296875, 22.7490234375, 23.530517578125, 24.31201171875, 25.093505859375, 25.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 10.0, 12.0, 9.0, 6.0, 17.0, 16.0, 14.0, 33.0, 34.0, 27.0, 53.0, 85.0, 108.0, 140.0, 267.0, 595.0, 2034.0, 11678.0, 279230.0, 2780136.0, 63284.0, 5496.0, 1260.0, 435.0, 232.0, 116.0, 90.0, 61.0, 37.0, 34.0, 31.0, 24.0, 26.0, 13.0, 8.0, 11.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-45.5, -44.13427734375, -42.7685546875, -41.40283203125, -40.037109375, -38.67138671875, -37.3056640625, -35.93994140625, -34.57421875, -33.20849609375, -31.8427734375, -30.47705078125, -29.111328125, -27.74560546875, -26.3798828125, -25.01416015625, -23.6484375, -22.28271484375, -20.9169921875, -19.55126953125, -18.185546875, -16.81982421875, -15.4541015625, -14.08837890625, -12.72265625, -11.35693359375, -9.9912109375, -8.62548828125, -7.259765625, -5.89404296875, -4.5283203125, -3.16259765625, -1.796875, -0.43115234375, 0.9345703125, 2.30029296875, 3.666015625, 5.03173828125, 6.3974609375, 7.76318359375, 9.12890625, 10.49462890625, 11.8603515625, 13.22607421875, 14.591796875, 15.95751953125, 17.3232421875, 18.68896484375, 20.0546875, 21.42041015625, 22.7861328125, 24.15185546875, 25.517578125, 26.88330078125, 28.2490234375, 29.61474609375, 30.98046875, 32.34619140625, 33.7119140625, 35.07763671875, 36.443359375, 37.80908203125, 39.1748046875, 40.54052734375, 41.90625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 12.0, 14.0, 22.0, 26.0, 45.0, 63.0, 91.0, 107.0, 115.0, 103.0, 128.0, 91.0, 74.0, 41.0, 28.0, 23.0, 12.0, 2.0, 4.0, 4.0, 3.0], "bins": [-67.54576873779297, -66.24527740478516, -64.94479370117188, -63.64430236816406, -62.343814849853516, -61.0433235168457, -59.742835998535156, -58.442344665527344, -57.1418571472168, -55.84136962890625, -54.54087829589844, -53.24039077758789, -51.939903259277344, -50.63941192626953, -49.338924407958984, -48.03843688964844, -46.737945556640625, -45.43745803833008, -44.136966705322266, -42.83647918701172, -41.53599166870117, -40.23550033569336, -38.93501281738281, -37.634521484375, -36.33403778076172, -35.03355026245117, -33.73305892944336, -32.43257141113281, -31.132081985473633, -29.831592559814453, -28.531105041503906, -27.230615615844727, -25.93012237548828, -24.6296329498291, -23.329145431518555, -22.028656005859375, -20.728166580200195, -19.427677154541016, -18.12718963623047, -16.82670021057129, -15.526212692260742, -14.225724220275879, -12.9252347946167, -11.624746322631836, -10.324256896972656, -9.023768424987793, -7.72327995300293, -6.42279052734375, -5.122302055358887, -3.8218131065368652, -2.521324396133423, -1.2208356857299805, 0.07965326309204102, 1.3801422119140625, 2.680630683898926, 3.9811201095581055, 5.281608581542969, 6.58209753036499, 7.882586479187012, 9.183074951171875, 10.483564376831055, 11.784052848815918, 13.084541320800781, 14.385030746459961, 15.685519218444824]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 14.0, 9.0, 15.0, 17.0, 25.0, 22.0, 27.0, 27.0, 28.0, 27.0, 24.0, 36.0, 30.0, 42.0, 55.0, 47.0, 50.0, 44.0, 26.0, 43.0, 44.0, 38.0, 38.0, 38.0, 36.0, 34.0, 25.0, 26.0, 19.0, 23.0, 7.0, 12.0, 7.0, 12.0, 6.0, 4.0, 9.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.02754592895508, -53.94403839111328, -51.86053466796875, -49.77702713012695, -47.693519592285156, -45.610015869140625, -43.52650833129883, -41.44300079345703, -39.3594970703125, -37.2759895324707, -35.19248580932617, -33.108978271484375, -31.025470733642578, -28.941965103149414, -26.85845947265625, -24.774951934814453, -22.691444396972656, -20.607938766479492, -18.524431228637695, -16.44092559814453, -14.35741901397705, -12.27391242980957, -10.190406799316406, -8.106900215148926, -6.023393630981445, -3.939887285232544, -1.8563809394836426, 0.2271251678466797, 2.31063175201416, 4.394138336181641, 6.477643966674805, 8.561150550842285, 10.644660949707031, 12.728167533874512, 14.811674118041992, 16.895179748535156, 18.978687286376953, 21.062192916870117, 23.14569854736328, 25.229206085205078, 27.312711715698242, 29.396217346191406, 31.479724884033203, 33.563232421875, 35.64673614501953, 37.73024368286133, 39.813751220703125, 41.897254943847656, 43.98076248168945, 46.06427001953125, 48.14777374267578, 50.23128128051758, 52.314788818359375, 54.398292541503906, 56.4818000793457, 58.5653076171875, 60.64881134033203, 62.73231887817383, 64.81582641601562, 66.89933013916016, 68.98283386230469, 71.06634521484375, 73.14984893798828, 75.23335266113281, 77.31686401367188]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 6.0, 9.0, 8.0, 11.0, 5.0, 22.0, 22.0, 24.0, 28.0, 14.0, 39.0, 21.0, 33.0, 34.0, 35.0, 41.0, 31.0, 41.0, 46.0, 33.0, 43.0, 39.0, 33.0, 30.0, 28.0, 38.0, 27.0, 31.0, 30.0, 20.0, 16.0, 20.0, 21.0, 14.0, 23.0, 12.0, 13.0, 8.0, 6.0, 9.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.1328125, -7.8836669921875, -7.634521484375, -7.3853759765625, -7.13623046875, -6.8870849609375, -6.637939453125, -6.3887939453125, -6.1396484375, -5.8905029296875, -5.641357421875, -5.3922119140625, -5.14306640625, -4.8939208984375, -4.644775390625, -4.3956298828125, -4.146484375, -3.8973388671875, -3.648193359375, -3.3990478515625, -3.14990234375, -2.9007568359375, -2.651611328125, -2.4024658203125, -2.1533203125, -1.9041748046875, -1.655029296875, -1.4058837890625, -1.15673828125, -0.9075927734375, -0.658447265625, -0.4093017578125, -0.16015625, 0.0889892578125, 0.338134765625, 0.5872802734375, 0.83642578125, 1.0855712890625, 1.334716796875, 1.5838623046875, 1.8330078125, 2.0821533203125, 2.331298828125, 2.5804443359375, 2.82958984375, 3.0787353515625, 3.327880859375, 3.5770263671875, 3.826171875, 4.0753173828125, 4.324462890625, 4.5736083984375, 4.82275390625, 5.0718994140625, 5.321044921875, 5.5701904296875, 5.8193359375, 6.0684814453125, 6.317626953125, 6.5667724609375, 6.81591796875, 7.0650634765625, 7.314208984375, 7.5633544921875, 7.8125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 16.0, 19.0, 24.0, 41.0, 53.0, 57.0, 97.0, 143.0, 195.0, 299.0, 378.0, 576.0, 843.0, 1189.0, 1810.0, 2618.0, 4225.0, 6603.0, 11907.0, 25812.0, 77996.0, 329953.0, 1458103.0, 1704353.0, 412338.0, 92469.0, 29229.0, 13124.0, 7087.0, 4233.0, 2713.0, 1855.0, 1218.0, 812.0, 567.0, 420.0, 261.0, 171.0, 152.0, 100.0, 61.0, 48.0, 30.0, 27.0, 9.0, 13.0, 6.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-13.78125, -13.364501953125, -12.94775390625, -12.531005859375, -12.1142578125, -11.697509765625, -11.28076171875, -10.864013671875, -10.447265625, -10.030517578125, -9.61376953125, -9.197021484375, -8.7802734375, -8.363525390625, -7.94677734375, -7.530029296875, -7.11328125, -6.696533203125, -6.27978515625, -5.863037109375, -5.4462890625, -5.029541015625, -4.61279296875, -4.196044921875, -3.779296875, -3.362548828125, -2.94580078125, -2.529052734375, -2.1123046875, -1.695556640625, -1.27880859375, -0.862060546875, -0.4453125, -0.028564453125, 0.38818359375, 0.804931640625, 1.2216796875, 1.638427734375, 2.05517578125, 2.471923828125, 2.888671875, 3.305419921875, 3.72216796875, 4.138916015625, 4.5556640625, 4.972412109375, 5.38916015625, 5.805908203125, 6.22265625, 6.639404296875, 7.05615234375, 7.472900390625, 7.8896484375, 8.306396484375, 8.72314453125, 9.139892578125, 9.556640625, 9.973388671875, 10.39013671875, 10.806884765625, 11.2236328125, 11.640380859375, 12.05712890625, 12.473876953125, 12.890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 8.0, 22.0, 26.0, 28.0, 29.0, 46.0, 76.0, 84.0, 152.0, 215.0, 344.0, 530.0, 635.0, 572.0, 402.0, 279.0, 177.0, 126.0, 75.0, 59.0, 38.0, 27.0, 19.0, 17.0, 10.0, 10.0, 5.0, 9.0, 7.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.625, -17.1004638671875, -16.575927734375, -16.0513916015625, -15.52685546875, -15.0023193359375, -14.477783203125, -13.9532470703125, -13.4287109375, -12.9041748046875, -12.379638671875, -11.8551025390625, -11.33056640625, -10.8060302734375, -10.281494140625, -9.7569580078125, -9.232421875, -8.7078857421875, -8.183349609375, -7.6588134765625, -7.13427734375, -6.6097412109375, -6.085205078125, -5.5606689453125, -5.0361328125, -4.5115966796875, -3.987060546875, -3.4625244140625, -2.93798828125, -2.4134521484375, -1.888916015625, -1.3643798828125, -0.83984375, -0.3153076171875, 0.209228515625, 0.7337646484375, 1.25830078125, 1.7828369140625, 2.307373046875, 2.8319091796875, 3.3564453125, 3.8809814453125, 4.405517578125, 4.9300537109375, 5.45458984375, 5.9791259765625, 6.503662109375, 7.0281982421875, 7.552734375, 8.0772705078125, 8.601806640625, 9.1263427734375, 9.65087890625, 10.1754150390625, 10.699951171875, 11.2244873046875, 11.7490234375, 12.2735595703125, 12.798095703125, 13.3226318359375, 13.84716796875, 14.3717041015625, 14.896240234375, 15.4207763671875, 15.9453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 9.0, 3.0, 8.0, 12.0, 12.0, 12.0, 34.0, 57.0, 75.0, 146.0, 234.0, 450.0, 1009.0, 2295.0, 6887.0, 25804.0, 178877.0, 3344340.0, 569599.0, 47558.0, 10819.0, 3316.0, 1316.0, 598.0, 310.0, 175.0, 107.0, 63.0, 39.0, 34.0, 26.0, 21.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.0625, -36.7802734375, -35.498046875, -34.2158203125, -32.93359375, -31.6513671875, -30.369140625, -29.0869140625, -27.8046875, -26.5224609375, -25.240234375, -23.9580078125, -22.67578125, -21.3935546875, -20.111328125, -18.8291015625, -17.546875, -16.2646484375, -14.982421875, -13.7001953125, -12.41796875, -11.1357421875, -9.853515625, -8.5712890625, -7.2890625, -6.0068359375, -4.724609375, -3.4423828125, -2.16015625, -0.8779296875, 0.404296875, 1.6865234375, 2.96875, 4.2509765625, 5.533203125, 6.8154296875, 8.09765625, 9.3798828125, 10.662109375, 11.9443359375, 13.2265625, 14.5087890625, 15.791015625, 17.0732421875, 18.35546875, 19.6376953125, 20.919921875, 22.2021484375, 23.484375, 24.7666015625, 26.048828125, 27.3310546875, 28.61328125, 29.8955078125, 31.177734375, 32.4599609375, 33.7421875, 35.0244140625, 36.306640625, 37.5888671875, 38.87109375, 40.1533203125, 41.435546875, 42.7177734375, 44.0]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 28.0, 59.0, 121.0, 248.0, 252.0, 172.0, 65.0, 30.0, 14.0, 9.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-284.0709228515625, -278.7209167480469, -273.37091064453125, -268.0209045410156, -262.6708984375, -257.3208923339844, -251.9708709716797, -246.62086486816406, -241.27085876464844, -235.9208526611328, -230.5708465576172, -225.2208251953125, -219.87081909179688, -214.52081298828125, -209.17080688476562, -203.82080078125, -198.47079467773438, -193.12078857421875, -187.77078247070312, -182.4207763671875, -177.0707550048828, -171.7207489013672, -166.37074279785156, -161.02073669433594, -155.67071533203125, -150.32070922851562, -144.970703125, -139.62069702148438, -134.2706756591797, -128.92066955566406, -123.57066345214844, -118.22065734863281, -112.87065124511719, -107.52064514160156, -102.1706314086914, -96.82062530517578, -91.47061920166016, -86.12060546875, -80.77059936523438, -75.42059326171875, -70.07058715820312, -64.7205810546875, -59.37057113647461, -54.02056121826172, -48.670555114746094, -43.3205451965332, -37.97053527832031, -32.62052917480469, -27.27051544189453, -21.920507431030273, -16.570499420166016, -11.220489501953125, -5.870481491088867, -0.5204734802246094, 4.829536437988281, 10.179542541503906, 15.529552459716797, 20.879560470581055, 26.229568481445312, 31.579578399658203, 36.929588317871094, 42.27959442138672, 47.62960433959961, 52.979610443115234, 58.329620361328125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 15.0, 7.0, 7.0, 11.0, 20.0, 23.0, 31.0, 20.0, 19.0, 29.0, 27.0, 42.0, 32.0, 37.0, 37.0, 44.0, 48.0, 44.0, 38.0, 40.0, 33.0, 40.0, 37.0, 37.0, 30.0, 26.0, 26.0, 23.0, 26.0, 23.0, 15.0, 22.0, 15.0, 12.0, 8.0, 10.0, 6.0, 2.0, 7.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.920989990234375, -53.25605010986328, -51.59111404418945, -49.92617416381836, -48.26123809814453, -46.59629821777344, -44.931358337402344, -43.26641845703125, -41.60148239135742, -39.93654251098633, -38.2716064453125, -36.606666564941406, -34.94172668457031, -33.276790618896484, -31.61185073852539, -29.94691276550293, -28.28197479248047, -26.617036819458008, -24.952098846435547, -23.287158966064453, -21.622220993041992, -19.95728302001953, -18.292343139648438, -16.627405166625977, -14.962467193603516, -13.297529220581055, -11.632590293884277, -9.9676513671875, -8.302713394165039, -6.637775421142578, -4.972836494445801, -3.3078975677490234, -1.6429557800292969, 0.021982669830322266, 1.6869211196899414, 3.3518595695495605, 5.01679801940918, 6.681735992431641, 8.346674919128418, 10.011613845825195, 11.676551818847656, 13.341489791870117, 15.006428718566895, 16.671367645263672, 18.336305618286133, 20.001243591308594, 21.666183471679688, 23.33112144470215, 24.99605941772461, 26.66099739074707, 28.32593536376953, 29.990875244140625, 31.655813217163086, 33.32075119018555, 34.98569107055664, 36.65062713623047, 38.31556701660156, 39.980506896972656, 41.645442962646484, 43.31038284301758, 44.975318908691406, 46.6402587890625, 48.305198669433594, 49.97013854980469, 51.635074615478516]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 8.0, 6.0, 9.0, 12.0, 10.0, 13.0, 17.0, 20.0, 35.0, 29.0, 37.0, 28.0, 35.0, 38.0, 32.0, 41.0, 47.0, 40.0, 35.0, 39.0, 38.0, 33.0, 40.0, 37.0, 37.0, 39.0, 24.0, 21.0, 40.0, 26.0, 12.0, 21.0, 20.0, 15.0, 5.0, 12.0, 9.0, 7.0, 7.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.734375, -9.4473876953125, -9.160400390625, -8.8734130859375, -8.58642578125, -8.2994384765625, -8.012451171875, -7.7254638671875, -7.4384765625, -7.1514892578125, -6.864501953125, -6.5775146484375, -6.29052734375, -6.0035400390625, -5.716552734375, -5.4295654296875, -5.142578125, -4.8555908203125, -4.568603515625, -4.2816162109375, -3.99462890625, -3.7076416015625, -3.420654296875, -3.1336669921875, -2.8466796875, -2.5596923828125, -2.272705078125, -1.9857177734375, -1.69873046875, -1.4117431640625, -1.124755859375, -0.8377685546875, -0.55078125, -0.2637939453125, 0.023193359375, 0.3101806640625, 0.59716796875, 0.8841552734375, 1.171142578125, 1.4581298828125, 1.7451171875, 2.0321044921875, 2.319091796875, 2.6060791015625, 2.89306640625, 3.1800537109375, 3.467041015625, 3.7540283203125, 4.041015625, 4.3280029296875, 4.614990234375, 4.9019775390625, 5.18896484375, 5.4759521484375, 5.762939453125, 6.0499267578125, 6.3369140625, 6.6239013671875, 6.910888671875, 7.1978759765625, 7.48486328125, 7.7718505859375, 8.058837890625, 8.3458251953125, 8.6328125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 10.0, 7.0, 13.0, 20.0, 28.0, 54.0, 75.0, 128.0, 227.0, 339.0, 596.0, 864.0, 1345.0, 2162.0, 3441.0, 5482.0, 8971.0, 14605.0, 23974.0, 40137.0, 68138.0, 113389.0, 176271.0, 202174.0, 151685.0, 93892.0, 55733.0, 33318.0, 19598.0, 12075.0, 7335.0, 4661.0, 2869.0, 1822.0, 1168.0, 692.0, 454.0, 307.0, 183.0, 112.0, 77.0, 47.0, 24.0, 12.0, 15.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0], "bins": [-1.2158203125, -1.1823348999023438, -1.1488494873046875, -1.1153640747070312, -1.081878662109375, -1.0483932495117188, -1.0149078369140625, -0.9814224243164062, -0.94793701171875, -0.9144515991210938, -0.8809661865234375, -0.8474807739257812, -0.813995361328125, -0.7805099487304688, -0.7470245361328125, -0.7135391235351562, -0.6800537109375, -0.6465682983398438, -0.6130828857421875, -0.5795974731445312, -0.546112060546875, -0.5126266479492188, -0.4791412353515625, -0.44565582275390625, -0.41217041015625, -0.37868499755859375, -0.3451995849609375, -0.31171417236328125, -0.278228759765625, -0.24474334716796875, -0.2112579345703125, -0.17777252197265625, -0.144287109375, -0.11080169677734375, -0.0773162841796875, -0.04383087158203125, -0.010345458984375, 0.02313995361328125, 0.0566253662109375, 0.09011077880859375, 0.12359619140625, 0.15708160400390625, 0.1905670166015625, 0.22405242919921875, 0.257537841796875, 0.29102325439453125, 0.3245086669921875, 0.35799407958984375, 0.3914794921875, 0.42496490478515625, 0.4584503173828125, 0.49193572998046875, 0.525421142578125, 0.5589065551757812, 0.5923919677734375, 0.6258773803710938, 0.65936279296875, 0.6928482055664062, 0.7263336181640625, 0.7598190307617188, 0.793304443359375, 0.8267898559570312, 0.8602752685546875, 0.8937606811523438, 0.92724609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 7.0, 6.0, 4.0, 8.0, 10.0, 7.0, 13.0, 14.0, 12.0, 14.0, 25.0, 21.0, 23.0, 22.0, 26.0, 31.0, 37.0, 36.0, 45.0, 41.0, 48.0, 29.0, 1059.0, 32.0, 41.0, 36.0, 42.0, 51.0, 38.0, 34.0, 22.0, 32.0, 18.0, 23.0, 25.0, 19.0, 14.0, 14.0, 5.0, 8.0, 3.0, 4.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-6.2578125, -6.07220458984375, -5.8865966796875, -5.70098876953125, -5.515380859375, -5.32977294921875, -5.1441650390625, -4.95855712890625, -4.77294921875, -4.58734130859375, -4.4017333984375, -4.21612548828125, -4.030517578125, -3.84490966796875, -3.6593017578125, -3.47369384765625, -3.2880859375, -3.10247802734375, -2.9168701171875, -2.73126220703125, -2.545654296875, -2.36004638671875, -2.1744384765625, -1.98883056640625, -1.80322265625, -1.61761474609375, -1.4320068359375, -1.24639892578125, -1.060791015625, -0.87518310546875, -0.6895751953125, -0.50396728515625, -0.318359375, -0.13275146484375, 0.0528564453125, 0.23846435546875, 0.424072265625, 0.60968017578125, 0.7952880859375, 0.98089599609375, 1.16650390625, 1.35211181640625, 1.5377197265625, 1.72332763671875, 1.908935546875, 2.09454345703125, 2.2801513671875, 2.46575927734375, 2.6513671875, 2.83697509765625, 3.0225830078125, 3.20819091796875, 3.393798828125, 3.57940673828125, 3.7650146484375, 3.95062255859375, 4.13623046875, 4.32183837890625, 4.5074462890625, 4.69305419921875, 4.878662109375, 5.06427001953125, 5.2498779296875, 5.43548583984375, 5.62109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 16.0, 21.0, 20.0, 25.0, 44.0, 64.0, 86.0, 125.0, 177.0, 246.0, 363.0, 561.0, 781.0, 1198.0, 1838.0, 3021.0, 4871.0, 8533.0, 16386.0, 35936.0, 357323.0, 1578401.0, 44412.0, 18429.0, 9685.0, 5501.0, 3243.0, 1956.0, 1290.0, 815.0, 562.0, 372.0, 234.0, 173.0, 135.0, 77.0, 61.0, 39.0, 31.0, 13.0, 17.0, 11.0, 11.0, 12.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.033203125, -1.9698486328125, -1.906494140625, -1.8431396484375, -1.77978515625, -1.7164306640625, -1.653076171875, -1.5897216796875, -1.5263671875, -1.4630126953125, -1.399658203125, -1.3363037109375, -1.27294921875, -1.2095947265625, -1.146240234375, -1.0828857421875, -1.01953125, -0.9561767578125, -0.892822265625, -0.8294677734375, -0.76611328125, -0.7027587890625, -0.639404296875, -0.5760498046875, -0.5126953125, -0.4493408203125, -0.385986328125, -0.3226318359375, -0.25927734375, -0.1959228515625, -0.132568359375, -0.0692138671875, -0.005859375, 0.0574951171875, 0.120849609375, 0.1842041015625, 0.24755859375, 0.3109130859375, 0.374267578125, 0.4376220703125, 0.5009765625, 0.5643310546875, 0.627685546875, 0.6910400390625, 0.75439453125, 0.8177490234375, 0.881103515625, 0.9444580078125, 1.0078125, 1.0711669921875, 1.134521484375, 1.1978759765625, 1.26123046875, 1.3245849609375, 1.387939453125, 1.4512939453125, 1.5146484375, 1.5780029296875, 1.641357421875, 1.7047119140625, 1.76806640625, 1.8314208984375, 1.894775390625, 1.9581298828125, 2.021484375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 5.0, 9.0, 16.0, 15.0, 11.0, 14.0, 20.0, 23.0, 30.0, 43.0, 37.0, 46.0, 35.0, 44.0, 63.0, 59.0, 68.0, 66.0, 56.0, 69.0, 38.0, 46.0, 35.0, 16.0, 21.0, 19.0, 15.0, 16.0, 10.0, 11.0, 7.0, 8.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.077880859375, -0.07563591003417969, -0.07339096069335938, -0.07114601135253906, -0.06890106201171875, -0.06665611267089844, -0.06441116333007812, -0.06216621398925781, -0.0599212646484375, -0.05767631530761719, -0.055431365966796875, -0.05318641662597656, -0.05094146728515625, -0.04869651794433594, -0.046451568603515625, -0.04420661926269531, -0.041961669921875, -0.03971672058105469, -0.037471771240234375, -0.03522682189941406, -0.03298187255859375, -0.030736923217773438, -0.028491973876953125, -0.026247024536132812, -0.0240020751953125, -0.021757125854492188, -0.019512176513671875, -0.017267227172851562, -0.01502227783203125, -0.012777328491210938, -0.010532379150390625, -0.008287429809570312, -0.00604248046875, -0.0037975311279296875, -0.001552581787109375, 0.0006923675537109375, 0.00293731689453125, 0.0051822662353515625, 0.007427215576171875, 0.009672164916992188, 0.0119171142578125, 0.014162063598632812, 0.016407012939453125, 0.018651962280273438, 0.02089691162109375, 0.023141860961914062, 0.025386810302734375, 0.027631759643554688, 0.029876708984375, 0.03212165832519531, 0.034366607666015625, 0.03661155700683594, 0.03885650634765625, 0.04110145568847656, 0.043346405029296875, 0.04559135437011719, 0.0478363037109375, 0.05008125305175781, 0.052326202392578125, 0.05457115173339844, 0.05681610107421875, 0.05906105041503906, 0.061305999755859375, 0.06355094909667969, 0.0657958984375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 4.0, 14.0, 15.0, 16.0, 15.0, 27.0, 37.0, 37.0, 56.0, 107.0, 129.0, 222.0, 400.0, 1949.0, 374192.0, 667208.0, 2973.0, 423.0, 215.0, 132.0, 90.0, 74.0, 49.0, 39.0, 21.0, 19.0, 15.0, 15.0, 8.0, 13.0, 6.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3671875, -1.3201446533203125, -1.273101806640625, -1.2260589599609375, -1.17901611328125, -1.1319732666015625, -1.084930419921875, -1.0378875732421875, -0.9908447265625, -0.9438018798828125, -0.896759033203125, -0.8497161865234375, -0.80267333984375, -0.7556304931640625, -0.708587646484375, -0.6615447998046875, -0.614501953125, -0.5674591064453125, -0.520416259765625, -0.4733734130859375, -0.42633056640625, -0.3792877197265625, -0.332244873046875, -0.2852020263671875, -0.2381591796875, -0.1911163330078125, -0.144073486328125, -0.0970306396484375, -0.04998779296875, -0.0029449462890625, 0.044097900390625, 0.0911407470703125, 0.13818359375, 0.1852264404296875, 0.232269287109375, 0.2793121337890625, 0.32635498046875, 0.3733978271484375, 0.420440673828125, 0.4674835205078125, 0.5145263671875, 0.5615692138671875, 0.608612060546875, 0.6556549072265625, 0.70269775390625, 0.7497406005859375, 0.796783447265625, 0.8438262939453125, 0.890869140625, 0.9379119873046875, 0.984954833984375, 1.0319976806640625, 1.07904052734375, 1.1260833740234375, 1.173126220703125, 1.2201690673828125, 1.2672119140625, 1.3142547607421875, 1.361297607421875, 1.4083404541015625, 1.45538330078125, 1.5024261474609375, 1.549468994140625, 1.5965118408203125, 1.6435546875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 18.0, 105.0, 533.0, 301.0, 43.0, 10.0, 2.0, 0.0, 1.0], "bins": [-1.1139705181121826, -1.0946913957595825, -1.075412392616272, -1.0561332702636719, -1.0368542671203613, -1.0175751447677612, -0.9982960224151611, -0.9790169596672058, -0.9597378969192505, -0.9404588341712952, -0.9211797714233398, -0.9019006490707397, -0.8826215863227844, -0.8633425235748291, -0.844063401222229, -0.8247843384742737, -0.8055052757263184, -0.786226212978363, -0.7669471502304077, -0.7476680278778076, -0.7283889651298523, -0.709109902381897, -0.6898307800292969, -0.6705517172813416, -0.6512726545333862, -0.6319935917854309, -0.6127145290374756, -0.5934354066848755, -0.5741563439369202, -0.5548772811889648, -0.5355981588363647, -0.5163190960884094, -0.4970400333404541, -0.4777609705924988, -0.45848187804222107, -0.43920278549194336, -0.41992372274398804, -0.4006446599960327, -0.381365567445755, -0.3620864748954773, -0.342807412147522, -0.32352834939956665, -0.30424925684928894, -0.28497016429901123, -0.2656911015510559, -0.2464120239019394, -0.22713294625282288, -0.20785386860370636, -0.18857477605342865, -0.16929569840431213, -0.15001662075519562, -0.1307375431060791, -0.11145846545696259, -0.09217938780784607, -0.07290031015872955, -0.05362123250961304, -0.03434215486049652, -0.015063077211380005, 0.004216000437736511, 0.023495078086853027, 0.04277415573596954, 0.06205323338508606, 0.08133231103420258, 0.10061138868331909, 0.11989046633243561]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 4.0, 11.0, 9.0, 11.0, 11.0, 8.0, 23.0, 15.0, 24.0, 29.0, 33.0, 41.0, 32.0, 49.0, 41.0, 47.0, 47.0, 49.0, 56.0, 51.0, 48.0, 45.0, 42.0, 43.0, 32.0, 40.0, 25.0, 14.0, 26.0, 16.0, 16.0, 11.0, 11.0, 16.0, 3.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05746734142303467, -0.05527535080909729, -0.05308336392045021, -0.05089137703180313, -0.04869938641786575, -0.046507395803928375, -0.044315408915281296, -0.042123422026634216, -0.03993143141269684, -0.03773944079875946, -0.03554745391011238, -0.0333554670214653, -0.031163476407527924, -0.028971487656235695, -0.026779498904943466, -0.024587510153651237, -0.02239552140235901, -0.02020353265106678, -0.01801154389977455, -0.015819555148482323, -0.013627566397190094, -0.011435577645897865, -0.009243588894605637, -0.007051600143313408, -0.004859611392021179, -0.0026676226407289505, -0.0004756338894367218, 0.001716354861855507, 0.003908343613147736, 0.006100332364439964, 0.008292321115732193, 0.010484309867024422, 0.01267629861831665, 0.014868287369608879, 0.017060276120901108, 0.019252264872193336, 0.021444253623485565, 0.023636242374777794, 0.025828231126070023, 0.02802021987736225, 0.03021220862865448, 0.03240419924259186, 0.03459618613123894, 0.03678817301988602, 0.038980163633823395, 0.04117215424776077, 0.04336414113640785, 0.04555612802505493, 0.04774811863899231, 0.04994010925292969, 0.05213209614157677, 0.054324083030223846, 0.056516073644161224, 0.0587080642580986, 0.06090005114674568, 0.06309203803539276, 0.06528402864933014, 0.06747601926326752, 0.0696680098772049, 0.07185999304056168, 0.07405198365449905, 0.07624397426843643, 0.07843595743179321, 0.08062794804573059, 0.08281993865966797]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 6.0, 9.0, 12.0, 10.0, 13.0, 17.0, 20.0, 34.0, 30.0, 37.0, 28.0, 35.0, 37.0, 33.0, 42.0, 46.0, 40.0, 35.0, 39.0, 38.0, 33.0, 41.0, 37.0, 35.0, 40.0, 23.0, 22.0, 40.0, 25.0, 13.0, 21.0, 20.0, 15.0, 5.0, 12.0, 9.0, 7.0, 7.0, 7.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.734375, -9.4473876953125, -9.160400390625, -8.8734130859375, -8.58642578125, -8.2994384765625, -8.012451171875, -7.7254638671875, -7.4384765625, -7.1514892578125, -6.864501953125, -6.5775146484375, -6.29052734375, -6.0035400390625, -5.716552734375, -5.4295654296875, -5.142578125, -4.8555908203125, -4.568603515625, -4.2816162109375, -3.99462890625, -3.7076416015625, -3.420654296875, -3.1336669921875, -2.8466796875, -2.5596923828125, -2.272705078125, -1.9857177734375, -1.69873046875, -1.4117431640625, -1.124755859375, -0.8377685546875, -0.55078125, -0.2637939453125, 0.023193359375, 0.3101806640625, 0.59716796875, 0.8841552734375, 1.171142578125, 1.4581298828125, 1.7451171875, 2.0321044921875, 2.319091796875, 2.6060791015625, 2.89306640625, 3.1800537109375, 3.467041015625, 3.7540283203125, 4.041015625, 4.3280029296875, 4.614990234375, 4.9019775390625, 5.18896484375, 5.4759521484375, 5.762939453125, 6.0499267578125, 6.3369140625, 6.6239013671875, 6.910888671875, 7.1978759765625, 7.48486328125, 7.7718505859375, 8.058837890625, 8.3458251953125, 8.6328125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 2.0, 5.0, 12.0, 15.0, 10.0, 14.0, 26.0, 19.0, 33.0, 43.0, 62.0, 88.0, 128.0, 179.0, 298.0, 437.0, 755.0, 1197.0, 2265.0, 4371.0, 9313.0, 24253.0, 80682.0, 391205.0, 405308.0, 83444.0, 24944.0, 9420.0, 4336.0, 2215.0, 1292.0, 723.0, 446.0, 296.0, 220.0, 165.0, 102.0, 57.0, 37.0, 34.0, 25.0, 24.0, 17.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0], "bins": [-18.359375, -17.819580078125, -17.27978515625, -16.739990234375, -16.2001953125, -15.660400390625, -15.12060546875, -14.580810546875, -14.041015625, -13.501220703125, -12.96142578125, -12.421630859375, -11.8818359375, -11.342041015625, -10.80224609375, -10.262451171875, -9.72265625, -9.182861328125, -8.64306640625, -8.103271484375, -7.5634765625, -7.023681640625, -6.48388671875, -5.944091796875, -5.404296875, -4.864501953125, -4.32470703125, -3.784912109375, -3.2451171875, -2.705322265625, -2.16552734375, -1.625732421875, -1.0859375, -0.546142578125, -0.00634765625, 0.533447265625, 1.0732421875, 1.613037109375, 2.15283203125, 2.692626953125, 3.232421875, 3.772216796875, 4.31201171875, 4.851806640625, 5.3916015625, 5.931396484375, 6.47119140625, 7.010986328125, 7.55078125, 8.090576171875, 8.63037109375, 9.170166015625, 9.7099609375, 10.249755859375, 10.78955078125, 11.329345703125, 11.869140625, 12.408935546875, 12.94873046875, 13.488525390625, 14.0283203125, 14.568115234375, 15.10791015625, 15.647705078125, 16.1875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 7.0, 7.0, 3.0, 9.0, 6.0, 10.0, 6.0, 9.0, 14.0, 16.0, 21.0, 18.0, 36.0, 38.0, 32.0, 36.0, 34.0, 64.0, 46.0, 52.0, 69.0, 153.0, 336.0, 1389.0, 141.0, 77.0, 53.0, 37.0, 44.0, 30.0, 30.0, 26.0, 26.0, 21.0, 29.0, 21.0, 15.0, 14.0, 10.0, 10.0, 14.0, 6.0, 8.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-23.34375, -22.591064453125, -21.83837890625, -21.085693359375, -20.3330078125, -19.580322265625, -18.82763671875, -18.074951171875, -17.322265625, -16.569580078125, -15.81689453125, -15.064208984375, -14.3115234375, -13.558837890625, -12.80615234375, -12.053466796875, -11.30078125, -10.548095703125, -9.79541015625, -9.042724609375, -8.2900390625, -7.537353515625, -6.78466796875, -6.031982421875, -5.279296875, -4.526611328125, -3.77392578125, -3.021240234375, -2.2685546875, -1.515869140625, -0.76318359375, -0.010498046875, 0.7421875, 1.494873046875, 2.24755859375, 3.000244140625, 3.7529296875, 4.505615234375, 5.25830078125, 6.010986328125, 6.763671875, 7.516357421875, 8.26904296875, 9.021728515625, 9.7744140625, 10.527099609375, 11.27978515625, 12.032470703125, 12.78515625, 13.537841796875, 14.29052734375, 15.043212890625, 15.7958984375, 16.548583984375, 17.30126953125, 18.053955078125, 18.806640625, 19.559326171875, 20.31201171875, 21.064697265625, 21.8173828125, 22.570068359375, 23.32275390625, 24.075439453125, 24.828125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 9.0, 10.0, 12.0, 22.0, 14.0, 21.0, 34.0, 37.0, 62.0, 69.0, 99.0, 203.0, 420.0, 999.0, 3480.0, 18982.0, 887131.0, 2201850.0, 25531.0, 4372.0, 1176.0, 515.0, 194.0, 128.0, 89.0, 59.0, 48.0, 27.0, 24.0, 15.0, 16.0, 10.0, 11.0, 9.0, 6.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.375, -59.51904296875, -57.6630859375, -55.80712890625, -53.951171875, -52.09521484375, -50.2392578125, -48.38330078125, -46.52734375, -44.67138671875, -42.8154296875, -40.95947265625, -39.103515625, -37.24755859375, -35.3916015625, -33.53564453125, -31.6796875, -29.82373046875, -27.9677734375, -26.11181640625, -24.255859375, -22.39990234375, -20.5439453125, -18.68798828125, -16.83203125, -14.97607421875, -13.1201171875, -11.26416015625, -9.408203125, -7.55224609375, -5.6962890625, -3.84033203125, -1.984375, -0.12841796875, 1.7275390625, 3.58349609375, 5.439453125, 7.29541015625, 9.1513671875, 11.00732421875, 12.86328125, 14.71923828125, 16.5751953125, 18.43115234375, 20.287109375, 22.14306640625, 23.9990234375, 25.85498046875, 27.7109375, 29.56689453125, 31.4228515625, 33.27880859375, 35.134765625, 36.99072265625, 38.8466796875, 40.70263671875, 42.55859375, 44.41455078125, 46.2705078125, 48.12646484375, 49.982421875, 51.83837890625, 53.6943359375, 55.55029296875, 57.40625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 25.0, 195.0, 513.0, 229.0, 44.0, 8.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.058589935302734, -35.57137680053711, -29.084163665771484, -22.596948623657227, -16.1097354888916, -9.622520446777344, -3.1353073120117188, 3.3519058227539062, 9.839118957519531, 16.326332092285156, 22.81354522705078, 29.30076026916504, 35.78797149658203, 42.27518844604492, 48.76240158081055, 55.24961471557617, 61.7368278503418, 68.22404479980469, 74.71125793457031, 81.19847106933594, 87.68568420410156, 94.17289733886719, 100.66011047363281, 107.14732360839844, 113.63453674316406, 120.12174987792969, 126.60896301269531, 133.09617614746094, 139.58338928222656, 146.0706024169922, 152.5578155517578, 159.04502868652344, 165.53224182128906, 172.0194549560547, 178.5066680908203, 184.99388122558594, 191.48109436035156, 197.9683074951172, 204.4555206298828, 210.94273376464844, 217.42994689941406, 223.9171600341797, 230.4043731689453, 236.89158630371094, 243.37879943847656, 249.8660125732422, 256.3532409667969, 262.8404541015625, 269.3276672363281, 275.81488037109375, 282.3020935058594, 288.789306640625, 295.2765197753906, 301.76373291015625, 308.2509460449219, 314.7381591796875, 321.2253723144531, 327.71258544921875, 334.1997985839844, 340.68701171875, 347.1742248535156, 353.66143798828125, 360.1486511230469, 366.6358642578125, 373.1230773925781]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 3.0, 5.0, 4.0, 15.0, 3.0, 10.0, 18.0, 20.0, 16.0, 18.0, 23.0, 28.0, 23.0, 18.0, 30.0, 37.0, 27.0, 37.0, 39.0, 37.0, 34.0, 44.0, 41.0, 38.0, 41.0, 39.0, 32.0, 38.0, 31.0, 23.0, 25.0, 25.0, 26.0, 25.0, 19.0, 26.0, 10.0, 10.0, 8.0, 7.0, 12.0, 9.0, 3.0, 11.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-65.70665740966797, -63.660003662109375, -61.61334991455078, -59.56669616699219, -57.520042419433594, -55.473388671875, -53.426734924316406, -51.38008117675781, -49.33342742919922, -47.286773681640625, -45.24011993408203, -43.19346618652344, -41.146812438964844, -39.10015869140625, -37.053504943847656, -35.00685119628906, -32.96019744873047, -30.913543701171875, -28.86688995361328, -26.820236206054688, -24.773582458496094, -22.7269287109375, -20.680274963378906, -18.633621215820312, -16.58696746826172, -14.540313720703125, -12.493659973144531, -10.447006225585938, -8.400352478027344, -6.35369873046875, -4.307044982910156, -2.2603912353515625, -0.21373748779296875, 1.832916259765625, 3.8795700073242188, 5.9262237548828125, 7.972877502441406, 10.01953125, 12.066184997558594, 14.112838745117188, 16.15949249267578, 18.206146240234375, 20.25279998779297, 22.299453735351562, 24.346107482910156, 26.39276123046875, 28.439414978027344, 30.486068725585938, 32.53272247314453, 34.579376220703125, 36.62602996826172, 38.67268371582031, 40.719337463378906, 42.7659912109375, 44.812644958496094, 46.85929870605469, 48.90595245361328, 50.952606201171875, 52.99925994873047, 55.04591369628906, 57.092567443847656, 59.13922119140625, 61.185874938964844, 63.23252868652344, 65.27918243408203]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 3.0, 6.0, 6.0, 4.0, 8.0, 13.0, 14.0, 16.0, 19.0, 21.0, 31.0, 38.0, 32.0, 34.0, 41.0, 28.0, 36.0, 39.0, 42.0, 36.0, 49.0, 41.0, 44.0, 42.0, 33.0, 34.0, 27.0, 36.0, 35.0, 29.0, 18.0, 17.0, 19.0, 15.0, 13.0, 10.0, 15.0, 17.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.125, -8.84326171875, -8.5615234375, -8.27978515625, -7.998046875, -7.71630859375, -7.4345703125, -7.15283203125, -6.87109375, -6.58935546875, -6.3076171875, -6.02587890625, -5.744140625, -5.46240234375, -5.1806640625, -4.89892578125, -4.6171875, -4.33544921875, -4.0537109375, -3.77197265625, -3.490234375, -3.20849609375, -2.9267578125, -2.64501953125, -2.36328125, -2.08154296875, -1.7998046875, -1.51806640625, -1.236328125, -0.95458984375, -0.6728515625, -0.39111328125, -0.109375, 0.17236328125, 0.4541015625, 0.73583984375, 1.017578125, 1.29931640625, 1.5810546875, 1.86279296875, 2.14453125, 2.42626953125, 2.7080078125, 2.98974609375, 3.271484375, 3.55322265625, 3.8349609375, 4.11669921875, 4.3984375, 4.68017578125, 4.9619140625, 5.24365234375, 5.525390625, 5.80712890625, 6.0888671875, 6.37060546875, 6.65234375, 6.93408203125, 7.2158203125, 7.49755859375, 7.779296875, 8.06103515625, 8.3427734375, 8.62451171875, 8.90625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 14.0, 11.0, 20.0, 35.0, 47.0, 64.0, 60.0, 91.0, 141.0, 191.0, 267.0, 422.0, 645.0, 1004.0, 1708.0, 2981.0, 6014.0, 15431.0, 64192.0, 478641.0, 2631514.0, 851708.0, 101756.0, 21067.0, 7490.0, 3474.0, 1910.0, 1145.0, 705.0, 477.0, 319.0, 193.0, 128.0, 108.0, 82.0, 56.0, 45.0, 31.0, 28.0, 15.0, 20.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-20.640625, -20.02685546875, -19.4130859375, -18.79931640625, -18.185546875, -17.57177734375, -16.9580078125, -16.34423828125, -15.73046875, -15.11669921875, -14.5029296875, -13.88916015625, -13.275390625, -12.66162109375, -12.0478515625, -11.43408203125, -10.8203125, -10.20654296875, -9.5927734375, -8.97900390625, -8.365234375, -7.75146484375, -7.1376953125, -6.52392578125, -5.91015625, -5.29638671875, -4.6826171875, -4.06884765625, -3.455078125, -2.84130859375, -2.2275390625, -1.61376953125, -1.0, -0.38623046875, 0.2275390625, 0.84130859375, 1.455078125, 2.06884765625, 2.6826171875, 3.29638671875, 3.91015625, 4.52392578125, 5.1376953125, 5.75146484375, 6.365234375, 6.97900390625, 7.5927734375, 8.20654296875, 8.8203125, 9.43408203125, 10.0478515625, 10.66162109375, 11.275390625, 11.88916015625, 12.5029296875, 13.11669921875, 13.73046875, 14.34423828125, 14.9580078125, 15.57177734375, 16.185546875, 16.79931640625, 17.4130859375, 18.02685546875, 18.640625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 3.0, 4.0, 5.0, 16.0, 20.0, 16.0, 21.0, 29.0, 42.0, 66.0, 92.0, 115.0, 232.0, 394.0, 700.0, 805.0, 632.0, 353.0, 208.0, 107.0, 71.0, 44.0, 22.0, 22.0, 8.0, 13.0, 14.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0, -24.3125, -23.625, -22.9375, -22.25, -21.5625, -20.875, -20.1875, -19.5, -18.8125, -18.125, -17.4375, -16.75, -16.0625, -15.375, -14.6875, -14.0, -13.3125, -12.625, -11.9375, -11.25, -10.5625, -9.875, -9.1875, -8.5, -7.8125, -7.125, -6.4375, -5.75, -5.0625, -4.375, -3.6875, -3.0, -2.3125, -1.625, -0.9375, -0.25, 0.4375, 1.125, 1.8125, 2.5, 3.1875, 3.875, 4.5625, 5.25, 5.9375, 6.625, 7.3125, 8.0, 8.6875, 9.375, 10.0625, 10.75, 11.4375, 12.125, 12.8125, 13.5, 14.1875, 14.875, 15.5625, 16.25, 16.9375, 17.625, 18.3125, 19.0]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 13.0, 19.0, 34.0, 32.0, 64.0, 101.0, 234.0, 538.0, 1349.0, 4563.0, 19522.0, 196583.0, 3771288.0, 174840.0, 18281.0, 4310.0, 1356.0, 547.0, 261.0, 115.0, 72.0, 42.0, 20.0, 32.0, 12.0, 12.0, 9.0, 1.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.78125, -47.00634765625, -45.2314453125, -43.45654296875, -41.681640625, -39.90673828125, -38.1318359375, -36.35693359375, -34.58203125, -32.80712890625, -31.0322265625, -29.25732421875, -27.482421875, -25.70751953125, -23.9326171875, -22.15771484375, -20.3828125, -18.60791015625, -16.8330078125, -15.05810546875, -13.283203125, -11.50830078125, -9.7333984375, -7.95849609375, -6.18359375, -4.40869140625, -2.6337890625, -0.85888671875, 0.916015625, 2.69091796875, 4.4658203125, 6.24072265625, 8.015625, 9.79052734375, 11.5654296875, 13.34033203125, 15.115234375, 16.89013671875, 18.6650390625, 20.43994140625, 22.21484375, 23.98974609375, 25.7646484375, 27.53955078125, 29.314453125, 31.08935546875, 32.8642578125, 34.63916015625, 36.4140625, 38.18896484375, 39.9638671875, 41.73876953125, 43.513671875, 45.28857421875, 47.0634765625, 48.83837890625, 50.61328125, 52.38818359375, 54.1630859375, 55.93798828125, 57.712890625, 59.48779296875, 61.2626953125, 63.03759765625, 64.8125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 8.0, 12.0, 28.0, 36.0, 56.0, 113.0, 176.0, 193.0, 156.0, 97.0, 63.0, 30.0, 18.0, 9.0, 9.0, 1.0, 3.0], "bins": [-205.96827697753906, -202.1875457763672, -198.4068145751953, -194.62606811523438, -190.8453369140625, -187.06460571289062, -183.28387451171875, -179.50314331054688, -175.722412109375, -171.94168090820312, -168.16094970703125, -164.38021850585938, -160.59947204589844, -156.81874084472656, -153.0380096435547, -149.2572784423828, -145.47653198242188, -141.69580078125, -137.91506958007812, -134.13433837890625, -130.3535919189453, -126.57286071777344, -122.79212951660156, -119.01139831542969, -115.23066711425781, -111.44993591308594, -107.66919708251953, -103.88846588134766, -100.10773468017578, -96.32699584960938, -92.5462646484375, -88.76553344726562, -84.98480224609375, -81.20407104492188, -77.42333221435547, -73.6426010131836, -69.86186981201172, -66.08113098144531, -62.30039978027344, -58.51966857910156, -54.738929748535156, -50.958194732666016, -47.17746353149414, -43.396728515625, -39.615997314453125, -35.835262298583984, -32.054527282714844, -28.273794174194336, -24.493061065673828, -20.71232795715332, -16.931594848632812, -13.150859832763672, -9.370126724243164, -5.589393615722656, -1.8086585998535156, 1.9720745086669922, 5.7528076171875, 9.533540725708008, 13.314274787902832, 17.095008850097656, 20.875741958618164, 24.656475067138672, 28.437210083007812, 32.21794128417969, 35.99867630004883]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 7.0, 2.0, 10.0, 14.0, 12.0, 10.0, 13.0, 18.0, 20.0, 27.0, 16.0, 31.0, 28.0, 27.0, 27.0, 36.0, 40.0, 36.0, 33.0, 31.0, 46.0, 44.0, 38.0, 48.0, 35.0, 20.0, 38.0, 26.0, 37.0, 18.0, 34.0, 28.0, 22.0, 16.0, 22.0, 14.0, 16.0, 13.0, 11.0, 10.0, 6.0, 4.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-52.46464538574219, -50.86648941040039, -49.268333435058594, -47.67018127441406, -46.072025299072266, -44.47386932373047, -42.87571334838867, -41.277557373046875, -39.67940139770508, -38.08124542236328, -36.483089447021484, -34.88493347167969, -33.286781311035156, -31.68862533569336, -30.090469360351562, -28.492313385009766, -26.8941593170166, -25.296003341674805, -23.69784927368164, -22.099693298339844, -20.501537322998047, -18.90338134765625, -17.305227279663086, -15.707071304321289, -14.108916282653809, -12.510761260986328, -10.912605285644531, -9.31445026397705, -7.716294765472412, -6.118139266967773, -4.519984245300293, -2.921828269958496, -1.3236732482910156, 0.2744821310043335, 1.8726375102996826, 3.470792770385742, 5.068948268890381, 6.6671037673950195, 8.2652587890625, 9.863414764404297, 11.461569786071777, 13.059724807739258, 14.657880783081055, 16.25603485107422, 17.854190826416016, 19.452346801757812, 21.05050277709961, 22.648658752441406, 24.24681282043457, 25.844968795776367, 27.44312286376953, 29.041278839111328, 30.639434814453125, 32.23759078979492, 33.83574676513672, 35.43389892578125, 37.03205490112305, 38.630210876464844, 40.22836685180664, 41.82652282714844, 43.42467498779297, 45.022830963134766, 46.62098693847656, 48.21914291381836, 49.817298889160156]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 6.0, 8.0, 6.0, 12.0, 15.0, 11.0, 18.0, 22.0, 32.0, 14.0, 36.0, 42.0, 36.0, 30.0, 41.0, 38.0, 39.0, 50.0, 33.0, 34.0, 50.0, 37.0, 45.0, 34.0, 33.0, 30.0, 31.0, 28.0, 16.0, 18.0, 20.0, 18.0, 17.0, 19.0, 10.0, 16.0, 11.0, 7.0, 1.0, 7.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.801513671875, -8.51708984375, -8.232666015625, -7.9482421875, -7.663818359375, -7.37939453125, -7.094970703125, -6.810546875, -6.526123046875, -6.24169921875, -5.957275390625, -5.6728515625, -5.388427734375, -5.10400390625, -4.819580078125, -4.53515625, -4.250732421875, -3.96630859375, -3.681884765625, -3.3974609375, -3.113037109375, -2.82861328125, -2.544189453125, -2.259765625, -1.975341796875, -1.69091796875, -1.406494140625, -1.1220703125, -0.837646484375, -0.55322265625, -0.268798828125, 0.015625, 0.300048828125, 0.58447265625, 0.868896484375, 1.1533203125, 1.437744140625, 1.72216796875, 2.006591796875, 2.291015625, 2.575439453125, 2.85986328125, 3.144287109375, 3.4287109375, 3.713134765625, 3.99755859375, 4.281982421875, 4.56640625, 4.850830078125, 5.13525390625, 5.419677734375, 5.7041015625, 5.988525390625, 6.27294921875, 6.557373046875, 6.841796875, 7.126220703125, 7.41064453125, 7.695068359375, 7.9794921875, 8.263916015625, 8.54833984375, 8.832763671875, 9.1171875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 1.0, 5.0, 6.0, 4.0, 17.0, 16.0, 30.0, 38.0, 50.0, 84.0, 122.0, 159.0, 241.0, 339.0, 467.0, 735.0, 1064.0, 1508.0, 2264.0, 3329.0, 4847.0, 7174.0, 10599.0, 16291.0, 24143.0, 36653.0, 56634.0, 84709.0, 123680.0, 159946.0, 156396.0, 118672.0, 80465.0, 53439.0, 34494.0, 23123.0, 15426.0, 10115.0, 6743.0, 4562.0, 3173.0, 2140.0, 1408.0, 971.0, 677.0, 501.0, 330.0, 266.0, 167.0, 115.0, 62.0, 55.0, 42.0, 20.0, 17.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.7587890625, -0.7342605590820312, -0.7097320556640625, -0.6852035522460938, -0.660675048828125, -0.6361465454101562, -0.6116180419921875, -0.5870895385742188, -0.56256103515625, -0.5380325317382812, -0.5135040283203125, -0.48897552490234375, -0.464447021484375, -0.43991851806640625, -0.4153900146484375, -0.39086151123046875, -0.3663330078125, -0.34180450439453125, -0.3172760009765625, -0.29274749755859375, -0.268218994140625, -0.24369049072265625, -0.2191619873046875, -0.19463348388671875, -0.17010498046875, -0.14557647705078125, -0.1210479736328125, -0.09651947021484375, -0.071990966796875, -0.04746246337890625, -0.0229339599609375, 0.00159454345703125, 0.026123046875, 0.05065155029296875, 0.0751800537109375, 0.09970855712890625, 0.124237060546875, 0.14876556396484375, 0.1732940673828125, 0.19782257080078125, 0.22235107421875, 0.24687957763671875, 0.2714080810546875, 0.29593658447265625, 0.320465087890625, 0.34499359130859375, 0.3695220947265625, 0.39405059814453125, 0.4185791015625, 0.44310760498046875, 0.4676361083984375, 0.49216461181640625, 0.516693115234375, 0.5412216186523438, 0.5657501220703125, 0.5902786254882812, 0.61480712890625, 0.6393356323242188, 0.6638641357421875, 0.6883926391601562, 0.712921142578125, 0.7374496459960938, 0.7619781494140625, 0.7865066528320312, 0.81103515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 4.0, 7.0, 9.0, 4.0, 12.0, 16.0, 18.0, 14.0, 30.0, 21.0, 23.0, 24.0, 30.0, 28.0, 37.0, 28.0, 31.0, 40.0, 43.0, 47.0, 1076.0, 31.0, 36.0, 33.0, 36.0, 37.0, 18.0, 42.0, 15.0, 33.0, 30.0, 18.0, 22.0, 14.0, 19.0, 13.0, 11.0, 15.0, 18.0, 10.0, 5.0, 8.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.07366943359375, -5.8856201171875, -5.69757080078125, -5.509521484375, -5.32147216796875, -5.1334228515625, -4.94537353515625, -4.75732421875, -4.56927490234375, -4.3812255859375, -4.19317626953125, -4.005126953125, -3.81707763671875, -3.6290283203125, -3.44097900390625, -3.2529296875, -3.06488037109375, -2.8768310546875, -2.68878173828125, -2.500732421875, -2.31268310546875, -2.1246337890625, -1.93658447265625, -1.74853515625, -1.56048583984375, -1.3724365234375, -1.18438720703125, -0.996337890625, -0.80828857421875, -0.6202392578125, -0.43218994140625, -0.244140625, -0.05609130859375, 0.1319580078125, 0.32000732421875, 0.508056640625, 0.69610595703125, 0.8841552734375, 1.07220458984375, 1.26025390625, 1.44830322265625, 1.6363525390625, 1.82440185546875, 2.012451171875, 2.20050048828125, 2.3885498046875, 2.57659912109375, 2.7646484375, 2.95269775390625, 3.1407470703125, 3.32879638671875, 3.516845703125, 3.70489501953125, 3.8929443359375, 4.08099365234375, 4.26904296875, 4.45709228515625, 4.6451416015625, 4.83319091796875, 5.021240234375, 5.20928955078125, 5.3973388671875, 5.58538818359375, 5.7734375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 11.0, 21.0, 21.0, 23.0, 31.0, 41.0, 82.0, 105.0, 160.0, 194.0, 354.0, 444.0, 691.0, 951.0, 1397.0, 2111.0, 3217.0, 5112.0, 8557.0, 14880.0, 30141.0, 153918.0, 1755318.0, 65300.0, 22404.0, 11729.0, 6928.0, 4201.0, 2807.0, 1795.0, 1292.0, 894.0, 601.0, 427.0, 281.0, 206.0, 148.0, 107.0, 75.0, 54.0, 31.0, 15.0, 15.0, 5.0, 14.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.01171875, -1.953094482421875, -1.89447021484375, -1.835845947265625, -1.7772216796875, -1.718597412109375, -1.65997314453125, -1.601348876953125, -1.542724609375, -1.484100341796875, -1.42547607421875, -1.366851806640625, -1.3082275390625, -1.249603271484375, -1.19097900390625, -1.132354736328125, -1.07373046875, -1.015106201171875, -0.95648193359375, -0.897857666015625, -0.8392333984375, -0.780609130859375, -0.72198486328125, -0.663360595703125, -0.604736328125, -0.546112060546875, -0.48748779296875, -0.428863525390625, -0.3702392578125, -0.311614990234375, -0.25299072265625, -0.194366455078125, -0.1357421875, -0.077117919921875, -0.01849365234375, 0.040130615234375, 0.0987548828125, 0.157379150390625, 0.21600341796875, 0.274627685546875, 0.333251953125, 0.391876220703125, 0.45050048828125, 0.509124755859375, 0.5677490234375, 0.626373291015625, 0.68499755859375, 0.743621826171875, 0.80224609375, 0.860870361328125, 0.91949462890625, 0.978118896484375, 1.0367431640625, 1.095367431640625, 1.15399169921875, 1.212615966796875, 1.271240234375, 1.329864501953125, 1.38848876953125, 1.447113037109375, 1.5057373046875, 1.564361572265625, 1.62298583984375, 1.681610107421875, 1.740234375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 6.0, 12.0, 10.0, 12.0, 14.0, 16.0, 6.0, 16.0, 17.0, 30.0, 21.0, 29.0, 24.0, 29.0, 31.0, 43.0, 32.0, 41.0, 37.0, 51.0, 41.0, 35.0, 54.0, 32.0, 40.0, 46.0, 33.0, 30.0, 40.0, 22.0, 26.0, 17.0, 17.0, 21.0, 17.0, 9.0, 11.0, 5.0, 9.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.045074462890625, -0.04375314712524414, -0.04243183135986328, -0.04111051559448242, -0.03978919982910156, -0.0384678840637207, -0.037146568298339844, -0.035825252532958984, -0.034503936767578125, -0.033182621002197266, -0.031861305236816406, -0.030539989471435547, -0.029218673706054688, -0.027897357940673828, -0.02657604217529297, -0.02525472640991211, -0.02393341064453125, -0.02261209487915039, -0.02129077911376953, -0.019969463348388672, -0.018648147583007812, -0.017326831817626953, -0.016005516052246094, -0.014684200286865234, -0.013362884521484375, -0.012041568756103516, -0.010720252990722656, -0.009398937225341797, -0.008077621459960938, -0.006756305694580078, -0.005434989929199219, -0.004113674163818359, -0.0027923583984375, -0.0014710426330566406, -0.00014972686767578125, 0.0011715888977050781, 0.0024929046630859375, 0.003814220428466797, 0.005135536193847656, 0.006456851959228516, 0.007778167724609375, 0.009099483489990234, 0.010420799255371094, 0.011742115020751953, 0.013063430786132812, 0.014384746551513672, 0.01570606231689453, 0.01702737808227539, 0.01834869384765625, 0.01967000961303711, 0.02099132537841797, 0.022312641143798828, 0.023633956909179688, 0.024955272674560547, 0.026276588439941406, 0.027597904205322266, 0.028919219970703125, 0.030240535736083984, 0.031561851501464844, 0.0328831672668457, 0.03420448303222656, 0.03552579879760742, 0.03684711456298828, 0.03816843032836914, 0.03948974609375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 7.0, 6.0, 10.0, 23.0, 20.0, 25.0, 21.0, 33.0, 44.0, 69.0, 77.0, 107.0, 129.0, 199.0, 403.0, 1222.0, 22696.0, 820620.0, 197133.0, 4181.0, 556.0, 275.0, 171.0, 107.0, 80.0, 61.0, 60.0, 38.0, 27.0, 24.0, 26.0, 11.0, 18.0, 10.0, 11.0, 7.0, 10.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.82568359375, -0.7979354858398438, -0.7701873779296875, -0.7424392700195312, -0.714691162109375, -0.6869430541992188, -0.6591949462890625, -0.6314468383789062, -0.60369873046875, -0.5759506225585938, -0.5482025146484375, -0.5204544067382812, -0.492706298828125, -0.46495819091796875, -0.4372100830078125, -0.40946197509765625, -0.3817138671875, -0.35396575927734375, -0.3262176513671875, -0.29846954345703125, -0.270721435546875, -0.24297332763671875, -0.2152252197265625, -0.18747711181640625, -0.15972900390625, -0.13198089599609375, -0.1042327880859375, -0.07648468017578125, -0.048736572265625, -0.02098846435546875, 0.0067596435546875, 0.03450775146484375, 0.062255859375, 0.09000396728515625, 0.1177520751953125, 0.14550018310546875, 0.173248291015625, 0.20099639892578125, 0.2287445068359375, 0.25649261474609375, 0.28424072265625, 0.31198883056640625, 0.3397369384765625, 0.36748504638671875, 0.395233154296875, 0.42298126220703125, 0.4507293701171875, 0.47847747802734375, 0.5062255859375, 0.5339736938476562, 0.5617218017578125, 0.5894699096679688, 0.617218017578125, 0.6449661254882812, 0.6727142333984375, 0.7004623413085938, 0.72821044921875, 0.7559585571289062, 0.7837066650390625, 0.8114547729492188, 0.839202880859375, 0.8669509887695312, 0.8946990966796875, 0.9224472045898438, 0.9501953125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 24.0, 56.0, 174.0, 353.0, 243.0, 94.0, 36.0, 19.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0666302740573883, -0.057972416281700134, -0.049314554780721664, -0.040656693279743195, -0.03199883550405502, -0.023340977728366852, -0.014683116227388382, -0.006025254726409912, 0.0026326030492782593, 0.01129046268761158, 0.0199483223259449, 0.02860618196427822, 0.03726404160261154, 0.04592189937829971, 0.05457976087927818, 0.06323762238025665, 0.07189548015594482, 0.080553337931633, 0.08921119570732117, 0.09786906093358994, 0.1065269187092781, 0.11518477648496628, 0.12384264171123505, 0.13250049948692322, 0.1411583572626114, 0.14981621503829956, 0.15847407281398773, 0.1671319305896759, 0.17578980326652527, 0.18444764614105225, 0.1931055188179016, 0.20176337659358978, 0.21042123436927795, 0.21907909214496613, 0.2277369499206543, 0.23639480769634247, 0.24505266547203064, 0.25371053814888, 0.262368381023407, 0.27102625370025635, 0.2796841263771057, 0.2883419990539551, 0.29699984192848206, 0.3056577146053314, 0.3143155574798584, 0.32297343015670776, 0.33163127303123474, 0.3402891457080841, 0.3489469885826111, 0.35760486125946045, 0.3662627041339874, 0.3749205768108368, 0.38357841968536377, 0.39223629236221313, 0.4008941352367401, 0.4095520079135895, 0.41820985078811646, 0.4268677234649658, 0.4355255663394928, 0.44418343901634216, 0.45284128189086914, 0.4614991545677185, 0.4701569974422455, 0.47881487011909485, 0.4874727427959442]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 2.0, 3.0, 7.0, 12.0, 5.0, 22.0, 29.0, 26.0, 27.0, 20.0, 42.0, 34.0, 34.0, 47.0, 41.0, 46.0, 47.0, 47.0, 46.0, 42.0, 47.0, 45.0, 45.0, 36.0, 34.0, 39.0, 23.0, 31.0, 22.0, 23.0, 14.0, 13.0, 10.0, 14.0, 7.0, 3.0, 2.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.060799479484558105, -0.05910597741603851, -0.05741247162222862, -0.05571896582841873, -0.05402546375989914, -0.05233196169137955, -0.050638455897569656, -0.048944950103759766, -0.04725144803524017, -0.04555794596672058, -0.04386444017291069, -0.0421709343791008, -0.04047743231058121, -0.038783930242061615, -0.037090424448251724, -0.035396918654441833, -0.03370341658592224, -0.03200991451740265, -0.030316408723592758, -0.028622904792428017, -0.026929400861263275, -0.025235896930098534, -0.023542392998933792, -0.02184888906776905, -0.02015538513660431, -0.018461881205439568, -0.016768377274274826, -0.015074873343110085, -0.013381369411945343, -0.011687865480780602, -0.00999436154961586, -0.008300857618451118, -0.006607353687286377, -0.0049138497561216354, -0.003220345824956894, -0.0015268418937921524, 0.0001666620373725891, 0.0018601659685373306, 0.003553669899702072, 0.005247173830866814, 0.006940677762031555, 0.008634181693196297, 0.010327685624361038, 0.01202118955552578, 0.013714693486690521, 0.015408197417855263, 0.017101701349020004, 0.018795205280184746, 0.020488709211349487, 0.02218221314251423, 0.02387571707367897, 0.025569221004843712, 0.027262724936008453, 0.028956228867173195, 0.030649732798337936, 0.03234323859214783, 0.03403674066066742, 0.03573024272918701, 0.0374237485229969, 0.03911725431680679, 0.040810756385326385, 0.04250425845384598, 0.04419776424765587, 0.04589127004146576, 0.04758477210998535]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 6.0, 8.0, 6.0, 12.0, 15.0, 11.0, 19.0, 21.0, 32.0, 14.0, 35.0, 42.0, 37.0, 30.0, 41.0, 38.0, 38.0, 49.0, 35.0, 34.0, 50.0, 37.0, 45.0, 34.0, 33.0, 30.0, 31.0, 28.0, 16.0, 18.0, 20.0, 18.0, 16.0, 20.0, 10.0, 16.0, 11.0, 7.0, 1.0, 7.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.801513671875, -8.51708984375, -8.232666015625, -7.9482421875, -7.663818359375, -7.37939453125, -7.094970703125, -6.810546875, -6.526123046875, -6.24169921875, -5.957275390625, -5.6728515625, -5.388427734375, -5.10400390625, -4.819580078125, -4.53515625, -4.250732421875, -3.96630859375, -3.681884765625, -3.3974609375, -3.113037109375, -2.82861328125, -2.544189453125, -2.259765625, -1.975341796875, -1.69091796875, -1.406494140625, -1.1220703125, -0.837646484375, -0.55322265625, -0.268798828125, 0.015625, 0.300048828125, 0.58447265625, 0.868896484375, 1.1533203125, 1.437744140625, 1.72216796875, 2.006591796875, 2.291015625, 2.575439453125, 2.85986328125, 3.144287109375, 3.4287109375, 3.713134765625, 3.99755859375, 4.281982421875, 4.56640625, 4.850830078125, 5.13525390625, 5.419677734375, 5.7041015625, 5.988525390625, 6.27294921875, 6.557373046875, 6.841796875, 7.126220703125, 7.41064453125, 7.695068359375, 7.9794921875, 8.263916015625, 8.54833984375, 8.832763671875, 9.1171875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 21.0, 43.0, 56.0, 73.0, 106.0, 176.0, 259.0, 398.0, 584.0, 1002.0, 1574.0, 2550.0, 4025.0, 6664.0, 11222.0, 19617.0, 38036.0, 87599.0, 238159.0, 357424.0, 153091.0, 59768.0, 27955.0, 14881.0, 8884.0, 5381.0, 3264.0, 2138.0, 1333.0, 785.0, 514.0, 332.0, 231.0, 133.0, 71.0, 65.0, 32.0, 25.0, 18.0, 15.0, 10.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2890625, -13.832275390625, -13.37548828125, -12.918701171875, -12.4619140625, -12.005126953125, -11.54833984375, -11.091552734375, -10.634765625, -10.177978515625, -9.72119140625, -9.264404296875, -8.8076171875, -8.350830078125, -7.89404296875, -7.437255859375, -6.98046875, -6.523681640625, -6.06689453125, -5.610107421875, -5.1533203125, -4.696533203125, -4.23974609375, -3.782958984375, -3.326171875, -2.869384765625, -2.41259765625, -1.955810546875, -1.4990234375, -1.042236328125, -0.58544921875, -0.128662109375, 0.328125, 0.784912109375, 1.24169921875, 1.698486328125, 2.1552734375, 2.612060546875, 3.06884765625, 3.525634765625, 3.982421875, 4.439208984375, 4.89599609375, 5.352783203125, 5.8095703125, 6.266357421875, 6.72314453125, 7.179931640625, 7.63671875, 8.093505859375, 8.55029296875, 9.007080078125, 9.4638671875, 9.920654296875, 10.37744140625, 10.834228515625, 11.291015625, 11.747802734375, 12.20458984375, 12.661376953125, 13.1181640625, 13.574951171875, 14.03173828125, 14.488525390625, 14.9453125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 5.0, 12.0, 12.0, 12.0, 16.0, 18.0, 29.0, 24.0, 23.0, 28.0, 35.0, 40.0, 48.0, 57.0, 83.0, 154.0, 256.0, 1387.0, 206.0, 113.0, 92.0, 57.0, 48.0, 41.0, 33.0, 37.0, 25.0, 28.0, 25.0, 19.0, 17.0, 13.0, 12.0, 11.0, 8.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.328125, -22.47607421875, -21.6240234375, -20.77197265625, -19.919921875, -19.06787109375, -18.2158203125, -17.36376953125, -16.51171875, -15.65966796875, -14.8076171875, -13.95556640625, -13.103515625, -12.25146484375, -11.3994140625, -10.54736328125, -9.6953125, -8.84326171875, -7.9912109375, -7.13916015625, -6.287109375, -5.43505859375, -4.5830078125, -3.73095703125, -2.87890625, -2.02685546875, -1.1748046875, -0.32275390625, 0.529296875, 1.38134765625, 2.2333984375, 3.08544921875, 3.9375, 4.78955078125, 5.6416015625, 6.49365234375, 7.345703125, 8.19775390625, 9.0498046875, 9.90185546875, 10.75390625, 11.60595703125, 12.4580078125, 13.31005859375, 14.162109375, 15.01416015625, 15.8662109375, 16.71826171875, 17.5703125, 18.42236328125, 19.2744140625, 20.12646484375, 20.978515625, 21.83056640625, 22.6826171875, 23.53466796875, 24.38671875, 25.23876953125, 26.0908203125, 26.94287109375, 27.794921875, 28.64697265625, 29.4990234375, 30.35107421875, 31.203125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 8.0, 4.0, 4.0, 9.0, 10.0, 10.0, 15.0, 27.0, 47.0, 51.0, 80.0, 132.0, 212.0, 344.0, 678.0, 1551.0, 4208.0, 12848.0, 49995.0, 546967.0, 2355920.0, 135405.0, 25068.0, 7286.0, 2597.0, 1004.0, 495.0, 289.0, 143.0, 94.0, 72.0, 36.0, 27.0, 16.0, 16.0, 13.0, 5.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-42.5625, -41.388671875, -40.21484375, -39.041015625, -37.8671875, -36.693359375, -35.51953125, -34.345703125, -33.171875, -31.998046875, -30.82421875, -29.650390625, -28.4765625, -27.302734375, -26.12890625, -24.955078125, -23.78125, -22.607421875, -21.43359375, -20.259765625, -19.0859375, -17.912109375, -16.73828125, -15.564453125, -14.390625, -13.216796875, -12.04296875, -10.869140625, -9.6953125, -8.521484375, -7.34765625, -6.173828125, -5.0, -3.826171875, -2.65234375, -1.478515625, -0.3046875, 0.869140625, 2.04296875, 3.216796875, 4.390625, 5.564453125, 6.73828125, 7.912109375, 9.0859375, 10.259765625, 11.43359375, 12.607421875, 13.78125, 14.955078125, 16.12890625, 17.302734375, 18.4765625, 19.650390625, 20.82421875, 21.998046875, 23.171875, 24.345703125, 25.51953125, 26.693359375, 27.8671875, 29.041015625, 30.21484375, 31.388671875, 32.5625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 128.0, 860.0, 26.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.8132781982422, -104.7552490234375, -80.69722747802734, -56.63920593261719, -32.5811767578125, -8.523147583007812, 15.534866333007812, 39.5928955078125, 63.65092468261719, 87.70895385742188, 111.76697540283203, 135.8249969482422, 159.88302612304688, 183.94105529785156, 207.9990692138672, 232.05709838867188, 256.1151123046875, 280.1731262207031, 304.2311706542969, 328.2891845703125, 352.34722900390625, 376.4052429199219, 400.4632568359375, 424.52130126953125, 448.579345703125, 472.6373596191406, 496.6954040527344, 520.75341796875, 544.8114624023438, 568.8695068359375, 592.927490234375, 616.9855346679688, 641.0435791015625, 665.1016235351562, 689.1596069335938, 713.2176513671875, 737.2756958007812, 761.333740234375, 785.3917236328125, 809.4497680664062, 833.5078125, 857.5658569335938, 881.6238403320312, 905.681884765625, 929.7399291992188, 953.7979736328125, 977.85595703125, 1001.9140014648438, 1025.971923828125, 1050.0299072265625, 1074.0880126953125, 1098.14599609375, 1122.2039794921875, 1146.2620849609375, 1170.320068359375, 1194.3780517578125, 1218.4361572265625, 1242.494140625, 1266.55224609375, 1290.6102294921875, 1314.668212890625, 1338.726318359375, 1362.7843017578125, 1386.84228515625, 1410.900390625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 9.0, 11.0, 10.0, 15.0, 18.0, 16.0, 29.0, 23.0, 32.0, 29.0, 24.0, 27.0, 39.0, 43.0, 41.0, 46.0, 43.0, 55.0, 48.0, 43.0, 42.0, 36.0, 37.0, 45.0, 34.0, 33.0, 20.0, 21.0, 22.0, 11.0, 18.0, 18.0, 11.0, 10.0, 5.0, 9.0, 4.0, 2.0, 2.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.98616790771484, -68.80818939208984, -66.63021850585938, -64.45223999023438, -62.27426528930664, -60.096290588378906, -57.918312072753906, -55.74033737182617, -53.56236267089844, -51.3843879699707, -49.20641326904297, -47.02843475341797, -44.850460052490234, -42.6724853515625, -40.4945068359375, -38.316532135009766, -36.13855743408203, -33.9605827331543, -31.78260612487793, -29.604629516601562, -27.426654815673828, -25.248680114746094, -23.070703506469727, -20.89272689819336, -18.714752197265625, -16.53677749633789, -14.358800888061523, -12.180825233459473, -10.002849578857422, -7.824873924255371, -5.64689826965332, -3.4689226150512695, -1.2909393310546875, 0.8870363235473633, 3.065011978149414, 5.242987632751465, 7.420963287353516, 9.598938941955566, 11.776914596557617, 13.954890251159668, 16.13286590576172, 18.310840606689453, 20.48881721496582, 22.666793823242188, 24.844768524169922, 27.022743225097656, 29.200719833374023, 31.37869644165039, 33.556671142578125, 35.73464584350586, 37.912620544433594, 40.090599060058594, 42.26857376098633, 44.44654846191406, 46.62452697753906, 48.8025016784668, 50.98047637939453, 53.158451080322266, 55.33642578125, 57.514404296875, 59.692378997802734, 61.87035369873047, 64.04833221435547, 66.22630310058594, 68.40428161621094]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 6.0, 8.0, 22.0, 14.0, 24.0, 28.0, 21.0, 40.0, 30.0, 35.0, 30.0, 50.0, 55.0, 58.0, 39.0, 48.0, 41.0, 48.0, 43.0, 36.0, 34.0, 25.0, 25.0, 30.0, 36.0, 19.0, 22.0, 16.0, 16.0, 15.0, 13.0, 14.0, 8.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-11.3515625, -11.0330810546875, -10.714599609375, -10.3961181640625, -10.07763671875, -9.7591552734375, -9.440673828125, -9.1221923828125, -8.8037109375, -8.4852294921875, -8.166748046875, -7.8482666015625, -7.52978515625, -7.2113037109375, -6.892822265625, -6.5743408203125, -6.255859375, -5.9373779296875, -5.618896484375, -5.3004150390625, -4.98193359375, -4.6634521484375, -4.344970703125, -4.0264892578125, -3.7080078125, -3.3895263671875, -3.071044921875, -2.7525634765625, -2.43408203125, -2.1156005859375, -1.797119140625, -1.4786376953125, -1.16015625, -0.8416748046875, -0.523193359375, -0.2047119140625, 0.11376953125, 0.4322509765625, 0.750732421875, 1.0692138671875, 1.3876953125, 1.7061767578125, 2.024658203125, 2.3431396484375, 2.66162109375, 2.9801025390625, 3.298583984375, 3.6170654296875, 3.935546875, 4.2540283203125, 4.572509765625, 4.8909912109375, 5.20947265625, 5.5279541015625, 5.846435546875, 6.1649169921875, 6.4833984375, 6.8018798828125, 7.120361328125, 7.4388427734375, 7.75732421875, 8.0758056640625, 8.394287109375, 8.7127685546875, 9.03125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 22.0, 18.0, 32.0, 48.0, 55.0, 81.0, 119.0, 144.0, 225.0, 323.0, 540.0, 832.0, 1340.0, 2192.0, 3968.0, 7984.0, 19599.0, 73154.0, 420807.0, 2219279.0, 1196021.0, 183020.0, 37712.0, 12598.0, 5912.0, 3143.0, 1803.0, 1055.0, 718.0, 488.0, 298.0, 219.0, 143.0, 102.0, 71.0, 53.0, 28.0, 32.0, 21.0, 20.0, 16.0, 6.0, 8.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.4453125, -14.9434814453125, -14.441650390625, -13.9398193359375, -13.43798828125, -12.9361572265625, -12.434326171875, -11.9324951171875, -11.4306640625, -10.9288330078125, -10.427001953125, -9.9251708984375, -9.42333984375, -8.9215087890625, -8.419677734375, -7.9178466796875, -7.416015625, -6.9141845703125, -6.412353515625, -5.9105224609375, -5.40869140625, -4.9068603515625, -4.405029296875, -3.9031982421875, -3.4013671875, -2.8995361328125, -2.397705078125, -1.8958740234375, -1.39404296875, -0.8922119140625, -0.390380859375, 0.1114501953125, 0.61328125, 1.1151123046875, 1.616943359375, 2.1187744140625, 2.62060546875, 3.1224365234375, 3.624267578125, 4.1260986328125, 4.6279296875, 5.1297607421875, 5.631591796875, 6.1334228515625, 6.63525390625, 7.1370849609375, 7.638916015625, 8.1407470703125, 8.642578125, 9.1444091796875, 9.646240234375, 10.1480712890625, 10.64990234375, 11.1517333984375, 11.653564453125, 12.1553955078125, 12.6572265625, 13.1590576171875, 13.660888671875, 14.1627197265625, 14.66455078125, 15.1663818359375, 15.668212890625, 16.1700439453125, 16.671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 4.0, 10.0, 18.0, 24.0, 30.0, 40.0, 70.0, 89.0, 127.0, 213.0, 354.0, 579.0, 805.0, 577.0, 407.0, 221.0, 153.0, 103.0, 54.0, 46.0, 21.0, 21.0, 18.0, 13.0, 12.0, 8.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.765625, -19.2244873046875, -18.683349609375, -18.1422119140625, -17.60107421875, -17.0599365234375, -16.518798828125, -15.9776611328125, -15.4365234375, -14.8953857421875, -14.354248046875, -13.8131103515625, -13.27197265625, -12.7308349609375, -12.189697265625, -11.6485595703125, -11.107421875, -10.5662841796875, -10.025146484375, -9.4840087890625, -8.94287109375, -8.4017333984375, -7.860595703125, -7.3194580078125, -6.7783203125, -6.2371826171875, -5.696044921875, -5.1549072265625, -4.61376953125, -4.0726318359375, -3.531494140625, -2.9903564453125, -2.44921875, -1.9080810546875, -1.366943359375, -0.8258056640625, -0.28466796875, 0.2564697265625, 0.797607421875, 1.3387451171875, 1.8798828125, 2.4210205078125, 2.962158203125, 3.5032958984375, 4.04443359375, 4.5855712890625, 5.126708984375, 5.6678466796875, 6.208984375, 6.7501220703125, 7.291259765625, 7.8323974609375, 8.37353515625, 8.9146728515625, 9.455810546875, 9.9969482421875, 10.5380859375, 11.0792236328125, 11.620361328125, 12.1614990234375, 12.70263671875, 13.2437744140625, 13.784912109375, 14.3260498046875, 14.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 3.0, 7.0, 10.0, 11.0, 14.0, 18.0, 30.0, 44.0, 73.0, 97.0, 155.0, 256.0, 375.0, 640.0, 1168.0, 2173.0, 4770.0, 10844.0, 30098.0, 118686.0, 1415909.0, 2376321.0, 170871.0, 37465.0, 13015.0, 5398.0, 2620.0, 1287.0, 724.0, 415.0, 267.0, 159.0, 112.0, 72.0, 50.0, 37.0, 27.0, 11.0, 9.0, 14.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-30.546875, -29.676513671875, -28.80615234375, -27.935791015625, -27.0654296875, -26.195068359375, -25.32470703125, -24.454345703125, -23.583984375, -22.713623046875, -21.84326171875, -20.972900390625, -20.1025390625, -19.232177734375, -18.36181640625, -17.491455078125, -16.62109375, -15.750732421875, -14.88037109375, -14.010009765625, -13.1396484375, -12.269287109375, -11.39892578125, -10.528564453125, -9.658203125, -8.787841796875, -7.91748046875, -7.047119140625, -6.1767578125, -5.306396484375, -4.43603515625, -3.565673828125, -2.6953125, -1.824951171875, -0.95458984375, -0.084228515625, 0.7861328125, 1.656494140625, 2.52685546875, 3.397216796875, 4.267578125, 5.137939453125, 6.00830078125, 6.878662109375, 7.7490234375, 8.619384765625, 9.48974609375, 10.360107421875, 11.23046875, 12.100830078125, 12.97119140625, 13.841552734375, 14.7119140625, 15.582275390625, 16.45263671875, 17.322998046875, 18.193359375, 19.063720703125, 19.93408203125, 20.804443359375, 21.6748046875, 22.545166015625, 23.41552734375, 24.285888671875, 25.15625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 7.0, 7.0, 5.0, 15.0, 18.0, 14.0, 25.0, 26.0, 32.0, 38.0, 65.0, 58.0, 67.0, 82.0, 88.0, 86.0, 75.0, 61.0, 50.0, 35.0, 32.0, 29.0, 21.0, 12.0, 13.0, 12.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.7536506652832, -41.252784729003906, -39.751914978027344, -38.25104522705078, -36.750179290771484, -35.24931335449219, -33.748443603515625, -32.24757385253906, -30.746707916259766, -29.245840072631836, -27.744972229003906, -26.244104385375977, -24.743236541748047, -23.242368698120117, -21.741500854492188, -20.240633010864258, -18.739765167236328, -17.2388973236084, -15.738029479980469, -14.237161636352539, -12.73629379272461, -11.23542594909668, -9.73455810546875, -8.23369026184082, -6.732822418212891, -5.231954574584961, -3.7310867309570312, -2.2302188873291016, -0.7293510437011719, 0.7715167999267578, 2.2723846435546875, 3.773252487182617, 5.2741241455078125, 6.774991989135742, 8.275859832763672, 9.776727676391602, 11.277595520019531, 12.778463363647461, 14.27933120727539, 15.78019905090332, 17.28106689453125, 18.78193473815918, 20.28280258178711, 21.78367042541504, 23.28453826904297, 24.7854061126709, 26.286273956298828, 27.787141799926758, 29.288009643554688, 30.788877487182617, 32.28974533081055, 33.790611267089844, 35.291481018066406, 36.79235076904297, 38.293216705322266, 39.79408264160156, 41.294952392578125, 42.79582214355469, 44.296688079833984, 45.79755401611328, 47.298423767089844, 48.799293518066406, 50.3001594543457, 51.801025390625, 53.30189514160156]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 9.0, 12.0, 7.0, 12.0, 11.0, 24.0, 17.0, 24.0, 24.0, 31.0, 34.0, 28.0, 33.0, 34.0, 46.0, 34.0, 49.0, 33.0, 50.0, 41.0, 41.0, 46.0, 39.0, 34.0, 32.0, 27.0, 27.0, 30.0, 28.0, 25.0, 17.0, 23.0, 16.0, 13.0, 14.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-45.515384674072266, -43.931427001953125, -42.347469329833984, -40.763511657714844, -39.1795539855957, -37.59559631347656, -36.011634826660156, -34.42768096923828, -32.843719482421875, -31.259761810302734, -29.675804138183594, -28.091846466064453, -26.507888793945312, -24.923931121826172, -23.3399715423584, -21.756013870239258, -20.17205810546875, -18.58810043334961, -17.00414276123047, -15.420184135437012, -13.836226463317871, -12.25226879119873, -10.668310165405273, -9.084352493286133, -7.500394821166992, -5.916437149047852, -4.332479000091553, -2.748520851135254, -1.1645631790161133, 0.41939449310302734, 2.0033531188964844, 3.587310791015625, 5.1712646484375, 6.755222320556641, 8.339179992675781, 9.923138618469238, 11.507096290588379, 13.09105396270752, 14.675012588500977, 16.258970260620117, 17.842927932739258, 19.4268856048584, 21.01084327697754, 22.594802856445312, 24.178760528564453, 25.762718200683594, 27.346675872802734, 28.930633544921875, 30.514591217041016, 32.098548889160156, 33.6825065612793, 35.26646423339844, 36.85042190551758, 38.43437957763672, 40.018341064453125, 41.602294921875, 43.186256408691406, 44.77021408081055, 46.35417175292969, 47.93812942504883, 49.52208709716797, 51.10604476928711, 52.69000244140625, 54.273963928222656, 55.85791778564453]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 9.0, 10.0, 15.0, 21.0, 20.0, 26.0, 21.0, 27.0, 35.0, 41.0, 39.0, 39.0, 53.0, 49.0, 59.0, 45.0, 42.0, 41.0, 48.0, 38.0, 48.0, 29.0, 28.0, 29.0, 24.0, 25.0, 25.0, 15.0, 18.0, 16.0, 8.0, 9.0, 5.0, 6.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-11.9296875, -11.6044921875, -11.279296875, -10.9541015625, -10.62890625, -10.3037109375, -9.978515625, -9.6533203125, -9.328125, -9.0029296875, -8.677734375, -8.3525390625, -8.02734375, -7.7021484375, -7.376953125, -7.0517578125, -6.7265625, -6.4013671875, -6.076171875, -5.7509765625, -5.42578125, -5.1005859375, -4.775390625, -4.4501953125, -4.125, -3.7998046875, -3.474609375, -3.1494140625, -2.82421875, -2.4990234375, -2.173828125, -1.8486328125, -1.5234375, -1.1982421875, -0.873046875, -0.5478515625, -0.22265625, 0.1025390625, 0.427734375, 0.7529296875, 1.078125, 1.4033203125, 1.728515625, 2.0537109375, 2.37890625, 2.7041015625, 3.029296875, 3.3544921875, 3.6796875, 4.0048828125, 4.330078125, 4.6552734375, 4.98046875, 5.3056640625, 5.630859375, 5.9560546875, 6.28125, 6.6064453125, 6.931640625, 7.2568359375, 7.58203125, 7.9072265625, 8.232421875, 8.5576171875, 8.8828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 10.0, 12.0, 16.0, 16.0, 37.0, 66.0, 114.0, 154.0, 229.0, 333.0, 504.0, 774.0, 1196.0, 1857.0, 2703.0, 4229.0, 6560.0, 10470.0, 17082.0, 28062.0, 47264.0, 80194.0, 132623.0, 191898.0, 191413.0, 130770.0, 79382.0, 47021.0, 27789.0, 16750.0, 10530.0, 6352.0, 4197.0, 2709.0, 1843.0, 1161.0, 780.0, 478.0, 328.0, 236.0, 145.0, 91.0, 67.0, 38.0, 25.0, 20.0, 14.0, 9.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9248046875, -0.8939666748046875, -0.863128662109375, -0.8322906494140625, -0.80145263671875, -0.7706146240234375, -0.739776611328125, -0.7089385986328125, -0.6781005859375, -0.6472625732421875, -0.616424560546875, -0.5855865478515625, -0.55474853515625, -0.5239105224609375, -0.493072509765625, -0.4622344970703125, -0.431396484375, -0.4005584716796875, -0.369720458984375, -0.3388824462890625, -0.30804443359375, -0.2772064208984375, -0.246368408203125, -0.2155303955078125, -0.1846923828125, -0.1538543701171875, -0.123016357421875, -0.0921783447265625, -0.06134033203125, -0.0305023193359375, 0.000335693359375, 0.0311737060546875, 0.06201171875, 0.0928497314453125, 0.123687744140625, 0.1545257568359375, 0.18536376953125, 0.2162017822265625, 0.247039794921875, 0.2778778076171875, 0.3087158203125, 0.3395538330078125, 0.370391845703125, 0.4012298583984375, 0.43206787109375, 0.4629058837890625, 0.493743896484375, 0.5245819091796875, 0.555419921875, 0.5862579345703125, 0.617095947265625, 0.6479339599609375, 0.67877197265625, 0.7096099853515625, 0.740447998046875, 0.7712860107421875, 0.8021240234375, 0.8329620361328125, 0.863800048828125, 0.8946380615234375, 0.92547607421875, 0.9563140869140625, 0.987152099609375, 1.0179901123046875, 1.048828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 10.0, 10.0, 8.0, 22.0, 15.0, 13.0, 18.0, 24.0, 27.0, 25.0, 31.0, 28.0, 28.0, 33.0, 31.0, 28.0, 38.0, 46.0, 39.0, 1068.0, 41.0, 45.0, 41.0, 46.0, 29.0, 35.0, 28.0, 20.0, 27.0, 22.0, 22.0, 15.0, 22.0, 22.0, 14.0, 9.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.19012451171875, -6.0052490234375, -5.82037353515625, -5.635498046875, -5.45062255859375, -5.2657470703125, -5.08087158203125, -4.89599609375, -4.71112060546875, -4.5262451171875, -4.34136962890625, -4.156494140625, -3.97161865234375, -3.7867431640625, -3.60186767578125, -3.4169921875, -3.23211669921875, -3.0472412109375, -2.86236572265625, -2.677490234375, -2.49261474609375, -2.3077392578125, -2.12286376953125, -1.93798828125, -1.75311279296875, -1.5682373046875, -1.38336181640625, -1.198486328125, -1.01361083984375, -0.8287353515625, -0.64385986328125, -0.458984375, -0.27410888671875, -0.0892333984375, 0.09564208984375, 0.280517578125, 0.46539306640625, 0.6502685546875, 0.83514404296875, 1.02001953125, 1.20489501953125, 1.3897705078125, 1.57464599609375, 1.759521484375, 1.94439697265625, 2.1292724609375, 2.31414794921875, 2.4990234375, 2.68389892578125, 2.8687744140625, 3.05364990234375, 3.238525390625, 3.42340087890625, 3.6082763671875, 3.79315185546875, 3.97802734375, 4.16290283203125, 4.3477783203125, 4.53265380859375, 4.717529296875, 4.90240478515625, 5.0872802734375, 5.27215576171875, 5.45703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 10.0, 19.0, 24.0, 28.0, 42.0, 56.0, 85.0, 121.0, 194.0, 291.0, 405.0, 586.0, 820.0, 1406.0, 2046.0, 3355.0, 5565.0, 9807.0, 18580.0, 45112.0, 1589129.0, 344784.0, 36058.0, 16397.0, 8761.0, 5058.0, 3015.0, 1869.0, 1229.0, 762.0, 498.0, 345.0, 230.0, 141.0, 97.0, 69.0, 42.0, 25.0, 23.0, 14.0, 8.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.96185302734375, -1.9022216796875, -1.84259033203125, -1.782958984375, -1.72332763671875, -1.6636962890625, -1.60406494140625, -1.54443359375, -1.48480224609375, -1.4251708984375, -1.36553955078125, -1.305908203125, -1.24627685546875, -1.1866455078125, -1.12701416015625, -1.0673828125, -1.00775146484375, -0.9481201171875, -0.88848876953125, -0.828857421875, -0.76922607421875, -0.7095947265625, -0.64996337890625, -0.59033203125, -0.53070068359375, -0.4710693359375, -0.41143798828125, -0.351806640625, -0.29217529296875, -0.2325439453125, -0.17291259765625, -0.11328125, -0.05364990234375, 0.0059814453125, 0.06561279296875, 0.125244140625, 0.18487548828125, 0.2445068359375, 0.30413818359375, 0.36376953125, 0.42340087890625, 0.4830322265625, 0.54266357421875, 0.602294921875, 0.66192626953125, 0.7215576171875, 0.78118896484375, 0.8408203125, 0.90045166015625, 0.9600830078125, 1.01971435546875, 1.079345703125, 1.13897705078125, 1.1986083984375, 1.25823974609375, 1.31787109375, 1.37750244140625, 1.4371337890625, 1.49676513671875, 1.556396484375, 1.61602783203125, 1.6756591796875, 1.73529052734375, 1.794921875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 7.0, 6.0, 6.0, 7.0, 13.0, 10.0, 13.0, 31.0, 27.0, 23.0, 49.0, 54.0, 41.0, 47.0, 53.0, 59.0, 64.0, 64.0, 70.0, 64.0, 60.0, 34.0, 33.0, 35.0, 31.0, 16.0, 21.0, 10.0, 9.0, 8.0, 9.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06817626953125, -0.0660247802734375, -0.063873291015625, -0.0617218017578125, -0.0595703125, -0.0574188232421875, -0.055267333984375, -0.0531158447265625, -0.05096435546875, -0.0488128662109375, -0.046661376953125, -0.0445098876953125, -0.0423583984375, -0.0402069091796875, -0.038055419921875, -0.0359039306640625, -0.03375244140625, -0.0316009521484375, -0.029449462890625, -0.0272979736328125, -0.025146484375, -0.0229949951171875, -0.020843505859375, -0.0186920166015625, -0.01654052734375, -0.0143890380859375, -0.012237548828125, -0.0100860595703125, -0.0079345703125, -0.0057830810546875, -0.003631591796875, -0.0014801025390625, 0.00067138671875, 0.0028228759765625, 0.004974365234375, 0.0071258544921875, 0.00927734375, 0.0114288330078125, 0.013580322265625, 0.0157318115234375, 0.01788330078125, 0.0200347900390625, 0.022186279296875, 0.0243377685546875, 0.0264892578125, 0.0286407470703125, 0.030792236328125, 0.0329437255859375, 0.03509521484375, 0.0372467041015625, 0.039398193359375, 0.0415496826171875, 0.043701171875, 0.0458526611328125, 0.048004150390625, 0.0501556396484375, 0.05230712890625, 0.0544586181640625, 0.056610107421875, 0.0587615966796875, 0.0609130859375, 0.0630645751953125, 0.065216064453125, 0.0673675537109375, 0.06951904296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 8.0, 13.0, 6.0, 28.0, 25.0, 32.0, 48.0, 61.0, 73.0, 152.0, 226.0, 410.0, 2041.0, 665419.0, 377457.0, 1495.0, 359.0, 203.0, 126.0, 99.0, 71.0, 43.0, 45.0, 19.0, 21.0, 12.0, 8.0, 10.0, 7.0, 6.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4931640625, -1.4464263916015625, -1.399688720703125, -1.3529510498046875, -1.30621337890625, -1.2594757080078125, -1.212738037109375, -1.1660003662109375, -1.1192626953125, -1.0725250244140625, -1.025787353515625, -0.9790496826171875, -0.93231201171875, -0.8855743408203125, -0.838836669921875, -0.7920989990234375, -0.745361328125, -0.6986236572265625, -0.651885986328125, -0.6051483154296875, -0.55841064453125, -0.5116729736328125, -0.464935302734375, -0.4181976318359375, -0.3714599609375, -0.3247222900390625, -0.277984619140625, -0.2312469482421875, -0.18450927734375, -0.1377716064453125, -0.091033935546875, -0.0442962646484375, 0.00244140625, 0.0491790771484375, 0.095916748046875, 0.1426544189453125, 0.18939208984375, 0.2361297607421875, 0.282867431640625, 0.3296051025390625, 0.3763427734375, 0.4230804443359375, 0.469818115234375, 0.5165557861328125, 0.56329345703125, 0.6100311279296875, 0.656768798828125, 0.7035064697265625, 0.750244140625, 0.7969818115234375, 0.843719482421875, 0.8904571533203125, 0.93719482421875, 0.9839324951171875, 1.030670166015625, 1.0774078369140625, 1.1241455078125, 1.1708831787109375, 1.217620849609375, 1.2643585205078125, 1.31109619140625, 1.3578338623046875, 1.404571533203125, 1.4513092041015625, 1.498046875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [5.0, 3.0, 16.0, 32.0, 111.0, 376.0, 332.0, 98.0, 28.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06401155889034271, -0.05321356654167175, -0.04241557419300079, -0.031617581844329834, -0.020819589495658875, -0.010021597146987915, 0.0007763952016830444, 0.011574387550354004, 0.022372379899024963, 0.03317037224769592, 0.04396836459636688, 0.05476635694503784, 0.0655643492937088, 0.07636234164237976, 0.08716033399105072, 0.09795832633972168, 0.10875631868839264, 0.1195543110370636, 0.13035230338573456, 0.14115029573440552, 0.15194828808307648, 0.16274628043174744, 0.1735442727804184, 0.18434226512908936, 0.19514025747776031, 0.20593824982643127, 0.21673624217510223, 0.2275342345237732, 0.23833222687244415, 0.2491302192211151, 0.25992822647094727, 0.27072620391845703, 0.2815241813659668, 0.29232215881347656, 0.3031201660633087, 0.31391817331314087, 0.32471615076065063, 0.3355141282081604, 0.34631213545799255, 0.3571101427078247, 0.3679081201553345, 0.37870609760284424, 0.3895041048526764, 0.40030211210250854, 0.4111000895500183, 0.4218980669975281, 0.43269607424736023, 0.4434940814971924, 0.45429205894470215, 0.4650900363922119, 0.47588804364204407, 0.4866860508918762, 0.497484028339386, 0.5082820057868958, 0.5190800428390503, 0.5298780202865601, 0.5406759977340698, 0.5514739751815796, 0.5622719526290894, 0.5730699896812439, 0.5838679671287537, 0.5946659445762634, 0.605463981628418, 0.6162619590759277, 0.6270599365234375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 1.0, 5.0, 3.0, 9.0, 8.0, 6.0, 17.0, 13.0, 18.0, 25.0, 29.0, 20.0, 24.0, 26.0, 33.0, 37.0, 46.0, 41.0, 37.0, 45.0, 37.0, 34.0, 40.0, 57.0, 40.0, 45.0, 45.0, 30.0, 43.0, 25.0, 28.0, 14.0, 22.0, 18.0, 13.0, 14.0, 13.0, 4.0, 3.0, 6.0, 2.0, 12.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05833578109741211, -0.0566730722784996, -0.0550103634595871, -0.05334765836596489, -0.05168494954705238, -0.05002224072813988, -0.04835953563451767, -0.046696826815605164, -0.04503411799669266, -0.04337140917778015, -0.041708700358867645, -0.04004599526524544, -0.03838328644633293, -0.036720577627420425, -0.03505787253379822, -0.03339516371488571, -0.031732454895973206, -0.0300697460770607, -0.028407039120793343, -0.026744332164525986, -0.02508162334561348, -0.023418914526700974, -0.021756207570433617, -0.02009350061416626, -0.018430791795253754, -0.016768082976341248, -0.01510537602007389, -0.01344266813248396, -0.011779960244894028, -0.010117252357304096, -0.008454544469714165, -0.006791836582124233, -0.005129128694534302, -0.0034664208069443703, -0.0018037129193544388, -0.0001410050317645073, 0.0015217028558254242, 0.0031844107434153557, 0.004847118631005287, 0.006509826518595219, 0.00817253440618515, 0.009835242293775082, 0.011497950181365013, 0.013160658068954945, 0.014823365956544876, 0.016486074775457382, 0.01814878173172474, 0.019811488687992096, 0.021474197506904602, 0.023136906325817108, 0.024799613282084465, 0.026462320238351822, 0.028125029057264328, 0.029787737876176834, 0.03145044296979904, 0.03311315178871155, 0.034775860607624054, 0.03643856942653656, 0.038101278245449066, 0.039763983339071274, 0.04142669215798378, 0.043089400976896286, 0.044752106070518494, 0.046414814889431, 0.048077523708343506]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 9.0, 10.0, 15.0, 21.0, 21.0, 25.0, 21.0, 27.0, 36.0, 40.0, 39.0, 41.0, 52.0, 48.0, 59.0, 46.0, 42.0, 40.0, 48.0, 39.0, 47.0, 29.0, 29.0, 29.0, 23.0, 25.0, 25.0, 15.0, 18.0, 17.0, 7.0, 9.0, 5.0, 6.0, 4.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-11.921875, -11.5968017578125, -11.271728515625, -10.9466552734375, -10.62158203125, -10.2965087890625, -9.971435546875, -9.6463623046875, -9.3212890625, -8.9962158203125, -8.671142578125, -8.3460693359375, -8.02099609375, -7.6959228515625, -7.370849609375, -7.0457763671875, -6.720703125, -6.3956298828125, -6.070556640625, -5.7454833984375, -5.42041015625, -5.0953369140625, -4.770263671875, -4.4451904296875, -4.1201171875, -3.7950439453125, -3.469970703125, -3.1448974609375, -2.81982421875, -2.4947509765625, -2.169677734375, -1.8446044921875, -1.51953125, -1.1944580078125, -0.869384765625, -0.5443115234375, -0.21923828125, 0.1058349609375, 0.430908203125, 0.7559814453125, 1.0810546875, 1.4061279296875, 1.731201171875, 2.0562744140625, 2.38134765625, 2.7064208984375, 3.031494140625, 3.3565673828125, 3.681640625, 4.0067138671875, 4.331787109375, 4.6568603515625, 4.98193359375, 5.3070068359375, 5.632080078125, 5.9571533203125, 6.2822265625, 6.6072998046875, 6.932373046875, 7.2574462890625, 7.58251953125, 7.9075927734375, 8.232666015625, 8.5577392578125, 8.8828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 11.0, 8.0, 13.0, 16.0, 23.0, 45.0, 50.0, 94.0, 115.0, 147.0, 243.0, 400.0, 640.0, 1033.0, 1592.0, 2985.0, 5674.0, 11144.0, 23218.0, 52749.0, 133434.0, 317927.0, 289999.0, 117057.0, 46772.0, 20840.0, 10298.0, 5259.0, 2664.0, 1528.0, 877.0, 564.0, 350.0, 260.0, 155.0, 123.0, 73.0, 60.0, 29.0, 20.0, 15.0, 13.0, 6.0, 4.0, 10.0, 6.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.651123046875, -14.16162109375, -13.672119140625, -13.1826171875, -12.693115234375, -12.20361328125, -11.714111328125, -11.224609375, -10.735107421875, -10.24560546875, -9.756103515625, -9.2666015625, -8.777099609375, -8.28759765625, -7.798095703125, -7.30859375, -6.819091796875, -6.32958984375, -5.840087890625, -5.3505859375, -4.861083984375, -4.37158203125, -3.882080078125, -3.392578125, -2.903076171875, -2.41357421875, -1.924072265625, -1.4345703125, -0.945068359375, -0.45556640625, 0.033935546875, 0.5234375, 1.012939453125, 1.50244140625, 1.991943359375, 2.4814453125, 2.970947265625, 3.46044921875, 3.949951171875, 4.439453125, 4.928955078125, 5.41845703125, 5.907958984375, 6.3974609375, 6.886962890625, 7.37646484375, 7.865966796875, 8.35546875, 8.844970703125, 9.33447265625, 9.823974609375, 10.3134765625, 10.802978515625, 11.29248046875, 11.781982421875, 12.271484375, 12.760986328125, 13.25048828125, 13.739990234375, 14.2294921875, 14.718994140625, 15.20849609375, 15.697998046875, 16.1875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 10.0, 13.0, 13.0, 10.0, 15.0, 24.0, 22.0, 39.0, 25.0, 35.0, 29.0, 48.0, 62.0, 69.0, 105.0, 189.0, 284.0, 1313.0, 193.0, 115.0, 72.0, 61.0, 46.0, 42.0, 39.0, 28.0, 23.0, 15.0, 17.0, 18.0, 10.0, 9.0, 12.0, 9.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.921875, -22.16064453125, -21.3994140625, -20.63818359375, -19.876953125, -19.11572265625, -18.3544921875, -17.59326171875, -16.83203125, -16.07080078125, -15.3095703125, -14.54833984375, -13.787109375, -13.02587890625, -12.2646484375, -11.50341796875, -10.7421875, -9.98095703125, -9.2197265625, -8.45849609375, -7.697265625, -6.93603515625, -6.1748046875, -5.41357421875, -4.65234375, -3.89111328125, -3.1298828125, -2.36865234375, -1.607421875, -0.84619140625, -0.0849609375, 0.67626953125, 1.4375, 2.19873046875, 2.9599609375, 3.72119140625, 4.482421875, 5.24365234375, 6.0048828125, 6.76611328125, 7.52734375, 8.28857421875, 9.0498046875, 9.81103515625, 10.572265625, 11.33349609375, 12.0947265625, 12.85595703125, 13.6171875, 14.37841796875, 15.1396484375, 15.90087890625, 16.662109375, 17.42333984375, 18.1845703125, 18.94580078125, 19.70703125, 20.46826171875, 21.2294921875, 21.99072265625, 22.751953125, 23.51318359375, 24.2744140625, 25.03564453125, 25.796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 2.0, 8.0, 8.0, 13.0, 13.0, 21.0, 40.0, 46.0, 74.0, 96.0, 139.0, 220.0, 430.0, 945.0, 2673.0, 10512.0, 64748.0, 1483710.0, 1501248.0, 65340.0, 10610.0, 2635.0, 959.0, 442.0, 251.0, 166.0, 93.0, 84.0, 46.0, 32.0, 32.0, 19.0, 20.0, 8.0, 5.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.28125, -38.1259765625, -36.970703125, -35.8154296875, -34.66015625, -33.5048828125, -32.349609375, -31.1943359375, -30.0390625, -28.8837890625, -27.728515625, -26.5732421875, -25.41796875, -24.2626953125, -23.107421875, -21.9521484375, -20.796875, -19.6416015625, -18.486328125, -17.3310546875, -16.17578125, -15.0205078125, -13.865234375, -12.7099609375, -11.5546875, -10.3994140625, -9.244140625, -8.0888671875, -6.93359375, -5.7783203125, -4.623046875, -3.4677734375, -2.3125, -1.1572265625, -0.001953125, 1.1533203125, 2.30859375, 3.4638671875, 4.619140625, 5.7744140625, 6.9296875, 8.0849609375, 9.240234375, 10.3955078125, 11.55078125, 12.7060546875, 13.861328125, 15.0166015625, 16.171875, 17.3271484375, 18.482421875, 19.6376953125, 20.79296875, 21.9482421875, 23.103515625, 24.2587890625, 25.4140625, 26.5693359375, 27.724609375, 28.8798828125, 30.03515625, 31.1904296875, 32.345703125, 33.5009765625, 34.65625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 22.0, 233.0, 596.0, 146.0, 18.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.10861206054688, -126.11270141601562, -115.11678314208984, -104.12086486816406, -93.12495422363281, -82.12904357910156, -71.13312530517578, -60.13720703125, -49.14129638671875, -38.145381927490234, -27.14946746826172, -16.153553009033203, -5.1576385498046875, 5.838275909423828, 16.834190368652344, 27.830108642578125, 38.826019287109375, 49.82193374633789, 60.817848205566406, 71.81376647949219, 82.80967712402344, 93.80558776855469, 104.80150604248047, 115.79742431640625, 126.7933349609375, 137.78924560546875, 148.78515625, 159.7810821533203, 170.77699279785156, 181.7729034423828, 192.76882934570312, 203.76473999023438, 214.7606201171875, 225.75653076171875, 236.75244140625, 247.7483673095703, 258.7442626953125, 269.7402038574219, 280.7361145019531, 291.7320251464844, 302.7279357910156, 313.7238464355469, 324.7197570800781, 335.7156677246094, 346.71160888671875, 357.70751953125, 368.70343017578125, 379.6993408203125, 390.69525146484375, 401.691162109375, 412.68707275390625, 423.6829833984375, 434.67889404296875, 445.6748352050781, 456.6707458496094, 467.6666564941406, 478.6625671386719, 489.6584777832031, 500.6543884277344, 511.6502990722656, 522.646240234375, 533.6421508789062, 544.6380615234375, 555.6339721679688, 566.6298828125]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 4.0, 6.0, 7.0, 13.0, 13.0, 14.0, 15.0, 18.0, 22.0, 18.0, 23.0, 22.0, 29.0, 44.0, 35.0, 24.0, 32.0, 32.0, 32.0, 54.0, 36.0, 48.0, 41.0, 37.0, 54.0, 32.0, 54.0, 30.0, 28.0, 24.0, 29.0, 12.0, 21.0, 13.0, 13.0, 14.0, 10.0, 8.0, 4.0, 5.0, 12.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-60.26881408691406, -58.4549674987793, -56.641117095947266, -54.8272705078125, -53.013423919677734, -51.19957733154297, -49.38572692871094, -47.57188034057617, -45.758033752441406, -43.94418716430664, -42.13033676147461, -40.316490173339844, -38.50264358520508, -36.68879699707031, -34.87494659423828, -33.061100006103516, -31.247249603271484, -29.433401107788086, -27.61955451965332, -25.805706024169922, -23.991859436035156, -22.178010940551758, -20.36416244506836, -18.550315856933594, -16.736467361450195, -14.922619819641113, -13.108772277832031, -11.294923782348633, -9.48107624053955, -7.667228698730469, -5.85338020324707, -4.039532661437988, -2.225688934326172, -0.41184115409851074, 1.4020066261291504, 3.2158546447753906, 5.029702186584473, 6.843549728393555, 8.657398223876953, 10.471245765686035, 12.285093307495117, 14.0989408493042, 15.912788391113281, 17.72663688659668, 19.540485382080078, 21.354331970214844, 23.168180465698242, 24.98202896118164, 26.795875549316406, 28.609724044799805, 30.42357063293457, 32.23741912841797, 34.051265716552734, 35.8651123046875, 37.67896270751953, 39.4928092956543, 41.30665588378906, 43.12050247192383, 44.93435287475586, 46.748199462890625, 48.56204605102539, 50.375892639160156, 52.18974304199219, 54.00358963012695, 55.817440032958984]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 7.0, 8.0, 17.0, 16.0, 25.0, 19.0, 30.0, 35.0, 32.0, 38.0, 49.0, 48.0, 53.0, 42.0, 44.0, 54.0, 46.0, 42.0, 46.0, 42.0, 39.0, 40.0, 35.0, 26.0, 31.0, 23.0, 16.0, 18.0, 13.0, 7.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.773681640625, -10.43017578125, -10.086669921875, -9.7431640625, -9.399658203125, -9.05615234375, -8.712646484375, -8.369140625, -8.025634765625, -7.68212890625, -7.338623046875, -6.9951171875, -6.651611328125, -6.30810546875, -5.964599609375, -5.62109375, -5.277587890625, -4.93408203125, -4.590576171875, -4.2470703125, -3.903564453125, -3.56005859375, -3.216552734375, -2.873046875, -2.529541015625, -2.18603515625, -1.842529296875, -1.4990234375, -1.155517578125, -0.81201171875, -0.468505859375, -0.125, 0.218505859375, 0.56201171875, 0.905517578125, 1.2490234375, 1.592529296875, 1.93603515625, 2.279541015625, 2.623046875, 2.966552734375, 3.31005859375, 3.653564453125, 3.9970703125, 4.340576171875, 4.68408203125, 5.027587890625, 5.37109375, 5.714599609375, 6.05810546875, 6.401611328125, 6.7451171875, 7.088623046875, 7.43212890625, 7.775634765625, 8.119140625, 8.462646484375, 8.80615234375, 9.149658203125, 9.4931640625, 9.836669921875, 10.18017578125, 10.523681640625, 10.8671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 12.0, 4.0, 5.0, 15.0, 23.0, 16.0, 22.0, 26.0, 36.0, 42.0, 66.0, 79.0, 95.0, 148.0, 200.0, 301.0, 587.0, 2046.0, 57775.0, 4112185.0, 17608.0, 1461.0, 499.0, 258.0, 191.0, 134.0, 95.0, 63.0, 61.0, 35.0, 43.0, 27.0, 13.0, 17.0, 19.0, 13.0, 9.0, 9.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-97.3125, -94.3076171875, -91.302734375, -88.2978515625, -85.29296875, -82.2880859375, -79.283203125, -76.2783203125, -73.2734375, -70.2685546875, -67.263671875, -64.2587890625, -61.25390625, -58.2490234375, -55.244140625, -52.2392578125, -49.234375, -46.2294921875, -43.224609375, -40.2197265625, -37.21484375, -34.2099609375, -31.205078125, -28.2001953125, -25.1953125, -22.1904296875, -19.185546875, -16.1806640625, -13.17578125, -10.1708984375, -7.166015625, -4.1611328125, -1.15625, 1.8486328125, 4.853515625, 7.8583984375, 10.86328125, 13.8681640625, 16.873046875, 19.8779296875, 22.8828125, 25.8876953125, 28.892578125, 31.8974609375, 34.90234375, 37.9072265625, 40.912109375, 43.9169921875, 46.921875, 49.9267578125, 52.931640625, 55.9365234375, 58.94140625, 61.9462890625, 64.951171875, 67.9560546875, 70.9609375, 73.9658203125, 76.970703125, 79.9755859375, 82.98046875, 85.9853515625, 88.990234375, 91.9951171875, 95.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 4.0, 16.0, 15.0, 26.0, 27.0, 52.0, 43.0, 80.0, 109.0, 174.0, 231.0, 403.0, 548.0, 676.0, 514.0, 310.0, 238.0, 142.0, 99.0, 75.0, 62.0, 47.0, 39.0, 22.0, 27.0, 19.0, 14.0, 9.0, 4.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.90625, -14.45947265625, -14.0126953125, -13.56591796875, -13.119140625, -12.67236328125, -12.2255859375, -11.77880859375, -11.33203125, -10.88525390625, -10.4384765625, -9.99169921875, -9.544921875, -9.09814453125, -8.6513671875, -8.20458984375, -7.7578125, -7.31103515625, -6.8642578125, -6.41748046875, -5.970703125, -5.52392578125, -5.0771484375, -4.63037109375, -4.18359375, -3.73681640625, -3.2900390625, -2.84326171875, -2.396484375, -1.94970703125, -1.5029296875, -1.05615234375, -0.609375, -0.16259765625, 0.2841796875, 0.73095703125, 1.177734375, 1.62451171875, 2.0712890625, 2.51806640625, 2.96484375, 3.41162109375, 3.8583984375, 4.30517578125, 4.751953125, 5.19873046875, 5.6455078125, 6.09228515625, 6.5390625, 6.98583984375, 7.4326171875, 7.87939453125, 8.326171875, 8.77294921875, 9.2197265625, 9.66650390625, 10.11328125, 10.56005859375, 11.0068359375, 11.45361328125, 11.900390625, 12.34716796875, 12.7939453125, 13.24072265625, 13.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 2.0, 5.0, 2.0, 7.0, 5.0, 9.0, 13.0, 13.0, 21.0, 30.0, 25.0, 54.0, 74.0, 187.0, 458.0, 1421.0, 5512.0, 33237.0, 876188.0, 3197448.0, 67577.0, 8812.0, 2047.0, 594.0, 213.0, 117.0, 70.0, 34.0, 28.0, 19.0, 11.0, 11.0, 11.0, 10.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.15625, -43.60693359375, -42.0576171875, -40.50830078125, -38.958984375, -37.40966796875, -35.8603515625, -34.31103515625, -32.76171875, -31.21240234375, -29.6630859375, -28.11376953125, -26.564453125, -25.01513671875, -23.4658203125, -21.91650390625, -20.3671875, -18.81787109375, -17.2685546875, -15.71923828125, -14.169921875, -12.62060546875, -11.0712890625, -9.52197265625, -7.97265625, -6.42333984375, -4.8740234375, -3.32470703125, -1.775390625, -0.22607421875, 1.3232421875, 2.87255859375, 4.421875, 5.97119140625, 7.5205078125, 9.06982421875, 10.619140625, 12.16845703125, 13.7177734375, 15.26708984375, 16.81640625, 18.36572265625, 19.9150390625, 21.46435546875, 23.013671875, 24.56298828125, 26.1123046875, 27.66162109375, 29.2109375, 30.76025390625, 32.3095703125, 33.85888671875, 35.408203125, 36.95751953125, 38.5068359375, 40.05615234375, 41.60546875, 43.15478515625, 44.7041015625, 46.25341796875, 47.802734375, 49.35205078125, 50.9013671875, 52.45068359375, 54.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 137.0, 641.0, 215.0, 14.0, 0.0, 1.0, 1.0], "bins": [-721.2644653320312, -708.9523315429688, -696.6401977539062, -684.3280029296875, -672.015869140625, -659.7037353515625, -647.3916015625, -635.0794677734375, -622.767333984375, -610.4552001953125, -598.14306640625, -585.8309326171875, -573.5187377929688, -561.2066040039062, -548.8944702148438, -536.5823364257812, -524.2701416015625, -511.9580078125, -499.6458435058594, -487.3337097167969, -475.0215759277344, -462.70941162109375, -450.39727783203125, -438.08514404296875, -425.77301025390625, -413.46087646484375, -401.1487121582031, -388.8365783691406, -376.5244445800781, -364.2122802734375, -351.900146484375, -339.5880126953125, -327.2758483886719, -314.9637145996094, -302.65155029296875, -290.33941650390625, -278.02728271484375, -265.71514892578125, -253.40298461914062, -241.09085083007812, -228.77871704101562, -216.46656799316406, -204.15443420410156, -191.84228515625, -179.5301513671875, -167.21800231933594, -154.90585327148438, -142.59371948242188, -130.28155517578125, -117.96941375732422, -105.65727233886719, -93.34512329101562, -81.0329818725586, -68.72084045410156, -56.40869140625, -44.09654998779297, -31.78441619873047, -19.472272872924805, -7.160129547119141, 5.152015686035156, 17.464157104492188, 29.77629852294922, 42.08844757080078, 54.40058898925781, 66.71273040771484]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 0.0, 7.0, 3.0, 8.0, 9.0, 14.0, 19.0, 24.0, 22.0, 28.0, 30.0, 30.0, 35.0, 41.0, 54.0, 39.0, 42.0, 38.0, 50.0, 53.0, 44.0, 45.0, 44.0, 35.0, 36.0, 31.0, 29.0, 31.0, 26.0, 19.0, 21.0, 14.0, 19.0, 13.0, 13.0, 6.0, 7.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-58.151607513427734, -56.59189224243164, -55.03217697143555, -53.47246170043945, -51.91274642944336, -50.353031158447266, -48.79331970214844, -47.233604431152344, -45.67388916015625, -44.114173889160156, -42.55445861816406, -40.99474334716797, -39.435028076171875, -37.87531280517578, -36.31559753417969, -34.755882263183594, -33.1961669921875, -31.636451721191406, -30.076736450195312, -28.51702117919922, -26.957305908203125, -25.39759063720703, -23.83787727355957, -22.278162002563477, -20.718446731567383, -19.15873146057129, -17.599016189575195, -16.039302825927734, -14.479586601257324, -12.91987133026123, -11.360157012939453, -9.80044174194336, -8.24072265625, -6.681007385253906, -5.121292591094971, -3.561577796936035, -2.0018625259399414, -0.44214725494384766, 1.1175670623779297, 2.6772823333740234, 4.236997604370117, 5.796712875366211, 7.3564276695251465, 8.916142463684082, 10.475857734680176, 12.03557300567627, 13.595287322998047, 15.15500259399414, 16.714717864990234, 18.274433135986328, 19.834148406982422, 21.393863677978516, 22.95357894897461, 24.513294219970703, 26.073007583618164, 27.632722854614258, 29.19243812561035, 30.752153396606445, 32.311866760253906, 33.87158203125, 35.431297302246094, 36.99101257324219, 38.55072784423828, 40.110443115234375, 41.67015838623047]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 2.0, 7.0, 7.0, 7.0, 18.0, 20.0, 20.0, 32.0, 29.0, 23.0, 37.0, 42.0, 48.0, 47.0, 39.0, 42.0, 50.0, 46.0, 62.0, 49.0, 42.0, 45.0, 38.0, 27.0, 27.0, 38.0, 22.0, 28.0, 18.0, 18.0, 13.0, 12.0, 9.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.519775390625, -8.18798828125, -7.856201171875, -7.5244140625, -7.192626953125, -6.86083984375, -6.529052734375, -6.197265625, -5.865478515625, -5.53369140625, -5.201904296875, -4.8701171875, -4.538330078125, -4.20654296875, -3.874755859375, -3.54296875, -3.211181640625, -2.87939453125, -2.547607421875, -2.2158203125, -1.884033203125, -1.55224609375, -1.220458984375, -0.888671875, -0.556884765625, -0.22509765625, 0.106689453125, 0.4384765625, 0.770263671875, 1.10205078125, 1.433837890625, 1.765625, 2.097412109375, 2.42919921875, 2.760986328125, 3.0927734375, 3.424560546875, 3.75634765625, 4.088134765625, 4.419921875, 4.751708984375, 5.08349609375, 5.415283203125, 5.7470703125, 6.078857421875, 6.41064453125, 6.742431640625, 7.07421875, 7.406005859375, 7.73779296875, 8.069580078125, 8.4013671875, 8.733154296875, 9.06494140625, 9.396728515625, 9.728515625, 10.060302734375, 10.39208984375, 10.723876953125, 11.0556640625, 11.387451171875, 11.71923828125, 12.051025390625, 12.3828125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 16.0, 14.0, 20.0, 46.0, 57.0, 85.0, 137.0, 209.0, 320.0, 528.0, 793.0, 1242.0, 2105.0, 3499.0, 5961.0, 10195.0, 17985.0, 32204.0, 58677.0, 106391.0, 180530.0, 228876.0, 171587.0, 100933.0, 54834.0, 30398.0, 16995.0, 9520.0, 5725.0, 3271.0, 1989.0, 1285.0, 788.0, 478.0, 290.0, 190.0, 139.0, 90.0, 45.0, 38.0, 23.0, 16.0, 11.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2177734375, -1.181365966796875, -1.14495849609375, -1.108551025390625, -1.0721435546875, -1.035736083984375, -0.99932861328125, -0.962921142578125, -0.926513671875, -0.890106201171875, -0.85369873046875, -0.817291259765625, -0.7808837890625, -0.744476318359375, -0.70806884765625, -0.671661376953125, -0.63525390625, -0.598846435546875, -0.56243896484375, -0.526031494140625, -0.4896240234375, -0.453216552734375, -0.41680908203125, -0.380401611328125, -0.343994140625, -0.307586669921875, -0.27117919921875, -0.234771728515625, -0.1983642578125, -0.161956787109375, -0.12554931640625, -0.089141845703125, -0.052734375, -0.016326904296875, 0.02008056640625, 0.056488037109375, 0.0928955078125, 0.129302978515625, 0.16571044921875, 0.202117919921875, 0.238525390625, 0.274932861328125, 0.31134033203125, 0.347747802734375, 0.3841552734375, 0.420562744140625, 0.45697021484375, 0.493377685546875, 0.52978515625, 0.566192626953125, 0.60260009765625, 0.639007568359375, 0.6754150390625, 0.711822509765625, 0.74822998046875, 0.784637451171875, 0.821044921875, 0.857452392578125, 0.89385986328125, 0.930267333984375, 0.9666748046875, 1.003082275390625, 1.03948974609375, 1.075897216796875, 1.1123046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 3.0, 8.0, 11.0, 12.0, 11.0, 10.0, 15.0, 18.0, 21.0, 26.0, 21.0, 26.0, 18.0, 29.0, 29.0, 27.0, 32.0, 29.0, 38.0, 48.0, 30.0, 1064.0, 44.0, 44.0, 25.0, 38.0, 37.0, 29.0, 31.0, 25.0, 32.0, 30.0, 26.0, 23.0, 10.0, 19.0, 16.0, 20.0, 8.0, 8.0, 6.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.290283203125, -5.10400390625, -4.917724609375, -4.7314453125, -4.545166015625, -4.35888671875, -4.172607421875, -3.986328125, -3.800048828125, -3.61376953125, -3.427490234375, -3.2412109375, -3.054931640625, -2.86865234375, -2.682373046875, -2.49609375, -2.309814453125, -2.12353515625, -1.937255859375, -1.7509765625, -1.564697265625, -1.37841796875, -1.192138671875, -1.005859375, -0.819580078125, -0.63330078125, -0.447021484375, -0.2607421875, -0.074462890625, 0.11181640625, 0.298095703125, 0.484375, 0.670654296875, 0.85693359375, 1.043212890625, 1.2294921875, 1.415771484375, 1.60205078125, 1.788330078125, 1.974609375, 2.160888671875, 2.34716796875, 2.533447265625, 2.7197265625, 2.906005859375, 3.09228515625, 3.278564453125, 3.46484375, 3.651123046875, 3.83740234375, 4.023681640625, 4.2099609375, 4.396240234375, 4.58251953125, 4.768798828125, 4.955078125, 5.141357421875, 5.32763671875, 5.513916015625, 5.7001953125, 5.886474609375, 6.07275390625, 6.259033203125, 6.4453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 5.0, 19.0, 16.0, 29.0, 43.0, 76.0, 102.0, 125.0, 238.0, 299.0, 457.0, 698.0, 1133.0, 1769.0, 2729.0, 4653.0, 7836.0, 14381.0, 29484.0, 157743.0, 1768862.0, 57849.0, 21188.0, 11065.0, 6159.0, 3735.0, 2226.0, 1425.0, 949.0, 624.0, 391.0, 261.0, 177.0, 108.0, 82.0, 56.0, 48.0, 23.0, 12.0, 14.0, 7.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7908172607421875, -1.725189208984375, -1.6595611572265625, -1.59393310546875, -1.5283050537109375, -1.462677001953125, -1.3970489501953125, -1.3314208984375, -1.2657928466796875, -1.200164794921875, -1.1345367431640625, -1.06890869140625, -1.0032806396484375, -0.937652587890625, -0.8720245361328125, -0.806396484375, -0.7407684326171875, -0.675140380859375, -0.6095123291015625, -0.54388427734375, -0.4782562255859375, -0.412628173828125, -0.3470001220703125, -0.2813720703125, -0.2157440185546875, -0.150115966796875, -0.0844879150390625, -0.01885986328125, 0.0467681884765625, 0.112396240234375, 0.1780242919921875, 0.24365234375, 0.3092803955078125, 0.374908447265625, 0.4405364990234375, 0.50616455078125, 0.5717926025390625, 0.637420654296875, 0.7030487060546875, 0.7686767578125, 0.8343048095703125, 0.899932861328125, 0.9655609130859375, 1.03118896484375, 1.0968170166015625, 1.162445068359375, 1.2280731201171875, 1.293701171875, 1.3593292236328125, 1.424957275390625, 1.4905853271484375, 1.55621337890625, 1.6218414306640625, 1.687469482421875, 1.7530975341796875, 1.8187255859375, 1.8843536376953125, 1.949981689453125, 2.0156097412109375, 2.08123779296875, 2.1468658447265625, 2.212493896484375, 2.2781219482421875, 2.34375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 11.0, 18.0, 15.0, 17.0, 21.0, 23.0, 21.0, 27.0, 39.0, 34.0, 51.0, 32.0, 51.0, 40.0, 44.0, 45.0, 59.0, 43.0, 51.0, 35.0, 42.0, 40.0, 30.0, 26.0, 20.0, 24.0, 18.0, 16.0, 10.0, 7.0, 15.0, 6.0, 11.0, 3.0, 11.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051971435546875, -0.05025339126586914, -0.04853534698486328, -0.04681730270385742, -0.04509925842285156, -0.0433812141418457, -0.041663169860839844, -0.039945125579833984, -0.038227081298828125, -0.036509037017822266, -0.034790992736816406, -0.03307294845581055, -0.03135490417480469, -0.029636859893798828, -0.02791881561279297, -0.02620077133178711, -0.02448272705078125, -0.02276468276977539, -0.02104663848876953, -0.019328594207763672, -0.017610549926757812, -0.015892505645751953, -0.014174461364746094, -0.012456417083740234, -0.010738372802734375, -0.009020328521728516, -0.007302284240722656, -0.005584239959716797, -0.0038661956787109375, -0.002148151397705078, -0.00043010711669921875, 0.0012879371643066406, 0.0030059814453125, 0.004724025726318359, 0.006442070007324219, 0.008160114288330078, 0.009878158569335938, 0.011596202850341797, 0.013314247131347656, 0.015032291412353516, 0.016750335693359375, 0.018468379974365234, 0.020186424255371094, 0.021904468536376953, 0.023622512817382812, 0.025340557098388672, 0.02705860137939453, 0.02877664566040039, 0.03049468994140625, 0.03221273422241211, 0.03393077850341797, 0.03564882278442383, 0.03736686706542969, 0.03908491134643555, 0.040802955627441406, 0.042520999908447266, 0.044239044189453125, 0.045957088470458984, 0.047675132751464844, 0.0493931770324707, 0.05111122131347656, 0.05282926559448242, 0.05454730987548828, 0.05626535415649414, 0.0579833984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 14.0, 12.0, 12.0, 11.0, 21.0, 16.0, 32.0, 36.0, 44.0, 49.0, 52.0, 114.0, 122.0, 188.0, 276.0, 610.0, 3367.0, 160333.0, 864603.0, 16258.0, 1154.0, 390.0, 209.0, 140.0, 101.0, 82.0, 55.0, 50.0, 41.0, 32.0, 24.0, 18.0, 16.0, 19.0, 9.0, 9.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.1630859375, -1.129119873046875, -1.09515380859375, -1.061187744140625, -1.0272216796875, -0.993255615234375, -0.95928955078125, -0.925323486328125, -0.891357421875, -0.857391357421875, -0.82342529296875, -0.789459228515625, -0.7554931640625, -0.721527099609375, -0.68756103515625, -0.653594970703125, -0.61962890625, -0.585662841796875, -0.55169677734375, -0.517730712890625, -0.4837646484375, -0.449798583984375, -0.41583251953125, -0.381866455078125, -0.347900390625, -0.313934326171875, -0.27996826171875, -0.246002197265625, -0.2120361328125, -0.178070068359375, -0.14410400390625, -0.110137939453125, -0.076171875, -0.042205810546875, -0.00823974609375, 0.025726318359375, 0.0596923828125, 0.093658447265625, 0.12762451171875, 0.161590576171875, 0.195556640625, 0.229522705078125, 0.26348876953125, 0.297454833984375, 0.3314208984375, 0.365386962890625, 0.39935302734375, 0.433319091796875, 0.46728515625, 0.501251220703125, 0.53521728515625, 0.569183349609375, 0.6031494140625, 0.637115478515625, 0.67108154296875, 0.705047607421875, 0.739013671875, 0.772979736328125, 0.80694580078125, 0.840911865234375, 0.8748779296875, 0.908843994140625, 0.94281005859375, 0.976776123046875, 1.0107421875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 25.0, 162.0, 500.0, 261.0, 48.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7792996168136597, -0.7642106413841248, -0.7491216659545898, -0.7340327501296997, -0.7189437747001648, -0.7038547992706299, -0.688765823841095, -0.6736768484115601, -0.6585879325866699, -0.643498957157135, -0.6284099817276001, -0.61332106590271, -0.598232090473175, -0.5831431150436401, -0.5680541396141052, -0.5529651641845703, -0.5378761887550354, -0.5227872133255005, -0.5076982378959656, -0.49260929226875305, -0.4775203466415405, -0.4624313712120056, -0.4473423957824707, -0.4322534501552582, -0.41716450452804565, -0.40207552909851074, -0.3869865834712982, -0.3718976080417633, -0.3568086624145508, -0.34171968698501587, -0.32663071155548096, -0.31154176592826843, -0.29645276069641113, -0.2813637852668762, -0.2662748396396637, -0.2511858642101288, -0.23609690368175507, -0.22100794315338135, -0.20591898262500763, -0.1908300220966339, -0.1757410764694214, -0.16065211594104767, -0.14556315541267395, -0.13047417998313904, -0.11538521945476532, -0.1002962589263916, -0.08520729839801788, -0.07011833041906357, -0.05502936244010925, -0.039940398186445236, -0.02485143579542637, -0.009762473404407501, 0.0053264908492565155, 0.020415455102920532, 0.03550441563129425, 0.050593383610248566, 0.06568234413862228, 0.080771304666996, 0.09586027264595032, 0.11094923317432404, 0.12603819370269775, 0.14112716913223267, 0.1562161147594452, 0.1713050901889801, 0.18639405071735382]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 9.0, 7.0, 6.0, 17.0, 17.0, 26.0, 24.0, 21.0, 23.0, 27.0, 21.0, 34.0, 21.0, 27.0, 39.0, 37.0, 45.0, 41.0, 47.0, 59.0, 49.0, 41.0, 45.0, 38.0, 27.0, 27.0, 42.0, 25.0, 24.0, 14.0, 17.0, 23.0, 9.0, 8.0, 10.0, 12.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.06028711795806885, -0.05865182727575302, -0.057016536593437195, -0.05538124218583107, -0.053745951503515244, -0.05211066082119942, -0.05047536641359329, -0.048840075731277466, -0.04720478504896164, -0.04556949436664581, -0.04393420368432999, -0.04229890927672386, -0.040663618594408035, -0.03902832791209221, -0.037393033504486084, -0.03575774282217026, -0.03412245213985443, -0.032487161457538605, -0.03085186891257763, -0.029216576367616653, -0.027581285685300827, -0.025945995002985, -0.024310702458024025, -0.02267540991306305, -0.021040119230747223, -0.019404828548431396, -0.01776953600347042, -0.016134243458509445, -0.014498952776193619, -0.012863661162555218, -0.011228369548916817, -0.009593077935278416, -0.007957786321640015, -0.006322494708001614, -0.004687203094363213, -0.0030519114807248116, -0.0014166198670864105, 0.0002186717465519905, 0.0018539633601903915, 0.0034892549738287926, 0.005124546587467194, 0.006759838201105595, 0.008395129814743996, 0.010030421428382397, 0.011665713042020798, 0.013301004655659199, 0.0149362962692976, 0.016571588814258575, 0.018206879496574402, 0.01984217017889023, 0.021477462723851204, 0.02311275526881218, 0.024748045951128006, 0.026383336633443832, 0.028018629178404808, 0.029653921723365784, 0.03128921240568161, 0.032924503087997437, 0.03455979377031326, 0.03619508817791939, 0.037830378860235214, 0.03946566954255104, 0.041100963950157166, 0.04273625463247299, 0.04437154531478882]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 7.0, 17.0, 21.0, 21.0, 31.0, 29.0, 23.0, 36.0, 43.0, 49.0, 46.0, 39.0, 42.0, 50.0, 46.0, 63.0, 48.0, 42.0, 45.0, 38.0, 27.0, 27.0, 38.0, 23.0, 25.0, 20.0, 18.0, 13.0, 12.0, 9.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.519775390625, -8.18798828125, -7.856201171875, -7.5244140625, -7.192626953125, -6.86083984375, -6.529052734375, -6.197265625, -5.865478515625, -5.53369140625, -5.201904296875, -4.8701171875, -4.538330078125, -4.20654296875, -3.874755859375, -3.54296875, -3.211181640625, -2.87939453125, -2.547607421875, -2.2158203125, -1.884033203125, -1.55224609375, -1.220458984375, -0.888671875, -0.556884765625, -0.22509765625, 0.106689453125, 0.4384765625, 0.770263671875, 1.10205078125, 1.433837890625, 1.765625, 2.097412109375, 2.42919921875, 2.760986328125, 3.0927734375, 3.424560546875, 3.75634765625, 4.088134765625, 4.419921875, 4.751708984375, 5.08349609375, 5.415283203125, 5.7470703125, 6.078857421875, 6.41064453125, 6.742431640625, 7.07421875, 7.406005859375, 7.73779296875, 8.069580078125, 8.4013671875, 8.733154296875, 9.06494140625, 9.396728515625, 9.728515625, 10.060302734375, 10.39208984375, 10.723876953125, 11.0556640625, 11.387451171875, 11.71923828125, 12.051025390625, 12.3828125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 8.0, 13.0, 18.0, 21.0, 34.0, 39.0, 63.0, 91.0, 144.0, 201.0, 315.0, 497.0, 907.0, 1807.0, 3517.0, 8582.0, 24196.0, 78051.0, 284385.0, 442549.0, 138247.0, 40543.0, 13613.0, 5325.0, 2392.0, 1198.0, 647.0, 402.0, 221.0, 168.0, 86.0, 73.0, 61.0, 43.0, 17.0, 16.0, 16.0, 11.0, 5.0, 4.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.99658203125, -16.4150390625, -15.83349609375, -15.251953125, -14.67041015625, -14.0888671875, -13.50732421875, -12.92578125, -12.34423828125, -11.7626953125, -11.18115234375, -10.599609375, -10.01806640625, -9.4365234375, -8.85498046875, -8.2734375, -7.69189453125, -7.1103515625, -6.52880859375, -5.947265625, -5.36572265625, -4.7841796875, -4.20263671875, -3.62109375, -3.03955078125, -2.4580078125, -1.87646484375, -1.294921875, -0.71337890625, -0.1318359375, 0.44970703125, 1.03125, 1.61279296875, 2.1943359375, 2.77587890625, 3.357421875, 3.93896484375, 4.5205078125, 5.10205078125, 5.68359375, 6.26513671875, 6.8466796875, 7.42822265625, 8.009765625, 8.59130859375, 9.1728515625, 9.75439453125, 10.3359375, 10.91748046875, 11.4990234375, 12.08056640625, 12.662109375, 13.24365234375, 13.8251953125, 14.40673828125, 14.98828125, 15.56982421875, 16.1513671875, 16.73291015625, 17.314453125, 17.89599609375, 18.4775390625, 19.05908203125, 19.640625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 11.0, 13.0, 9.0, 14.0, 17.0, 20.0, 25.0, 34.0, 34.0, 29.0, 51.0, 50.0, 66.0, 127.0, 218.0, 1390.0, 293.0, 161.0, 80.0, 64.0, 37.0, 47.0, 43.0, 31.0, 22.0, 23.0, 32.0, 16.0, 17.0, 10.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.65625, -22.911865234375, -22.16748046875, -21.423095703125, -20.6787109375, -19.934326171875, -19.18994140625, -18.445556640625, -17.701171875, -16.956787109375, -16.21240234375, -15.468017578125, -14.7236328125, -13.979248046875, -13.23486328125, -12.490478515625, -11.74609375, -11.001708984375, -10.25732421875, -9.512939453125, -8.7685546875, -8.024169921875, -7.27978515625, -6.535400390625, -5.791015625, -5.046630859375, -4.30224609375, -3.557861328125, -2.8134765625, -2.069091796875, -1.32470703125, -0.580322265625, 0.1640625, 0.908447265625, 1.65283203125, 2.397216796875, 3.1416015625, 3.885986328125, 4.63037109375, 5.374755859375, 6.119140625, 6.863525390625, 7.60791015625, 8.352294921875, 9.0966796875, 9.841064453125, 10.58544921875, 11.329833984375, 12.07421875, 12.818603515625, 13.56298828125, 14.307373046875, 15.0517578125, 15.796142578125, 16.54052734375, 17.284912109375, 18.029296875, 18.773681640625, 19.51806640625, 20.262451171875, 21.0068359375, 21.751220703125, 22.49560546875, 23.239990234375, 23.984375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 8.0, 3.0, 9.0, 9.0, 7.0, 9.0, 14.0, 27.0, 24.0, 47.0, 61.0, 61.0, 107.0, 149.0, 201.0, 284.0, 480.0, 890.0, 3019.0, 94985.0, 3023598.0, 18092.0, 1660.0, 669.0, 388.0, 259.0, 196.0, 123.0, 86.0, 53.0, 38.0, 43.0, 27.0, 16.0, 14.0, 13.0, 7.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.21875, -61.06298828125, -58.9072265625, -56.75146484375, -54.595703125, -52.43994140625, -50.2841796875, -48.12841796875, -45.97265625, -43.81689453125, -41.6611328125, -39.50537109375, -37.349609375, -35.19384765625, -33.0380859375, -30.88232421875, -28.7265625, -26.57080078125, -24.4150390625, -22.25927734375, -20.103515625, -17.94775390625, -15.7919921875, -13.63623046875, -11.48046875, -9.32470703125, -7.1689453125, -5.01318359375, -2.857421875, -0.70166015625, 1.4541015625, 3.60986328125, 5.765625, 7.92138671875, 10.0771484375, 12.23291015625, 14.388671875, 16.54443359375, 18.7001953125, 20.85595703125, 23.01171875, 25.16748046875, 27.3232421875, 29.47900390625, 31.634765625, 33.79052734375, 35.9462890625, 38.10205078125, 40.2578125, 42.41357421875, 44.5693359375, 46.72509765625, 48.880859375, 51.03662109375, 53.1923828125, 55.34814453125, 57.50390625, 59.65966796875, 61.8154296875, 63.97119140625, 66.126953125, 68.28271484375, 70.4384765625, 72.59423828125, 74.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 15.0, 118.0, 379.0, 360.0, 108.0, 30.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-212.55931091308594, -205.94418334960938, -199.32904052734375, -192.7139129638672, -186.09877014160156, -179.483642578125, -172.86849975585938, -166.2533721923828, -159.63824462890625, -153.0231170654297, -146.40797424316406, -139.7928466796875, -133.17770385742188, -126.56257629394531, -119.94744110107422, -113.33230590820312, -106.7171630859375, -100.1020278930664, -93.48689270019531, -86.87176513671875, -80.25662231445312, -73.64149475097656, -67.02635955810547, -60.411224365234375, -53.79608917236328, -47.18095397949219, -40.565818786621094, -33.950687408447266, -27.335552215576172, -20.720417022705078, -14.10528564453125, -7.490150451660156, -0.8750152587890625, 5.740118980407715, 12.355253219604492, 18.970386505126953, 25.585521697998047, 32.20065689086914, 38.81578826904297, 45.43092346191406, 52.046058654785156, 58.66119384765625, 65.27632904052734, 71.89146423339844, 78.506591796875, 85.12173461914062, 91.73686218261719, 98.35199737548828, 104.96713256835938, 111.58226776123047, 118.19740295410156, 124.81253051757812, 131.42767333984375, 138.0428009033203, 144.65792846679688, 151.2730712890625, 157.88821411132812, 164.5033416748047, 171.1184844970703, 177.73361206054688, 184.3487548828125, 190.96388244628906, 197.57901000976562, 204.19415283203125, 210.8092803955078]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 9.0, 8.0, 4.0, 15.0, 13.0, 12.0, 15.0, 19.0, 16.0, 27.0, 13.0, 19.0, 23.0, 23.0, 31.0, 36.0, 32.0, 35.0, 39.0, 32.0, 38.0, 38.0, 41.0, 29.0, 38.0, 38.0, 37.0, 41.0, 29.0, 22.0, 24.0, 27.0, 18.0, 28.0, 19.0, 25.0, 11.0, 11.0, 16.0, 13.0, 9.0, 6.0, 7.0, 6.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-70.94068908691406, -69.0074234008789, -67.07415771484375, -65.14089965820312, -63.20763397216797, -61.27436828613281, -59.34110641479492, -57.40784454345703, -55.474578857421875, -53.54131317138672, -51.60805130004883, -49.67478942871094, -47.74152374267578, -45.808258056640625, -43.874996185302734, -41.941734313964844, -40.00846862792969, -38.07520294189453, -36.14194107055664, -34.20867919921875, -32.275413513183594, -30.34214973449707, -28.408885955810547, -26.475622177124023, -24.5423583984375, -22.609094619750977, -20.675830841064453, -18.74256706237793, -16.809303283691406, -14.876039505004883, -12.94277572631836, -11.009511947631836, -9.076244354248047, -7.142980575561523, -5.209716796875, -3.2764530181884766, -1.3431892395019531, 0.5900745391845703, 2.5233383178710938, 4.456602096557617, 6.389865875244141, 8.323129653930664, 10.256393432617188, 12.189657211303711, 14.122920989990234, 16.056184768676758, 17.98944854736328, 19.922712326049805, 21.855976104736328, 23.78923988342285, 25.722503662109375, 27.6557674407959, 29.589031219482422, 31.522294998168945, 33.45555877685547, 35.388824462890625, 37.322086334228516, 39.255348205566406, 41.18861389160156, 43.12187957763672, 45.05514144897461, 46.9884033203125, 48.921669006347656, 50.85493469238281, 52.7881965637207]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 8.0, 10.0, 15.0, 7.0, 19.0, 22.0, 28.0, 30.0, 36.0, 28.0, 35.0, 38.0, 44.0, 55.0, 47.0, 52.0, 42.0, 60.0, 44.0, 47.0, 43.0, 34.0, 32.0, 36.0, 39.0, 23.0, 36.0, 16.0, 8.0, 13.0, 9.0, 8.0, 10.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.5447998046875, -9.198974609375, -8.8531494140625, -8.50732421875, -8.1614990234375, -7.815673828125, -7.4698486328125, -7.1240234375, -6.7781982421875, -6.432373046875, -6.0865478515625, -5.74072265625, -5.3948974609375, -5.049072265625, -4.7032470703125, -4.357421875, -4.0115966796875, -3.665771484375, -3.3199462890625, -2.97412109375, -2.6282958984375, -2.282470703125, -1.9366455078125, -1.5908203125, -1.2449951171875, -0.899169921875, -0.5533447265625, -0.20751953125, 0.1383056640625, 0.484130859375, 0.8299560546875, 1.17578125, 1.5216064453125, 1.867431640625, 2.2132568359375, 2.55908203125, 2.9049072265625, 3.250732421875, 3.5965576171875, 3.9423828125, 4.2882080078125, 4.634033203125, 4.9798583984375, 5.32568359375, 5.6715087890625, 6.017333984375, 6.3631591796875, 6.708984375, 7.0548095703125, 7.400634765625, 7.7464599609375, 8.09228515625, 8.4381103515625, 8.783935546875, 9.1297607421875, 9.4755859375, 9.8214111328125, 10.167236328125, 10.5130615234375, 10.85888671875, 11.2047119140625, 11.550537109375, 11.8963623046875, 12.2421875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 12.0, 14.0, 20.0, 19.0, 40.0, 54.0, 48.0, 71.0, 101.0, 144.0, 182.0, 285.0, 408.0, 661.0, 1069.0, 1798.0, 3201.0, 7052.0, 20465.0, 96165.0, 593554.0, 2326249.0, 945596.0, 148702.0, 29066.0, 9377.0, 4130.0, 2163.0, 1167.0, 764.0, 483.0, 344.0, 221.0, 182.0, 112.0, 77.0, 65.0, 43.0, 29.0, 36.0, 22.0, 14.0, 14.0, 12.0, 7.0, 10.0, 7.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-19.375, -18.78125, -18.1875, -17.59375, -17.0, -16.40625, -15.8125, -15.21875, -14.625, -14.03125, -13.4375, -12.84375, -12.25, -11.65625, -11.0625, -10.46875, -9.875, -9.28125, -8.6875, -8.09375, -7.5, -6.90625, -6.3125, -5.71875, -5.125, -4.53125, -3.9375, -3.34375, -2.75, -2.15625, -1.5625, -0.96875, -0.375, 0.21875, 0.8125, 1.40625, 2.0, 2.59375, 3.1875, 3.78125, 4.375, 4.96875, 5.5625, 6.15625, 6.75, 7.34375, 7.9375, 8.53125, 9.125, 9.71875, 10.3125, 10.90625, 11.5, 12.09375, 12.6875, 13.28125, 13.875, 14.46875, 15.0625, 15.65625, 16.25, 16.84375, 17.4375, 18.03125, 18.625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 8.0, 13.0, 10.0, 9.0, 31.0, 36.0, 52.0, 82.0, 112.0, 224.0, 269.0, 459.0, 726.0, 665.0, 450.0, 292.0, 197.0, 124.0, 87.0, 62.0, 50.0, 35.0, 21.0, 16.0, 12.0, 8.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.839111328125, -15.17822265625, -14.517333984375, -13.8564453125, -13.195556640625, -12.53466796875, -11.873779296875, -11.212890625, -10.552001953125, -9.89111328125, -9.230224609375, -8.5693359375, -7.908447265625, -7.24755859375, -6.586669921875, -5.92578125, -5.264892578125, -4.60400390625, -3.943115234375, -3.2822265625, -2.621337890625, -1.96044921875, -1.299560546875, -0.638671875, 0.022216796875, 0.68310546875, 1.343994140625, 2.0048828125, 2.665771484375, 3.32666015625, 3.987548828125, 4.6484375, 5.309326171875, 5.97021484375, 6.631103515625, 7.2919921875, 7.952880859375, 8.61376953125, 9.274658203125, 9.935546875, 10.596435546875, 11.25732421875, 11.918212890625, 12.5791015625, 13.239990234375, 13.90087890625, 14.561767578125, 15.22265625, 15.883544921875, 16.54443359375, 17.205322265625, 17.8662109375, 18.527099609375, 19.18798828125, 19.848876953125, 20.509765625, 21.170654296875, 21.83154296875, 22.492431640625, 23.1533203125, 23.814208984375, 24.47509765625, 25.135986328125, 25.796875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 5.0, 11.0, 21.0, 34.0, 51.0, 104.0, 177.0, 379.0, 820.0, 1833.0, 5281.0, 19564.0, 131095.0, 2691126.0, 1248235.0, 75253.0, 13483.0, 4026.0, 1441.0, 659.0, 320.0, 148.0, 77.0, 62.0, 30.0, 16.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.640625, -28.537841796875, -27.43505859375, -26.332275390625, -25.2294921875, -24.126708984375, -23.02392578125, -21.921142578125, -20.818359375, -19.715576171875, -18.61279296875, -17.510009765625, -16.4072265625, -15.304443359375, -14.20166015625, -13.098876953125, -11.99609375, -10.893310546875, -9.79052734375, -8.687744140625, -7.5849609375, -6.482177734375, -5.37939453125, -4.276611328125, -3.173828125, -2.071044921875, -0.96826171875, 0.134521484375, 1.2373046875, 2.340087890625, 3.44287109375, 4.545654296875, 5.6484375, 6.751220703125, 7.85400390625, 8.956787109375, 10.0595703125, 11.162353515625, 12.26513671875, 13.367919921875, 14.470703125, 15.573486328125, 16.67626953125, 17.779052734375, 18.8818359375, 19.984619140625, 21.08740234375, 22.190185546875, 23.29296875, 24.395751953125, 25.49853515625, 26.601318359375, 27.7041015625, 28.806884765625, 29.90966796875, 31.012451171875, 32.115234375, 33.218017578125, 34.32080078125, 35.423583984375, 36.5263671875, 37.629150390625, 38.73193359375, 39.834716796875, 40.9375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 15.0, 902.0, 98.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1472.0360107421875, -1437.5185546875, -1403.0010986328125, -1368.4835205078125, -1333.966064453125, -1299.4486083984375, -1264.93115234375, -1230.41357421875, -1195.8961181640625, -1161.378662109375, -1126.8612060546875, -1092.3436279296875, -1057.826171875, -1023.3087158203125, -988.791259765625, -954.2737426757812, -919.7562866210938, -885.2388305664062, -850.7213134765625, -816.203857421875, -781.6863403320312, -747.1688842773438, -712.6513671875, -678.1339111328125, -643.616455078125, -609.0989990234375, -574.5814819335938, -540.0640258789062, -505.5465087890625, -471.029052734375, -436.5115661621094, -401.99407958984375, -367.47662353515625, -332.9591369628906, -298.441650390625, -263.9241943359375, -229.4066925048828, -194.8892059326172, -160.37173461914062, -125.854248046875, -91.33676147460938, -56.819278717041016, -22.301795959472656, 12.215682983398438, 46.73316955566406, 81.25065612792969, 115.76812744140625, 150.28561401367188, 184.8031005859375, 219.32058715820312, 253.83807373046875, 288.35552978515625, 322.873046875, 357.3905029296875, 391.9079895019531, 426.42547607421875, 460.9429626464844, 495.46044921875, 529.9779052734375, 564.4954223632812, 599.0128784179688, 633.5303955078125, 668.0478515625, 702.5653076171875, 737.0828247070312]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 7.0, 10.0, 11.0, 10.0, 20.0, 13.0, 30.0, 33.0, 32.0, 34.0, 46.0, 49.0, 53.0, 56.0, 51.0, 34.0, 66.0, 60.0, 43.0, 48.0, 57.0, 35.0, 37.0, 24.0, 22.0, 32.0, 18.0, 15.0, 8.0, 11.0, 5.0, 15.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.10401916503906, -75.67633819580078, -73.24866485595703, -70.82098388671875, -68.393310546875, -65.96562957763672, -63.53795623779297, -61.11027526855469, -58.68260192871094, -56.25492477416992, -53.827247619628906, -51.39957046508789, -48.971893310546875, -46.54421615600586, -44.116539001464844, -41.68885803222656, -39.26118087768555, -36.83350372314453, -34.405826568603516, -31.9781494140625, -29.550472259521484, -27.12279510498047, -24.69511604309082, -22.267438888549805, -19.83976173400879, -17.412084579467773, -14.984407424926758, -12.556729316711426, -10.12905216217041, -7.7013750076293945, -5.2736968994140625, -2.846019744873047, -0.41834259033203125, 2.0093348026275635, 4.437012195587158, 6.864689826965332, 9.292366981506348, 11.720044136047363, 14.147722244262695, 16.57539939880371, 19.003076553344727, 21.430753707885742, 23.858430862426758, 26.286109924316406, 28.713787078857422, 31.141464233398438, 33.56914138793945, 35.99681854248047, 38.424495697021484, 40.8521728515625, 43.279850006103516, 45.70752716064453, 48.13520431518555, 50.56288146972656, 52.990562438964844, 55.418235778808594, 57.845916748046875, 60.27359390258789, 62.701271057128906, 65.12895202636719, 67.55662536621094, 69.98430633544922, 72.41197967529297, 74.83966064453125, 77.267333984375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 5.0, 11.0, 11.0, 11.0, 15.0, 21.0, 10.0, 33.0, 36.0, 35.0, 40.0, 36.0, 37.0, 43.0, 44.0, 41.0, 57.0, 38.0, 53.0, 28.0, 40.0, 55.0, 37.0, 42.0, 35.0, 30.0, 23.0, 21.0, 13.0, 19.0, 16.0, 12.0, 11.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7421875, -7.4610595703125, -7.179931640625, -6.8988037109375, -6.61767578125, -6.3365478515625, -6.055419921875, -5.7742919921875, -5.4931640625, -5.2120361328125, -4.930908203125, -4.6497802734375, -4.36865234375, -4.0875244140625, -3.806396484375, -3.5252685546875, -3.244140625, -2.9630126953125, -2.681884765625, -2.4007568359375, -2.11962890625, -1.8385009765625, -1.557373046875, -1.2762451171875, -0.9951171875, -0.7139892578125, -0.432861328125, -0.1517333984375, 0.12939453125, 0.4105224609375, 0.691650390625, 0.9727783203125, 1.25390625, 1.5350341796875, 1.816162109375, 2.0972900390625, 2.37841796875, 2.6595458984375, 2.940673828125, 3.2218017578125, 3.5029296875, 3.7840576171875, 4.065185546875, 4.3463134765625, 4.62744140625, 4.9085693359375, 5.189697265625, 5.4708251953125, 5.751953125, 6.0330810546875, 6.314208984375, 6.5953369140625, 6.87646484375, 7.1575927734375, 7.438720703125, 7.7198486328125, 8.0009765625, 8.2821044921875, 8.563232421875, 8.8443603515625, 9.12548828125, 9.4066162109375, 9.687744140625, 9.9688720703125, 10.25]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 0.0, 10.0, 17.0, 24.0, 40.0, 48.0, 82.0, 104.0, 192.0, 303.0, 459.0, 666.0, 1083.0, 1784.0, 2885.0, 4605.0, 7746.0, 13601.0, 23311.0, 43001.0, 80144.0, 145203.0, 220280.0, 209669.0, 131647.0, 71935.0, 38226.0, 20997.0, 12172.0, 7098.0, 4303.0, 2612.0, 1593.0, 959.0, 623.0, 417.0, 274.0, 148.0, 101.0, 71.0, 38.0, 29.0, 25.0, 7.0, 12.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9303207397460938, -0.8992156982421875, -0.8681106567382812, -0.837005615234375, -0.8059005737304688, -0.7747955322265625, -0.7436904907226562, -0.71258544921875, -0.6814804077148438, -0.6503753662109375, -0.6192703247070312, -0.588165283203125, -0.5570602416992188, -0.5259552001953125, -0.49485015869140625, -0.4637451171875, -0.43264007568359375, -0.4015350341796875, -0.37042999267578125, -0.339324951171875, -0.30821990966796875, -0.2771148681640625, -0.24600982666015625, -0.21490478515625, -0.18379974365234375, -0.1526947021484375, -0.12158966064453125, -0.090484619140625, -0.05937957763671875, -0.0282745361328125, 0.00283050537109375, 0.033935546875, 0.06504058837890625, 0.0961456298828125, 0.12725067138671875, 0.158355712890625, 0.18946075439453125, 0.2205657958984375, 0.25167083740234375, 0.28277587890625, 0.31388092041015625, 0.3449859619140625, 0.37609100341796875, 0.407196044921875, 0.43830108642578125, 0.4694061279296875, 0.5005111694335938, 0.5316162109375, 0.5627212524414062, 0.5938262939453125, 0.6249313354492188, 0.656036376953125, 0.6871414184570312, 0.7182464599609375, 0.7493515014648438, 0.78045654296875, 0.8115615844726562, 0.8426666259765625, 0.8737716674804688, 0.904876708984375, 0.9359817504882812, 0.9670867919921875, 0.9981918334960938, 1.029296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 5.0, 4.0, 9.0, 6.0, 12.0, 13.0, 22.0, 16.0, 25.0, 18.0, 32.0, 30.0, 32.0, 37.0, 34.0, 36.0, 39.0, 28.0, 49.0, 41.0, 1066.0, 42.0, 39.0, 32.0, 30.0, 38.0, 32.0, 40.0, 25.0, 29.0, 20.0, 17.0, 21.0, 19.0, 14.0, 15.0, 14.0, 5.0, 6.0, 4.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0625, -5.87969970703125, -5.6968994140625, -5.51409912109375, -5.331298828125, -5.14849853515625, -4.9656982421875, -4.78289794921875, -4.60009765625, -4.41729736328125, -4.2344970703125, -4.05169677734375, -3.868896484375, -3.68609619140625, -3.5032958984375, -3.32049560546875, -3.1376953125, -2.95489501953125, -2.7720947265625, -2.58929443359375, -2.406494140625, -2.22369384765625, -2.0408935546875, -1.85809326171875, -1.67529296875, -1.49249267578125, -1.3096923828125, -1.12689208984375, -0.944091796875, -0.76129150390625, -0.5784912109375, -0.39569091796875, -0.212890625, -0.03009033203125, 0.1527099609375, 0.33551025390625, 0.518310546875, 0.70111083984375, 0.8839111328125, 1.06671142578125, 1.24951171875, 1.43231201171875, 1.6151123046875, 1.79791259765625, 1.980712890625, 2.16351318359375, 2.3463134765625, 2.52911376953125, 2.7119140625, 2.89471435546875, 3.0775146484375, 3.26031494140625, 3.443115234375, 3.62591552734375, 3.8087158203125, 3.99151611328125, 4.17431640625, 4.35711669921875, 4.5399169921875, 4.72271728515625, 4.905517578125, 5.08831787109375, 5.2711181640625, 5.45391845703125, 5.63671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 11.0, 12.0, 19.0, 28.0, 31.0, 66.0, 76.0, 103.0, 169.0, 236.0, 370.0, 547.0, 875.0, 1306.0, 2140.0, 3513.0, 6150.0, 11552.0, 24228.0, 81318.0, 1818485.0, 92672.0, 25022.0, 12053.0, 6382.0, 3633.0, 2199.0, 1374.0, 901.0, 567.0, 362.0, 246.0, 162.0, 115.0, 71.0, 39.0, 33.0, 21.0, 20.0, 9.0, 5.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.92578125, -1.8665771484375, -1.807373046875, -1.7481689453125, -1.68896484375, -1.6297607421875, -1.570556640625, -1.5113525390625, -1.4521484375, -1.3929443359375, -1.333740234375, -1.2745361328125, -1.21533203125, -1.1561279296875, -1.096923828125, -1.0377197265625, -0.978515625, -0.9193115234375, -0.860107421875, -0.8009033203125, -0.74169921875, -0.6824951171875, -0.623291015625, -0.5640869140625, -0.5048828125, -0.4456787109375, -0.386474609375, -0.3272705078125, -0.26806640625, -0.2088623046875, -0.149658203125, -0.0904541015625, -0.03125, 0.0279541015625, 0.087158203125, 0.1463623046875, 0.20556640625, 0.2647705078125, 0.323974609375, 0.3831787109375, 0.4423828125, 0.5015869140625, 0.560791015625, 0.6199951171875, 0.67919921875, 0.7384033203125, 0.797607421875, 0.8568115234375, 0.916015625, 0.9752197265625, 1.034423828125, 1.0936279296875, 1.15283203125, 1.2120361328125, 1.271240234375, 1.3304443359375, 1.3896484375, 1.4488525390625, 1.508056640625, 1.5672607421875, 1.62646484375, 1.6856689453125, 1.744873046875, 1.8040771484375, 1.86328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 8.0, 7.0, 10.0, 17.0, 23.0, 27.0, 27.0, 32.0, 26.0, 43.0, 41.0, 41.0, 61.0, 53.0, 61.0, 59.0, 55.0, 47.0, 42.0, 39.0, 37.0, 43.0, 32.0, 34.0, 24.0, 16.0, 22.0, 13.0, 5.0, 8.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0643310546875, -0.06260156631469727, -0.06087207794189453, -0.0591425895690918, -0.05741310119628906, -0.05568361282348633, -0.053954124450683594, -0.05222463607788086, -0.050495147705078125, -0.04876565933227539, -0.047036170959472656, -0.04530668258666992, -0.04357719421386719, -0.04184770584106445, -0.04011821746826172, -0.038388729095458984, -0.03665924072265625, -0.034929752349853516, -0.03320026397705078, -0.03147077560424805, -0.029741287231445312, -0.028011798858642578, -0.026282310485839844, -0.02455282211303711, -0.022823333740234375, -0.02109384536743164, -0.019364356994628906, -0.017634868621826172, -0.015905380249023438, -0.014175891876220703, -0.012446403503417969, -0.010716915130615234, -0.0089874267578125, -0.007257938385009766, -0.005528450012207031, -0.003798961639404297, -0.0020694732666015625, -0.0003399848937988281, 0.0013895034790039062, 0.0031189918518066406, 0.004848480224609375, 0.006577968597412109, 0.008307456970214844, 0.010036945343017578, 0.011766433715820312, 0.013495922088623047, 0.015225410461425781, 0.016954898834228516, 0.01868438720703125, 0.020413875579833984, 0.02214336395263672, 0.023872852325439453, 0.025602340698242188, 0.027331829071044922, 0.029061317443847656, 0.03079080581665039, 0.032520294189453125, 0.03424978256225586, 0.035979270935058594, 0.03770875930786133, 0.03943824768066406, 0.0411677360534668, 0.04289722442626953, 0.044626712799072266, 0.046356201171875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 11.0, 12.0, 13.0, 17.0, 16.0, 25.0, 36.0, 37.0, 56.0, 64.0, 96.0, 131.0, 197.0, 289.0, 468.0, 1310.0, 46014.0, 966878.0, 30236.0, 1218.0, 449.0, 277.0, 167.0, 125.0, 104.0, 81.0, 49.0, 41.0, 32.0, 23.0, 22.0, 11.0, 10.0, 12.0, 5.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85498046875, -0.8238449096679688, -0.7927093505859375, -0.7615737915039062, -0.730438232421875, -0.6993026733398438, -0.6681671142578125, -0.6370315551757812, -0.60589599609375, -0.5747604370117188, -0.5436248779296875, -0.5124893188476562, -0.481353759765625, -0.45021820068359375, -0.4190826416015625, -0.38794708251953125, -0.3568115234375, -0.32567596435546875, -0.2945404052734375, -0.26340484619140625, -0.232269287109375, -0.20113372802734375, -0.1699981689453125, -0.13886260986328125, -0.10772705078125, -0.07659149169921875, -0.0454559326171875, -0.01432037353515625, 0.016815185546875, 0.04795074462890625, 0.0790863037109375, 0.11022186279296875, 0.141357421875, 0.17249298095703125, 0.2036285400390625, 0.23476409912109375, 0.265899658203125, 0.29703521728515625, 0.3281707763671875, 0.35930633544921875, 0.39044189453125, 0.42157745361328125, 0.4527130126953125, 0.48384857177734375, 0.514984130859375, 0.5461196899414062, 0.5772552490234375, 0.6083908081054688, 0.6395263671875, 0.6706619262695312, 0.7017974853515625, 0.7329330444335938, 0.764068603515625, 0.7952041625976562, 0.8263397216796875, 0.8574752807617188, 0.88861083984375, 0.9197463989257812, 0.9508819580078125, 0.9820175170898438, 1.013153076171875, 1.0442886352539062, 1.0754241943359375, 1.1065597534179688, 1.1376953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 31.0, 368.0, 531.0, 76.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30367860198020935, -0.2893121838569641, -0.27494579553604126, -0.260579377412796, -0.24621295928955078, -0.23184655606746674, -0.2174801528453827, -0.20311373472213745, -0.1887473315000534, -0.17438092827796936, -0.16001451015472412, -0.14564810693264008, -0.13128170371055603, -0.11691528558731079, -0.10254888236522675, -0.0881824716925621, -0.07381606101989746, -0.05944965034723282, -0.045083243399858475, -0.03071683645248413, -0.01635042577981949, -0.001984015107154846, 0.0123823881149292, 0.02674879878759384, 0.041115209460258484, 0.055481620132923126, 0.06984803080558777, 0.08421443402767181, 0.09858084470033646, 0.1129472553730011, 0.12731365859508514, 0.1416800618171692, 0.15604650974273682, 0.17041291296482086, 0.1847793310880661, 0.19914573431015015, 0.21351215243339539, 0.22787855565547943, 0.24224495887756348, 0.2566113770008087, 0.27097779512405396, 0.2853442132472992, 0.29971060156822205, 0.3140770196914673, 0.3284434378147125, 0.34280985593795776, 0.3571762442588806, 0.37154266238212585, 0.3859090507030487, 0.40027546882629395, 0.4146418571472168, 0.42900827527046204, 0.4433746933937073, 0.4577410817146301, 0.47210749983787537, 0.4864739179611206, 0.5008403062820435, 0.5152066946029663, 0.5295731425285339, 0.5439395308494568, 0.5583059191703796, 0.5726723670959473, 0.5870387554168701, 0.601405143737793, 0.6157715916633606]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 7.0, 4.0, 7.0, 12.0, 13.0, 16.0, 12.0, 20.0, 18.0, 32.0, 24.0, 26.0, 34.0, 26.0, 36.0, 30.0, 49.0, 44.0, 41.0, 37.0, 37.0, 42.0, 48.0, 26.0, 32.0, 31.0, 33.0, 28.0, 27.0, 21.0, 18.0, 22.0, 26.0, 17.0, 18.0, 10.0, 12.0, 12.0, 7.0, 7.0, 5.0, 7.0, 10.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.04535651206970215, -0.04406628757715225, -0.042776063084602356, -0.04148583486676216, -0.040195610374212265, -0.03890538588166237, -0.037615157663822174, -0.03632493317127228, -0.03503470867872238, -0.033744484186172485, -0.03245425969362259, -0.031164031475782394, -0.029873806983232498, -0.028583582490682602, -0.027293356135487556, -0.02600312978029251, -0.024712905287742615, -0.02342268079519272, -0.022132454439997673, -0.020842228084802628, -0.01955200359225273, -0.018261779099702835, -0.01697155274450779, -0.015681326389312744, -0.014391101896762848, -0.013100876472890377, -0.011810651049017906, -0.010520425625145435, -0.009230200201272964, -0.007939974777400494, -0.006649749353528023, -0.005359523929655552, -0.004069298505783081, -0.00277907308191061, -0.0014888476580381393, -0.0001986222341656685, 0.0010916031897068024, 0.0023818286135792732, 0.003672054037451744, 0.004962279461324215, 0.006252504885196686, 0.007542730309069157, 0.008832955732941628, 0.010123181156814098, 0.01141340658068657, 0.01270363200455904, 0.013993857428431511, 0.015284082852303982, 0.016574308276176453, 0.01786453276872635, 0.019154759123921394, 0.02044498547911644, 0.021735209971666336, 0.023025434464216232, 0.024315660819411278, 0.025605887174606323, 0.02689611166715622, 0.028186336159706116, 0.02947656251490116, 0.030766788870096207, 0.0320570133626461, 0.033347237855196, 0.034637466073036194, 0.03592769056558609, 0.037217915058135986]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 5.0, 10.0, 11.0, 12.0, 15.0, 21.0, 10.0, 33.0, 35.0, 35.0, 41.0, 36.0, 37.0, 42.0, 45.0, 41.0, 58.0, 37.0, 52.0, 30.0, 41.0, 53.0, 36.0, 43.0, 35.0, 30.0, 23.0, 22.0, 12.0, 19.0, 16.0, 12.0, 11.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7421875, -7.4610595703125, -7.179931640625, -6.8988037109375, -6.61767578125, -6.3365478515625, -6.055419921875, -5.7742919921875, -5.4931640625, -5.2120361328125, -4.930908203125, -4.6497802734375, -4.36865234375, -4.0875244140625, -3.806396484375, -3.5252685546875, -3.244140625, -2.9630126953125, -2.681884765625, -2.4007568359375, -2.11962890625, -1.8385009765625, -1.557373046875, -1.2762451171875, -0.9951171875, -0.7139892578125, -0.432861328125, -0.1517333984375, 0.12939453125, 0.4105224609375, 0.691650390625, 0.9727783203125, 1.25390625, 1.5350341796875, 1.816162109375, 2.0972900390625, 2.37841796875, 2.6595458984375, 2.940673828125, 3.2218017578125, 3.5029296875, 3.7840576171875, 4.065185546875, 4.3463134765625, 4.62744140625, 4.9085693359375, 5.189697265625, 5.4708251953125, 5.751953125, 6.0330810546875, 6.314208984375, 6.5953369140625, 6.87646484375, 7.1575927734375, 7.438720703125, 7.7198486328125, 8.0009765625, 8.2821044921875, 8.563232421875, 8.8443603515625, 9.12548828125, 9.4066162109375, 9.687744140625, 9.9688720703125, 10.25]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 9.0, 11.0, 27.0, 29.0, 37.0, 44.0, 62.0, 110.0, 136.0, 185.0, 288.0, 471.0, 642.0, 903.0, 1578.0, 3024.0, 6707.0, 17765.0, 64337.0, 397967.0, 448996.0, 71380.0, 18797.0, 6952.0, 3243.0, 1692.0, 1013.0, 654.0, 446.0, 319.0, 196.0, 148.0, 120.0, 82.0, 45.0, 37.0, 32.0, 18.0, 14.0, 10.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.640625, -21.0400390625, -20.439453125, -19.8388671875, -19.23828125, -18.6376953125, -18.037109375, -17.4365234375, -16.8359375, -16.2353515625, -15.634765625, -15.0341796875, -14.43359375, -13.8330078125, -13.232421875, -12.6318359375, -12.03125, -11.4306640625, -10.830078125, -10.2294921875, -9.62890625, -9.0283203125, -8.427734375, -7.8271484375, -7.2265625, -6.6259765625, -6.025390625, -5.4248046875, -4.82421875, -4.2236328125, -3.623046875, -3.0224609375, -2.421875, -1.8212890625, -1.220703125, -0.6201171875, -0.01953125, 0.5810546875, 1.181640625, 1.7822265625, 2.3828125, 2.9833984375, 3.583984375, 4.1845703125, 4.78515625, 5.3857421875, 5.986328125, 6.5869140625, 7.1875, 7.7880859375, 8.388671875, 8.9892578125, 9.58984375, 10.1904296875, 10.791015625, 11.3916015625, 11.9921875, 12.5927734375, 13.193359375, 13.7939453125, 14.39453125, 14.9951171875, 15.595703125, 16.1962890625, 16.796875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 9.0, 7.0, 15.0, 7.0, 15.0, 25.0, 29.0, 20.0, 39.0, 26.0, 42.0, 36.0, 43.0, 65.0, 92.0, 160.0, 301.0, 1375.0, 191.0, 107.0, 71.0, 47.0, 56.0, 44.0, 26.0, 35.0, 26.0, 27.0, 19.0, 18.0, 10.0, 9.0, 9.0, 9.0, 7.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.125, -21.51123046875, -20.8974609375, -20.28369140625, -19.669921875, -19.05615234375, -18.4423828125, -17.82861328125, -17.21484375, -16.60107421875, -15.9873046875, -15.37353515625, -14.759765625, -14.14599609375, -13.5322265625, -12.91845703125, -12.3046875, -11.69091796875, -11.0771484375, -10.46337890625, -9.849609375, -9.23583984375, -8.6220703125, -8.00830078125, -7.39453125, -6.78076171875, -6.1669921875, -5.55322265625, -4.939453125, -4.32568359375, -3.7119140625, -3.09814453125, -2.484375, -1.87060546875, -1.2568359375, -0.64306640625, -0.029296875, 0.58447265625, 1.1982421875, 1.81201171875, 2.42578125, 3.03955078125, 3.6533203125, 4.26708984375, 4.880859375, 5.49462890625, 6.1083984375, 6.72216796875, 7.3359375, 7.94970703125, 8.5634765625, 9.17724609375, 9.791015625, 10.40478515625, 11.0185546875, 11.63232421875, 12.24609375, 12.85986328125, 13.4736328125, 14.08740234375, 14.701171875, 15.31494140625, 15.9287109375, 16.54248046875, 17.15625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 8.0, 13.0, 19.0, 20.0, 23.0, 36.0, 45.0, 55.0, 108.0, 160.0, 200.0, 306.0, 523.0, 1160.0, 4550.0, 96333.0, 3022700.0, 15133.0, 2253.0, 768.0, 441.0, 257.0, 157.0, 134.0, 72.0, 57.0, 38.0, 25.0, 29.0, 20.0, 17.0, 11.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.71875, -48.71240234375, -46.7060546875, -44.69970703125, -42.693359375, -40.68701171875, -38.6806640625, -36.67431640625, -34.66796875, -32.66162109375, -30.6552734375, -28.64892578125, -26.642578125, -24.63623046875, -22.6298828125, -20.62353515625, -18.6171875, -16.61083984375, -14.6044921875, -12.59814453125, -10.591796875, -8.58544921875, -6.5791015625, -4.57275390625, -2.56640625, -0.56005859375, 1.4462890625, 3.45263671875, 5.458984375, 7.46533203125, 9.4716796875, 11.47802734375, 13.484375, 15.49072265625, 17.4970703125, 19.50341796875, 21.509765625, 23.51611328125, 25.5224609375, 27.52880859375, 29.53515625, 31.54150390625, 33.5478515625, 35.55419921875, 37.560546875, 39.56689453125, 41.5732421875, 43.57958984375, 45.5859375, 47.59228515625, 49.5986328125, 51.60498046875, 53.611328125, 55.61767578125, 57.6240234375, 59.63037109375, 61.63671875, 63.64306640625, 65.6494140625, 67.65576171875, 69.662109375, 71.66845703125, 73.6748046875, 75.68115234375, 77.6875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 9.0, 8.0, 40.0, 54.0, 74.0, 138.0, 181.0, 170.0, 127.0, 91.0, 53.0, 28.0, 14.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.39653396606445, -35.5035400390625, -31.610549926757812, -27.717557907104492, -23.824565887451172, -19.93157386779785, -16.03858184814453, -12.145589828491211, -8.25259780883789, -4.35960578918457, -0.46661376953125, 3.4263782501220703, 7.319370269775391, 11.212362289428711, 15.105354309082031, 18.99834632873535, 22.891338348388672, 26.784330368041992, 30.677322387695312, 34.5703125, 38.46330642700195, 42.356300354003906, 46.249290466308594, 50.14228057861328, 54.035274505615234, 57.92826843261719, 61.821258544921875, 65.71424865722656, 69.60723876953125, 73.50023651123047, 77.39322662353516, 81.28621673583984, 85.17921447753906, 89.07220458984375, 92.96519470214844, 96.85819244384766, 100.75118255615234, 104.64417266845703, 108.53717041015625, 112.43016052246094, 116.32315063476562, 120.21614074707031, 124.109130859375, 128.0021209716797, 131.89511108398438, 135.78811645507812, 139.6811065673828, 143.5740966796875, 147.4670867919922, 151.36007690429688, 155.25306701660156, 159.14605712890625, 163.0390625, 166.9320526123047, 170.82504272460938, 174.71803283691406, 178.61102294921875, 182.50401306152344, 186.39700317382812, 190.2899932861328, 194.1829833984375, 198.07598876953125, 201.96897888183594, 205.86196899414062, 209.7549591064453]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 3.0, 6.0, 4.0, 7.0, 12.0, 10.0, 12.0, 14.0, 12.0, 17.0, 11.0, 17.0, 18.0, 28.0, 29.0, 29.0, 45.0, 32.0, 38.0, 36.0, 40.0, 31.0, 40.0, 41.0, 40.0, 39.0, 31.0, 32.0, 32.0, 33.0, 36.0, 27.0, 21.0, 25.0, 19.0, 16.0, 17.0, 16.0, 19.0, 9.0, 10.0, 11.0, 4.0, 5.0, 10.0, 2.0, 5.0, 6.0, 5.0, 0.0, 2.0], "bins": [-75.525634765625, -73.54178619384766, -71.55793762207031, -69.57408905029297, -67.59024047851562, -65.60638427734375, -63.622535705566406, -61.63868713378906, -59.65483856201172, -57.670989990234375, -55.68714141845703, -53.70328903198242, -51.71944046020508, -49.735591888427734, -47.751739501953125, -45.76789093017578, -43.78404235839844, -41.800193786621094, -39.81634521484375, -37.83249282836914, -35.8486442565918, -33.86479568481445, -31.880945205688477, -29.8970947265625, -27.913246154785156, -25.929397583007812, -23.945547103881836, -21.96169662475586, -19.977848052978516, -17.993999481201172, -16.010149002075195, -14.026299476623535, -12.04245376586914, -10.05860424041748, -8.07475471496582, -6.09090518951416, -4.1070556640625, -2.12320613861084, -0.1393566131591797, 1.8444929122924805, 3.8283424377441406, 5.812191963195801, 7.796041488647461, 9.779891014099121, 11.763740539550781, 13.747590065002441, 15.731439590454102, 17.715290069580078, 19.699138641357422, 21.682987213134766, 23.666837692260742, 25.65068817138672, 27.634536743164062, 29.618385314941406, 31.602235794067383, 33.58608627319336, 35.5699348449707, 37.55378341674805, 39.537635803222656, 41.521484375, 43.505332946777344, 45.48918151855469, 47.47303009033203, 49.45688247680664, 51.440731048583984]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 11.0, 8.0, 5.0, 20.0, 16.0, 23.0, 24.0, 32.0, 31.0, 36.0, 33.0, 43.0, 37.0, 57.0, 37.0, 51.0, 45.0, 53.0, 42.0, 45.0, 49.0, 52.0, 35.0, 36.0, 34.0, 23.0, 21.0, 26.0, 16.0, 12.0, 6.0, 9.0, 4.0, 6.0, 5.0, 1.0, 7.0, 6.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.123046875, -9.79296875, -9.462890625, -9.1328125, -8.802734375, -8.47265625, -8.142578125, -7.8125, -7.482421875, -7.15234375, -6.822265625, -6.4921875, -6.162109375, -5.83203125, -5.501953125, -5.171875, -4.841796875, -4.51171875, -4.181640625, -3.8515625, -3.521484375, -3.19140625, -2.861328125, -2.53125, -2.201171875, -1.87109375, -1.541015625, -1.2109375, -0.880859375, -0.55078125, -0.220703125, 0.109375, 0.439453125, 0.76953125, 1.099609375, 1.4296875, 1.759765625, 2.08984375, 2.419921875, 2.75, 3.080078125, 3.41015625, 3.740234375, 4.0703125, 4.400390625, 4.73046875, 5.060546875, 5.390625, 5.720703125, 6.05078125, 6.380859375, 6.7109375, 7.041015625, 7.37109375, 7.701171875, 8.03125, 8.361328125, 8.69140625, 9.021484375, 9.3515625, 9.681640625, 10.01171875, 10.341796875, 10.671875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 9.0, 11.0, 21.0, 24.0, 44.0, 37.0, 61.0, 80.0, 120.0, 156.0, 232.0, 312.0, 448.0, 706.0, 1128.0, 2088.0, 4443.0, 12571.0, 58281.0, 683583.0, 2895690.0, 469426.0, 44839.0, 10807.0, 4098.0, 1896.0, 1017.0, 652.0, 434.0, 278.0, 202.0, 169.0, 115.0, 68.0, 68.0, 36.0, 29.0, 27.0, 20.0, 12.0, 12.0, 8.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.53125, -23.750732421875, -22.97021484375, -22.189697265625, -21.4091796875, -20.628662109375, -19.84814453125, -19.067626953125, -18.287109375, -17.506591796875, -16.72607421875, -15.945556640625, -15.1650390625, -14.384521484375, -13.60400390625, -12.823486328125, -12.04296875, -11.262451171875, -10.48193359375, -9.701416015625, -8.9208984375, -8.140380859375, -7.35986328125, -6.579345703125, -5.798828125, -5.018310546875, -4.23779296875, -3.457275390625, -2.6767578125, -1.896240234375, -1.11572265625, -0.335205078125, 0.4453125, 1.225830078125, 2.00634765625, 2.786865234375, 3.5673828125, 4.347900390625, 5.12841796875, 5.908935546875, 6.689453125, 7.469970703125, 8.25048828125, 9.031005859375, 9.8115234375, 10.592041015625, 11.37255859375, 12.153076171875, 12.93359375, 13.714111328125, 14.49462890625, 15.275146484375, 16.0556640625, 16.836181640625, 17.61669921875, 18.397216796875, 19.177734375, 19.958251953125, 20.73876953125, 21.519287109375, 22.2998046875, 23.080322265625, 23.86083984375, 24.641357421875, 25.421875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 11.0, 13.0, 14.0, 28.0, 55.0, 92.0, 143.0, 283.0, 436.0, 759.0, 873.0, 582.0, 303.0, 175.0, 119.0, 72.0, 36.0, 28.0, 18.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.265625, -26.444091796875, -25.62255859375, -24.801025390625, -23.9794921875, -23.157958984375, -22.33642578125, -21.514892578125, -20.693359375, -19.871826171875, -19.05029296875, -18.228759765625, -17.4072265625, -16.585693359375, -15.76416015625, -14.942626953125, -14.12109375, -13.299560546875, -12.47802734375, -11.656494140625, -10.8349609375, -10.013427734375, -9.19189453125, -8.370361328125, -7.548828125, -6.727294921875, -5.90576171875, -5.084228515625, -4.2626953125, -3.441162109375, -2.61962890625, -1.798095703125, -0.9765625, -0.155029296875, 0.66650390625, 1.488037109375, 2.3095703125, 3.131103515625, 3.95263671875, 4.774169921875, 5.595703125, 6.417236328125, 7.23876953125, 8.060302734375, 8.8818359375, 9.703369140625, 10.52490234375, 11.346435546875, 12.16796875, 12.989501953125, 13.81103515625, 14.632568359375, 15.4541015625, 16.275634765625, 17.09716796875, 17.918701171875, 18.740234375, 19.561767578125, 20.38330078125, 21.204833984375, 22.0263671875, 22.847900390625, 23.66943359375, 24.490966796875, 25.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 10.0, 14.0, 14.0, 26.0, 64.0, 97.0, 238.0, 569.0, 1649.0, 6284.0, 40885.0, 1572106.0, 2510729.0, 51486.0, 7180.0, 1867.0, 573.0, 245.0, 98.0, 58.0, 33.0, 21.0, 15.0, 7.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.78125, -43.3388671875, -41.896484375, -40.4541015625, -39.01171875, -37.5693359375, -36.126953125, -34.6845703125, -33.2421875, -31.7998046875, -30.357421875, -28.9150390625, -27.47265625, -26.0302734375, -24.587890625, -23.1455078125, -21.703125, -20.2607421875, -18.818359375, -17.3759765625, -15.93359375, -14.4912109375, -13.048828125, -11.6064453125, -10.1640625, -8.7216796875, -7.279296875, -5.8369140625, -4.39453125, -2.9521484375, -1.509765625, -0.0673828125, 1.375, 2.8173828125, 4.259765625, 5.7021484375, 7.14453125, 8.5869140625, 10.029296875, 11.4716796875, 12.9140625, 14.3564453125, 15.798828125, 17.2412109375, 18.68359375, 20.1259765625, 21.568359375, 23.0107421875, 24.453125, 25.8955078125, 27.337890625, 28.7802734375, 30.22265625, 31.6650390625, 33.107421875, 34.5498046875, 35.9921875, 37.4345703125, 38.876953125, 40.3193359375, 41.76171875, 43.2041015625, 44.646484375, 46.0888671875, 47.53125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 45.0, 273.0, 568.0, 113.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-578.3043212890625, -564.6124877929688, -550.920654296875, -537.2288818359375, -523.5370483398438, -509.84521484375, -496.1534118652344, -482.4615783691406, -468.769775390625, -455.07794189453125, -441.3861389160156, -427.6943054199219, -414.00250244140625, -400.3106689453125, -386.6188659667969, -372.9270324707031, -359.2352294921875, -345.54339599609375, -331.8515930175781, -318.1597595214844, -304.46795654296875, -290.776123046875, -277.0843200683594, -263.3924865722656, -249.70065307617188, -236.0088348388672, -222.3170166015625, -208.6251983642578, -194.93338012695312, -181.24154663085938, -167.54974365234375, -153.85791015625, -140.16610717773438, -126.47428894042969, -112.782470703125, -99.09065246582031, -85.39883422851562, -71.7070083618164, -58.01519012451172, -44.32337188720703, -30.631553649902344, -16.939735412597656, -3.247915267944336, 10.443904876708984, 24.135723114013672, 37.827545166015625, 51.51936340332031, 65.211181640625, 78.90299987792969, 92.59481811523438, 106.28663635253906, 119.97845458984375, 133.67027282714844, 147.36209106445312, 161.05392456054688, 174.7457275390625, 188.43756103515625, 202.12937927246094, 215.82119750976562, 229.5130157470703, 243.204833984375, 256.89666748046875, 270.5884704589844, 284.2803039550781, 297.97210693359375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 5.0, 4.0, 5.0, 16.0, 6.0, 4.0, 7.0, 7.0, 18.0, 22.0, 17.0, 20.0, 27.0, 26.0, 30.0, 28.0, 37.0, 32.0, 36.0, 36.0, 44.0, 38.0, 40.0, 47.0, 35.0, 45.0, 35.0, 41.0, 39.0, 35.0, 26.0, 28.0, 24.0, 17.0, 28.0, 21.0, 10.0, 8.0, 12.0, 11.0, 13.0, 3.0, 7.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.41654968261719, -56.6412467956543, -54.865943908691406, -53.090641021728516, -51.315338134765625, -49.540035247802734, -47.764732360839844, -45.98942947387695, -44.21412658691406, -42.43882369995117, -40.66352081298828, -38.88821792602539, -37.1129150390625, -35.33761215209961, -33.56230926513672, -31.787006378173828, -30.01170539855957, -28.23640251159668, -26.46109962463379, -24.6857967376709, -22.910493850708008, -21.13519287109375, -19.35988998413086, -17.58458709716797, -15.809283256530762, -14.033980369567871, -12.25867748260498, -10.483375549316406, -8.708072662353516, -6.932769775390625, -5.157466888427734, -3.3821640014648438, -1.6068611145019531, 0.16844165325164795, 1.943744421005249, 3.7190470695495605, 5.494349956512451, 7.269652366638184, 9.044955253601074, 10.820258140563965, 12.595561027526855, 14.370863914489746, 16.14616584777832, 17.92146873474121, 19.6967716217041, 21.472074508666992, 23.247377395629883, 25.022680282592773, 26.797983169555664, 28.573286056518555, 30.348588943481445, 32.1238899230957, 33.899192810058594, 35.674495697021484, 37.449798583984375, 39.225101470947266, 41.000404357910156, 42.77570724487305, 44.55101013183594, 46.32631301879883, 48.10161590576172, 49.87691879272461, 51.6522216796875, 53.42752456665039, 55.20282745361328]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 4.0, 7.0, 6.0, 12.0, 7.0, 11.0, 16.0, 20.0, 19.0, 21.0, 27.0, 30.0, 28.0, 29.0, 45.0, 46.0, 46.0, 49.0, 46.0, 54.0, 44.0, 43.0, 50.0, 37.0, 44.0, 28.0, 30.0, 31.0, 21.0, 27.0, 17.0, 23.0, 7.0, 11.0, 13.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.171875, -7.920654296875, -7.66943359375, -7.418212890625, -7.1669921875, -6.915771484375, -6.66455078125, -6.413330078125, -6.162109375, -5.910888671875, -5.65966796875, -5.408447265625, -5.1572265625, -4.906005859375, -4.65478515625, -4.403564453125, -4.15234375, -3.901123046875, -3.64990234375, -3.398681640625, -3.1474609375, -2.896240234375, -2.64501953125, -2.393798828125, -2.142578125, -1.891357421875, -1.64013671875, -1.388916015625, -1.1376953125, -0.886474609375, -0.63525390625, -0.384033203125, -0.1328125, 0.118408203125, 0.36962890625, 0.620849609375, 0.8720703125, 1.123291015625, 1.37451171875, 1.625732421875, 1.876953125, 2.128173828125, 2.37939453125, 2.630615234375, 2.8818359375, 3.133056640625, 3.38427734375, 3.635498046875, 3.88671875, 4.137939453125, 4.38916015625, 4.640380859375, 4.8916015625, 5.142822265625, 5.39404296875, 5.645263671875, 5.896484375, 6.147705078125, 6.39892578125, 6.650146484375, 6.9013671875, 7.152587890625, 7.40380859375, 7.655029296875, 7.90625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 6.0, 13.0, 12.0, 28.0, 41.0, 69.0, 88.0, 146.0, 198.0, 296.0, 462.0, 742.0, 1013.0, 1592.0, 2669.0, 4197.0, 7136.0, 11908.0, 20953.0, 38439.0, 73188.0, 138966.0, 229342.0, 225374.0, 134607.0, 70364.0, 37061.0, 20075.0, 11454.0, 6857.0, 4113.0, 2549.0, 1591.0, 1000.0, 670.0, 461.0, 288.0, 198.0, 140.0, 86.0, 61.0, 28.0, 33.0, 13.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86572265625, -0.8377685546875, -0.809814453125, -0.7818603515625, -0.75390625, -0.7259521484375, -0.697998046875, -0.6700439453125, -0.64208984375, -0.6141357421875, -0.586181640625, -0.5582275390625, -0.5302734375, -0.5023193359375, -0.474365234375, -0.4464111328125, -0.41845703125, -0.3905029296875, -0.362548828125, -0.3345947265625, -0.306640625, -0.2786865234375, -0.250732421875, -0.2227783203125, -0.19482421875, -0.1668701171875, -0.138916015625, -0.1109619140625, -0.0830078125, -0.0550537109375, -0.027099609375, 0.0008544921875, 0.02880859375, 0.0567626953125, 0.084716796875, 0.1126708984375, 0.140625, 0.1685791015625, 0.196533203125, 0.2244873046875, 0.25244140625, 0.2803955078125, 0.308349609375, 0.3363037109375, 0.3642578125, 0.3922119140625, 0.420166015625, 0.4481201171875, 0.47607421875, 0.5040283203125, 0.531982421875, 0.5599365234375, 0.587890625, 0.6158447265625, 0.643798828125, 0.6717529296875, 0.69970703125, 0.7276611328125, 0.755615234375, 0.7835693359375, 0.8115234375, 0.8394775390625, 0.867431640625, 0.8953857421875, 0.92333984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 8.0, 5.0, 11.0, 9.0, 4.0, 11.0, 25.0, 23.0, 22.0, 28.0, 28.0, 32.0, 29.0, 26.0, 42.0, 33.0, 43.0, 55.0, 52.0, 1057.0, 34.0, 45.0, 45.0, 29.0, 51.0, 38.0, 27.0, 28.0, 28.0, 21.0, 31.0, 21.0, 14.0, 17.0, 11.0, 12.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.19921875, -6.0185546875, -5.837890625, -5.6572265625, -5.4765625, -5.2958984375, -5.115234375, -4.9345703125, -4.75390625, -4.5732421875, -4.392578125, -4.2119140625, -4.03125, -3.8505859375, -3.669921875, -3.4892578125, -3.30859375, -3.1279296875, -2.947265625, -2.7666015625, -2.5859375, -2.4052734375, -2.224609375, -2.0439453125, -1.86328125, -1.6826171875, -1.501953125, -1.3212890625, -1.140625, -0.9599609375, -0.779296875, -0.5986328125, -0.41796875, -0.2373046875, -0.056640625, 0.1240234375, 0.3046875, 0.4853515625, 0.666015625, 0.8466796875, 1.02734375, 1.2080078125, 1.388671875, 1.5693359375, 1.75, 1.9306640625, 2.111328125, 2.2919921875, 2.47265625, 2.6533203125, 2.833984375, 3.0146484375, 3.1953125, 3.3759765625, 3.556640625, 3.7373046875, 3.91796875, 4.0986328125, 4.279296875, 4.4599609375, 4.640625, 4.8212890625, 5.001953125, 5.1826171875, 5.36328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 5.0, 16.0, 27.0, 40.0, 59.0, 95.0, 160.0, 242.0, 383.0, 641.0, 1029.0, 1740.0, 2923.0, 5432.0, 10637.0, 23822.0, 98546.0, 1849796.0, 61363.0, 19628.0, 9164.0, 4652.0, 2714.0, 1493.0, 937.0, 549.0, 343.0, 252.0, 146.0, 109.0, 51.0, 40.0, 30.0, 17.0, 13.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9990234375, -1.9353485107421875, -1.871673583984375, -1.8079986572265625, -1.74432373046875, -1.6806488037109375, -1.616973876953125, -1.5532989501953125, -1.4896240234375, -1.4259490966796875, -1.362274169921875, -1.2985992431640625, -1.23492431640625, -1.1712493896484375, -1.107574462890625, -1.0438995361328125, -0.980224609375, -0.9165496826171875, -0.852874755859375, -0.7891998291015625, -0.72552490234375, -0.6618499755859375, -0.598175048828125, -0.5345001220703125, -0.4708251953125, -0.4071502685546875, -0.343475341796875, -0.2798004150390625, -0.21612548828125, -0.1524505615234375, -0.088775634765625, -0.0251007080078125, 0.03857421875, 0.1022491455078125, 0.165924072265625, 0.2295989990234375, 0.29327392578125, 0.3569488525390625, 0.420623779296875, 0.4842987060546875, 0.5479736328125, 0.6116485595703125, 0.675323486328125, 0.7389984130859375, 0.80267333984375, 0.8663482666015625, 0.930023193359375, 0.9936981201171875, 1.057373046875, 1.1210479736328125, 1.184722900390625, 1.2483978271484375, 1.31207275390625, 1.3757476806640625, 1.439422607421875, 1.5030975341796875, 1.5667724609375, 1.6304473876953125, 1.694122314453125, 1.7577972412109375, 1.82147216796875, 1.8851470947265625, 1.948822021484375, 2.0124969482421875, 2.076171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 7.0, 5.0, 11.0, 7.0, 16.0, 12.0, 19.0, 20.0, 15.0, 26.0, 32.0, 36.0, 31.0, 43.0, 45.0, 54.0, 49.0, 54.0, 43.0, 42.0, 49.0, 45.0, 42.0, 44.0, 35.0, 35.0, 23.0, 30.0, 22.0, 23.0, 18.0, 8.0, 12.0, 6.0, 5.0, 12.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043243408203125, -0.04189109802246094, -0.040538787841796875, -0.03918647766113281, -0.03783416748046875, -0.03648185729980469, -0.035129547119140625, -0.03377723693847656, -0.0324249267578125, -0.031072616577148438, -0.029720306396484375, -0.028367996215820312, -0.02701568603515625, -0.025663375854492188, -0.024311065673828125, -0.022958755493164062, -0.0216064453125, -0.020254135131835938, -0.018901824951171875, -0.017549514770507812, -0.01619720458984375, -0.014844894409179688, -0.013492584228515625, -0.012140274047851562, -0.0107879638671875, -0.009435653686523438, -0.008083343505859375, -0.0067310333251953125, -0.00537872314453125, -0.0040264129638671875, -0.002674102783203125, -0.0013217926025390625, 3.0517578125e-05, 0.0013828277587890625, 0.002735137939453125, 0.0040874481201171875, 0.00543975830078125, 0.0067920684814453125, 0.008144378662109375, 0.009496688842773438, 0.0108489990234375, 0.012201309204101562, 0.013553619384765625, 0.014905929565429688, 0.01625823974609375, 0.017610549926757812, 0.018962860107421875, 0.020315170288085938, 0.02166748046875, 0.023019790649414062, 0.024372100830078125, 0.025724411010742188, 0.02707672119140625, 0.028429031372070312, 0.029781341552734375, 0.031133651733398438, 0.0324859619140625, 0.03383827209472656, 0.035190582275390625, 0.03654289245605469, 0.03789520263671875, 0.03924751281738281, 0.040599822998046875, 0.04195213317871094, 0.043304443359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 5.0, 11.0, 8.0, 13.0, 15.0, 20.0, 34.0, 38.0, 48.0, 58.0, 68.0, 103.0, 115.0, 178.0, 212.0, 313.0, 566.0, 1296.0, 21327.0, 924743.0, 95086.0, 2242.0, 702.0, 349.0, 252.0, 165.0, 137.0, 99.0, 71.0, 46.0, 42.0, 41.0, 30.0, 31.0, 19.0, 11.0, 13.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.734375, -0.7111740112304688, -0.6879730224609375, -0.6647720336914062, -0.641571044921875, -0.6183700561523438, -0.5951690673828125, -0.5719680786132812, -0.54876708984375, -0.5255661010742188, -0.5023651123046875, -0.47916412353515625, -0.455963134765625, -0.43276214599609375, -0.4095611572265625, -0.38636016845703125, -0.3631591796875, -0.33995819091796875, -0.3167572021484375, -0.29355621337890625, -0.270355224609375, -0.24715423583984375, -0.2239532470703125, -0.20075225830078125, -0.17755126953125, -0.15435028076171875, -0.1311492919921875, -0.10794830322265625, -0.084747314453125, -0.06154632568359375, -0.0383453369140625, -0.01514434814453125, 0.008056640625, 0.03125762939453125, 0.0544586181640625, 0.07765960693359375, 0.100860595703125, 0.12406158447265625, 0.1472625732421875, 0.17046356201171875, 0.19366455078125, 0.21686553955078125, 0.2400665283203125, 0.26326751708984375, 0.286468505859375, 0.30966949462890625, 0.3328704833984375, 0.35607147216796875, 0.3792724609375, 0.40247344970703125, 0.4256744384765625, 0.44887542724609375, 0.472076416015625, 0.49527740478515625, 0.5184783935546875, 0.5416793823242188, 0.56488037109375, 0.5880813598632812, 0.6112823486328125, 0.6344833374023438, 0.657684326171875, 0.6808853149414062, 0.7040863037109375, 0.7272872924804688, 0.75048828125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 27.0, 48.0, 160.0, 359.0, 274.0, 104.0, 25.0, 6.0, 5.0, 2.0], "bins": [-0.3857949674129486, -0.3791176676750183, -0.3724403381347656, -0.3657630383968353, -0.35908570885658264, -0.35240840911865234, -0.34573107957839966, -0.33905377984046936, -0.3323764503002167, -0.3256991505622864, -0.3190218210220337, -0.3123445212841034, -0.3056671917438507, -0.2989898920059204, -0.2923125624656677, -0.2856352627277374, -0.27895796298980713, -0.27228066325187683, -0.26560333371162415, -0.25892603397369385, -0.25224870443344116, -0.24557140469551086, -0.23889407515525818, -0.23221677541732788, -0.2255394458770752, -0.2188621312379837, -0.2121848165988922, -0.20550750195980072, -0.19883018732070923, -0.19215288758277893, -0.18547555804252625, -0.17879825830459595, -0.17212095856666565, -0.16544364392757416, -0.15876632928848267, -0.15208901464939117, -0.14541170001029968, -0.13873440027236938, -0.1320570707321167, -0.1253797709941864, -0.11870244890451431, -0.11202513426542282, -0.10534781962633133, -0.09867051243782043, -0.09199319779872894, -0.08531588315963745, -0.07863856852054596, -0.07196125388145447, -0.06528393924236298, -0.058606624603271484, -0.05192931368947029, -0.0452519990503788, -0.038574688136577606, -0.031897373497486115, -0.025220058858394623, -0.01854274794459343, -0.011865437030792236, -0.0051881237886846066, 0.0014891894534230232, 0.00816650316119194, 0.014843815937638283, 0.021521128714084625, 0.028198443353176117, 0.03487575426697731, 0.0415530689060688]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 8.0, 8.0, 5.0, 17.0, 18.0, 19.0, 19.0, 20.0, 25.0, 35.0, 24.0, 28.0, 33.0, 42.0, 47.0, 34.0, 36.0, 34.0, 44.0, 44.0, 42.0, 53.0, 50.0, 31.0, 35.0, 33.0, 31.0, 39.0, 23.0, 22.0, 14.0, 18.0, 18.0, 9.0, 10.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05068361759185791, -0.049212515354156494, -0.04774141311645508, -0.04627031087875366, -0.044799208641052246, -0.04332810640335083, -0.041857004165649414, -0.040385901927948, -0.03891479969024658, -0.037443697452545166, -0.03597259521484375, -0.034501492977142334, -0.03303039073944092, -0.0315592885017395, -0.030088186264038086, -0.02861708402633667, -0.027145981788635254, -0.025674879550933838, -0.024203777313232422, -0.022732675075531006, -0.02126157283782959, -0.019790470600128174, -0.018319368362426758, -0.016848266124725342, -0.015377163887023926, -0.01390606164932251, -0.012434959411621094, -0.010963857173919678, -0.009492754936218262, -0.008021652698516846, -0.00655055046081543, -0.005079448223114014, -0.0036083459854125977, -0.0021372437477111816, -0.0006661415100097656, 0.0008049607276916504, 0.0022760629653930664, 0.0037471652030944824, 0.0052182674407958984, 0.0066893696784973145, 0.00816047191619873, 0.009631574153900146, 0.011102676391601562, 0.012573778629302979, 0.014044880867004395, 0.01551598310470581, 0.016987085342407227, 0.018458187580108643, 0.01992928981781006, 0.021400392055511475, 0.02287149429321289, 0.024342596530914307, 0.025813698768615723, 0.02728480100631714, 0.028755903244018555, 0.03022700548171997, 0.03169810771942139, 0.0331692099571228, 0.03464031219482422, 0.036111414432525635, 0.03758251667022705, 0.03905361890792847, 0.04052472114562988, 0.0419958233833313, 0.043466925621032715]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 4.0, 7.0, 6.0, 13.0, 6.0, 11.0, 16.0, 20.0, 19.0, 21.0, 28.0, 29.0, 28.0, 30.0, 44.0, 46.0, 47.0, 48.0, 47.0, 53.0, 44.0, 43.0, 50.0, 38.0, 43.0, 29.0, 30.0, 30.0, 22.0, 27.0, 16.0, 23.0, 9.0, 9.0, 13.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.171875, -7.92059326171875, -7.6693115234375, -7.41802978515625, -7.166748046875, -6.91546630859375, -6.6641845703125, -6.41290283203125, -6.16162109375, -5.91033935546875, -5.6590576171875, -5.40777587890625, -5.156494140625, -4.90521240234375, -4.6539306640625, -4.40264892578125, -4.1513671875, -3.90008544921875, -3.6488037109375, -3.39752197265625, -3.146240234375, -2.89495849609375, -2.6436767578125, -2.39239501953125, -2.14111328125, -1.88983154296875, -1.6385498046875, -1.38726806640625, -1.135986328125, -0.88470458984375, -0.6334228515625, -0.38214111328125, -0.130859375, 0.12042236328125, 0.3717041015625, 0.62298583984375, 0.874267578125, 1.12554931640625, 1.3768310546875, 1.62811279296875, 1.87939453125, 2.13067626953125, 2.3819580078125, 2.63323974609375, 2.884521484375, 3.13580322265625, 3.3870849609375, 3.63836669921875, 3.8896484375, 4.14093017578125, 4.3922119140625, 4.64349365234375, 4.894775390625, 5.14605712890625, 5.3973388671875, 5.64862060546875, 5.89990234375, 6.15118408203125, 6.4024658203125, 6.65374755859375, 6.905029296875, 7.15631103515625, 7.4075927734375, 7.65887451171875, 7.91015625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 8.0, 9.0, 9.0, 9.0, 8.0, 22.0, 17.0, 26.0, 40.0, 48.0, 95.0, 90.0, 118.0, 175.0, 283.0, 397.0, 662.0, 1192.0, 2143.0, 4937.0, 14405.0, 60202.0, 396798.0, 468213.0, 71009.0, 16342.0, 5568.0, 2451.0, 1177.0, 664.0, 438.0, 301.0, 163.0, 128.0, 100.0, 63.0, 67.0, 32.0, 29.0, 33.0, 19.0, 21.0, 6.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.06640625, -10.671875, -10.27734375, -9.8828125, -9.48828125, -9.09375, -8.69921875, -8.3046875, -7.91015625, -7.515625, -7.12109375, -6.7265625, -6.33203125, -5.9375, -5.54296875, -5.1484375, -4.75390625, -4.359375, -3.96484375, -3.5703125, -3.17578125, -2.78125, -2.38671875, -1.9921875, -1.59765625, -1.203125, -0.80859375, -0.4140625, -0.01953125, 0.375, 0.76953125, 1.1640625, 1.55859375, 1.953125, 2.34765625, 2.7421875, 3.13671875, 3.53125, 3.92578125, 4.3203125, 4.71484375, 5.109375, 5.50390625, 5.8984375, 6.29296875, 6.6875, 7.08203125, 7.4765625, 7.87109375, 8.265625, 8.66015625, 9.0546875, 9.44921875, 9.84375, 10.23828125, 10.6328125, 11.02734375, 11.421875, 11.81640625, 12.2109375, 12.60546875, 13.0, 13.39453125, 13.7890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 6.0, 8.0, 10.0, 14.0, 24.0, 27.0, 24.0, 34.0, 48.0, 38.0, 50.0, 69.0, 69.0, 144.0, 302.0, 1522.0, 200.0, 83.0, 64.0, 53.0, 37.0, 42.0, 27.0, 33.0, 19.0, 12.0, 12.0, 15.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -19.99658203125, -19.2900390625, -18.58349609375, -17.876953125, -17.17041015625, -16.4638671875, -15.75732421875, -15.05078125, -14.34423828125, -13.6376953125, -12.93115234375, -12.224609375, -11.51806640625, -10.8115234375, -10.10498046875, -9.3984375, -8.69189453125, -7.9853515625, -7.27880859375, -6.572265625, -5.86572265625, -5.1591796875, -4.45263671875, -3.74609375, -3.03955078125, -2.3330078125, -1.62646484375, -0.919921875, -0.21337890625, 0.4931640625, 1.19970703125, 1.90625, 2.61279296875, 3.3193359375, 4.02587890625, 4.732421875, 5.43896484375, 6.1455078125, 6.85205078125, 7.55859375, 8.26513671875, 8.9716796875, 9.67822265625, 10.384765625, 11.09130859375, 11.7978515625, 12.50439453125, 13.2109375, 13.91748046875, 14.6240234375, 15.33056640625, 16.037109375, 16.74365234375, 17.4501953125, 18.15673828125, 18.86328125, 19.56982421875, 20.2763671875, 20.98291015625, 21.689453125, 22.39599609375, 23.1025390625, 23.80908203125, 24.515625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 8.0, 5.0, 4.0, 7.0, 8.0, 8.0, 15.0, 12.0, 25.0, 32.0, 34.0, 41.0, 61.0, 73.0, 103.0, 149.0, 236.0, 455.0, 934.0, 5261.0, 2757603.0, 375662.0, 2830.0, 810.0, 423.0, 268.0, 160.0, 96.0, 90.0, 63.0, 57.0, 25.0, 28.0, 24.0, 12.0, 25.0, 14.0, 8.0, 9.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-44.0, -42.73828125, -41.4765625, -40.21484375, -38.953125, -37.69140625, -36.4296875, -35.16796875, -33.90625, -32.64453125, -31.3828125, -30.12109375, -28.859375, -27.59765625, -26.3359375, -25.07421875, -23.8125, -22.55078125, -21.2890625, -20.02734375, -18.765625, -17.50390625, -16.2421875, -14.98046875, -13.71875, -12.45703125, -11.1953125, -9.93359375, -8.671875, -7.41015625, -6.1484375, -4.88671875, -3.625, -2.36328125, -1.1015625, 0.16015625, 1.421875, 2.68359375, 3.9453125, 5.20703125, 6.46875, 7.73046875, 8.9921875, 10.25390625, 11.515625, 12.77734375, 14.0390625, 15.30078125, 16.5625, 17.82421875, 19.0859375, 20.34765625, 21.609375, 22.87109375, 24.1328125, 25.39453125, 26.65625, 27.91796875, 29.1796875, 30.44140625, 31.703125, 32.96484375, 34.2265625, 35.48828125, 36.75]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 14.0, 123.0, 467.0, 322.0, 73.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.11021041870117, -39.975101470947266, -34.839996337890625, -29.70488739013672, -24.569778442382812, -19.434669494628906, -14.299562454223633, -9.16445541381836, -4.029346466064453, 1.1057615280151367, 6.240869522094727, 11.375977516174316, 16.511085510253906, 21.646194458007812, 26.781301498413086, 31.91640853881836, 37.051517486572266, 42.18662643432617, 47.32173156738281, 52.45684051513672, 57.591949462890625, 62.72705841064453, 67.86216735839844, 72.99726867675781, 78.13238525390625, 83.26749420166016, 88.40260314941406, 93.53771209716797, 98.67282104492188, 103.80792236328125, 108.94303131103516, 114.07814025878906, 119.2132568359375, 124.3483657836914, 129.4834747314453, 134.6185760498047, 139.75369262695312, 144.8887939453125, 150.02391052246094, 155.1590118408203, 160.29412841796875, 165.42922973632812, 170.56434631347656, 175.69944763183594, 180.83456420898438, 185.96966552734375, 191.1047821044922, 196.23988342285156, 201.37498474121094, 206.5100860595703, 211.64520263671875, 216.78030395507812, 221.91542053222656, 227.05052185058594, 232.18563842773438, 237.32073974609375, 242.45584106445312, 247.5909423828125, 252.72605895996094, 257.8611755371094, 262.99627685546875, 268.1313781738281, 273.2664794921875, 278.401611328125, 283.5367126464844]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 7.0, 9.0, 9.0, 3.0, 9.0, 16.0, 12.0, 15.0, 16.0, 10.0, 26.0, 23.0, 23.0, 27.0, 29.0, 42.0, 25.0, 36.0, 38.0, 41.0, 49.0, 29.0, 44.0, 40.0, 32.0, 30.0, 36.0, 24.0, 40.0, 37.0, 31.0, 25.0, 37.0, 15.0, 22.0, 12.0, 14.0, 12.0, 10.0, 8.0, 14.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-38.69164276123047, -37.42092514038086, -36.150203704833984, -34.879486083984375, -33.608768463134766, -32.338050842285156, -31.06732940673828, -29.796611785888672, -28.52589225769043, -27.255172729492188, -25.984455108642578, -24.713735580444336, -23.443016052246094, -22.172298431396484, -20.901578903198242, -19.630859375, -18.36014175415039, -17.08942222595215, -15.818704605102539, -14.547985076904297, -13.277266502380371, -12.006547927856445, -10.735828399658203, -9.465109825134277, -8.194391250610352, -6.923672676086426, -5.652953624725342, -4.382234573364258, -3.111515998840332, -1.8407974243164062, -0.5700783729553223, 0.7006406784057617, 1.9713554382324219, 3.2420742511749268, 4.512793064117432, 5.783512115478516, 7.054230690002441, 8.324949264526367, 9.59566879272461, 10.866387367248535, 12.137105941772461, 13.407824516296387, 14.678543090820312, 15.949262619018555, 17.219982147216797, 18.490699768066406, 19.76141929626465, 21.03213882446289, 22.3028564453125, 23.573575973510742, 24.84429359436035, 26.115013122558594, 27.385730743408203, 28.656450271606445, 29.927169799804688, 31.197887420654297, 32.468605041503906, 33.739322662353516, 35.01004409790039, 36.28076171875, 37.55147933959961, 38.82219696044922, 40.092918395996094, 41.3636360168457, 42.63435745239258]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 4.0, 3.0, 4.0, 16.0, 9.0, 14.0, 14.0, 16.0, 21.0, 24.0, 29.0, 31.0, 47.0, 63.0, 41.0, 45.0, 55.0, 53.0, 55.0, 57.0, 53.0, 37.0, 47.0, 43.0, 37.0, 19.0, 23.0, 19.0, 28.0, 12.0, 15.0, 14.0, 11.0, 11.0, 6.0, 4.0, 5.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.7890625, -10.4730224609375, -10.156982421875, -9.8409423828125, -9.52490234375, -9.2088623046875, -8.892822265625, -8.5767822265625, -8.2607421875, -7.9447021484375, -7.628662109375, -7.3126220703125, -6.99658203125, -6.6805419921875, -6.364501953125, -6.0484619140625, -5.732421875, -5.4163818359375, -5.100341796875, -4.7843017578125, -4.46826171875, -4.1522216796875, -3.836181640625, -3.5201416015625, -3.2041015625, -2.8880615234375, -2.572021484375, -2.2559814453125, -1.93994140625, -1.6239013671875, -1.307861328125, -0.9918212890625, -0.67578125, -0.3597412109375, -0.043701171875, 0.2723388671875, 0.58837890625, 0.9044189453125, 1.220458984375, 1.5364990234375, 1.8525390625, 2.1685791015625, 2.484619140625, 2.8006591796875, 3.11669921875, 3.4327392578125, 3.748779296875, 4.0648193359375, 4.380859375, 4.6968994140625, 5.012939453125, 5.3289794921875, 5.64501953125, 5.9610595703125, 6.277099609375, 6.5931396484375, 6.9091796875, 7.2252197265625, 7.541259765625, 7.8572998046875, 8.17333984375, 8.4893798828125, 8.805419921875, 9.1214599609375, 9.4375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 11.0, 11.0, 16.0, 30.0, 35.0, 66.0, 67.0, 102.0, 130.0, 216.0, 367.0, 731.0, 1493.0, 3499.0, 9384.0, 31084.0, 221263.0, 3420234.0, 445459.0, 41178.0, 11519.0, 4018.0, 1559.0, 655.0, 375.0, 218.0, 146.0, 107.0, 68.0, 65.0, 37.0, 29.0, 28.0, 21.0, 12.0, 9.0, 12.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-48.71875, -47.310546875, -45.90234375, -44.494140625, -43.0859375, -41.677734375, -40.26953125, -38.861328125, -37.453125, -36.044921875, -34.63671875, -33.228515625, -31.8203125, -30.412109375, -29.00390625, -27.595703125, -26.1875, -24.779296875, -23.37109375, -21.962890625, -20.5546875, -19.146484375, -17.73828125, -16.330078125, -14.921875, -13.513671875, -12.10546875, -10.697265625, -9.2890625, -7.880859375, -6.47265625, -5.064453125, -3.65625, -2.248046875, -0.83984375, 0.568359375, 1.9765625, 3.384765625, 4.79296875, 6.201171875, 7.609375, 9.017578125, 10.42578125, 11.833984375, 13.2421875, 14.650390625, 16.05859375, 17.466796875, 18.875, 20.283203125, 21.69140625, 23.099609375, 24.5078125, 25.916015625, 27.32421875, 28.732421875, 30.140625, 31.548828125, 32.95703125, 34.365234375, 35.7734375, 37.181640625, 38.58984375, 39.998046875, 41.40625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 8.0, 13.0, 13.0, 9.0, 19.0, 29.0, 31.0, 31.0, 39.0, 52.0, 52.0, 99.0, 154.0, 210.0, 319.0, 384.0, 545.0, 524.0, 421.0, 298.0, 210.0, 152.0, 95.0, 80.0, 63.0, 57.0, 36.0, 27.0, 23.0, 18.0, 18.0, 6.0, 7.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0, -17.3818359375, -16.763671875, -16.1455078125, -15.52734375, -14.9091796875, -14.291015625, -13.6728515625, -13.0546875, -12.4365234375, -11.818359375, -11.2001953125, -10.58203125, -9.9638671875, -9.345703125, -8.7275390625, -8.109375, -7.4912109375, -6.873046875, -6.2548828125, -5.63671875, -5.0185546875, -4.400390625, -3.7822265625, -3.1640625, -2.5458984375, -1.927734375, -1.3095703125, -0.69140625, -0.0732421875, 0.544921875, 1.1630859375, 1.78125, 2.3994140625, 3.017578125, 3.6357421875, 4.25390625, 4.8720703125, 5.490234375, 6.1083984375, 6.7265625, 7.3447265625, 7.962890625, 8.5810546875, 9.19921875, 9.8173828125, 10.435546875, 11.0537109375, 11.671875, 12.2900390625, 12.908203125, 13.5263671875, 14.14453125, 14.7626953125, 15.380859375, 15.9990234375, 16.6171875, 17.2353515625, 17.853515625, 18.4716796875, 19.08984375, 19.7080078125, 20.326171875, 20.9443359375, 21.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 8.0, 21.0, 20.0, 55.0, 49.0, 86.0, 123.0, 212.0, 308.0, 482.0, 802.0, 1297.0, 2164.0, 3546.0, 6488.0, 11394.0, 21575.0, 42751.0, 95951.0, 275505.0, 1236416.0, 1818216.0, 433415.0, 129560.0, 54416.0, 26743.0, 14115.0, 7621.0, 4388.0, 2483.0, 1549.0, 898.0, 597.0, 353.0, 245.0, 160.0, 84.0, 64.0, 49.0, 29.0, 12.0, 18.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.46875, -13.022216796875, -12.57568359375, -12.129150390625, -11.6826171875, -11.236083984375, -10.78955078125, -10.343017578125, -9.896484375, -9.449951171875, -9.00341796875, -8.556884765625, -8.1103515625, -7.663818359375, -7.21728515625, -6.770751953125, -6.32421875, -5.877685546875, -5.43115234375, -4.984619140625, -4.5380859375, -4.091552734375, -3.64501953125, -3.198486328125, -2.751953125, -2.305419921875, -1.85888671875, -1.412353515625, -0.9658203125, -0.519287109375, -0.07275390625, 0.373779296875, 0.8203125, 1.266845703125, 1.71337890625, 2.159912109375, 2.6064453125, 3.052978515625, 3.49951171875, 3.946044921875, 4.392578125, 4.839111328125, 5.28564453125, 5.732177734375, 6.1787109375, 6.625244140625, 7.07177734375, 7.518310546875, 7.96484375, 8.411376953125, 8.85791015625, 9.304443359375, 9.7509765625, 10.197509765625, 10.64404296875, 11.090576171875, 11.537109375, 11.983642578125, 12.43017578125, 12.876708984375, 13.3232421875, 13.769775390625, 14.21630859375, 14.662841796875, 15.109375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 4.0, 4.0, 1.0, 8.0, 6.0, 6.0, 12.0, 14.0, 22.0, 21.0, 30.0, 31.0, 48.0, 54.0, 65.0, 67.0, 65.0, 77.0, 67.0, 73.0, 65.0, 45.0, 41.0, 37.0, 20.0, 18.0, 18.0, 13.0, 10.0, 12.0, 8.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-126.52803802490234, -123.04978942871094, -119.57154846191406, -116.09329986572266, -112.61505126953125, -109.13680267333984, -105.65855407714844, -102.18031311035156, -98.70206451416016, -95.22381591796875, -91.74557495117188, -88.26732635498047, -84.78907775878906, -81.31082916259766, -77.83258056640625, -74.35433959960938, -70.87609100341797, -67.39784240722656, -63.91959762573242, -60.44135284423828, -56.963104248046875, -53.48485565185547, -50.00661087036133, -46.52836608886719, -43.05011749267578, -39.571868896484375, -36.093624114990234, -32.615379333496094, -29.137130737304688, -25.658884048461914, -22.18063735961914, -18.702390670776367, -15.224143981933594, -11.74589729309082, -8.267650604248047, -4.789403915405273, -1.3111572265625, 2.1670894622802734, 5.645336151123047, 9.12358283996582, 12.601829528808594, 16.080076217651367, 19.55832290649414, 23.036569595336914, 26.514816284179688, 29.99306297302246, 33.471309661865234, 36.949554443359375, 40.42780303955078, 43.90605163574219, 47.38429641723633, 50.86254119873047, 54.340789794921875, 57.81903839111328, 61.29728317260742, 64.77552795410156, 68.25377655029297, 71.73202514648438, 75.21026611328125, 78.68851470947266, 82.16676330566406, 85.64501190185547, 89.12326049804688, 92.60150146484375, 96.07975006103516]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 7.0, 10.0, 8.0, 10.0, 19.0, 19.0, 13.0, 27.0, 35.0, 36.0, 39.0, 32.0, 47.0, 56.0, 47.0, 53.0, 46.0, 42.0, 51.0, 50.0, 38.0, 39.0, 33.0, 31.0, 34.0, 35.0, 24.0, 21.0, 12.0, 17.0, 12.0, 10.0, 11.0, 9.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-104.31660461425781, -101.14911651611328, -97.98162841796875, -94.81414794921875, -91.64665985107422, -88.47917175292969, -85.31168365478516, -82.14419555664062, -78.97671508789062, -75.8092269897461, -72.64173889160156, -69.47425842285156, -66.30677032470703, -63.1392822265625, -59.97179412841797, -56.80430603027344, -53.636817932128906, -50.469329833984375, -47.30184555053711, -44.13435745239258, -40.96687316894531, -37.79938507080078, -34.63189697265625, -31.46441078186035, -28.296924591064453, -25.129438400268555, -21.961952209472656, -18.794464111328125, -15.626977920532227, -12.459491729736328, -9.292003631591797, -6.124517440795898, -2.95703125, 0.21045541763305664, 3.3779420852661133, 6.545429229736328, 9.712915420532227, 12.880401611328125, 16.047889709472656, 19.215375900268555, 22.382862091064453, 25.55034828186035, 28.71783447265625, 31.88532257080078, 35.05281066894531, 38.22029495239258, 41.38778305053711, 44.555267333984375, 47.722755432128906, 50.89024353027344, 54.0577278137207, 57.225215911865234, 60.3927001953125, 63.56018829345703, 66.72767639160156, 69.8951644897461, 73.06265258789062, 76.23014068603516, 79.39762878417969, 82.56510925292969, 85.73259735107422, 88.90008544921875, 92.06757354736328, 95.23506164550781, 98.40254211425781]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 5.0, 6.0, 11.0, 7.0, 10.0, 18.0, 13.0, 16.0, 29.0, 28.0, 27.0, 37.0, 47.0, 39.0, 56.0, 54.0, 47.0, 42.0, 71.0, 41.0, 49.0, 40.0, 35.0, 47.0, 29.0, 26.0, 23.0, 29.0, 27.0, 17.0, 15.0, 11.0, 5.0, 10.0, 10.0, 4.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-194.5, -188.62109375, -182.7421875, -176.86328125, -170.984375, -165.10546875, -159.2265625, -153.34765625, -147.46875, -141.58984375, -135.7109375, -129.83203125, -123.953125, -118.07421875, -112.1953125, -106.31640625, -100.4375, -94.55859375, -88.6796875, -82.80078125, -76.921875, -71.04296875, -65.1640625, -59.28515625, -53.40625, -47.52734375, -41.6484375, -35.76953125, -29.890625, -24.01171875, -18.1328125, -12.25390625, -6.375, -0.49609375, 5.3828125, 11.26171875, 17.140625, 23.01953125, 28.8984375, 34.77734375, 40.65625, 46.53515625, 52.4140625, 58.29296875, 64.171875, 70.05078125, 75.9296875, 81.80859375, 87.6875, 93.56640625, 99.4453125, 105.32421875, 111.203125, 117.08203125, 122.9609375, 128.83984375, 134.71875, 140.59765625, 146.4765625, 152.35546875, 158.234375, 164.11328125, 169.9921875, 175.87109375, 181.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 23.0, 14.0, 22.0, 38.0, 69.0, 96.0, 186.0, 247.0, 370.0, 611.0, 963.0, 1520.0, 2303.0, 3766.0, 6189.0, 10530.0, 18357.0, 33248.0, 63778.0, 129927.0, 248544.0, 251509.0, 132132.0, 64525.0, 33592.0, 18391.0, 10813.0, 6421.0, 3902.0, 2357.0, 1450.0, 960.0, 582.0, 345.0, 235.0, 195.0, 119.0, 61.0, 58.0, 23.0, 25.0, 23.0, 9.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.6563720703125, -10.312744140625, -9.9691162109375, -9.62548828125, -9.2818603515625, -8.938232421875, -8.5946044921875, -8.2509765625, -7.9073486328125, -7.563720703125, -7.2200927734375, -6.87646484375, -6.5328369140625, -6.189208984375, -5.8455810546875, -5.501953125, -5.1583251953125, -4.814697265625, -4.4710693359375, -4.12744140625, -3.7838134765625, -3.440185546875, -3.0965576171875, -2.7529296875, -2.4093017578125, -2.065673828125, -1.7220458984375, -1.37841796875, -1.0347900390625, -0.691162109375, -0.3475341796875, -0.00390625, 0.3397216796875, 0.683349609375, 1.0269775390625, 1.37060546875, 1.7142333984375, 2.057861328125, 2.4014892578125, 2.7451171875, 3.0887451171875, 3.432373046875, 3.7760009765625, 4.11962890625, 4.4632568359375, 4.806884765625, 5.1505126953125, 5.494140625, 5.8377685546875, 6.181396484375, 6.5250244140625, 6.86865234375, 7.2122802734375, 7.555908203125, 7.8995361328125, 8.2431640625, 8.5867919921875, 8.930419921875, 9.2740478515625, 9.61767578125, 9.9613037109375, 10.304931640625, 10.6485595703125, 10.9921875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 4.0, 7.0, 11.0, 15.0, 13.0, 15.0, 17.0, 21.0, 25.0, 23.0, 24.0, 23.0, 38.0, 34.0, 33.0, 39.0, 34.0, 35.0, 47.0, 1070.0, 40.0, 44.0, 34.0, 39.0, 44.0, 30.0, 27.0, 28.0, 43.0, 25.0, 19.0, 15.0, 15.0, 17.0, 16.0, 10.0, 6.0, 6.0, 4.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-95.375, -92.2177734375, -89.060546875, -85.9033203125, -82.74609375, -79.5888671875, -76.431640625, -73.2744140625, -70.1171875, -66.9599609375, -63.802734375, -60.6455078125, -57.48828125, -54.3310546875, -51.173828125, -48.0166015625, -44.859375, -41.7021484375, -38.544921875, -35.3876953125, -32.23046875, -29.0732421875, -25.916015625, -22.7587890625, -19.6015625, -16.4443359375, -13.287109375, -10.1298828125, -6.97265625, -3.8154296875, -0.658203125, 2.4990234375, 5.65625, 8.8134765625, 11.970703125, 15.1279296875, 18.28515625, 21.4423828125, 24.599609375, 27.7568359375, 30.9140625, 34.0712890625, 37.228515625, 40.3857421875, 43.54296875, 46.7001953125, 49.857421875, 53.0146484375, 56.171875, 59.3291015625, 62.486328125, 65.6435546875, 68.80078125, 71.9580078125, 75.115234375, 78.2724609375, 81.4296875, 84.5869140625, 87.744140625, 90.9013671875, 94.05859375, 97.2158203125, 100.373046875, 103.5302734375, 106.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 15.0, 11.0, 17.0, 29.0, 36.0, 69.0, 111.0, 153.0, 218.0, 331.0, 529.0, 736.0, 1133.0, 1847.0, 2918.0, 4907.0, 8674.0, 16835.0, 42444.0, 1364636.0, 574126.0, 39983.0, 16029.0, 8307.0, 4851.0, 2936.0, 1793.0, 1193.0, 727.0, 468.0, 315.0, 240.0, 158.0, 116.0, 81.0, 41.0, 39.0, 26.0, 17.0, 7.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.609375, -22.84716796875, -22.0849609375, -21.32275390625, -20.560546875, -19.79833984375, -19.0361328125, -18.27392578125, -17.51171875, -16.74951171875, -15.9873046875, -15.22509765625, -14.462890625, -13.70068359375, -12.9384765625, -12.17626953125, -11.4140625, -10.65185546875, -9.8896484375, -9.12744140625, -8.365234375, -7.60302734375, -6.8408203125, -6.07861328125, -5.31640625, -4.55419921875, -3.7919921875, -3.02978515625, -2.267578125, -1.50537109375, -0.7431640625, 0.01904296875, 0.78125, 1.54345703125, 2.3056640625, 3.06787109375, 3.830078125, 4.59228515625, 5.3544921875, 6.11669921875, 6.87890625, 7.64111328125, 8.4033203125, 9.16552734375, 9.927734375, 10.68994140625, 11.4521484375, 12.21435546875, 12.9765625, 13.73876953125, 14.5009765625, 15.26318359375, 16.025390625, 16.78759765625, 17.5498046875, 18.31201171875, 19.07421875, 19.83642578125, 20.5986328125, 21.36083984375, 22.123046875, 22.88525390625, 23.6474609375, 24.40966796875, 25.171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 7.0, 5.0, 5.0, 11.0, 6.0, 19.0, 18.0, 17.0, 25.0, 23.0, 26.0, 46.0, 38.0, 45.0, 49.0, 55.0, 65.0, 52.0, 64.0, 71.0, 60.0, 52.0, 40.0, 38.0, 39.0, 20.0, 18.0, 20.0, 11.0, 7.0, 9.0, 15.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.4892578125, -0.47376251220703125, -0.4582672119140625, -0.44277191162109375, -0.427276611328125, -0.41178131103515625, -0.3962860107421875, -0.38079071044921875, -0.36529541015625, -0.34980010986328125, -0.3343048095703125, -0.31880950927734375, -0.303314208984375, -0.28781890869140625, -0.2723236083984375, -0.25682830810546875, -0.2413330078125, -0.22583770751953125, -0.2103424072265625, -0.19484710693359375, -0.179351806640625, -0.16385650634765625, -0.1483612060546875, -0.13286590576171875, -0.11737060546875, -0.10187530517578125, -0.0863800048828125, -0.07088470458984375, -0.055389404296875, -0.03989410400390625, -0.0243988037109375, -0.00890350341796875, 0.006591796875, 0.02208709716796875, 0.0375823974609375, 0.05307769775390625, 0.068572998046875, 0.08406829833984375, 0.0995635986328125, 0.11505889892578125, 0.13055419921875, 0.14604949951171875, 0.1615447998046875, 0.17704010009765625, 0.192535400390625, 0.20803070068359375, 0.2235260009765625, 0.23902130126953125, 0.2545166015625, 0.27001190185546875, 0.2855072021484375, 0.30100250244140625, 0.316497802734375, 0.33199310302734375, 0.3474884033203125, 0.36298370361328125, 0.37847900390625, 0.39397430419921875, 0.4094696044921875, 0.42496490478515625, 0.440460205078125, 0.45595550537109375, 0.4714508056640625, 0.48694610595703125, 0.50244140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 7.0, 11.0, 16.0, 11.0, 20.0, 42.0, 49.0, 62.0, 115.0, 163.0, 266.0, 424.0, 696.0, 1079.0, 1718.0, 2979.0, 5076.0, 9470.0, 18530.0, 39372.0, 90993.0, 218426.0, 323080.0, 188271.0, 77680.0, 33984.0, 15997.0, 8488.0, 4621.0, 2618.0, 1599.0, 929.0, 610.0, 399.0, 258.0, 166.0, 119.0, 65.0, 47.0, 39.0, 13.0, 12.0, 15.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.017578125, -1.953338623046875, -1.88909912109375, -1.824859619140625, -1.7606201171875, -1.696380615234375, -1.63214111328125, -1.567901611328125, -1.503662109375, -1.439422607421875, -1.37518310546875, -1.310943603515625, -1.2467041015625, -1.182464599609375, -1.11822509765625, -1.053985595703125, -0.98974609375, -0.925506591796875, -0.86126708984375, -0.797027587890625, -0.7327880859375, -0.668548583984375, -0.60430908203125, -0.540069580078125, -0.475830078125, -0.411590576171875, -0.34735107421875, -0.283111572265625, -0.2188720703125, -0.154632568359375, -0.09039306640625, -0.026153564453125, 0.0380859375, 0.102325439453125, 0.16656494140625, 0.230804443359375, 0.2950439453125, 0.359283447265625, 0.42352294921875, 0.487762451171875, 0.552001953125, 0.616241455078125, 0.68048095703125, 0.744720458984375, 0.8089599609375, 0.873199462890625, 0.93743896484375, 1.001678466796875, 1.06591796875, 1.130157470703125, 1.19439697265625, 1.258636474609375, 1.3228759765625, 1.387115478515625, 1.45135498046875, 1.515594482421875, 1.579833984375, 1.644073486328125, 1.70831298828125, 1.772552490234375, 1.8367919921875, 1.901031494140625, 1.96527099609375, 2.029510498046875, 2.09375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 4.0, 7.0, 8.0, 15.0, 18.0, 23.0, 22.0, 32.0, 37.0, 48.0, 71.0, 56.0, 99.0, 87.0, 97.0, 82.0, 58.0, 62.0, 43.0, 31.0, 22.0, 14.0, 11.0, 9.0, 6.0, 6.0, 11.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7657334804534912, -0.7423852682113647, -0.7190370559692383, -0.6956888437271118, -0.6723406314849854, -0.6489924788475037, -0.6256442666053772, -0.6022960543632507, -0.5789478421211243, -0.5555996298789978, -0.5322514176368713, -0.5089032053947449, -0.4855550229549408, -0.46220681071281433, -0.43885862827301025, -0.4155104160308838, -0.3921622037887573, -0.36881399154663086, -0.3454657793045044, -0.3221175968647003, -0.29876938462257385, -0.2754211723804474, -0.2520729899406433, -0.22872477769851685, -0.20537656545639038, -0.18202835321426392, -0.15868015587329865, -0.13533195853233337, -0.11198374629020691, -0.08863554149866104, -0.06528733670711517, -0.0419391393661499, -0.018590927124023438, 0.00475727766752243, 0.0281054824590683, 0.051453687250614166, 0.07480189204216003, 0.0981500968337059, 0.12149830162525177, 0.14484649896621704, 0.1681947112083435, 0.19154292345046997, 0.21489112079143524, 0.2382393181324005, 0.261587530374527, 0.28493574261665344, 0.3082839250564575, 0.331632137298584, 0.35498034954071045, 0.3783285617828369, 0.4016767740249634, 0.42502495646476746, 0.4483731687068939, 0.4717213809490204, 0.49506956338882446, 0.5184177756309509, 0.5417659878730774, 0.5651142001152039, 0.5884624123573303, 0.6118106245994568, 0.6351587772369385, 0.6585069894790649, 0.6818552017211914, 0.7052034139633179, 0.7285516262054443]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 10.0, 7.0, 17.0, 12.0, 21.0, 24.0, 30.0, 23.0, 29.0, 35.0, 50.0, 44.0, 42.0, 52.0, 42.0, 41.0, 48.0, 40.0, 36.0, 48.0, 31.0, 38.0, 38.0, 35.0, 24.0, 25.0, 21.0, 27.0, 17.0, 9.0, 12.0, 10.0, 10.0, 4.0, 1.0, 7.0, 3.0, 10.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40622490644454956, -0.3929535448551178, -0.37968218326568604, -0.36641085147857666, -0.3531394898891449, -0.33986812829971313, -0.32659679651260376, -0.313325434923172, -0.30005407333374023, -0.28678271174430847, -0.2735113501548767, -0.26024001836776733, -0.24696865677833557, -0.2336972951889038, -0.22042594850063324, -0.20715460181236267, -0.1938832402229309, -0.18061187863349915, -0.16734053194522858, -0.154069185256958, -0.14079782366752625, -0.12752646207809448, -0.11425511538982391, -0.10098376125097275, -0.08771240711212158, -0.07444105297327042, -0.06116969883441925, -0.047898344695568085, -0.03462699055671692, -0.021355636417865753, -0.008084282279014587, 0.005187071859836578, 0.018458425998687744, 0.03172978013753891, 0.045001134276390076, 0.05827248841524124, 0.07154384255409241, 0.08481519669294357, 0.09808655083179474, 0.1113579049706459, 0.12462925910949707, 0.13790062069892883, 0.1511719673871994, 0.16444331407546997, 0.17771467566490173, 0.1909860372543335, 0.20425738394260406, 0.21752873063087463, 0.2308000922203064, 0.24407145380973816, 0.2573428153991699, 0.2706141471862793, 0.28388550877571106, 0.2971568703651428, 0.3104282021522522, 0.32369956374168396, 0.3369709253311157, 0.3502422869205475, 0.36351364850997925, 0.3767849802970886, 0.3900563418865204, 0.40332770347595215, 0.4165990352630615, 0.4298703968524933, 0.44314175844192505]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 9.0, 4.0, 7.0, 10.0, 8.0, 10.0, 19.0, 13.0, 18.0, 27.0, 32.0, 26.0, 39.0, 42.0, 44.0, 49.0, 60.0, 48.0, 41.0, 70.0, 42.0, 45.0, 41.0, 35.0, 48.0, 26.0, 30.0, 21.0, 31.0, 21.0, 21.0, 11.0, 13.0, 6.0, 8.0, 12.0, 3.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-194.0, -188.119140625, -182.23828125, -176.357421875, -170.4765625, -164.595703125, -158.71484375, -152.833984375, -146.953125, -141.072265625, -135.19140625, -129.310546875, -123.4296875, -117.548828125, -111.66796875, -105.787109375, -99.90625, -94.025390625, -88.14453125, -82.263671875, -76.3828125, -70.501953125, -64.62109375, -58.740234375, -52.859375, -46.978515625, -41.09765625, -35.216796875, -29.3359375, -23.455078125, -17.57421875, -11.693359375, -5.8125, 0.068359375, 5.94921875, 11.830078125, 17.7109375, 23.591796875, 29.47265625, 35.353515625, 41.234375, 47.115234375, 52.99609375, 58.876953125, 64.7578125, 70.638671875, 76.51953125, 82.400390625, 88.28125, 94.162109375, 100.04296875, 105.923828125, 111.8046875, 117.685546875, 123.56640625, 129.447265625, 135.328125, 141.208984375, 147.08984375, 152.970703125, 158.8515625, 164.732421875, 170.61328125, 176.494140625, 182.375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 4.0, 11.0, 7.0, 8.0, 16.0, 11.0, 17.0, 15.0, 43.0, 52.0, 68.0, 127.0, 266.0, 598.0, 2009.0, 8397.0, 59631.0, 707484.0, 242280.0, 21570.0, 3915.0, 1154.0, 383.0, 155.0, 98.0, 48.0, 35.0, 39.0, 20.0, 20.0, 17.0, 11.0, 7.0, 7.0, 10.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-43.03125, -41.7177734375, -40.404296875, -39.0908203125, -37.77734375, -36.4638671875, -35.150390625, -33.8369140625, -32.5234375, -31.2099609375, -29.896484375, -28.5830078125, -27.26953125, -25.9560546875, -24.642578125, -23.3291015625, -22.015625, -20.7021484375, -19.388671875, -18.0751953125, -16.76171875, -15.4482421875, -14.134765625, -12.8212890625, -11.5078125, -10.1943359375, -8.880859375, -7.5673828125, -6.25390625, -4.9404296875, -3.626953125, -2.3134765625, -1.0, 0.3134765625, 1.626953125, 2.9404296875, 4.25390625, 5.5673828125, 6.880859375, 8.1943359375, 9.5078125, 10.8212890625, 12.134765625, 13.4482421875, 14.76171875, 16.0751953125, 17.388671875, 18.7021484375, 20.015625, 21.3291015625, 22.642578125, 23.9560546875, 25.26953125, 26.5830078125, 27.896484375, 29.2099609375, 30.5234375, 31.8369140625, 33.150390625, 34.4638671875, 35.77734375, 37.0908203125, 38.404296875, 39.7177734375, 41.03125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 5.0, 11.0, 19.0, 15.0, 34.0, 33.0, 26.0, 37.0, 48.0, 52.0, 50.0, 62.0, 62.0, 2114.0, 82.0, 67.0, 44.0, 47.0, 42.0, 33.0, 41.0, 28.0, 19.0, 23.0, 15.0, 7.0, 8.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.25, -254.30859375, -245.3671875, -236.42578125, -227.484375, -218.54296875, -209.6015625, -200.66015625, -191.71875, -182.77734375, -173.8359375, -164.89453125, -155.953125, -147.01171875, -138.0703125, -129.12890625, -120.1875, -111.24609375, -102.3046875, -93.36328125, -84.421875, -75.48046875, -66.5390625, -57.59765625, -48.65625, -39.71484375, -30.7734375, -21.83203125, -12.890625, -3.94921875, 4.9921875, 13.93359375, 22.875, 31.81640625, 40.7578125, 49.69921875, 58.640625, 67.58203125, 76.5234375, 85.46484375, 94.40625, 103.34765625, 112.2890625, 121.23046875, 130.171875, 139.11328125, 148.0546875, 156.99609375, 165.9375, 174.87890625, 183.8203125, 192.76171875, 201.703125, 210.64453125, 219.5859375, 228.52734375, 237.46875, 246.41015625, 255.3515625, 264.29296875, 273.234375, 282.17578125, 291.1171875, 300.05859375, 309.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 4.0, 11.0, 13.0, 22.0, 38.0, 46.0, 70.0, 134.0, 202.0, 309.0, 623.0, 1072.0, 2537.0, 6950.0, 25592.0, 137421.0, 2699774.0, 218357.0, 37007.0, 9429.0, 3043.0, 1347.0, 628.0, 406.0, 250.0, 140.0, 95.0, 57.0, 36.0, 26.0, 17.0, 9.0, 9.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.125, -22.45703125, -21.7890625, -21.12109375, -20.453125, -19.78515625, -19.1171875, -18.44921875, -17.78125, -17.11328125, -16.4453125, -15.77734375, -15.109375, -14.44140625, -13.7734375, -13.10546875, -12.4375, -11.76953125, -11.1015625, -10.43359375, -9.765625, -9.09765625, -8.4296875, -7.76171875, -7.09375, -6.42578125, -5.7578125, -5.08984375, -4.421875, -3.75390625, -3.0859375, -2.41796875, -1.75, -1.08203125, -0.4140625, 0.25390625, 0.921875, 1.58984375, 2.2578125, 2.92578125, 3.59375, 4.26171875, 4.9296875, 5.59765625, 6.265625, 6.93359375, 7.6015625, 8.26953125, 8.9375, 9.60546875, 10.2734375, 10.94140625, 11.609375, 12.27734375, 12.9453125, 13.61328125, 14.28125, 14.94921875, 15.6171875, 16.28515625, 16.953125, 17.62109375, 18.2890625, 18.95703125, 19.625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 4.0, 12.0, 15.0, 35.0, 62.0, 82.0, 147.0, 161.0, 167.0, 110.0, 70.0, 35.0, 31.0, 7.0, 13.0, 8.0, 4.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-362.7062683105469, -352.2384338378906, -341.7705993652344, -331.3027648925781, -320.8349304199219, -310.3670654296875, -299.89923095703125, -289.431396484375, -278.96356201171875, -268.4957275390625, -258.02789306640625, -247.56005859375, -237.0922088623047, -226.62437438964844, -216.1565399169922, -205.68869018554688, -195.2208709716797, -184.75303649902344, -174.2852020263672, -163.81735229492188, -153.34951782226562, -142.88168334960938, -132.41384887695312, -121.94600677490234, -111.4781723022461, -101.01033782958984, -90.54249572753906, -80.07466125488281, -69.60682678222656, -59.13898468017578, -48.67115020751953, -38.20330810546875, -27.7354736328125, -17.267635345458984, -6.799798965454102, 3.6680374145507812, 14.135875701904297, 24.603713989257812, 35.07154846191406, 45.539390563964844, 56.007225036621094, 66.47505950927734, 76.94290161132812, 87.41073608398438, 97.87857055664062, 108.3464126586914, 118.81424713134766, 129.28208923339844, 139.7499237060547, 150.21775817871094, 160.6855926513672, 171.1534423828125, 181.62127685546875, 192.089111328125, 202.55694580078125, 213.0247802734375, 223.49261474609375, 233.96044921875, 244.42828369140625, 254.8961181640625, 265.36395263671875, 275.831787109375, 286.29962158203125, 296.7674865722656, 307.2353210449219]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 5.0, 14.0, 11.0, 7.0, 11.0, 23.0, 26.0, 31.0, 26.0, 31.0, 43.0, 33.0, 44.0, 45.0, 37.0, 50.0, 48.0, 54.0, 47.0, 38.0, 31.0, 31.0, 38.0, 38.0, 39.0, 28.0, 20.0, 22.0, 24.0, 20.0, 12.0, 16.0, 6.0, 7.0, 10.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.3106384277344, -255.05584716796875, -245.80105590820312, -236.5462646484375, -227.29147338867188, -218.03668212890625, -208.78187561035156, -199.52708435058594, -190.2722930908203, -181.0175018310547, -171.76271057128906, -162.50791931152344, -153.25311279296875, -143.99832153320312, -134.7435302734375, -125.48873901367188, -116.23394775390625, -106.97915649414062, -97.724365234375, -88.46956634521484, -79.21477508544922, -69.9599838256836, -60.7051887512207, -51.45039367675781, -42.19560241699219, -32.94081115722656, -23.686016082763672, -14.431222915649414, -5.176429748535156, 4.078361511230469, 13.33315658569336, 22.58795166015625, 31.842742919921875, 41.0975341796875, 50.35232925415039, 59.60712432861328, 68.8619155883789, 78.11670684814453, 87.37150573730469, 96.62629699707031, 105.88108825683594, 115.13587951660156, 124.39067077636719, 133.6454620361328, 142.9002685546875, 152.15505981445312, 161.40985107421875, 170.66464233398438, 179.91943359375, 189.17422485351562, 198.42901611328125, 207.68380737304688, 216.9385986328125, 226.19338989257812, 235.4481964111328, 244.70298767089844, 253.95777893066406, 263.21258544921875, 272.4673767089844, 281.72216796875, 290.9769592285156, 300.23175048828125, 309.4865417480469, 318.7413330078125, 327.9961242675781]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 8.0, 7.0, 13.0, 14.0, 13.0, 18.0, 25.0, 34.0, 25.0, 36.0, 53.0, 64.0, 76.0, 110.0, 202.0, 622.0, 2952.0, 1021834.0, 18336.0, 2819.0, 592.0, 188.0, 109.0, 55.0, 62.0, 46.0, 46.0, 31.0, 26.0, 18.0, 27.0, 14.0, 16.0, 12.0, 7.0, 4.0, 10.0, 5.0, 3.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-134.8987579345703, -130.39950561523438, -125.9002456665039, -121.40098571777344, -116.9017333984375, -112.40248107910156, -107.9032211303711, -103.40396118164062, -98.90470886230469, -94.40545654296875, -89.90619659423828, -85.40693664550781, -80.90768432617188, -76.40843200683594, -71.90917205810547, -67.409912109375, -62.91065979003906, -58.41140365600586, -53.912147521972656, -49.41289138793945, -44.91363525390625, -40.41437911987305, -35.915122985839844, -31.41586685180664, -26.916610717773438, -22.417354583740234, -17.91809844970703, -13.418842315673828, -8.919586181640625, -4.420330047607422, 0.07892608642578125, 4.578182220458984, 9.077438354492188, 13.57669448852539, 18.075950622558594, 22.575206756591797, 27.074462890625, 31.573719024658203, 36.072975158691406, 40.57223129272461, 45.07148742675781, 49.570743560791016, 54.06999969482422, 58.56925582885742, 63.068511962890625, 67.56776428222656, 72.06702423095703, 76.5662841796875, 81.06553649902344, 85.56478881835938, 90.06404876708984, 94.56330871582031, 99.06256103515625, 103.56181335449219, 108.06107330322266, 112.56033325195312, 117.05958557128906, 121.558837890625, 126.05809783935547, 130.55735778808594, 135.05661010742188, 139.5558624267578, 144.05511474609375, 148.55438232421875, 153.0536346435547]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 10.0, 9.0, 22.0, 110.0, 12289.0, 51450424.0, 234.0, 32.0, 13.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1703.0, -1625.929443359375, -1548.8587646484375, -1471.7880859375, -1394.717529296875, -1317.64697265625, -1240.5762939453125, -1163.505615234375, -1086.43505859375, -1009.3644409179688, -932.2938232421875, -855.2232055664062, -778.152587890625, -701.0819702148438, -624.0113525390625, -546.9407348632812, -469.8701171875, -392.79949951171875, -315.7288818359375, -238.65826416015625, -161.587646484375, -84.51702880859375, -7.4464111328125, 69.62420654296875, 146.69482421875, 223.76544189453125, 300.8360595703125, 377.90667724609375, 454.977294921875, 532.0479125976562, 609.1185302734375, 686.1891479492188, 763.259521484375, 840.3301391601562, 917.4007568359375, 994.4713745117188, 1071.5419921875, 1148.612548828125, 1225.6832275390625, 1302.75390625, 1379.824462890625, 1456.89501953125, 1533.9656982421875, 1611.036376953125, 1688.10693359375, 1765.177490234375, 1842.2481689453125, 1919.31884765625, 1996.389404296875, 2073.4599609375, 2150.53076171875, 2227.601318359375, 2304.671875, 2381.742431640625, 2458.81298828125, 2535.8837890625, 2612.954345703125, 2690.02490234375, 2767.095703125, 2844.166259765625, 2921.23681640625, 2998.307373046875, 3075.3779296875, 3152.44873046875, 3229.519287109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 4.0, 13.0, 22.0, 30.0, 36.0, 68.0, 96.0, 150.0, 169.0, 133.0, 78.0, 49.0, 33.0, 25.0, 24.0, 14.0, 10.0, 11.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-473.2582702636719, -461.255859375, -449.25341796875, -437.2510070800781, -425.2485656738281, -413.24615478515625, -401.24371337890625, -389.2413024902344, -377.2388916015625, -365.2364807128906, -353.2340393066406, -341.23162841796875, -329.22918701171875, -317.2267761230469, -305.224365234375, -293.221923828125, -281.219482421875, -269.2170715332031, -257.2146301269531, -245.21221923828125, -233.20977783203125, -221.20736694335938, -209.20494079589844, -197.2025146484375, -185.20008850097656, -173.19766235351562, -161.1952362060547, -149.19281005859375, -137.19039916992188, -125.1879653930664, -113.185546875, -101.18312072753906, -89.18072509765625, -77.17829895019531, -65.17587280273438, -53.17345428466797, -41.17102813720703, -29.168601989746094, -17.166183471679688, -5.16375732421875, 6.8386688232421875, 18.841093063354492, 30.843517303466797, 42.84593963623047, 54.848365783691406, 66.85079193115234, 78.85321044921875, 90.85563659667969, 102.85806274414062, 114.86048889160156, 126.8629150390625, 138.86532592773438, 150.86776733398438, 162.87017822265625, 174.8726043701172, 186.87503051757812, 198.87745666503906, 210.8798828125, 222.88230895996094, 234.88473510742188, 246.88714599609375, 258.88958740234375, 270.8919982910156, 282.8944091796875, 294.8968505859375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 3.0, 5.0, 12.0, 12.0, 21.0, 15.0, 24.0, 25.0, 30.0, 38.0, 28.0, 48.0, 52.0, 56.0, 41.0, 50.0, 41.0, 52.0, 39.0, 41.0, 41.0, 44.0, 41.0, 42.0, 28.0, 29.0, 21.0, 21.0, 13.0, 18.0, 11.0, 10.0, 11.0, 8.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.5557861328125, -119.46653747558594, -115.3772964477539, -111.28804779052734, -107.19880676269531, -103.10955810546875, -99.02030944824219, -94.93106079101562, -90.8418197631836, -86.75257110595703, -82.663330078125, -78.57408142089844, -74.48483276367188, -70.39559173583984, -66.30634307861328, -62.217098236083984, -58.12785339355469, -54.03860855102539, -49.949363708496094, -45.86011505126953, -41.770870208740234, -37.68162536621094, -33.592376708984375, -29.503131866455078, -25.41388702392578, -21.324642181396484, -17.235395431518555, -13.146149635314941, -9.056903839111328, -4.967658996582031, -0.8784122467041016, 3.210834503173828, 7.300079345703125, 11.389325141906738, 15.478570938110352, 19.56781768798828, 23.657062530517578, 27.746307373046875, 31.835554122924805, 35.924800872802734, 40.01404571533203, 44.10329055786133, 48.192535400390625, 52.28178405761719, 56.371028900146484, 60.46027374267578, 64.54952239990234, 68.63876342773438, 72.72801208496094, 76.8172607421875, 80.90650177001953, 84.9957504272461, 89.08499145507812, 93.17424011230469, 97.26348876953125, 101.35273742675781, 105.44197845458984, 109.5312271118164, 113.62046813964844, 117.709716796875, 121.79896545410156, 125.8882064819336, 129.97744750976562, 134.0666961669922, 138.15594482421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 13.0, 12.0, 28.0, 34.0, 41.0, 76.0, 116.0, 178.0, 282.0, 396.0, 607.0, 1062.0, 1784.0, 3105.0, 5439.0, 10596.0, 21945.0, 54093.0, 181282.0, 2999128.0, 720861.0, 123120.0, 37277.0, 14781.0, 7181.0, 3973.0, 2406.0, 1479.0, 962.0, 625.0, 427.0, 292.0, 196.0, 135.0, 103.0, 65.0, 51.0, 27.0, 27.0, 19.0, 11.0, 13.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.2578125, -11.84716796875, -11.4365234375, -11.02587890625, -10.615234375, -10.20458984375, -9.7939453125, -9.38330078125, -8.97265625, -8.56201171875, -8.1513671875, -7.74072265625, -7.330078125, -6.91943359375, -6.5087890625, -6.09814453125, -5.6875, -5.27685546875, -4.8662109375, -4.45556640625, -4.044921875, -3.63427734375, -3.2236328125, -2.81298828125, -2.40234375, -1.99169921875, -1.5810546875, -1.17041015625, -0.759765625, -0.34912109375, 0.0615234375, 0.47216796875, 0.8828125, 1.29345703125, 1.7041015625, 2.11474609375, 2.525390625, 2.93603515625, 3.3466796875, 3.75732421875, 4.16796875, 4.57861328125, 4.9892578125, 5.39990234375, 5.810546875, 6.22119140625, 6.6318359375, 7.04248046875, 7.453125, 7.86376953125, 8.2744140625, 8.68505859375, 9.095703125, 9.50634765625, 9.9169921875, 10.32763671875, 10.73828125, 11.14892578125, 11.5595703125, 11.97021484375, 12.380859375, 12.79150390625, 13.2021484375, 13.61279296875, 14.0234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 4.0, 4.0, 9.0, 7.0, 20.0, 24.0, 31.0, 52.0, 41.0, 60.0, 75.0, 86.0, 99.0, 87.0, 71.0, 71.0, 65.0, 49.0, 33.0, 22.0, 19.0, 15.0, 12.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.71728515625, -0.6969985961914062, -0.6767120361328125, -0.6564254760742188, -0.636138916015625, -0.6158523559570312, -0.5955657958984375, -0.5752792358398438, -0.55499267578125, -0.5347061157226562, -0.5144195556640625, -0.49413299560546875, -0.473846435546875, -0.45355987548828125, -0.4332733154296875, -0.41298675537109375, -0.3927001953125, -0.37241363525390625, -0.3521270751953125, -0.33184051513671875, -0.311553955078125, -0.29126739501953125, -0.2709808349609375, -0.25069427490234375, -0.23040771484375, -0.21012115478515625, -0.1898345947265625, -0.16954803466796875, -0.149261474609375, -0.12897491455078125, -0.1086883544921875, -0.08840179443359375, -0.068115234375, -0.04782867431640625, -0.0275421142578125, -0.00725555419921875, 0.013031005859375, 0.03331756591796875, 0.0536041259765625, 0.07389068603515625, 0.09417724609375, 0.11446380615234375, 0.1347503662109375, 0.15503692626953125, 0.175323486328125, 0.19561004638671875, 0.2158966064453125, 0.23618316650390625, 0.2564697265625, 0.27675628662109375, 0.2970428466796875, 0.31732940673828125, 0.337615966796875, 0.35790252685546875, 0.3781890869140625, 0.39847564697265625, 0.41876220703125, 0.43904876708984375, 0.4593353271484375, 0.47962188720703125, 0.499908447265625, 0.5201950073242188, 0.5404815673828125, 0.5607681274414062, 0.5810546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 8.0, 14.0, 11.0, 16.0, 29.0, 42.0, 93.0, 153.0, 226.0, 469.0, 866.0, 1614.0, 3108.0, 6953.0, 16914.0, 48475.0, 180706.0, 2674953.0, 1056978.0, 136955.0, 39643.0, 14215.0, 6000.0, 2715.0, 1388.0, 749.0, 402.0, 208.0, 145.0, 82.0, 46.0, 36.0, 24.0, 11.0, 9.0, 10.0, 2.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3984375, -14.915771484375, -14.43310546875, -13.950439453125, -13.4677734375, -12.985107421875, -12.50244140625, -12.019775390625, -11.537109375, -11.054443359375, -10.57177734375, -10.089111328125, -9.6064453125, -9.123779296875, -8.64111328125, -8.158447265625, -7.67578125, -7.193115234375, -6.71044921875, -6.227783203125, -5.7451171875, -5.262451171875, -4.77978515625, -4.297119140625, -3.814453125, -3.331787109375, -2.84912109375, -2.366455078125, -1.8837890625, -1.401123046875, -0.91845703125, -0.435791015625, 0.046875, 0.529541015625, 1.01220703125, 1.494873046875, 1.9775390625, 2.460205078125, 2.94287109375, 3.425537109375, 3.908203125, 4.390869140625, 4.87353515625, 5.356201171875, 5.8388671875, 6.321533203125, 6.80419921875, 7.286865234375, 7.76953125, 8.252197265625, 8.73486328125, 9.217529296875, 9.7001953125, 10.182861328125, 10.66552734375, 11.148193359375, 11.630859375, 12.113525390625, 12.59619140625, 13.078857421875, 13.5615234375, 14.044189453125, 14.52685546875, 15.009521484375, 15.4921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 8.0, 17.0, 14.0, 21.0, 28.0, 34.0, 46.0, 69.0, 81.0, 119.0, 157.0, 286.0, 537.0, 1068.0, 528.0, 292.0, 235.0, 136.0, 103.0, 78.0, 38.0, 40.0, 20.0, 14.0, 17.0, 13.0, 16.0, 5.0, 6.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.349609375, -2.277130126953125, -2.20465087890625, -2.132171630859375, -2.0596923828125, -1.987213134765625, -1.91473388671875, -1.842254638671875, -1.769775390625, -1.697296142578125, -1.62481689453125, -1.552337646484375, -1.4798583984375, -1.407379150390625, -1.33489990234375, -1.262420654296875, -1.18994140625, -1.117462158203125, -1.04498291015625, -0.972503662109375, -0.9000244140625, -0.827545166015625, -0.75506591796875, -0.682586669921875, -0.610107421875, -0.537628173828125, -0.46514892578125, -0.392669677734375, -0.3201904296875, -0.247711181640625, -0.17523193359375, -0.102752685546875, -0.0302734375, 0.042205810546875, 0.11468505859375, 0.187164306640625, 0.2596435546875, 0.332122802734375, 0.40460205078125, 0.477081298828125, 0.549560546875, 0.622039794921875, 0.69451904296875, 0.766998291015625, 0.8394775390625, 0.911956787109375, 0.98443603515625, 1.056915283203125, 1.12939453125, 1.201873779296875, 1.27435302734375, 1.346832275390625, 1.4193115234375, 1.491790771484375, 1.56427001953125, 1.636749267578125, 1.709228515625, 1.781707763671875, 1.85418701171875, 1.926666259765625, 1.9991455078125, 2.071624755859375, 2.14410400390625, 2.216583251953125, 2.2890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 3.0, 10.0, 13.0, 22.0, 38.0, 44.0, 68.0, 84.0, 133.0, 145.0, 135.0, 76.0, 66.0, 33.0, 34.0, 18.0, 19.0, 15.0, 6.0, 5.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.07182312011719, -35.952171325683594, -34.832523345947266, -33.71287155151367, -32.593223571777344, -31.47357177734375, -30.353919982910156, -29.234270095825195, -28.114620208740234, -26.994970321655273, -25.875320434570312, -24.75566864013672, -23.636018753051758, -22.516368865966797, -21.396717071533203, -20.277067184448242, -19.15741729736328, -18.03776741027832, -16.91811752319336, -15.798465728759766, -14.678815841674805, -13.559165954589844, -12.439515113830566, -11.319864273071289, -10.200214385986328, -9.080564498901367, -7.96091365814209, -6.841263294219971, -5.721612930297852, -4.601962566375732, -3.4823122024536133, -2.362661838531494, -1.2430076599121094, -0.12335729598999023, 0.9962930679321289, 2.115943431854248, 3.235593795776367, 4.355244159698486, 5.4748945236206055, 6.594544887542725, 7.714195251464844, 8.833845138549805, 9.953495979309082, 11.07314682006836, 12.19279670715332, 13.312446594238281, 14.432097434997559, 15.551748275756836, 16.671398162841797, 17.791048049926758, 18.91069793701172, 20.030349731445312, 21.149999618530273, 22.269649505615234, 23.389301300048828, 24.50895118713379, 25.62860107421875, 26.74825096130371, 27.867900848388672, 28.987552642822266, 30.107202529907227, 31.226852416992188, 32.34650421142578, 33.46615219116211, 34.5858039855957]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 9.0, 9.0, 6.0, 9.0, 23.0, 14.0, 19.0, 22.0, 18.0, 23.0, 32.0, 31.0, 40.0, 38.0, 35.0, 46.0, 34.0, 37.0, 50.0, 41.0, 45.0, 51.0, 35.0, 36.0, 33.0, 39.0, 29.0, 27.0, 24.0, 18.0, 23.0, 17.0, 14.0, 15.0, 11.0, 7.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.434606552124023, -9.142040252685547, -8.849474906921387, -8.55690860748291, -8.26434326171875, -7.971776962280273, -7.679210662841797, -7.3866448402404785, -7.09407901763916, -6.801513195037842, -6.508947372436523, -6.216381072998047, -5.9238152503967285, -5.63124942779541, -5.338683128356934, -5.046117305755615, -4.753551483154297, -4.4609856605529785, -4.16841983795166, -3.8758535385131836, -3.5832877159118652, -3.290721893310547, -2.9981558322906494, -2.705589771270752, -2.4130239486694336, -2.1204581260681152, -1.8278920650482178, -1.5353261232376099, -1.242760181427002, -0.950194239616394, -0.6576282978057861, -0.36506223678588867, -0.0724954605102539, 0.220070481300354, 0.5126364231109619, 0.8052023649215698, 1.0977683067321777, 1.3903342485427856, 1.6829001903533936, 1.975466251373291, 2.2680320739746094, 2.5605978965759277, 2.853163957595825, 3.1457300186157227, 3.438295841217041, 3.7308616638183594, 4.023427963256836, 4.315993785858154, 4.608559608459473, 4.901125431060791, 5.193691253662109, 5.486257553100586, 5.778823375701904, 6.071389198303223, 6.363955497741699, 6.656521320343018, 6.949087142944336, 7.241652965545654, 7.534218788146973, 7.826785087585449, 8.11935043334961, 8.411916732788086, 8.704483032226562, 8.997049331665039, 9.2896146774292]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 9.0, 5.0, 6.0, 10.0, 16.0, 26.0, 30.0, 39.0, 50.0, 64.0, 80.0, 136.0, 197.0, 271.0, 453.0, 771.0, 1250.0, 2126.0, 4124.0, 8972.0, 23327.0, 81155.0, 423736.0, 387076.0, 74822.0, 21979.0, 8555.0, 3941.0, 2057.0, 1123.0, 761.0, 398.0, 294.0, 202.0, 120.0, 97.0, 73.0, 47.0, 38.0, 40.0, 22.0, 12.0, 11.0, 8.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-8.9296875, -8.641357421875, -8.35302734375, -8.064697265625, -7.7763671875, -7.488037109375, -7.19970703125, -6.911376953125, -6.623046875, -6.334716796875, -6.04638671875, -5.758056640625, -5.4697265625, -5.181396484375, -4.89306640625, -4.604736328125, -4.31640625, -4.028076171875, -3.73974609375, -3.451416015625, -3.1630859375, -2.874755859375, -2.58642578125, -2.298095703125, -2.009765625, -1.721435546875, -1.43310546875, -1.144775390625, -0.8564453125, -0.568115234375, -0.27978515625, 0.008544921875, 0.296875, 0.585205078125, 0.87353515625, 1.161865234375, 1.4501953125, 1.738525390625, 2.02685546875, 2.315185546875, 2.603515625, 2.891845703125, 3.18017578125, 3.468505859375, 3.7568359375, 4.045166015625, 4.33349609375, 4.621826171875, 4.91015625, 5.198486328125, 5.48681640625, 5.775146484375, 6.0634765625, 6.351806640625, 6.64013671875, 6.928466796875, 7.216796875, 7.505126953125, 7.79345703125, 8.081787109375, 8.3701171875, 8.658447265625, 8.94677734375, 9.235107421875, 9.5234375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 8.0, 5.0, 6.0, 6.0, 12.0, 19.0, 21.0, 33.0, 28.0, 48.0, 62.0, 66.0, 63.0, 77.0, 76.0, 65.0, 64.0, 66.0, 54.0, 44.0, 24.0, 28.0, 25.0, 17.0, 19.0, 13.0, 14.0, 10.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.70458984375, -0.685699462890625, -0.66680908203125, -0.647918701171875, -0.6290283203125, -0.610137939453125, -0.59124755859375, -0.572357177734375, -0.553466796875, -0.534576416015625, -0.51568603515625, -0.496795654296875, -0.4779052734375, -0.459014892578125, -0.44012451171875, -0.421234130859375, -0.40234375, -0.383453369140625, -0.36456298828125, -0.345672607421875, -0.3267822265625, -0.307891845703125, -0.28900146484375, -0.270111083984375, -0.251220703125, -0.232330322265625, -0.21343994140625, -0.194549560546875, -0.1756591796875, -0.156768798828125, -0.13787841796875, -0.118988037109375, -0.10009765625, -0.081207275390625, -0.06231689453125, -0.043426513671875, -0.0245361328125, -0.005645751953125, 0.01324462890625, 0.032135009765625, 0.051025390625, 0.069915771484375, 0.08880615234375, 0.107696533203125, 0.1265869140625, 0.145477294921875, 0.16436767578125, 0.183258056640625, 0.2021484375, 0.221038818359375, 0.23992919921875, 0.258819580078125, 0.2777099609375, 0.296600341796875, 0.31549072265625, 0.334381103515625, 0.353271484375, 0.372161865234375, 0.39105224609375, 0.409942626953125, 0.4288330078125, 0.447723388671875, 0.46661376953125, 0.485504150390625, 0.50439453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 7.0, 11.0, 19.0, 20.0, 32.0, 56.0, 83.0, 155.0, 310.0, 524.0, 992.0, 1945.0, 3987.0, 9682.0, 29910.0, 152453.0, 664418.0, 138575.0, 28116.0, 9278.0, 3958.0, 1871.0, 928.0, 519.0, 265.0, 147.0, 92.0, 57.0, 27.0, 25.0, 12.0, 16.0, 11.0, 2.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.3125, -9.0257568359375, -8.739013671875, -8.4522705078125, -8.16552734375, -7.8787841796875, -7.592041015625, -7.3052978515625, -7.0185546875, -6.7318115234375, -6.445068359375, -6.1583251953125, -5.87158203125, -5.5848388671875, -5.298095703125, -5.0113525390625, -4.724609375, -4.4378662109375, -4.151123046875, -3.8643798828125, -3.57763671875, -3.2908935546875, -3.004150390625, -2.7174072265625, -2.4306640625, -2.1439208984375, -1.857177734375, -1.5704345703125, -1.28369140625, -0.9969482421875, -0.710205078125, -0.4234619140625, -0.13671875, 0.1500244140625, 0.436767578125, 0.7235107421875, 1.01025390625, 1.2969970703125, 1.583740234375, 1.8704833984375, 2.1572265625, 2.4439697265625, 2.730712890625, 3.0174560546875, 3.30419921875, 3.5909423828125, 3.877685546875, 4.1644287109375, 4.451171875, 4.7379150390625, 5.024658203125, 5.3114013671875, 5.59814453125, 5.8848876953125, 6.171630859375, 6.4583740234375, 6.7451171875, 7.0318603515625, 7.318603515625, 7.6053466796875, 7.89208984375, 8.1788330078125, 8.465576171875, 8.7523193359375, 9.0390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 7.0, 4.0, 14.0, 7.0, 18.0, 14.0, 17.0, 19.0, 17.0, 22.0, 25.0, 36.0, 36.0, 35.0, 41.0, 45.0, 43.0, 31.0, 41.0, 41.0, 42.0, 48.0, 37.0, 32.0, 43.0, 34.0, 32.0, 33.0, 31.0, 25.0, 12.0, 14.0, 13.0, 22.0, 14.0, 8.0, 9.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.48956298828125, -2.4088134765625, -2.32806396484375, -2.247314453125, -2.16656494140625, -2.0858154296875, -2.00506591796875, -1.92431640625, -1.84356689453125, -1.7628173828125, -1.68206787109375, -1.601318359375, -1.52056884765625, -1.4398193359375, -1.35906982421875, -1.2783203125, -1.19757080078125, -1.1168212890625, -1.03607177734375, -0.955322265625, -0.87457275390625, -0.7938232421875, -0.71307373046875, -0.63232421875, -0.55157470703125, -0.4708251953125, -0.39007568359375, -0.309326171875, -0.22857666015625, -0.1478271484375, -0.06707763671875, 0.013671875, 0.09442138671875, 0.1751708984375, 0.25592041015625, 0.336669921875, 0.41741943359375, 0.4981689453125, 0.57891845703125, 0.65966796875, 0.74041748046875, 0.8211669921875, 0.90191650390625, 0.982666015625, 1.06341552734375, 1.1441650390625, 1.22491455078125, 1.3056640625, 1.38641357421875, 1.4671630859375, 1.54791259765625, 1.628662109375, 1.70941162109375, 1.7901611328125, 1.87091064453125, 1.95166015625, 2.03240966796875, 2.1131591796875, 2.19390869140625, 2.274658203125, 2.35540771484375, 2.4361572265625, 2.51690673828125, 2.59765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 4.0, 7.0, 13.0, 26.0, 34.0, 69.0, 107.0, 223.0, 451.0, 1074.0, 3087.0, 11720.0, 107062.0, 867924.0, 45596.0, 7380.0, 2200.0, 815.0, 351.0, 167.0, 101.0, 55.0, 27.0, 24.0, 14.0, 7.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.15625, -34.0693359375, -32.982421875, -31.8955078125, -30.80859375, -29.7216796875, -28.634765625, -27.5478515625, -26.4609375, -25.3740234375, -24.287109375, -23.2001953125, -22.11328125, -21.0263671875, -19.939453125, -18.8525390625, -17.765625, -16.6787109375, -15.591796875, -14.5048828125, -13.41796875, -12.3310546875, -11.244140625, -10.1572265625, -9.0703125, -7.9833984375, -6.896484375, -5.8095703125, -4.72265625, -3.6357421875, -2.548828125, -1.4619140625, -0.375, 0.7119140625, 1.798828125, 2.8857421875, 3.97265625, 5.0595703125, 6.146484375, 7.2333984375, 8.3203125, 9.4072265625, 10.494140625, 11.5810546875, 12.66796875, 13.7548828125, 14.841796875, 15.9287109375, 17.015625, 18.1025390625, 19.189453125, 20.2763671875, 21.36328125, 22.4501953125, 23.537109375, 24.6240234375, 25.7109375, 26.7978515625, 27.884765625, 28.9716796875, 30.05859375, 31.1455078125, 32.232421875, 33.3193359375, 34.40625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 9.0, 5.0, 11.0, 14.0, 12.0, 17.0, 26.0, 27.0, 51.0, 83.0, 105.0, 147.0, 159.0, 101.0, 71.0, 48.0, 29.0, 33.0, 10.0, 13.0, 7.0, 3.0, 3.0, 6.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00144195556640625, -0.0013995617628097534, -0.0013571679592132568, -0.0013147741556167603, -0.0012723803520202637, -0.001229986548423767, -0.0011875927448272705, -0.001145198941230774, -0.0011028051376342773, -0.0010604113340377808, -0.0010180175304412842, -0.0009756237268447876, -0.000933229923248291, -0.0008908361196517944, -0.0008484423160552979, -0.0008060485124588013, -0.0007636547088623047, -0.0007212609052658081, -0.0006788671016693115, -0.0006364732980728149, -0.0005940794944763184, -0.0005516856908798218, -0.0005092918872833252, -0.0004668980836868286, -0.00042450428009033203, -0.00038211047649383545, -0.00033971667289733887, -0.0002973228693008423, -0.0002549290657043457, -0.00021253526210784912, -0.00017014145851135254, -0.00012774765491485596, -8.535385131835938e-05, -4.296004772186279e-05, -5.662441253662109e-07, 4.182755947113037e-05, 8.422136306762695e-05, 0.00012661516666412354, 0.00016900897026062012, 0.0002114027738571167, 0.0002537965774536133, 0.00029619038105010986, 0.00033858418464660645, 0.00038097798824310303, 0.0004233717918395996, 0.0004657655954360962, 0.0005081593990325928, 0.0005505532026290894, 0.0005929470062255859, 0.0006353408098220825, 0.0006777346134185791, 0.0007201284170150757, 0.0007625222206115723, 0.0008049160242080688, 0.0008473098278045654, 0.000889703631401062, 0.0009320974349975586, 0.0009744912385940552, 0.0010168850421905518, 0.0010592788457870483, 0.001101672649383545, 0.0011440664529800415, 0.001186460256576538, 0.0012288540601730347, 0.0012712478637695312]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 6.0, 10.0, 10.0, 16.0, 31.0, 39.0, 57.0, 73.0, 99.0, 189.0, 332.0, 494.0, 914.0, 1710.0, 3479.0, 8469.0, 28019.0, 185911.0, 720761.0, 70465.0, 16113.0, 5742.0, 2515.0, 1267.0, 725.0, 397.0, 272.0, 151.0, 87.0, 66.0, 39.0, 26.0, 14.0, 16.0, 13.0, 6.0, 7.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.125, -19.437744140625, -18.75048828125, -18.063232421875, -17.3759765625, -16.688720703125, -16.00146484375, -15.314208984375, -14.626953125, -13.939697265625, -13.25244140625, -12.565185546875, -11.8779296875, -11.190673828125, -10.50341796875, -9.816162109375, -9.12890625, -8.441650390625, -7.75439453125, -7.067138671875, -6.3798828125, -5.692626953125, -5.00537109375, -4.318115234375, -3.630859375, -2.943603515625, -2.25634765625, -1.569091796875, -0.8818359375, -0.194580078125, 0.49267578125, 1.179931640625, 1.8671875, 2.554443359375, 3.24169921875, 3.928955078125, 4.6162109375, 5.303466796875, 5.99072265625, 6.677978515625, 7.365234375, 8.052490234375, 8.73974609375, 9.427001953125, 10.1142578125, 10.801513671875, 11.48876953125, 12.176025390625, 12.86328125, 13.550537109375, 14.23779296875, 14.925048828125, 15.6123046875, 16.299560546875, 16.98681640625, 17.674072265625, 18.361328125, 19.048583984375, 19.73583984375, 20.423095703125, 21.1103515625, 21.797607421875, 22.48486328125, 23.172119140625, 23.859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 8.0, 8.0, 7.0, 11.0, 13.0, 12.0, 14.0, 18.0, 28.0, 33.0, 45.0, 62.0, 91.0, 103.0, 77.0, 99.0, 87.0, 72.0, 47.0, 37.0, 28.0, 21.0, 19.0, 11.0, 15.0, 7.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4017333984375, -7.158935546875, -6.9161376953125, -6.67333984375, -6.4305419921875, -6.187744140625, -5.9449462890625, -5.7021484375, -5.4593505859375, -5.216552734375, -4.9737548828125, -4.73095703125, -4.4881591796875, -4.245361328125, -4.0025634765625, -3.759765625, -3.5169677734375, -3.274169921875, -3.0313720703125, -2.78857421875, -2.5457763671875, -2.302978515625, -2.0601806640625, -1.8173828125, -1.5745849609375, -1.331787109375, -1.0889892578125, -0.84619140625, -0.6033935546875, -0.360595703125, -0.1177978515625, 0.125, 0.3677978515625, 0.610595703125, 0.8533935546875, 1.09619140625, 1.3389892578125, 1.581787109375, 1.8245849609375, 2.0673828125, 2.3101806640625, 2.552978515625, 2.7957763671875, 3.03857421875, 3.2813720703125, 3.524169921875, 3.7669677734375, 4.009765625, 4.2525634765625, 4.495361328125, 4.7381591796875, 4.98095703125, 5.2237548828125, 5.466552734375, 5.7093505859375, 5.9521484375, 6.1949462890625, 6.437744140625, 6.6805419921875, 6.92333984375, 7.1661376953125, 7.408935546875, 7.6517333984375, 7.89453125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 13.0, 19.0, 41.0, 91.0, 161.0, 254.0, 216.0, 84.0, 39.0, 23.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-159.4042205810547, -154.65611267089844, -149.90798950195312, -145.15988159179688, -140.41177368164062, -135.6636505126953, -130.91554260253906, -126.16742706298828, -121.4193115234375, -116.67119598388672, -111.92308044433594, -107.17497253417969, -102.4268569946289, -97.67874145507812, -92.93063354492188, -88.1825180053711, -83.43440246582031, -78.68628692626953, -73.93817138671875, -69.1900634765625, -64.44194793701172, -59.69383239746094, -54.94572067260742, -50.197608947753906, -45.449493408203125, -40.701377868652344, -35.95326614379883, -31.20515251159668, -26.45703887939453, -21.708925247192383, -16.960811614990234, -12.212699890136719, -7.4645843505859375, -2.716470718383789, 2.0316429138183594, 6.779756546020508, 11.527870178222656, 16.275983810424805, 21.024097442626953, 25.77220916748047, 30.52032470703125, 35.26844024658203, 40.01655197143555, 44.76466369628906, 49.512779235839844, 54.260894775390625, 59.00900650024414, 63.757118225097656, 68.50523376464844, 73.25334930419922, 78.00146484375, 82.74957275390625, 87.49768829345703, 92.24580383300781, 96.99391174316406, 101.74202728271484, 106.49014282226562, 111.2382583618164, 115.98637390136719, 120.73448181152344, 125.48259735107422, 130.230712890625, 134.97882080078125, 139.7269287109375, 144.4750518798828]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 11.0, 14.0, 9.0, 16.0, 37.0, 45.0, 48.0, 77.0, 96.0, 85.0, 98.0, 103.0, 100.0, 71.0, 54.0, 28.0, 27.0, 11.0, 8.0, 10.0, 6.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.56913757324219, -35.88054275512695, -34.19194793701172, -32.50334930419922, -30.814754486083984, -29.12615966796875, -27.437564849853516, -25.74896812438965, -24.06037139892578, -22.371776580810547, -20.68317985534668, -18.994585037231445, -17.305988311767578, -15.617393493652344, -13.928797721862793, -12.240201950073242, -10.551607131958008, -8.863011360168457, -7.174415588378906, -5.485820293426514, -3.797224521636963, -2.1086292266845703, -0.42003345489501953, 1.2685623168945312, 2.957158088684082, 4.645753860473633, 6.334349632263184, 8.022945404052734, 9.711540222167969, 11.40013599395752, 13.08873176574707, 14.777327537536621, 16.465923309326172, 18.154518127441406, 19.843114852905273, 21.531709671020508, 23.220306396484375, 24.90890121459961, 26.597496032714844, 28.28609275817871, 29.974689483642578, 31.663284301757812, 33.35187911987305, 35.04047775268555, 36.72907257080078, 38.417667388916016, 40.10626220703125, 41.79486083984375, 43.48345184326172, 45.17204666137695, 46.86064147949219, 48.54924011230469, 50.23783493041992, 51.926429748535156, 53.61502456665039, 55.303619384765625, 56.992218017578125, 58.68081283569336, 60.369407653808594, 62.058006286621094, 63.74660110473633, 65.43519592285156, 67.12379455566406, 68.81238555908203, 70.50098419189453]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 11.0, 16.0, 24.0, 18.0, 23.0, 48.0, 78.0, 103.0, 173.0, 267.0, 401.0, 627.0, 1270.0, 2313.0, 4477.0, 10148.0, 28913.0, 127150.0, 3754720.0, 201402.0, 37428.0, 12878.0, 5562.0, 2680.0, 1441.0, 790.0, 473.0, 278.0, 185.0, 116.0, 69.0, 61.0, 43.0, 23.0, 16.0, 16.0, 8.0, 7.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.4375, -17.8720703125, -17.306640625, -16.7412109375, -16.17578125, -15.6103515625, -15.044921875, -14.4794921875, -13.9140625, -13.3486328125, -12.783203125, -12.2177734375, -11.65234375, -11.0869140625, -10.521484375, -9.9560546875, -9.390625, -8.8251953125, -8.259765625, -7.6943359375, -7.12890625, -6.5634765625, -5.998046875, -5.4326171875, -4.8671875, -4.3017578125, -3.736328125, -3.1708984375, -2.60546875, -2.0400390625, -1.474609375, -0.9091796875, -0.34375, 0.2216796875, 0.787109375, 1.3525390625, 1.91796875, 2.4833984375, 3.048828125, 3.6142578125, 4.1796875, 4.7451171875, 5.310546875, 5.8759765625, 6.44140625, 7.0068359375, 7.572265625, 8.1376953125, 8.703125, 9.2685546875, 9.833984375, 10.3994140625, 10.96484375, 11.5302734375, 12.095703125, 12.6611328125, 13.2265625, 13.7919921875, 14.357421875, 14.9228515625, 15.48828125, 16.0537109375, 16.619140625, 17.1845703125, 17.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 6.0, 5.0, 9.0, 5.0, 16.0, 27.0, 20.0, 35.0, 67.0, 63.0, 62.0, 79.0, 75.0, 82.0, 75.0, 73.0, 56.0, 44.0, 43.0, 22.0, 34.0, 16.0, 15.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.585540771484375, -0.56658935546875, -0.547637939453125, -0.5286865234375, -0.509735107421875, -0.49078369140625, -0.471832275390625, -0.452880859375, -0.433929443359375, -0.41497802734375, -0.396026611328125, -0.3770751953125, -0.358123779296875, -0.33917236328125, -0.320220947265625, -0.30126953125, -0.282318115234375, -0.26336669921875, -0.244415283203125, -0.2254638671875, -0.206512451171875, -0.18756103515625, -0.168609619140625, -0.149658203125, -0.130706787109375, -0.11175537109375, -0.092803955078125, -0.0738525390625, -0.054901123046875, -0.03594970703125, -0.016998291015625, 0.001953125, 0.020904541015625, 0.03985595703125, 0.058807373046875, 0.0777587890625, 0.096710205078125, 0.11566162109375, 0.134613037109375, 0.153564453125, 0.172515869140625, 0.19146728515625, 0.210418701171875, 0.2293701171875, 0.248321533203125, 0.26727294921875, 0.286224365234375, 0.30517578125, 0.324127197265625, 0.34307861328125, 0.362030029296875, 0.3809814453125, 0.399932861328125, 0.41888427734375, 0.437835693359375, 0.456787109375, 0.475738525390625, 0.49468994140625, 0.513641357421875, 0.5325927734375, 0.551544189453125, 0.57049560546875, 0.589447021484375, 0.6083984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 11.0, 19.0, 23.0, 24.0, 48.0, 86.0, 111.0, 164.0, 307.0, 532.0, 929.0, 1996.0, 4814.0, 13455.0, 50275.0, 713669.0, 3315179.0, 65434.0, 16556.0, 5683.0, 2394.0, 1110.0, 596.0, 322.0, 176.0, 145.0, 63.0, 48.0, 27.0, 18.0, 22.0, 10.0, 8.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.757568359375, -18.93701171875, -18.116455078125, -17.2958984375, -16.475341796875, -15.65478515625, -14.834228515625, -14.013671875, -13.193115234375, -12.37255859375, -11.552001953125, -10.7314453125, -9.910888671875, -9.09033203125, -8.269775390625, -7.44921875, -6.628662109375, -5.80810546875, -4.987548828125, -4.1669921875, -3.346435546875, -2.52587890625, -1.705322265625, -0.884765625, -0.064208984375, 0.75634765625, 1.576904296875, 2.3974609375, 3.218017578125, 4.03857421875, 4.859130859375, 5.6796875, 6.500244140625, 7.32080078125, 8.141357421875, 8.9619140625, 9.782470703125, 10.60302734375, 11.423583984375, 12.244140625, 13.064697265625, 13.88525390625, 14.705810546875, 15.5263671875, 16.346923828125, 17.16748046875, 17.988037109375, 18.80859375, 19.629150390625, 20.44970703125, 21.270263671875, 22.0908203125, 22.911376953125, 23.73193359375, 24.552490234375, 25.373046875, 26.193603515625, 27.01416015625, 27.834716796875, 28.6552734375, 29.475830078125, 30.29638671875, 31.116943359375, 31.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 0.0, 9.0, 14.0, 13.0, 11.0, 18.0, 33.0, 30.0, 50.0, 65.0, 140.0, 435.0, 2216.0, 512.0, 171.0, 91.0, 69.0, 37.0, 35.0, 25.0, 26.0, 18.0, 11.0, 11.0, 7.0, 6.0, 1.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.00390625, -1.92242431640625, -1.8409423828125, -1.75946044921875, -1.677978515625, -1.59649658203125, -1.5150146484375, -1.43353271484375, -1.35205078125, -1.27056884765625, -1.1890869140625, -1.10760498046875, -1.026123046875, -0.94464111328125, -0.8631591796875, -0.78167724609375, -0.7001953125, -0.61871337890625, -0.5372314453125, -0.45574951171875, -0.374267578125, -0.29278564453125, -0.2113037109375, -0.12982177734375, -0.04833984375, 0.03314208984375, 0.1146240234375, 0.19610595703125, 0.277587890625, 0.35906982421875, 0.4405517578125, 0.52203369140625, 0.603515625, 0.68499755859375, 0.7664794921875, 0.84796142578125, 0.929443359375, 1.01092529296875, 1.0924072265625, 1.17388916015625, 1.25537109375, 1.33685302734375, 1.4183349609375, 1.49981689453125, 1.581298828125, 1.66278076171875, 1.7442626953125, 1.82574462890625, 1.9072265625, 1.98870849609375, 2.0701904296875, 2.15167236328125, 2.233154296875, 2.31463623046875, 2.3961181640625, 2.47760009765625, 2.55908203125, 2.64056396484375, 2.7220458984375, 2.80352783203125, 2.885009765625, 2.96649169921875, 3.0479736328125, 3.12945556640625, 3.2109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 13.0, 37.0, 97.0, 250.0, 315.0, 160.0, 64.0, 32.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46794509887695, -42.033355712890625, -40.59877014160156, -39.1641845703125, -37.72959518432617, -36.295005798339844, -34.86042022705078, -33.42583465576172, -31.99124526977539, -30.556657791137695, -29.1220703125, -27.687482833862305, -26.25289535522461, -24.818307876586914, -23.38372039794922, -21.949132919311523, -20.514545440673828, -19.079957962036133, -17.645370483398438, -16.210783004760742, -14.776195526123047, -13.341608047485352, -11.907020568847656, -10.472433090209961, -9.037845611572266, -7.60325813293457, -6.168670654296875, -4.73408317565918, -3.2994956970214844, -1.864908218383789, -0.43032073974609375, 1.0042667388916016, 2.438854217529297, 3.873441696166992, 5.3080291748046875, 6.742616653442383, 8.177204132080078, 9.611791610717773, 11.046379089355469, 12.480966567993164, 13.91555404663086, 15.350141525268555, 16.78472900390625, 18.219316482543945, 19.65390396118164, 21.088491439819336, 22.52307891845703, 23.957666397094727, 25.392253875732422, 26.826841354370117, 28.261428833007812, 29.696016311645508, 31.130603790283203, 32.56519317626953, 33.999778747558594, 35.434364318847656, 36.868953704833984, 38.30354309082031, 39.738128662109375, 41.17271423339844, 42.607303619384766, 44.041893005371094, 45.476478576660156, 46.91106414794922, 48.34565353393555]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 2.0, 8.0, 11.0, 9.0, 15.0, 20.0, 25.0, 36.0, 35.0, 54.0, 75.0, 71.0, 78.0, 82.0, 77.0, 67.0, 75.0, 53.0, 39.0, 46.0, 34.0, 33.0, 19.0, 11.0, 12.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.599422454833984, -12.184976577758789, -11.770530700683594, -11.356084823608398, -10.941638946533203, -10.527193069458008, -10.112747192382812, -9.6983003616333, -9.283854484558105, -8.86940860748291, -8.454962730407715, -8.04051685333252, -7.626070499420166, -7.211624622344971, -6.797178745269775, -6.382732391357422, -5.968286991119385, -5.5538411140441895, -5.139395236968994, -4.724948883056641, -4.310503005981445, -3.89605712890625, -3.4816112518310547, -3.0671651363372803, -2.652719259262085, -2.2382733821868896, -1.8238272666931152, -1.40938138961792, -0.9949353933334351, -0.5804893970489502, -0.16604351997375488, 0.24840259552001953, 0.6628484725952148, 1.0772944688796997, 1.4917404651641846, 1.9061863422393799, 2.3206324577331543, 2.7350783348083496, 3.149524211883545, 3.5639703273773193, 3.9784162044525146, 4.392862319946289, 4.807308197021484, 5.22175407409668, 5.636199951171875, 6.05064582824707, 6.465091705322266, 6.879538059234619, 7.2939839363098145, 7.70842981338501, 8.122876167297363, 8.537322044372559, 8.951767921447754, 9.36621379852295, 9.780659675598145, 10.19510555267334, 10.609551429748535, 11.02399730682373, 11.438443183898926, 11.852889060974121, 12.267334938049316, 12.681781768798828, 13.096227645874023, 13.510673522949219, 13.925119400024414]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 10.0, 13.0, 19.0, 14.0, 37.0, 37.0, 71.0, 86.0, 119.0, 173.0, 257.0, 410.0, 590.0, 1020.0, 1607.0, 2785.0, 4905.0, 9428.0, 19405.0, 44453.0, 112755.0, 291041.0, 328866.0, 132831.0, 51588.0, 22066.0, 10695.0, 5498.0, 3031.0, 1768.0, 1001.0, 673.0, 392.0, 276.0, 204.0, 134.0, 91.0, 59.0, 31.0, 34.0, 30.0, 11.0, 11.0, 9.0, 9.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.55859375, -7.322998046875, -7.08740234375, -6.851806640625, -6.6162109375, -6.380615234375, -6.14501953125, -5.909423828125, -5.673828125, -5.438232421875, -5.20263671875, -4.967041015625, -4.7314453125, -4.495849609375, -4.26025390625, -4.024658203125, -3.7890625, -3.553466796875, -3.31787109375, -3.082275390625, -2.8466796875, -2.611083984375, -2.37548828125, -2.139892578125, -1.904296875, -1.668701171875, -1.43310546875, -1.197509765625, -0.9619140625, -0.726318359375, -0.49072265625, -0.255126953125, -0.01953125, 0.216064453125, 0.45166015625, 0.687255859375, 0.9228515625, 1.158447265625, 1.39404296875, 1.629638671875, 1.865234375, 2.100830078125, 2.33642578125, 2.572021484375, 2.8076171875, 3.043212890625, 3.27880859375, 3.514404296875, 3.75, 3.985595703125, 4.22119140625, 4.456787109375, 4.6923828125, 4.927978515625, 5.16357421875, 5.399169921875, 5.634765625, 5.870361328125, 6.10595703125, 6.341552734375, 6.5771484375, 6.812744140625, 7.04833984375, 7.283935546875, 7.51953125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 13.0, 12.0, 9.0, 27.0, 22.0, 41.0, 43.0, 56.0, 49.0, 63.0, 73.0, 71.0, 76.0, 74.0, 62.0, 59.0, 56.0, 39.0, 40.0, 23.0, 18.0, 10.0, 10.0, 7.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.7919921875, -0.7708740234375, -0.749755859375, -0.7286376953125, -0.70751953125, -0.6864013671875, -0.665283203125, -0.6441650390625, -0.623046875, -0.6019287109375, -0.580810546875, -0.5596923828125, -0.53857421875, -0.5174560546875, -0.496337890625, -0.4752197265625, -0.4541015625, -0.4329833984375, -0.411865234375, -0.3907470703125, -0.36962890625, -0.3485107421875, -0.327392578125, -0.3062744140625, -0.28515625, -0.2640380859375, -0.242919921875, -0.2218017578125, -0.20068359375, -0.1795654296875, -0.158447265625, -0.1373291015625, -0.1162109375, -0.0950927734375, -0.073974609375, -0.0528564453125, -0.03173828125, -0.0106201171875, 0.010498046875, 0.0316162109375, 0.052734375, 0.0738525390625, 0.094970703125, 0.1160888671875, 0.13720703125, 0.1583251953125, 0.179443359375, 0.2005615234375, 0.2216796875, 0.2427978515625, 0.263916015625, 0.2850341796875, 0.30615234375, 0.3272705078125, 0.348388671875, 0.3695068359375, 0.390625, 0.4117431640625, 0.432861328125, 0.4539794921875, 0.47509765625, 0.4962158203125, 0.517333984375, 0.5384521484375, 0.5595703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 6.0, 13.0, 14.0, 23.0, 18.0, 29.0, 52.0, 65.0, 82.0, 144.0, 209.0, 326.0, 638.0, 1156.0, 2301.0, 5158.0, 13103.0, 40862.0, 175338.0, 571536.0, 174208.0, 40211.0, 12859.0, 5101.0, 2322.0, 1206.0, 581.0, 343.0, 208.0, 149.0, 87.0, 50.0, 30.0, 37.0, 25.0, 10.0, 11.0, 9.0, 11.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-9.3515625, -9.0723876953125, -8.793212890625, -8.5140380859375, -8.23486328125, -7.9556884765625, -7.676513671875, -7.3973388671875, -7.1181640625, -6.8389892578125, -6.559814453125, -6.2806396484375, -6.00146484375, -5.7222900390625, -5.443115234375, -5.1639404296875, -4.884765625, -4.6055908203125, -4.326416015625, -4.0472412109375, -3.76806640625, -3.4888916015625, -3.209716796875, -2.9305419921875, -2.6513671875, -2.3721923828125, -2.093017578125, -1.8138427734375, -1.53466796875, -1.2554931640625, -0.976318359375, -0.6971435546875, -0.41796875, -0.1387939453125, 0.140380859375, 0.4195556640625, 0.69873046875, 0.9779052734375, 1.257080078125, 1.5362548828125, 1.8154296875, 2.0946044921875, 2.373779296875, 2.6529541015625, 2.93212890625, 3.2113037109375, 3.490478515625, 3.7696533203125, 4.048828125, 4.3280029296875, 4.607177734375, 4.8863525390625, 5.16552734375, 5.4447021484375, 5.723876953125, 6.0030517578125, 6.2822265625, 6.5614013671875, 6.840576171875, 7.1197509765625, 7.39892578125, 7.6781005859375, 7.957275390625, 8.2364501953125, 8.515625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 8.0, 9.0, 5.0, 9.0, 16.0, 16.0, 23.0, 27.0, 16.0, 29.0, 21.0, 40.0, 41.0, 46.0, 40.0, 39.0, 44.0, 48.0, 50.0, 52.0, 46.0, 45.0, 46.0, 55.0, 30.0, 34.0, 22.0, 18.0, 22.0, 19.0, 15.0, 19.0, 12.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.970703125, -2.883209228515625, -2.79571533203125, -2.708221435546875, -2.6207275390625, -2.533233642578125, -2.44573974609375, -2.358245849609375, -2.270751953125, -2.183258056640625, -2.09576416015625, -2.008270263671875, -1.9207763671875, -1.833282470703125, -1.74578857421875, -1.658294677734375, -1.57080078125, -1.483306884765625, -1.39581298828125, -1.308319091796875, -1.2208251953125, -1.133331298828125, -1.04583740234375, -0.958343505859375, -0.870849609375, -0.783355712890625, -0.69586181640625, -0.608367919921875, -0.5208740234375, -0.433380126953125, -0.34588623046875, -0.258392333984375, -0.1708984375, -0.083404541015625, 0.00408935546875, 0.091583251953125, 0.1790771484375, 0.266571044921875, 0.35406494140625, 0.441558837890625, 0.529052734375, 0.616546630859375, 0.70404052734375, 0.791534423828125, 0.8790283203125, 0.966522216796875, 1.05401611328125, 1.141510009765625, 1.22900390625, 1.316497802734375, 1.40399169921875, 1.491485595703125, 1.5789794921875, 1.666473388671875, 1.75396728515625, 1.841461181640625, 1.928955078125, 2.016448974609375, 2.10394287109375, 2.191436767578125, 2.2789306640625, 2.366424560546875, 2.45391845703125, 2.541412353515625, 2.62890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 6.0, 11.0, 11.0, 15.0, 28.0, 38.0, 74.0, 107.0, 222.0, 462.0, 1097.0, 3103.0, 11119.0, 63372.0, 780147.0, 161772.0, 19332.0, 4744.0, 1603.0, 608.0, 284.0, 151.0, 85.0, 58.0, 30.0, 21.0, 12.0, 11.0, 8.0, 1.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.71875, -16.222412109375, -15.72607421875, -15.229736328125, -14.7333984375, -14.237060546875, -13.74072265625, -13.244384765625, -12.748046875, -12.251708984375, -11.75537109375, -11.259033203125, -10.7626953125, -10.266357421875, -9.77001953125, -9.273681640625, -8.77734375, -8.281005859375, -7.78466796875, -7.288330078125, -6.7919921875, -6.295654296875, -5.79931640625, -5.302978515625, -4.806640625, -4.310302734375, -3.81396484375, -3.317626953125, -2.8212890625, -2.324951171875, -1.82861328125, -1.332275390625, -0.8359375, -0.339599609375, 0.15673828125, 0.653076171875, 1.1494140625, 1.645751953125, 2.14208984375, 2.638427734375, 3.134765625, 3.631103515625, 4.12744140625, 4.623779296875, 5.1201171875, 5.616455078125, 6.11279296875, 6.609130859375, 7.10546875, 7.601806640625, 8.09814453125, 8.594482421875, 9.0908203125, 9.587158203125, 10.08349609375, 10.579833984375, 11.076171875, 11.572509765625, 12.06884765625, 12.565185546875, 13.0615234375, 13.557861328125, 14.05419921875, 14.550537109375, 15.046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 7.0, 10.0, 11.0, 14.0, 24.0, 31.0, 43.0, 56.0, 89.0, 94.0, 121.0, 121.0, 89.0, 64.0, 68.0, 47.0, 35.0, 14.0, 11.0, 12.0, 14.0, 9.0, 4.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007572174072265625, -0.000734969973564148, -0.0007127225399017334, -0.0006904751062393188, -0.0006682276725769043, -0.0006459802389144897, -0.0006237328052520752, -0.0006014853715896606, -0.0005792379379272461, -0.0005569905042648315, -0.000534743070602417, -0.0005124956369400024, -0.0004902482032775879, -0.00046800076961517334, -0.0004457533359527588, -0.00042350590229034424, -0.0004012584686279297, -0.00037901103496551514, -0.0003567636013031006, -0.00033451616764068604, -0.0003122687339782715, -0.00029002130031585693, -0.0002677738666534424, -0.00024552643299102783, -0.00022327899932861328, -0.00020103156566619873, -0.00017878413200378418, -0.00015653669834136963, -0.00013428926467895508, -0.00011204183101654053, -8.979439735412598e-05, -6.754696369171143e-05, -4.5299530029296875e-05, -2.3052096366882324e-05, -8.046627044677734e-07, 2.1442770957946777e-05, 4.369020462036133e-05, 6.593763828277588e-05, 8.818507194519043e-05, 0.00011043250560760498, 0.00013267993927001953, 0.00015492737293243408, 0.00017717480659484863, 0.00019942224025726318, 0.00022166967391967773, 0.00024391710758209229, 0.00026616454124450684, 0.0002884119749069214, 0.00031065940856933594, 0.0003329068422317505, 0.00035515427589416504, 0.0003774017095565796, 0.00039964914321899414, 0.0004218965768814087, 0.00044414401054382324, 0.0004663914442062378, 0.0004886388778686523, 0.0005108863115310669, 0.0005331337451934814, 0.000555381178855896, 0.0005776286125183105, 0.0005998760461807251, 0.0006221234798431396, 0.0006443709135055542, 0.0006666183471679688]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 13.0, 22.0, 25.0, 33.0, 41.0, 70.0, 105.0, 159.0, 291.0, 521.0, 1001.0, 2069.0, 4595.0, 13129.0, 54665.0, 504876.0, 401235.0, 45932.0, 11664.0, 4221.0, 1785.0, 903.0, 500.0, 247.0, 162.0, 92.0, 60.0, 34.0, 18.0, 20.0, 14.0, 13.0, 9.0, 7.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.9453125, -9.601806640625, -9.25830078125, -8.914794921875, -8.5712890625, -8.227783203125, -7.88427734375, -7.540771484375, -7.197265625, -6.853759765625, -6.51025390625, -6.166748046875, -5.8232421875, -5.479736328125, -5.13623046875, -4.792724609375, -4.44921875, -4.105712890625, -3.76220703125, -3.418701171875, -3.0751953125, -2.731689453125, -2.38818359375, -2.044677734375, -1.701171875, -1.357666015625, -1.01416015625, -0.670654296875, -0.3271484375, 0.016357421875, 0.35986328125, 0.703369140625, 1.046875, 1.390380859375, 1.73388671875, 2.077392578125, 2.4208984375, 2.764404296875, 3.10791015625, 3.451416015625, 3.794921875, 4.138427734375, 4.48193359375, 4.825439453125, 5.1689453125, 5.512451171875, 5.85595703125, 6.199462890625, 6.54296875, 6.886474609375, 7.22998046875, 7.573486328125, 7.9169921875, 8.260498046875, 8.60400390625, 8.947509765625, 9.291015625, 9.634521484375, 9.97802734375, 10.321533203125, 10.6650390625, 11.008544921875, 11.35205078125, 11.695556640625, 12.0390625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 10.0, 9.0, 7.0, 21.0, 22.0, 22.0, 24.0, 34.0, 62.0, 61.0, 85.0, 93.0, 115.0, 92.0, 83.0, 54.0, 47.0, 33.0, 21.0, 19.0, 11.0, 11.0, 9.0, 6.0, 6.0, 5.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.32421875, -4.20233154296875, -4.0804443359375, -3.95855712890625, -3.836669921875, -3.71478271484375, -3.5928955078125, -3.47100830078125, -3.34912109375, -3.22723388671875, -3.1053466796875, -2.98345947265625, -2.861572265625, -2.73968505859375, -2.6177978515625, -2.49591064453125, -2.3740234375, -2.25213623046875, -2.1302490234375, -2.00836181640625, -1.886474609375, -1.76458740234375, -1.6427001953125, -1.52081298828125, -1.39892578125, -1.27703857421875, -1.1551513671875, -1.03326416015625, -0.911376953125, -0.78948974609375, -0.6676025390625, -0.54571533203125, -0.423828125, -0.30194091796875, -0.1800537109375, -0.05816650390625, 0.063720703125, 0.18560791015625, 0.3074951171875, 0.42938232421875, 0.55126953125, 0.67315673828125, 0.7950439453125, 0.91693115234375, 1.038818359375, 1.16070556640625, 1.2825927734375, 1.40447998046875, 1.5263671875, 1.64825439453125, 1.7701416015625, 1.89202880859375, 2.013916015625, 2.13580322265625, 2.2576904296875, 2.37957763671875, 2.50146484375, 2.62335205078125, 2.7452392578125, 2.86712646484375, 2.989013671875, 3.11090087890625, 3.2327880859375, 3.35467529296875, 3.4765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 25.0, 48.0, 113.0, 276.0, 307.0, 132.0, 51.0, 17.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.13977813720703, -121.0463638305664, -117.95295715332031, -114.85954284667969, -111.7661361694336, -108.67272186279297, -105.57931518554688, -102.48590087890625, -99.39248657226562, -96.299072265625, -93.2056655883789, -90.11225128173828, -87.01884460449219, -83.92543029785156, -80.83201599121094, -77.73860931396484, -74.64520263671875, -71.55178833007812, -68.45838165283203, -65.3649673461914, -62.27156066894531, -59.17814636230469, -56.08473587036133, -52.99132537841797, -49.89791488647461, -46.80450439453125, -43.71109390258789, -40.61768341064453, -37.524269104003906, -34.43086242675781, -31.337448120117188, -28.244037628173828, -25.15062713623047, -22.05721664428711, -18.96380615234375, -15.870393753051758, -12.776983261108398, -9.683572769165039, -6.590160369873047, -3.4967498779296875, -0.4033393859863281, 2.6900715827941895, 5.783482551574707, 8.876893997192383, 11.970304489135742, 15.063714981079102, 18.157127380371094, 21.250537872314453, 24.343948364257812, 27.437358856201172, 30.53076934814453, 33.624183654785156, 36.71759033203125, 39.811004638671875, 42.904415130615234, 45.997825622558594, 49.09123611450195, 52.18464660644531, 55.27805709838867, 58.37146759033203, 61.464881896972656, 64.55828857421875, 67.65170288085938, 70.7451171875, 73.8385238647461]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 1.0, 3.0, 1.0, 6.0, 8.0, 5.0, 8.0, 12.0, 15.0, 14.0, 25.0, 20.0, 40.0, 45.0, 61.0, 52.0, 59.0, 48.0, 62.0, 74.0, 78.0, 52.0, 57.0, 53.0, 44.0, 31.0, 22.0, 22.0, 17.0, 12.0, 9.0, 12.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.982357025146484, -21.205860137939453, -20.429365158081055, -19.652868270874023, -18.876371383666992, -18.099876403808594, -17.323379516601562, -16.54688262939453, -15.770386695861816, -14.993890762329102, -14.21739387512207, -13.440897941589355, -12.66440200805664, -11.88790512084961, -11.111409187316895, -10.33491325378418, -9.558416366577148, -8.781920433044434, -8.005423545837402, -7.2289276123046875, -6.4524312019348145, -5.675934791564941, -4.899438858032227, -4.1229424476623535, -3.3464460372924805, -2.5699496269226074, -1.7934534549713135, -1.0169572830200195, -0.24046087265014648, 0.5360355377197266, 1.3125314712524414, 2.0890278816223145, 2.8655242919921875, 3.6420207023620605, 4.418517112731934, 5.195013046264648, 5.9715094566345215, 6.7480058670043945, 7.524501800537109, 8.30099868774414, 9.077494621276855, 9.85399055480957, 10.630487442016602, 11.406983375549316, 12.183479309082031, 12.959976196289062, 13.736472129821777, 14.512968063354492, 15.289464950561523, 16.065961837768555, 16.842456817626953, 17.618953704833984, 18.395450592041016, 19.171947479248047, 19.948442459106445, 20.724939346313477, 21.501434326171875, 22.277931213378906, 23.054426193237305, 23.830923080444336, 24.607419967651367, 25.383914947509766, 26.160411834716797, 26.936908721923828, 27.71340560913086]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 10.0, 17.0, 19.0, 21.0, 36.0, 50.0, 79.0, 124.0, 156.0, 243.0, 380.0, 584.0, 1045.0, 1801.0, 3072.0, 5922.0, 11857.0, 27102.0, 80262.0, 2759214.0, 1176952.0, 74624.0, 26264.0, 11746.0, 5702.0, 2887.0, 1576.0, 921.0, 547.0, 338.0, 203.0, 150.0, 96.0, 76.0, 47.0, 24.0, 39.0, 19.0, 12.0, 14.0, 11.0, 8.0, 10.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-12.453125, -12.008056640625, -11.56298828125, -11.117919921875, -10.6728515625, -10.227783203125, -9.78271484375, -9.337646484375, -8.892578125, -8.447509765625, -8.00244140625, -7.557373046875, -7.1123046875, -6.667236328125, -6.22216796875, -5.777099609375, -5.33203125, -4.886962890625, -4.44189453125, -3.996826171875, -3.5517578125, -3.106689453125, -2.66162109375, -2.216552734375, -1.771484375, -1.326416015625, -0.88134765625, -0.436279296875, 0.0087890625, 0.453857421875, 0.89892578125, 1.343994140625, 1.7890625, 2.234130859375, 2.67919921875, 3.124267578125, 3.5693359375, 4.014404296875, 4.45947265625, 4.904541015625, 5.349609375, 5.794677734375, 6.23974609375, 6.684814453125, 7.1298828125, 7.574951171875, 8.02001953125, 8.465087890625, 8.91015625, 9.355224609375, 9.80029296875, 10.245361328125, 10.6904296875, 11.135498046875, 11.58056640625, 12.025634765625, 12.470703125, 12.915771484375, 13.36083984375, 13.805908203125, 14.2509765625, 14.696044921875, 15.14111328125, 15.586181640625, 16.03125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 8.0, 5.0, 7.0, 13.0, 14.0, 25.0, 28.0, 47.0, 36.0, 60.0, 89.0, 77.0, 98.0, 106.0, 81.0, 71.0, 68.0, 52.0, 40.0, 20.0, 15.0, 17.0, 6.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7275390625, -0.7003326416015625, -0.673126220703125, -0.6459197998046875, -0.61871337890625, -0.5915069580078125, -0.564300537109375, -0.5370941162109375, -0.5098876953125, -0.4826812744140625, -0.455474853515625, -0.4282684326171875, -0.40106201171875, -0.3738555908203125, -0.346649169921875, -0.3194427490234375, -0.292236328125, -0.2650299072265625, -0.237823486328125, -0.2106170654296875, -0.18341064453125, -0.1562042236328125, -0.128997802734375, -0.1017913818359375, -0.0745849609375, -0.0473785400390625, -0.020172119140625, 0.0070343017578125, 0.03424072265625, 0.0614471435546875, 0.088653564453125, 0.1158599853515625, 0.14306640625, 0.1702728271484375, 0.197479248046875, 0.2246856689453125, 0.25189208984375, 0.2790985107421875, 0.306304931640625, 0.3335113525390625, 0.3607177734375, 0.3879241943359375, 0.415130615234375, 0.4423370361328125, 0.46954345703125, 0.4967498779296875, 0.523956298828125, 0.5511627197265625, 0.578369140625, 0.6055755615234375, 0.632781982421875, 0.6599884033203125, 0.68719482421875, 0.7144012451171875, 0.741607666015625, 0.7688140869140625, 0.7960205078125, 0.8232269287109375, 0.850433349609375, 0.8776397705078125, 0.90484619140625, 0.9320526123046875, 0.959259033203125, 0.9864654541015625, 1.013671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 6.0, 13.0, 27.0, 35.0, 80.0, 134.0, 233.0, 538.0, 1726.0, 7469.0, 50294.0, 3926368.0, 185196.0, 17111.0, 3341.0, 971.0, 356.0, 155.0, 90.0, 38.0, 40.0, 14.0, 16.0, 12.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.30322265625, -37.9814453125, -36.65966796875, -35.337890625, -34.01611328125, -32.6943359375, -31.37255859375, -30.05078125, -28.72900390625, -27.4072265625, -26.08544921875, -24.763671875, -23.44189453125, -22.1201171875, -20.79833984375, -19.4765625, -18.15478515625, -16.8330078125, -15.51123046875, -14.189453125, -12.86767578125, -11.5458984375, -10.22412109375, -8.90234375, -7.58056640625, -6.2587890625, -4.93701171875, -3.615234375, -2.29345703125, -0.9716796875, 0.35009765625, 1.671875, 2.99365234375, 4.3154296875, 5.63720703125, 6.958984375, 8.28076171875, 9.6025390625, 10.92431640625, 12.24609375, 13.56787109375, 14.8896484375, 16.21142578125, 17.533203125, 18.85498046875, 20.1767578125, 21.49853515625, 22.8203125, 24.14208984375, 25.4638671875, 26.78564453125, 28.107421875, 29.42919921875, 30.7509765625, 32.07275390625, 33.39453125, 34.71630859375, 36.0380859375, 37.35986328125, 38.681640625, 40.00341796875, 41.3251953125, 42.64697265625, 43.96875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 6.0, 6.0, 12.0, 11.0, 12.0, 12.0, 19.0, 28.0, 25.0, 35.0, 53.0, 84.0, 130.0, 282.0, 1668.0, 994.0, 274.0, 106.0, 74.0, 55.0, 35.0, 22.0, 26.0, 15.0, 13.0, 14.0, 13.0, 5.0, 7.0, 8.0, 7.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.3125, -2.242279052734375, -2.17205810546875, -2.101837158203125, -2.0316162109375, -1.961395263671875, -1.89117431640625, -1.820953369140625, -1.750732421875, -1.680511474609375, -1.61029052734375, -1.540069580078125, -1.4698486328125, -1.399627685546875, -1.32940673828125, -1.259185791015625, -1.18896484375, -1.118743896484375, -1.04852294921875, -0.978302001953125, -0.9080810546875, -0.837860107421875, -0.76763916015625, -0.697418212890625, -0.627197265625, -0.556976318359375, -0.48675537109375, -0.416534423828125, -0.3463134765625, -0.276092529296875, -0.20587158203125, -0.135650634765625, -0.0654296875, 0.004791259765625, 0.07501220703125, 0.145233154296875, 0.2154541015625, 0.285675048828125, 0.35589599609375, 0.426116943359375, 0.496337890625, 0.566558837890625, 0.63677978515625, 0.707000732421875, 0.7772216796875, 0.847442626953125, 0.91766357421875, 0.987884521484375, 1.05810546875, 1.128326416015625, 1.19854736328125, 1.268768310546875, 1.3389892578125, 1.409210205078125, 1.47943115234375, 1.549652099609375, 1.619873046875, 1.690093994140625, 1.76031494140625, 1.830535888671875, 1.9007568359375, 1.970977783203125, 2.04119873046875, 2.111419677734375, 2.181640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 7.0, 11.0, 17.0, 25.0, 37.0, 49.0, 65.0, 111.0, 168.0, 158.0, 122.0, 75.0, 55.0, 29.0, 21.0, 11.0, 7.0, 6.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.633610725402832, -12.007352828979492, -11.381093978881836, -10.754836082458496, -10.128578186035156, -9.502320289611816, -8.876062393188477, -8.24980354309082, -7.6235456466674805, -6.997287750244141, -6.371029376983643, -5.7447710037231445, -5.118513107299805, -4.492255210876465, -3.865996837615967, -3.2397384643554688, -2.613480567932129, -1.98722243309021, -1.360964298248291, -0.7347061634063721, -0.10844802856445312, 0.5178101062774658, 1.1440682411193848, 1.7703266143798828, 2.3965845108032227, 3.0228426456451416, 3.6491007804870605, 4.275359153747559, 4.901617050170898, 5.527874946594238, 6.154133319854736, 6.780391693115234, 7.406648635864258, 8.032906532287598, 8.659164428710938, 9.285423278808594, 9.911681175231934, 10.537939071655273, 11.16419792175293, 11.79045581817627, 12.41671371459961, 13.04297161102295, 13.669229507446289, 14.295488357543945, 14.921746253967285, 15.548004150390625, 16.17426300048828, 16.800521850585938, 17.42677879333496, 18.053037643432617, 18.67929458618164, 19.305553436279297, 19.931812286376953, 20.558069229125977, 21.184328079223633, 21.810585021972656, 22.436843872070312, 23.06310272216797, 23.689359664916992, 24.31561851501465, 24.941875457763672, 25.568134307861328, 26.194393157958984, 26.82065200805664, 27.446908950805664]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 4.0, 9.0, 7.0, 8.0, 10.0, 18.0, 30.0, 18.0, 26.0, 30.0, 37.0, 36.0, 45.0, 47.0, 45.0, 54.0, 56.0, 44.0, 55.0, 36.0, 52.0, 53.0, 38.0, 41.0, 32.0, 25.0, 27.0, 24.0, 11.0, 14.0, 18.0, 11.0, 10.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.850435256958008, -9.578157424926758, -9.305879592895508, -9.033601760864258, -8.761323928833008, -8.489046096801758, -8.216768264770508, -7.944490909576416, -7.672213077545166, -7.399935245513916, -7.127657413482666, -6.855379581451416, -6.583102226257324, -6.310824394226074, -6.038546562194824, -5.766268730163574, -5.493990898132324, -5.221713066101074, -4.949435234069824, -4.677157402038574, -4.404879570007324, -4.132601737976074, -3.8603243827819824, -3.5880465507507324, -3.3157687187194824, -3.0434908866882324, -2.7712130546569824, -2.4989354610443115, -2.2266576290130615, -1.9543797969818115, -1.682102084159851, -1.4098243713378906, -1.1375455856323242, -0.865267813205719, -0.5929900407791138, -0.32071226835250854, -0.04843449592590332, 0.22384333610534668, 0.49612104892730713, 0.7683987617492676, 1.0406765937805176, 1.3129544258117676, 1.585232138633728, 1.8575098514556885, 2.1297876834869385, 2.4020655155181885, 2.6743431091308594, 2.9466209411621094, 3.2188987731933594, 3.4911766052246094, 3.7634544372558594, 4.035732269287109, 4.308010101318359, 4.580287933349609, 4.852565288543701, 5.124843120574951, 5.397120952606201, 5.669398784637451, 5.941676616668701, 6.213954448699951, 6.486231803894043, 6.758509635925293, 7.030787467956543, 7.303065299987793, 7.575343132019043]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 13.0, 9.0, 19.0, 18.0, 32.0, 56.0, 74.0, 91.0, 170.0, 271.0, 473.0, 741.0, 1353.0, 2575.0, 4788.0, 9488.0, 21191.0, 50873.0, 133184.0, 340595.0, 294144.0, 110324.0, 42317.0, 18119.0, 8344.0, 4090.0, 2164.0, 1180.0, 698.0, 430.0, 249.0, 158.0, 108.0, 64.0, 47.0, 36.0, 17.0, 17.0, 9.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.9921875, -8.7103271484375, -8.428466796875, -8.1466064453125, -7.86474609375, -7.5828857421875, -7.301025390625, -7.0191650390625, -6.7373046875, -6.4554443359375, -6.173583984375, -5.8917236328125, -5.60986328125, -5.3280029296875, -5.046142578125, -4.7642822265625, -4.482421875, -4.2005615234375, -3.918701171875, -3.6368408203125, -3.35498046875, -3.0731201171875, -2.791259765625, -2.5093994140625, -2.2275390625, -1.9456787109375, -1.663818359375, -1.3819580078125, -1.10009765625, -0.8182373046875, -0.536376953125, -0.2545166015625, 0.02734375, 0.3092041015625, 0.591064453125, 0.8729248046875, 1.15478515625, 1.4366455078125, 1.718505859375, 2.0003662109375, 2.2822265625, 2.5640869140625, 2.845947265625, 3.1278076171875, 3.40966796875, 3.6915283203125, 3.973388671875, 4.2552490234375, 4.537109375, 4.8189697265625, 5.100830078125, 5.3826904296875, 5.66455078125, 5.9464111328125, 6.228271484375, 6.5101318359375, 6.7919921875, 7.0738525390625, 7.355712890625, 7.6375732421875, 7.91943359375, 8.2012939453125, 8.483154296875, 8.7650146484375, 9.046875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 10.0, 13.0, 15.0, 9.0, 21.0, 24.0, 32.0, 37.0, 44.0, 54.0, 48.0, 56.0, 58.0, 64.0, 48.0, 77.0, 54.0, 67.0, 53.0, 37.0, 31.0, 27.0, 19.0, 14.0, 14.0, 8.0, 6.0, 15.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.71044921875, -0.6915054321289062, -0.6725616455078125, -0.6536178588867188, -0.634674072265625, -0.6157302856445312, -0.5967864990234375, -0.5778427124023438, -0.55889892578125, -0.5399551391601562, -0.5210113525390625, -0.5020675659179688, -0.483123779296875, -0.46417999267578125, -0.4452362060546875, -0.42629241943359375, -0.4073486328125, -0.38840484619140625, -0.3694610595703125, -0.35051727294921875, -0.331573486328125, -0.31262969970703125, -0.2936859130859375, -0.27474212646484375, -0.25579833984375, -0.23685455322265625, -0.2179107666015625, -0.19896697998046875, -0.180023193359375, -0.16107940673828125, -0.1421356201171875, -0.12319183349609375, -0.104248046875, -0.08530426025390625, -0.0663604736328125, -0.04741668701171875, -0.028472900390625, -0.00952911376953125, 0.0094146728515625, 0.02835845947265625, 0.04730224609375, 0.06624603271484375, 0.0851898193359375, 0.10413360595703125, 0.123077392578125, 0.14202117919921875, 0.1609649658203125, 0.17990875244140625, 0.1988525390625, 0.21779632568359375, 0.2367401123046875, 0.25568389892578125, 0.274627685546875, 0.29357147216796875, 0.3125152587890625, 0.33145904541015625, 0.35040283203125, 0.36934661865234375, 0.3882904052734375, 0.40723419189453125, 0.426177978515625, 0.44512176513671875, 0.4640655517578125, 0.48300933837890625, 0.501953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 10.0, 10.0, 14.0, 17.0, 25.0, 36.0, 50.0, 77.0, 104.0, 181.0, 279.0, 415.0, 753.0, 1354.0, 2875.0, 7236.0, 21107.0, 80017.0, 371355.0, 426754.0, 96074.0, 24663.0, 8087.0, 3189.0, 1607.0, 862.0, 491.0, 311.0, 191.0, 132.0, 83.0, 66.0, 22.0, 32.0, 22.0, 16.0, 6.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7109375, -12.314453125, -11.91796875, -11.521484375, -11.125, -10.728515625, -10.33203125, -9.935546875, -9.5390625, -9.142578125, -8.74609375, -8.349609375, -7.953125, -7.556640625, -7.16015625, -6.763671875, -6.3671875, -5.970703125, -5.57421875, -5.177734375, -4.78125, -4.384765625, -3.98828125, -3.591796875, -3.1953125, -2.798828125, -2.40234375, -2.005859375, -1.609375, -1.212890625, -0.81640625, -0.419921875, -0.0234375, 0.373046875, 0.76953125, 1.166015625, 1.5625, 1.958984375, 2.35546875, 2.751953125, 3.1484375, 3.544921875, 3.94140625, 4.337890625, 4.734375, 5.130859375, 5.52734375, 5.923828125, 6.3203125, 6.716796875, 7.11328125, 7.509765625, 7.90625, 8.302734375, 8.69921875, 9.095703125, 9.4921875, 9.888671875, 10.28515625, 10.681640625, 11.078125, 11.474609375, 11.87109375, 12.267578125, 12.6640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 5.0, 10.0, 7.0, 16.0, 12.0, 12.0, 21.0, 19.0, 29.0, 37.0, 33.0, 46.0, 44.0, 43.0, 53.0, 43.0, 51.0, 66.0, 50.0, 55.0, 42.0, 41.0, 24.0, 36.0, 31.0, 32.0, 11.0, 15.0, 17.0, 19.0, 16.0, 11.0, 9.0, 6.0, 3.0, 5.0, 6.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.08984375, -2.981109619140625, -2.87237548828125, -2.763641357421875, -2.6549072265625, -2.546173095703125, -2.43743896484375, -2.328704833984375, -2.219970703125, -2.111236572265625, -2.00250244140625, -1.893768310546875, -1.7850341796875, -1.676300048828125, -1.56756591796875, -1.458831787109375, -1.35009765625, -1.241363525390625, -1.13262939453125, -1.023895263671875, -0.9151611328125, -0.806427001953125, -0.69769287109375, -0.588958740234375, -0.480224609375, -0.371490478515625, -0.26275634765625, -0.154022216796875, -0.0452880859375, 0.063446044921875, 0.17218017578125, 0.280914306640625, 0.3896484375, 0.498382568359375, 0.60711669921875, 0.715850830078125, 0.8245849609375, 0.933319091796875, 1.04205322265625, 1.150787353515625, 1.259521484375, 1.368255615234375, 1.47698974609375, 1.585723876953125, 1.6944580078125, 1.803192138671875, 1.91192626953125, 2.020660400390625, 2.12939453125, 2.238128662109375, 2.34686279296875, 2.455596923828125, 2.5643310546875, 2.673065185546875, 2.78179931640625, 2.890533447265625, 2.999267578125, 3.108001708984375, 3.21673583984375, 3.325469970703125, 3.4342041015625, 3.542938232421875, 3.65167236328125, 3.760406494140625, 3.869140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 11.0, 9.0, 12.0, 20.0, 37.0, 42.0, 86.0, 118.0, 202.0, 357.0, 537.0, 992.0, 2107.0, 5134.0, 17072.0, 117012.0, 772078.0, 106885.0, 16424.0, 5011.0, 2020.0, 1003.0, 554.0, 331.0, 182.0, 113.0, 57.0, 37.0, 28.0, 16.0, 15.0, 12.0, 7.0, 3.0, 7.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.59375, -10.2218017578125, -9.849853515625, -9.4779052734375, -9.10595703125, -8.7340087890625, -8.362060546875, -7.9901123046875, -7.6181640625, -7.2462158203125, -6.874267578125, -6.5023193359375, -6.13037109375, -5.7584228515625, -5.386474609375, -5.0145263671875, -4.642578125, -4.2706298828125, -3.898681640625, -3.5267333984375, -3.15478515625, -2.7828369140625, -2.410888671875, -2.0389404296875, -1.6669921875, -1.2950439453125, -0.923095703125, -0.5511474609375, -0.17919921875, 0.1927490234375, 0.564697265625, 0.9366455078125, 1.30859375, 1.6805419921875, 2.052490234375, 2.4244384765625, 2.79638671875, 3.1683349609375, 3.540283203125, 3.9122314453125, 4.2841796875, 4.6561279296875, 5.028076171875, 5.4000244140625, 5.77197265625, 6.1439208984375, 6.515869140625, 6.8878173828125, 7.259765625, 7.6317138671875, 8.003662109375, 8.3756103515625, 8.74755859375, 9.1195068359375, 9.491455078125, 9.8634033203125, 10.2353515625, 10.6072998046875, 10.979248046875, 11.3511962890625, 11.72314453125, 12.0950927734375, 12.467041015625, 12.8389892578125, 13.2109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 9.0, 7.0, 14.0, 20.0, 23.0, 43.0, 53.0, 97.0, 149.0, 173.0, 145.0, 83.0, 56.0, 42.0, 19.0, 22.0, 12.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0014925003051757812, -0.0014525353908538818, -0.0014125704765319824, -0.001372605562210083, -0.0013326406478881836, -0.0012926757335662842, -0.0012527108192443848, -0.0012127459049224854, -0.001172780990600586, -0.0011328160762786865, -0.0010928511619567871, -0.0010528862476348877, -0.0010129213333129883, -0.0009729564189910889, -0.0009329915046691895, -0.00089302659034729, -0.0008530616760253906, -0.0008130967617034912, -0.0007731318473815918, -0.0007331669330596924, -0.000693202018737793, -0.0006532371044158936, -0.0006132721900939941, -0.0005733072757720947, -0.0005333423614501953, -0.0004933774471282959, -0.0004534125328063965, -0.00041344761848449707, -0.00037348270416259766, -0.00033351778984069824, -0.00029355287551879883, -0.0002535879611968994, -0.000213623046875, -0.00017365813255310059, -0.00013369321823120117, -9.372830390930176e-05, -5.3763389587402344e-05, -1.379847526550293e-05, 2.6166439056396484e-05, 6.61313533782959e-05, 0.00010609626770019531, 0.00014606118202209473, 0.00018602609634399414, 0.00022599101066589355, 0.00026595592498779297, 0.0003059208393096924, 0.0003458857536315918, 0.0003858506679534912, 0.0004258155822753906, 0.00046578049659729004, 0.0005057454109191895, 0.0005457103252410889, 0.0005856752395629883, 0.0006256401538848877, 0.0006656050682067871, 0.0007055699825286865, 0.0007455348968505859, 0.0007854998111724854, 0.0008254647254943848, 0.0008654296398162842, 0.0009053945541381836, 0.000945359468460083, 0.0009853243827819824, 0.0010252892971038818, 0.0010652542114257812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 16.0, 21.0, 35.0, 31.0, 47.0, 54.0, 88.0, 149.0, 228.0, 342.0, 554.0, 933.0, 2009.0, 4737.0, 14442.0, 69416.0, 649846.0, 258421.0, 32056.0, 8435.0, 3219.0, 1421.0, 730.0, 445.0, 269.0, 172.0, 114.0, 89.0, 65.0, 39.0, 22.0, 16.0, 17.0, 11.0, 10.0, 9.0, 3.0, 0.0, 5.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-10.6953125, -10.378662109375, -10.06201171875, -9.745361328125, -9.4287109375, -9.112060546875, -8.79541015625, -8.478759765625, -8.162109375, -7.845458984375, -7.52880859375, -7.212158203125, -6.8955078125, -6.578857421875, -6.26220703125, -5.945556640625, -5.62890625, -5.312255859375, -4.99560546875, -4.678955078125, -4.3623046875, -4.045654296875, -3.72900390625, -3.412353515625, -3.095703125, -2.779052734375, -2.46240234375, -2.145751953125, -1.8291015625, -1.512451171875, -1.19580078125, -0.879150390625, -0.5625, -0.245849609375, 0.07080078125, 0.387451171875, 0.7041015625, 1.020751953125, 1.33740234375, 1.654052734375, 1.970703125, 2.287353515625, 2.60400390625, 2.920654296875, 3.2373046875, 3.553955078125, 3.87060546875, 4.187255859375, 4.50390625, 4.820556640625, 5.13720703125, 5.453857421875, 5.7705078125, 6.087158203125, 6.40380859375, 6.720458984375, 7.037109375, 7.353759765625, 7.67041015625, 7.987060546875, 8.3037109375, 8.620361328125, 8.93701171875, 9.253662109375, 9.5703125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 10.0, 11.0, 13.0, 28.0, 34.0, 51.0, 66.0, 85.0, 99.0, 104.0, 117.0, 86.0, 74.0, 55.0, 39.0, 28.0, 29.0, 10.0, 9.0, 9.0, 6.0, 7.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.42578125, -4.29376220703125, -4.1617431640625, -4.02972412109375, -3.897705078125, -3.76568603515625, -3.6336669921875, -3.50164794921875, -3.36962890625, -3.23760986328125, -3.1055908203125, -2.97357177734375, -2.841552734375, -2.70953369140625, -2.5775146484375, -2.44549560546875, -2.3134765625, -2.18145751953125, -2.0494384765625, -1.91741943359375, -1.785400390625, -1.65338134765625, -1.5213623046875, -1.38934326171875, -1.25732421875, -1.12530517578125, -0.9932861328125, -0.86126708984375, -0.729248046875, -0.59722900390625, -0.4652099609375, -0.33319091796875, -0.201171875, -0.06915283203125, 0.0628662109375, 0.19488525390625, 0.326904296875, 0.45892333984375, 0.5909423828125, 0.72296142578125, 0.85498046875, 0.98699951171875, 1.1190185546875, 1.25103759765625, 1.383056640625, 1.51507568359375, 1.6470947265625, 1.77911376953125, 1.9111328125, 2.04315185546875, 2.1751708984375, 2.30718994140625, 2.439208984375, 2.57122802734375, 2.7032470703125, 2.83526611328125, 2.96728515625, 3.09930419921875, 3.2313232421875, 3.36334228515625, 3.495361328125, 3.62738037109375, 3.7593994140625, 3.89141845703125, 4.0234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 8.0, 13.0, 27.0, 51.0, 141.0, 289.0, 280.0, 120.0, 42.0, 24.0, 6.0, 1.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.36195373535156, -79.93295288085938, -75.50395202636719, -71.074951171875, -66.64595031738281, -62.21695327758789, -57.78795623779297, -53.35895538330078, -48.929954528808594, -44.500953674316406, -40.07195281982422, -35.6429557800293, -31.21395492553711, -26.784954071044922, -22.355955123901367, -17.926956176757812, -13.497955322265625, -9.068955421447754, -4.639955520629883, -0.21095561981201172, 4.218044281005859, 8.647045135498047, 13.076044082641602, 17.505043029785156, 21.934043884277344, 26.36304473876953, 30.792043685913086, 35.22104263305664, 39.65004348754883, 44.079044342041016, 48.50804138183594, 52.937042236328125, 57.366058349609375, 61.79505920410156, 66.22406005859375, 70.65306091308594, 75.08206176757812, 79.51106262207031, 83.94005584716797, 88.36905670166016, 92.79805755615234, 97.22705841064453, 101.65605926513672, 106.0850601196289, 110.51405334472656, 114.94305419921875, 119.37205505371094, 123.80105590820312, 128.2300567626953, 132.6590576171875, 137.0880584716797, 141.51705932617188, 145.94606018066406, 150.37506103515625, 154.80406188964844, 159.23306274414062, 163.66204833984375, 168.09104919433594, 172.52005004882812, 176.9490509033203, 181.3780517578125, 185.8070526123047, 190.23605346679688, 194.6650390625, 199.09405517578125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 8.0, 9.0, 7.0, 20.0, 22.0, 25.0, 34.0, 44.0, 42.0, 60.0, 80.0, 62.0, 65.0, 71.0, 58.0, 77.0, 63.0, 53.0, 47.0, 36.0, 42.0, 19.0, 15.0, 22.0, 5.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.399044036865234, -30.235790252685547, -29.072538375854492, -27.909286499023438, -26.74603271484375, -25.582778930664062, -24.419527053833008, -23.256275177001953, -22.093021392822266, -20.929767608642578, -19.766515731811523, -18.60326385498047, -17.44001007080078, -16.276756286621094, -15.113504409790039, -13.950251579284668, -12.786998748779297, -11.623745918273926, -10.460493087768555, -9.297240257263184, -8.133987426757812, -6.970734596252441, -5.80748176574707, -4.644228935241699, -3.480976104736328, -2.317723274230957, -1.154470443725586, 0.008782386779785156, 1.1720352172851562, 2.3352880477905273, 3.4985408782958984, 4.6617937088012695, 5.825050354003906, 6.988303184509277, 8.151556015014648, 9.31480884552002, 10.47806167602539, 11.641314506530762, 12.804567337036133, 13.967820167541504, 15.131072998046875, 16.294326782226562, 17.457578659057617, 18.620830535888672, 19.78408432006836, 20.947338104248047, 22.1105899810791, 23.273841857910156, 24.437095642089844, 25.60034942626953, 26.763601303100586, 27.92685317993164, 29.090106964111328, 30.253360748291016, 31.41661262512207, 32.579864501953125, 33.74311828613281, 34.9063720703125, 36.06962585449219, 37.23287582397461, 38.3961296081543, 39.559383392333984, 40.722633361816406, 41.885887145996094, 43.04914093017578]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 12.0, 13.0, 12.0, 20.0, 24.0, 51.0, 83.0, 147.0, 369.0, 1140.0, 5618.0, 50677.0, 4078552.0, 50286.0, 5490.0, 1137.0, 310.0, 123.0, 76.0, 39.0, 28.0, 13.0, 17.0, 5.0, 9.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.28125, -41.0556640625, -39.830078125, -38.6044921875, -37.37890625, -36.1533203125, -34.927734375, -33.7021484375, -32.4765625, -31.2509765625, -30.025390625, -28.7998046875, -27.57421875, -26.3486328125, -25.123046875, -23.8974609375, -22.671875, -21.4462890625, -20.220703125, -18.9951171875, -17.76953125, -16.5439453125, -15.318359375, -14.0927734375, -12.8671875, -11.6416015625, -10.416015625, -9.1904296875, -7.96484375, -6.7392578125, -5.513671875, -4.2880859375, -3.0625, -1.8369140625, -0.611328125, 0.6142578125, 1.83984375, 3.0654296875, 4.291015625, 5.5166015625, 6.7421875, 7.9677734375, 9.193359375, 10.4189453125, 11.64453125, 12.8701171875, 14.095703125, 15.3212890625, 16.546875, 17.7724609375, 18.998046875, 20.2236328125, 21.44921875, 22.6748046875, 23.900390625, 25.1259765625, 26.3515625, 27.5771484375, 28.802734375, 30.0283203125, 31.25390625, 32.4794921875, 33.705078125, 34.9306640625, 36.15625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 4.0, 10.0, 17.0, 12.0, 11.0, 23.0, 33.0, 45.0, 41.0, 58.0, 59.0, 67.0, 74.0, 79.0, 61.0, 60.0, 81.0, 54.0, 49.0, 33.0, 36.0, 22.0, 17.0, 6.0, 10.0, 6.0, 6.0, 9.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9287109375, -0.9017257690429688, -0.8747406005859375, -0.8477554321289062, -0.820770263671875, -0.7937850952148438, -0.7667999267578125, -0.7398147583007812, -0.71282958984375, -0.6858444213867188, -0.6588592529296875, -0.6318740844726562, -0.604888916015625, -0.5779037475585938, -0.5509185791015625, -0.5239334106445312, -0.4969482421875, -0.46996307373046875, -0.4429779052734375, -0.41599273681640625, -0.389007568359375, -0.36202239990234375, -0.3350372314453125, -0.30805206298828125, -0.28106689453125, -0.25408172607421875, -0.2270965576171875, -0.20011138916015625, -0.173126220703125, -0.14614105224609375, -0.1191558837890625, -0.09217071533203125, -0.065185546875, -0.03820037841796875, -0.0112152099609375, 0.01576995849609375, 0.042755126953125, 0.06974029541015625, 0.0967254638671875, 0.12371063232421875, 0.15069580078125, 0.17768096923828125, 0.2046661376953125, 0.23165130615234375, 0.258636474609375, 0.28562164306640625, 0.3126068115234375, 0.33959197998046875, 0.3665771484375, 0.39356231689453125, 0.4205474853515625, 0.44753265380859375, 0.474517822265625, 0.5015029907226562, 0.5284881591796875, 0.5554733276367188, 0.58245849609375, 0.6094436645507812, 0.6364288330078125, 0.6634140014648438, 0.690399169921875, 0.7173843383789062, 0.7443695068359375, 0.7713546752929688, 0.79833984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 7.0, 14.0, 11.0, 17.0, 31.0, 32.0, 49.0, 85.0, 104.0, 212.0, 459.0, 998.0, 2421.0, 6929.0, 28141.0, 275476.0, 3797062.0, 63173.0, 12550.0, 3677.0, 1431.0, 594.0, 318.0, 184.0, 105.0, 58.0, 44.0, 28.0, 27.0, 12.0, 9.0, 6.0, 3.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.9375, -27.14453125, -26.3515625, -25.55859375, -24.765625, -23.97265625, -23.1796875, -22.38671875, -21.59375, -20.80078125, -20.0078125, -19.21484375, -18.421875, -17.62890625, -16.8359375, -16.04296875, -15.25, -14.45703125, -13.6640625, -12.87109375, -12.078125, -11.28515625, -10.4921875, -9.69921875, -8.90625, -8.11328125, -7.3203125, -6.52734375, -5.734375, -4.94140625, -4.1484375, -3.35546875, -2.5625, -1.76953125, -0.9765625, -0.18359375, 0.609375, 1.40234375, 2.1953125, 2.98828125, 3.78125, 4.57421875, 5.3671875, 6.16015625, 6.953125, 7.74609375, 8.5390625, 9.33203125, 10.125, 10.91796875, 11.7109375, 12.50390625, 13.296875, 14.08984375, 14.8828125, 15.67578125, 16.46875, 17.26171875, 18.0546875, 18.84765625, 19.640625, 20.43359375, 21.2265625, 22.01953125, 22.8125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 7.0, 7.0, 18.0, 20.0, 29.0, 36.0, 54.0, 64.0, 112.0, 274.0, 1810.0, 1067.0, 250.0, 95.0, 67.0, 34.0, 36.0, 15.0, 12.0, 13.0, 13.0, 12.0, 3.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.55078125, -3.45965576171875, -3.3685302734375, -3.27740478515625, -3.186279296875, -3.09515380859375, -3.0040283203125, -2.91290283203125, -2.82177734375, -2.73065185546875, -2.6395263671875, -2.54840087890625, -2.457275390625, -2.36614990234375, -2.2750244140625, -2.18389892578125, -2.0927734375, -2.00164794921875, -1.9105224609375, -1.81939697265625, -1.728271484375, -1.63714599609375, -1.5460205078125, -1.45489501953125, -1.36376953125, -1.27264404296875, -1.1815185546875, -1.09039306640625, -0.999267578125, -0.90814208984375, -0.8170166015625, -0.72589111328125, -0.634765625, -0.54364013671875, -0.4525146484375, -0.36138916015625, -0.270263671875, -0.17913818359375, -0.0880126953125, 0.00311279296875, 0.09423828125, 0.18536376953125, 0.2764892578125, 0.36761474609375, 0.458740234375, 0.54986572265625, 0.6409912109375, 0.73211669921875, 0.8232421875, 0.91436767578125, 1.0054931640625, 1.09661865234375, 1.187744140625, 1.27886962890625, 1.3699951171875, 1.46112060546875, 1.55224609375, 1.64337158203125, 1.7344970703125, 1.82562255859375, 1.916748046875, 2.00787353515625, 2.0989990234375, 2.19012451171875, 2.28125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 9.0, 12.0, 9.0, 21.0, 32.0, 58.0, 101.0, 173.0, 190.0, 179.0, 102.0, 57.0, 26.0, 15.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-38.571475982666016, -37.75764083862305, -36.94380569458008, -36.12997055053711, -35.31613540649414, -34.50230026245117, -33.6884651184082, -32.874629974365234, -32.060794830322266, -31.246959686279297, -30.433124542236328, -29.61928939819336, -28.80545425415039, -27.991619110107422, -27.177783966064453, -26.363948822021484, -25.550113677978516, -24.736278533935547, -23.922443389892578, -23.10860824584961, -22.29477310180664, -21.480937957763672, -20.667102813720703, -19.853267669677734, -19.039432525634766, -18.225597381591797, -17.411762237548828, -16.59792709350586, -15.78409194946289, -14.970256805419922, -14.156421661376953, -13.342586517333984, -12.528752326965332, -11.714917182922363, -10.901082038879395, -10.087246894836426, -9.273411750793457, -8.459576606750488, -7.6457414627075195, -6.831906318664551, -6.018071174621582, -5.204236030578613, -4.3904008865356445, -3.576565742492676, -2.762730598449707, -1.9488954544067383, -1.1350603103637695, -0.3212251663208008, 0.49260997772216797, 1.3064451217651367, 2.1202802658081055, 2.934115409851074, 3.747950553894043, 4.561785697937012, 5.3756208419799805, 6.189455986022949, 7.003291130065918, 7.817126274108887, 8.630961418151855, 9.444796562194824, 10.258631706237793, 11.072466850280762, 11.88630199432373, 12.7001371383667, 13.513972282409668]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 8.0, 13.0, 6.0, 10.0, 14.0, 16.0, 18.0, 26.0, 23.0, 22.0, 37.0, 34.0, 29.0, 32.0, 40.0, 39.0, 46.0, 32.0, 35.0, 32.0, 36.0, 36.0, 41.0, 32.0, 29.0, 26.0, 34.0, 22.0, 14.0, 28.0, 26.0, 19.0, 16.0, 15.0, 15.0, 11.0, 10.0, 10.0, 7.0, 15.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-7.2342305183410645, -7.0278000831604, -6.8213701248168945, -6.6149396896362305, -6.408509254455566, -6.202078819274902, -5.995648384094238, -5.789218425750732, -5.582787990570068, -5.376357555389404, -5.169927597045898, -4.963497161865234, -4.75706672668457, -4.550636291503906, -4.344205856323242, -4.137775897979736, -3.9313454627990723, -3.724915027618408, -3.5184848308563232, -3.3120546340942383, -3.105624198913574, -2.89919376373291, -2.692763566970825, -2.4863333702087402, -2.279902935028076, -2.073472499847412, -1.8670423030853271, -1.6606119871139526, -1.4541816711425781, -1.2477513551712036, -1.041321039199829, -0.8348907232284546, -0.6284608840942383, -0.42203056812286377, -0.21560025215148926, -0.009169936180114746, 0.19726037979125977, 0.4036906957626343, 0.6101210117340088, 0.8165513277053833, 1.0229816436767578, 1.2294119596481323, 1.4358422756195068, 1.6422725915908813, 1.8487029075622559, 2.05513334274292, 2.261563539505005, 2.46799373626709, 2.674424171447754, 2.880854606628418, 3.087284803390503, 3.293715000152588, 3.500145435333252, 3.706575870513916, 3.913006067276001, 4.119436264038086, 4.32586669921875, 4.532297134399414, 4.738727569580078, 4.945157527923584, 5.151587963104248, 5.358018398284912, 5.564448356628418, 5.770878791809082, 5.977309226989746]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 18.0, 7.0, 14.0, 24.0, 24.0, 47.0, 61.0, 126.0, 184.0, 256.0, 376.0, 639.0, 1044.0, 1905.0, 3715.0, 7228.0, 15424.0, 33112.0, 76871.0, 179191.0, 319419.0, 227438.0, 99843.0, 43196.0, 19243.0, 8955.0, 4500.0, 2328.0, 1305.0, 759.0, 462.0, 284.0, 166.0, 113.0, 89.0, 66.0, 35.0, 23.0, 18.0, 9.0, 10.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -7.0052490234375, -6.783935546875, -6.5626220703125, -6.34130859375, -6.1199951171875, -5.898681640625, -5.6773681640625, -5.4560546875, -5.2347412109375, -5.013427734375, -4.7921142578125, -4.57080078125, -4.3494873046875, -4.128173828125, -3.9068603515625, -3.685546875, -3.4642333984375, -3.242919921875, -3.0216064453125, -2.80029296875, -2.5789794921875, -2.357666015625, -2.1363525390625, -1.9150390625, -1.6937255859375, -1.472412109375, -1.2510986328125, -1.02978515625, -0.8084716796875, -0.587158203125, -0.3658447265625, -0.14453125, 0.0767822265625, 0.298095703125, 0.5194091796875, 0.74072265625, 0.9620361328125, 1.183349609375, 1.4046630859375, 1.6259765625, 1.8472900390625, 2.068603515625, 2.2899169921875, 2.51123046875, 2.7325439453125, 2.953857421875, 3.1751708984375, 3.396484375, 3.6177978515625, 3.839111328125, 4.0604248046875, 4.28173828125, 4.5030517578125, 4.724365234375, 4.9456787109375, 5.1669921875, 5.3883056640625, 5.609619140625, 5.8309326171875, 6.05224609375, 6.2735595703125, 6.494873046875, 6.7161865234375, 6.9375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 14.0, 5.0, 15.0, 17.0, 21.0, 27.0, 41.0, 39.0, 43.0, 51.0, 75.0, 45.0, 72.0, 56.0, 76.0, 60.0, 63.0, 48.0, 46.0, 33.0, 29.0, 34.0, 19.0, 18.0, 9.0, 9.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.84130859375, -0.8152008056640625, -0.789093017578125, -0.7629852294921875, -0.73687744140625, -0.7107696533203125, -0.684661865234375, -0.6585540771484375, -0.6324462890625, -0.6063385009765625, -0.580230712890625, -0.5541229248046875, -0.52801513671875, -0.5019073486328125, -0.475799560546875, -0.4496917724609375, -0.423583984375, -0.3974761962890625, -0.371368408203125, -0.3452606201171875, -0.31915283203125, -0.2930450439453125, -0.266937255859375, -0.2408294677734375, -0.2147216796875, -0.1886138916015625, -0.162506103515625, -0.1363983154296875, -0.11029052734375, -0.0841827392578125, -0.058074951171875, -0.0319671630859375, -0.005859375, 0.0202484130859375, 0.046356201171875, 0.0724639892578125, 0.09857177734375, 0.1246795654296875, 0.150787353515625, 0.1768951416015625, 0.2030029296875, 0.2291107177734375, 0.255218505859375, 0.2813262939453125, 0.30743408203125, 0.3335418701171875, 0.359649658203125, 0.3857574462890625, 0.411865234375, 0.4379730224609375, 0.464080810546875, 0.4901885986328125, 0.51629638671875, 0.5424041748046875, 0.568511962890625, 0.5946197509765625, 0.6207275390625, 0.6468353271484375, 0.672943115234375, 0.6990509033203125, 0.72515869140625, 0.7512664794921875, 0.777374267578125, 0.8034820556640625, 0.82958984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 1.0, 4.0, 14.0, 12.0, 21.0, 15.0, 29.0, 30.0, 61.0, 98.0, 146.0, 197.0, 301.0, 487.0, 795.0, 1490.0, 3082.0, 6723.0, 17889.0, 54564.0, 197576.0, 462106.0, 211325.0, 58566.0, 18804.0, 7181.0, 3213.0, 1610.0, 837.0, 475.0, 285.0, 192.0, 156.0, 81.0, 57.0, 36.0, 25.0, 18.0, 14.0, 13.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.046875, -10.7174072265625, -10.387939453125, -10.0584716796875, -9.72900390625, -9.3995361328125, -9.070068359375, -8.7406005859375, -8.4111328125, -8.0816650390625, -7.752197265625, -7.4227294921875, -7.09326171875, -6.7637939453125, -6.434326171875, -6.1048583984375, -5.775390625, -5.4459228515625, -5.116455078125, -4.7869873046875, -4.45751953125, -4.1280517578125, -3.798583984375, -3.4691162109375, -3.1396484375, -2.8101806640625, -2.480712890625, -2.1512451171875, -1.82177734375, -1.4923095703125, -1.162841796875, -0.8333740234375, -0.50390625, -0.1744384765625, 0.155029296875, 0.4844970703125, 0.81396484375, 1.1434326171875, 1.472900390625, 1.8023681640625, 2.1318359375, 2.4613037109375, 2.790771484375, 3.1202392578125, 3.44970703125, 3.7791748046875, 4.108642578125, 4.4381103515625, 4.767578125, 5.0970458984375, 5.426513671875, 5.7559814453125, 6.08544921875, 6.4149169921875, 6.744384765625, 7.0738525390625, 7.4033203125, 7.7327880859375, 8.062255859375, 8.3917236328125, 8.72119140625, 9.0506591796875, 9.380126953125, 9.7095947265625, 10.0390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 2.0, 2.0, 10.0, 10.0, 11.0, 18.0, 15.0, 20.0, 20.0, 31.0, 33.0, 29.0, 33.0, 46.0, 37.0, 47.0, 42.0, 49.0, 54.0, 49.0, 48.0, 50.0, 36.0, 38.0, 33.0, 44.0, 35.0, 28.0, 26.0, 25.0, 11.0, 15.0, 11.0, 9.0, 7.0, 7.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.125, -3.98834228515625, -3.8516845703125, -3.71502685546875, -3.578369140625, -3.44171142578125, -3.3050537109375, -3.16839599609375, -3.03173828125, -2.89508056640625, -2.7584228515625, -2.62176513671875, -2.485107421875, -2.34844970703125, -2.2117919921875, -2.07513427734375, -1.9384765625, -1.80181884765625, -1.6651611328125, -1.52850341796875, -1.391845703125, -1.25518798828125, -1.1185302734375, -0.98187255859375, -0.84521484375, -0.70855712890625, -0.5718994140625, -0.43524169921875, -0.298583984375, -0.16192626953125, -0.0252685546875, 0.11138916015625, 0.248046875, 0.38470458984375, 0.5213623046875, 0.65802001953125, 0.794677734375, 0.93133544921875, 1.0679931640625, 1.20465087890625, 1.34130859375, 1.47796630859375, 1.6146240234375, 1.75128173828125, 1.887939453125, 2.02459716796875, 2.1612548828125, 2.29791259765625, 2.4345703125, 2.57122802734375, 2.7078857421875, 2.84454345703125, 2.981201171875, 3.11785888671875, 3.2545166015625, 3.39117431640625, 3.52783203125, 3.66448974609375, 3.8011474609375, 3.93780517578125, 4.074462890625, 4.21112060546875, 4.3477783203125, 4.48443603515625, 4.62109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 11.0, 15.0, 27.0, 52.0, 95.0, 149.0, 311.0, 640.0, 1724.0, 5668.0, 24302.0, 161312.0, 717533.0, 111117.0, 18494.0, 4526.0, 1427.0, 545.0, 263.0, 132.0, 69.0, 48.0, 30.0, 14.0, 12.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.453125, -9.19354248046875, -8.9339599609375, -8.67437744140625, -8.414794921875, -8.15521240234375, -7.8956298828125, -7.63604736328125, -7.37646484375, -7.11688232421875, -6.8572998046875, -6.59771728515625, -6.338134765625, -6.07855224609375, -5.8189697265625, -5.55938720703125, -5.2998046875, -5.04022216796875, -4.7806396484375, -4.52105712890625, -4.261474609375, -4.00189208984375, -3.7423095703125, -3.48272705078125, -3.22314453125, -2.96356201171875, -2.7039794921875, -2.44439697265625, -2.184814453125, -1.92523193359375, -1.6656494140625, -1.40606689453125, -1.146484375, -0.88690185546875, -0.6273193359375, -0.36773681640625, -0.108154296875, 0.15142822265625, 0.4110107421875, 0.67059326171875, 0.93017578125, 1.18975830078125, 1.4493408203125, 1.70892333984375, 1.968505859375, 2.22808837890625, 2.4876708984375, 2.74725341796875, 3.0068359375, 3.26641845703125, 3.5260009765625, 3.78558349609375, 4.045166015625, 4.30474853515625, 4.5643310546875, 4.82391357421875, 5.08349609375, 5.34307861328125, 5.6026611328125, 5.86224365234375, 6.121826171875, 6.38140869140625, 6.6409912109375, 6.90057373046875, 7.16015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 4.0, 11.0, 12.0, 32.0, 29.0, 45.0, 69.0, 99.0, 124.0, 126.0, 101.0, 103.0, 65.0, 56.0, 37.0, 21.0, 16.0, 9.0, 8.0, 9.0, 4.0, 3.0, 5.0, 0.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006451606750488281, -0.0006186738610267639, -0.0005921870470046997, -0.0005657002329826355, -0.0005392134189605713, -0.0005127266049385071, -0.00048623979091644287, -0.00045975297689437866, -0.00043326616287231445, -0.00040677934885025024, -0.00038029253482818604, -0.0003538057208061218, -0.0003273189067840576, -0.0003008320927619934, -0.0002743452787399292, -0.000247858464717865, -0.00022137165069580078, -0.00019488483667373657, -0.00016839802265167236, -0.00014191120862960815, -0.00011542439460754395, -8.893758058547974e-05, -6.245076656341553e-05, -3.596395254135132e-05, -9.47713851928711e-06, 1.70096755027771e-05, 4.349648952484131e-05, 6.998330354690552e-05, 9.647011756896973e-05, 0.00012295693159103394, 0.00014944374561309814, 0.00017593055963516235, 0.00020241737365722656, 0.00022890418767929077, 0.000255391001701355, 0.0002818778157234192, 0.0003083646297454834, 0.0003348514437675476, 0.0003613382577896118, 0.000387825071811676, 0.00041431188583374023, 0.00044079869985580444, 0.00046728551387786865, 0.0004937723278999329, 0.0005202591419219971, 0.0005467459559440613, 0.0005732327699661255, 0.0005997195839881897, 0.0006262063980102539, 0.0006526932120323181, 0.0006791800260543823, 0.0007056668400764465, 0.0007321536540985107, 0.000758640468120575, 0.0007851272821426392, 0.0008116140961647034, 0.0008381009101867676, 0.0008645877242088318, 0.000891074538230896, 0.0009175613522529602, 0.0009440481662750244, 0.0009705349802970886, 0.0009970217943191528, 0.001023508608341217, 0.0010499954223632812]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 24.0, 23.0, 32.0, 52.0, 104.0, 166.0, 313.0, 658.0, 1386.0, 3488.0, 13747.0, 129109.0, 827724.0, 57818.0, 8992.0, 2586.0, 1085.0, 523.0, 285.0, 156.0, 97.0, 53.0, 29.0, 22.0, 17.0, 8.0, 15.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.0751953125, -12.658203125, -12.2412109375, -11.82421875, -11.4072265625, -10.990234375, -10.5732421875, -10.15625, -9.7392578125, -9.322265625, -8.9052734375, -8.48828125, -8.0712890625, -7.654296875, -7.2373046875, -6.8203125, -6.4033203125, -5.986328125, -5.5693359375, -5.15234375, -4.7353515625, -4.318359375, -3.9013671875, -3.484375, -3.0673828125, -2.650390625, -2.2333984375, -1.81640625, -1.3994140625, -0.982421875, -0.5654296875, -0.1484375, 0.2685546875, 0.685546875, 1.1025390625, 1.51953125, 1.9365234375, 2.353515625, 2.7705078125, 3.1875, 3.6044921875, 4.021484375, 4.4384765625, 4.85546875, 5.2724609375, 5.689453125, 6.1064453125, 6.5234375, 6.9404296875, 7.357421875, 7.7744140625, 8.19140625, 8.6083984375, 9.025390625, 9.4423828125, 9.859375, 10.2763671875, 10.693359375, 11.1103515625, 11.52734375, 11.9443359375, 12.361328125, 12.7783203125, 13.1953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 1.0, 2.0, 4.0, 5.0, 10.0, 6.0, 16.0, 17.0, 23.0, 33.0, 53.0, 71.0, 104.0, 112.0, 120.0, 107.0, 82.0, 63.0, 40.0, 28.0, 24.0, 8.0, 12.0, 15.0, 8.0, 7.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.3359375, -3.21734619140625, -3.0987548828125, -2.98016357421875, -2.861572265625, -2.74298095703125, -2.6243896484375, -2.50579833984375, -2.38720703125, -2.26861572265625, -2.1500244140625, -2.03143310546875, -1.912841796875, -1.79425048828125, -1.6756591796875, -1.55706787109375, -1.4384765625, -1.31988525390625, -1.2012939453125, -1.08270263671875, -0.964111328125, -0.84552001953125, -0.7269287109375, -0.60833740234375, -0.48974609375, -0.37115478515625, -0.2525634765625, -0.13397216796875, -0.015380859375, 0.10321044921875, 0.2218017578125, 0.34039306640625, 0.458984375, 0.57757568359375, 0.6961669921875, 0.81475830078125, 0.933349609375, 1.05194091796875, 1.1705322265625, 1.28912353515625, 1.40771484375, 1.52630615234375, 1.6448974609375, 1.76348876953125, 1.882080078125, 2.00067138671875, 2.1192626953125, 2.23785400390625, 2.3564453125, 2.47503662109375, 2.5936279296875, 2.71221923828125, 2.830810546875, 2.94940185546875, 3.0679931640625, 3.18658447265625, 3.30517578125, 3.42376708984375, 3.5423583984375, 3.66094970703125, 3.779541015625, 3.89813232421875, 4.0167236328125, 4.13531494140625, 4.25390625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 17.0, 25.0, 49.0, 89.0, 129.0, 165.0, 156.0, 126.0, 99.0, 66.0, 27.0, 23.0, 8.0, 10.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.94715118408203, -53.52459716796875, -51.10204315185547, -48.67948913574219, -46.256935119628906, -43.834381103515625, -41.41183090209961, -38.98927688598633, -36.56672286987305, -34.144168853759766, -31.721614837646484, -29.299062728881836, -26.876508712768555, -24.453954696655273, -22.031402587890625, -19.608848571777344, -17.186294555664062, -14.763740539550781, -12.341187477111816, -9.918634414672852, -7.49608039855957, -5.073526382446289, -2.650973320007324, -0.22842025756835938, 2.194133758544922, 4.616687297821045, 7.039240837097168, 9.461793899536133, 11.884347915649414, 14.306901931762695, 16.729454040527344, 19.152008056640625, 21.574554443359375, 23.997108459472656, 26.419662475585938, 28.842214584350586, 31.264768600463867, 33.68732452392578, 36.1098747253418, 38.53242874145508, 40.95498275756836, 43.37753677368164, 45.80009078979492, 48.2226448059082, 50.64519500732422, 53.0677490234375, 55.49030303955078, 57.91285705566406, 60.335411071777344, 62.757965087890625, 65.1805191040039, 67.60307312011719, 70.02562713623047, 72.44818115234375, 74.87073516845703, 77.29328918457031, 79.71583557128906, 82.13838958740234, 84.56094360351562, 86.9834976196289, 89.40605163574219, 91.82860565185547, 94.25115966796875, 96.6737060546875, 99.09626770019531]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 11.0, 12.0, 14.0, 11.0, 19.0, 15.0, 21.0, 27.0, 36.0, 29.0, 40.0, 34.0, 38.0, 40.0, 42.0, 33.0, 40.0, 40.0, 35.0, 38.0, 26.0, 40.0, 31.0, 34.0, 32.0, 41.0, 27.0, 29.0, 22.0, 18.0, 19.0, 17.0, 11.0, 9.0, 7.0, 14.0, 3.0, 11.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.35921859741211, -24.59548568725586, -23.831750869750977, -23.068017959594727, -22.304283142089844, -21.540550231933594, -20.776817321777344, -20.01308250427246, -19.249347686767578, -18.485614776611328, -17.721879959106445, -16.958147048950195, -16.194412231445312, -15.430679321289062, -14.666945457458496, -13.90321159362793, -13.13947868347168, -12.375744819641113, -11.612010955810547, -10.848278045654297, -10.084543228149414, -9.320810317993164, -8.557076454162598, -7.793342590332031, -7.029608726501465, -6.265874862670898, -5.502140998840332, -4.738407611846924, -3.9746737480163574, -3.210939884185791, -2.447206497192383, -1.6834726333618164, -0.9197406768798828, -0.15600693225860596, 0.6077268123626709, 1.3714604377746582, 2.1351943016052246, 2.898928165435791, 3.662661552429199, 4.426395416259766, 5.190129280090332, 5.953863143920898, 6.717597007751465, 7.481330394744873, 8.245063781738281, 9.008798599243164, 9.772531509399414, 10.53626537322998, 11.299999237060547, 12.063733100891113, 12.82746696472168, 13.59119987487793, 14.354934692382812, 15.118667602539062, 15.882401466369629, 16.646135330200195, 17.409870147705078, 18.173603057861328, 18.93733787536621, 19.70107078552246, 20.464805603027344, 21.228538513183594, 21.992271423339844, 22.756006240844727, 23.519739151000977]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 7.0, 6.0, 9.0, 28.0, 36.0, 38.0, 69.0, 86.0, 162.0, 239.0, 395.0, 706.0, 1291.0, 2497.0, 5045.0, 11964.0, 34163.0, 181901.0, 3775535.0, 130903.0, 29243.0, 10704.0, 4546.0, 2240.0, 1038.0, 601.0, 332.0, 159.0, 120.0, 74.0, 35.0, 36.0, 21.0, 15.0, 8.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.5313720703125, -12.156494140625, -11.7816162109375, -11.40673828125, -11.0318603515625, -10.656982421875, -10.2821044921875, -9.9072265625, -9.5323486328125, -9.157470703125, -8.7825927734375, -8.40771484375, -8.0328369140625, -7.657958984375, -7.2830810546875, -6.908203125, -6.5333251953125, -6.158447265625, -5.7835693359375, -5.40869140625, -5.0338134765625, -4.658935546875, -4.2840576171875, -3.9091796875, -3.5343017578125, -3.159423828125, -2.7845458984375, -2.40966796875, -2.0347900390625, -1.659912109375, -1.2850341796875, -0.91015625, -0.5352783203125, -0.160400390625, 0.2144775390625, 0.58935546875, 0.9642333984375, 1.339111328125, 1.7139892578125, 2.0888671875, 2.4637451171875, 2.838623046875, 3.2135009765625, 3.58837890625, 3.9632568359375, 4.338134765625, 4.7130126953125, 5.087890625, 5.4627685546875, 5.837646484375, 6.2125244140625, 6.58740234375, 6.9622802734375, 7.337158203125, 7.7120361328125, 8.0869140625, 8.4617919921875, 8.836669921875, 9.2115478515625, 9.58642578125, 9.9613037109375, 10.336181640625, 10.7110595703125, 11.0859375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 18.0, 19.0, 24.0, 18.0, 34.0, 40.0, 44.0, 43.0, 59.0, 46.0, 54.0, 52.0, 50.0, 61.0, 48.0, 58.0, 48.0, 42.0, 47.0, 37.0, 34.0, 24.0, 15.0, 17.0, 10.0, 8.0, 3.0, 10.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.931640625, -0.9045944213867188, -0.8775482177734375, -0.8505020141601562, -0.823455810546875, -0.7964096069335938, -0.7693634033203125, -0.7423171997070312, -0.71527099609375, -0.6882247924804688, -0.6611785888671875, -0.6341323852539062, -0.607086181640625, -0.5800399780273438, -0.5529937744140625, -0.5259475708007812, -0.4989013671875, -0.47185516357421875, -0.4448089599609375, -0.41776275634765625, -0.390716552734375, -0.36367034912109375, -0.3366241455078125, -0.30957794189453125, -0.28253173828125, -0.25548553466796875, -0.2284393310546875, -0.20139312744140625, -0.174346923828125, -0.14730072021484375, -0.1202545166015625, -0.09320831298828125, -0.066162109375, -0.03911590576171875, -0.0120697021484375, 0.01497650146484375, 0.042022705078125, 0.06906890869140625, 0.0961151123046875, 0.12316131591796875, 0.15020751953125, 0.17725372314453125, 0.2042999267578125, 0.23134613037109375, 0.258392333984375, 0.28543853759765625, 0.3124847412109375, 0.33953094482421875, 0.3665771484375, 0.39362335205078125, 0.4206695556640625, 0.44771575927734375, 0.474761962890625, 0.5018081665039062, 0.5288543701171875, 0.5559005737304688, 0.58294677734375, 0.6099929809570312, 0.6370391845703125, 0.6640853881835938, 0.691131591796875, 0.7181777954101562, 0.7452239990234375, 0.7722702026367188, 0.79931640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 9.0, 10.0, 14.0, 25.0, 35.0, 68.0, 102.0, 164.0, 295.0, 564.0, 1073.0, 2325.0, 5427.0, 14103.0, 43564.0, 310827.0, 3663761.0, 109804.0, 25989.0, 9164.0, 3660.0, 1508.0, 711.0, 431.0, 218.0, 146.0, 83.0, 46.0, 47.0, 28.0, 26.0, 18.0, 10.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.875, -12.4033203125, -11.931640625, -11.4599609375, -10.98828125, -10.5166015625, -10.044921875, -9.5732421875, -9.1015625, -8.6298828125, -8.158203125, -7.6865234375, -7.21484375, -6.7431640625, -6.271484375, -5.7998046875, -5.328125, -4.8564453125, -4.384765625, -3.9130859375, -3.44140625, -2.9697265625, -2.498046875, -2.0263671875, -1.5546875, -1.0830078125, -0.611328125, -0.1396484375, 0.33203125, 0.8037109375, 1.275390625, 1.7470703125, 2.21875, 2.6904296875, 3.162109375, 3.6337890625, 4.10546875, 4.5771484375, 5.048828125, 5.5205078125, 5.9921875, 6.4638671875, 6.935546875, 7.4072265625, 7.87890625, 8.3505859375, 8.822265625, 9.2939453125, 9.765625, 10.2373046875, 10.708984375, 11.1806640625, 11.65234375, 12.1240234375, 12.595703125, 13.0673828125, 13.5390625, 14.0107421875, 14.482421875, 14.9541015625, 15.42578125, 15.8974609375, 16.369140625, 16.8408203125, 17.3125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 12.0, 10.0, 13.0, 8.0, 14.0, 28.0, 33.0, 58.0, 58.0, 111.0, 224.0, 708.0, 1979.0, 377.0, 142.0, 83.0, 58.0, 35.0, 21.0, 22.0, 14.0, 14.0, 7.0, 10.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.67523193359375, -2.5867919921875, -2.49835205078125, -2.409912109375, -2.32147216796875, -2.2330322265625, -2.14459228515625, -2.05615234375, -1.96771240234375, -1.8792724609375, -1.79083251953125, -1.702392578125, -1.61395263671875, -1.5255126953125, -1.43707275390625, -1.3486328125, -1.26019287109375, -1.1717529296875, -1.08331298828125, -0.994873046875, -0.90643310546875, -0.8179931640625, -0.72955322265625, -0.64111328125, -0.55267333984375, -0.4642333984375, -0.37579345703125, -0.287353515625, -0.19891357421875, -0.1104736328125, -0.02203369140625, 0.06640625, 0.15484619140625, 0.2432861328125, 0.33172607421875, 0.420166015625, 0.50860595703125, 0.5970458984375, 0.68548583984375, 0.77392578125, 0.86236572265625, 0.9508056640625, 1.03924560546875, 1.127685546875, 1.21612548828125, 1.3045654296875, 1.39300537109375, 1.4814453125, 1.56988525390625, 1.6583251953125, 1.74676513671875, 1.835205078125, 1.92364501953125, 2.0120849609375, 2.10052490234375, 2.18896484375, 2.27740478515625, 2.3658447265625, 2.45428466796875, 2.542724609375, 2.63116455078125, 2.7196044921875, 2.80804443359375, 2.896484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 11.0, 12.0, 51.0, 110.0, 213.0, 254.0, 184.0, 93.0, 39.0, 24.0, 9.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.580196380615234, -30.468481063842773, -29.356765747070312, -28.24505043029785, -27.13333511352539, -26.021621704101562, -24.9099063873291, -23.79819107055664, -22.68647575378418, -21.57476043701172, -20.463045120239258, -19.351329803466797, -18.23961639404297, -17.127899169921875, -16.016185760498047, -14.904470443725586, -13.792755126953125, -12.681039810180664, -11.569324493408203, -10.457610130310059, -9.345894813537598, -8.234179496765137, -7.122464656829834, -6.010749816894531, -4.89903450012207, -3.7873194217681885, -2.6756043434143066, -1.5638892650604248, -0.45217418670654297, 0.659541130065918, 1.7712559700012207, 2.8829708099365234, 3.99468994140625, 5.106405258178711, 6.218120098114014, 7.329834938049316, 8.441550254821777, 9.553265571594238, 10.664979934692383, 11.776695251464844, 12.888410568237305, 14.000125885009766, 15.111841201782227, 16.223556518554688, 17.335269927978516, 18.44698715209961, 19.558700561523438, 20.6704158782959, 21.78213119506836, 22.89384651184082, 24.00556182861328, 25.117277145385742, 26.228992462158203, 27.34070587158203, 28.452421188354492, 29.564136505126953, 30.675851821899414, 31.787567138671875, 32.8992805480957, 34.0109977722168, 35.122711181640625, 36.23442840576172, 37.34614181518555, 38.457855224609375, 39.56957244873047]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 6.0, 7.0, 10.0, 15.0, 19.0, 12.0, 15.0, 28.0, 33.0, 36.0, 41.0, 41.0, 31.0, 42.0, 55.0, 43.0, 50.0, 47.0, 44.0, 50.0, 46.0, 42.0, 53.0, 40.0, 35.0, 29.0, 25.0, 16.0, 20.0, 18.0, 8.0, 7.0, 4.0, 5.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.317593574523926, -9.037435531616211, -8.75727653503418, -8.477118492126465, -8.19696044921875, -7.916801929473877, -7.636643409729004, -7.356485366821289, -7.076326847076416, -6.796168327331543, -6.516010284423828, -6.235851764678955, -5.955693244934082, -5.675535202026367, -5.395376682281494, -5.115218162536621, -4.835060119628906, -4.554901599884033, -4.274743556976318, -3.9945850372314453, -3.7144267559051514, -3.4342684745788574, -3.1541099548339844, -2.8739516735076904, -2.5937933921813965, -2.3136351108551025, -2.0334768295288086, -1.7533183097839355, -1.4731600284576416, -1.1930017471313477, -0.9128433465957642, -0.6326849460601807, -0.3525276184082031, -0.0723692774772644, 0.20778906345367432, 0.48794740438461304, 0.7681057453155518, 1.0482640266418457, 1.3284224271774292, 1.6085808277130127, 1.8887391090393066, 2.1688973903656006, 2.4490556716918945, 2.7292141914367676, 3.0093724727630615, 3.2895307540893555, 3.5696892738342285, 3.8498475551605225, 4.130005836486816, 4.4101643562316895, 4.690322399139404, 4.970480918884277, 5.250638961791992, 5.530797481536865, 5.810956001281738, 6.091114044189453, 6.371272563934326, 6.651431083679199, 6.931589126586914, 7.211747646331787, 7.49190616607666, 7.772064208984375, 8.05222225189209, 8.332381248474121, 8.612539291381836]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 17.0, 16.0, 38.0, 48.0, 57.0, 105.0, 181.0, 302.0, 436.0, 682.0, 1254.0, 2110.0, 3631.0, 6422.0, 11905.0, 22080.0, 41290.0, 78455.0, 145960.0, 255386.0, 220596.0, 119604.0, 63877.0, 33838.0, 17670.0, 9673.0, 5469.0, 3011.0, 1734.0, 982.0, 605.0, 384.0, 232.0, 147.0, 105.0, 65.0, 60.0, 34.0, 14.0, 8.0, 19.0, 10.0, 1.0, 8.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.99609375, -4.83917236328125, -4.6822509765625, -4.52532958984375, -4.368408203125, -4.21148681640625, -4.0545654296875, -3.89764404296875, -3.74072265625, -3.58380126953125, -3.4268798828125, -3.26995849609375, -3.113037109375, -2.95611572265625, -2.7991943359375, -2.64227294921875, -2.4853515625, -2.32843017578125, -2.1715087890625, -2.01458740234375, -1.857666015625, -1.70074462890625, -1.5438232421875, -1.38690185546875, -1.22998046875, -1.07305908203125, -0.9161376953125, -0.75921630859375, -0.602294921875, -0.44537353515625, -0.2884521484375, -0.13153076171875, 0.025390625, 0.18231201171875, 0.3392333984375, 0.49615478515625, 0.653076171875, 0.80999755859375, 0.9669189453125, 1.12384033203125, 1.28076171875, 1.43768310546875, 1.5946044921875, 1.75152587890625, 1.908447265625, 2.06536865234375, 2.2222900390625, 2.37921142578125, 2.5361328125, 2.69305419921875, 2.8499755859375, 3.00689697265625, 3.163818359375, 3.32073974609375, 3.4776611328125, 3.63458251953125, 3.79150390625, 3.94842529296875, 4.1053466796875, 4.26226806640625, 4.419189453125, 4.57611083984375, 4.7330322265625, 4.88995361328125, 5.046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 5.0, 7.0, 19.0, 21.0, 29.0, 33.0, 35.0, 30.0, 46.0, 42.0, 53.0, 63.0, 71.0, 65.0, 51.0, 58.0, 47.0, 59.0, 47.0, 31.0, 32.0, 24.0, 26.0, 24.0, 18.0, 13.0, 6.0, 5.0, 7.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9970703125, -0.968994140625, -0.94091796875, -0.912841796875, -0.884765625, -0.856689453125, -0.82861328125, -0.800537109375, -0.7724609375, -0.744384765625, -0.71630859375, -0.688232421875, -0.66015625, -0.632080078125, -0.60400390625, -0.575927734375, -0.5478515625, -0.519775390625, -0.49169921875, -0.463623046875, -0.435546875, -0.407470703125, -0.37939453125, -0.351318359375, -0.3232421875, -0.295166015625, -0.26708984375, -0.239013671875, -0.2109375, -0.182861328125, -0.15478515625, -0.126708984375, -0.0986328125, -0.070556640625, -0.04248046875, -0.014404296875, 0.013671875, 0.041748046875, 0.06982421875, 0.097900390625, 0.1259765625, 0.154052734375, 0.18212890625, 0.210205078125, 0.23828125, 0.266357421875, 0.29443359375, 0.322509765625, 0.3505859375, 0.378662109375, 0.40673828125, 0.434814453125, 0.462890625, 0.490966796875, 0.51904296875, 0.547119140625, 0.5751953125, 0.603271484375, 0.63134765625, 0.659423828125, 0.6875, 0.715576171875, 0.74365234375, 0.771728515625, 0.7998046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 3.0, 6.0, 6.0, 9.0, 21.0, 20.0, 29.0, 29.0, 42.0, 63.0, 115.0, 101.0, 139.0, 209.0, 337.0, 484.0, 766.0, 1250.0, 2050.0, 3620.0, 7278.0, 14714.0, 32870.0, 74785.0, 170820.0, 331222.0, 224374.0, 100153.0, 43166.0, 19150.0, 9280.0, 4585.0, 2531.0, 1518.0, 909.0, 568.0, 369.0, 268.0, 168.0, 143.0, 93.0, 82.0, 67.0, 33.0, 29.0, 20.0, 21.0, 8.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.77734375, -5.5826416015625, -5.387939453125, -5.1932373046875, -4.99853515625, -4.8038330078125, -4.609130859375, -4.4144287109375, -4.2197265625, -4.0250244140625, -3.830322265625, -3.6356201171875, -3.44091796875, -3.2462158203125, -3.051513671875, -2.8568115234375, -2.662109375, -2.4674072265625, -2.272705078125, -2.0780029296875, -1.88330078125, -1.6885986328125, -1.493896484375, -1.2991943359375, -1.1044921875, -0.9097900390625, -0.715087890625, -0.5203857421875, -0.32568359375, -0.1309814453125, 0.063720703125, 0.2584228515625, 0.453125, 0.6478271484375, 0.842529296875, 1.0372314453125, 1.23193359375, 1.4266357421875, 1.621337890625, 1.8160400390625, 2.0107421875, 2.2054443359375, 2.400146484375, 2.5948486328125, 2.78955078125, 2.9842529296875, 3.178955078125, 3.3736572265625, 3.568359375, 3.7630615234375, 3.957763671875, 4.1524658203125, 4.34716796875, 4.5418701171875, 4.736572265625, 4.9312744140625, 5.1259765625, 5.3206787109375, 5.515380859375, 5.7100830078125, 5.90478515625, 6.0994873046875, 6.294189453125, 6.4888916015625, 6.68359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 9.0, 5.0, 8.0, 12.0, 11.0, 16.0, 14.0, 7.0, 22.0, 21.0, 25.0, 30.0, 29.0, 26.0, 28.0, 42.0, 36.0, 35.0, 40.0, 38.0, 45.0, 40.0, 35.0, 48.0, 40.0, 44.0, 39.0, 31.0, 23.0, 22.0, 16.0, 16.0, 16.0, 18.0, 20.0, 14.0, 10.0, 11.0, 12.0, 7.0, 7.0, 6.0, 2.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.595703125, -3.48052978515625, -3.3653564453125, -3.25018310546875, -3.135009765625, -3.01983642578125, -2.9046630859375, -2.78948974609375, -2.67431640625, -2.55914306640625, -2.4439697265625, -2.32879638671875, -2.213623046875, -2.09844970703125, -1.9832763671875, -1.86810302734375, -1.7529296875, -1.63775634765625, -1.5225830078125, -1.40740966796875, -1.292236328125, -1.17706298828125, -1.0618896484375, -0.94671630859375, -0.83154296875, -0.71636962890625, -0.6011962890625, -0.48602294921875, -0.370849609375, -0.25567626953125, -0.1405029296875, -0.02532958984375, 0.08984375, 0.20501708984375, 0.3201904296875, 0.43536376953125, 0.550537109375, 0.66571044921875, 0.7808837890625, 0.89605712890625, 1.01123046875, 1.12640380859375, 1.2415771484375, 1.35675048828125, 1.471923828125, 1.58709716796875, 1.7022705078125, 1.81744384765625, 1.9326171875, 2.04779052734375, 2.1629638671875, 2.27813720703125, 2.393310546875, 2.50848388671875, 2.6236572265625, 2.73883056640625, 2.85400390625, 2.96917724609375, 3.0843505859375, 3.19952392578125, 3.314697265625, 3.42987060546875, 3.5450439453125, 3.66021728515625, 3.775390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 8.0, 17.0, 19.0, 26.0, 31.0, 57.0, 83.0, 122.0, 226.0, 357.0, 733.0, 1521.0, 3795.0, 11047.0, 42731.0, 403580.0, 513497.0, 50688.0, 12273.0, 4308.0, 1648.0, 786.0, 379.0, 218.0, 130.0, 77.0, 59.0, 31.0, 21.0, 22.0, 14.0, 9.0, 6.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.7967529296875, -6.554443359375, -6.3121337890625, -6.06982421875, -5.8275146484375, -5.585205078125, -5.3428955078125, -5.1005859375, -4.8582763671875, -4.615966796875, -4.3736572265625, -4.13134765625, -3.8890380859375, -3.646728515625, -3.4044189453125, -3.162109375, -2.9197998046875, -2.677490234375, -2.4351806640625, -2.19287109375, -1.9505615234375, -1.708251953125, -1.4659423828125, -1.2236328125, -0.9813232421875, -0.739013671875, -0.4967041015625, -0.25439453125, -0.0120849609375, 0.230224609375, 0.4725341796875, 0.71484375, 0.9571533203125, 1.199462890625, 1.4417724609375, 1.68408203125, 1.9263916015625, 2.168701171875, 2.4110107421875, 2.6533203125, 2.8956298828125, 3.137939453125, 3.3802490234375, 3.62255859375, 3.8648681640625, 4.107177734375, 4.3494873046875, 4.591796875, 4.8341064453125, 5.076416015625, 5.3187255859375, 5.56103515625, 5.8033447265625, 6.045654296875, 6.2879638671875, 6.5302734375, 6.7725830078125, 7.014892578125, 7.2572021484375, 7.49951171875, 7.7418212890625, 7.984130859375, 8.2264404296875, 8.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 12.0, 25.0, 39.0, 51.0, 83.0, 143.0, 179.0, 146.0, 98.0, 73.0, 33.0, 22.0, 18.0, 9.0, 8.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012302398681640625, -0.0011982619762420654, -0.0011662840843200684, -0.0011343061923980713, -0.0011023283004760742, -0.0010703504085540771, -0.00103837251663208, -0.001006394624710083, -0.0009744167327880859, -0.0009424388408660889, -0.0009104609489440918, -0.0008784830570220947, -0.0008465051651000977, -0.0008145272731781006, -0.0007825493812561035, -0.0007505714893341064, -0.0007185935974121094, -0.0006866157054901123, -0.0006546378135681152, -0.0006226599216461182, -0.0005906820297241211, -0.000558704137802124, -0.000526726245880127, -0.0004947483539581299, -0.0004627704620361328, -0.00043079257011413574, -0.00039881467819213867, -0.0003668367862701416, -0.00033485889434814453, -0.00030288100242614746, -0.0002709031105041504, -0.00023892521858215332, -0.00020694732666015625, -0.00017496943473815918, -0.0001429915428161621, -0.00011101365089416504, -7.903575897216797e-05, -4.70578670501709e-05, -1.5079975128173828e-05, 1.6897916793823242e-05, 4.887580871582031e-05, 8.085370063781738e-05, 0.00011283159255981445, 0.00014480948448181152, 0.0001767873764038086, 0.00020876526832580566, 0.00024074316024780273, 0.0002727210521697998, 0.0003046989440917969, 0.00033667683601379395, 0.000368654727935791, 0.0004006326198577881, 0.00043261051177978516, 0.0004645884037017822, 0.0004965662956237793, 0.0005285441875457764, 0.0005605220794677734, 0.0005924999713897705, 0.0006244778633117676, 0.0006564557552337646, 0.0006884336471557617, 0.0007204115390777588, 0.0007523894309997559, 0.0007843673229217529, 0.00081634521484375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 18.0, 27.0, 38.0, 63.0, 115.0, 218.0, 389.0, 879.0, 2379.0, 7897.0, 36856.0, 556728.0, 401572.0, 30568.0, 7047.0, 2100.0, 801.0, 393.0, 189.0, 106.0, 57.0, 34.0, 22.0, 11.0, 7.0, 8.0, 6.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.2384033203125, -8.929931640625, -8.6214599609375, -8.31298828125, -8.0045166015625, -7.696044921875, -7.3875732421875, -7.0791015625, -6.7706298828125, -6.462158203125, -6.1536865234375, -5.84521484375, -5.5367431640625, -5.228271484375, -4.9197998046875, -4.611328125, -4.3028564453125, -3.994384765625, -3.6859130859375, -3.37744140625, -3.0689697265625, -2.760498046875, -2.4520263671875, -2.1435546875, -1.8350830078125, -1.526611328125, -1.2181396484375, -0.90966796875, -0.6011962890625, -0.292724609375, 0.0157470703125, 0.32421875, 0.6326904296875, 0.941162109375, 1.2496337890625, 1.55810546875, 1.8665771484375, 2.175048828125, 2.4835205078125, 2.7919921875, 3.1004638671875, 3.408935546875, 3.7174072265625, 4.02587890625, 4.3343505859375, 4.642822265625, 4.9512939453125, 5.259765625, 5.5682373046875, 5.876708984375, 6.1851806640625, 6.49365234375, 6.8021240234375, 7.110595703125, 7.4190673828125, 7.7275390625, 8.0360107421875, 8.344482421875, 8.6529541015625, 8.96142578125, 9.2698974609375, 9.578369140625, 9.8868408203125, 10.1953125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 8.0, 11.0, 20.0, 25.0, 45.0, 71.0, 123.0, 170.0, 170.0, 124.0, 70.0, 51.0, 32.0, 21.0, 18.0, 6.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.660003662109375, -3.48602294921875, -3.312042236328125, -3.1380615234375, -2.964080810546875, -2.79010009765625, -2.616119384765625, -2.442138671875, -2.268157958984375, -2.09417724609375, -1.920196533203125, -1.7462158203125, -1.572235107421875, -1.39825439453125, -1.224273681640625, -1.05029296875, -0.876312255859375, -0.70233154296875, -0.528350830078125, -0.3543701171875, -0.180389404296875, -0.00640869140625, 0.167572021484375, 0.341552734375, 0.515533447265625, 0.68951416015625, 0.863494873046875, 1.0374755859375, 1.211456298828125, 1.38543701171875, 1.559417724609375, 1.7333984375, 1.907379150390625, 2.08135986328125, 2.255340576171875, 2.4293212890625, 2.603302001953125, 2.77728271484375, 2.951263427734375, 3.125244140625, 3.299224853515625, 3.47320556640625, 3.647186279296875, 3.8211669921875, 3.995147705078125, 4.16912841796875, 4.343109130859375, 4.51708984375, 4.691070556640625, 4.86505126953125, 5.039031982421875, 5.2130126953125, 5.386993408203125, 5.56097412109375, 5.734954833984375, 5.908935546875, 6.082916259765625, 6.25689697265625, 6.430877685546875, 6.6048583984375, 6.778839111328125, 6.95281982421875, 7.126800537109375, 7.30078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 12.0, 10.0, 28.0, 46.0, 93.0, 121.0, 178.0, 178.0, 141.0, 83.0, 57.0, 27.0, 14.0, 11.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.0477294921875, -68.32931518554688, -65.61090850830078, -62.892494201660156, -60.1740837097168, -57.45567321777344, -54.73725891113281, -52.01884841918945, -49.300437927246094, -46.582027435302734, -43.863616943359375, -41.14520263671875, -38.42679214477539, -35.70838165283203, -32.989967346191406, -30.271556854248047, -27.553146362304688, -24.834735870361328, -22.116323471069336, -19.397911071777344, -16.679500579833984, -13.961089134216309, -11.242677688598633, -8.52426528930664, -5.805854797363281, -3.0874433517456055, -0.3690319061279297, 2.349379539489746, 5.067790985107422, 7.786202430725098, 10.504613876342773, 13.223026275634766, 15.941436767578125, 18.659847259521484, 21.378259658813477, 24.09667205810547, 26.815082550048828, 29.533493041992188, 32.25190734863281, 34.97031784057617, 37.68872833251953, 40.40713882446289, 43.12554931640625, 45.843963623046875, 48.562374114990234, 51.280784606933594, 53.99919891357422, 56.71760940551758, 59.43601989746094, 62.1544303894043, 64.87284088134766, 67.59125518798828, 70.30966186523438, 73.028076171875, 75.74649047851562, 78.46490478515625, 81.18331146240234, 83.90172576904297, 86.62013244628906, 89.33854675292969, 92.05696105957031, 94.7753677368164, 97.49378204345703, 100.21218872070312, 102.93060302734375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 15.0, 13.0, 16.0, 18.0, 19.0, 41.0, 36.0, 44.0, 54.0, 62.0, 54.0, 62.0, 61.0, 67.0, 50.0, 57.0, 54.0, 45.0, 52.0, 35.0, 34.0, 28.0, 17.0, 13.0, 6.0, 13.0, 7.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.942474365234375, -38.793426513671875, -37.644378662109375, -36.49532699584961, -35.34627914428711, -34.19723129272461, -33.04818344116211, -31.89913558959961, -30.750085830688477, -29.601037979125977, -28.451988220214844, -27.302940368652344, -26.153892517089844, -25.00484275817871, -23.85579490661621, -22.706745147705078, -21.557697296142578, -20.408649444580078, -19.259599685668945, -18.110551834106445, -16.961502075195312, -15.812454223632812, -14.663406372070312, -13.514357566833496, -12.36530876159668, -11.216259956359863, -10.067211151123047, -8.918163299560547, -7.7691144943237305, -6.620065689086914, -5.471017360687256, -4.321969032287598, -3.172924041748047, -2.0238754749298096, -0.8748269081115723, 0.27422165870666504, 1.4232702255249023, 2.5723190307617188, 3.721367359161377, 4.870415687561035, 6.019464492797852, 7.168513298034668, 8.317562103271484, 9.466609954833984, 10.6156587600708, 11.764707565307617, 12.913755416870117, 14.062804222106934, 15.21185302734375, 16.36090087890625, 17.509950637817383, 18.658998489379883, 19.808048248291016, 20.957096099853516, 22.106143951416016, 23.255191802978516, 24.40424156188965, 25.55328941345215, 26.70233917236328, 27.85138702392578, 29.00043487548828, 30.149484634399414, 31.298532485961914, 32.44758224487305, 33.59663009643555]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 15.0, 15.0, 20.0, 43.0, 47.0, 84.0, 132.0, 248.0, 430.0, 926.0, 2019.0, 4813.0, 14464.0, 69224.0, 3832206.0, 228526.0, 27725.0, 7879.0, 2919.0, 1232.0, 608.0, 303.0, 167.0, 90.0, 46.0, 26.0, 26.0, 21.0, 7.0, 8.0, 1.0, 2.0, 0.0, 4.0], "bins": [-18.296875, -17.8878173828125, -17.478759765625, -17.0697021484375, -16.66064453125, -16.2515869140625, -15.842529296875, -15.4334716796875, -15.0244140625, -14.6153564453125, -14.206298828125, -13.7972412109375, -13.38818359375, -12.9791259765625, -12.570068359375, -12.1610107421875, -11.751953125, -11.3428955078125, -10.933837890625, -10.5247802734375, -10.11572265625, -9.7066650390625, -9.297607421875, -8.8885498046875, -8.4794921875, -8.0704345703125, -7.661376953125, -7.2523193359375, -6.84326171875, -6.4342041015625, -6.025146484375, -5.6160888671875, -5.20703125, -4.7979736328125, -4.388916015625, -3.9798583984375, -3.57080078125, -3.1617431640625, -2.752685546875, -2.3436279296875, -1.9345703125, -1.5255126953125, -1.116455078125, -0.7073974609375, -0.29833984375, 0.1107177734375, 0.519775390625, 0.9288330078125, 1.337890625, 1.7469482421875, 2.156005859375, 2.5650634765625, 2.97412109375, 3.3831787109375, 3.792236328125, 4.2012939453125, 4.6103515625, 5.0194091796875, 5.428466796875, 5.8375244140625, 6.24658203125, 6.6556396484375, 7.064697265625, 7.4737548828125, 7.8828125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 13.0, 13.0, 7.0, 22.0, 20.0, 31.0, 32.0, 53.0, 50.0, 73.0, 67.0, 68.0, 77.0, 81.0, 66.0, 56.0, 51.0, 43.0, 31.0, 33.0, 22.0, 23.0, 22.0, 11.0, 7.0, 9.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.509765625, -1.4750289916992188, -1.4402923583984375, -1.4055557250976562, -1.370819091796875, -1.3360824584960938, -1.3013458251953125, -1.2666091918945312, -1.23187255859375, -1.1971359252929688, -1.1623992919921875, -1.1276626586914062, -1.092926025390625, -1.0581893920898438, -1.0234527587890625, -0.9887161254882812, -0.9539794921875, -0.9192428588867188, -0.8845062255859375, -0.8497695922851562, -0.815032958984375, -0.7802963256835938, -0.7455596923828125, -0.7108230590820312, -0.67608642578125, -0.6413497924804688, -0.6066131591796875, -0.5718765258789062, -0.537139892578125, -0.5024032592773438, -0.4676666259765625, -0.43292999267578125, -0.398193359375, -0.36345672607421875, -0.3287200927734375, -0.29398345947265625, -0.259246826171875, -0.22451019287109375, -0.1897735595703125, -0.15503692626953125, -0.12030029296875, -0.08556365966796875, -0.0508270263671875, -0.01609039306640625, 0.018646240234375, 0.05338287353515625, 0.0881195068359375, 0.12285614013671875, 0.1575927734375, 0.19232940673828125, 0.2270660400390625, 0.26180267333984375, 0.296539306640625, 0.33127593994140625, 0.3660125732421875, 0.40074920654296875, 0.43548583984375, 0.47022247314453125, 0.5049591064453125, 0.5396957397460938, 0.574432373046875, 0.6091690063476562, 0.6439056396484375, 0.6786422729492188, 0.71337890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 10.0, 8.0, 17.0, 21.0, 35.0, 51.0, 60.0, 142.0, 234.0, 399.0, 731.0, 1428.0, 2783.0, 5804.0, 13163.0, 36054.0, 154436.0, 3634011.0, 265387.0, 48842.0, 16585.0, 7021.0, 3387.0, 1651.0, 824.0, 494.0, 253.0, 150.0, 100.0, 68.0, 37.0, 23.0, 21.0, 19.0, 10.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.5736083984375, -8.225341796875, -7.8770751953125, -7.52880859375, -7.1805419921875, -6.832275390625, -6.4840087890625, -6.1357421875, -5.7874755859375, -5.439208984375, -5.0909423828125, -4.74267578125, -4.3944091796875, -4.046142578125, -3.6978759765625, -3.349609375, -3.0013427734375, -2.653076171875, -2.3048095703125, -1.95654296875, -1.6082763671875, -1.260009765625, -0.9117431640625, -0.5634765625, -0.2152099609375, 0.133056640625, 0.4813232421875, 0.82958984375, 1.1778564453125, 1.526123046875, 1.8743896484375, 2.22265625, 2.5709228515625, 2.919189453125, 3.2674560546875, 3.61572265625, 3.9639892578125, 4.312255859375, 4.6605224609375, 5.0087890625, 5.3570556640625, 5.705322265625, 6.0535888671875, 6.40185546875, 6.7501220703125, 7.098388671875, 7.4466552734375, 7.794921875, 8.1431884765625, 8.491455078125, 8.8397216796875, 9.18798828125, 9.5362548828125, 9.884521484375, 10.2327880859375, 10.5810546875, 10.9293212890625, 11.277587890625, 11.6258544921875, 11.97412109375, 12.3223876953125, 12.670654296875, 13.0189208984375, 13.3671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 5.0, 5.0, 9.0, 14.0, 17.0, 17.0, 29.0, 28.0, 39.0, 67.0, 105.0, 233.0, 800.0, 1918.0, 291.0, 147.0, 96.0, 49.0, 54.0, 31.0, 27.0, 13.0, 11.0, 13.0, 10.0, 9.0, 10.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.818359375, -1.7430419921875, -1.667724609375, -1.5924072265625, -1.51708984375, -1.4417724609375, -1.366455078125, -1.2911376953125, -1.2158203125, -1.1405029296875, -1.065185546875, -0.9898681640625, -0.91455078125, -0.8392333984375, -0.763916015625, -0.6885986328125, -0.61328125, -0.5379638671875, -0.462646484375, -0.3873291015625, -0.31201171875, -0.2366943359375, -0.161376953125, -0.0860595703125, -0.0107421875, 0.0645751953125, 0.139892578125, 0.2152099609375, 0.29052734375, 0.3658447265625, 0.441162109375, 0.5164794921875, 0.591796875, 0.6671142578125, 0.742431640625, 0.8177490234375, 0.89306640625, 0.9683837890625, 1.043701171875, 1.1190185546875, 1.1943359375, 1.2696533203125, 1.344970703125, 1.4202880859375, 1.49560546875, 1.5709228515625, 1.646240234375, 1.7215576171875, 1.796875, 1.8721923828125, 1.947509765625, 2.0228271484375, 2.09814453125, 2.1734619140625, 2.248779296875, 2.3240966796875, 2.3994140625, 2.4747314453125, 2.550048828125, 2.6253662109375, 2.70068359375, 2.7760009765625, 2.851318359375, 2.9266357421875, 3.001953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 13.0, 20.0, 49.0, 108.0, 156.0, 213.0, 187.0, 126.0, 66.0, 28.0, 16.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.00547790527344, -38.11093521118164, -37.216392517089844, -36.32184982299805, -35.42730712890625, -34.53276062011719, -33.63821792602539, -32.743675231933594, -31.849132537841797, -30.95458984375, -30.060047149658203, -29.165502548217773, -28.270959854125977, -27.37641716003418, -26.48187255859375, -25.587329864501953, -24.692787170410156, -23.79824447631836, -22.903701782226562, -22.009157180786133, -21.114614486694336, -20.22007179260254, -19.32552719116211, -18.430984497070312, -17.536441802978516, -16.64189910888672, -15.747355461120605, -14.852811813354492, -13.958269119262695, -13.063726425170898, -12.169182777404785, -11.274639129638672, -10.380096435546875, -9.485553741455078, -8.591010093688965, -7.69646692276001, -6.801923751831055, -5.9073805809021, -5.0128374099731445, -4.1182942390441895, -3.2237510681152344, -2.3292078971862793, -1.4346647262573242, -0.5401215553283691, 0.35442161560058594, 1.248964786529541, 2.143507957458496, 3.038051128387451, 3.9325942993164062, 4.827137470245361, 5.721680641174316, 6.6162238121032715, 7.510766983032227, 8.405309677124023, 9.299853324890137, 10.19439697265625, 11.088939666748047, 11.983482360839844, 12.878026008605957, 13.77256965637207, 14.667112350463867, 15.561655044555664, 16.456199645996094, 17.35074234008789, 18.245285034179688]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 5.0, 5.0, 7.0, 14.0, 17.0, 23.0, 13.0, 11.0, 23.0, 35.0, 31.0, 36.0, 40.0, 48.0, 39.0, 38.0, 43.0, 51.0, 43.0, 42.0, 42.0, 46.0, 37.0, 30.0, 44.0, 33.0, 33.0, 30.0, 16.0, 33.0, 23.0, 17.0, 11.0, 5.0, 11.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.430156707763672, -7.18192195892334, -6.933687686920166, -6.685452938079834, -6.43721866607666, -6.188983917236328, -5.940749168395996, -5.692514896392822, -5.444280624389648, -5.196045875549316, -4.947811603546143, -4.6995768547058105, -4.451342582702637, -4.203107833862305, -3.9548733234405518, -3.706638813018799, -3.458404064178467, -3.210169553756714, -2.961935043334961, -2.713700294494629, -2.465466022491455, -2.217231273651123, -1.9689967632293701, -1.7207622528076172, -1.4725277423858643, -1.2242932319641113, -0.9760586619377136, -0.7278240919113159, -0.479589581489563, -0.23135507106781006, 0.016879558563232422, 0.26511406898498535, 0.5133485794067383, 0.7615830898284912, 1.0098176002502441, 1.2580522298812866, 1.5062867403030396, 1.7545212507247925, 2.002755880355835, 2.250990390777588, 2.499224901199341, 2.7474594116210938, 2.9956939220428467, 3.2439284324645996, 3.4921631813049316, 3.7403974533081055, 3.9886322021484375, 4.2368669509887695, 4.485101222991943, 4.733335971832275, 4.981570243835449, 5.229804992675781, 5.478039264678955, 5.726274013519287, 5.974508285522461, 6.222743034362793, 6.470977783203125, 6.719212532043457, 6.967446804046631, 7.215681552886963, 7.463915824890137, 7.712150573730469, 7.960385322570801, 8.208620071411133, 8.456853866577148]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 12.0, 19.0, 26.0, 54.0, 70.0, 104.0, 187.0, 350.0, 629.0, 1088.0, 2115.0, 4302.0, 9193.0, 20265.0, 46746.0, 108120.0, 230911.0, 308661.0, 175071.0, 78224.0, 33771.0, 14914.0, 6783.0, 3273.0, 1655.0, 843.0, 474.0, 268.0, 158.0, 101.0, 65.0, 30.0, 21.0, 13.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.078125, -5.8956298828125, -5.713134765625, -5.5306396484375, -5.34814453125, -5.1656494140625, -4.983154296875, -4.8006591796875, -4.6181640625, -4.4356689453125, -4.253173828125, -4.0706787109375, -3.88818359375, -3.7056884765625, -3.523193359375, -3.3406982421875, -3.158203125, -2.9757080078125, -2.793212890625, -2.6107177734375, -2.42822265625, -2.2457275390625, -2.063232421875, -1.8807373046875, -1.6982421875, -1.5157470703125, -1.333251953125, -1.1507568359375, -0.96826171875, -0.7857666015625, -0.603271484375, -0.4207763671875, -0.23828125, -0.0557861328125, 0.126708984375, 0.3092041015625, 0.49169921875, 0.6741943359375, 0.856689453125, 1.0391845703125, 1.2216796875, 1.4041748046875, 1.586669921875, 1.7691650390625, 1.95166015625, 2.1341552734375, 2.316650390625, 2.4991455078125, 2.681640625, 2.8641357421875, 3.046630859375, 3.2291259765625, 3.41162109375, 3.5941162109375, 3.776611328125, 3.9591064453125, 4.1416015625, 4.3240966796875, 4.506591796875, 4.6890869140625, 4.87158203125, 5.0540771484375, 5.236572265625, 5.4190673828125, 5.6015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 5.0, 6.0, 6.0, 13.0, 13.0, 17.0, 12.0, 29.0, 38.0, 30.0, 47.0, 54.0, 41.0, 51.0, 59.0, 51.0, 55.0, 49.0, 55.0, 57.0, 39.0, 41.0, 37.0, 30.0, 29.0, 29.0, 18.0, 12.0, 20.0, 12.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.037109375, -1.00927734375, -0.9814453125, -0.95361328125, -0.92578125, -0.89794921875, -0.8701171875, -0.84228515625, -0.814453125, -0.78662109375, -0.7587890625, -0.73095703125, -0.703125, -0.67529296875, -0.6474609375, -0.61962890625, -0.591796875, -0.56396484375, -0.5361328125, -0.50830078125, -0.48046875, -0.45263671875, -0.4248046875, -0.39697265625, -0.369140625, -0.34130859375, -0.3134765625, -0.28564453125, -0.2578125, -0.22998046875, -0.2021484375, -0.17431640625, -0.146484375, -0.11865234375, -0.0908203125, -0.06298828125, -0.03515625, -0.00732421875, 0.0205078125, 0.04833984375, 0.076171875, 0.10400390625, 0.1318359375, 0.15966796875, 0.1875, 0.21533203125, 0.2431640625, 0.27099609375, 0.298828125, 0.32666015625, 0.3544921875, 0.38232421875, 0.41015625, 0.43798828125, 0.4658203125, 0.49365234375, 0.521484375, 0.54931640625, 0.5771484375, 0.60498046875, 0.6328125, 0.66064453125, 0.6884765625, 0.71630859375, 0.744140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 16.0, 17.0, 27.0, 28.0, 43.0, 69.0, 120.0, 160.0, 270.0, 474.0, 765.0, 1276.0, 2305.0, 4822.0, 11459.0, 32475.0, 110127.0, 356455.0, 360370.0, 112326.0, 32855.0, 11532.0, 4845.0, 2408.0, 1259.0, 744.0, 455.0, 303.0, 165.0, 112.0, 87.0, 37.0, 34.0, 25.0, 25.0, 13.0, 14.0, 8.0, 6.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.68438720703125, -6.4273681640625, -6.17034912109375, -5.913330078125, -5.65631103515625, -5.3992919921875, -5.14227294921875, -4.88525390625, -4.62823486328125, -4.3712158203125, -4.11419677734375, -3.857177734375, -3.60015869140625, -3.3431396484375, -3.08612060546875, -2.8291015625, -2.57208251953125, -2.3150634765625, -2.05804443359375, -1.801025390625, -1.54400634765625, -1.2869873046875, -1.02996826171875, -0.77294921875, -0.51593017578125, -0.2589111328125, -0.00189208984375, 0.255126953125, 0.51214599609375, 0.7691650390625, 1.02618408203125, 1.283203125, 1.54022216796875, 1.7972412109375, 2.05426025390625, 2.311279296875, 2.56829833984375, 2.8253173828125, 3.08233642578125, 3.33935546875, 3.59637451171875, 3.8533935546875, 4.11041259765625, 4.367431640625, 4.62445068359375, 4.8814697265625, 5.13848876953125, 5.3955078125, 5.65252685546875, 5.9095458984375, 6.16656494140625, 6.423583984375, 6.68060302734375, 6.9376220703125, 7.19464111328125, 7.45166015625, 7.70867919921875, 7.9656982421875, 8.22271728515625, 8.479736328125, 8.73675537109375, 8.9937744140625, 9.25079345703125, 9.5078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 8.0, 5.0, 7.0, 11.0, 11.0, 10.0, 20.0, 15.0, 18.0, 16.0, 32.0, 19.0, 22.0, 36.0, 49.0, 57.0, 45.0, 36.0, 51.0, 49.0, 49.0, 46.0, 35.0, 30.0, 32.0, 24.0, 42.0, 32.0, 22.0, 21.0, 30.0, 20.0, 18.0, 16.0, 10.0, 11.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.326904296875, -3.20458984375, -3.082275390625, -2.9599609375, -2.837646484375, -2.71533203125, -2.593017578125, -2.470703125, -2.348388671875, -2.22607421875, -2.103759765625, -1.9814453125, -1.859130859375, -1.73681640625, -1.614501953125, -1.4921875, -1.369873046875, -1.24755859375, -1.125244140625, -1.0029296875, -0.880615234375, -0.75830078125, -0.635986328125, -0.513671875, -0.391357421875, -0.26904296875, -0.146728515625, -0.0244140625, 0.097900390625, 0.22021484375, 0.342529296875, 0.46484375, 0.587158203125, 0.70947265625, 0.831787109375, 0.9541015625, 1.076416015625, 1.19873046875, 1.321044921875, 1.443359375, 1.565673828125, 1.68798828125, 1.810302734375, 1.9326171875, 2.054931640625, 2.17724609375, 2.299560546875, 2.421875, 2.544189453125, 2.66650390625, 2.788818359375, 2.9111328125, 3.033447265625, 3.15576171875, 3.278076171875, 3.400390625, 3.522705078125, 3.64501953125, 3.767333984375, 3.8896484375, 4.011962890625, 4.13427734375, 4.256591796875, 4.37890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 10.0, 12.0, 24.0, 21.0, 38.0, 43.0, 81.0, 113.0, 250.0, 453.0, 992.0, 2491.0, 7344.0, 38716.0, 933849.0, 50814.0, 8177.0, 2766.0, 1166.0, 526.0, 236.0, 143.0, 88.0, 55.0, 34.0, 21.0, 12.0, 17.0, 4.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.51904296875, -15.9599609375, -15.40087890625, -14.841796875, -14.28271484375, -13.7236328125, -13.16455078125, -12.60546875, -12.04638671875, -11.4873046875, -10.92822265625, -10.369140625, -9.81005859375, -9.2509765625, -8.69189453125, -8.1328125, -7.57373046875, -7.0146484375, -6.45556640625, -5.896484375, -5.33740234375, -4.7783203125, -4.21923828125, -3.66015625, -3.10107421875, -2.5419921875, -1.98291015625, -1.423828125, -0.86474609375, -0.3056640625, 0.25341796875, 0.8125, 1.37158203125, 1.9306640625, 2.48974609375, 3.048828125, 3.60791015625, 4.1669921875, 4.72607421875, 5.28515625, 5.84423828125, 6.4033203125, 6.96240234375, 7.521484375, 8.08056640625, 8.6396484375, 9.19873046875, 9.7578125, 10.31689453125, 10.8759765625, 11.43505859375, 11.994140625, 12.55322265625, 13.1123046875, 13.67138671875, 14.23046875, 14.78955078125, 15.3486328125, 15.90771484375, 16.466796875, 17.02587890625, 17.5849609375, 18.14404296875, 18.703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 12.0, 17.0, 22.0, 38.0, 68.0, 158.0, 244.0, 210.0, 103.0, 40.0, 38.0, 19.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018491744995117188, -0.001801416277885437, -0.0017536580562591553, -0.0017058998346328735, -0.0016581416130065918, -0.00161038339138031, -0.0015626251697540283, -0.0015148669481277466, -0.0014671087265014648, -0.001419350504875183, -0.0013715922832489014, -0.0013238340616226196, -0.0012760758399963379, -0.0012283176183700562, -0.0011805593967437744, -0.0011328011751174927, -0.001085042953491211, -0.0010372847318649292, -0.0009895265102386475, -0.0009417682886123657, -0.000894010066986084, -0.0008462518453598022, -0.0007984936237335205, -0.0007507354021072388, -0.000702977180480957, -0.0006552189588546753, -0.0006074607372283936, -0.0005597025156021118, -0.0005119442939758301, -0.00046418607234954834, -0.0004164278507232666, -0.00036866962909698486, -0.0003209114074707031, -0.0002731531858444214, -0.00022539496421813965, -0.0001776367425918579, -0.00012987852096557617, -8.212029933929443e-05, -3.4362077713012695e-05, 1.3396143913269043e-05, 6.115436553955078e-05, 0.00010891258716583252, 0.00015667080879211426, 0.000204429030418396, 0.00025218725204467773, 0.00029994547367095947, 0.0003477036952972412, 0.00039546191692352295, 0.0004432201385498047, 0.0004909783601760864, 0.0005387365818023682, 0.0005864948034286499, 0.0006342530250549316, 0.0006820112466812134, 0.0007297694683074951, 0.0007775276899337769, 0.0008252859115600586, 0.0008730441331863403, 0.0009208023548126221, 0.0009685605764389038, 0.0010163187980651855, 0.0010640770196914673, 0.001111835241317749, 0.0011595934629440308, 0.0012073516845703125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 13.0, 13.0, 26.0, 28.0, 56.0, 63.0, 107.0, 184.0, 299.0, 548.0, 1160.0, 2654.0, 6625.0, 23874.0, 913203.0, 81491.0, 10867.0, 4006.0, 1651.0, 715.0, 395.0, 209.0, 117.0, 77.0, 41.0, 36.0, 20.0, 14.0, 12.0, 4.0, 7.0, 4.0, 4.0, 1.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.15625, -20.4892578125, -19.822265625, -19.1552734375, -18.48828125, -17.8212890625, -17.154296875, -16.4873046875, -15.8203125, -15.1533203125, -14.486328125, -13.8193359375, -13.15234375, -12.4853515625, -11.818359375, -11.1513671875, -10.484375, -9.8173828125, -9.150390625, -8.4833984375, -7.81640625, -7.1494140625, -6.482421875, -5.8154296875, -5.1484375, -4.4814453125, -3.814453125, -3.1474609375, -2.48046875, -1.8134765625, -1.146484375, -0.4794921875, 0.1875, 0.8544921875, 1.521484375, 2.1884765625, 2.85546875, 3.5224609375, 4.189453125, 4.8564453125, 5.5234375, 6.1904296875, 6.857421875, 7.5244140625, 8.19140625, 8.8583984375, 9.525390625, 10.1923828125, 10.859375, 11.5263671875, 12.193359375, 12.8603515625, 13.52734375, 14.1943359375, 14.861328125, 15.5283203125, 16.1953125, 16.8623046875, 17.529296875, 18.1962890625, 18.86328125, 19.5302734375, 20.197265625, 20.8642578125, 21.53125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 2.0, 4.0, 9.0, 9.0, 6.0, 11.0, 35.0, 66.0, 228.0, 400.0, 122.0, 37.0, 16.0, 13.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1796875, -10.810546875, -10.44140625, -10.072265625, -9.703125, -9.333984375, -8.96484375, -8.595703125, -8.2265625, -7.857421875, -7.48828125, -7.119140625, -6.75, -6.380859375, -6.01171875, -5.642578125, -5.2734375, -4.904296875, -4.53515625, -4.166015625, -3.796875, -3.427734375, -3.05859375, -2.689453125, -2.3203125, -1.951171875, -1.58203125, -1.212890625, -0.84375, -0.474609375, -0.10546875, 0.263671875, 0.6328125, 1.001953125, 1.37109375, 1.740234375, 2.109375, 2.478515625, 2.84765625, 3.216796875, 3.5859375, 3.955078125, 4.32421875, 4.693359375, 5.0625, 5.431640625, 5.80078125, 6.169921875, 6.5390625, 6.908203125, 7.27734375, 7.646484375, 8.015625, 8.384765625, 8.75390625, 9.123046875, 9.4921875, 9.861328125, 10.23046875, 10.599609375, 10.96875, 11.337890625, 11.70703125, 12.076171875, 12.4453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 13.0, 43.0, 185.0, 342.0, 260.0, 104.0, 41.0, 12.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.1646728515625, -187.86563110351562, -181.56658935546875, -175.26754760742188, -168.96849060058594, -162.66944885253906, -156.3704071044922, -150.0713653564453, -143.77230834960938, -137.4732666015625, -131.17422485351562, -124.87517547607422, -118.57612609863281, -112.27708435058594, -105.97804260253906, -99.67900085449219, -93.37995910644531, -87.08091735839844, -80.78186798095703, -74.48282623291016, -68.18377685546875, -61.884735107421875, -55.585693359375, -49.28664779663086, -42.98760223388672, -36.68855667114258, -30.38951301574707, -24.090469360351562, -17.791423797607422, -11.492378234863281, -5.193336486816406, 1.1057090759277344, 7.4047698974609375, 13.703814506530762, 20.002859115600586, 26.301902770996094, 32.600948333740234, 38.899993896484375, 45.19903564453125, 51.49808120727539, 57.79712677001953, 64.0961685180664, 70.39521789550781, 76.69425964355469, 82.99330139160156, 89.29235076904297, 95.59139251708984, 101.89044189453125, 108.18948364257812, 114.488525390625, 120.7875747680664, 127.08661651611328, 133.3856658935547, 139.68470764160156, 145.98374938964844, 152.2827911376953, 158.58184814453125, 164.88088989257812, 171.179931640625, 177.47897338867188, 183.7780303955078, 190.0770721435547, 196.37611389160156, 202.67515563964844, 208.9741973876953]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 6.0, 13.0, 10.0, 20.0, 31.0, 57.0, 35.0, 42.0, 63.0, 52.0, 75.0, 80.0, 78.0, 82.0, 64.0, 55.0, 54.0, 38.0, 38.0, 35.0, 17.0, 15.0, 10.0, 7.0, 11.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.678260803222656, -42.210792541503906, -40.743324279785156, -39.275856018066406, -37.80838394165039, -36.34091567993164, -34.87344741821289, -33.40597915649414, -31.938508987426758, -30.471040725708008, -29.003570556640625, -27.536102294921875, -26.068634033203125, -24.601163864135742, -23.133695602416992, -21.66622543334961, -20.19875717163086, -18.73128890991211, -17.263818740844727, -15.796350479125977, -14.32888126373291, -12.861412048339844, -11.393943786621094, -9.926474571228027, -8.459005355834961, -6.9915361404418945, -5.524067401885986, -4.056598663330078, -2.5891294479370117, -1.1216602325439453, 0.3458080291748047, 1.813277244567871, 3.2807464599609375, 4.748215675354004, 6.215684413909912, 7.68315315246582, 9.150622367858887, 10.618091583251953, 12.085559844970703, 13.55302906036377, 15.020498275756836, 16.487966537475586, 17.95543670654297, 19.42290496826172, 20.89037322998047, 22.35784339904785, 23.8253116607666, 25.292781829833984, 26.760250091552734, 28.227718353271484, 29.695188522338867, 31.162656784057617, 32.630126953125, 34.09759521484375, 35.5650634765625, 37.03253173828125, 38.5, 39.96746826171875, 41.4349365234375, 42.90240478515625, 44.369876861572266, 45.837345123291016, 47.304813385009766, 48.772281646728516, 50.23975372314453]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 16.0, 20.0, 34.0, 49.0, 65.0, 111.0, 169.0, 314.0, 517.0, 950.0, 1794.0, 3639.0, 8395.0, 21806.0, 68555.0, 467748.0, 3419623.0, 139844.0, 36463.0, 13134.0, 5583.0, 2660.0, 1279.0, 650.0, 367.0, 193.0, 115.0, 60.0, 40.0, 25.0, 15.0, 15.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.038818359375, -7.77294921875, -7.507080078125, -7.2412109375, -6.975341796875, -6.70947265625, -6.443603515625, -6.177734375, -5.911865234375, -5.64599609375, -5.380126953125, -5.1142578125, -4.848388671875, -4.58251953125, -4.316650390625, -4.05078125, -3.784912109375, -3.51904296875, -3.253173828125, -2.9873046875, -2.721435546875, -2.45556640625, -2.189697265625, -1.923828125, -1.657958984375, -1.39208984375, -1.126220703125, -0.8603515625, -0.594482421875, -0.32861328125, -0.062744140625, 0.203125, 0.468994140625, 0.73486328125, 1.000732421875, 1.2666015625, 1.532470703125, 1.79833984375, 2.064208984375, 2.330078125, 2.595947265625, 2.86181640625, 3.127685546875, 3.3935546875, 3.659423828125, 3.92529296875, 4.191162109375, 4.45703125, 4.722900390625, 4.98876953125, 5.254638671875, 5.5205078125, 5.786376953125, 6.05224609375, 6.318115234375, 6.583984375, 6.849853515625, 7.11572265625, 7.381591796875, 7.6474609375, 7.913330078125, 8.17919921875, 8.445068359375, 8.7109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 2.0, 4.0, 8.0, 14.0, 21.0, 21.0, 29.0, 29.0, 34.0, 47.0, 40.0, 39.0, 54.0, 53.0, 68.0, 63.0, 53.0, 57.0, 54.0, 32.0, 50.0, 38.0, 37.0, 28.0, 28.0, 25.0, 18.0, 16.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.07421875, -1.0429840087890625, -1.011749267578125, -0.9805145263671875, -0.94927978515625, -0.9180450439453125, -0.886810302734375, -0.8555755615234375, -0.8243408203125, -0.7931060791015625, -0.761871337890625, -0.7306365966796875, -0.69940185546875, -0.6681671142578125, -0.636932373046875, -0.6056976318359375, -0.574462890625, -0.5432281494140625, -0.511993408203125, -0.4807586669921875, -0.44952392578125, -0.4182891845703125, -0.387054443359375, -0.3558197021484375, -0.3245849609375, -0.2933502197265625, -0.262115478515625, -0.2308807373046875, -0.19964599609375, -0.1684112548828125, -0.137176513671875, -0.1059417724609375, -0.07470703125, -0.0434722900390625, -0.012237548828125, 0.0189971923828125, 0.05023193359375, 0.0814666748046875, 0.112701416015625, 0.1439361572265625, 0.1751708984375, 0.2064056396484375, 0.237640380859375, 0.2688751220703125, 0.30010986328125, 0.3313446044921875, 0.362579345703125, 0.3938140869140625, 0.425048828125, 0.4562835693359375, 0.487518310546875, 0.5187530517578125, 0.54998779296875, 0.5812225341796875, 0.612457275390625, 0.6436920166015625, 0.6749267578125, 0.7061614990234375, 0.737396240234375, 0.7686309814453125, 0.79986572265625, 0.8311004638671875, 0.862335205078125, 0.8935699462890625, 0.9248046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 10.0, 17.0, 18.0, 32.0, 64.0, 119.0, 192.0, 329.0, 564.0, 1344.0, 2796.0, 7039.0, 20785.0, 78723.0, 751832.0, 3155461.0, 128145.0, 30218.0, 9779.0, 3642.0, 1538.0, 748.0, 374.0, 188.0, 115.0, 66.0, 40.0, 31.0, 19.0, 13.0, 8.0, 6.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.208740234375, -10.87060546875, -10.532470703125, -10.1943359375, -9.856201171875, -9.51806640625, -9.179931640625, -8.841796875, -8.503662109375, -8.16552734375, -7.827392578125, -7.4892578125, -7.151123046875, -6.81298828125, -6.474853515625, -6.13671875, -5.798583984375, -5.46044921875, -5.122314453125, -4.7841796875, -4.446044921875, -4.10791015625, -3.769775390625, -3.431640625, -3.093505859375, -2.75537109375, -2.417236328125, -2.0791015625, -1.740966796875, -1.40283203125, -1.064697265625, -0.7265625, -0.388427734375, -0.05029296875, 0.287841796875, 0.6259765625, 0.964111328125, 1.30224609375, 1.640380859375, 1.978515625, 2.316650390625, 2.65478515625, 2.992919921875, 3.3310546875, 3.669189453125, 4.00732421875, 4.345458984375, 4.68359375, 5.021728515625, 5.35986328125, 5.697998046875, 6.0361328125, 6.374267578125, 6.71240234375, 7.050537109375, 7.388671875, 7.726806640625, 8.06494140625, 8.403076171875, 8.7412109375, 9.079345703125, 9.41748046875, 9.755615234375, 10.09375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 6.0, 10.0, 6.0, 22.0, 23.0, 23.0, 36.0, 40.0, 52.0, 83.0, 121.0, 197.0, 363.0, 1076.0, 1024.0, 331.0, 183.0, 117.0, 85.0, 58.0, 50.0, 26.0, 23.0, 21.0, 10.0, 14.0, 21.0, 8.0, 8.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.296875, -3.212310791015625, -3.12774658203125, -3.043182373046875, -2.9586181640625, -2.874053955078125, -2.78948974609375, -2.704925537109375, -2.620361328125, -2.535797119140625, -2.45123291015625, -2.366668701171875, -2.2821044921875, -2.197540283203125, -2.11297607421875, -2.028411865234375, -1.94384765625, -1.859283447265625, -1.77471923828125, -1.690155029296875, -1.6055908203125, -1.521026611328125, -1.43646240234375, -1.351898193359375, -1.267333984375, -1.182769775390625, -1.09820556640625, -1.013641357421875, -0.9290771484375, -0.844512939453125, -0.75994873046875, -0.675384521484375, -0.5908203125, -0.506256103515625, -0.42169189453125, -0.337127685546875, -0.2525634765625, -0.167999267578125, -0.08343505859375, 0.001129150390625, 0.085693359375, 0.170257568359375, 0.25482177734375, 0.339385986328125, 0.4239501953125, 0.508514404296875, 0.59307861328125, 0.677642822265625, 0.76220703125, 0.846771240234375, 0.93133544921875, 1.015899658203125, 1.1004638671875, 1.185028076171875, 1.26959228515625, 1.354156494140625, 1.438720703125, 1.523284912109375, 1.60784912109375, 1.692413330078125, 1.7769775390625, 1.861541748046875, 1.94610595703125, 2.030670166015625, 2.115234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 11.0, 19.0, 27.0, 46.0, 83.0, 123.0, 169.0, 169.0, 141.0, 90.0, 63.0, 18.0, 16.0, 9.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.63536071777344, -35.559444427490234, -34.48352813720703, -33.40761184692383, -32.331695556640625, -31.255779266357422, -30.17986297607422, -29.103946685791016, -28.028030395507812, -26.95211410522461, -25.876197814941406, -24.800281524658203, -23.724365234375, -22.648448944091797, -21.572532653808594, -20.49661636352539, -19.42070198059082, -18.344785690307617, -17.268869400024414, -16.19295310974121, -15.117036819458008, -14.041120529174805, -12.965205192565918, -11.889288902282715, -10.813372611999512, -9.737456321716309, -8.661540031433105, -7.5856242179870605, -6.509707927703857, -5.433791637420654, -4.357875823974609, -3.2819595336914062, -2.206043243408203, -1.1301270723342896, -0.05421090126037598, 1.021705150604248, 2.097621440887451, 3.1735377311706543, 4.249453544616699, 5.325369834899902, 6.4012861251831055, 7.477202415466309, 8.553118705749512, 9.629034042358398, 10.704950332641602, 11.780866622924805, 12.856782913208008, 13.932699203491211, 15.008615493774414, 16.084531784057617, 17.16044807434082, 18.236364364624023, 19.312280654907227, 20.38819694519043, 21.464111328125, 22.540027618408203, 23.615943908691406, 24.69186019897461, 25.767776489257812, 26.843692779541016, 27.91960906982422, 28.995525360107422, 30.071441650390625, 31.147357940673828, 32.22327423095703]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 13.0, 11.0, 13.0, 11.0, 16.0, 18.0, 25.0, 15.0, 24.0, 35.0, 28.0, 45.0, 30.0, 29.0, 28.0, 41.0, 42.0, 43.0, 49.0, 31.0, 47.0, 40.0, 23.0, 31.0, 45.0, 37.0, 31.0, 23.0, 25.0, 20.0, 16.0, 20.0, 13.0, 13.0, 13.0, 7.0, 3.0, 4.0, 7.0, 4.0, 0.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.70316219329834, -8.419821739196777, -8.136481285095215, -7.8531413078308105, -7.569801330566406, -7.286460876464844, -7.003120422363281, -6.719779968261719, -6.4364399909973145, -6.153099536895752, -5.869759559631348, -5.586419105529785, -5.303078651428223, -5.019738674163818, -4.736398220062256, -4.453058242797852, -4.169717788696289, -3.8863775730133057, -3.6030373573303223, -3.3196969032287598, -3.0363566875457764, -2.753016471862793, -2.4696760177612305, -2.186335802078247, -1.9029955863952637, -1.6196553707122803, -1.3363150358200073, -1.0529747009277344, -0.769634485244751, -0.4862942695617676, -0.20295393466949463, 0.08038640022277832, 0.3637256622314453, 0.6470659375190735, 0.9304062128067017, 1.2137465476989746, 1.497086763381958, 1.7804269790649414, 2.063767433166504, 2.3471076488494873, 2.6304478645324707, 2.913788080215454, 3.1971282958984375, 3.48046875, 3.7638089656829834, 4.047149181365967, 4.330489635467529, 4.613829612731934, 4.897170066833496, 5.180510520935059, 5.463850498199463, 5.747190952301025, 6.03053092956543, 6.313871383666992, 6.597211837768555, 6.880552291870117, 7.1638922691345215, 7.447232723236084, 7.730572700500488, 8.01391315460205, 8.297253608703613, 8.58059310913086, 8.863933563232422, 9.147274017333984, 9.430614471435547]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 4.0, 9.0, 22.0, 24.0, 39.0, 75.0, 76.0, 143.0, 223.0, 382.0, 562.0, 965.0, 1618.0, 2868.0, 5210.0, 9709.0, 19292.0, 39006.0, 81396.0, 187274.0, 365248.0, 178369.0, 78529.0, 37584.0, 18517.0, 9561.0, 5001.0, 2763.0, 1610.0, 931.0, 567.0, 345.0, 199.0, 152.0, 75.0, 54.0, 52.0, 25.0, 23.0, 13.0, 12.0, 6.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.18359375, -6.968994140625, -6.75439453125, -6.539794921875, -6.3251953125, -6.110595703125, -5.89599609375, -5.681396484375, -5.466796875, -5.252197265625, -5.03759765625, -4.822998046875, -4.6083984375, -4.393798828125, -4.17919921875, -3.964599609375, -3.75, -3.535400390625, -3.32080078125, -3.106201171875, -2.8916015625, -2.677001953125, -2.46240234375, -2.247802734375, -2.033203125, -1.818603515625, -1.60400390625, -1.389404296875, -1.1748046875, -0.960205078125, -0.74560546875, -0.531005859375, -0.31640625, -0.101806640625, 0.11279296875, 0.327392578125, 0.5419921875, 0.756591796875, 0.97119140625, 1.185791015625, 1.400390625, 1.614990234375, 1.82958984375, 2.044189453125, 2.2587890625, 2.473388671875, 2.68798828125, 2.902587890625, 3.1171875, 3.331787109375, 3.54638671875, 3.760986328125, 3.9755859375, 4.190185546875, 4.40478515625, 4.619384765625, 4.833984375, 5.048583984375, 5.26318359375, 5.477783203125, 5.6923828125, 5.906982421875, 6.12158203125, 6.336181640625, 6.55078125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 8.0, 23.0, 18.0, 28.0, 32.0, 29.0, 36.0, 50.0, 57.0, 62.0, 62.0, 56.0, 63.0, 68.0, 40.0, 52.0, 56.0, 45.0, 43.0, 32.0, 26.0, 24.0, 19.0, 10.0, 10.0, 12.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.042633056640625, -1.00909423828125, -0.975555419921875, -0.9420166015625, -0.908477783203125, -0.87493896484375, -0.841400146484375, -0.807861328125, -0.774322509765625, -0.74078369140625, -0.707244873046875, -0.6737060546875, -0.640167236328125, -0.60662841796875, -0.573089599609375, -0.53955078125, -0.506011962890625, -0.47247314453125, -0.438934326171875, -0.4053955078125, -0.371856689453125, -0.33831787109375, -0.304779052734375, -0.271240234375, -0.237701416015625, -0.20416259765625, -0.170623779296875, -0.1370849609375, -0.103546142578125, -0.07000732421875, -0.036468505859375, -0.0029296875, 0.030609130859375, 0.06414794921875, 0.097686767578125, 0.1312255859375, 0.164764404296875, 0.19830322265625, 0.231842041015625, 0.265380859375, 0.298919677734375, 0.33245849609375, 0.365997314453125, 0.3995361328125, 0.433074951171875, 0.46661376953125, 0.500152587890625, 0.53369140625, 0.567230224609375, 0.60076904296875, 0.634307861328125, 0.6678466796875, 0.701385498046875, 0.73492431640625, 0.768463134765625, 0.802001953125, 0.835540771484375, 0.86907958984375, 0.902618408203125, 0.9361572265625, 0.969696044921875, 1.00323486328125, 1.036773681640625, 1.0703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 7.0, 5.0, 6.0, 10.0, 19.0, 26.0, 44.0, 42.0, 89.0, 151.0, 214.0, 340.0, 567.0, 1145.0, 2086.0, 4563.0, 10827.0, 29874.0, 94730.0, 362668.0, 387708.0, 100880.0, 31745.0, 11369.0, 4655.0, 2125.0, 1120.0, 616.0, 343.0, 222.0, 119.0, 77.0, 59.0, 28.0, 28.0, 15.0, 15.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0562744140625, -7.768798828125, -7.4813232421875, -7.19384765625, -6.9063720703125, -6.618896484375, -6.3314208984375, -6.0439453125, -5.7564697265625, -5.468994140625, -5.1815185546875, -4.89404296875, -4.6065673828125, -4.319091796875, -4.0316162109375, -3.744140625, -3.4566650390625, -3.169189453125, -2.8817138671875, -2.59423828125, -2.3067626953125, -2.019287109375, -1.7318115234375, -1.4443359375, -1.1568603515625, -0.869384765625, -0.5819091796875, -0.29443359375, -0.0069580078125, 0.280517578125, 0.5679931640625, 0.85546875, 1.1429443359375, 1.430419921875, 1.7178955078125, 2.00537109375, 2.2928466796875, 2.580322265625, 2.8677978515625, 3.1552734375, 3.4427490234375, 3.730224609375, 4.0177001953125, 4.30517578125, 4.5926513671875, 4.880126953125, 5.1676025390625, 5.455078125, 5.7425537109375, 6.030029296875, 6.3175048828125, 6.60498046875, 6.8924560546875, 7.179931640625, 7.4674072265625, 7.7548828125, 8.0423583984375, 8.329833984375, 8.6173095703125, 8.90478515625, 9.1922607421875, 9.479736328125, 9.7672119140625, 10.0546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 11.0, 12.0, 16.0, 14.0, 19.0, 30.0, 17.0, 27.0, 34.0, 39.0, 51.0, 26.0, 42.0, 46.0, 39.0, 47.0, 42.0, 46.0, 49.0, 39.0, 39.0, 32.0, 29.0, 37.0, 23.0, 29.0, 19.0, 14.0, 19.0, 16.0, 14.0, 9.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-4.34765625, -4.217864990234375, -4.08807373046875, -3.958282470703125, -3.8284912109375, -3.698699951171875, -3.56890869140625, -3.439117431640625, -3.309326171875, -3.179534912109375, -3.04974365234375, -2.919952392578125, -2.7901611328125, -2.660369873046875, -2.53057861328125, -2.400787353515625, -2.27099609375, -2.141204833984375, -2.01141357421875, -1.881622314453125, -1.7518310546875, -1.622039794921875, -1.49224853515625, -1.362457275390625, -1.232666015625, -1.102874755859375, -0.97308349609375, -0.843292236328125, -0.7135009765625, -0.583709716796875, -0.45391845703125, -0.324127197265625, -0.1943359375, -0.064544677734375, 0.06524658203125, 0.195037841796875, 0.3248291015625, 0.454620361328125, 0.58441162109375, 0.714202880859375, 0.843994140625, 0.973785400390625, 1.10357666015625, 1.233367919921875, 1.3631591796875, 1.492950439453125, 1.62274169921875, 1.752532958984375, 1.88232421875, 2.012115478515625, 2.14190673828125, 2.271697998046875, 2.4014892578125, 2.531280517578125, 2.66107177734375, 2.790863037109375, 2.920654296875, 3.050445556640625, 3.18023681640625, 3.310028076171875, 3.4398193359375, 3.569610595703125, 3.69940185546875, 3.829193115234375, 3.958984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 10.0, 17.0, 24.0, 33.0, 46.0, 68.0, 103.0, 176.0, 278.0, 508.0, 930.0, 2231.0, 5663.0, 17504.0, 119672.0, 760181.0, 113994.0, 17196.0, 5462.0, 2199.0, 995.0, 511.0, 281.0, 156.0, 105.0, 64.0, 31.0, 30.0, 23.0, 7.0, 6.0, 6.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.39501953125, -8.1103515625, -7.82568359375, -7.541015625, -7.25634765625, -6.9716796875, -6.68701171875, -6.40234375, -6.11767578125, -5.8330078125, -5.54833984375, -5.263671875, -4.97900390625, -4.6943359375, -4.40966796875, -4.125, -3.84033203125, -3.5556640625, -3.27099609375, -2.986328125, -2.70166015625, -2.4169921875, -2.13232421875, -1.84765625, -1.56298828125, -1.2783203125, -0.99365234375, -0.708984375, -0.42431640625, -0.1396484375, 0.14501953125, 0.4296875, 0.71435546875, 0.9990234375, 1.28369140625, 1.568359375, 1.85302734375, 2.1376953125, 2.42236328125, 2.70703125, 2.99169921875, 3.2763671875, 3.56103515625, 3.845703125, 4.13037109375, 4.4150390625, 4.69970703125, 4.984375, 5.26904296875, 5.5537109375, 5.83837890625, 6.123046875, 6.40771484375, 6.6923828125, 6.97705078125, 7.26171875, 7.54638671875, 7.8310546875, 8.11572265625, 8.400390625, 8.68505859375, 8.9697265625, 9.25439453125, 9.5390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 13.0, 16.0, 31.0, 40.0, 66.0, 123.0, 223.0, 186.0, 94.0, 59.0, 32.0, 25.0, 17.0, 13.0, 14.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008220672607421875, -0.0007827728986740112, -0.000743478536605835, -0.0007041841745376587, -0.0006648898124694824, -0.0006255954504013062, -0.0005863010883331299, -0.0005470067262649536, -0.0005077123641967773, -0.0004684180021286011, -0.0004291236400604248, -0.00038982927799224854, -0.00035053491592407227, -0.000311240553855896, -0.0002719461917877197, -0.00023265182971954346, -0.0001933574676513672, -0.00015406310558319092, -0.00011476874351501465, -7.547438144683838e-05, -3.618001937866211e-05, 3.11434268951416e-06, 4.240870475769043e-05, 8.17030668258667e-05, 0.00012099742889404297, 0.00016029179096221924, 0.0001995861530303955, 0.00023888051509857178, 0.00027817487716674805, 0.0003174692392349243, 0.0003567636013031006, 0.00039605796337127686, 0.0004353523254394531, 0.0004746466875076294, 0.0005139410495758057, 0.0005532354116439819, 0.0005925297737121582, 0.0006318241357803345, 0.0006711184978485107, 0.000710412859916687, 0.0007497072219848633, 0.0007890015840530396, 0.0008282959461212158, 0.0008675903081893921, 0.0009068846702575684, 0.0009461790323257446, 0.000985473394393921, 0.0010247677564620972, 0.0010640621185302734, 0.0011033564805984497, 0.001142650842666626, 0.0011819452047348022, 0.0012212395668029785, 0.0012605339288711548, 0.001299828290939331, 0.0013391226530075073, 0.0013784170150756836, 0.0014177113771438599, 0.0014570057392120361, 0.0014963001012802124, 0.0015355944633483887, 0.001574888825416565, 0.0016141831874847412, 0.0016534775495529175, 0.0016927719116210938]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 5.0, 11.0, 21.0, 29.0, 32.0, 63.0, 97.0, 135.0, 193.0, 344.0, 595.0, 1123.0, 2154.0, 4398.0, 10467.0, 33430.0, 240717.0, 645522.0, 77975.0, 18113.0, 6526.0, 3038.0, 1489.0, 800.0, 472.0, 305.0, 171.0, 103.0, 79.0, 44.0, 27.0, 15.0, 14.0, 12.0, 7.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.59375, -8.356689453125, -8.11962890625, -7.882568359375, -7.6455078125, -7.408447265625, -7.17138671875, -6.934326171875, -6.697265625, -6.460205078125, -6.22314453125, -5.986083984375, -5.7490234375, -5.511962890625, -5.27490234375, -5.037841796875, -4.80078125, -4.563720703125, -4.32666015625, -4.089599609375, -3.8525390625, -3.615478515625, -3.37841796875, -3.141357421875, -2.904296875, -2.667236328125, -2.43017578125, -2.193115234375, -1.9560546875, -1.718994140625, -1.48193359375, -1.244873046875, -1.0078125, -0.770751953125, -0.53369140625, -0.296630859375, -0.0595703125, 0.177490234375, 0.41455078125, 0.651611328125, 0.888671875, 1.125732421875, 1.36279296875, 1.599853515625, 1.8369140625, 2.073974609375, 2.31103515625, 2.548095703125, 2.78515625, 3.022216796875, 3.25927734375, 3.496337890625, 3.7333984375, 3.970458984375, 4.20751953125, 4.444580078125, 4.681640625, 4.918701171875, 5.15576171875, 5.392822265625, 5.6298828125, 5.866943359375, 6.10400390625, 6.341064453125, 6.578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 11.0, 5.0, 11.0, 21.0, 27.0, 51.0, 55.0, 95.0, 124.0, 153.0, 126.0, 105.0, 64.0, 23.0, 21.0, 31.0, 13.0, 6.0, 10.0, 3.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.73944091796875, -4.5843505859375, -4.42926025390625, -4.274169921875, -4.11907958984375, -3.9639892578125, -3.80889892578125, -3.65380859375, -3.49871826171875, -3.3436279296875, -3.18853759765625, -3.033447265625, -2.87835693359375, -2.7232666015625, -2.56817626953125, -2.4130859375, -2.25799560546875, -2.1029052734375, -1.94781494140625, -1.792724609375, -1.63763427734375, -1.4825439453125, -1.32745361328125, -1.17236328125, -1.01727294921875, -0.8621826171875, -0.70709228515625, -0.552001953125, -0.39691162109375, -0.2418212890625, -0.08673095703125, 0.068359375, 0.22344970703125, 0.3785400390625, 0.53363037109375, 0.688720703125, 0.84381103515625, 0.9989013671875, 1.15399169921875, 1.30908203125, 1.46417236328125, 1.6192626953125, 1.77435302734375, 1.929443359375, 2.08453369140625, 2.2396240234375, 2.39471435546875, 2.5498046875, 2.70489501953125, 2.8599853515625, 3.01507568359375, 3.170166015625, 3.32525634765625, 3.4803466796875, 3.63543701171875, 3.79052734375, 3.94561767578125, 4.1007080078125, 4.25579833984375, 4.410888671875, 4.56597900390625, 4.7210693359375, 4.87615966796875, 5.03125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 27.0, 53.0, 100.0, 203.0, 249.0, 167.0, 94.0, 59.0, 24.0, 13.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.76547241210938, -179.80079650878906, -175.83612060546875, -171.8714599609375, -167.9067840576172, -163.94210815429688, -159.97743225097656, -156.01275634765625, -152.048095703125, -148.0834197998047, -144.11874389648438, -140.15408325195312, -136.1894073486328, -132.2247314453125, -128.2600555419922, -124.29537963867188, -120.33070373535156, -116.36602783203125, -112.40135955810547, -108.43668365478516, -104.47201538085938, -100.50733947753906, -96.54266357421875, -92.57798767089844, -88.61331939697266, -84.64864349365234, -80.68397521972656, -76.71929931640625, -72.75462341308594, -68.78995513916016, -64.82527923583984, -60.8606071472168, -56.89592742919922, -52.93125534057617, -48.966583251953125, -45.00190734863281, -41.037235260009766, -37.07256317138672, -33.107887268066406, -29.14321517944336, -25.178543090820312, -21.213871002197266, -17.249197006225586, -13.284523963928223, -9.31985092163086, -5.3551788330078125, -1.3905048370361328, 2.574169158935547, 6.538841247558594, 10.503514289855957, 14.46818733215332, 18.432861328125, 22.397533416748047, 26.362205505371094, 30.326879501342773, 34.29155349731445, 38.2562255859375, 42.22089767456055, 46.185569763183594, 50.150245666503906, 54.11491775512695, 58.07958984375, 62.04426574707031, 66.00894165039062, 69.9736099243164]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 5.0, 14.0, 9.0, 12.0, 15.0, 22.0, 26.0, 25.0, 25.0, 27.0, 33.0, 39.0, 40.0, 46.0, 39.0, 38.0, 40.0, 40.0, 53.0, 41.0, 37.0, 46.0, 35.0, 40.0, 40.0, 26.0, 22.0, 25.0, 25.0, 16.0, 17.0, 14.0, 11.0, 9.0, 10.0, 8.0, 1.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.604516983032227, -22.777881622314453, -21.95124626159668, -21.124610900878906, -20.297977447509766, -19.47134017944336, -18.64470672607422, -17.818071365356445, -16.991436004638672, -16.1648006439209, -15.338165283203125, -14.511530876159668, -13.684895515441895, -12.858260154724121, -12.031625747680664, -11.20499038696289, -10.378355026245117, -9.551719665527344, -8.72508430480957, -7.898449897766113, -7.07181453704834, -6.245179176330566, -5.418544292449951, -4.591909408569336, -3.7652740478515625, -2.938638925552368, -2.112003803253174, -1.2853686809539795, -0.45873355865478516, 0.3679018020629883, 1.1945366859436035, 2.0211715698242188, 2.8478050231933594, 3.6744401454925537, 4.501075267791748, 5.327710151672363, 6.154345512390137, 6.98098087310791, 7.807615756988525, 8.63425064086914, 9.460886001586914, 10.287521362304688, 11.114156723022461, 11.940791130065918, 12.767426490783691, 13.594061851501465, 14.420696258544922, 15.247331619262695, 16.07396697998047, 16.900602340698242, 17.727237701416016, 18.55387306213379, 19.380508422851562, 20.207141876220703, 21.033777236938477, 21.86041259765625, 22.687047958374023, 23.513683319091797, 24.34031867980957, 25.166954040527344, 25.993587493896484, 26.82022476196289, 27.64685821533203, 28.473493576049805, 29.300128936767578]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 10.0, 8.0, 22.0, 29.0, 31.0, 40.0, 66.0, 112.0, 151.0, 178.0, 320.0, 390.0, 582.0, 947.0, 1476.0, 2506.0, 4195.0, 7462.0, 14701.0, 31627.0, 85304.0, 556735.0, 3274290.0, 128701.0, 42360.0, 18896.0, 9555.0, 5289.0, 3020.0, 1814.0, 1144.0, 785.0, 493.0, 333.0, 231.0, 137.0, 81.0, 71.0, 49.0, 33.0, 23.0, 23.0, 17.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.5078125, -6.31158447265625, -6.1153564453125, -5.91912841796875, -5.722900390625, -5.52667236328125, -5.3304443359375, -5.13421630859375, -4.93798828125, -4.74176025390625, -4.5455322265625, -4.34930419921875, -4.153076171875, -3.95684814453125, -3.7606201171875, -3.56439208984375, -3.3681640625, -3.17193603515625, -2.9757080078125, -2.77947998046875, -2.583251953125, -2.38702392578125, -2.1907958984375, -1.99456787109375, -1.79833984375, -1.60211181640625, -1.4058837890625, -1.20965576171875, -1.013427734375, -0.81719970703125, -0.6209716796875, -0.42474365234375, -0.228515625, -0.03228759765625, 0.1639404296875, 0.36016845703125, 0.556396484375, 0.75262451171875, 0.9488525390625, 1.14508056640625, 1.34130859375, 1.53753662109375, 1.7337646484375, 1.92999267578125, 2.126220703125, 2.32244873046875, 2.5186767578125, 2.71490478515625, 2.9111328125, 3.10736083984375, 3.3035888671875, 3.49981689453125, 3.696044921875, 3.89227294921875, 4.0885009765625, 4.28472900390625, 4.48095703125, 4.67718505859375, 4.8734130859375, 5.06964111328125, 5.265869140625, 5.46209716796875, 5.6583251953125, 5.85455322265625, 6.05078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 11.0, 16.0, 22.0, 20.0, 32.0, 43.0, 34.0, 51.0, 51.0, 51.0, 55.0, 61.0, 54.0, 70.0, 57.0, 60.0, 43.0, 45.0, 41.0, 35.0, 35.0, 20.0, 21.0, 12.0, 12.0, 6.0, 7.0, 8.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.074127197265625, -1.03887939453125, -1.003631591796875, -0.9683837890625, -0.933135986328125, -0.89788818359375, -0.862640380859375, -0.827392578125, -0.792144775390625, -0.75689697265625, -0.721649169921875, -0.6864013671875, -0.651153564453125, -0.61590576171875, -0.580657958984375, -0.54541015625, -0.510162353515625, -0.47491455078125, -0.439666748046875, -0.4044189453125, -0.369171142578125, -0.33392333984375, -0.298675537109375, -0.263427734375, -0.228179931640625, -0.19293212890625, -0.157684326171875, -0.1224365234375, -0.087188720703125, -0.05194091796875, -0.016693115234375, 0.0185546875, 0.053802490234375, 0.08905029296875, 0.124298095703125, 0.1595458984375, 0.194793701171875, 0.23004150390625, 0.265289306640625, 0.300537109375, 0.335784912109375, 0.37103271484375, 0.406280517578125, 0.4415283203125, 0.476776123046875, 0.51202392578125, 0.547271728515625, 0.58251953125, 0.617767333984375, 0.65301513671875, 0.688262939453125, 0.7235107421875, 0.758758544921875, 0.79400634765625, 0.829254150390625, 0.864501953125, 0.899749755859375, 0.93499755859375, 0.970245361328125, 1.0054931640625, 1.040740966796875, 1.07598876953125, 1.111236572265625, 1.146484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 8.0, 14.0, 9.0, 18.0, 27.0, 28.0, 43.0, 77.0, 80.0, 123.0, 217.0, 332.0, 480.0, 884.0, 1434.0, 2545.0, 4460.0, 8588.0, 17684.0, 41108.0, 115212.0, 819720.0, 2926303.0, 158951.0, 51541.0, 21721.0, 10225.0, 5213.0, 2891.0, 1634.0, 998.0, 625.0, 371.0, 232.0, 153.0, 107.0, 64.0, 55.0, 35.0, 22.0, 17.0, 7.0, 6.0, 11.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.60546875, -6.39324951171875, -6.1810302734375, -5.96881103515625, -5.756591796875, -5.54437255859375, -5.3321533203125, -5.11993408203125, -4.90771484375, -4.69549560546875, -4.4832763671875, -4.27105712890625, -4.058837890625, -3.84661865234375, -3.6343994140625, -3.42218017578125, -3.2099609375, -2.99774169921875, -2.7855224609375, -2.57330322265625, -2.361083984375, -2.14886474609375, -1.9366455078125, -1.72442626953125, -1.51220703125, -1.29998779296875, -1.0877685546875, -0.87554931640625, -0.663330078125, -0.45111083984375, -0.2388916015625, -0.02667236328125, 0.185546875, 0.39776611328125, 0.6099853515625, 0.82220458984375, 1.034423828125, 1.24664306640625, 1.4588623046875, 1.67108154296875, 1.88330078125, 2.09552001953125, 2.3077392578125, 2.51995849609375, 2.732177734375, 2.94439697265625, 3.1566162109375, 3.36883544921875, 3.5810546875, 3.79327392578125, 4.0054931640625, 4.21771240234375, 4.429931640625, 4.64215087890625, 4.8543701171875, 5.06658935546875, 5.27880859375, 5.49102783203125, 5.7032470703125, 5.91546630859375, 6.127685546875, 6.33990478515625, 6.5521240234375, 6.76434326171875, 6.9765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 9.0, 6.0, 6.0, 9.0, 24.0, 23.0, 29.0, 28.0, 35.0, 59.0, 78.0, 144.0, 253.0, 748.0, 1737.0, 360.0, 159.0, 80.0, 83.0, 44.0, 41.0, 24.0, 21.0, 17.0, 12.0, 9.0, 3.0, 10.0, 6.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.623138427734375, -2.53338623046875, -2.443634033203125, -2.3538818359375, -2.264129638671875, -2.17437744140625, -2.084625244140625, -1.994873046875, -1.905120849609375, -1.81536865234375, -1.725616455078125, -1.6358642578125, -1.546112060546875, -1.45635986328125, -1.366607666015625, -1.27685546875, -1.187103271484375, -1.09735107421875, -1.007598876953125, -0.9178466796875, -0.828094482421875, -0.73834228515625, -0.648590087890625, -0.558837890625, -0.469085693359375, -0.37933349609375, -0.289581298828125, -0.1998291015625, -0.110076904296875, -0.02032470703125, 0.069427490234375, 0.1591796875, 0.248931884765625, 0.33868408203125, 0.428436279296875, 0.5181884765625, 0.607940673828125, 0.69769287109375, 0.787445068359375, 0.877197265625, 0.966949462890625, 1.05670166015625, 1.146453857421875, 1.2362060546875, 1.325958251953125, 1.41571044921875, 1.505462646484375, 1.59521484375, 1.684967041015625, 1.77471923828125, 1.864471435546875, 1.9542236328125, 2.043975830078125, 2.13372802734375, 2.223480224609375, 2.313232421875, 2.402984619140625, 2.49273681640625, 2.582489013671875, 2.6722412109375, 2.761993408203125, 2.85174560546875, 2.941497802734375, 3.03125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 18.0, 31.0, 58.0, 102.0, 154.0, 217.0, 176.0, 111.0, 72.0, 30.0, 16.0, 4.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.82215881347656, -39.79052734375, -38.75889587402344, -37.72726821899414, -36.69563674926758, -35.664005279541016, -34.63237762451172, -33.600746154785156, -32.569114685058594, -31.53748321533203, -30.5058536529541, -29.474224090576172, -28.44259262084961, -27.410961151123047, -26.379331588745117, -25.347702026367188, -24.316070556640625, -23.284439086914062, -22.252809524536133, -21.221179962158203, -20.18954849243164, -19.157917022705078, -18.12628746032715, -17.09465789794922, -16.063026428222656, -15.03139591217041, -13.999765396118164, -12.968134880065918, -11.936504364013672, -10.904873847961426, -9.87324333190918, -8.841612815856934, -7.8099822998046875, -6.778351783752441, -5.746721267700195, -4.715090751647949, -3.683460235595703, -2.651829719543457, -1.620199203491211, -0.5885686874389648, 0.44306182861328125, 1.4746923446655273, 2.5063228607177734, 3.5379533767700195, 4.569583892822266, 5.601214408874512, 6.632844924926758, 7.664475440979004, 8.69610595703125, 9.727736473083496, 10.759366989135742, 11.790997505187988, 12.822628021240234, 13.85425853729248, 14.885889053344727, 15.917519569396973, 16.94915008544922, 17.98078155517578, 19.01241111755371, 20.04404067993164, 21.075672149658203, 22.107303619384766, 23.138933181762695, 24.170562744140625, 25.202194213867188]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 6.0, 9.0, 4.0, 10.0, 18.0, 25.0, 23.0, 25.0, 26.0, 29.0, 33.0, 41.0, 42.0, 38.0, 36.0, 45.0, 43.0, 49.0, 54.0, 30.0, 34.0, 40.0, 42.0, 43.0, 26.0, 28.0, 23.0, 25.0, 20.0, 28.0, 16.0, 24.0, 6.0, 12.0, 9.0, 4.0, 7.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.147253036499023, -9.837661743164062, -9.528070449829102, -9.21847915649414, -8.90888786315918, -8.599296569824219, -8.289705276489258, -7.980113983154297, -7.670522689819336, -7.360931396484375, -7.051340103149414, -6.741748809814453, -6.432157516479492, -6.122566223144531, -5.81297492980957, -5.503383636474609, -5.193792343139648, -4.8842010498046875, -4.574609756469727, -4.265018463134766, -3.9554271697998047, -3.6458358764648438, -3.336244583129883, -3.026653289794922, -2.717061996459961, -2.407470703125, -2.097879409790039, -1.7882881164550781, -1.4786968231201172, -1.1691055297851562, -0.8595142364501953, -0.5499229431152344, -0.24033069610595703, 0.0692605972290039, 0.37885189056396484, 0.6884431838989258, 0.9980344772338867, 1.3076257705688477, 1.6172170639038086, 1.9268083572387695, 2.2363996505737305, 2.5459909439086914, 2.8555822372436523, 3.1651735305786133, 3.474764823913574, 3.784356117248535, 4.093947410583496, 4.403538703918457, 4.713129997253418, 5.022721290588379, 5.33231258392334, 5.641903877258301, 5.951495170593262, 6.261086463928223, 6.570677757263184, 6.8802690505981445, 7.1898603439331055, 7.499451637268066, 7.809042930603027, 8.118634223937988, 8.42822551727295, 8.73781681060791, 9.047408103942871, 9.356999397277832, 9.666590690612793]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 12.0, 18.0, 31.0, 24.0, 43.0, 74.0, 106.0, 141.0, 255.0, 351.0, 564.0, 845.0, 1337.0, 2198.0, 3741.0, 6450.0, 11226.0, 20474.0, 38275.0, 72822.0, 144770.0, 290149.0, 223945.0, 107360.0, 55842.0, 29510.0, 16140.0, 8902.0, 5082.0, 3008.0, 1818.0, 1136.0, 680.0, 412.0, 275.0, 185.0, 107.0, 76.0, 60.0, 32.0, 26.0, 14.0, 14.0, 9.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.19140625, -5.01715087890625, -4.8428955078125, -4.66864013671875, -4.494384765625, -4.32012939453125, -4.1458740234375, -3.97161865234375, -3.79736328125, -3.62310791015625, -3.4488525390625, -3.27459716796875, -3.100341796875, -2.92608642578125, -2.7518310546875, -2.57757568359375, -2.4033203125, -2.22906494140625, -2.0548095703125, -1.88055419921875, -1.706298828125, -1.53204345703125, -1.3577880859375, -1.18353271484375, -1.00927734375, -0.83502197265625, -0.6607666015625, -0.48651123046875, -0.312255859375, -0.13800048828125, 0.0362548828125, 0.21051025390625, 0.384765625, 0.55902099609375, 0.7332763671875, 0.90753173828125, 1.081787109375, 1.25604248046875, 1.4302978515625, 1.60455322265625, 1.77880859375, 1.95306396484375, 2.1273193359375, 2.30157470703125, 2.475830078125, 2.65008544921875, 2.8243408203125, 2.99859619140625, 3.1728515625, 3.34710693359375, 3.5213623046875, 3.69561767578125, 3.869873046875, 4.04412841796875, 4.2183837890625, 4.39263916015625, 4.56689453125, 4.74114990234375, 4.9154052734375, 5.08966064453125, 5.263916015625, 5.43817138671875, 5.6124267578125, 5.78668212890625, 5.9609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 5.0, 7.0, 9.0, 11.0, 24.0, 21.0, 37.0, 33.0, 45.0, 57.0, 39.0, 52.0, 58.0, 41.0, 46.0, 57.0, 64.0, 52.0, 53.0, 50.0, 42.0, 37.0, 26.0, 24.0, 28.0, 15.0, 11.0, 12.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.088714599609375, -1.05340576171875, -1.018096923828125, -0.9827880859375, -0.947479248046875, -0.91217041015625, -0.876861572265625, -0.841552734375, -0.806243896484375, -0.77093505859375, -0.735626220703125, -0.7003173828125, -0.665008544921875, -0.62969970703125, -0.594390869140625, -0.55908203125, -0.523773193359375, -0.48846435546875, -0.453155517578125, -0.4178466796875, -0.382537841796875, -0.34722900390625, -0.311920166015625, -0.276611328125, -0.241302490234375, -0.20599365234375, -0.170684814453125, -0.1353759765625, -0.100067138671875, -0.06475830078125, -0.029449462890625, 0.005859375, 0.041168212890625, 0.07647705078125, 0.111785888671875, 0.1470947265625, 0.182403564453125, 0.21771240234375, 0.253021240234375, 0.288330078125, 0.323638916015625, 0.35894775390625, 0.394256591796875, 0.4295654296875, 0.464874267578125, 0.50018310546875, 0.535491943359375, 0.57080078125, 0.606109619140625, 0.64141845703125, 0.676727294921875, 0.7120361328125, 0.747344970703125, 0.78265380859375, 0.817962646484375, 0.853271484375, 0.888580322265625, 0.92388916015625, 0.959197998046875, 0.9945068359375, 1.029815673828125, 1.06512451171875, 1.100433349609375, 1.1357421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 15.0, 13.0, 17.0, 18.0, 36.0, 47.0, 73.0, 107.0, 151.0, 225.0, 331.0, 591.0, 1076.0, 1978.0, 4229.0, 9877.0, 26645.0, 78264.0, 273713.0, 449086.0, 132837.0, 41986.0, 15174.0, 5988.0, 2630.0, 1339.0, 744.0, 427.0, 290.0, 210.0, 108.0, 85.0, 60.0, 52.0, 37.0, 18.0, 22.0, 12.0, 10.0, 8.0, 7.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.6953125, -7.440673828125, -7.18603515625, -6.931396484375, -6.6767578125, -6.422119140625, -6.16748046875, -5.912841796875, -5.658203125, -5.403564453125, -5.14892578125, -4.894287109375, -4.6396484375, -4.385009765625, -4.13037109375, -3.875732421875, -3.62109375, -3.366455078125, -3.11181640625, -2.857177734375, -2.6025390625, -2.347900390625, -2.09326171875, -1.838623046875, -1.583984375, -1.329345703125, -1.07470703125, -0.820068359375, -0.5654296875, -0.310791015625, -0.05615234375, 0.198486328125, 0.453125, 0.707763671875, 0.96240234375, 1.217041015625, 1.4716796875, 1.726318359375, 1.98095703125, 2.235595703125, 2.490234375, 2.744873046875, 2.99951171875, 3.254150390625, 3.5087890625, 3.763427734375, 4.01806640625, 4.272705078125, 4.52734375, 4.781982421875, 5.03662109375, 5.291259765625, 5.5458984375, 5.800537109375, 6.05517578125, 6.309814453125, 6.564453125, 6.819091796875, 7.07373046875, 7.328369140625, 7.5830078125, 7.837646484375, 8.09228515625, 8.346923828125, 8.6015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 4.0, 5.0, 5.0, 8.0, 11.0, 19.0, 14.0, 13.0, 19.0, 24.0, 22.0, 29.0, 28.0, 33.0, 38.0, 46.0, 47.0, 44.0, 43.0, 60.0, 49.0, 62.0, 41.0, 40.0, 41.0, 38.0, 29.0, 27.0, 24.0, 24.0, 23.0, 17.0, 13.0, 14.0, 12.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.723388671875, -4.57568359375, -4.427978515625, -4.2802734375, -4.132568359375, -3.98486328125, -3.837158203125, -3.689453125, -3.541748046875, -3.39404296875, -3.246337890625, -3.0986328125, -2.950927734375, -2.80322265625, -2.655517578125, -2.5078125, -2.360107421875, -2.21240234375, -2.064697265625, -1.9169921875, -1.769287109375, -1.62158203125, -1.473876953125, -1.326171875, -1.178466796875, -1.03076171875, -0.883056640625, -0.7353515625, -0.587646484375, -0.43994140625, -0.292236328125, -0.14453125, 0.003173828125, 0.15087890625, 0.298583984375, 0.4462890625, 0.593994140625, 0.74169921875, 0.889404296875, 1.037109375, 1.184814453125, 1.33251953125, 1.480224609375, 1.6279296875, 1.775634765625, 1.92333984375, 2.071044921875, 2.21875, 2.366455078125, 2.51416015625, 2.661865234375, 2.8095703125, 2.957275390625, 3.10498046875, 3.252685546875, 3.400390625, 3.548095703125, 3.69580078125, 3.843505859375, 3.9912109375, 4.138916015625, 4.28662109375, 4.434326171875, 4.58203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 10.0, 12.0, 18.0, 20.0, 25.0, 48.0, 123.0, 208.0, 443.0, 954.0, 2463.0, 7867.0, 55048.0, 864014.0, 101052.0, 10961.0, 3057.0, 1144.0, 526.0, 264.0, 117.0, 84.0, 45.0, 20.0, 12.0, 11.0, 7.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.28125, -13.798828125, -13.31640625, -12.833984375, -12.3515625, -11.869140625, -11.38671875, -10.904296875, -10.421875, -9.939453125, -9.45703125, -8.974609375, -8.4921875, -8.009765625, -7.52734375, -7.044921875, -6.5625, -6.080078125, -5.59765625, -5.115234375, -4.6328125, -4.150390625, -3.66796875, -3.185546875, -2.703125, -2.220703125, -1.73828125, -1.255859375, -0.7734375, -0.291015625, 0.19140625, 0.673828125, 1.15625, 1.638671875, 2.12109375, 2.603515625, 3.0859375, 3.568359375, 4.05078125, 4.533203125, 5.015625, 5.498046875, 5.98046875, 6.462890625, 6.9453125, 7.427734375, 7.91015625, 8.392578125, 8.875, 9.357421875, 9.83984375, 10.322265625, 10.8046875, 11.287109375, 11.76953125, 12.251953125, 12.734375, 13.216796875, 13.69921875, 14.181640625, 14.6640625, 15.146484375, 15.62890625, 16.111328125, 16.59375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 7.0, 15.0, 13.0, 35.0, 42.0, 79.0, 177.0, 252.0, 136.0, 80.0, 49.0, 30.0, 15.0, 11.0, 13.0, 6.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017938613891601562, -0.0017431676387786865, -0.0016924738883972168, -0.001641780138015747, -0.0015910863876342773, -0.0015403926372528076, -0.0014896988868713379, -0.0014390051364898682, -0.0013883113861083984, -0.0013376176357269287, -0.001286923885345459, -0.0012362301349639893, -0.0011855363845825195, -0.0011348426342010498, -0.00108414888381958, -0.0010334551334381104, -0.0009827613830566406, -0.0009320676326751709, -0.0008813738822937012, -0.0008306801319122314, -0.0007799863815307617, -0.000729292631149292, -0.0006785988807678223, -0.0006279051303863525, -0.0005772113800048828, -0.0005265176296234131, -0.00047582387924194336, -0.00042513012886047363, -0.0003744363784790039, -0.0003237426280975342, -0.00027304887771606445, -0.00022235512733459473, -0.000171661376953125, -0.00012096762657165527, -7.027387619018555e-05, -1.958012580871582e-05, 3.1113624572753906e-05, 8.180737495422363e-05, 0.00013250112533569336, 0.00018319487571716309, 0.0002338886260986328, 0.00028458237648010254, 0.00033527612686157227, 0.000385969877243042, 0.0004366636276245117, 0.00048735737800598145, 0.0005380511283874512, 0.0005887448787689209, 0.0006394386291503906, 0.0006901323795318604, 0.0007408261299133301, 0.0007915198802947998, 0.0008422136306762695, 0.0008929073810577393, 0.000943601131439209, 0.0009942948818206787, 0.0010449886322021484, 0.0010956823825836182, 0.0011463761329650879, 0.0011970698833465576, 0.0012477636337280273, 0.001298457384109497, 0.0013491511344909668, 0.0013998448848724365, 0.0014505386352539062]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 8.0, 5.0, 9.0, 7.0, 21.0, 24.0, 37.0, 43.0, 69.0, 96.0, 200.0, 365.0, 866.0, 1821.0, 4943.0, 15663.0, 85469.0, 794068.0, 116803.0, 18421.0, 5651.0, 2122.0, 888.0, 434.0, 213.0, 106.0, 71.0, 40.0, 27.0, 22.0, 12.0, 6.0, 9.0, 5.0, 8.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.3984375, -13.031982421875, -12.66552734375, -12.299072265625, -11.9326171875, -11.566162109375, -11.19970703125, -10.833251953125, -10.466796875, -10.100341796875, -9.73388671875, -9.367431640625, -9.0009765625, -8.634521484375, -8.26806640625, -7.901611328125, -7.53515625, -7.168701171875, -6.80224609375, -6.435791015625, -6.0693359375, -5.702880859375, -5.33642578125, -4.969970703125, -4.603515625, -4.237060546875, -3.87060546875, -3.504150390625, -3.1376953125, -2.771240234375, -2.40478515625, -2.038330078125, -1.671875, -1.305419921875, -0.93896484375, -0.572509765625, -0.2060546875, 0.160400390625, 0.52685546875, 0.893310546875, 1.259765625, 1.626220703125, 1.99267578125, 2.359130859375, 2.7255859375, 3.092041015625, 3.45849609375, 3.824951171875, 4.19140625, 4.557861328125, 4.92431640625, 5.290771484375, 5.6572265625, 6.023681640625, 6.39013671875, 6.756591796875, 7.123046875, 7.489501953125, 7.85595703125, 8.222412109375, 8.5888671875, 8.955322265625, 9.32177734375, 9.688232421875, 10.0546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 3.0, 10.0, 7.0, 14.0, 18.0, 21.0, 30.0, 29.0, 48.0, 101.0, 132.0, 172.0, 108.0, 90.0, 54.0, 29.0, 33.0, 21.0, 15.0, 4.0, 6.0, 3.0, 4.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5390625, -5.3560791015625, -5.173095703125, -4.9901123046875, -4.80712890625, -4.6241455078125, -4.441162109375, -4.2581787109375, -4.0751953125, -3.8922119140625, -3.709228515625, -3.5262451171875, -3.34326171875, -3.1602783203125, -2.977294921875, -2.7943115234375, -2.611328125, -2.4283447265625, -2.245361328125, -2.0623779296875, -1.87939453125, -1.6964111328125, -1.513427734375, -1.3304443359375, -1.1474609375, -0.9644775390625, -0.781494140625, -0.5985107421875, -0.41552734375, -0.2325439453125, -0.049560546875, 0.1334228515625, 0.31640625, 0.4993896484375, 0.682373046875, 0.8653564453125, 1.04833984375, 1.2313232421875, 1.414306640625, 1.5972900390625, 1.7802734375, 1.9632568359375, 2.146240234375, 2.3292236328125, 2.51220703125, 2.6951904296875, 2.878173828125, 3.0611572265625, 3.244140625, 3.4271240234375, 3.610107421875, 3.7930908203125, 3.97607421875, 4.1590576171875, 4.342041015625, 4.5250244140625, 4.7080078125, 4.8909912109375, 5.073974609375, 5.2569580078125, 5.43994140625, 5.6229248046875, 5.805908203125, 5.9888916015625, 6.171875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 28.0, 43.0, 93.0, 166.0, 209.0, 200.0, 102.0, 68.0, 38.0, 25.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.59515380859375, -144.2839813232422, -140.97280883789062, -137.66165161132812, -134.35047912597656, -131.039306640625, -127.72814178466797, -124.41697692871094, -121.10580444335938, -117.79463195800781, -114.48346710205078, -111.17230224609375, -107.86112976074219, -104.54995727539062, -101.2387924194336, -97.92762756347656, -94.616455078125, -91.30528259277344, -87.9941177368164, -84.68295288085938, -81.37178039550781, -78.06060791015625, -74.74944305419922, -71.43827819824219, -68.12710571289062, -64.81593322753906, -61.50476837158203, -58.193599700927734, -54.88243103027344, -51.57126235961914, -48.260093688964844, -44.94892501831055, -41.63775634765625, -38.32658767700195, -35.015419006347656, -31.70425033569336, -28.393081665039062, -25.081912994384766, -21.77074432373047, -18.459575653076172, -15.148406982421875, -11.837238311767578, -8.526069641113281, -5.214900970458984, -1.9037322998046875, 1.4074363708496094, 4.718605041503906, 8.029773712158203, 11.3409423828125, 14.652111053466797, 17.963279724121094, 21.27444839477539, 24.585617065429688, 27.896785736083984, 31.20795440673828, 34.51912307739258, 37.830291748046875, 41.14146041870117, 44.45262908935547, 47.763797760009766, 51.07496643066406, 54.38613510131836, 57.697303771972656, 61.00847244262695, 64.31964111328125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 0.0, 2.0, 5.0, 5.0, 2.0, 7.0, 10.0, 16.0, 23.0, 12.0, 30.0, 35.0, 28.0, 30.0, 37.0, 54.0, 43.0, 44.0, 60.0, 45.0, 47.0, 54.0, 54.0, 50.0, 49.0, 43.0, 42.0, 22.0, 35.0, 16.0, 22.0, 26.0, 12.0, 6.0, 12.0, 6.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.28107452392578, -24.2728214263916, -23.26456642150879, -22.25631332397461, -21.248058319091797, -20.239805221557617, -19.231552124023438, -18.223297119140625, -17.215044021606445, -16.206790924072266, -15.198535919189453, -14.190282821655273, -13.182028770446777, -12.173774719238281, -11.165521621704102, -10.157267570495605, -9.14901351928711, -8.140759468078613, -7.132505893707275, -6.1242523193359375, -5.115998268127441, -4.107744216918945, -3.0994906425476074, -2.0912370681762695, -1.0829830169677734, -0.07472920417785645, 0.9335246086120605, 1.9417784214019775, 2.9500322341918945, 3.9582862854003906, 4.9665398597717285, 5.974793434143066, 6.9830474853515625, 7.991301536560059, 8.999555587768555, 10.007808685302734, 11.01606273651123, 12.024316787719727, 13.032569885253906, 14.040823936462402, 15.049077987670898, 16.057331085205078, 17.06558609008789, 18.07383918762207, 19.08209228515625, 20.090347290039062, 21.098600387573242, 22.106853485107422, 23.115108489990234, 24.123361587524414, 25.131616592407227, 26.139869689941406, 27.14812469482422, 28.1563777923584, 29.164630889892578, 30.17288589477539, 31.18113899230957, 32.18939208984375, 33.19764709472656, 34.205902099609375, 35.21415328979492, 36.222408294677734, 37.23066329956055, 38.238914489746094, 39.247169494628906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 6.0, 3.0, 9.0, 9.0, 10.0, 11.0, 19.0, 48.0, 66.0, 99.0, 144.0, 217.0, 360.0, 661.0, 1243.0, 2247.0, 4785.0, 10863.0, 28607.0, 108121.0, 3300174.0, 627301.0, 69982.0, 21747.0, 8878.0, 4014.0, 2009.0, 1122.0, 629.0, 329.0, 215.0, 115.0, 96.0, 59.0, 28.0, 22.0, 13.0, 12.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.9287109375, -10.615234375, -10.3017578125, -9.98828125, -9.6748046875, -9.361328125, -9.0478515625, -8.734375, -8.4208984375, -8.107421875, -7.7939453125, -7.48046875, -7.1669921875, -6.853515625, -6.5400390625, -6.2265625, -5.9130859375, -5.599609375, -5.2861328125, -4.97265625, -4.6591796875, -4.345703125, -4.0322265625, -3.71875, -3.4052734375, -3.091796875, -2.7783203125, -2.46484375, -2.1513671875, -1.837890625, -1.5244140625, -1.2109375, -0.8974609375, -0.583984375, -0.2705078125, 0.04296875, 0.3564453125, 0.669921875, 0.9833984375, 1.296875, 1.6103515625, 1.923828125, 2.2373046875, 2.55078125, 2.8642578125, 3.177734375, 3.4912109375, 3.8046875, 4.1181640625, 4.431640625, 4.7451171875, 5.05859375, 5.3720703125, 5.685546875, 5.9990234375, 6.3125, 6.6259765625, 6.939453125, 7.2529296875, 7.56640625, 7.8798828125, 8.193359375, 8.5068359375, 8.8203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0, 8.0, 16.0, 12.0, 13.0, 23.0, 33.0, 33.0, 32.0, 45.0, 49.0, 47.0, 44.0, 62.0, 58.0, 52.0, 55.0, 59.0, 61.0, 46.0, 38.0, 39.0, 42.0, 35.0, 16.0, 17.0, 15.0, 8.0, 9.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1591796875, -1.12200927734375, -1.0848388671875, -1.04766845703125, -1.010498046875, -0.97332763671875, -0.9361572265625, -0.89898681640625, -0.86181640625, -0.82464599609375, -0.7874755859375, -0.75030517578125, -0.713134765625, -0.67596435546875, -0.6387939453125, -0.60162353515625, -0.564453125, -0.52728271484375, -0.4901123046875, -0.45294189453125, -0.415771484375, -0.37860107421875, -0.3414306640625, -0.30426025390625, -0.26708984375, -0.22991943359375, -0.1927490234375, -0.15557861328125, -0.118408203125, -0.08123779296875, -0.0440673828125, -0.00689697265625, 0.0302734375, 0.06744384765625, 0.1046142578125, 0.14178466796875, 0.178955078125, 0.21612548828125, 0.2532958984375, 0.29046630859375, 0.32763671875, 0.36480712890625, 0.4019775390625, 0.43914794921875, 0.476318359375, 0.51348876953125, 0.5506591796875, 0.58782958984375, 0.625, 0.66217041015625, 0.6993408203125, 0.73651123046875, 0.773681640625, 0.81085205078125, 0.8480224609375, 0.88519287109375, 0.92236328125, 0.95953369140625, 0.9967041015625, 1.03387451171875, 1.071044921875, 1.10821533203125, 1.1453857421875, 1.18255615234375, 1.2197265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 9.0, 10.0, 8.0, 12.0, 24.0, 45.0, 57.0, 100.0, 152.0, 316.0, 618.0, 1289.0, 3010.0, 7707.0, 22230.0, 82335.0, 951573.0, 2970103.0, 111351.0, 27819.0, 9247.0, 3436.0, 1492.0, 620.0, 297.0, 165.0, 89.0, 53.0, 43.0, 29.0, 21.0, 13.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.859375, -12.5126953125, -12.166015625, -11.8193359375, -11.47265625, -11.1259765625, -10.779296875, -10.4326171875, -10.0859375, -9.7392578125, -9.392578125, -9.0458984375, -8.69921875, -8.3525390625, -8.005859375, -7.6591796875, -7.3125, -6.9658203125, -6.619140625, -6.2724609375, -5.92578125, -5.5791015625, -5.232421875, -4.8857421875, -4.5390625, -4.1923828125, -3.845703125, -3.4990234375, -3.15234375, -2.8056640625, -2.458984375, -2.1123046875, -1.765625, -1.4189453125, -1.072265625, -0.7255859375, -0.37890625, -0.0322265625, 0.314453125, 0.6611328125, 1.0078125, 1.3544921875, 1.701171875, 2.0478515625, 2.39453125, 2.7412109375, 3.087890625, 3.4345703125, 3.78125, 4.1279296875, 4.474609375, 4.8212890625, 5.16796875, 5.5146484375, 5.861328125, 6.2080078125, 6.5546875, 6.9013671875, 7.248046875, 7.5947265625, 7.94140625, 8.2880859375, 8.634765625, 8.9814453125, 9.328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 10.0, 11.0, 13.0, 17.0, 14.0, 32.0, 30.0, 63.0, 117.0, 173.0, 539.0, 1937.0, 569.0, 219.0, 106.0, 62.0, 45.0, 35.0, 25.0, 14.0, 17.0, 9.0, 8.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.018310546875, -4.86865234375, -4.718994140625, -4.5693359375, -4.419677734375, -4.27001953125, -4.120361328125, -3.970703125, -3.821044921875, -3.67138671875, -3.521728515625, -3.3720703125, -3.222412109375, -3.07275390625, -2.923095703125, -2.7734375, -2.623779296875, -2.47412109375, -2.324462890625, -2.1748046875, -2.025146484375, -1.87548828125, -1.725830078125, -1.576171875, -1.426513671875, -1.27685546875, -1.127197265625, -0.9775390625, -0.827880859375, -0.67822265625, -0.528564453125, -0.37890625, -0.229248046875, -0.07958984375, 0.070068359375, 0.2197265625, 0.369384765625, 0.51904296875, 0.668701171875, 0.818359375, 0.968017578125, 1.11767578125, 1.267333984375, 1.4169921875, 1.566650390625, 1.71630859375, 1.865966796875, 2.015625, 2.165283203125, 2.31494140625, 2.464599609375, 2.6142578125, 2.763916015625, 2.91357421875, 3.063232421875, 3.212890625, 3.362548828125, 3.51220703125, 3.661865234375, 3.8115234375, 3.961181640625, 4.11083984375, 4.260498046875, 4.41015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 13.0, 30.0, 45.0, 75.0, 118.0, 183.0, 173.0, 152.0, 101.0, 57.0, 31.0, 10.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.253610610961914, -24.00343132019043, -22.753252029418945, -21.50307273864746, -20.252893447875977, -19.002714157104492, -17.752532958984375, -16.50235366821289, -15.252175331115723, -14.001996040344238, -12.751816749572754, -11.501636505126953, -10.251457214355469, -9.001277923583984, -7.7510986328125, -6.500919342041016, -5.250740051269531, -4.000560760498047, -2.7503812313079834, -1.50020170211792, -0.25002241134643555, 1.0001568794250488, 2.2503366470336914, 3.500515937805176, 4.75069522857666, 6.0008745193481445, 7.251053810119629, 8.50123405456543, 9.751413345336914, 11.001592636108398, 12.251771926879883, 13.501951217651367, 14.752132415771484, 16.00231170654297, 17.252490997314453, 18.502670288085938, 19.752849578857422, 21.003028869628906, 22.25320816040039, 23.503387451171875, 24.75356674194336, 26.003746032714844, 27.253925323486328, 28.504104614257812, 29.754283905029297, 31.00446319580078, 32.254642486572266, 33.50482177734375, 34.7550048828125, 36.005184173583984, 37.25536346435547, 38.50554275512695, 39.75572204589844, 41.00590133666992, 42.256080627441406, 43.50625991821289, 44.756439208984375, 46.00661849975586, 47.256797790527344, 48.50697708129883, 49.75715637207031, 51.0073356628418, 52.25751495361328, 53.507694244384766, 54.75787353515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 5.0, 12.0, 9.0, 12.0, 14.0, 13.0, 13.0, 23.0, 21.0, 20.0, 27.0, 31.0, 44.0, 26.0, 26.0, 43.0, 55.0, 64.0, 41.0, 41.0, 58.0, 42.0, 44.0, 33.0, 34.0, 35.0, 26.0, 39.0, 27.0, 21.0, 19.0, 14.0, 13.0, 7.0, 11.0, 10.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.184621810913086, -10.795694351196289, -10.406766891479492, -10.017839431762695, -9.628911972045898, -9.239983558654785, -8.851056098937988, -8.462128639221191, -8.073201179504395, -7.684273719787598, -7.295346260070801, -6.906418323516846, -6.517490863800049, -6.128563404083252, -5.739635467529297, -5.3507080078125, -4.961780548095703, -4.572853088378906, -4.183925628662109, -3.7949976921081543, -3.4060702323913574, -3.0171427726745605, -2.6282150745391846, -2.2392873764038086, -1.8503599166870117, -1.4614323377609253, -1.0725047588348389, -0.6835771799087524, -0.294649600982666, 0.09427797794342041, 0.48320555686950684, 0.8721332550048828, 1.2610607147216797, 1.6499882936477661, 2.0389158725738525, 2.4278435707092285, 2.8167710304260254, 3.2056984901428223, 3.5946261882781982, 3.983553886413574, 4.372481346130371, 4.761408805847168, 5.150336265563965, 5.53926420211792, 5.928191661834717, 6.317119121551514, 6.706047058105469, 7.094974517822266, 7.4839019775390625, 7.872829437255859, 8.261756896972656, 8.650684356689453, 9.03961181640625, 9.428540229797363, 9.81746768951416, 10.206395149230957, 10.595322608947754, 10.98425006866455, 11.373177528381348, 11.762104988098145, 12.151033401489258, 12.539960861206055, 12.928888320922852, 13.317815780639648, 13.706743240356445]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 19.0, 17.0, 29.0, 33.0, 66.0, 93.0, 132.0, 184.0, 294.0, 451.0, 669.0, 1063.0, 1710.0, 2863.0, 4556.0, 7604.0, 13261.0, 24101.0, 43031.0, 85487.0, 381015.0, 311121.0, 77374.0, 39831.0, 22494.0, 12489.0, 7193.0, 4319.0, 2585.0, 1596.0, 1006.0, 606.0, 446.0, 267.0, 173.0, 116.0, 79.0, 56.0, 32.0, 28.0, 23.0, 8.0, 8.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.7734375, -6.5738525390625, -6.374267578125, -6.1746826171875, -5.97509765625, -5.7755126953125, -5.575927734375, -5.3763427734375, -5.1767578125, -4.9771728515625, -4.777587890625, -4.5780029296875, -4.37841796875, -4.1788330078125, -3.979248046875, -3.7796630859375, -3.580078125, -3.3804931640625, -3.180908203125, -2.9813232421875, -2.78173828125, -2.5821533203125, -2.382568359375, -2.1829833984375, -1.9833984375, -1.7838134765625, -1.584228515625, -1.3846435546875, -1.18505859375, -0.9854736328125, -0.785888671875, -0.5863037109375, -0.38671875, -0.1871337890625, 0.012451171875, 0.2120361328125, 0.41162109375, 0.6112060546875, 0.810791015625, 1.0103759765625, 1.2099609375, 1.4095458984375, 1.609130859375, 1.8087158203125, 2.00830078125, 2.2078857421875, 2.407470703125, 2.6070556640625, 2.806640625, 3.0062255859375, 3.205810546875, 3.4053955078125, 3.60498046875, 3.8045654296875, 4.004150390625, 4.2037353515625, 4.4033203125, 4.6029052734375, 4.802490234375, 5.0020751953125, 5.20166015625, 5.4012451171875, 5.600830078125, 5.8004150390625, 6.0]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 17.0, 23.0, 22.0, 33.0, 31.0, 48.0, 41.0, 45.0, 41.0, 58.0, 74.0, 59.0, 55.0, 56.0, 55.0, 43.0, 44.0, 42.0, 44.0, 31.0, 19.0, 22.0, 15.0, 23.0, 7.0, 11.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.244140625, -1.2049713134765625, -1.165802001953125, -1.1266326904296875, -1.08746337890625, -1.0482940673828125, -1.009124755859375, -0.9699554443359375, -0.9307861328125, -0.8916168212890625, -0.852447509765625, -0.8132781982421875, -0.77410888671875, -0.7349395751953125, -0.695770263671875, -0.6566009521484375, -0.617431640625, -0.5782623291015625, -0.539093017578125, -0.4999237060546875, -0.46075439453125, -0.4215850830078125, -0.382415771484375, -0.3432464599609375, -0.3040771484375, -0.2649078369140625, -0.225738525390625, -0.1865692138671875, -0.14739990234375, -0.1082305908203125, -0.069061279296875, -0.0298919677734375, 0.00927734375, 0.0484466552734375, 0.087615966796875, 0.1267852783203125, 0.16595458984375, 0.2051239013671875, 0.244293212890625, 0.2834625244140625, 0.3226318359375, 0.3618011474609375, 0.400970458984375, 0.4401397705078125, 0.47930908203125, 0.5184783935546875, 0.557647705078125, 0.5968170166015625, 0.635986328125, 0.6751556396484375, 0.714324951171875, 0.7534942626953125, 0.79266357421875, 0.8318328857421875, 0.871002197265625, 0.9101715087890625, 0.9493408203125, 0.9885101318359375, 1.027679443359375, 1.0668487548828125, 1.10601806640625, 1.1451873779296875, 1.184356689453125, 1.2235260009765625, 1.2626953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 9.0, 15.0, 13.0, 9.0, 16.0, 24.0, 34.0, 43.0, 58.0, 91.0, 128.0, 181.0, 274.0, 410.0, 784.0, 1552.0, 3395.0, 8123.0, 21315.0, 65246.0, 411998.0, 431352.0, 66075.0, 21823.0, 8360.0, 3410.0, 1593.0, 807.0, 454.0, 288.0, 199.0, 140.0, 95.0, 63.0, 60.0, 42.0, 18.0, 16.0, 7.0, 6.0, 4.0, 4.0, 5.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.1796875, -10.8509521484375, -10.522216796875, -10.1934814453125, -9.86474609375, -9.5360107421875, -9.207275390625, -8.8785400390625, -8.5498046875, -8.2210693359375, -7.892333984375, -7.5635986328125, -7.23486328125, -6.9061279296875, -6.577392578125, -6.2486572265625, -5.919921875, -5.5911865234375, -5.262451171875, -4.9337158203125, -4.60498046875, -4.2762451171875, -3.947509765625, -3.6187744140625, -3.2900390625, -2.9613037109375, -2.632568359375, -2.3038330078125, -1.97509765625, -1.6463623046875, -1.317626953125, -0.9888916015625, -0.66015625, -0.3314208984375, -0.002685546875, 0.3260498046875, 0.65478515625, 0.9835205078125, 1.312255859375, 1.6409912109375, 1.9697265625, 2.2984619140625, 2.627197265625, 2.9559326171875, 3.28466796875, 3.6134033203125, 3.942138671875, 4.2708740234375, 4.599609375, 4.9283447265625, 5.257080078125, 5.5858154296875, 5.91455078125, 6.2432861328125, 6.572021484375, 6.9007568359375, 7.2294921875, 7.5582275390625, 7.886962890625, 8.2156982421875, 8.54443359375, 8.8731689453125, 9.201904296875, 9.5306396484375, 9.859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 2.0, 2.0, 7.0, 6.0, 6.0, 6.0, 8.0, 8.0, 8.0, 8.0, 23.0, 29.0, 34.0, 28.0, 47.0, 46.0, 37.0, 52.0, 64.0, 67.0, 53.0, 55.0, 52.0, 42.0, 41.0, 44.0, 33.0, 27.0, 23.0, 25.0, 29.0, 20.0, 15.0, 7.0, 13.0, 10.0, 6.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.640625, -5.4610595703125, -5.281494140625, -5.1019287109375, -4.92236328125, -4.7427978515625, -4.563232421875, -4.3836669921875, -4.2041015625, -4.0245361328125, -3.844970703125, -3.6654052734375, -3.48583984375, -3.3062744140625, -3.126708984375, -2.9471435546875, -2.767578125, -2.5880126953125, -2.408447265625, -2.2288818359375, -2.04931640625, -1.8697509765625, -1.690185546875, -1.5106201171875, -1.3310546875, -1.1514892578125, -0.971923828125, -0.7923583984375, -0.61279296875, -0.4332275390625, -0.253662109375, -0.0740966796875, 0.10546875, 0.2850341796875, 0.464599609375, 0.6441650390625, 0.82373046875, 1.0032958984375, 1.182861328125, 1.3624267578125, 1.5419921875, 1.7215576171875, 1.901123046875, 2.0806884765625, 2.26025390625, 2.4398193359375, 2.619384765625, 2.7989501953125, 2.978515625, 3.1580810546875, 3.337646484375, 3.5172119140625, 3.69677734375, 3.8763427734375, 4.055908203125, 4.2354736328125, 4.4150390625, 4.5946044921875, 4.774169921875, 4.9537353515625, 5.13330078125, 5.3128662109375, 5.492431640625, 5.6719970703125, 5.8515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 6.0, 8.0, 17.0, 24.0, 35.0, 50.0, 82.0, 134.0, 286.0, 553.0, 1056.0, 2460.0, 6481.0, 21498.0, 182117.0, 765137.0, 50143.0, 11373.0, 3829.0, 1547.0, 766.0, 394.0, 209.0, 125.0, 83.0, 39.0, 29.0, 20.0, 15.0, 10.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.390380859375, -7.10888671875, -6.827392578125, -6.5458984375, -6.264404296875, -5.98291015625, -5.701416015625, -5.419921875, -5.138427734375, -4.85693359375, -4.575439453125, -4.2939453125, -4.012451171875, -3.73095703125, -3.449462890625, -3.16796875, -2.886474609375, -2.60498046875, -2.323486328125, -2.0419921875, -1.760498046875, -1.47900390625, -1.197509765625, -0.916015625, -0.634521484375, -0.35302734375, -0.071533203125, 0.2099609375, 0.491455078125, 0.77294921875, 1.054443359375, 1.3359375, 1.617431640625, 1.89892578125, 2.180419921875, 2.4619140625, 2.743408203125, 3.02490234375, 3.306396484375, 3.587890625, 3.869384765625, 4.15087890625, 4.432373046875, 4.7138671875, 4.995361328125, 5.27685546875, 5.558349609375, 5.83984375, 6.121337890625, 6.40283203125, 6.684326171875, 6.9658203125, 7.247314453125, 7.52880859375, 7.810302734375, 8.091796875, 8.373291015625, 8.65478515625, 8.936279296875, 9.2177734375, 9.499267578125, 9.78076171875, 10.062255859375, 10.34375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 21.0, 24.0, 29.0, 60.0, 114.0, 281.0, 200.0, 78.0, 34.0, 30.0, 26.0, 10.0, 8.0, 14.0, 2.0, 5.0, 5.0, 10.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012197494506835938, -0.001180201768875122, -0.0011406540870666504, -0.0011011064052581787, -0.001061558723449707, -0.0010220110416412354, -0.0009824633598327637, -0.000942915678024292, -0.0009033679962158203, -0.0008638203144073486, -0.000824272632598877, -0.0007847249507904053, -0.0007451772689819336, -0.0007056295871734619, -0.0006660819053649902, -0.0006265342235565186, -0.0005869865417480469, -0.0005474388599395752, -0.0005078911781311035, -0.00046834349632263184, -0.00042879581451416016, -0.0003892481327056885, -0.0003497004508972168, -0.0003101527690887451, -0.00027060508728027344, -0.00023105740547180176, -0.00019150972366333008, -0.0001519620418548584, -0.00011241436004638672, -7.286667823791504e-05, -3.331899642944336e-05, 6.22868537902832e-06, 4.57763671875e-05, 8.532404899597168e-05, 0.00012487173080444336, 0.00016441941261291504, 0.00020396709442138672, 0.0002435147762298584, 0.0002830624580383301, 0.00032261013984680176, 0.00036215782165527344, 0.0004017055034637451, 0.0004412531852722168, 0.0004808008670806885, 0.0005203485488891602, 0.0005598962306976318, 0.0005994439125061035, 0.0006389915943145752, 0.0006785392761230469, 0.0007180869579315186, 0.0007576346397399902, 0.0007971823215484619, 0.0008367300033569336, 0.0008762776851654053, 0.000915825366973877, 0.0009553730487823486, 0.0009949207305908203, 0.001034468412399292, 0.0010740160942077637, 0.0011135637760162354, 0.001153111457824707, 0.0011926591396331787, 0.0012322068214416504, 0.001271754503250122, 0.0013113021850585938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 4.0, 4.0, 9.0, 12.0, 15.0, 21.0, 24.0, 46.0, 61.0, 103.0, 167.0, 277.0, 592.0, 1317.0, 3095.0, 8850.0, 37956.0, 752238.0, 212977.0, 20452.0, 6030.0, 2230.0, 905.0, 457.0, 222.0, 126.0, 86.0, 53.0, 50.0, 34.0, 30.0, 28.0, 16.0, 17.0, 13.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.078125, -9.7886962890625, -9.499267578125, -9.2098388671875, -8.92041015625, -8.6309814453125, -8.341552734375, -8.0521240234375, -7.7626953125, -7.4732666015625, -7.183837890625, -6.8944091796875, -6.60498046875, -6.3155517578125, -6.026123046875, -5.7366943359375, -5.447265625, -5.1578369140625, -4.868408203125, -4.5789794921875, -4.28955078125, -4.0001220703125, -3.710693359375, -3.4212646484375, -3.1318359375, -2.8424072265625, -2.552978515625, -2.2635498046875, -1.97412109375, -1.6846923828125, -1.395263671875, -1.1058349609375, -0.81640625, -0.5269775390625, -0.237548828125, 0.0518798828125, 0.34130859375, 0.6307373046875, 0.920166015625, 1.2095947265625, 1.4990234375, 1.7884521484375, 2.077880859375, 2.3673095703125, 2.65673828125, 2.9461669921875, 3.235595703125, 3.5250244140625, 3.814453125, 4.1038818359375, 4.393310546875, 4.6827392578125, 4.97216796875, 5.2615966796875, 5.551025390625, 5.8404541015625, 6.1298828125, 6.4193115234375, 6.708740234375, 6.9981689453125, 7.28759765625, 7.5770263671875, 7.866455078125, 8.1558837890625, 8.4453125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 10.0, 12.0, 11.0, 15.0, 26.0, 76.0, 143.0, 200.0, 184.0, 112.0, 50.0, 34.0, 17.0, 13.0, 12.0, 5.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.73046875, -5.57037353515625, -5.4102783203125, -5.25018310546875, -5.090087890625, -4.92999267578125, -4.7698974609375, -4.60980224609375, -4.44970703125, -4.28961181640625, -4.1295166015625, -3.96942138671875, -3.809326171875, -3.64923095703125, -3.4891357421875, -3.32904052734375, -3.1689453125, -3.00885009765625, -2.8487548828125, -2.68865966796875, -2.528564453125, -2.36846923828125, -2.2083740234375, -2.04827880859375, -1.88818359375, -1.72808837890625, -1.5679931640625, -1.40789794921875, -1.247802734375, -1.08770751953125, -0.9276123046875, -0.76751708984375, -0.607421875, -0.44732666015625, -0.2872314453125, -0.12713623046875, 0.032958984375, 0.19305419921875, 0.3531494140625, 0.51324462890625, 0.67333984375, 0.83343505859375, 0.9935302734375, 1.15362548828125, 1.313720703125, 1.47381591796875, 1.6339111328125, 1.79400634765625, 1.9541015625, 2.11419677734375, 2.2742919921875, 2.43438720703125, 2.594482421875, 2.75457763671875, 2.9146728515625, 3.07476806640625, 3.23486328125, 3.39495849609375, 3.5550537109375, 3.71514892578125, 3.875244140625, 4.03533935546875, 4.1954345703125, 4.35552978515625, 4.515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 19.0, 30.0, 62.0, 152.0, 179.0, 196.0, 164.0, 104.0, 57.0, 19.0, 9.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.7877197265625, -69.37320709228516, -65.95869445800781, -62.544189453125, -59.129676818847656, -55.71516418457031, -52.300655364990234, -48.886146545410156, -45.47163391113281, -42.05712127685547, -38.64261245727539, -35.22810363769531, -31.81359100341797, -28.399080276489258, -24.984569549560547, -21.570058822631836, -18.155548095703125, -14.741037368774414, -11.326526641845703, -7.912015914916992, -4.497505187988281, -1.0829944610595703, 2.3315162658691406, 5.746026992797852, 9.160537719726562, 12.575048446655273, 15.989559173583984, 19.404069900512695, 22.818580627441406, 26.233091354370117, 29.647602081298828, 33.062110900878906, 36.47662353515625, 39.891136169433594, 43.30564498901367, 46.72015380859375, 50.134666442871094, 53.54917907714844, 56.963687896728516, 60.378196716308594, 63.79270935058594, 67.20722198486328, 70.62173461914062, 74.03623962402344, 77.45075225830078, 80.86526489257812, 84.27976989746094, 87.69428253173828, 91.10879516601562, 94.52330780029297, 97.93782043457031, 101.35232543945312, 104.76683807373047, 108.18135070800781, 111.59585571289062, 115.01036834716797, 118.42488098144531, 121.83939361572266, 125.25390625, 128.6684112548828, 132.08291625976562, 135.4974365234375, 138.9119415283203, 142.3264617919922, 145.740966796875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 11.0, 12.0, 14.0, 14.0, 22.0, 20.0, 24.0, 31.0, 46.0, 40.0, 38.0, 40.0, 50.0, 41.0, 51.0, 52.0, 45.0, 48.0, 36.0, 46.0, 53.0, 35.0, 36.0, 37.0, 31.0, 23.0, 22.0, 17.0, 14.0, 12.0, 8.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.459569931030273, -25.506454467773438, -24.553340911865234, -23.6002254486084, -22.647109985351562, -21.69399642944336, -20.740880966186523, -19.787765502929688, -18.834651947021484, -17.88153648376465, -16.928422927856445, -15.97530746459961, -15.022192001342773, -14.069077491760254, -13.115962982177734, -12.162847518920898, -11.209732055664062, -10.256617546081543, -9.303502082824707, -8.350387573242188, -7.39727258682251, -6.444157600402832, -5.4910430908203125, -4.537928104400635, -3.584813117980957, -2.6316981315612793, -1.6785833835601807, -0.725468635559082, 0.2276463508605957, 1.1807613372802734, 2.133875846862793, 3.0869908332824707, 4.040103912353516, 4.993218898773193, 5.946333885192871, 6.899448394775391, 7.852563381195068, 8.805678367614746, 9.758792877197266, 10.711908340454102, 11.665022850036621, 12.61813735961914, 13.571252822875977, 14.524367332458496, 15.477481842041016, 16.43059730529785, 17.383712768554688, 18.33682632446289, 19.289941787719727, 20.243057250976562, 21.196170806884766, 22.1492862701416, 23.102401733398438, 24.05551528930664, 25.008630752563477, 25.961746215820312, 26.914859771728516, 27.86797523498535, 28.821088790893555, 29.77420425415039, 30.727319717407227, 31.680435180664062, 32.633548736572266, 33.58666229248047, 34.53977966308594]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 11.0, 14.0, 22.0, 36.0, 36.0, 61.0, 100.0, 145.0, 240.0, 393.0, 686.0, 1114.0, 2096.0, 4061.0, 8170.0, 17484.0, 44578.0, 200111.0, 3617753.0, 215164.0, 45950.0, 18118.0, 8524.0, 4197.0, 2194.0, 1260.0, 723.0, 385.0, 246.0, 156.0, 79.0, 69.0, 34.0, 18.0, 16.0, 12.0, 10.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1953125, -9.871826171875, -9.54833984375, -9.224853515625, -8.9013671875, -8.577880859375, -8.25439453125, -7.930908203125, -7.607421875, -7.283935546875, -6.96044921875, -6.636962890625, -6.3134765625, -5.989990234375, -5.66650390625, -5.343017578125, -5.01953125, -4.696044921875, -4.37255859375, -4.049072265625, -3.7255859375, -3.402099609375, -3.07861328125, -2.755126953125, -2.431640625, -2.108154296875, -1.78466796875, -1.461181640625, -1.1376953125, -0.814208984375, -0.49072265625, -0.167236328125, 0.15625, 0.479736328125, 0.80322265625, 1.126708984375, 1.4501953125, 1.773681640625, 2.09716796875, 2.420654296875, 2.744140625, 3.067626953125, 3.39111328125, 3.714599609375, 4.0380859375, 4.361572265625, 4.68505859375, 5.008544921875, 5.33203125, 5.655517578125, 5.97900390625, 6.302490234375, 6.6259765625, 6.949462890625, 7.27294921875, 7.596435546875, 7.919921875, 8.243408203125, 8.56689453125, 8.890380859375, 9.2138671875, 9.537353515625, 9.86083984375, 10.184326171875, 10.5078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 6.0, 7.0, 22.0, 14.0, 33.0, 26.0, 38.0, 40.0, 45.0, 56.0, 47.0, 62.0, 57.0, 45.0, 68.0, 58.0, 47.0, 54.0, 60.0, 40.0, 40.0, 31.0, 26.0, 12.0, 10.0, 18.0, 7.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.421875, -1.3782501220703125, -1.334625244140625, -1.2910003662109375, -1.24737548828125, -1.2037506103515625, -1.160125732421875, -1.1165008544921875, -1.0728759765625, -1.0292510986328125, -0.985626220703125, -0.9420013427734375, -0.89837646484375, -0.8547515869140625, -0.811126708984375, -0.7675018310546875, -0.723876953125, -0.6802520751953125, -0.636627197265625, -0.5930023193359375, -0.54937744140625, -0.5057525634765625, -0.462127685546875, -0.4185028076171875, -0.3748779296875, -0.3312530517578125, -0.287628173828125, -0.2440032958984375, -0.20037841796875, -0.1567535400390625, -0.113128662109375, -0.0695037841796875, -0.02587890625, 0.0177459716796875, 0.061370849609375, 0.1049957275390625, 0.14862060546875, 0.1922454833984375, 0.235870361328125, 0.2794952392578125, 0.3231201171875, 0.3667449951171875, 0.410369873046875, 0.4539947509765625, 0.49761962890625, 0.5412445068359375, 0.584869384765625, 0.6284942626953125, 0.672119140625, 0.7157440185546875, 0.759368896484375, 0.8029937744140625, 0.84661865234375, 0.8902435302734375, 0.933868408203125, 0.9774932861328125, 1.0211181640625, 1.0647430419921875, 1.108367919921875, 1.1519927978515625, 1.19561767578125, 1.2392425537109375, 1.282867431640625, 1.3264923095703125, 1.3701171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 14.0, 21.0, 26.0, 46.0, 79.0, 107.0, 148.0, 278.0, 549.0, 1009.0, 2059.0, 4690.0, 11516.0, 34017.0, 151572.0, 3563841.0, 342244.0, 53486.0, 16562.0, 6412.0, 2786.0, 1274.0, 679.0, 351.0, 198.0, 109.0, 67.0, 48.0, 23.0, 26.0, 12.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.8330078125, -11.447265625, -11.0615234375, -10.67578125, -10.2900390625, -9.904296875, -9.5185546875, -9.1328125, -8.7470703125, -8.361328125, -7.9755859375, -7.58984375, -7.2041015625, -6.818359375, -6.4326171875, -6.046875, -5.6611328125, -5.275390625, -4.8896484375, -4.50390625, -4.1181640625, -3.732421875, -3.3466796875, -2.9609375, -2.5751953125, -2.189453125, -1.8037109375, -1.41796875, -1.0322265625, -0.646484375, -0.2607421875, 0.125, 0.5107421875, 0.896484375, 1.2822265625, 1.66796875, 2.0537109375, 2.439453125, 2.8251953125, 3.2109375, 3.5966796875, 3.982421875, 4.3681640625, 4.75390625, 5.1396484375, 5.525390625, 5.9111328125, 6.296875, 6.6826171875, 7.068359375, 7.4541015625, 7.83984375, 8.2255859375, 8.611328125, 8.9970703125, 9.3828125, 9.7685546875, 10.154296875, 10.5400390625, 10.92578125, 11.3115234375, 11.697265625, 12.0830078125, 12.46875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 12.0, 17.0, 23.0, 16.0, 48.0, 70.0, 98.0, 149.0, 329.0, 1704.0, 943.0, 255.0, 130.0, 90.0, 43.0, 39.0, 25.0, 12.0, 15.0, 15.0, 5.0, 8.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.211669921875, -4.07958984375, -3.947509765625, -3.8154296875, -3.683349609375, -3.55126953125, -3.419189453125, -3.287109375, -3.155029296875, -3.02294921875, -2.890869140625, -2.7587890625, -2.626708984375, -2.49462890625, -2.362548828125, -2.23046875, -2.098388671875, -1.96630859375, -1.834228515625, -1.7021484375, -1.570068359375, -1.43798828125, -1.305908203125, -1.173828125, -1.041748046875, -0.90966796875, -0.777587890625, -0.6455078125, -0.513427734375, -0.38134765625, -0.249267578125, -0.1171875, 0.014892578125, 0.14697265625, 0.279052734375, 0.4111328125, 0.543212890625, 0.67529296875, 0.807373046875, 0.939453125, 1.071533203125, 1.20361328125, 1.335693359375, 1.4677734375, 1.599853515625, 1.73193359375, 1.864013671875, 1.99609375, 2.128173828125, 2.26025390625, 2.392333984375, 2.5244140625, 2.656494140625, 2.78857421875, 2.920654296875, 3.052734375, 3.184814453125, 3.31689453125, 3.448974609375, 3.5810546875, 3.713134765625, 3.84521484375, 3.977294921875, 4.109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 10.0, 9.0, 27.0, 26.0, 61.0, 64.0, 116.0, 113.0, 153.0, 101.0, 99.0, 85.0, 59.0, 37.0, 14.0, 11.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.83433532714844, -44.87868881225586, -43.92304229736328, -42.96739959716797, -42.01175308227539, -41.05610656738281, -40.100460052490234, -39.144813537597656, -38.189170837402344, -37.233524322509766, -36.27787780761719, -35.322235107421875, -34.3665885925293, -33.41094207763672, -32.45529556274414, -31.499649047851562, -30.544002532958984, -29.588356018066406, -28.63271141052246, -27.677064895629883, -26.721420288085938, -25.76577377319336, -24.81012725830078, -23.854480743408203, -22.898836135864258, -21.94318962097168, -20.987545013427734, -20.031898498535156, -19.076251983642578, -18.120607376098633, -17.164960861206055, -16.20931625366211, -15.253671646118164, -14.298026084899902, -13.34238052368164, -12.386734008789062, -11.4310884475708, -10.475442886352539, -9.519796371459961, -8.5641508102417, -7.6085052490234375, -6.652859687805176, -5.697213649749756, -4.741567611694336, -3.785922050476074, -2.8302764892578125, -1.8746304512023926, -0.9189844131469727, 0.03666114807128906, 0.9923069477081299, 1.9479527473449707, 2.9035985469818115, 3.8592443466186523, 4.814889907836914, 5.770535945892334, 6.726181983947754, 7.681827545166016, 8.637473106384277, 9.593118667602539, 10.548765182495117, 11.504410743713379, 12.46005630493164, 13.415702819824219, 14.37134838104248, 15.326993942260742]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 11.0, 3.0, 8.0, 7.0, 7.0, 4.0, 15.0, 20.0, 17.0, 21.0, 22.0, 27.0, 31.0, 29.0, 30.0, 34.0, 37.0, 35.0, 38.0, 32.0, 45.0, 42.0, 41.0, 38.0, 33.0, 35.0, 35.0, 36.0, 25.0, 35.0, 26.0, 20.0, 30.0, 23.0, 20.0, 21.0, 10.0, 18.0, 8.0, 7.0, 13.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.537696838378906, -12.187530517578125, -11.837364196777344, -11.487197875976562, -11.137031555175781, -10.786865234375, -10.436698913574219, -10.086532592773438, -9.736366271972656, -9.386199951171875, -9.036033630371094, -8.685867309570312, -8.335700988769531, -7.98553466796875, -7.6353678703308105, -7.285201549530029, -6.93503475189209, -6.584868431091309, -6.234702110290527, -5.884535789489746, -5.534369468688965, -5.184203147888184, -4.834036350250244, -4.483870029449463, -4.133703708648682, -3.7835373878479004, -3.433371067047119, -3.083204507827759, -2.7330381870269775, -2.3828718662261963, -2.032705307006836, -1.6825389862060547, -1.332371711730957, -0.982205331325531, -0.632038950920105, -0.2818725109100342, 0.06829380989074707, 0.4184601306915283, 0.7686266899108887, 1.11879301071167, 1.4689593315124512, 1.8191256523132324, 2.1692919731140137, 2.519458532333374, 2.8696248531341553, 3.2197911739349365, 3.569957733154297, 3.920124053955078, 4.270290374755859, 4.620456695556641, 4.970623016357422, 5.320789337158203, 5.670955657958984, 6.021121978759766, 6.371288776397705, 6.721455097198486, 7.071621417999268, 7.421787738800049, 7.77195405960083, 8.12212085723877, 8.47228717803955, 8.822453498840332, 9.172619819641113, 9.522786140441895, 9.872952461242676]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 5.0, 8.0, 19.0, 17.0, 26.0, 51.0, 85.0, 123.0, 175.0, 299.0, 415.0, 685.0, 1163.0, 1891.0, 3138.0, 5410.0, 9313.0, 16450.0, 28727.0, 56740.0, 198473.0, 513694.0, 111183.0, 44144.0, 23825.0, 13377.0, 7719.0, 4517.0, 2663.0, 1670.0, 946.0, 567.0, 347.0, 231.0, 150.0, 100.0, 61.0, 37.0, 26.0, 14.0, 22.0, 11.0, 10.0, 6.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.55078125, -6.34814453125, -6.1455078125, -5.94287109375, -5.740234375, -5.53759765625, -5.3349609375, -5.13232421875, -4.9296875, -4.72705078125, -4.5244140625, -4.32177734375, -4.119140625, -3.91650390625, -3.7138671875, -3.51123046875, -3.30859375, -3.10595703125, -2.9033203125, -2.70068359375, -2.498046875, -2.29541015625, -2.0927734375, -1.89013671875, -1.6875, -1.48486328125, -1.2822265625, -1.07958984375, -0.876953125, -0.67431640625, -0.4716796875, -0.26904296875, -0.06640625, 0.13623046875, 0.3388671875, 0.54150390625, 0.744140625, 0.94677734375, 1.1494140625, 1.35205078125, 1.5546875, 1.75732421875, 1.9599609375, 2.16259765625, 2.365234375, 2.56787109375, 2.7705078125, 2.97314453125, 3.17578125, 3.37841796875, 3.5810546875, 3.78369140625, 3.986328125, 4.18896484375, 4.3916015625, 4.59423828125, 4.796875, 4.99951171875, 5.2021484375, 5.40478515625, 5.607421875, 5.81005859375, 6.0126953125, 6.21533203125, 6.41796875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 1.0, 9.0, 11.0, 19.0, 21.0, 27.0, 31.0, 35.0, 30.0, 42.0, 53.0, 58.0, 61.0, 41.0, 54.0, 56.0, 61.0, 56.0, 59.0, 48.0, 36.0, 36.0, 38.0, 21.0, 18.0, 18.0, 11.0, 12.0, 6.0, 9.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3726043701171875, -1.329193115234375, -1.2857818603515625, -1.24237060546875, -1.1989593505859375, -1.155548095703125, -1.1121368408203125, -1.0687255859375, -1.0253143310546875, -0.981903076171875, -0.9384918212890625, -0.89508056640625, -0.8516693115234375, -0.808258056640625, -0.7648468017578125, -0.721435546875, -0.6780242919921875, -0.634613037109375, -0.5912017822265625, -0.54779052734375, -0.5043792724609375, -0.460968017578125, -0.4175567626953125, -0.3741455078125, -0.3307342529296875, -0.287322998046875, -0.2439117431640625, -0.20050048828125, -0.1570892333984375, -0.113677978515625, -0.0702667236328125, -0.02685546875, 0.0165557861328125, 0.059967041015625, 0.1033782958984375, 0.14678955078125, 0.1902008056640625, 0.233612060546875, 0.2770233154296875, 0.3204345703125, 0.3638458251953125, 0.407257080078125, 0.4506683349609375, 0.49407958984375, 0.5374908447265625, 0.580902099609375, 0.6243133544921875, 0.667724609375, 0.7111358642578125, 0.754547119140625, 0.7979583740234375, 0.84136962890625, 0.8847808837890625, 0.928192138671875, 0.9716033935546875, 1.0150146484375, 1.0584259033203125, 1.101837158203125, 1.1452484130859375, 1.18865966796875, 1.2320709228515625, 1.275482177734375, 1.3188934326171875, 1.3623046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 11.0, 13.0, 25.0, 35.0, 65.0, 81.0, 120.0, 188.0, 313.0, 539.0, 950.0, 1729.0, 3323.0, 6731.0, 14446.0, 31727.0, 80692.0, 604452.0, 210151.0, 50288.0, 21823.0, 10139.0, 4991.0, 2520.0, 1312.0, 775.0, 406.0, 234.0, 160.0, 103.0, 57.0, 41.0, 25.0, 16.0, 14.0, 11.0, 7.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.6015625, -8.322021484375, -8.04248046875, -7.762939453125, -7.4833984375, -7.203857421875, -6.92431640625, -6.644775390625, -6.365234375, -6.085693359375, -5.80615234375, -5.526611328125, -5.2470703125, -4.967529296875, -4.68798828125, -4.408447265625, -4.12890625, -3.849365234375, -3.56982421875, -3.290283203125, -3.0107421875, -2.731201171875, -2.45166015625, -2.172119140625, -1.892578125, -1.613037109375, -1.33349609375, -1.053955078125, -0.7744140625, -0.494873046875, -0.21533203125, 0.064208984375, 0.34375, 0.623291015625, 0.90283203125, 1.182373046875, 1.4619140625, 1.741455078125, 2.02099609375, 2.300537109375, 2.580078125, 2.859619140625, 3.13916015625, 3.418701171875, 3.6982421875, 3.977783203125, 4.25732421875, 4.536865234375, 4.81640625, 5.095947265625, 5.37548828125, 5.655029296875, 5.9345703125, 6.214111328125, 6.49365234375, 6.773193359375, 7.052734375, 7.332275390625, 7.61181640625, 7.891357421875, 8.1708984375, 8.450439453125, 8.72998046875, 9.009521484375, 9.2890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 8.0, 6.0, 12.0, 9.0, 16.0, 27.0, 31.0, 31.0, 29.0, 44.0, 45.0, 41.0, 41.0, 48.0, 45.0, 61.0, 58.0, 69.0, 49.0, 54.0, 43.0, 39.0, 38.0, 30.0, 28.0, 24.0, 14.0, 11.0, 13.0, 7.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.765625, -6.56329345703125, -6.3609619140625, -6.15863037109375, -5.956298828125, -5.75396728515625, -5.5516357421875, -5.34930419921875, -5.14697265625, -4.94464111328125, -4.7423095703125, -4.53997802734375, -4.337646484375, -4.13531494140625, -3.9329833984375, -3.73065185546875, -3.5283203125, -3.32598876953125, -3.1236572265625, -2.92132568359375, -2.718994140625, -2.51666259765625, -2.3143310546875, -2.11199951171875, -1.90966796875, -1.70733642578125, -1.5050048828125, -1.30267333984375, -1.100341796875, -0.89801025390625, -0.6956787109375, -0.49334716796875, -0.291015625, -0.08868408203125, 0.1136474609375, 0.31597900390625, 0.518310546875, 0.72064208984375, 0.9229736328125, 1.12530517578125, 1.32763671875, 1.52996826171875, 1.7322998046875, 1.93463134765625, 2.136962890625, 2.33929443359375, 2.5416259765625, 2.74395751953125, 2.9462890625, 3.14862060546875, 3.3509521484375, 3.55328369140625, 3.755615234375, 3.95794677734375, 4.1602783203125, 4.36260986328125, 4.56494140625, 4.76727294921875, 4.9696044921875, 5.17193603515625, 5.374267578125, 5.57659912109375, 5.7789306640625, 5.98126220703125, 6.18359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 14.0, 13.0, 20.0, 27.0, 43.0, 74.0, 117.0, 200.0, 301.0, 537.0, 1001.0, 1953.0, 4402.0, 10528.0, 29856.0, 108325.0, 547817.0, 258788.0, 54363.0, 17451.0, 6540.0, 2955.0, 1404.0, 714.0, 417.0, 296.0, 137.0, 104.0, 49.0, 32.0, 24.0, 14.0, 10.0, 10.0, 4.0, 7.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.5078125, -3.38580322265625, -3.2637939453125, -3.14178466796875, -3.019775390625, -2.89776611328125, -2.7757568359375, -2.65374755859375, -2.53173828125, -2.40972900390625, -2.2877197265625, -2.16571044921875, -2.043701171875, -1.92169189453125, -1.7996826171875, -1.67767333984375, -1.5556640625, -1.43365478515625, -1.3116455078125, -1.18963623046875, -1.067626953125, -0.94561767578125, -0.8236083984375, -0.70159912109375, -0.57958984375, -0.45758056640625, -0.3355712890625, -0.21356201171875, -0.091552734375, 0.03045654296875, 0.1524658203125, 0.27447509765625, 0.396484375, 0.51849365234375, 0.6405029296875, 0.76251220703125, 0.884521484375, 1.00653076171875, 1.1285400390625, 1.25054931640625, 1.37255859375, 1.49456787109375, 1.6165771484375, 1.73858642578125, 1.860595703125, 1.98260498046875, 2.1046142578125, 2.22662353515625, 2.3486328125, 2.47064208984375, 2.5926513671875, 2.71466064453125, 2.836669921875, 2.95867919921875, 3.0806884765625, 3.20269775390625, 3.32470703125, 3.44671630859375, 3.5687255859375, 3.69073486328125, 3.812744140625, 3.93475341796875, 4.0567626953125, 4.17877197265625, 4.30078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 8.0, 5.0, 9.0, 7.0, 14.0, 15.0, 29.0, 30.0, 43.0, 82.0, 167.0, 239.0, 141.0, 52.0, 31.0, 19.0, 13.0, 8.0, 14.0, 13.0, 8.0, 10.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0008349418640136719, -0.000811360776424408, -0.000787779688835144, -0.0007641986012458801, -0.0007406175136566162, -0.0007170364260673523, -0.0006934553384780884, -0.0006698742508888245, -0.0006462931632995605, -0.0006227120757102966, -0.0005991309881210327, -0.0005755499005317688, -0.0005519688129425049, -0.000528387725353241, -0.000504806637763977, -0.00048122555017471313, -0.0004576444625854492, -0.0004340633749961853, -0.0004104822874069214, -0.00038690119981765747, -0.00036332011222839355, -0.00033973902463912964, -0.0003161579370498657, -0.0002925768494606018, -0.0002689957618713379, -0.000245414674282074, -0.00022183358669281006, -0.00019825249910354614, -0.00017467141151428223, -0.0001510903239250183, -0.0001275092363357544, -0.00010392814874649048, -8.034706115722656e-05, -5.6765973567962646e-05, -3.318488597869873e-05, -9.603798389434814e-06, 1.3977289199829102e-05, 3.755837678909302e-05, 6.113946437835693e-05, 8.472055196762085e-05, 0.00010830163955688477, 0.00013188272714614868, 0.0001554638147354126, 0.00017904490232467651, 0.00020262598991394043, 0.00022620707750320435, 0.00024978816509246826, 0.0002733692526817322, 0.0002969503402709961, 0.00032053142786026, 0.0003441125154495239, 0.00036769360303878784, 0.00039127469062805176, 0.0004148557782173157, 0.0004384368658065796, 0.0004620179533958435, 0.0004855990409851074, 0.0005091801285743713, 0.0005327612161636353, 0.0005563423037528992, 0.0005799233913421631, 0.000603504478931427, 0.0006270855665206909, 0.0006506666541099548, 0.0006742477416992188]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 16.0, 9.0, 16.0, 23.0, 33.0, 59.0, 85.0, 127.0, 222.0, 404.0, 701.0, 1485.0, 3397.0, 8511.0, 26750.0, 115740.0, 675975.0, 164022.0, 33264.0, 10199.0, 3962.0, 1667.0, 839.0, 468.0, 215.0, 136.0, 78.0, 47.0, 33.0, 25.0, 12.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.453125, -5.3040771484375, -5.155029296875, -5.0059814453125, -4.85693359375, -4.7078857421875, -4.558837890625, -4.4097900390625, -4.2607421875, -4.1116943359375, -3.962646484375, -3.8135986328125, -3.66455078125, -3.5155029296875, -3.366455078125, -3.2174072265625, -3.068359375, -2.9193115234375, -2.770263671875, -2.6212158203125, -2.47216796875, -2.3231201171875, -2.174072265625, -2.0250244140625, -1.8759765625, -1.7269287109375, -1.577880859375, -1.4288330078125, -1.27978515625, -1.1307373046875, -0.981689453125, -0.8326416015625, -0.68359375, -0.5345458984375, -0.385498046875, -0.2364501953125, -0.08740234375, 0.0616455078125, 0.210693359375, 0.3597412109375, 0.5087890625, 0.6578369140625, 0.806884765625, 0.9559326171875, 1.10498046875, 1.2540283203125, 1.403076171875, 1.5521240234375, 1.701171875, 1.8502197265625, 1.999267578125, 2.1483154296875, 2.29736328125, 2.4464111328125, 2.595458984375, 2.7445068359375, 2.8935546875, 3.0426025390625, 3.191650390625, 3.3406982421875, 3.48974609375, 3.6387939453125, 3.787841796875, 3.9368896484375, 4.0859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 4.0, 15.0, 13.0, 11.0, 16.0, 14.0, 22.0, 19.0, 42.0, 64.0, 85.0, 157.0, 159.0, 112.0, 64.0, 51.0, 38.0, 25.0, 16.0, 11.0, 9.0, 12.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.78125, -4.67291259765625, -4.5645751953125, -4.45623779296875, -4.347900390625, -4.23956298828125, -4.1312255859375, -4.02288818359375, -3.91455078125, -3.80621337890625, -3.6978759765625, -3.58953857421875, -3.481201171875, -3.37286376953125, -3.2645263671875, -3.15618896484375, -3.0478515625, -2.93951416015625, -2.8311767578125, -2.72283935546875, -2.614501953125, -2.50616455078125, -2.3978271484375, -2.28948974609375, -2.18115234375, -2.07281494140625, -1.9644775390625, -1.85614013671875, -1.747802734375, -1.63946533203125, -1.5311279296875, -1.42279052734375, -1.314453125, -1.20611572265625, -1.0977783203125, -0.98944091796875, -0.881103515625, -0.77276611328125, -0.6644287109375, -0.55609130859375, -0.44775390625, -0.33941650390625, -0.2310791015625, -0.12274169921875, -0.014404296875, 0.09393310546875, 0.2022705078125, 0.31060791015625, 0.4189453125, 0.52728271484375, 0.6356201171875, 0.74395751953125, 0.852294921875, 0.96063232421875, 1.0689697265625, 1.17730712890625, 1.28564453125, 1.39398193359375, 1.5023193359375, 1.61065673828125, 1.718994140625, 1.82733154296875, 1.9356689453125, 2.04400634765625, 2.15234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 18.0, 28.0, 71.0, 99.0, 131.0, 161.0, 164.0, 130.0, 79.0, 61.0, 26.0, 18.0, 5.0, 2.0, 8.0, 1.0, 0.0, 3.0], "bins": [-136.186767578125, -133.5499725341797, -130.91317749023438, -128.27639770507812, -125.63960266113281, -123.0028076171875, -120.36602020263672, -117.7292251586914, -115.09243774414062, -112.45564270019531, -109.81885528564453, -107.18206024169922, -104.54527282714844, -101.90847778320312, -99.27169036865234, -96.63489532470703, -93.99810028076172, -91.3613052368164, -88.72451782226562, -86.08772277832031, -83.45093536376953, -80.81414031982422, -78.17735290527344, -75.54055786132812, -72.90376281738281, -70.2669677734375, -67.63018035888672, -64.9933853149414, -62.356597900390625, -59.71980285644531, -57.083011627197266, -54.44622039794922, -51.80944061279297, -49.17264938354492, -46.535858154296875, -43.89906692504883, -41.26227569580078, -38.62548065185547, -35.98868942260742, -33.351898193359375, -30.715106964111328, -28.07831573486328, -25.441524505615234, -22.804731369018555, -20.167940139770508, -17.53114891052246, -14.894356727600098, -12.257564544677734, -9.620773315429688, -6.983981609344482, -4.347189903259277, -1.7103981971740723, 0.9263935089111328, 3.5631847381591797, 6.199976921081543, 8.836769104003906, 11.473560333251953, 14.1103515625, 16.747142791748047, 19.383935928344727, 22.020727157592773, 24.65751838684082, 27.2943115234375, 29.931102752685547, 32.567893981933594]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 8.0, 6.0, 11.0, 9.0, 7.0, 11.0, 14.0, 18.0, 19.0, 24.0, 15.0, 19.0, 32.0, 26.0, 33.0, 36.0, 36.0, 32.0, 33.0, 31.0, 43.0, 39.0, 41.0, 42.0, 54.0, 32.0, 27.0, 28.0, 20.0, 29.0, 34.0, 17.0, 25.0, 20.0, 23.0, 22.0, 18.0, 12.0, 4.0, 9.0, 11.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-24.20303726196289, -23.524555206298828, -22.846073150634766, -22.16758918762207, -21.489107131958008, -20.810625076293945, -20.13214111328125, -19.453659057617188, -18.775177001953125, -18.096694946289062, -17.418212890625, -16.739728927612305, -16.061246871948242, -15.38276481628418, -14.7042818069458, -14.025798797607422, -13.34731674194336, -12.668834686279297, -11.990351676940918, -11.311868667602539, -10.633386611938477, -9.954904556274414, -9.276421546936035, -8.597938537597656, -7.919456481933594, -7.240973949432373, -6.562491416931152, -5.884008884429932, -5.205526351928711, -4.52704381942749, -3.8485612869262695, -3.170078754425049, -2.491596221923828, -1.8131136894226074, -1.1346311569213867, -0.456148624420166, 0.2223339080810547, 0.9008164405822754, 1.579298973083496, 2.257781505584717, 2.9362640380859375, 3.614746570587158, 4.293229103088379, 4.9717116355896, 5.65019416809082, 6.328676700592041, 7.007159233093262, 7.685641765594482, 8.364124298095703, 9.042606353759766, 9.721089363098145, 10.399572372436523, 11.078054428100586, 11.756536483764648, 12.435019493103027, 13.113502502441406, 13.791984558105469, 14.470466613769531, 15.14894962310791, 15.827432632446289, 16.50591468811035, 17.184396743774414, 17.86288070678711, 18.541362762451172, 19.219844818115234]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 1.0, 5.0, 3.0, 6.0, 14.0, 12.0, 23.0, 35.0, 37.0, 76.0, 106.0, 169.0, 244.0, 433.0, 798.0, 1679.0, 3759.0, 9630.0, 30748.0, 159512.0, 3787412.0, 152582.0, 29735.0, 9737.0, 3701.0, 1731.0, 854.0, 438.0, 285.0, 166.0, 105.0, 91.0, 52.0, 29.0, 21.0, 15.0, 12.0, 3.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.625, -17.12841796875, -16.6318359375, -16.13525390625, -15.638671875, -15.14208984375, -14.6455078125, -14.14892578125, -13.65234375, -13.15576171875, -12.6591796875, -12.16259765625, -11.666015625, -11.16943359375, -10.6728515625, -10.17626953125, -9.6796875, -9.18310546875, -8.6865234375, -8.18994140625, -7.693359375, -7.19677734375, -6.7001953125, -6.20361328125, -5.70703125, -5.21044921875, -4.7138671875, -4.21728515625, -3.720703125, -3.22412109375, -2.7275390625, -2.23095703125, -1.734375, -1.23779296875, -0.7412109375, -0.24462890625, 0.251953125, 0.74853515625, 1.2451171875, 1.74169921875, 2.23828125, 2.73486328125, 3.2314453125, 3.72802734375, 4.224609375, 4.72119140625, 5.2177734375, 5.71435546875, 6.2109375, 6.70751953125, 7.2041015625, 7.70068359375, 8.197265625, 8.69384765625, 9.1904296875, 9.68701171875, 10.18359375, 10.68017578125, 11.1767578125, 11.67333984375, 12.169921875, 12.66650390625, 13.1630859375, 13.65966796875, 14.15625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 7.0, 11.0, 11.0, 15.0, 24.0, 25.0, 37.0, 38.0, 40.0, 57.0, 51.0, 55.0, 66.0, 38.0, 39.0, 69.0, 51.0, 52.0, 55.0, 49.0, 34.0, 36.0, 23.0, 24.0, 21.0, 14.0, 14.0, 8.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.3532562255859375, -1.310028076171875, -1.2667999267578125, -1.22357177734375, -1.1803436279296875, -1.137115478515625, -1.0938873291015625, -1.0506591796875, -1.0074310302734375, -0.964202880859375, -0.9209747314453125, -0.87774658203125, -0.8345184326171875, -0.791290283203125, -0.7480621337890625, -0.704833984375, -0.6616058349609375, -0.618377685546875, -0.5751495361328125, -0.53192138671875, -0.4886932373046875, -0.445465087890625, -0.4022369384765625, -0.3590087890625, -0.3157806396484375, -0.272552490234375, -0.2293243408203125, -0.18609619140625, -0.1428680419921875, -0.099639892578125, -0.0564117431640625, -0.01318359375, 0.0300445556640625, 0.073272705078125, 0.1165008544921875, 0.15972900390625, 0.2029571533203125, 0.246185302734375, 0.2894134521484375, 0.3326416015625, 0.3758697509765625, 0.419097900390625, 0.4623260498046875, 0.50555419921875, 0.5487823486328125, 0.592010498046875, 0.6352386474609375, 0.678466796875, 0.7216949462890625, 0.764923095703125, 0.8081512451171875, 0.85137939453125, 0.8946075439453125, 0.937835693359375, 0.9810638427734375, 1.0242919921875, 1.0675201416015625, 1.110748291015625, 1.1539764404296875, 1.19720458984375, 1.2404327392578125, 1.283660888671875, 1.3268890380859375, 1.3701171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 13.0, 14.0, 9.0, 36.0, 32.0, 48.0, 60.0, 100.0, 123.0, 190.0, 302.0, 432.0, 696.0, 1138.0, 1804.0, 3065.0, 5525.0, 9897.0, 19648.0, 42348.0, 114987.0, 979766.0, 2783438.0, 135292.0, 48041.0, 21556.0, 11066.0, 5810.0, 3266.0, 2008.0, 1283.0, 745.0, 504.0, 320.0, 213.0, 158.0, 99.0, 67.0, 63.0, 35.0, 27.0, 15.0, 11.0, 10.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 6.0], "bins": [-9.7265625, -9.432373046875, -9.13818359375, -8.843994140625, -8.5498046875, -8.255615234375, -7.96142578125, -7.667236328125, -7.373046875, -7.078857421875, -6.78466796875, -6.490478515625, -6.1962890625, -5.902099609375, -5.60791015625, -5.313720703125, -5.01953125, -4.725341796875, -4.43115234375, -4.136962890625, -3.8427734375, -3.548583984375, -3.25439453125, -2.960205078125, -2.666015625, -2.371826171875, -2.07763671875, -1.783447265625, -1.4892578125, -1.195068359375, -0.90087890625, -0.606689453125, -0.3125, -0.018310546875, 0.27587890625, 0.570068359375, 0.8642578125, 1.158447265625, 1.45263671875, 1.746826171875, 2.041015625, 2.335205078125, 2.62939453125, 2.923583984375, 3.2177734375, 3.511962890625, 3.80615234375, 4.100341796875, 4.39453125, 4.688720703125, 4.98291015625, 5.277099609375, 5.5712890625, 5.865478515625, 6.15966796875, 6.453857421875, 6.748046875, 7.042236328125, 7.33642578125, 7.630615234375, 7.9248046875, 8.218994140625, 8.51318359375, 8.807373046875, 9.1015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 9.0, 17.0, 12.0, 20.0, 25.0, 34.0, 51.0, 50.0, 132.0, 238.0, 1075.0, 1662.0, 276.0, 139.0, 82.0, 62.0, 40.0, 37.0, 19.0, 16.0, 15.0, 11.0, 4.0, 11.0, 6.0, 9.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.5418701171875, -4.400146484375, -4.2584228515625, -4.11669921875, -3.9749755859375, -3.833251953125, -3.6915283203125, -3.5498046875, -3.4080810546875, -3.266357421875, -3.1246337890625, -2.98291015625, -2.8411865234375, -2.699462890625, -2.5577392578125, -2.416015625, -2.2742919921875, -2.132568359375, -1.9908447265625, -1.84912109375, -1.7073974609375, -1.565673828125, -1.4239501953125, -1.2822265625, -1.1405029296875, -0.998779296875, -0.8570556640625, -0.71533203125, -0.5736083984375, -0.431884765625, -0.2901611328125, -0.1484375, -0.0067138671875, 0.135009765625, 0.2767333984375, 0.41845703125, 0.5601806640625, 0.701904296875, 0.8436279296875, 0.9853515625, 1.1270751953125, 1.268798828125, 1.4105224609375, 1.55224609375, 1.6939697265625, 1.835693359375, 1.9774169921875, 2.119140625, 2.2608642578125, 2.402587890625, 2.5443115234375, 2.68603515625, 2.8277587890625, 2.969482421875, 3.1112060546875, 3.2529296875, 3.3946533203125, 3.536376953125, 3.6781005859375, 3.81982421875, 3.9615478515625, 4.103271484375, 4.2449951171875, 4.38671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 12.0, 23.0, 42.0, 81.0, 116.0, 172.0, 176.0, 138.0, 93.0, 54.0, 39.0, 23.0, 16.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.2130184173584, -20.912256240844727, -19.611492156982422, -18.31072998046875, -17.009967803955078, -15.709203720092773, -14.408441543579102, -13.107678413391113, -11.806915283203125, -10.506152153015137, -9.205389022827148, -7.904626846313477, -6.603863716125488, -5.3031005859375, -4.00233793258667, -2.70157527923584, -1.4008121490478516, -0.10004925727844238, 1.2007136344909668, 2.501476526260376, 3.802239418029785, 5.103002548217773, 6.4037652015686035, 7.704527854919434, 9.005290985107422, 10.30605411529541, 11.606817245483398, 12.90757942199707, 14.208342552185059, 15.509105682373047, 16.80986785888672, 18.11063003540039, 19.411392211914062, 20.712154388427734, 22.01291847229004, 23.31368064880371, 24.614444732666016, 25.915206909179688, 27.21596908569336, 28.51673126220703, 29.817495346069336, 31.118257522583008, 32.41902160644531, 33.719783782958984, 35.020545959472656, 36.321311950683594, 37.622074127197266, 38.92283630371094, 40.22359848022461, 41.52436065673828, 42.82512283325195, 44.12588882446289, 45.42665100097656, 46.727413177490234, 48.028175354003906, 49.32893753051758, 50.62969970703125, 51.93046188354492, 53.231224060058594, 54.53199005126953, 55.8327522277832, 57.133514404296875, 58.43427658081055, 59.73503875732422, 61.035804748535156]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 7.0, 6.0, 11.0, 22.0, 13.0, 26.0, 20.0, 21.0, 21.0, 26.0, 27.0, 39.0, 45.0, 50.0, 54.0, 51.0, 42.0, 31.0, 46.0, 41.0, 34.0, 30.0, 34.0, 30.0, 37.0, 32.0, 27.0, 26.0, 22.0, 21.0, 13.0, 16.0, 9.0, 8.0, 5.0, 10.0, 9.0, 7.0, 2.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.97231674194336, -14.526285171508789, -14.080252647399902, -13.634221076965332, -13.188188552856445, -12.742156982421875, -12.296125411987305, -11.850092887878418, -11.404060363769531, -10.958028793334961, -10.511996269226074, -10.065964698791504, -9.619932174682617, -9.173900604248047, -8.727869033813477, -8.28183650970459, -7.8358049392700195, -7.389772891998291, -6.9437408447265625, -6.497709274291992, -6.0516767501831055, -5.605645179748535, -5.159613132476807, -4.713581085205078, -4.26754903793335, -3.821516990661621, -3.3754849433898926, -2.929453134536743, -2.4834210872650146, -2.037389039993286, -1.5913572311401367, -1.1453251838684082, -0.6992921829223633, -0.25326019525527954, 0.1927717924118042, 0.6388037204742432, 1.0848357677459717, 1.5308678150177002, 1.9768996238708496, 2.422931671142578, 2.8689637184143066, 3.314995765686035, 3.7610278129577637, 4.207059860229492, 4.6530914306640625, 5.099123954772949, 5.5451555252075195, 5.991187572479248, 6.437219619750977, 6.883251667022705, 7.329283714294434, 7.775315284729004, 8.22134780883789, 8.667379379272461, 9.113410949707031, 9.559443473815918, 10.005475997924805, 10.451507568359375, 10.897540092468262, 11.343571662902832, 11.789604187011719, 12.235635757446289, 12.68166732788086, 13.127699851989746, 13.573731422424316]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 10.0, 16.0, 14.0, 31.0, 52.0, 73.0, 154.0, 208.0, 337.0, 607.0, 1043.0, 1993.0, 3610.0, 6637.0, 13217.0, 25861.0, 48757.0, 90531.0, 189430.0, 347180.0, 151792.0, 78876.0, 42092.0, 21859.0, 11219.0, 5834.0, 3106.0, 1696.0, 983.0, 527.0, 285.0, 193.0, 120.0, 74.0, 41.0, 22.0, 17.0, 18.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-8.5390625, -8.31658935546875, -8.0941162109375, -7.87164306640625, -7.649169921875, -7.42669677734375, -7.2042236328125, -6.98175048828125, -6.75927734375, -6.53680419921875, -6.3143310546875, -6.09185791015625, -5.869384765625, -5.64691162109375, -5.4244384765625, -5.20196533203125, -4.9794921875, -4.75701904296875, -4.5345458984375, -4.31207275390625, -4.089599609375, -3.86712646484375, -3.6446533203125, -3.42218017578125, -3.19970703125, -2.97723388671875, -2.7547607421875, -2.53228759765625, -2.309814453125, -2.08734130859375, -1.8648681640625, -1.64239501953125, -1.419921875, -1.19744873046875, -0.9749755859375, -0.75250244140625, -0.530029296875, -0.30755615234375, -0.0850830078125, 0.13739013671875, 0.35986328125, 0.58233642578125, 0.8048095703125, 1.02728271484375, 1.249755859375, 1.47222900390625, 1.6947021484375, 1.91717529296875, 2.1396484375, 2.36212158203125, 2.5845947265625, 2.80706787109375, 3.029541015625, 3.25201416015625, 3.4744873046875, 3.69696044921875, 3.91943359375, 4.14190673828125, 4.3643798828125, 4.58685302734375, 4.809326171875, 5.03179931640625, 5.2542724609375, 5.47674560546875, 5.69921875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 6.0, 8.0, 7.0, 9.0, 10.0, 14.0, 17.0, 25.0, 33.0, 21.0, 31.0, 46.0, 44.0, 53.0, 52.0, 45.0, 48.0, 52.0, 45.0, 50.0, 48.0, 36.0, 44.0, 30.0, 39.0, 29.0, 29.0, 28.0, 19.0, 11.0, 17.0, 8.0, 13.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3974609375, -1.354461669921875, -1.31146240234375, -1.268463134765625, -1.2254638671875, -1.182464599609375, -1.13946533203125, -1.096466064453125, -1.053466796875, -1.010467529296875, -0.96746826171875, -0.924468994140625, -0.8814697265625, -0.838470458984375, -0.79547119140625, -0.752471923828125, -0.70947265625, -0.666473388671875, -0.62347412109375, -0.580474853515625, -0.5374755859375, -0.494476318359375, -0.45147705078125, -0.408477783203125, -0.365478515625, -0.322479248046875, -0.27947998046875, -0.236480712890625, -0.1934814453125, -0.150482177734375, -0.10748291015625, -0.064483642578125, -0.021484375, 0.021514892578125, 0.06451416015625, 0.107513427734375, 0.1505126953125, 0.193511962890625, 0.23651123046875, 0.279510498046875, 0.322509765625, 0.365509033203125, 0.40850830078125, 0.451507568359375, 0.4945068359375, 0.537506103515625, 0.58050537109375, 0.623504638671875, 0.66650390625, 0.709503173828125, 0.75250244140625, 0.795501708984375, 0.8385009765625, 0.881500244140625, 0.92449951171875, 0.967498779296875, 1.010498046875, 1.053497314453125, 1.09649658203125, 1.139495849609375, 1.1824951171875, 1.225494384765625, 1.26849365234375, 1.311492919921875, 1.3544921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 11.0, 7.0, 9.0, 20.0, 27.0, 37.0, 67.0, 75.0, 111.0, 156.0, 264.0, 409.0, 743.0, 1652.0, 3876.0, 11240.0, 37345.0, 137102.0, 588433.0, 192244.0, 50549.0, 14931.0, 5067.0, 1927.0, 887.0, 512.0, 263.0, 162.0, 122.0, 89.0, 69.0, 40.0, 21.0, 25.0, 20.0, 10.0, 5.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0], "bins": [-15.2421875, -14.8370361328125, -14.431884765625, -14.0267333984375, -13.62158203125, -13.2164306640625, -12.811279296875, -12.4061279296875, -12.0009765625, -11.5958251953125, -11.190673828125, -10.7855224609375, -10.38037109375, -9.9752197265625, -9.570068359375, -9.1649169921875, -8.759765625, -8.3546142578125, -7.949462890625, -7.5443115234375, -7.13916015625, -6.7340087890625, -6.328857421875, -5.9237060546875, -5.5185546875, -5.1134033203125, -4.708251953125, -4.3031005859375, -3.89794921875, -3.4927978515625, -3.087646484375, -2.6824951171875, -2.27734375, -1.8721923828125, -1.467041015625, -1.0618896484375, -0.65673828125, -0.2515869140625, 0.153564453125, 0.5587158203125, 0.9638671875, 1.3690185546875, 1.774169921875, 2.1793212890625, 2.58447265625, 2.9896240234375, 3.394775390625, 3.7999267578125, 4.205078125, 4.6102294921875, 5.015380859375, 5.4205322265625, 5.82568359375, 6.2308349609375, 6.635986328125, 7.0411376953125, 7.4462890625, 7.8514404296875, 8.256591796875, 8.6617431640625, 9.06689453125, 9.4720458984375, 9.877197265625, 10.2823486328125, 10.6875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 9.0, 10.0, 20.0, 18.0, 32.0, 27.0, 34.0, 43.0, 42.0, 60.0, 41.0, 49.0, 51.0, 58.0, 65.0, 58.0, 50.0, 41.0, 46.0, 38.0, 35.0, 31.0, 19.0, 28.0, 12.0, 15.0, 11.0, 6.0, 10.0, 6.0, 3.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.8515625, -9.5963134765625, -9.341064453125, -9.0858154296875, -8.83056640625, -8.5753173828125, -8.320068359375, -8.0648193359375, -7.8095703125, -7.5543212890625, -7.299072265625, -7.0438232421875, -6.78857421875, -6.5333251953125, -6.278076171875, -6.0228271484375, -5.767578125, -5.5123291015625, -5.257080078125, -5.0018310546875, -4.74658203125, -4.4913330078125, -4.236083984375, -3.9808349609375, -3.7255859375, -3.4703369140625, -3.215087890625, -2.9598388671875, -2.70458984375, -2.4493408203125, -2.194091796875, -1.9388427734375, -1.68359375, -1.4283447265625, -1.173095703125, -0.9178466796875, -0.66259765625, -0.4073486328125, -0.152099609375, 0.1031494140625, 0.3583984375, 0.6136474609375, 0.868896484375, 1.1241455078125, 1.37939453125, 1.6346435546875, 1.889892578125, 2.1451416015625, 2.400390625, 2.6556396484375, 2.910888671875, 3.1661376953125, 3.42138671875, 3.6766357421875, 3.931884765625, 4.1871337890625, 4.4423828125, 4.6976318359375, 4.952880859375, 5.2081298828125, 5.46337890625, 5.7186279296875, 5.973876953125, 6.2291259765625, 6.484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 12.0, 13.0, 15.0, 29.0, 41.0, 41.0, 79.0, 97.0, 117.0, 172.0, 234.0, 300.0, 508.0, 696.0, 1154.0, 1995.0, 4098.0, 11513.0, 56021.0, 708039.0, 222164.0, 26733.0, 7101.0, 2888.0, 1510.0, 933.0, 594.0, 427.0, 288.0, 202.0, 160.0, 90.0, 63.0, 60.0, 32.0, 36.0, 17.0, 23.0, 13.0, 7.0, 8.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.828125, -10.4764404296875, -10.124755859375, -9.7730712890625, -9.42138671875, -9.0697021484375, -8.718017578125, -8.3663330078125, -8.0146484375, -7.6629638671875, -7.311279296875, -6.9595947265625, -6.60791015625, -6.2562255859375, -5.904541015625, -5.5528564453125, -5.201171875, -4.8494873046875, -4.497802734375, -4.1461181640625, -3.79443359375, -3.4427490234375, -3.091064453125, -2.7393798828125, -2.3876953125, -2.0360107421875, -1.684326171875, -1.3326416015625, -0.98095703125, -0.6292724609375, -0.277587890625, 0.0740966796875, 0.42578125, 0.7774658203125, 1.129150390625, 1.4808349609375, 1.83251953125, 2.1842041015625, 2.535888671875, 2.8875732421875, 3.2392578125, 3.5909423828125, 3.942626953125, 4.2943115234375, 4.64599609375, 4.9976806640625, 5.349365234375, 5.7010498046875, 6.052734375, 6.4044189453125, 6.756103515625, 7.1077880859375, 7.45947265625, 7.8111572265625, 8.162841796875, 8.5145263671875, 8.8662109375, 9.2178955078125, 9.569580078125, 9.9212646484375, 10.27294921875, 10.6246337890625, 10.976318359375, 11.3280029296875, 11.6796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 9.0, 8.0, 19.0, 33.0, 52.0, 135.0, 362.0, 185.0, 73.0, 61.0, 25.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025272369384765625, -0.002439051866531372, -0.0023508667945861816, -0.002262681722640991, -0.0021744966506958008, -0.0020863115787506104, -0.00199812650680542, -0.0019099414348602295, -0.001821756362915039, -0.0017335712909698486, -0.0016453862190246582, -0.0015572011470794678, -0.0014690160751342773, -0.001380831003189087, -0.0012926459312438965, -0.001204460859298706, -0.0011162757873535156, -0.0010280907154083252, -0.0009399056434631348, -0.0008517205715179443, -0.0007635354995727539, -0.0006753504276275635, -0.000587165355682373, -0.0004989802837371826, -0.0004107952117919922, -0.00032261013984680176, -0.00023442506790161133, -0.0001462399959564209, -5.805492401123047e-05, 3.013014793395996e-05, 0.00011831521987915039, 0.00020650029182434082, 0.00029468536376953125, 0.0003828704357147217, 0.0004710555076599121, 0.0005592405796051025, 0.000647425651550293, 0.0007356107234954834, 0.0008237957954406738, 0.0009119808673858643, 0.0010001659393310547, 0.0010883510112762451, 0.0011765360832214355, 0.001264721155166626, 0.0013529062271118164, 0.0014410912990570068, 0.0015292763710021973, 0.0016174614429473877, 0.0017056465148925781, 0.0017938315868377686, 0.001882016658782959, 0.0019702017307281494, 0.00205838680267334, 0.0021465718746185303, 0.0022347569465637207, 0.002322942018508911, 0.0024111270904541016, 0.002499312162399292, 0.0025874972343444824, 0.002675682306289673, 0.0027638673782348633, 0.0028520524501800537, 0.002940237522125244, 0.0030284225940704346, 0.003116607666015625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 9.0, 5.0, 6.0, 10.0, 9.0, 17.0, 22.0, 28.0, 55.0, 92.0, 215.0, 698.0, 2358.0, 13352.0, 757370.0, 262632.0, 8875.0, 1765.0, 552.0, 218.0, 92.0, 53.0, 30.0, 12.0, 15.0, 13.0, 9.0, 10.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.296875, -25.521240234375, -24.74560546875, -23.969970703125, -23.1943359375, -22.418701171875, -21.64306640625, -20.867431640625, -20.091796875, -19.316162109375, -18.54052734375, -17.764892578125, -16.9892578125, -16.213623046875, -15.43798828125, -14.662353515625, -13.88671875, -13.111083984375, -12.33544921875, -11.559814453125, -10.7841796875, -10.008544921875, -9.23291015625, -8.457275390625, -7.681640625, -6.906005859375, -6.13037109375, -5.354736328125, -4.5791015625, -3.803466796875, -3.02783203125, -2.252197265625, -1.4765625, -0.700927734375, 0.07470703125, 0.850341796875, 1.6259765625, 2.401611328125, 3.17724609375, 3.952880859375, 4.728515625, 5.504150390625, 6.27978515625, 7.055419921875, 7.8310546875, 8.606689453125, 9.38232421875, 10.157958984375, 10.93359375, 11.709228515625, 12.48486328125, 13.260498046875, 14.0361328125, 14.811767578125, 15.58740234375, 16.363037109375, 17.138671875, 17.914306640625, 18.68994140625, 19.465576171875, 20.2412109375, 21.016845703125, 21.79248046875, 22.568115234375, 23.34375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 9.0, 15.0, 22.0, 36.0, 77.0, 177.0, 285.0, 175.0, 74.0, 49.0, 27.0, 13.0, 9.0, 6.0, 5.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.411865234375, -10.00341796875, -9.594970703125, -9.1865234375, -8.778076171875, -8.36962890625, -7.961181640625, -7.552734375, -7.144287109375, -6.73583984375, -6.327392578125, -5.9189453125, -5.510498046875, -5.10205078125, -4.693603515625, -4.28515625, -3.876708984375, -3.46826171875, -3.059814453125, -2.6513671875, -2.242919921875, -1.83447265625, -1.426025390625, -1.017578125, -0.609130859375, -0.20068359375, 0.207763671875, 0.6162109375, 1.024658203125, 1.43310546875, 1.841552734375, 2.25, 2.658447265625, 3.06689453125, 3.475341796875, 3.8837890625, 4.292236328125, 4.70068359375, 5.109130859375, 5.517578125, 5.926025390625, 6.33447265625, 6.742919921875, 7.1513671875, 7.559814453125, 7.96826171875, 8.376708984375, 8.78515625, 9.193603515625, 9.60205078125, 10.010498046875, 10.4189453125, 10.827392578125, 11.23583984375, 11.644287109375, 12.052734375, 12.461181640625, 12.86962890625, 13.278076171875, 13.6865234375, 14.094970703125, 14.50341796875, 14.911865234375, 15.3203125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 18.0, 25.0, 65.0, 109.0, 166.0, 203.0, 179.0, 122.0, 59.0, 22.0, 18.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.86895751953125, -181.02865600585938, -176.18836975097656, -171.3480682373047, -166.5077667236328, -161.66748046875, -156.82717895507812, -151.98687744140625, -147.14657592773438, -142.3062744140625, -137.4659881591797, -132.6256866455078, -127.78538513183594, -122.9450912475586, -118.10479736328125, -113.26449584960938, -108.42420959472656, -103.58391571044922, -98.74361419677734, -93.9033203125, -89.06301879882812, -84.22272491455078, -79.38243103027344, -74.54212951660156, -69.70183563232422, -64.86154174804688, -60.021240234375, -55.180946350097656, -50.34064865112305, -45.50035095214844, -40.660057067871094, -35.819759368896484, -30.979454040527344, -26.139156341552734, -21.298860549926758, -16.45856475830078, -11.618267059326172, -6.7779693603515625, -1.937673568725586, 2.9026222229003906, 7.742919921875, 12.583216667175293, 17.423513412475586, 22.263809204101562, 27.104106903076172, 31.94440460205078, 36.784698486328125, 41.624996185302734, 46.465293884277344, 51.30559158325195, 56.14588928222656, 60.986183166503906, 65.82647705078125, 70.66677856445312, 75.50707244873047, 80.34736633300781, 85.18766784667969, 90.02796173095703, 94.8682632446289, 99.70855712890625, 104.54885864257812, 109.38915252685547, 114.22944641113281, 119.06974792480469, 123.91004180908203]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 4.0, 4.0, 11.0, 9.0, 12.0, 8.0, 10.0, 22.0, 14.0, 23.0, 22.0, 25.0, 34.0, 25.0, 30.0, 38.0, 31.0, 28.0, 46.0, 35.0, 34.0, 49.0, 49.0, 38.0, 32.0, 38.0, 40.0, 34.0, 30.0, 24.0, 27.0, 29.0, 23.0, 19.0, 14.0, 14.0, 14.0, 16.0, 10.0, 5.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53325653076172, -37.36638259887695, -36.19950485229492, -35.032630920410156, -33.86575698852539, -32.698883056640625, -31.532005310058594, -30.365131378173828, -29.19825553894043, -28.03137969970703, -26.864505767822266, -25.697629928588867, -24.53075408935547, -23.363880157470703, -22.197004318237305, -21.030128479003906, -19.86325454711914, -18.696378707885742, -17.529504776000977, -16.362628936767578, -15.195754051208496, -14.028879165649414, -12.862003326416016, -11.695128440856934, -10.528253555297852, -9.36137866973877, -8.194503784179688, -7.027627944946289, -5.860753059387207, -4.693878173828125, -3.5270028114318848, -2.3601274490356445, -1.1932525634765625, -0.026377439498901367, 1.1404976844787598, 2.307372808456421, 3.474247932434082, 4.641122817993164, 5.807998180389404, 6.9748735427856445, 8.141748428344727, 9.308623313903809, 10.47549819946289, 11.642374038696289, 12.809248924255371, 13.976123809814453, 15.142999649047852, 16.30987548828125, 17.476749420166016, 18.643625259399414, 19.81049919128418, 20.977375030517578, 22.144248962402344, 23.311124801635742, 24.47800064086914, 25.644874572753906, 26.811750411987305, 27.978626251220703, 29.14550018310547, 30.312376022338867, 31.479251861572266, 32.64612579345703, 33.8129997253418, 34.97987747192383, 36.146751403808594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 8.0, 7.0, 13.0, 7.0, 23.0, 27.0, 54.0, 78.0, 116.0, 194.0, 384.0, 674.0, 1224.0, 2544.0, 5669.0, 13806.0, 39844.0, 162406.0, 3528775.0, 345580.0, 59120.0, 19322.0, 7611.0, 3196.0, 1607.0, 836.0, 478.0, 261.0, 158.0, 87.0, 56.0, 30.0, 33.0, 18.0, 11.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.0625, -14.6151123046875, -14.167724609375, -13.7203369140625, -13.27294921875, -12.8255615234375, -12.378173828125, -11.9307861328125, -11.4833984375, -11.0360107421875, -10.588623046875, -10.1412353515625, -9.69384765625, -9.2464599609375, -8.799072265625, -8.3516845703125, -7.904296875, -7.4569091796875, -7.009521484375, -6.5621337890625, -6.11474609375, -5.6673583984375, -5.219970703125, -4.7725830078125, -4.3251953125, -3.8778076171875, -3.430419921875, -2.9830322265625, -2.53564453125, -2.0882568359375, -1.640869140625, -1.1934814453125, -0.74609375, -0.2987060546875, 0.148681640625, 0.5960693359375, 1.04345703125, 1.4908447265625, 1.938232421875, 2.3856201171875, 2.8330078125, 3.2803955078125, 3.727783203125, 4.1751708984375, 4.62255859375, 5.0699462890625, 5.517333984375, 5.9647216796875, 6.412109375, 6.8594970703125, 7.306884765625, 7.7542724609375, 8.20166015625, 8.6490478515625, 9.096435546875, 9.5438232421875, 9.9912109375, 10.4385986328125, 10.885986328125, 11.3333740234375, 11.78076171875, 12.2281494140625, 12.675537109375, 13.1229248046875, 13.5703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 11.0, 14.0, 16.0, 17.0, 24.0, 29.0, 33.0, 37.0, 36.0, 38.0, 53.0, 49.0, 46.0, 54.0, 52.0, 51.0, 52.0, 51.0, 44.0, 47.0, 43.0, 32.0, 26.0, 21.0, 18.0, 20.0, 19.0, 11.0, 5.0, 10.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5654296875, -1.516937255859375, -1.46844482421875, -1.419952392578125, -1.3714599609375, -1.322967529296875, -1.27447509765625, -1.225982666015625, -1.177490234375, -1.128997802734375, -1.08050537109375, -1.032012939453125, -0.9835205078125, -0.935028076171875, -0.88653564453125, -0.838043212890625, -0.78955078125, -0.741058349609375, -0.69256591796875, -0.644073486328125, -0.5955810546875, -0.547088623046875, -0.49859619140625, -0.450103759765625, -0.401611328125, -0.353118896484375, -0.30462646484375, -0.256134033203125, -0.2076416015625, -0.159149169921875, -0.11065673828125, -0.062164306640625, -0.013671875, 0.034820556640625, 0.08331298828125, 0.131805419921875, 0.1802978515625, 0.228790283203125, 0.27728271484375, 0.325775146484375, 0.374267578125, 0.422760009765625, 0.47125244140625, 0.519744873046875, 0.5682373046875, 0.616729736328125, 0.66522216796875, 0.713714599609375, 0.76220703125, 0.810699462890625, 0.85919189453125, 0.907684326171875, 0.9561767578125, 1.004669189453125, 1.05316162109375, 1.101654052734375, 1.150146484375, 1.198638916015625, 1.24713134765625, 1.295623779296875, 1.3441162109375, 1.392608642578125, 1.44110107421875, 1.489593505859375, 1.5380859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 16.0, 16.0, 37.0, 31.0, 61.0, 104.0, 155.0, 219.0, 334.0, 568.0, 958.0, 1698.0, 2909.0, 5416.0, 10904.0, 23295.0, 53066.0, 144473.0, 1127845.0, 2542687.0, 168663.0, 59920.0, 25387.0, 11885.0, 5956.0, 3138.0, 1822.0, 1057.0, 577.0, 368.0, 222.0, 156.0, 91.0, 72.0, 52.0, 36.0, 17.0, 11.0, 15.0, 10.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-11.984375, -11.642578125, -11.30078125, -10.958984375, -10.6171875, -10.275390625, -9.93359375, -9.591796875, -9.25, -8.908203125, -8.56640625, -8.224609375, -7.8828125, -7.541015625, -7.19921875, -6.857421875, -6.515625, -6.173828125, -5.83203125, -5.490234375, -5.1484375, -4.806640625, -4.46484375, -4.123046875, -3.78125, -3.439453125, -3.09765625, -2.755859375, -2.4140625, -2.072265625, -1.73046875, -1.388671875, -1.046875, -0.705078125, -0.36328125, -0.021484375, 0.3203125, 0.662109375, 1.00390625, 1.345703125, 1.6875, 2.029296875, 2.37109375, 2.712890625, 3.0546875, 3.396484375, 3.73828125, 4.080078125, 4.421875, 4.763671875, 5.10546875, 5.447265625, 5.7890625, 6.130859375, 6.47265625, 6.814453125, 7.15625, 7.498046875, 7.83984375, 8.181640625, 8.5234375, 8.865234375, 9.20703125, 9.548828125, 9.890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 1.0, 8.0, 8.0, 14.0, 11.0, 12.0, 31.0, 34.0, 43.0, 61.0, 67.0, 102.0, 202.0, 387.0, 1674.0, 650.0, 274.0, 120.0, 76.0, 65.0, 50.0, 24.0, 31.0, 27.0, 21.0, 12.0, 19.0, 11.0, 5.0, 6.0, 7.0, 1.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.359375, -6.17620849609375, -5.9930419921875, -5.80987548828125, -5.626708984375, -5.44354248046875, -5.2603759765625, -5.07720947265625, -4.89404296875, -4.71087646484375, -4.5277099609375, -4.34454345703125, -4.161376953125, -3.97821044921875, -3.7950439453125, -3.61187744140625, -3.4287109375, -3.24554443359375, -3.0623779296875, -2.87921142578125, -2.696044921875, -2.51287841796875, -2.3297119140625, -2.14654541015625, -1.96337890625, -1.78021240234375, -1.5970458984375, -1.41387939453125, -1.230712890625, -1.04754638671875, -0.8643798828125, -0.68121337890625, -0.498046875, -0.31488037109375, -0.1317138671875, 0.05145263671875, 0.234619140625, 0.41778564453125, 0.6009521484375, 0.78411865234375, 0.96728515625, 1.15045166015625, 1.3336181640625, 1.51678466796875, 1.699951171875, 1.88311767578125, 2.0662841796875, 2.24945068359375, 2.4326171875, 2.61578369140625, 2.7989501953125, 2.98211669921875, 3.165283203125, 3.34844970703125, 3.5316162109375, 3.71478271484375, 3.89794921875, 4.08111572265625, 4.2642822265625, 4.44744873046875, 4.630615234375, 4.81378173828125, 4.9969482421875, 5.18011474609375, 5.36328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 20.0, 32.0, 84.0, 151.0, 212.0, 208.0, 152.0, 90.0, 36.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-122.77835083007812, -120.00119018554688, -117.22402954101562, -114.44686889648438, -111.66970825195312, -108.8925552368164, -106.11539459228516, -103.3382339477539, -100.56107330322266, -97.7839126586914, -95.00675201416016, -92.2295913696289, -89.45243835449219, -86.67527770996094, -83.89811706542969, -81.12095642089844, -78.34379577636719, -75.56663513183594, -72.78947448730469, -70.01231384277344, -67.23515319824219, -64.45800018310547, -61.68083953857422, -58.90367889404297, -56.12651824951172, -53.34935760498047, -50.57219696044922, -47.795040130615234, -45.017879486083984, -42.240718841552734, -39.46356201171875, -36.6864013671875, -33.90924072265625, -31.132080078125, -28.354921340942383, -25.577762603759766, -22.800601959228516, -20.023441314697266, -17.24628257751465, -14.469123840332031, -11.691963195800781, -8.914803504943848, -6.137643814086914, -3.3604841232299805, -0.5833244323730469, 2.1938352584838867, 4.97099494934082, 7.7481536865234375, 10.525314331054688, 13.302474021911621, 16.079633712768555, 18.856792449951172, 21.633953094482422, 24.411113739013672, 27.18827247619629, 29.965431213378906, 32.742591857910156, 35.519752502441406, 38.296913146972656, 41.07406997680664, 43.85123062133789, 46.62839126586914, 49.405548095703125, 52.182708740234375, 54.959869384765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 10.0, 6.0, 10.0, 11.0, 15.0, 18.0, 26.0, 25.0, 22.0, 18.0, 38.0, 39.0, 40.0, 41.0, 37.0, 38.0, 48.0, 51.0, 43.0, 42.0, 45.0, 41.0, 43.0, 38.0, 52.0, 27.0, 25.0, 24.0, 22.0, 20.0, 19.0, 15.0, 13.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.268680572509766, -23.513999938964844, -22.759321212768555, -22.004640579223633, -21.24995994567871, -20.49527931213379, -19.7406005859375, -18.985919952392578, -18.231239318847656, -17.476558685302734, -16.721879959106445, -15.967199325561523, -15.212518692016602, -14.457839012145996, -13.70315933227539, -12.948478698730469, -12.193799018859863, -11.439119338989258, -10.684438705444336, -9.92975902557373, -9.175078392028809, -8.420398712158203, -7.6657185554504395, -6.911038398742676, -6.156358242034912, -5.401678085327148, -4.646997928619385, -3.8923180103302, -3.1376378536224365, -2.382957696914673, -1.6282777786254883, -0.8735976219177246, -0.11891746520996094, 0.635762631893158, 1.3904427289962769, 2.145122766494751, 2.8998029232025146, 3.6544830799102783, 4.409162998199463, 5.163843154907227, 5.91852331161499, 6.673203468322754, 7.427883625030518, 8.182563781738281, 8.937243461608887, 9.691924095153809, 10.446603775024414, 11.201284408569336, 11.955964088439941, 12.710643768310547, 13.465324401855469, 14.220004081726074, 14.974684715270996, 15.729364395141602, 16.484045028686523, 17.238723754882812, 17.993404388427734, 18.748085021972656, 19.502763748168945, 20.257444381713867, 21.01212501525879, 21.76680564880371, 22.521484375, 23.276165008544922, 24.030845642089844]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 16.0, 25.0, 23.0, 51.0, 79.0, 129.0, 221.0, 369.0, 687.0, 1279.0, 2672.0, 5598.0, 11881.0, 26006.0, 60384.0, 137693.0, 266633.0, 273028.0, 145722.0, 64082.0, 27734.0, 12473.0, 5744.0, 2843.0, 1421.0, 743.0, 392.0, 231.0, 120.0, 81.0, 56.0, 50.0, 18.0, 17.0, 20.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296875, -8.029541015625, -7.76220703125, -7.494873046875, -7.2275390625, -6.960205078125, -6.69287109375, -6.425537109375, -6.158203125, -5.890869140625, -5.62353515625, -5.356201171875, -5.0888671875, -4.821533203125, -4.55419921875, -4.286865234375, -4.01953125, -3.752197265625, -3.48486328125, -3.217529296875, -2.9501953125, -2.682861328125, -2.41552734375, -2.148193359375, -1.880859375, -1.613525390625, -1.34619140625, -1.078857421875, -0.8115234375, -0.544189453125, -0.27685546875, -0.009521484375, 0.2578125, 0.525146484375, 0.79248046875, 1.059814453125, 1.3271484375, 1.594482421875, 1.86181640625, 2.129150390625, 2.396484375, 2.663818359375, 2.93115234375, 3.198486328125, 3.4658203125, 3.733154296875, 4.00048828125, 4.267822265625, 4.53515625, 4.802490234375, 5.06982421875, 5.337158203125, 5.6044921875, 5.871826171875, 6.13916015625, 6.406494140625, 6.673828125, 6.941162109375, 7.20849609375, 7.475830078125, 7.7431640625, 8.010498046875, 8.27783203125, 8.545166015625, 8.8125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 8.0, 3.0, 8.0, 9.0, 9.0, 11.0, 21.0, 10.0, 19.0, 20.0, 37.0, 26.0, 27.0, 35.0, 35.0, 46.0, 46.0, 47.0, 43.0, 46.0, 49.0, 43.0, 44.0, 49.0, 35.0, 43.0, 41.0, 26.0, 22.0, 34.0, 23.0, 14.0, 15.0, 13.0, 5.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.62109375, -1.569854736328125, -1.51861572265625, -1.467376708984375, -1.4161376953125, -1.364898681640625, -1.31365966796875, -1.262420654296875, -1.211181640625, -1.159942626953125, -1.10870361328125, -1.057464599609375, -1.0062255859375, -0.954986572265625, -0.90374755859375, -0.852508544921875, -0.80126953125, -0.750030517578125, -0.69879150390625, -0.647552490234375, -0.5963134765625, -0.545074462890625, -0.49383544921875, -0.442596435546875, -0.391357421875, -0.340118408203125, -0.28887939453125, -0.237640380859375, -0.1864013671875, -0.135162353515625, -0.08392333984375, -0.032684326171875, 0.0185546875, 0.069793701171875, 0.12103271484375, 0.172271728515625, 0.2235107421875, 0.274749755859375, 0.32598876953125, 0.377227783203125, 0.428466796875, 0.479705810546875, 0.53094482421875, 0.582183837890625, 0.6334228515625, 0.684661865234375, 0.73590087890625, 0.787139892578125, 0.83837890625, 0.889617919921875, 0.94085693359375, 0.992095947265625, 1.0433349609375, 1.094573974609375, 1.14581298828125, 1.197052001953125, 1.248291015625, 1.299530029296875, 1.35076904296875, 1.402008056640625, 1.4532470703125, 1.504486083984375, 1.55572509765625, 1.606964111328125, 1.658203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 11.0, 13.0, 13.0, 16.0, 25.0, 30.0, 54.0, 72.0, 112.0, 165.0, 273.0, 459.0, 806.0, 1743.0, 4450.0, 14842.0, 64193.0, 330001.0, 488251.0, 108784.0, 22949.0, 6458.0, 2243.0, 1055.0, 565.0, 316.0, 178.0, 132.0, 102.0, 67.0, 48.0, 36.0, 21.0, 18.0, 16.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.546875, -17.0616455078125, -16.576416015625, -16.0911865234375, -15.60595703125, -15.1207275390625, -14.635498046875, -14.1502685546875, -13.6650390625, -13.1798095703125, -12.694580078125, -12.2093505859375, -11.72412109375, -11.2388916015625, -10.753662109375, -10.2684326171875, -9.783203125, -9.2979736328125, -8.812744140625, -8.3275146484375, -7.84228515625, -7.3570556640625, -6.871826171875, -6.3865966796875, -5.9013671875, -5.4161376953125, -4.930908203125, -4.4456787109375, -3.96044921875, -3.4752197265625, -2.989990234375, -2.5047607421875, -2.01953125, -1.5343017578125, -1.049072265625, -0.5638427734375, -0.07861328125, 0.4066162109375, 0.891845703125, 1.3770751953125, 1.8623046875, 2.3475341796875, 2.832763671875, 3.3179931640625, 3.80322265625, 4.2884521484375, 4.773681640625, 5.2589111328125, 5.744140625, 6.2293701171875, 6.714599609375, 7.1998291015625, 7.68505859375, 8.1702880859375, 8.655517578125, 9.1407470703125, 9.6259765625, 10.1112060546875, 10.596435546875, 11.0816650390625, 11.56689453125, 12.0521240234375, 12.537353515625, 13.0225830078125, 13.5078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 5.0, 4.0, 3.0, 9.0, 12.0, 9.0, 13.0, 14.0, 15.0, 24.0, 18.0, 38.0, 23.0, 29.0, 28.0, 32.0, 37.0, 47.0, 33.0, 34.0, 44.0, 51.0, 34.0, 36.0, 43.0, 51.0, 39.0, 45.0, 39.0, 28.0, 19.0, 15.0, 15.0, 13.0, 17.0, 16.0, 13.0, 11.0, 6.0, 1.0, 10.0, 1.0, 11.0, 5.0, 5.0, 1.0, 4.0, 3.0], "bins": [-11.1328125, -10.8349609375, -10.537109375, -10.2392578125, -9.94140625, -9.6435546875, -9.345703125, -9.0478515625, -8.75, -8.4521484375, -8.154296875, -7.8564453125, -7.55859375, -7.2607421875, -6.962890625, -6.6650390625, -6.3671875, -6.0693359375, -5.771484375, -5.4736328125, -5.17578125, -4.8779296875, -4.580078125, -4.2822265625, -3.984375, -3.6865234375, -3.388671875, -3.0908203125, -2.79296875, -2.4951171875, -2.197265625, -1.8994140625, -1.6015625, -1.3037109375, -1.005859375, -0.7080078125, -0.41015625, -0.1123046875, 0.185546875, 0.4833984375, 0.78125, 1.0791015625, 1.376953125, 1.6748046875, 1.97265625, 2.2705078125, 2.568359375, 2.8662109375, 3.1640625, 3.4619140625, 3.759765625, 4.0576171875, 4.35546875, 4.6533203125, 4.951171875, 5.2490234375, 5.546875, 5.8447265625, 6.142578125, 6.4404296875, 6.73828125, 7.0361328125, 7.333984375, 7.6318359375, 7.9296875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 22.0, 33.0, 64.0, 83.0, 182.0, 309.0, 586.0, 1166.0, 2607.0, 6384.0, 17974.0, 59691.0, 257642.0, 518925.0, 129879.0, 34083.0, 10960.0, 4306.0, 1778.0, 835.0, 427.0, 251.0, 134.0, 78.0, 46.0, 36.0, 14.0, 13.0, 7.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6875, -8.4183349609375, -8.149169921875, -7.8800048828125, -7.61083984375, -7.3416748046875, -7.072509765625, -6.8033447265625, -6.5341796875, -6.2650146484375, -5.995849609375, -5.7266845703125, -5.45751953125, -5.1883544921875, -4.919189453125, -4.6500244140625, -4.380859375, -4.1116943359375, -3.842529296875, -3.5733642578125, -3.30419921875, -3.0350341796875, -2.765869140625, -2.4967041015625, -2.2275390625, -1.9583740234375, -1.689208984375, -1.4200439453125, -1.15087890625, -0.8817138671875, -0.612548828125, -0.3433837890625, -0.07421875, 0.1949462890625, 0.464111328125, 0.7332763671875, 1.00244140625, 1.2716064453125, 1.540771484375, 1.8099365234375, 2.0791015625, 2.3482666015625, 2.617431640625, 2.8865966796875, 3.15576171875, 3.4249267578125, 3.694091796875, 3.9632568359375, 4.232421875, 4.5015869140625, 4.770751953125, 5.0399169921875, 5.30908203125, 5.5782470703125, 5.847412109375, 6.1165771484375, 6.3857421875, 6.6549072265625, 6.924072265625, 7.1932373046875, 7.46240234375, 7.7315673828125, 8.000732421875, 8.2698974609375, 8.5390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 5.0, 7.0, 12.0, 7.0, 25.0, 40.0, 45.0, 73.0, 92.0, 118.0, 122.0, 128.0, 99.0, 60.0, 45.0, 29.0, 23.0, 19.0, 9.0, 16.0, 5.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002079010009765625, -0.002024903893470764, -0.0019707977771759033, -0.0019166916608810425, -0.0018625855445861816, -0.0018084794282913208, -0.00175437331199646, -0.0017002671957015991, -0.0016461610794067383, -0.0015920549631118774, -0.0015379488468170166, -0.0014838427305221558, -0.001429736614227295, -0.001375630497932434, -0.0013215243816375732, -0.0012674182653427124, -0.0012133121490478516, -0.0011592060327529907, -0.0011050999164581299, -0.001050993800163269, -0.0009968876838684082, -0.0009427815675735474, -0.0008886754512786865, -0.0008345693349838257, -0.0007804632186889648, -0.000726357102394104, -0.0006722509860992432, -0.0006181448698043823, -0.0005640387535095215, -0.0005099326372146606, -0.0004558265209197998, -0.00040172040462493896, -0.0003476142883300781, -0.0002935081720352173, -0.00023940205574035645, -0.0001852959394454956, -0.00013118982315063477, -7.708370685577393e-05, -2.2977590560913086e-05, 3.1128525733947754e-05, 8.52346420288086e-05, 0.00013934075832366943, 0.00019344687461853027, 0.0002475529909133911, 0.00030165910720825195, 0.0003557652235031128, 0.00040987133979797363, 0.00046397745609283447, 0.0005180835723876953, 0.0005721896886825562, 0.000626295804977417, 0.0006804019212722778, 0.0007345080375671387, 0.0007886141538619995, 0.0008427202701568604, 0.0008968263864517212, 0.000950932502746582, 0.0010050386190414429, 0.0010591447353363037, 0.0011132508516311646, 0.0011673569679260254, 0.0012214630842208862, 0.001275569200515747, 0.001329675316810608, 0.0013837814331054688]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 12.0, 12.0, 17.0, 32.0, 55.0, 62.0, 96.0, 195.0, 387.0, 923.0, 2601.0, 9440.0, 53186.0, 566248.0, 367546.0, 36750.0, 7289.0, 2131.0, 830.0, 321.0, 154.0, 103.0, 59.0, 34.0, 25.0, 9.0, 10.0, 5.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6171875, -15.1822509765625, -14.747314453125, -14.3123779296875, -13.87744140625, -13.4425048828125, -13.007568359375, -12.5726318359375, -12.1376953125, -11.7027587890625, -11.267822265625, -10.8328857421875, -10.39794921875, -9.9630126953125, -9.528076171875, -9.0931396484375, -8.658203125, -8.2232666015625, -7.788330078125, -7.3533935546875, -6.91845703125, -6.4835205078125, -6.048583984375, -5.6136474609375, -5.1787109375, -4.7437744140625, -4.308837890625, -3.8739013671875, -3.43896484375, -3.0040283203125, -2.569091796875, -2.1341552734375, -1.69921875, -1.2642822265625, -0.829345703125, -0.3944091796875, 0.04052734375, 0.4754638671875, 0.910400390625, 1.3453369140625, 1.7802734375, 2.2152099609375, 2.650146484375, 3.0850830078125, 3.52001953125, 3.9549560546875, 4.389892578125, 4.8248291015625, 5.259765625, 5.6947021484375, 6.129638671875, 6.5645751953125, 6.99951171875, 7.4344482421875, 7.869384765625, 8.3043212890625, 8.7392578125, 9.1741943359375, 9.609130859375, 10.0440673828125, 10.47900390625, 10.9139404296875, 11.348876953125, 11.7838134765625, 12.21875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 11.0, 4.0, 8.0, 13.0, 22.0, 17.0, 27.0, 39.0, 45.0, 63.0, 72.0, 90.0, 110.0, 90.0, 108.0, 68.0, 55.0, 35.0, 30.0, 19.0, 15.0, 20.0, 15.0, 6.0, 8.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.015625, -9.763671875, -9.51171875, -9.259765625, -9.0078125, -8.755859375, -8.50390625, -8.251953125, -8.0, -7.748046875, -7.49609375, -7.244140625, -6.9921875, -6.740234375, -6.48828125, -6.236328125, -5.984375, -5.732421875, -5.48046875, -5.228515625, -4.9765625, -4.724609375, -4.47265625, -4.220703125, -3.96875, -3.716796875, -3.46484375, -3.212890625, -2.9609375, -2.708984375, -2.45703125, -2.205078125, -1.953125, -1.701171875, -1.44921875, -1.197265625, -0.9453125, -0.693359375, -0.44140625, -0.189453125, 0.0625, 0.314453125, 0.56640625, 0.818359375, 1.0703125, 1.322265625, 1.57421875, 1.826171875, 2.078125, 2.330078125, 2.58203125, 2.833984375, 3.0859375, 3.337890625, 3.58984375, 3.841796875, 4.09375, 4.345703125, 4.59765625, 4.849609375, 5.1015625, 5.353515625, 5.60546875, 5.857421875, 6.109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 27.0, 58.0, 102.0, 183.0, 226.0, 177.0, 120.0, 61.0, 29.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-287.4256591796875, -281.5179138183594, -275.61016845703125, -269.7024230957031, -263.794677734375, -257.886962890625, -251.97921752929688, -246.07147216796875, -240.16372680664062, -234.2559814453125, -228.34823608398438, -222.4405059814453, -216.5327606201172, -210.62501525878906, -204.71728515625, -198.80953979492188, -192.90179443359375, -186.99404907226562, -181.0863037109375, -175.17857360839844, -169.2708282470703, -163.3630828857422, -157.45535278320312, -151.547607421875, -145.63986206054688, -139.73211669921875, -133.82437133789062, -127.91664123535156, -122.00889587402344, -116.10115051269531, -110.19341278076172, -104.28567504882812, -98.37794494628906, -92.47019958496094, -86.56246185302734, -80.65472412109375, -74.74697875976562, -68.8392333984375, -62.931495666503906, -57.02375411987305, -51.11601257324219, -45.20827102661133, -39.30052947998047, -33.39278793334961, -27.48504638671875, -21.57730484008789, -15.669563293457031, -9.761821746826172, -3.8540802001953125, 2.053661346435547, 7.961402893066406, 13.869144439697266, 19.776885986328125, 25.684627532958984, 31.592369079589844, 37.5001106262207, 43.40785217285156, 49.31559371948242, 55.22333526611328, 61.13107681274414, 67.038818359375, 72.94656372070312, 78.85430145263672, 84.76203918457031, 90.66978454589844]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 9.0, 7.0, 12.0, 17.0, 13.0, 14.0, 18.0, 25.0, 28.0, 34.0, 36.0, 42.0, 45.0, 42.0, 50.0, 51.0, 63.0, 56.0, 49.0, 44.0, 49.0, 42.0, 29.0, 30.0, 30.0, 24.0, 29.0, 24.0, 16.0, 14.0, 14.0, 9.0, 13.0, 3.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.65349578857422, -49.78276062011719, -47.91202926635742, -46.04129409790039, -44.17055892944336, -42.299827575683594, -40.42909240722656, -38.55835723876953, -36.6876220703125, -34.81688690185547, -32.9461555480957, -31.075420379638672, -29.20468521118164, -27.333951950073242, -25.463218688964844, -23.592483520507812, -21.721750259399414, -19.851016998291016, -17.980281829833984, -16.109548568725586, -14.238813400268555, -12.368080139160156, -10.497345924377441, -8.626611709594727, -6.755877494812012, -4.885143280029297, -3.014409303665161, -1.1436753273010254, 0.7270588874816895, 2.597792625427246, 4.468526840209961, 6.339261054992676, 8.20999526977539, 10.080729484558105, 11.95146369934082, 13.822196960449219, 15.69293212890625, 17.56366539001465, 19.434398651123047, 21.305133819580078, 23.17586898803711, 25.046602249145508, 26.91733741760254, 28.788070678710938, 30.65880584716797, 32.529541015625, 34.400272369384766, 36.2710075378418, 38.14173889160156, 40.012474060058594, 41.88320541381836, 43.75394058227539, 45.62467575073242, 47.49540710449219, 49.36614227294922, 51.23687744140625, 53.10761260986328, 54.97834777832031, 56.84907913208008, 58.71981430053711, 60.59054946899414, 62.461280822753906, 64.33201599121094, 66.20275115966797, 68.073486328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 12.0, 14.0, 27.0, 29.0, 33.0, 54.0, 70.0, 117.0, 154.0, 260.0, 380.0, 639.0, 1248.0, 2376.0, 5934.0, 23211.0, 4053017.0, 88587.0, 10445.0, 3659.0, 1679.0, 830.0, 505.0, 278.0, 211.0, 151.0, 84.0, 59.0, 54.0, 38.0, 28.0, 22.0, 10.0, 10.0, 7.0, 5.0, 8.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.078125, -29.099853515625, -28.12158203125, -27.143310546875, -26.1650390625, -25.186767578125, -24.20849609375, -23.230224609375, -22.251953125, -21.273681640625, -20.29541015625, -19.317138671875, -18.3388671875, -17.360595703125, -16.38232421875, -15.404052734375, -14.42578125, -13.447509765625, -12.46923828125, -11.490966796875, -10.5126953125, -9.534423828125, -8.55615234375, -7.577880859375, -6.599609375, -5.621337890625, -4.64306640625, -3.664794921875, -2.6865234375, -1.708251953125, -0.72998046875, 0.248291015625, 1.2265625, 2.204833984375, 3.18310546875, 4.161376953125, 5.1396484375, 6.117919921875, 7.09619140625, 8.074462890625, 9.052734375, 10.031005859375, 11.00927734375, 11.987548828125, 12.9658203125, 13.944091796875, 14.92236328125, 15.900634765625, 16.87890625, 17.857177734375, 18.83544921875, 19.813720703125, 20.7919921875, 21.770263671875, 22.74853515625, 23.726806640625, 24.705078125, 25.683349609375, 26.66162109375, 27.639892578125, 28.6181640625, 29.596435546875, 30.57470703125, 31.552978515625, 32.53125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 4.0, 13.0, 8.0, 25.0, 15.0, 22.0, 32.0, 33.0, 41.0, 56.0, 47.0, 61.0, 47.0, 69.0, 55.0, 58.0, 40.0, 49.0, 40.0, 36.0, 45.0, 44.0, 23.0, 28.0, 24.0, 11.0, 15.0, 10.0, 5.0, 4.0, 5.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.8009033203125, -1.732666015625, -1.6644287109375, -1.59619140625, -1.5279541015625, -1.459716796875, -1.3914794921875, -1.3232421875, -1.2550048828125, -1.186767578125, -1.1185302734375, -1.05029296875, -0.9820556640625, -0.913818359375, -0.8455810546875, -0.77734375, -0.7091064453125, -0.640869140625, -0.5726318359375, -0.50439453125, -0.4361572265625, -0.367919921875, -0.2996826171875, -0.2314453125, -0.1632080078125, -0.094970703125, -0.0267333984375, 0.04150390625, 0.1097412109375, 0.177978515625, 0.2462158203125, 0.314453125, 0.3826904296875, 0.450927734375, 0.5191650390625, 0.58740234375, 0.6556396484375, 0.723876953125, 0.7921142578125, 0.8603515625, 0.9285888671875, 0.996826171875, 1.0650634765625, 1.13330078125, 1.2015380859375, 1.269775390625, 1.3380126953125, 1.40625, 1.4744873046875, 1.542724609375, 1.6109619140625, 1.67919921875, 1.7474365234375, 1.815673828125, 1.8839111328125, 1.9521484375, 2.0203857421875, 2.088623046875, 2.1568603515625, 2.22509765625, 2.2933349609375, 2.361572265625, 2.4298095703125, 2.498046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 11.0, 19.0, 31.0, 44.0, 51.0, 84.0, 124.0, 143.0, 210.0, 336.0, 523.0, 878.0, 1643.0, 3235.0, 7603.0, 24859.0, 3926160.0, 198346.0, 17572.0, 6042.0, 2643.0, 1335.0, 786.0, 492.0, 326.0, 210.0, 138.0, 114.0, 63.0, 58.0, 51.0, 41.0, 18.0, 14.0, 18.0, 10.0, 5.0, 11.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-30.203125, -29.337158203125, -28.47119140625, -27.605224609375, -26.7392578125, -25.873291015625, -25.00732421875, -24.141357421875, -23.275390625, -22.409423828125, -21.54345703125, -20.677490234375, -19.8115234375, -18.945556640625, -18.07958984375, -17.213623046875, -16.34765625, -15.481689453125, -14.61572265625, -13.749755859375, -12.8837890625, -12.017822265625, -11.15185546875, -10.285888671875, -9.419921875, -8.553955078125, -7.68798828125, -6.822021484375, -5.9560546875, -5.090087890625, -4.22412109375, -3.358154296875, -2.4921875, -1.626220703125, -0.76025390625, 0.105712890625, 0.9716796875, 1.837646484375, 2.70361328125, 3.569580078125, 4.435546875, 5.301513671875, 6.16748046875, 7.033447265625, 7.8994140625, 8.765380859375, 9.63134765625, 10.497314453125, 11.36328125, 12.229248046875, 13.09521484375, 13.961181640625, 14.8271484375, 15.693115234375, 16.55908203125, 17.425048828125, 18.291015625, 19.156982421875, 20.02294921875, 20.888916015625, 21.7548828125, 22.620849609375, 23.48681640625, 24.352783203125, 25.21875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 18.0, 23.0, 38.0, 102.0, 3291.0, 393.0, 76.0, 34.0, 12.0, 12.0, 12.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.705535888671875, -2.56927490234375, -2.433013916015625, -2.2967529296875, -2.160491943359375, -2.02423095703125, -1.887969970703125, -1.751708984375, -1.615447998046875, -1.47918701171875, -1.342926025390625, -1.2066650390625, -1.070404052734375, -0.93414306640625, -0.797882080078125, -0.66162109375, -0.525360107421875, -0.38909912109375, -0.252838134765625, -0.1165771484375, 0.019683837890625, 0.15594482421875, 0.292205810546875, 0.428466796875, 0.564727783203125, 0.70098876953125, 0.837249755859375, 0.9735107421875, 1.109771728515625, 1.24603271484375, 1.382293701171875, 1.5185546875, 1.654815673828125, 1.79107666015625, 1.927337646484375, 2.0635986328125, 2.199859619140625, 2.33612060546875, 2.472381591796875, 2.608642578125, 2.744903564453125, 2.88116455078125, 3.017425537109375, 3.1536865234375, 3.289947509765625, 3.42620849609375, 3.562469482421875, 3.69873046875, 3.834991455078125, 3.97125244140625, 4.107513427734375, 4.2437744140625, 4.380035400390625, 4.51629638671875, 4.652557373046875, 4.788818359375, 4.925079345703125, 5.06134033203125, 5.197601318359375, 5.3338623046875, 5.470123291015625, 5.60638427734375, 5.742645263671875, 5.87890625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 10.0, 13.0, 17.0, 21.0, 54.0, 62.0, 63.0, 90.0, 116.0, 136.0, 112.0, 97.0, 59.0, 47.0, 30.0, 20.0, 11.0, 8.0, 12.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.826491355895996, -9.228620529174805, -8.630749702453613, -8.032878875732422, -7.4350080490112305, -6.837137222290039, -6.239266395568848, -5.641395568847656, -5.043524742126465, -4.445653915405273, -3.847783088684082, -3.2499122619628906, -2.652041435241699, -2.054170608520508, -1.4562997817993164, -0.858428955078125, -0.2605581283569336, 0.3373126983642578, 0.9351835250854492, 1.5330543518066406, 2.130925178527832, 2.7287960052490234, 3.326666831970215, 3.9245376586914062, 4.522408485412598, 5.120279312133789, 5.7181501388549805, 6.316020965576172, 6.913891792297363, 7.511762619018555, 8.109633445739746, 8.707504272460938, 9.305376052856445, 9.903246879577637, 10.501117706298828, 11.09898853302002, 11.696859359741211, 12.294730186462402, 12.892601013183594, 13.490471839904785, 14.088342666625977, 14.686213493347168, 15.28408432006836, 15.88195514678955, 16.479825973510742, 17.07769775390625, 17.675567626953125, 18.2734375, 18.871309280395508, 19.469181060791016, 20.06705093383789, 20.664920806884766, 21.262792587280273, 21.86066436767578, 22.458534240722656, 23.05640411376953, 23.65427589416504, 24.252147674560547, 24.850017547607422, 25.447887420654297, 26.045759201049805, 26.643630981445312, 27.241500854492188, 27.839370727539062, 28.43724250793457]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 6.0, 5.0, 6.0, 5.0, 9.0, 7.0, 10.0, 12.0, 21.0, 29.0, 19.0, 28.0, 21.0, 31.0, 34.0, 29.0, 26.0, 40.0, 33.0, 32.0, 31.0, 46.0, 38.0, 44.0, 30.0, 40.0, 35.0, 29.0, 37.0, 31.0, 37.0, 25.0, 24.0, 23.0, 25.0, 21.0, 12.0, 16.0, 8.0, 10.0, 7.0, 5.0, 2.0, 6.0, 9.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.383594036102295, -7.132969856262207, -6.882345676422119, -6.631721496582031, -6.381097316741943, -6.1304731369018555, -5.879849433898926, -5.62922477722168, -5.37860107421875, -5.127976894378662, -4.877352714538574, -4.626728534698486, -4.376104354858398, -4.1254801750183105, -3.8748562335968018, -3.624232053756714, -3.373607635498047, -3.122983455657959, -2.872359275817871, -2.621735095977783, -2.3711109161376953, -2.1204867362976074, -1.8698627948760986, -1.6192386150360107, -1.3686144351959229, -1.117990255355835, -0.8673661351203918, -0.6167420148849487, -0.36611783504486084, -0.11549365520477295, 0.1351304054260254, 0.3857545852661133, 0.6363792419433594, 0.8870034217834473, 1.1376276016235352, 1.3882516622543335, 1.6388758420944214, 1.8895000219345093, 2.1401240825653076, 2.3907482624053955, 2.6413724422454834, 2.8919966220855713, 3.142620801925659, 3.393244743347168, 3.643868923187256, 3.8944931030273438, 4.145117282867432, 4.3957414627075195, 4.646365642547607, 4.896989822387695, 5.147614002227783, 5.398238182067871, 5.648862361907959, 5.899486541748047, 6.150110244750977, 6.400734901428223, 6.651358604431152, 6.90198278427124, 7.152606964111328, 7.403231143951416, 7.653855323791504, 7.904479503631592, 8.15510368347168, 8.40572738647461, 8.656352043151855]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 4.0, 9.0, 10.0, 11.0, 19.0, 20.0, 36.0, 66.0, 68.0, 111.0, 162.0, 228.0, 370.0, 582.0, 932.0, 1556.0, 2587.0, 4560.0, 8495.0, 15484.0, 28458.0, 53576.0, 96642.0, 163111.0, 218337.0, 188897.0, 119030.0, 66169.0, 35688.0, 19112.0, 10220.0, 5798.0, 3243.0, 1822.0, 1136.0, 713.0, 469.0, 273.0, 177.0, 110.0, 100.0, 56.0, 35.0, 21.0, 17.0, 14.0, 6.0, 8.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-7.234375, -7.01300048828125, -6.7916259765625, -6.57025146484375, -6.348876953125, -6.12750244140625, -5.9061279296875, -5.68475341796875, -5.46337890625, -5.24200439453125, -5.0206298828125, -4.79925537109375, -4.577880859375, -4.35650634765625, -4.1351318359375, -3.91375732421875, -3.6923828125, -3.47100830078125, -3.2496337890625, -3.02825927734375, -2.806884765625, -2.58551025390625, -2.3641357421875, -2.14276123046875, -1.92138671875, -1.70001220703125, -1.4786376953125, -1.25726318359375, -1.035888671875, -0.81451416015625, -0.5931396484375, -0.37176513671875, -0.150390625, 0.07098388671875, 0.2923583984375, 0.51373291015625, 0.735107421875, 0.95648193359375, 1.1778564453125, 1.39923095703125, 1.62060546875, 1.84197998046875, 2.0633544921875, 2.28472900390625, 2.506103515625, 2.72747802734375, 2.9488525390625, 3.17022705078125, 3.3916015625, 3.61297607421875, 3.8343505859375, 4.05572509765625, 4.277099609375, 4.49847412109375, 4.7198486328125, 4.94122314453125, 5.16259765625, 5.38397216796875, 5.6053466796875, 5.82672119140625, 6.048095703125, 6.26947021484375, 6.4908447265625, 6.71221923828125, 6.93359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 3.0, 9.0, 3.0, 9.0, 11.0, 8.0, 18.0, 13.0, 21.0, 20.0, 19.0, 30.0, 34.0, 34.0, 30.0, 50.0, 55.0, 56.0, 51.0, 54.0, 51.0, 60.0, 45.0, 37.0, 33.0, 35.0, 30.0, 27.0, 32.0, 21.0, 18.0, 19.0, 13.0, 8.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.743408203125, -1.67236328125, -1.601318359375, -1.5302734375, -1.459228515625, -1.38818359375, -1.317138671875, -1.24609375, -1.175048828125, -1.10400390625, -1.032958984375, -0.9619140625, -0.890869140625, -0.81982421875, -0.748779296875, -0.677734375, -0.606689453125, -0.53564453125, -0.464599609375, -0.3935546875, -0.322509765625, -0.25146484375, -0.180419921875, -0.109375, -0.038330078125, 0.03271484375, 0.103759765625, 0.1748046875, 0.245849609375, 0.31689453125, 0.387939453125, 0.458984375, 0.530029296875, 0.60107421875, 0.672119140625, 0.7431640625, 0.814208984375, 0.88525390625, 0.956298828125, 1.02734375, 1.098388671875, 1.16943359375, 1.240478515625, 1.3115234375, 1.382568359375, 1.45361328125, 1.524658203125, 1.595703125, 1.666748046875, 1.73779296875, 1.808837890625, 1.8798828125, 1.950927734375, 2.02197265625, 2.093017578125, 2.1640625, 2.235107421875, 2.30615234375, 2.377197265625, 2.4482421875, 2.519287109375, 2.59033203125, 2.661376953125, 2.732421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 10.0, 8.0, 13.0, 26.0, 23.0, 24.0, 36.0, 61.0, 72.0, 145.0, 181.0, 297.0, 434.0, 712.0, 1316.0, 2593.0, 6465.0, 21644.0, 104127.0, 517360.0, 313755.0, 56804.0, 13355.0, 4431.0, 1937.0, 959.0, 591.0, 365.0, 247.0, 177.0, 109.0, 76.0, 57.0, 42.0, 30.0, 23.0, 17.0, 7.0, 8.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.265625, -15.75439453125, -15.2431640625, -14.73193359375, -14.220703125, -13.70947265625, -13.1982421875, -12.68701171875, -12.17578125, -11.66455078125, -11.1533203125, -10.64208984375, -10.130859375, -9.61962890625, -9.1083984375, -8.59716796875, -8.0859375, -7.57470703125, -7.0634765625, -6.55224609375, -6.041015625, -5.52978515625, -5.0185546875, -4.50732421875, -3.99609375, -3.48486328125, -2.9736328125, -2.46240234375, -1.951171875, -1.43994140625, -0.9287109375, -0.41748046875, 0.09375, 0.60498046875, 1.1162109375, 1.62744140625, 2.138671875, 2.64990234375, 3.1611328125, 3.67236328125, 4.18359375, 4.69482421875, 5.2060546875, 5.71728515625, 6.228515625, 6.73974609375, 7.2509765625, 7.76220703125, 8.2734375, 8.78466796875, 9.2958984375, 9.80712890625, 10.318359375, 10.82958984375, 11.3408203125, 11.85205078125, 12.36328125, 12.87451171875, 13.3857421875, 13.89697265625, 14.408203125, 14.91943359375, 15.4306640625, 15.94189453125, 16.453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 4.0, 15.0, 11.0, 6.0, 10.0, 17.0, 22.0, 22.0, 16.0, 35.0, 37.0, 29.0, 32.0, 36.0, 29.0, 40.0, 47.0, 40.0, 39.0, 43.0, 39.0, 41.0, 37.0, 33.0, 30.0, 41.0, 27.0, 22.0, 29.0, 19.0, 24.0, 18.0, 12.0, 16.0, 17.0, 10.0, 10.0, 5.0, 6.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-11.8671875, -11.5084228515625, -11.149658203125, -10.7908935546875, -10.43212890625, -10.0733642578125, -9.714599609375, -9.3558349609375, -8.9970703125, -8.6383056640625, -8.279541015625, -7.9207763671875, -7.56201171875, -7.2032470703125, -6.844482421875, -6.4857177734375, -6.126953125, -5.7681884765625, -5.409423828125, -5.0506591796875, -4.69189453125, -4.3331298828125, -3.974365234375, -3.6156005859375, -3.2568359375, -2.8980712890625, -2.539306640625, -2.1805419921875, -1.82177734375, -1.4630126953125, -1.104248046875, -0.7454833984375, -0.38671875, -0.0279541015625, 0.330810546875, 0.6895751953125, 1.04833984375, 1.4071044921875, 1.765869140625, 2.1246337890625, 2.4833984375, 2.8421630859375, 3.200927734375, 3.5596923828125, 3.91845703125, 4.2772216796875, 4.635986328125, 4.9947509765625, 5.353515625, 5.7122802734375, 6.071044921875, 6.4298095703125, 6.78857421875, 7.1473388671875, 7.506103515625, 7.8648681640625, 8.2236328125, 8.5823974609375, 8.941162109375, 9.2999267578125, 9.65869140625, 10.0174560546875, 10.376220703125, 10.7349853515625, 11.09375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 3.0, 11.0, 12.0, 10.0, 16.0, 22.0, 33.0, 43.0, 56.0, 87.0, 109.0, 149.0, 243.0, 385.0, 611.0, 1147.0, 2016.0, 4284.0, 11387.0, 39507.0, 211641.0, 604302.0, 129065.0, 27121.0, 8723.0, 3428.0, 1689.0, 869.0, 485.0, 326.0, 233.0, 134.0, 108.0, 77.0, 47.0, 45.0, 33.0, 25.0, 19.0, 12.0, 7.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0], "bins": [-9.7109375, -9.44390869140625, -9.1768798828125, -8.90985107421875, -8.642822265625, -8.37579345703125, -8.1087646484375, -7.84173583984375, -7.57470703125, -7.30767822265625, -7.0406494140625, -6.77362060546875, -6.506591796875, -6.23956298828125, -5.9725341796875, -5.70550537109375, -5.4384765625, -5.17144775390625, -4.9044189453125, -4.63739013671875, -4.370361328125, -4.10333251953125, -3.8363037109375, -3.56927490234375, -3.30224609375, -3.03521728515625, -2.7681884765625, -2.50115966796875, -2.234130859375, -1.96710205078125, -1.7000732421875, -1.43304443359375, -1.166015625, -0.89898681640625, -0.6319580078125, -0.36492919921875, -0.097900390625, 0.16912841796875, 0.4361572265625, 0.70318603515625, 0.97021484375, 1.23724365234375, 1.5042724609375, 1.77130126953125, 2.038330078125, 2.30535888671875, 2.5723876953125, 2.83941650390625, 3.1064453125, 3.37347412109375, 3.6405029296875, 3.90753173828125, 4.174560546875, 4.44158935546875, 4.7086181640625, 4.97564697265625, 5.24267578125, 5.50970458984375, 5.7767333984375, 6.04376220703125, 6.310791015625, 6.57781982421875, 6.8448486328125, 7.11187744140625, 7.37890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 11.0, 23.0, 24.0, 35.0, 45.0, 52.0, 75.0, 90.0, 115.0, 130.0, 108.0, 78.0, 60.0, 42.0, 42.0, 26.0, 12.0, 12.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015039443969726562, -0.0014586597681045532, -0.0014133751392364502, -0.0013680905103683472, -0.0013228058815002441, -0.0012775212526321411, -0.001232236623764038, -0.001186951994895935, -0.001141667366027832, -0.001096382737159729, -0.001051098108291626, -0.001005813479423523, -0.0009605288505554199, -0.0009152442216873169, -0.0008699595928192139, -0.0008246749639511108, -0.0007793903350830078, -0.0007341057062149048, -0.0006888210773468018, -0.0006435364484786987, -0.0005982518196105957, -0.0005529671907424927, -0.0005076825618743896, -0.0004623979330062866, -0.0004171133041381836, -0.00037182867527008057, -0.00032654404640197754, -0.0002812594175338745, -0.00023597478866577148, -0.00019069015979766846, -0.00014540553092956543, -0.0001001209020614624, -5.4836273193359375e-05, -9.551644325256348e-06, 3.573298454284668e-05, 8.101761341094971e-05, 0.00012630224227905273, 0.00017158687114715576, 0.0002168715000152588, 0.0002621561288833618, 0.00030744075775146484, 0.00035272538661956787, 0.0003980100154876709, 0.0004432946443557739, 0.000488579273223877, 0.00053386390209198, 0.000579148530960083, 0.000624433159828186, 0.0006697177886962891, 0.0007150024175643921, 0.0007602870464324951, 0.0008055716753005981, 0.0008508563041687012, 0.0008961409330368042, 0.0009414255619049072, 0.0009867101907730103, 0.0010319948196411133, 0.0010772794485092163, 0.0011225640773773193, 0.0011678487062454224, 0.0012131333351135254, 0.0012584179639816284, 0.0013037025928497314, 0.0013489872217178345, 0.0013942718505859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 11.0, 12.0, 31.0, 42.0, 96.0, 177.0, 530.0, 2153.0, 22318.0, 928238.0, 89409.0, 4239.0, 782.0, 280.0, 103.0, 64.0, 31.0, 21.0, 11.0, 6.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.4375, -26.622802734375, -25.80810546875, -24.993408203125, -24.1787109375, -23.364013671875, -22.54931640625, -21.734619140625, -20.919921875, -20.105224609375, -19.29052734375, -18.475830078125, -17.6611328125, -16.846435546875, -16.03173828125, -15.217041015625, -14.40234375, -13.587646484375, -12.77294921875, -11.958251953125, -11.1435546875, -10.328857421875, -9.51416015625, -8.699462890625, -7.884765625, -7.070068359375, -6.25537109375, -5.440673828125, -4.6259765625, -3.811279296875, -2.99658203125, -2.181884765625, -1.3671875, -0.552490234375, 0.26220703125, 1.076904296875, 1.8916015625, 2.706298828125, 3.52099609375, 4.335693359375, 5.150390625, 5.965087890625, 6.77978515625, 7.594482421875, 8.4091796875, 9.223876953125, 10.03857421875, 10.853271484375, 11.66796875, 12.482666015625, 13.29736328125, 14.112060546875, 14.9267578125, 15.741455078125, 16.55615234375, 17.370849609375, 18.185546875, 19.000244140625, 19.81494140625, 20.629638671875, 21.4443359375, 22.259033203125, 23.07373046875, 23.888427734375, 24.703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 9.0, 12.0, 20.0, 53.0, 54.0, 109.0, 166.0, 174.0, 145.0, 92.0, 60.0, 34.0, 20.0, 18.0, 10.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.25390625, -6.78289794921875, -6.3118896484375, -5.84088134765625, -5.369873046875, -4.89886474609375, -4.4278564453125, -3.95684814453125, -3.48583984375, -3.01483154296875, -2.5438232421875, -2.07281494140625, -1.601806640625, -1.13079833984375, -0.6597900390625, -0.18878173828125, 0.2822265625, 0.75323486328125, 1.2242431640625, 1.69525146484375, 2.166259765625, 2.63726806640625, 3.1082763671875, 3.57928466796875, 4.05029296875, 4.52130126953125, 4.9923095703125, 5.46331787109375, 5.934326171875, 6.40533447265625, 6.8763427734375, 7.34735107421875, 7.818359375, 8.28936767578125, 8.7603759765625, 9.23138427734375, 9.702392578125, 10.17340087890625, 10.6444091796875, 11.11541748046875, 11.58642578125, 12.05743408203125, 12.5284423828125, 12.99945068359375, 13.470458984375, 13.94146728515625, 14.4124755859375, 14.88348388671875, 15.3544921875, 15.82550048828125, 16.2965087890625, 16.76751708984375, 17.238525390625, 17.70953369140625, 18.1805419921875, 18.65155029296875, 19.12255859375, 19.59356689453125, 20.0645751953125, 20.53558349609375, 21.006591796875, 21.47760009765625, 21.9486083984375, 22.41961669921875, 22.890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 17.0, 9.0, 36.0, 45.0, 67.0, 98.0, 105.0, 137.0, 119.0, 104.0, 74.0, 62.0, 38.0, 24.0, 20.0, 14.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.69902038574219, -121.880126953125, -118.06123352050781, -114.24234008789062, -110.42344665527344, -106.60455322265625, -102.78565979003906, -98.96676635742188, -95.14787292480469, -91.3289794921875, -87.51008605957031, -83.69119262695312, -79.87229919433594, -76.05340576171875, -72.23451232910156, -68.41561889648438, -64.59672546386719, -60.77783203125, -56.95893859863281, -53.140045166015625, -49.32115173339844, -45.50225830078125, -41.68336486816406, -37.864471435546875, -34.04557800292969, -30.2266845703125, -26.407791137695312, -22.588897705078125, -18.770004272460938, -14.95111083984375, -11.132217407226562, -7.313323974609375, -3.4944229125976562, 0.32447052001953125, 4.143363952636719, 7.962257385253906, 11.781150817871094, 15.600044250488281, 19.41893768310547, 23.237831115722656, 27.056724548339844, 30.87561798095703, 34.69451141357422, 38.513404846191406, 42.332298278808594, 46.15119171142578, 49.97008514404297, 53.788978576660156, 57.607872009277344, 61.42676544189453, 65.24565887451172, 69.0645523071289, 72.8834457397461, 76.70233917236328, 80.52123260498047, 84.34012603759766, 88.15901947021484, 91.97791290283203, 95.79680633544922, 99.6156997680664, 103.4345932006836, 107.25348663330078, 111.07238006591797, 114.89127349853516, 118.71016693115234]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 6.0, 3.0, 4.0, 7.0, 9.0, 9.0, 7.0, 12.0, 14.0, 24.0, 14.0, 25.0, 23.0, 24.0, 35.0, 30.0, 46.0, 46.0, 54.0, 51.0, 52.0, 47.0, 49.0, 50.0, 60.0, 32.0, 37.0, 34.0, 30.0, 28.0, 30.0, 22.0, 18.0, 11.0, 16.0, 8.0, 8.0, 6.0, 8.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-77.9047622680664, -75.66313934326172, -73.4215087890625, -71.17988586425781, -68.93826293945312, -66.69664001464844, -64.45501708984375, -62.21338653564453, -59.971763610839844, -57.730140686035156, -55.4885139465332, -53.24688720703125, -51.00526428222656, -48.763641357421875, -46.52201461791992, -44.28038787841797, -42.03876495361328, -39.797142028808594, -37.55551528930664, -35.31388854980469, -33.072265625, -30.83064079284668, -28.58901596069336, -26.34739112854004, -24.10576629638672, -21.8641414642334, -19.622516632080078, -17.380891799926758, -15.139266967773438, -12.897642135620117, -10.656017303466797, -8.414392471313477, -6.172760009765625, -3.9311351776123047, -1.6895103454589844, 0.5521144866943359, 2.7937393188476562, 5.035364151000977, 7.276988983154297, 9.518613815307617, 11.760238647460938, 14.001863479614258, 16.243488311767578, 18.4851131439209, 20.72673797607422, 22.96836280822754, 25.20998764038086, 27.45161247253418, 29.6932373046875, 31.93486213684082, 34.17648696899414, 36.418113708496094, 38.65973663330078, 40.90135955810547, 43.14298629760742, 45.384613037109375, 47.62623596191406, 49.86785888671875, 52.1094856262207, 54.351112365722656, 56.592735290527344, 58.83435821533203, 61.075984954833984, 63.31761169433594, 65.55923461914062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 8.0, 19.0, 17.0, 27.0, 44.0, 40.0, 84.0, 88.0, 156.0, 206.0, 280.0, 529.0, 797.0, 1501.0, 3209.0, 8127.0, 32381.0, 3998565.0, 123072.0, 15095.0, 4938.0, 2109.0, 1118.0, 629.0, 396.0, 257.0, 167.0, 136.0, 78.0, 60.0, 38.0, 35.0, 22.0, 18.0, 4.0, 8.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.8125, -24.077392578125, -23.34228515625, -22.607177734375, -21.8720703125, -21.136962890625, -20.40185546875, -19.666748046875, -18.931640625, -18.196533203125, -17.46142578125, -16.726318359375, -15.9912109375, -15.256103515625, -14.52099609375, -13.785888671875, -13.05078125, -12.315673828125, -11.58056640625, -10.845458984375, -10.1103515625, -9.375244140625, -8.64013671875, -7.905029296875, -7.169921875, -6.434814453125, -5.69970703125, -4.964599609375, -4.2294921875, -3.494384765625, -2.75927734375, -2.024169921875, -1.2890625, -0.553955078125, 0.18115234375, 0.916259765625, 1.6513671875, 2.386474609375, 3.12158203125, 3.856689453125, 4.591796875, 5.326904296875, 6.06201171875, 6.797119140625, 7.5322265625, 8.267333984375, 9.00244140625, 9.737548828125, 10.47265625, 11.207763671875, 11.94287109375, 12.677978515625, 13.4130859375, 14.148193359375, 14.88330078125, 15.618408203125, 16.353515625, 17.088623046875, 17.82373046875, 18.558837890625, 19.2939453125, 20.029052734375, 20.76416015625, 21.499267578125, 22.234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 6.0, 0.0, 4.0, 2.0, 4.0, 9.0, 13.0, 20.0, 18.0, 15.0, 28.0, 33.0, 36.0, 38.0, 54.0, 63.0, 71.0, 64.0, 62.0, 58.0, 68.0, 61.0, 49.0, 46.0, 26.0, 34.0, 32.0, 19.0, 17.0, 20.0, 9.0, 7.0, 6.0, 6.0, 7.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88671875, -2.792327880859375, -2.69793701171875, -2.603546142578125, -2.5091552734375, -2.414764404296875, -2.32037353515625, -2.225982666015625, -2.131591796875, -2.037200927734375, -1.94281005859375, -1.848419189453125, -1.7540283203125, -1.659637451171875, -1.56524658203125, -1.470855712890625, -1.37646484375, -1.282073974609375, -1.18768310546875, -1.093292236328125, -0.9989013671875, -0.904510498046875, -0.81011962890625, -0.715728759765625, -0.621337890625, -0.526947021484375, -0.43255615234375, -0.338165283203125, -0.2437744140625, -0.149383544921875, -0.05499267578125, 0.039398193359375, 0.1337890625, 0.228179931640625, 0.32257080078125, 0.416961669921875, 0.5113525390625, 0.605743408203125, 0.70013427734375, 0.794525146484375, 0.888916015625, 0.983306884765625, 1.07769775390625, 1.172088623046875, 1.2664794921875, 1.360870361328125, 1.45526123046875, 1.549652099609375, 1.64404296875, 1.738433837890625, 1.83282470703125, 1.927215576171875, 2.0216064453125, 2.115997314453125, 2.21038818359375, 2.304779052734375, 2.399169921875, 2.493560791015625, 2.58795166015625, 2.682342529296875, 2.7767333984375, 2.871124267578125, 2.96551513671875, 3.059906005859375, 3.154296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 6.0, 10.0, 11.0, 23.0, 18.0, 25.0, 45.0, 47.0, 73.0, 119.0, 174.0, 314.0, 704.0, 1723.0, 5001.0, 19036.0, 3820440.0, 323559.0, 15543.0, 4461.0, 1468.0, 640.0, 293.0, 180.0, 89.0, 66.0, 67.0, 37.0, 22.0, 25.0, 18.0, 13.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -28.781005859375, -27.67138671875, -26.561767578125, -25.4521484375, -24.342529296875, -23.23291015625, -22.123291015625, -21.013671875, -19.904052734375, -18.79443359375, -17.684814453125, -16.5751953125, -15.465576171875, -14.35595703125, -13.246337890625, -12.13671875, -11.027099609375, -9.91748046875, -8.807861328125, -7.6982421875, -6.588623046875, -5.47900390625, -4.369384765625, -3.259765625, -2.150146484375, -1.04052734375, 0.069091796875, 1.1787109375, 2.288330078125, 3.39794921875, 4.507568359375, 5.6171875, 6.726806640625, 7.83642578125, 8.946044921875, 10.0556640625, 11.165283203125, 12.27490234375, 13.384521484375, 14.494140625, 15.603759765625, 16.71337890625, 17.822998046875, 18.9326171875, 20.042236328125, 21.15185546875, 22.261474609375, 23.37109375, 24.480712890625, 25.59033203125, 26.699951171875, 27.8095703125, 28.919189453125, 30.02880859375, 31.138427734375, 32.248046875, 33.357666015625, 34.46728515625, 35.576904296875, 36.6865234375, 37.796142578125, 38.90576171875, 40.015380859375, 41.125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 3.0, 2.0, 8.0, 5.0, 17.0, 16.0, 29.0, 72.0, 255.0, 3375.0, 160.0, 52.0, 21.0, 12.0, 7.0, 10.0, 7.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.497344970703125, -3.31695556640625, -3.136566162109375, -2.9561767578125, -2.775787353515625, -2.59539794921875, -2.415008544921875, -2.234619140625, -2.054229736328125, -1.87384033203125, -1.693450927734375, -1.5130615234375, -1.332672119140625, -1.15228271484375, -0.971893310546875, -0.79150390625, -0.611114501953125, -0.43072509765625, -0.250335693359375, -0.0699462890625, 0.110443115234375, 0.29083251953125, 0.471221923828125, 0.651611328125, 0.832000732421875, 1.01239013671875, 1.192779541015625, 1.3731689453125, 1.553558349609375, 1.73394775390625, 1.914337158203125, 2.0947265625, 2.275115966796875, 2.45550537109375, 2.635894775390625, 2.8162841796875, 2.996673583984375, 3.17706298828125, 3.357452392578125, 3.537841796875, 3.718231201171875, 3.89862060546875, 4.079010009765625, 4.2593994140625, 4.439788818359375, 4.62017822265625, 4.800567626953125, 4.98095703125, 5.161346435546875, 5.34173583984375, 5.522125244140625, 5.7025146484375, 5.882904052734375, 6.06329345703125, 6.243682861328125, 6.424072265625, 6.604461669921875, 6.78485107421875, 6.965240478515625, 7.1456298828125, 7.326019287109375, 7.50640869140625, 7.686798095703125, 7.8671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 11.0, 24.0, 31.0, 56.0, 132.0, 162.0, 194.0, 135.0, 106.0, 67.0, 35.0, 21.0, 8.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.16546630859375, -48.15174865722656, -47.138031005859375, -46.12431335449219, -45.110595703125, -44.09687805175781, -43.083160400390625, -42.06943893432617, -41.055721282958984, -40.0420036315918, -39.02828598022461, -38.01456832885742, -37.000850677490234, -35.98712921142578, -34.973411560058594, -33.959693908691406, -32.94597625732422, -31.93225860595703, -30.918540954589844, -29.904823303222656, -28.891103744506836, -27.87738609313965, -26.86366844177246, -25.849950790405273, -24.83623504638672, -23.82251739501953, -22.808799743652344, -21.795082092285156, -20.781362533569336, -19.76764488220215, -18.75392723083496, -17.740209579467773, -16.72648811340332, -15.712770462036133, -14.699051856994629, -13.685334205627441, -12.671615600585938, -11.65789794921875, -10.644180297851562, -9.630462646484375, -8.616744041442871, -7.603025913238525, -6.58930778503418, -5.575590133666992, -4.5618720054626465, -3.548153877258301, -2.5344362258911133, -1.5207180976867676, -0.5069999694824219, 0.5067180395126343, 1.5204360485076904, 2.534153938293457, 3.5478720664978027, 4.561590194702148, 5.575307846069336, 6.589025974273682, 7.602744102478027, 8.616461753845215, 9.630180358886719, 10.643898010253906, 11.657615661621094, 12.671334266662598, 13.685051918029785, 14.698770523071289, 15.712488174438477]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 2.0, 8.0, 13.0, 16.0, 16.0, 19.0, 24.0, 17.0, 24.0, 23.0, 34.0, 38.0, 42.0, 46.0, 55.0, 38.0, 52.0, 57.0, 37.0, 45.0, 40.0, 46.0, 42.0, 41.0, 44.0, 22.0, 28.0, 18.0, 21.0, 14.0, 16.0, 14.0, 13.0, 4.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.100080490112305, -11.745158195495605, -11.39023494720459, -11.03531265258789, -10.680389404296875, -10.325467109680176, -9.97054386138916, -9.615621566772461, -9.260698318481445, -8.905776023864746, -8.55085277557373, -8.195930480957031, -7.841007232666016, -7.486084461212158, -7.131161689758301, -6.776239395141602, -6.421316623687744, -6.066393852233887, -5.711471080780029, -5.356548309326172, -5.0016255378723145, -4.646702766418457, -4.291780471801758, -3.9368574619293213, -3.581934690475464, -3.2270119190216064, -2.872089147567749, -2.5171666145324707, -2.1622438430786133, -1.8073209524154663, -1.4523983001708984, -1.097475528717041, -0.7425527572631836, -0.38763001561164856, -0.032707273960113525, 0.3222154378890991, 0.6771382093429565, 1.032060980796814, 1.3869836330413818, 1.7419064044952393, 2.0968291759490967, 2.451751947402954, 2.8066747188568115, 3.16159725189209, 3.5165200233459473, 3.8714427947998047, 4.226365566253662, 4.5812883377075195, 4.936211109161377, 5.291133880615234, 5.646056652069092, 6.000979423522949, 6.355902194976807, 6.710824966430664, 7.065747261047363, 7.420670509338379, 7.775592803955078, 8.130515098571777, 8.485438346862793, 8.840360641479492, 9.195283889770508, 9.550206184387207, 9.905129432678223, 10.260051727294922, 10.614974975585938]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 13.0, 18.0, 30.0, 39.0, 55.0, 113.0, 205.0, 255.0, 448.0, 758.0, 1277.0, 2393.0, 4355.0, 8339.0, 16353.0, 31986.0, 63208.0, 119898.0, 198982.0, 233212.0, 169215.0, 95297.0, 49611.0, 25092.0, 12709.0, 6685.0, 3602.0, 1896.0, 1036.0, 581.0, 349.0, 192.0, 102.0, 109.0, 45.0, 30.0, 16.0, 19.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.759521484375, -4.59716796875, -4.434814453125, -4.2724609375, -4.110107421875, -3.94775390625, -3.785400390625, -3.623046875, -3.460693359375, -3.29833984375, -3.135986328125, -2.9736328125, -2.811279296875, -2.64892578125, -2.486572265625, -2.32421875, -2.161865234375, -1.99951171875, -1.837158203125, -1.6748046875, -1.512451171875, -1.35009765625, -1.187744140625, -1.025390625, -0.863037109375, -0.70068359375, -0.538330078125, -0.3759765625, -0.213623046875, -0.05126953125, 0.111083984375, 0.2734375, 0.435791015625, 0.59814453125, 0.760498046875, 0.9228515625, 1.085205078125, 1.24755859375, 1.409912109375, 1.572265625, 1.734619140625, 1.89697265625, 2.059326171875, 2.2216796875, 2.384033203125, 2.54638671875, 2.708740234375, 2.87109375, 3.033447265625, 3.19580078125, 3.358154296875, 3.5205078125, 3.682861328125, 3.84521484375, 4.007568359375, 4.169921875, 4.332275390625, 4.49462890625, 4.656982421875, 4.8193359375, 4.981689453125, 5.14404296875, 5.306396484375, 5.46875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 11.0, 9.0, 14.0, 22.0, 23.0, 28.0, 24.0, 23.0, 29.0, 42.0, 37.0, 58.0, 51.0, 53.0, 42.0, 61.0, 62.0, 54.0, 51.0, 37.0, 34.0, 45.0, 36.0, 31.0, 25.0, 12.0, 11.0, 18.0, 9.0, 10.0, 5.0, 7.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.68096923828125, -2.5885009765625, -2.49603271484375, -2.403564453125, -2.31109619140625, -2.2186279296875, -2.12615966796875, -2.03369140625, -1.94122314453125, -1.8487548828125, -1.75628662109375, -1.663818359375, -1.57135009765625, -1.4788818359375, -1.38641357421875, -1.2939453125, -1.20147705078125, -1.1090087890625, -1.01654052734375, -0.924072265625, -0.83160400390625, -0.7391357421875, -0.64666748046875, -0.55419921875, -0.46173095703125, -0.3692626953125, -0.27679443359375, -0.184326171875, -0.09185791015625, 0.0006103515625, 0.09307861328125, 0.185546875, 0.27801513671875, 0.3704833984375, 0.46295166015625, 0.555419921875, 0.64788818359375, 0.7403564453125, 0.83282470703125, 0.92529296875, 1.01776123046875, 1.1102294921875, 1.20269775390625, 1.295166015625, 1.38763427734375, 1.4801025390625, 1.57257080078125, 1.6650390625, 1.75750732421875, 1.8499755859375, 1.94244384765625, 2.034912109375, 2.12738037109375, 2.2198486328125, 2.31231689453125, 2.40478515625, 2.49725341796875, 2.5897216796875, 2.68218994140625, 2.774658203125, 2.86712646484375, 2.9595947265625, 3.05206298828125, 3.14453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 13.0, 12.0, 9.0, 21.0, 32.0, 48.0, 60.0, 112.0, 173.0, 235.0, 339.0, 609.0, 1048.0, 2119.0, 5957.0, 31297.0, 363780.0, 578898.0, 50151.0, 8071.0, 2563.0, 1169.0, 637.0, 373.0, 272.0, 178.0, 104.0, 76.0, 55.0, 36.0, 23.0, 27.0, 7.0, 14.0, 6.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.53125, -15.982177734375, -15.43310546875, -14.884033203125, -14.3349609375, -13.785888671875, -13.23681640625, -12.687744140625, -12.138671875, -11.589599609375, -11.04052734375, -10.491455078125, -9.9423828125, -9.393310546875, -8.84423828125, -8.295166015625, -7.74609375, -7.197021484375, -6.64794921875, -6.098876953125, -5.5498046875, -5.000732421875, -4.45166015625, -3.902587890625, -3.353515625, -2.804443359375, -2.25537109375, -1.706298828125, -1.1572265625, -0.608154296875, -0.05908203125, 0.489990234375, 1.0390625, 1.588134765625, 2.13720703125, 2.686279296875, 3.2353515625, 3.784423828125, 4.33349609375, 4.882568359375, 5.431640625, 5.980712890625, 6.52978515625, 7.078857421875, 7.6279296875, 8.177001953125, 8.72607421875, 9.275146484375, 9.82421875, 10.373291015625, 10.92236328125, 11.471435546875, 12.0205078125, 12.569580078125, 13.11865234375, 13.667724609375, 14.216796875, 14.765869140625, 15.31494140625, 15.864013671875, 16.4130859375, 16.962158203125, 17.51123046875, 18.060302734375, 18.609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 7.0, 3.0, 5.0, 16.0, 7.0, 12.0, 14.0, 20.0, 20.0, 20.0, 30.0, 26.0, 36.0, 34.0, 28.0, 33.0, 32.0, 56.0, 41.0, 39.0, 42.0, 45.0, 44.0, 32.0, 41.0, 43.0, 28.0, 29.0, 31.0, 23.0, 30.0, 17.0, 28.0, 17.0, 15.0, 15.0, 9.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.015625, -11.603515625, -11.19140625, -10.779296875, -10.3671875, -9.955078125, -9.54296875, -9.130859375, -8.71875, -8.306640625, -7.89453125, -7.482421875, -7.0703125, -6.658203125, -6.24609375, -5.833984375, -5.421875, -5.009765625, -4.59765625, -4.185546875, -3.7734375, -3.361328125, -2.94921875, -2.537109375, -2.125, -1.712890625, -1.30078125, -0.888671875, -0.4765625, -0.064453125, 0.34765625, 0.759765625, 1.171875, 1.583984375, 1.99609375, 2.408203125, 2.8203125, 3.232421875, 3.64453125, 4.056640625, 4.46875, 4.880859375, 5.29296875, 5.705078125, 6.1171875, 6.529296875, 6.94140625, 7.353515625, 7.765625, 8.177734375, 8.58984375, 9.001953125, 9.4140625, 9.826171875, 10.23828125, 10.650390625, 11.0625, 11.474609375, 11.88671875, 12.298828125, 12.7109375, 13.123046875, 13.53515625, 13.947265625, 14.359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 7.0, 13.0, 5.0, 19.0, 18.0, 29.0, 44.0, 53.0, 99.0, 170.0, 278.0, 550.0, 1127.0, 2860.0, 9426.0, 46238.0, 386406.0, 521744.0, 61785.0, 11686.0, 3359.0, 1238.0, 607.0, 293.0, 170.0, 120.0, 56.0, 67.0, 25.0, 21.0, 12.0, 3.0, 7.0, 2.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1328125, -9.83544921875, -9.5380859375, -9.24072265625, -8.943359375, -8.64599609375, -8.3486328125, -8.05126953125, -7.75390625, -7.45654296875, -7.1591796875, -6.86181640625, -6.564453125, -6.26708984375, -5.9697265625, -5.67236328125, -5.375, -5.07763671875, -4.7802734375, -4.48291015625, -4.185546875, -3.88818359375, -3.5908203125, -3.29345703125, -2.99609375, -2.69873046875, -2.4013671875, -2.10400390625, -1.806640625, -1.50927734375, -1.2119140625, -0.91455078125, -0.6171875, -0.31982421875, -0.0224609375, 0.27490234375, 0.572265625, 0.86962890625, 1.1669921875, 1.46435546875, 1.76171875, 2.05908203125, 2.3564453125, 2.65380859375, 2.951171875, 3.24853515625, 3.5458984375, 3.84326171875, 4.140625, 4.43798828125, 4.7353515625, 5.03271484375, 5.330078125, 5.62744140625, 5.9248046875, 6.22216796875, 6.51953125, 6.81689453125, 7.1142578125, 7.41162109375, 7.708984375, 8.00634765625, 8.3037109375, 8.60107421875, 8.8984375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 3.0, 4.0, 10.0, 12.0, 12.0, 20.0, 25.0, 33.0, 49.0, 79.0, 67.0, 99.0, 117.0, 101.0, 81.0, 62.0, 54.0, 43.0, 30.0, 29.0, 14.0, 10.0, 13.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009937286376953125, -0.000957876443862915, -0.0009220242500305176, -0.0008861720561981201, -0.0008503198623657227, -0.0008144676685333252, -0.0007786154747009277, -0.0007427632808685303, -0.0007069110870361328, -0.0006710588932037354, -0.0006352066993713379, -0.0005993545055389404, -0.000563502311706543, -0.0005276501178741455, -0.000491797924041748, -0.0004559457302093506, -0.0004200935363769531, -0.00038424134254455566, -0.0003483891487121582, -0.00031253695487976074, -0.0002766847610473633, -0.00024083256721496582, -0.00020498037338256836, -0.0001691281795501709, -0.00013327598571777344, -9.742379188537598e-05, -6.157159805297852e-05, -2.5719404220581055e-05, 1.0132789611816406e-05, 4.598498344421387e-05, 8.183717727661133e-05, 0.00011768937110900879, 0.00015354156494140625, 0.0001893937587738037, 0.00022524595260620117, 0.00026109814643859863, 0.0002969503402709961, 0.00033280253410339355, 0.000368654727935791, 0.0004045069217681885, 0.00044035911560058594, 0.0004762113094329834, 0.0005120635032653809, 0.0005479156970977783, 0.0005837678909301758, 0.0006196200847625732, 0.0006554722785949707, 0.0006913244724273682, 0.0007271766662597656, 0.0007630288600921631, 0.0007988810539245605, 0.000834733247756958, 0.0008705854415893555, 0.0009064376354217529, 0.0009422898292541504, 0.0009781420230865479, 0.0010139942169189453, 0.0010498464107513428, 0.0010856986045837402, 0.0011215507984161377, 0.0011574029922485352, 0.0011932551860809326, 0.00122910737991333, 0.0012649595737457275, 0.001300811767578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 7.0, 8.0, 8.0, 16.0, 19.0, 45.0, 63.0, 103.0, 182.0, 371.0, 764.0, 1629.0, 4406.0, 17517.0, 130527.0, 717269.0, 148655.0, 18766.0, 4757.0, 1772.0, 800.0, 354.0, 185.0, 115.0, 65.0, 37.0, 29.0, 28.0, 9.0, 17.0, 7.0, 5.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.671875, -12.324951171875, -11.97802734375, -11.631103515625, -11.2841796875, -10.937255859375, -10.59033203125, -10.243408203125, -9.896484375, -9.549560546875, -9.20263671875, -8.855712890625, -8.5087890625, -8.161865234375, -7.81494140625, -7.468017578125, -7.12109375, -6.774169921875, -6.42724609375, -6.080322265625, -5.7333984375, -5.386474609375, -5.03955078125, -4.692626953125, -4.345703125, -3.998779296875, -3.65185546875, -3.304931640625, -2.9580078125, -2.611083984375, -2.26416015625, -1.917236328125, -1.5703125, -1.223388671875, -0.87646484375, -0.529541015625, -0.1826171875, 0.164306640625, 0.51123046875, 0.858154296875, 1.205078125, 1.552001953125, 1.89892578125, 2.245849609375, 2.5927734375, 2.939697265625, 3.28662109375, 3.633544921875, 3.98046875, 4.327392578125, 4.67431640625, 5.021240234375, 5.3681640625, 5.715087890625, 6.06201171875, 6.408935546875, 6.755859375, 7.102783203125, 7.44970703125, 7.796630859375, 8.1435546875, 8.490478515625, 8.83740234375, 9.184326171875, 9.53125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 10.0, 15.0, 17.0, 17.0, 14.0, 34.0, 52.0, 39.0, 59.0, 63.0, 78.0, 64.0, 81.0, 79.0, 86.0, 52.0, 55.0, 41.0, 33.0, 20.0, 25.0, 17.0, 11.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.25, -8.02850341796875, -7.8070068359375, -7.58551025390625, -7.364013671875, -7.14251708984375, -6.9210205078125, -6.69952392578125, -6.47802734375, -6.25653076171875, -6.0350341796875, -5.81353759765625, -5.592041015625, -5.37054443359375, -5.1490478515625, -4.92755126953125, -4.7060546875, -4.48455810546875, -4.2630615234375, -4.04156494140625, -3.820068359375, -3.59857177734375, -3.3770751953125, -3.15557861328125, -2.93408203125, -2.71258544921875, -2.4910888671875, -2.26959228515625, -2.048095703125, -1.82659912109375, -1.6051025390625, -1.38360595703125, -1.162109375, -0.94061279296875, -0.7191162109375, -0.49761962890625, -0.276123046875, -0.05462646484375, 0.1668701171875, 0.38836669921875, 0.60986328125, 0.83135986328125, 1.0528564453125, 1.27435302734375, 1.495849609375, 1.71734619140625, 1.9388427734375, 2.16033935546875, 2.3818359375, 2.60333251953125, 2.8248291015625, 3.04632568359375, 3.267822265625, 3.48931884765625, 3.7108154296875, 3.93231201171875, 4.15380859375, 4.37530517578125, 4.5968017578125, 4.81829833984375, 5.039794921875, 5.26129150390625, 5.4827880859375, 5.70428466796875, 5.92578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 7.0, 9.0, 13.0, 44.0, 89.0, 141.0, 198.0, 197.0, 137.0, 86.0, 50.0, 16.0, 7.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-205.93653869628906, -200.35958862304688, -194.78265380859375, -189.20571899414062, -183.62876892089844, -178.05181884765625, -172.47488403320312, -166.89794921875, -161.3209991455078, -155.74404907226562, -150.1671142578125, -144.59017944335938, -139.0132293701172, -133.436279296875, -127.85934448242188, -122.28240203857422, -116.70545959472656, -111.1285171508789, -105.55157470703125, -99.9746322631836, -94.39768981933594, -88.82074737548828, -83.24380493164062, -77.66686248779297, -72.08992004394531, -66.51297760009766, -60.93603515625, -55.359092712402344, -49.78215026855469, -44.20520782470703, -38.628265380859375, -33.05132293701172, -27.474380493164062, -21.897438049316406, -16.32049560546875, -10.743553161621094, -5.1666107177734375, 0.41033172607421875, 5.987274169921875, 11.564216613769531, 17.141159057617188, 22.718101501464844, 28.2950439453125, 33.871986389160156, 39.44892883300781, 45.02587127685547, 50.602813720703125, 56.17975616455078, 61.75669860839844, 67.3336410522461, 72.91058349609375, 78.4875259399414, 84.06446838378906, 89.64141082763672, 95.21835327148438, 100.79529571533203, 106.37223815917969, 111.94918060302734, 117.526123046875, 123.10306549072266, 128.6800079345703, 134.2569580078125, 139.83389282226562, 145.41082763671875, 150.98777770996094]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 9.0, 6.0, 8.0, 16.0, 19.0, 16.0, 27.0, 31.0, 24.0, 41.0, 43.0, 45.0, 57.0, 76.0, 50.0, 68.0, 74.0, 61.0, 50.0, 48.0, 49.0, 31.0, 26.0, 23.0, 17.0, 21.0, 15.0, 15.0, 6.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.8560562133789, -90.27857971191406, -87.70110321044922, -85.1236343383789, -82.54615783691406, -79.96868133544922, -77.39120483398438, -74.81372833251953, -72.23625183105469, -69.65877532958984, -67.081298828125, -64.50382995605469, -61.926353454589844, -59.348876953125, -56.771400451660156, -54.19392395019531, -51.616455078125, -49.038978576660156, -46.46150588989258, -43.884029388427734, -41.306556701660156, -38.72908020019531, -36.15160369873047, -33.574127197265625, -30.996654510498047, -28.419179916381836, -25.841705322265625, -23.26422882080078, -20.68675422668457, -18.10927963256836, -15.531804084777832, -12.954328536987305, -10.376853942871094, -7.799378871917725, -5.2219038009643555, -2.6444287300109863, -0.06695365905761719, 2.5105209350585938, 5.087996482849121, 7.665472030639648, 10.24294662475586, 12.82042121887207, 15.397896766662598, 17.975372314453125, 20.552846908569336, 23.130321502685547, 25.70779800415039, 28.2852725982666, 30.862747192382812, 33.440223693847656, 36.017696380615234, 38.59517288208008, 41.172645568847656, 43.7501220703125, 46.327598571777344, 48.90507507324219, 51.482547760009766, 54.06002426147461, 56.63749694824219, 59.21497344970703, 61.792449951171875, 64.36991882324219, 66.94739532470703, 69.52487182617188, 72.10234832763672]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 9.0, 8.0, 6.0, 7.0, 16.0, 12.0, 14.0, 26.0, 26.0, 40.0, 57.0, 66.0, 113.0, 193.0, 375.0, 824.0, 2959.0, 27433.0, 4146548.0, 12043.0, 1995.0, 661.0, 297.0, 188.0, 96.0, 71.0, 58.0, 36.0, 33.0, 17.0, 19.0, 9.0, 4.0, 6.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.71875, -51.3076171875, -49.896484375, -48.4853515625, -47.07421875, -45.6630859375, -44.251953125, -42.8408203125, -41.4296875, -40.0185546875, -38.607421875, -37.1962890625, -35.78515625, -34.3740234375, -32.962890625, -31.5517578125, -30.140625, -28.7294921875, -27.318359375, -25.9072265625, -24.49609375, -23.0849609375, -21.673828125, -20.2626953125, -18.8515625, -17.4404296875, -16.029296875, -14.6181640625, -13.20703125, -11.7958984375, -10.384765625, -8.9736328125, -7.5625, -6.1513671875, -4.740234375, -3.3291015625, -1.91796875, -0.5068359375, 0.904296875, 2.3154296875, 3.7265625, 5.1376953125, 6.548828125, 7.9599609375, 9.37109375, 10.7822265625, 12.193359375, 13.6044921875, 15.015625, 16.4267578125, 17.837890625, 19.2490234375, 20.66015625, 22.0712890625, 23.482421875, 24.8935546875, 26.3046875, 27.7158203125, 29.126953125, 30.5380859375, 31.94921875, 33.3603515625, 34.771484375, 36.1826171875, 37.59375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 7.0, 10.0, 10.0, 22.0, 24.0, 27.0, 31.0, 41.0, 33.0, 60.0, 58.0, 66.0, 64.0, 72.0, 68.0, 58.0, 61.0, 61.0, 43.0, 33.0, 18.0, 23.0, 25.0, 22.0, 13.0, 12.0, 10.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.72265625, -3.6072998046875, -3.491943359375, -3.3765869140625, -3.26123046875, -3.1458740234375, -3.030517578125, -2.9151611328125, -2.7998046875, -2.6844482421875, -2.569091796875, -2.4537353515625, -2.33837890625, -2.2230224609375, -2.107666015625, -1.9923095703125, -1.876953125, -1.7615966796875, -1.646240234375, -1.5308837890625, -1.41552734375, -1.3001708984375, -1.184814453125, -1.0694580078125, -0.9541015625, -0.8387451171875, -0.723388671875, -0.6080322265625, -0.49267578125, -0.3773193359375, -0.261962890625, -0.1466064453125, -0.03125, 0.0841064453125, 0.199462890625, 0.3148193359375, 0.43017578125, 0.5455322265625, 0.660888671875, 0.7762451171875, 0.8916015625, 1.0069580078125, 1.122314453125, 1.2376708984375, 1.35302734375, 1.4683837890625, 1.583740234375, 1.6990966796875, 1.814453125, 1.9298095703125, 2.045166015625, 2.1605224609375, 2.27587890625, 2.3912353515625, 2.506591796875, 2.6219482421875, 2.7373046875, 2.8526611328125, 2.968017578125, 3.0833740234375, 3.19873046875, 3.3140869140625, 3.429443359375, 3.5447998046875, 3.66015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 4.0, 8.0, 13.0, 18.0, 20.0, 36.0, 32.0, 67.0, 75.0, 127.0, 180.0, 266.0, 396.0, 627.0, 1080.0, 1946.0, 3658.0, 9805.0, 66734.0, 4069073.0, 26757.0, 6581.0, 2794.0, 1534.0, 829.0, 523.0, 341.0, 230.0, 167.0, 103.0, 69.0, 45.0, 44.0, 32.0, 19.0, 19.0, 3.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.859375, -20.2333984375, -19.607421875, -18.9814453125, -18.35546875, -17.7294921875, -17.103515625, -16.4775390625, -15.8515625, -15.2255859375, -14.599609375, -13.9736328125, -13.34765625, -12.7216796875, -12.095703125, -11.4697265625, -10.84375, -10.2177734375, -9.591796875, -8.9658203125, -8.33984375, -7.7138671875, -7.087890625, -6.4619140625, -5.8359375, -5.2099609375, -4.583984375, -3.9580078125, -3.33203125, -2.7060546875, -2.080078125, -1.4541015625, -0.828125, -0.2021484375, 0.423828125, 1.0498046875, 1.67578125, 2.3017578125, 2.927734375, 3.5537109375, 4.1796875, 4.8056640625, 5.431640625, 6.0576171875, 6.68359375, 7.3095703125, 7.935546875, 8.5615234375, 9.1875, 9.8134765625, 10.439453125, 11.0654296875, 11.69140625, 12.3173828125, 12.943359375, 13.5693359375, 14.1953125, 14.8212890625, 15.447265625, 16.0732421875, 16.69921875, 17.3251953125, 17.951171875, 18.5771484375, 19.203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 5.0, 11.0, 6.0, 16.0, 41.0, 240.0, 3566.0, 95.0, 33.0, 16.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.85009765625, -4.7041015625, -4.55810546875, -4.412109375, -4.26611328125, -4.1201171875, -3.97412109375, -3.828125, -3.68212890625, -3.5361328125, -3.39013671875, -3.244140625, -3.09814453125, -2.9521484375, -2.80615234375, -2.66015625, -2.51416015625, -2.3681640625, -2.22216796875, -2.076171875, -1.93017578125, -1.7841796875, -1.63818359375, -1.4921875, -1.34619140625, -1.2001953125, -1.05419921875, -0.908203125, -0.76220703125, -0.6162109375, -0.47021484375, -0.32421875, -0.17822265625, -0.0322265625, 0.11376953125, 0.259765625, 0.40576171875, 0.5517578125, 0.69775390625, 0.84375, 0.98974609375, 1.1357421875, 1.28173828125, 1.427734375, 1.57373046875, 1.7197265625, 1.86572265625, 2.01171875, 2.15771484375, 2.3037109375, 2.44970703125, 2.595703125, 2.74169921875, 2.8876953125, 3.03369140625, 3.1796875, 3.32568359375, 3.4716796875, 3.61767578125, 3.763671875, 3.90966796875, 4.0556640625, 4.20166015625, 4.34765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 15.0, 15.0, 29.0, 30.0, 37.0, 61.0, 65.0, 88.0, 101.0, 94.0, 99.0, 91.0, 74.0, 52.0, 36.0, 27.0, 22.0, 14.0, 11.0, 6.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.490067481994629, -13.115971565246582, -12.741876602172852, -12.367780685424805, -11.993684768676758, -11.619589805603027, -11.24549388885498, -10.87139892578125, -10.497303009033203, -10.123207092285156, -9.749112129211426, -9.375016212463379, -9.000921249389648, -8.626825332641602, -8.252729415893555, -7.878633975982666, -7.504538536071777, -7.130443096160889, -6.75634765625, -6.382251739501953, -6.0081562995910645, -5.634060859680176, -5.259964942932129, -4.88586950302124, -4.511774063110352, -4.137678623199463, -3.763582944869995, -3.3894872665405273, -3.0153918266296387, -2.64129638671875, -2.2672007083892822, -1.8931050300598145, -1.5190086364746094, -1.1449130773544312, -0.7708175182342529, -0.3967219591140747, -0.022626399993896484, 0.35146915912628174, 0.72556471824646, 1.0996603965759277, 1.4737558364868164, 1.8478513956069946, 2.221946954727173, 2.5960426330566406, 2.9701380729675293, 3.344233512878418, 3.7183291912078857, 4.0924248695373535, 4.466520309448242, 4.840615749359131, 5.2147111892700195, 5.588807106018066, 5.962902545928955, 6.336997985839844, 6.711093902587891, 7.085189342498779, 7.459284782409668, 7.833380222320557, 8.207475662231445, 8.581571578979492, 8.955667495727539, 9.32976245880127, 9.703858375549316, 10.077953338623047, 10.452049255371094]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 4.0, 8.0, 7.0, 12.0, 15.0, 20.0, 19.0, 17.0, 21.0, 24.0, 18.0, 27.0, 31.0, 32.0, 27.0, 41.0, 33.0, 51.0, 40.0, 53.0, 53.0, 43.0, 41.0, 30.0, 20.0, 28.0, 33.0, 31.0, 25.0, 35.0, 30.0, 27.0, 15.0, 12.0, 6.0, 8.0, 13.0, 7.0, 6.0, 8.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.134579658508301, -5.9267354011535645, -5.718891143798828, -5.511046886444092, -5.3032026290893555, -5.095357894897461, -4.887514114379883, -4.679669380187988, -4.471825122833252, -4.263980865478516, -4.056136608123779, -3.848292350769043, -3.6404478549957275, -3.432603597640991, -3.224759340286255, -3.0169148445129395, -2.8090708255767822, -2.601226568222046, -2.3933823108673096, -2.185537815093994, -1.9776935577392578, -1.7698493003845215, -1.5620050430297852, -1.3541606664657593, -1.146316409111023, -0.9384720921516418, -0.7306277751922607, -0.5227835178375244, -0.3149392008781433, -0.10709488391876221, 0.10074937343597412, 0.30859375, 0.5164380073547363, 0.7242823243141174, 0.9321266412734985, 1.1399708986282349, 1.3478152751922607, 1.555659532546997, 1.7635037899017334, 1.9713481664657593, 2.179192543029785, 2.3870368003845215, 2.594881057739258, 2.802725315093994, 3.0105698108673096, 3.218414068222046, 3.4262583255767822, 3.6341028213500977, 3.841946840286255, 4.04979133605957, 4.257635593414307, 4.465479850769043, 4.673324108123779, 4.881168365478516, 5.089012622833252, 5.296856880187988, 5.504701137542725, 5.712545394897461, 5.920389652252197, 6.128233909606934, 6.33607816696167, 6.543922424316406, 6.751767158508301, 6.959611415863037, 7.167455673217773]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 8.0, 20.0, 16.0, 26.0, 39.0, 69.0, 128.0, 195.0, 354.0, 585.0, 1087.0, 2227.0, 4495.0, 10181.0, 25038.0, 64284.0, 168240.0, 360094.0, 250230.0, 96568.0, 37356.0, 14756.0, 6255.0, 2967.0, 1445.0, 820.0, 430.0, 249.0, 132.0, 77.0, 63.0, 43.0, 23.0, 15.0, 17.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.04913330078125, -5.8521728515625, -5.65521240234375, -5.458251953125, -5.26129150390625, -5.0643310546875, -4.86737060546875, -4.67041015625, -4.47344970703125, -4.2764892578125, -4.07952880859375, -3.882568359375, -3.68560791015625, -3.4886474609375, -3.29168701171875, -3.0947265625, -2.89776611328125, -2.7008056640625, -2.50384521484375, -2.306884765625, -2.10992431640625, -1.9129638671875, -1.71600341796875, -1.51904296875, -1.32208251953125, -1.1251220703125, -0.92816162109375, -0.731201171875, -0.53424072265625, -0.3372802734375, -0.14031982421875, 0.056640625, 0.25360107421875, 0.4505615234375, 0.64752197265625, 0.844482421875, 1.04144287109375, 1.2384033203125, 1.43536376953125, 1.63232421875, 1.82928466796875, 2.0262451171875, 2.22320556640625, 2.420166015625, 2.61712646484375, 2.8140869140625, 3.01104736328125, 3.2080078125, 3.40496826171875, 3.6019287109375, 3.79888916015625, 3.995849609375, 4.19281005859375, 4.3897705078125, 4.58673095703125, 4.78369140625, 4.98065185546875, 5.1776123046875, 5.37457275390625, 5.571533203125, 5.76849365234375, 5.9654541015625, 6.16241455078125, 6.359375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 4.0, 16.0, 15.0, 14.0, 27.0, 34.0, 33.0, 29.0, 35.0, 43.0, 53.0, 63.0, 58.0, 71.0, 62.0, 57.0, 49.0, 58.0, 44.0, 37.0, 23.0, 41.0, 26.0, 21.0, 20.0, 12.0, 16.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.458984375, -3.343048095703125, -3.22711181640625, -3.111175537109375, -2.9952392578125, -2.879302978515625, -2.76336669921875, -2.647430419921875, -2.531494140625, -2.415557861328125, -2.29962158203125, -2.183685302734375, -2.0677490234375, -1.951812744140625, -1.83587646484375, -1.719940185546875, -1.60400390625, -1.488067626953125, -1.37213134765625, -1.256195068359375, -1.1402587890625, -1.024322509765625, -0.90838623046875, -0.792449951171875, -0.676513671875, -0.560577392578125, -0.44464111328125, -0.328704833984375, -0.2127685546875, -0.096832275390625, 0.01910400390625, 0.135040283203125, 0.2509765625, 0.366912841796875, 0.48284912109375, 0.598785400390625, 0.7147216796875, 0.830657958984375, 0.94659423828125, 1.062530517578125, 1.178466796875, 1.294403076171875, 1.41033935546875, 1.526275634765625, 1.6422119140625, 1.758148193359375, 1.87408447265625, 1.990020751953125, 2.10595703125, 2.221893310546875, 2.33782958984375, 2.453765869140625, 2.5697021484375, 2.685638427734375, 2.80157470703125, 2.917510986328125, 3.033447265625, 3.149383544921875, 3.26531982421875, 3.381256103515625, 3.4971923828125, 3.613128662109375, 3.72906494140625, 3.845001220703125, 3.9609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 9.0, 23.0, 29.0, 41.0, 58.0, 104.0, 147.0, 315.0, 533.0, 1124.0, 3039.0, 26298.0, 837988.0, 168239.0, 7064.0, 1793.0, 747.0, 400.0, 234.0, 142.0, 83.0, 52.0, 32.0, 23.0, 14.0, 8.0, 5.0, 6.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.796875, -23.091796875, -22.38671875, -21.681640625, -20.9765625, -20.271484375, -19.56640625, -18.861328125, -18.15625, -17.451171875, -16.74609375, -16.041015625, -15.3359375, -14.630859375, -13.92578125, -13.220703125, -12.515625, -11.810546875, -11.10546875, -10.400390625, -9.6953125, -8.990234375, -8.28515625, -7.580078125, -6.875, -6.169921875, -5.46484375, -4.759765625, -4.0546875, -3.349609375, -2.64453125, -1.939453125, -1.234375, -0.529296875, 0.17578125, 0.880859375, 1.5859375, 2.291015625, 2.99609375, 3.701171875, 4.40625, 5.111328125, 5.81640625, 6.521484375, 7.2265625, 7.931640625, 8.63671875, 9.341796875, 10.046875, 10.751953125, 11.45703125, 12.162109375, 12.8671875, 13.572265625, 14.27734375, 14.982421875, 15.6875, 16.392578125, 17.09765625, 17.802734375, 18.5078125, 19.212890625, 19.91796875, 20.623046875, 21.328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 6.0, 5.0, 8.0, 12.0, 7.0, 17.0, 20.0, 23.0, 29.0, 46.0, 41.0, 41.0, 48.0, 62.0, 61.0, 63.0, 72.0, 65.0, 65.0, 62.0, 50.0, 41.0, 31.0, 27.0, 23.0, 26.0, 12.0, 8.0, 13.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.95263671875, -19.2490234375, -18.54541015625, -17.841796875, -17.13818359375, -16.4345703125, -15.73095703125, -15.02734375, -14.32373046875, -13.6201171875, -12.91650390625, -12.212890625, -11.50927734375, -10.8056640625, -10.10205078125, -9.3984375, -8.69482421875, -7.9912109375, -7.28759765625, -6.583984375, -5.88037109375, -5.1767578125, -4.47314453125, -3.76953125, -3.06591796875, -2.3623046875, -1.65869140625, -0.955078125, -0.25146484375, 0.4521484375, 1.15576171875, 1.859375, 2.56298828125, 3.2666015625, 3.97021484375, 4.673828125, 5.37744140625, 6.0810546875, 6.78466796875, 7.48828125, 8.19189453125, 8.8955078125, 9.59912109375, 10.302734375, 11.00634765625, 11.7099609375, 12.41357421875, 13.1171875, 13.82080078125, 14.5244140625, 15.22802734375, 15.931640625, 16.63525390625, 17.3388671875, 18.04248046875, 18.74609375, 19.44970703125, 20.1533203125, 20.85693359375, 21.560546875, 22.26416015625, 22.9677734375, 23.67138671875, 24.375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 4.0, 4.0, 7.0, 8.0, 14.0, 23.0, 41.0, 52.0, 89.0, 95.0, 172.0, 329.0, 656.0, 1419.0, 4910.0, 35799.0, 804336.0, 184236.0, 11684.0, 2582.0, 964.0, 443.0, 239.0, 137.0, 80.0, 69.0, 37.0, 28.0, 30.0, 13.0, 16.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8671875, -10.4892578125, -10.111328125, -9.7333984375, -9.35546875, -8.9775390625, -8.599609375, -8.2216796875, -7.84375, -7.4658203125, -7.087890625, -6.7099609375, -6.33203125, -5.9541015625, -5.576171875, -5.1982421875, -4.8203125, -4.4423828125, -4.064453125, -3.6865234375, -3.30859375, -2.9306640625, -2.552734375, -2.1748046875, -1.796875, -1.4189453125, -1.041015625, -0.6630859375, -0.28515625, 0.0927734375, 0.470703125, 0.8486328125, 1.2265625, 1.6044921875, 1.982421875, 2.3603515625, 2.73828125, 3.1162109375, 3.494140625, 3.8720703125, 4.25, 4.6279296875, 5.005859375, 5.3837890625, 5.76171875, 6.1396484375, 6.517578125, 6.8955078125, 7.2734375, 7.6513671875, 8.029296875, 8.4072265625, 8.78515625, 9.1630859375, 9.541015625, 9.9189453125, 10.296875, 10.6748046875, 11.052734375, 11.4306640625, 11.80859375, 12.1865234375, 12.564453125, 12.9423828125, 13.3203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 12.0, 15.0, 26.0, 34.0, 73.0, 111.0, 237.0, 213.0, 125.0, 60.0, 34.0, 26.0, 14.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.002681732177734375, -0.002624496817588806, -0.0025672614574432373, -0.0025100260972976685, -0.0024527907371520996, -0.0023955553770065308, -0.002338320016860962, -0.002281084656715393, -0.0022238492965698242, -0.0021666139364242554, -0.0021093785762786865, -0.0020521432161331177, -0.001994907855987549, -0.00193767249584198, -0.0018804371356964111, -0.0018232017755508423, -0.0017659664154052734, -0.0017087310552597046, -0.0016514956951141357, -0.001594260334968567, -0.001537024974822998, -0.0014797896146774292, -0.0014225542545318604, -0.0013653188943862915, -0.0013080835342407227, -0.0012508481740951538, -0.001193612813949585, -0.0011363774538040161, -0.0010791420936584473, -0.0010219067335128784, -0.0009646713733673096, -0.0009074360132217407, -0.0008502006530761719, -0.000792965292930603, -0.0007357299327850342, -0.0006784945726394653, -0.0006212592124938965, -0.0005640238523483276, -0.0005067884922027588, -0.00044955313205718994, -0.0003923177719116211, -0.00033508241176605225, -0.0002778470516204834, -0.00022061169147491455, -0.0001633763313293457, -0.00010614097118377686, -4.890561103820801e-05, 8.32974910736084e-06, 6.556510925292969e-05, 0.00012280046939849854, 0.00018003582954406738, 0.00023727118968963623, 0.0002945065498352051, 0.0003517419099807739, 0.0004089772701263428, 0.0004662126302719116, 0.0005234479904174805, 0.0005806833505630493, 0.0006379187107086182, 0.000695154070854187, 0.0007523894309997559, 0.0008096247911453247, 0.0008668601512908936, 0.0009240955114364624, 0.0009813308715820312]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 12.0, 13.0, 15.0, 21.0, 32.0, 52.0, 75.0, 122.0, 268.0, 583.0, 1449.0, 5019.0, 28501.0, 645814.0, 341442.0, 19042.0, 3761.0, 1198.0, 548.0, 249.0, 125.0, 73.0, 49.0, 27.0, 16.0, 13.0, 9.0, 9.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.15625, -11.762939453125, -11.36962890625, -10.976318359375, -10.5830078125, -10.189697265625, -9.79638671875, -9.403076171875, -9.009765625, -8.616455078125, -8.22314453125, -7.829833984375, -7.4365234375, -7.043212890625, -6.64990234375, -6.256591796875, -5.86328125, -5.469970703125, -5.07666015625, -4.683349609375, -4.2900390625, -3.896728515625, -3.50341796875, -3.110107421875, -2.716796875, -2.323486328125, -1.93017578125, -1.536865234375, -1.1435546875, -0.750244140625, -0.35693359375, 0.036376953125, 0.4296875, 0.822998046875, 1.21630859375, 1.609619140625, 2.0029296875, 2.396240234375, 2.78955078125, 3.182861328125, 3.576171875, 3.969482421875, 4.36279296875, 4.756103515625, 5.1494140625, 5.542724609375, 5.93603515625, 6.329345703125, 6.72265625, 7.115966796875, 7.50927734375, 7.902587890625, 8.2958984375, 8.689208984375, 9.08251953125, 9.475830078125, 9.869140625, 10.262451171875, 10.65576171875, 11.049072265625, 11.4423828125, 11.835693359375, 12.22900390625, 12.622314453125, 13.015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 11.0, 13.0, 19.0, 27.0, 34.0, 59.0, 67.0, 119.0, 138.0, 137.0, 104.0, 82.0, 45.0, 31.0, 29.0, 18.0, 8.0, 11.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.7421875, -10.427490234375, -10.11279296875, -9.798095703125, -9.4833984375, -9.168701171875, -8.85400390625, -8.539306640625, -8.224609375, -7.909912109375, -7.59521484375, -7.280517578125, -6.9658203125, -6.651123046875, -6.33642578125, -6.021728515625, -5.70703125, -5.392333984375, -5.07763671875, -4.762939453125, -4.4482421875, -4.133544921875, -3.81884765625, -3.504150390625, -3.189453125, -2.874755859375, -2.56005859375, -2.245361328125, -1.9306640625, -1.615966796875, -1.30126953125, -0.986572265625, -0.671875, -0.357177734375, -0.04248046875, 0.272216796875, 0.5869140625, 0.901611328125, 1.21630859375, 1.531005859375, 1.845703125, 2.160400390625, 2.47509765625, 2.789794921875, 3.1044921875, 3.419189453125, 3.73388671875, 4.048583984375, 4.36328125, 4.677978515625, 4.99267578125, 5.307373046875, 5.6220703125, 5.936767578125, 6.25146484375, 6.566162109375, 6.880859375, 7.195556640625, 7.51025390625, 7.824951171875, 8.1396484375, 8.454345703125, 8.76904296875, 9.083740234375, 9.3984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 40.0, 108.0, 252.0, 280.0, 193.0, 75.0, 20.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-271.41448974609375, -264.6665344238281, -257.9185485839844, -251.1705780029297, -244.422607421875, -237.67465209960938, -230.9266815185547, -224.1787109375, -217.4307403564453, -210.68276977539062, -203.93479919433594, -197.18682861328125, -190.43887329101562, -183.69088745117188, -176.94293212890625, -170.19496154785156, -163.44699096679688, -156.6990203857422, -149.9510498046875, -143.2030792236328, -136.45510864257812, -129.7071533203125, -122.95918273925781, -116.21121215820312, -109.46324157714844, -102.71527099609375, -95.96730041503906, -89.2193374633789, -82.47136688232422, -75.72339630126953, -68.97543334960938, -62.22746276855469, -55.4794921875, -48.73152160644531, -41.98355484008789, -35.23558807373047, -28.48761749267578, -21.739646911621094, -14.991680145263672, -8.24371337890625, -1.4957427978515625, 5.252225875854492, 12.000194549560547, 18.7481632232666, 25.496131896972656, 32.244102478027344, 38.992069244384766, 45.74003601074219, 52.488006591796875, 59.23597717285156, 65.98394775390625, 72.7319107055664, 79.4798812866211, 86.22785186767578, 92.97581481933594, 99.72378540039062, 106.47175598144531, 113.2197265625, 119.96769714355469, 126.71566009521484, 133.463623046875, 140.21160888671875, 146.95956420898438, 153.70753479003906, 160.45550537109375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 16.0, 4.0, 17.0, 23.0, 18.0, 34.0, 22.0, 29.0, 33.0, 43.0, 46.0, 45.0, 60.0, 51.0, 43.0, 63.0, 44.0, 44.0, 58.0, 50.0, 39.0, 41.0, 34.0, 18.0, 15.0, 27.0, 16.0, 13.0, 13.0, 9.0, 7.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1893310546875, -62.667686462402344, -60.14604187011719, -57.62439727783203, -55.102752685546875, -52.58110809326172, -50.05946350097656, -47.537818908691406, -45.01617431640625, -42.494529724121094, -39.97288513183594, -37.45124053955078, -34.929595947265625, -32.40795135498047, -29.886306762695312, -27.364662170410156, -24.843017578125, -22.321372985839844, -19.799728393554688, -17.27808380126953, -14.756439208984375, -12.234794616699219, -9.713150024414062, -7.191505432128906, -4.66986083984375, -2.1482162475585938, 0.3734283447265625, 2.8950729370117188, 5.416717529296875, 7.938362121582031, 10.460006713867188, 12.981651306152344, 15.5032958984375, 18.024940490722656, 20.546585083007812, 23.06822967529297, 25.589874267578125, 28.11151885986328, 30.633163452148438, 33.154808044433594, 35.67645263671875, 38.198097229003906, 40.71974182128906, 43.24138641357422, 45.763031005859375, 48.28467559814453, 50.80632019042969, 53.327964782714844, 55.849609375, 58.371253967285156, 60.89289855957031, 63.41454315185547, 65.93618774414062, 68.45783233642578, 70.97947692871094, 73.5011215209961, 76.02276611328125, 78.5444107055664, 81.06605529785156, 83.58769989013672, 86.10934448242188, 88.63098907470703, 91.15263366699219, 93.67427825927734, 96.1959228515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 3.0, 3.0, 7.0, 3.0, 6.0, 13.0, 17.0, 15.0, 28.0, 40.0, 60.0, 75.0, 95.0, 151.0, 227.0, 351.0, 680.0, 1379.0, 3457.0, 13797.0, 565991.0, 3585854.0, 15081.0, 3651.0, 1457.0, 733.0, 420.0, 202.0, 163.0, 100.0, 71.0, 47.0, 31.0, 23.0, 10.0, 12.0, 8.0, 8.0, 7.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.984375, -21.252197265625, -20.52001953125, -19.787841796875, -19.0556640625, -18.323486328125, -17.59130859375, -16.859130859375, -16.126953125, -15.394775390625, -14.66259765625, -13.930419921875, -13.1982421875, -12.466064453125, -11.73388671875, -11.001708984375, -10.26953125, -9.537353515625, -8.80517578125, -8.072998046875, -7.3408203125, -6.608642578125, -5.87646484375, -5.144287109375, -4.412109375, -3.679931640625, -2.94775390625, -2.215576171875, -1.4833984375, -0.751220703125, -0.01904296875, 0.713134765625, 1.4453125, 2.177490234375, 2.90966796875, 3.641845703125, 4.3740234375, 5.106201171875, 5.83837890625, 6.570556640625, 7.302734375, 8.034912109375, 8.76708984375, 9.499267578125, 10.2314453125, 10.963623046875, 11.69580078125, 12.427978515625, 13.16015625, 13.892333984375, 14.62451171875, 15.356689453125, 16.0888671875, 16.821044921875, 17.55322265625, 18.285400390625, 19.017578125, 19.749755859375, 20.48193359375, 21.214111328125, 21.9462890625, 22.678466796875, 23.41064453125, 24.142822265625, 24.875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 12.0, 18.0, 21.0, 27.0, 39.0, 48.0, 57.0, 67.0, 69.0, 83.0, 67.0, 90.0, 72.0, 63.0, 60.0, 48.0, 31.0, 29.0, 26.0, 16.0, 17.0, 11.0, 2.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.421722412109375, -5.27313232421875, -5.124542236328125, -4.9759521484375, -4.827362060546875, -4.67877197265625, -4.530181884765625, -4.381591796875, -4.233001708984375, -4.08441162109375, -3.935821533203125, -3.7872314453125, -3.638641357421875, -3.49005126953125, -3.341461181640625, -3.19287109375, -3.044281005859375, -2.89569091796875, -2.747100830078125, -2.5985107421875, -2.449920654296875, -2.30133056640625, -2.152740478515625, -2.004150390625, -1.855560302734375, -1.70697021484375, -1.558380126953125, -1.4097900390625, -1.261199951171875, -1.11260986328125, -0.964019775390625, -0.8154296875, -0.666839599609375, -0.51824951171875, -0.369659423828125, -0.2210693359375, -0.072479248046875, 0.07611083984375, 0.224700927734375, 0.373291015625, 0.521881103515625, 0.67047119140625, 0.819061279296875, 0.9676513671875, 1.116241455078125, 1.26483154296875, 1.413421630859375, 1.56201171875, 1.710601806640625, 1.85919189453125, 2.007781982421875, 2.1563720703125, 2.304962158203125, 2.45355224609375, 2.602142333984375, 2.750732421875, 2.899322509765625, 3.04791259765625, 3.196502685546875, 3.3450927734375, 3.493682861328125, 3.64227294921875, 3.790863037109375, 3.939453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 15.0, 9.0, 11.0, 22.0, 30.0, 42.0, 56.0, 84.0, 126.0, 180.0, 266.0, 578.0, 979.0, 2302.0, 7900.0, 101872.0, 4055687.0, 17274.0, 3742.0, 1324.0, 639.0, 412.0, 256.0, 160.0, 77.0, 67.0, 49.0, 25.0, 28.0, 11.0, 15.0, 9.0, 13.0, 6.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.125, -31.1279296875, -30.130859375, -29.1337890625, -28.13671875, -27.1396484375, -26.142578125, -25.1455078125, -24.1484375, -23.1513671875, -22.154296875, -21.1572265625, -20.16015625, -19.1630859375, -18.166015625, -17.1689453125, -16.171875, -15.1748046875, -14.177734375, -13.1806640625, -12.18359375, -11.1865234375, -10.189453125, -9.1923828125, -8.1953125, -7.1982421875, -6.201171875, -5.2041015625, -4.20703125, -3.2099609375, -2.212890625, -1.2158203125, -0.21875, 0.7783203125, 1.775390625, 2.7724609375, 3.76953125, 4.7666015625, 5.763671875, 6.7607421875, 7.7578125, 8.7548828125, 9.751953125, 10.7490234375, 11.74609375, 12.7431640625, 13.740234375, 14.7373046875, 15.734375, 16.7314453125, 17.728515625, 18.7255859375, 19.72265625, 20.7197265625, 21.716796875, 22.7138671875, 23.7109375, 24.7080078125, 25.705078125, 26.7021484375, 27.69921875, 28.6962890625, 29.693359375, 30.6904296875, 31.6875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 12.0, 7.0, 25.0, 42.0, 180.0, 3343.0, 321.0, 58.0, 35.0, 14.0, 7.0, 11.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -6.97833251953125, -6.6558837890625, -6.33343505859375, -6.010986328125, -5.68853759765625, -5.3660888671875, -5.04364013671875, -4.72119140625, -4.39874267578125, -4.0762939453125, -3.75384521484375, -3.431396484375, -3.10894775390625, -2.7864990234375, -2.46405029296875, -2.1416015625, -1.81915283203125, -1.4967041015625, -1.17425537109375, -0.851806640625, -0.52935791015625, -0.2069091796875, 0.11553955078125, 0.43798828125, 0.76043701171875, 1.0828857421875, 1.40533447265625, 1.727783203125, 2.05023193359375, 2.3726806640625, 2.69512939453125, 3.017578125, 3.34002685546875, 3.6624755859375, 3.98492431640625, 4.307373046875, 4.62982177734375, 4.9522705078125, 5.27471923828125, 5.59716796875, 5.91961669921875, 6.2420654296875, 6.56451416015625, 6.886962890625, 7.20941162109375, 7.5318603515625, 7.85430908203125, 8.1767578125, 8.49920654296875, 8.8216552734375, 9.14410400390625, 9.466552734375, 9.78900146484375, 10.1114501953125, 10.43389892578125, 10.75634765625, 11.07879638671875, 11.4012451171875, 11.72369384765625, 12.046142578125, 12.36859130859375, 12.6910400390625, 13.01348876953125, 13.3359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 8.0, 12.0, 20.0, 32.0, 39.0, 62.0, 83.0, 101.0, 106.0, 120.0, 114.0, 87.0, 46.0, 35.0, 29.0, 15.0, 19.0, 16.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.66485023498535, -20.82520866394043, -19.98556900024414, -19.14592742919922, -18.30628776550293, -17.466646194458008, -16.62700653076172, -15.787364959716797, -14.947724342346191, -14.108083724975586, -13.26844310760498, -12.428802490234375, -11.589160919189453, -10.749521255493164, -9.909879684448242, -9.070239067077637, -8.230598449707031, -7.390957832336426, -6.55131721496582, -5.711676120758057, -4.872035503387451, -4.032394886016846, -3.192753791809082, -2.3531131744384766, -1.513472557067871, -0.6738318204879761, 0.16580891609191895, 1.0054497718811035, 1.845090389251709, 2.6847310066223145, 3.524372100830078, 4.364012718200684, 5.203655242919922, 6.043295860290527, 6.882936477661133, 7.7225775718688965, 8.562217712402344, 9.401859283447266, 10.241499900817871, 11.081140518188477, 11.920781135559082, 12.760421752929688, 13.600062370300293, 14.439702987670898, 15.27934455871582, 16.11898422241211, 16.95862579345703, 17.798267364501953, 18.637907028198242, 19.477548599243164, 20.317188262939453, 21.156829833984375, 21.996469497680664, 22.836111068725586, 23.675750732421875, 24.515392303466797, 25.35503387451172, 26.19467544555664, 27.03431510925293, 27.87395668029785, 28.71359634399414, 29.553237915039062, 30.392879486083984, 31.232519149780273, 32.07215881347656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 6.0, 7.0, 12.0, 12.0, 11.0, 24.0, 15.0, 26.0, 31.0, 41.0, 38.0, 44.0, 49.0, 65.0, 56.0, 48.0, 59.0, 60.0, 46.0, 64.0, 45.0, 47.0, 30.0, 35.0, 26.0, 30.0, 18.0, 17.0, 13.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.69904327392578, -17.978240966796875, -17.257436752319336, -16.53663444519043, -15.81583023071289, -15.095027923583984, -14.374224662780762, -13.653421401977539, -12.932618141174316, -12.211814880371094, -11.491011619567871, -10.770208358764648, -10.049406051635742, -9.328601837158203, -8.607799530029297, -7.886996269226074, -7.166193008422852, -6.445389747619629, -5.724586486816406, -5.003783702850342, -4.282980442047119, -3.5621771812438965, -2.841374397277832, -2.1205711364746094, -1.3997678756713867, -0.6789647340774536, 0.04183840751647949, 0.762641429901123, 1.4834446907043457, 2.2042479515075684, 2.925050735473633, 3.6458539962768555, 4.366657257080078, 5.087460517883301, 5.808263778686523, 6.529066562652588, 7.2498698234558105, 7.970673084259033, 8.691475868225098, 9.41227912902832, 10.133082389831543, 10.853885650634766, 11.574688911437988, 12.295492172241211, 13.016294479370117, 13.737098693847656, 14.457901000976562, 15.178704261779785, 15.899507522583008, 16.620309829711914, 17.341114044189453, 18.06191635131836, 18.7827205657959, 19.503522872924805, 20.224327087402344, 20.94512939453125, 21.665931701660156, 22.386734008789062, 23.1075382232666, 23.828340530395508, 24.549144744873047, 25.269947052001953, 25.99074935913086, 26.7115535736084, 27.432357788085938]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 13.0, 12.0, 9.0, 17.0, 15.0, 20.0, 41.0, 55.0, 68.0, 100.0, 154.0, 212.0, 300.0, 522.0, 756.0, 1313.0, 2310.0, 4261.0, 8432.0, 18159.0, 41556.0, 99072.0, 269596.0, 364726.0, 134704.0, 54977.0, 23805.0, 10978.0, 5324.0, 2795.0, 1559.0, 935.0, 564.0, 376.0, 260.0, 166.0, 107.0, 89.0, 51.0, 37.0, 38.0, 15.0, 14.0, 11.0, 14.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0390625, -8.758056640625, -8.47705078125, -8.196044921875, -7.9150390625, -7.634033203125, -7.35302734375, -7.072021484375, -6.791015625, -6.510009765625, -6.22900390625, -5.947998046875, -5.6669921875, -5.385986328125, -5.10498046875, -4.823974609375, -4.54296875, -4.261962890625, -3.98095703125, -3.699951171875, -3.4189453125, -3.137939453125, -2.85693359375, -2.575927734375, -2.294921875, -2.013916015625, -1.73291015625, -1.451904296875, -1.1708984375, -0.889892578125, -0.60888671875, -0.327880859375, -0.046875, 0.234130859375, 0.51513671875, 0.796142578125, 1.0771484375, 1.358154296875, 1.63916015625, 1.920166015625, 2.201171875, 2.482177734375, 2.76318359375, 3.044189453125, 3.3251953125, 3.606201171875, 3.88720703125, 4.168212890625, 4.44921875, 4.730224609375, 5.01123046875, 5.292236328125, 5.5732421875, 5.854248046875, 6.13525390625, 6.416259765625, 6.697265625, 6.978271484375, 7.25927734375, 7.540283203125, 7.8212890625, 8.102294921875, 8.38330078125, 8.664306640625, 8.9453125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 4.0, 11.0, 18.0, 14.0, 28.0, 27.0, 44.0, 36.0, 38.0, 51.0, 59.0, 63.0, 72.0, 73.0, 67.0, 66.0, 57.0, 54.0, 44.0, 38.0, 29.0, 18.0, 23.0, 14.0, 10.0, 8.0, 6.0, 5.0, 10.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.07427978515625, -4.9337158203125, -4.79315185546875, -4.652587890625, -4.51202392578125, -4.3714599609375, -4.23089599609375, -4.09033203125, -3.94976806640625, -3.8092041015625, -3.66864013671875, -3.528076171875, -3.38751220703125, -3.2469482421875, -3.10638427734375, -2.9658203125, -2.82525634765625, -2.6846923828125, -2.54412841796875, -2.403564453125, -2.26300048828125, -2.1224365234375, -1.98187255859375, -1.84130859375, -1.70074462890625, -1.5601806640625, -1.41961669921875, -1.279052734375, -1.13848876953125, -0.9979248046875, -0.85736083984375, -0.716796875, -0.57623291015625, -0.4356689453125, -0.29510498046875, -0.154541015625, -0.01397705078125, 0.1265869140625, 0.26715087890625, 0.40771484375, 0.54827880859375, 0.6888427734375, 0.82940673828125, 0.969970703125, 1.11053466796875, 1.2510986328125, 1.39166259765625, 1.5322265625, 1.67279052734375, 1.8133544921875, 1.95391845703125, 2.094482421875, 2.23504638671875, 2.3756103515625, 2.51617431640625, 2.65673828125, 2.79730224609375, 2.9378662109375, 3.07843017578125, 3.218994140625, 3.35955810546875, 3.5001220703125, 3.64068603515625, 3.78125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 8.0, 16.0, 21.0, 31.0, 45.0, 75.0, 107.0, 143.0, 231.0, 349.0, 639.0, 1400.0, 3786.0, 16478.0, 183799.0, 776236.0, 52735.0, 7847.0, 2250.0, 969.0, 517.0, 287.0, 202.0, 103.0, 74.0, 57.0, 31.0, 23.0, 25.0, 21.0, 5.0, 8.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-26.6875, -25.930908203125, -25.17431640625, -24.417724609375, -23.6611328125, -22.904541015625, -22.14794921875, -21.391357421875, -20.634765625, -19.878173828125, -19.12158203125, -18.364990234375, -17.6083984375, -16.851806640625, -16.09521484375, -15.338623046875, -14.58203125, -13.825439453125, -13.06884765625, -12.312255859375, -11.5556640625, -10.799072265625, -10.04248046875, -9.285888671875, -8.529296875, -7.772705078125, -7.01611328125, -6.259521484375, -5.5029296875, -4.746337890625, -3.98974609375, -3.233154296875, -2.4765625, -1.719970703125, -0.96337890625, -0.206787109375, 0.5498046875, 1.306396484375, 2.06298828125, 2.819580078125, 3.576171875, 4.332763671875, 5.08935546875, 5.845947265625, 6.6025390625, 7.359130859375, 8.11572265625, 8.872314453125, 9.62890625, 10.385498046875, 11.14208984375, 11.898681640625, 12.6552734375, 13.411865234375, 14.16845703125, 14.925048828125, 15.681640625, 16.438232421875, 17.19482421875, 17.951416015625, 18.7080078125, 19.464599609375, 20.22119140625, 20.977783203125, 21.734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 15.0, 10.0, 16.0, 37.0, 33.0, 33.0, 58.0, 38.0, 58.0, 46.0, 56.0, 65.0, 62.0, 52.0, 60.0, 59.0, 47.0, 47.0, 50.0, 45.0, 21.0, 20.0, 19.0, 13.0, 11.0, 5.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.71875, -21.06689453125, -20.4150390625, -19.76318359375, -19.111328125, -18.45947265625, -17.8076171875, -17.15576171875, -16.50390625, -15.85205078125, -15.2001953125, -14.54833984375, -13.896484375, -13.24462890625, -12.5927734375, -11.94091796875, -11.2890625, -10.63720703125, -9.9853515625, -9.33349609375, -8.681640625, -8.02978515625, -7.3779296875, -6.72607421875, -6.07421875, -5.42236328125, -4.7705078125, -4.11865234375, -3.466796875, -2.81494140625, -2.1630859375, -1.51123046875, -0.859375, -0.20751953125, 0.4443359375, 1.09619140625, 1.748046875, 2.39990234375, 3.0517578125, 3.70361328125, 4.35546875, 5.00732421875, 5.6591796875, 6.31103515625, 6.962890625, 7.61474609375, 8.2666015625, 8.91845703125, 9.5703125, 10.22216796875, 10.8740234375, 11.52587890625, 12.177734375, 12.82958984375, 13.4814453125, 14.13330078125, 14.78515625, 15.43701171875, 16.0888671875, 16.74072265625, 17.392578125, 18.04443359375, 18.6962890625, 19.34814453125, 20.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 7.0, 11.0, 18.0, 27.0, 39.0, 72.0, 129.0, 197.0, 388.0, 765.0, 1800.0, 5809.0, 25141.0, 177546.0, 705091.0, 107057.0, 17215.0, 4412.0, 1482.0, 626.0, 267.0, 159.0, 101.0, 64.0, 42.0, 21.0, 27.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.125732421875, -4.91552734375, -4.705322265625, -4.4951171875, -4.284912109375, -4.07470703125, -3.864501953125, -3.654296875, -3.444091796875, -3.23388671875, -3.023681640625, -2.8134765625, -2.603271484375, -2.39306640625, -2.182861328125, -1.97265625, -1.762451171875, -1.55224609375, -1.342041015625, -1.1318359375, -0.921630859375, -0.71142578125, -0.501220703125, -0.291015625, -0.080810546875, 0.12939453125, 0.339599609375, 0.5498046875, 0.760009765625, 0.97021484375, 1.180419921875, 1.390625, 1.600830078125, 1.81103515625, 2.021240234375, 2.2314453125, 2.441650390625, 2.65185546875, 2.862060546875, 3.072265625, 3.282470703125, 3.49267578125, 3.702880859375, 3.9130859375, 4.123291015625, 4.33349609375, 4.543701171875, 4.75390625, 4.964111328125, 5.17431640625, 5.384521484375, 5.5947265625, 5.804931640625, 6.01513671875, 6.225341796875, 6.435546875, 6.645751953125, 6.85595703125, 7.066162109375, 7.2763671875, 7.486572265625, 7.69677734375, 7.906982421875, 8.1171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 12.0, 12.0, 24.0, 21.0, 27.0, 27.0, 40.0, 50.0, 75.0, 105.0, 131.0, 109.0, 71.0, 62.0, 43.0, 35.0, 24.0, 26.0, 16.0, 16.0, 13.0, 11.0, 6.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009579658508300781, -0.0009255930781364441, -0.0008932203054428101, -0.000860847532749176, -0.000828474760055542, -0.000796101987361908, -0.0007637292146682739, -0.0007313564419746399, -0.0006989836692810059, -0.0006666108965873718, -0.0006342381238937378, -0.0006018653512001038, -0.0005694925785064697, -0.0005371198058128357, -0.0005047470331192017, -0.0004723742604255676, -0.0004400014877319336, -0.00040762871503829956, -0.00037525594234466553, -0.0003428831696510315, -0.00031051039695739746, -0.00027813762426376343, -0.0002457648515701294, -0.00021339207887649536, -0.00018101930618286133, -0.0001486465334892273, -0.00011627376079559326, -8.390098810195923e-05, -5.1528215408325195e-05, -1.9155442714691162e-05, 1.3217329978942871e-05, 4.5590102672576904e-05, 7.796287536621094e-05, 0.00011033564805984497, 0.000142708420753479, 0.00017508119344711304, 0.00020745396614074707, 0.0002398267388343811, 0.00027219951152801514, 0.00030457228422164917, 0.0003369450569152832, 0.00036931782960891724, 0.00040169060230255127, 0.0004340633749961853, 0.00046643614768981934, 0.0004988089203834534, 0.0005311816930770874, 0.0005635544657707214, 0.0005959272384643555, 0.0006283000111579895, 0.0006606727838516235, 0.0006930455565452576, 0.0007254183292388916, 0.0007577911019325256, 0.0007901638746261597, 0.0008225366473197937, 0.0008549094200134277, 0.0008872821927070618, 0.0009196549654006958, 0.0009520277380943298, 0.0009844005107879639, 0.001016773283481598, 0.001049146056175232, 0.001081518828868866, 0.0011138916015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 9.0, 9.0, 22.0, 38.0, 47.0, 61.0, 127.0, 222.0, 399.0, 840.0, 2188.0, 7796.0, 46647.0, 627252.0, 327390.0, 26942.0, 5285.0, 1671.0, 701.0, 360.0, 205.0, 111.0, 85.0, 48.0, 37.0, 20.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.890625, -8.64276123046875, -8.3948974609375, -8.14703369140625, -7.899169921875, -7.65130615234375, -7.4034423828125, -7.15557861328125, -6.90771484375, -6.65985107421875, -6.4119873046875, -6.16412353515625, -5.916259765625, -5.66839599609375, -5.4205322265625, -5.17266845703125, -4.9248046875, -4.67694091796875, -4.4290771484375, -4.18121337890625, -3.933349609375, -3.68548583984375, -3.4376220703125, -3.18975830078125, -2.94189453125, -2.69403076171875, -2.4461669921875, -2.19830322265625, -1.950439453125, -1.70257568359375, -1.4547119140625, -1.20684814453125, -0.958984375, -0.71112060546875, -0.4632568359375, -0.21539306640625, 0.032470703125, 0.28033447265625, 0.5281982421875, 0.77606201171875, 1.02392578125, 1.27178955078125, 1.5196533203125, 1.76751708984375, 2.015380859375, 2.26324462890625, 2.5111083984375, 2.75897216796875, 3.0068359375, 3.25469970703125, 3.5025634765625, 3.75042724609375, 3.998291015625, 4.24615478515625, 4.4940185546875, 4.74188232421875, 4.98974609375, 5.23760986328125, 5.4854736328125, 5.73333740234375, 5.981201171875, 6.22906494140625, 6.4769287109375, 6.72479248046875, 6.97265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 8.0, 19.0, 9.0, 12.0, 19.0, 11.0, 25.0, 26.0, 34.0, 41.0, 41.0, 44.0, 45.0, 70.0, 70.0, 73.0, 74.0, 36.0, 62.0, 35.0, 38.0, 36.0, 25.0, 24.0, 21.0, 21.0, 12.0, 12.0, 11.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.1484375, -4.0257568359375, -3.903076171875, -3.7803955078125, -3.65771484375, -3.5350341796875, -3.412353515625, -3.2896728515625, -3.1669921875, -3.0443115234375, -2.921630859375, -2.7989501953125, -2.67626953125, -2.5535888671875, -2.430908203125, -2.3082275390625, -2.185546875, -2.0628662109375, -1.940185546875, -1.8175048828125, -1.69482421875, -1.5721435546875, -1.449462890625, -1.3267822265625, -1.2041015625, -1.0814208984375, -0.958740234375, -0.8360595703125, -0.71337890625, -0.5906982421875, -0.468017578125, -0.3453369140625, -0.22265625, -0.0999755859375, 0.022705078125, 0.1453857421875, 0.26806640625, 0.3907470703125, 0.513427734375, 0.6361083984375, 0.7587890625, 0.8814697265625, 1.004150390625, 1.1268310546875, 1.24951171875, 1.3721923828125, 1.494873046875, 1.6175537109375, 1.740234375, 1.8629150390625, 1.985595703125, 2.1082763671875, 2.23095703125, 2.3536376953125, 2.476318359375, 2.5989990234375, 2.7216796875, 2.8443603515625, 2.967041015625, 3.0897216796875, 3.21240234375, 3.3350830078125, 3.457763671875, 3.5804443359375, 3.703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 12.0, 19.0, 37.0, 57.0, 83.0, 96.0, 127.0, 126.0, 117.0, 108.0, 70.0, 40.0, 33.0, 18.0, 20.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-84.27715301513672, -80.96037292480469, -77.64359283447266, -74.32681274414062, -71.01002502441406, -67.69325256347656, -64.37646484375, -61.05968475341797, -57.74290466308594, -54.426124572753906, -51.109344482421875, -47.79256057739258, -44.47578048706055, -41.159000396728516, -37.84221649169922, -34.52543640136719, -31.208656311035156, -27.891876220703125, -24.57509422302246, -21.258312225341797, -17.941532135009766, -14.624752044677734, -11.30797004699707, -7.991188049316406, -4.674407958984375, -1.3576269149780273, 1.9591541290283203, 5.275935173034668, 8.592716217041016, 11.909496307373047, 15.226278305053711, 18.543060302734375, 21.859848022460938, 25.17662811279297, 28.493410110473633, 31.810192108154297, 35.12697219848633, 38.44375228881836, 41.760536193847656, 45.07731628417969, 48.39409637451172, 51.71087646484375, 55.02765655517578, 58.34444046020508, 61.66122055053711, 64.97799682617188, 68.29478454589844, 71.61156463623047, 74.9283447265625, 78.24512481689453, 81.56190490722656, 84.8786849975586, 88.19546508789062, 91.51225280761719, 94.82903289794922, 98.14581298828125, 101.46259307861328, 104.77937316894531, 108.09615325927734, 111.41293334960938, 114.72972106933594, 118.04649353027344, 121.36328125, 124.68006134033203, 127.99684143066406]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 8.0, 6.0, 13.0, 10.0, 13.0, 22.0, 12.0, 29.0, 24.0, 34.0, 30.0, 33.0, 34.0, 53.0, 65.0, 48.0, 60.0, 56.0, 59.0, 54.0, 38.0, 28.0, 44.0, 47.0, 22.0, 20.0, 24.0, 20.0, 17.0, 14.0, 14.0, 9.0, 10.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.85090637207031, -48.74159622192383, -46.63228225708008, -44.522972106933594, -42.41366195678711, -40.304351806640625, -38.195037841796875, -36.08572769165039, -33.976417541503906, -31.86710548400879, -29.757795333862305, -27.648483276367188, -25.539173126220703, -23.429861068725586, -21.32054901123047, -19.211238861083984, -17.101924896240234, -14.992613792419434, -12.883302688598633, -10.773990631103516, -8.664679527282715, -6.555368423461914, -4.446056365966797, -2.336745262145996, -0.2274341583251953, 1.8818771839141846, 3.9911885261535645, 6.100500106811523, 8.209811210632324, 10.319122314453125, 12.428434371948242, 14.537745475769043, 16.647056579589844, 18.75636863708496, 20.865678787231445, 22.974990844726562, 25.084300994873047, 27.193613052368164, 29.30292510986328, 31.412235260009766, 33.52154541015625, 35.630855560302734, 37.740169525146484, 39.84947967529297, 41.95878982543945, 44.06809997558594, 46.17741394042969, 48.28672409057617, 50.39603805541992, 52.505348205566406, 54.614662170410156, 56.72397232055664, 58.833282470703125, 60.942596435546875, 63.05190658569336, 65.16121673583984, 67.2705307006836, 69.37984466552734, 71.48915100097656, 73.59846496582031, 75.70777893066406, 77.81708526611328, 79.92639923095703, 82.03571319580078, 84.14501953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 4.0, 4.0, 4.0, 8.0, 11.0, 17.0, 31.0, 27.0, 44.0, 63.0, 88.0, 128.0, 198.0, 260.0, 391.0, 605.0, 1022.0, 1696.0, 2960.0, 5404.0, 10607.0, 22847.0, 60376.0, 266072.0, 3156630.0, 525522.0, 82028.0, 29156.0, 12970.0, 6476.0, 3391.0, 1919.0, 1164.0, 651.0, 467.0, 312.0, 192.0, 142.0, 111.0, 83.0, 53.0, 32.0, 32.0, 22.0, 16.0, 10.0, 9.0, 10.0, 6.0, 6.0, 0.0, 4.0, 2.0, 2.0], "bins": [-8.0859375, -7.85247802734375, -7.6190185546875, -7.38555908203125, -7.152099609375, -6.91864013671875, -6.6851806640625, -6.45172119140625, -6.21826171875, -5.98480224609375, -5.7513427734375, -5.51788330078125, -5.284423828125, -5.05096435546875, -4.8175048828125, -4.58404541015625, -4.3505859375, -4.11712646484375, -3.8836669921875, -3.65020751953125, -3.416748046875, -3.18328857421875, -2.9498291015625, -2.71636962890625, -2.48291015625, -2.24945068359375, -2.0159912109375, -1.78253173828125, -1.549072265625, -1.31561279296875, -1.0821533203125, -0.84869384765625, -0.615234375, -0.38177490234375, -0.1483154296875, 0.08514404296875, 0.318603515625, 0.55206298828125, 0.7855224609375, 1.01898193359375, 1.25244140625, 1.48590087890625, 1.7193603515625, 1.95281982421875, 2.186279296875, 2.41973876953125, 2.6531982421875, 2.88665771484375, 3.1201171875, 3.35357666015625, 3.5870361328125, 3.82049560546875, 4.053955078125, 4.28741455078125, 4.5208740234375, 4.75433349609375, 4.98779296875, 5.22125244140625, 5.4547119140625, 5.68817138671875, 5.921630859375, 6.15509033203125, 6.3885498046875, 6.62200927734375, 6.85546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 10.0, 9.0, 12.0, 18.0, 26.0, 15.0, 22.0, 17.0, 33.0, 33.0, 37.0, 38.0, 49.0, 52.0, 42.0, 46.0, 58.0, 58.0, 48.0, 47.0, 36.0, 53.0, 37.0, 26.0, 44.0, 24.0, 14.0, 22.0, 16.0, 9.0, 5.0, 4.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.1875, -3.09173583984375, -2.9959716796875, -2.90020751953125, -2.804443359375, -2.70867919921875, -2.6129150390625, -2.51715087890625, -2.42138671875, -2.32562255859375, -2.2298583984375, -2.13409423828125, -2.038330078125, -1.94256591796875, -1.8468017578125, -1.75103759765625, -1.6552734375, -1.55950927734375, -1.4637451171875, -1.36798095703125, -1.272216796875, -1.17645263671875, -1.0806884765625, -0.98492431640625, -0.88916015625, -0.79339599609375, -0.6976318359375, -0.60186767578125, -0.506103515625, -0.41033935546875, -0.3145751953125, -0.21881103515625, -0.123046875, -0.02728271484375, 0.0684814453125, 0.16424560546875, 0.260009765625, 0.35577392578125, 0.4515380859375, 0.54730224609375, 0.64306640625, 0.73883056640625, 0.8345947265625, 0.93035888671875, 1.026123046875, 1.12188720703125, 1.2176513671875, 1.31341552734375, 1.4091796875, 1.50494384765625, 1.6007080078125, 1.69647216796875, 1.792236328125, 1.88800048828125, 1.9837646484375, 2.07952880859375, 2.17529296875, 2.27105712890625, 2.3668212890625, 2.46258544921875, 2.558349609375, 2.65411376953125, 2.7498779296875, 2.84564208984375, 2.94140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 15.0, 21.0, 21.0, 38.0, 59.0, 97.0, 170.0, 234.0, 406.0, 772.0, 1529.0, 3127.0, 7063.0, 18991.0, 63372.0, 410183.0, 3436636.0, 186420.0, 41320.0, 13628.0, 5245.0, 2317.0, 1129.0, 638.0, 324.0, 172.0, 109.0, 61.0, 52.0, 34.0, 23.0, 20.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.4610595703125, -9.101806640625, -8.7425537109375, -8.38330078125, -8.0240478515625, -7.664794921875, -7.3055419921875, -6.9462890625, -6.5870361328125, -6.227783203125, -5.8685302734375, -5.50927734375, -5.1500244140625, -4.790771484375, -4.4315185546875, -4.072265625, -3.7130126953125, -3.353759765625, -2.9945068359375, -2.63525390625, -2.2760009765625, -1.916748046875, -1.5574951171875, -1.1982421875, -0.8389892578125, -0.479736328125, -0.1204833984375, 0.23876953125, 0.5980224609375, 0.957275390625, 1.3165283203125, 1.67578125, 2.0350341796875, 2.394287109375, 2.7535400390625, 3.11279296875, 3.4720458984375, 3.831298828125, 4.1905517578125, 4.5498046875, 4.9090576171875, 5.268310546875, 5.6275634765625, 5.98681640625, 6.3460693359375, 6.705322265625, 7.0645751953125, 7.423828125, 7.7830810546875, 8.142333984375, 8.5015869140625, 8.86083984375, 9.2200927734375, 9.579345703125, 9.9385986328125, 10.2978515625, 10.6571044921875, 11.016357421875, 11.3756103515625, 11.73486328125, 12.0941162109375, 12.453369140625, 12.8126220703125, 13.171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 5.0, 7.0, 14.0, 10.0, 20.0, 15.0, 28.0, 46.0, 43.0, 84.0, 101.0, 164.0, 330.0, 950.0, 1152.0, 450.0, 207.0, 104.0, 74.0, 55.0, 37.0, 41.0, 28.0, 24.0, 23.0, 7.0, 7.0, 3.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.425537109375, -9.07763671875, -8.729736328125, -8.3818359375, -8.033935546875, -7.68603515625, -7.338134765625, -6.990234375, -6.642333984375, -6.29443359375, -5.946533203125, -5.5986328125, -5.250732421875, -4.90283203125, -4.554931640625, -4.20703125, -3.859130859375, -3.51123046875, -3.163330078125, -2.8154296875, -2.467529296875, -2.11962890625, -1.771728515625, -1.423828125, -1.075927734375, -0.72802734375, -0.380126953125, -0.0322265625, 0.315673828125, 0.66357421875, 1.011474609375, 1.359375, 1.707275390625, 2.05517578125, 2.403076171875, 2.7509765625, 3.098876953125, 3.44677734375, 3.794677734375, 4.142578125, 4.490478515625, 4.83837890625, 5.186279296875, 5.5341796875, 5.882080078125, 6.22998046875, 6.577880859375, 6.92578125, 7.273681640625, 7.62158203125, 7.969482421875, 8.3173828125, 8.665283203125, 9.01318359375, 9.361083984375, 9.708984375, 10.056884765625, 10.40478515625, 10.752685546875, 11.1005859375, 11.448486328125, 11.79638671875, 12.144287109375, 12.4921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 24.0, 75.0, 275.0, 401.0, 162.0, 40.0, 10.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.5133514404297, -149.35073852539062, -141.1881103515625, -133.02549743652344, -124.86288452148438, -116.70026397705078, -108.53764343261719, -100.37503051757812, -92.21240997314453, -84.04978942871094, -75.88717651367188, -67.72455596923828, -59.56193923950195, -51.399322509765625, -43.23670196533203, -35.0740852355957, -26.911468505859375, -18.748851776123047, -10.586233139038086, -2.423614501953125, 5.739002227783203, 13.901618957519531, 22.064239501953125, 30.226856231689453, 38.38947296142578, 46.55208969116211, 54.71470642089844, 62.87732696533203, 71.03994750976562, 79.20256042480469, 87.36518096923828, 95.52780151367188, 103.69039916992188, 111.85301971435547, 120.01563262939453, 128.17825317382812, 136.3408660888672, 144.50347900390625, 152.66610717773438, 160.82872009277344, 168.9913330078125, 177.15394592285156, 185.3165740966797, 193.47918701171875, 201.6417999267578, 209.80441284179688, 217.967041015625, 226.12965393066406, 234.2922821044922, 242.45489501953125, 250.61752319335938, 258.7801513671875, 266.9427490234375, 275.1053771972656, 283.26800537109375, 291.43060302734375, 299.5932312011719, 307.755859375, 315.91845703125, 324.0810852050781, 332.24371337890625, 340.40631103515625, 348.5689392089844, 356.7315673828125, 364.8941650390625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 2.0, 10.0, 11.0, 15.0, 12.0, 14.0, 14.0, 19.0, 19.0, 33.0, 23.0, 30.0, 29.0, 44.0, 45.0, 34.0, 57.0, 55.0, 46.0, 51.0, 44.0, 34.0, 36.0, 41.0, 33.0, 25.0, 25.0, 35.0, 36.0, 18.0, 19.0, 18.0, 11.0, 7.0, 11.0, 10.0, 11.0, 5.0, 0.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-50.7946891784668, -49.412879943847656, -48.031070709228516, -46.649261474609375, -45.26744842529297, -43.88563919067383, -42.50382995605469, -41.12202072143555, -39.740211486816406, -38.358402252197266, -36.976593017578125, -35.59477996826172, -34.21297073364258, -32.83116149902344, -31.449352264404297, -30.067543029785156, -28.68572998046875, -27.30392074584961, -25.922109603881836, -24.540300369262695, -23.158489227294922, -21.77667999267578, -20.39487075805664, -19.0130615234375, -17.631250381469727, -16.249441146850586, -14.867630004882812, -13.485820770263672, -12.104010581970215, -10.722200393676758, -9.340391159057617, -7.95858097076416, -6.576774597167969, -5.194964408874512, -3.813154697418213, -2.431344985961914, -1.049534797668457, 0.332275390625, 1.7140846252441406, 3.0958948135375977, 4.477705001831055, 5.859515190124512, 7.2413249015808105, 8.62313461303711, 10.004944801330566, 11.386754989624023, 12.768564224243164, 14.150374412536621, 15.532184600830078, 16.91399383544922, 18.295804977416992, 19.677614212036133, 21.059425354003906, 22.441234588623047, 23.823043823242188, 25.204853057861328, 26.5866641998291, 27.968473434448242, 29.350284576416016, 30.732093811035156, 32.1139030456543, 33.49571228027344, 34.877525329589844, 36.259334564208984, 37.641143798828125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 7.0, 6.0, 5.0, 13.0, 21.0, 33.0, 47.0, 70.0, 85.0, 133.0, 221.0, 294.0, 488.0, 698.0, 1156.0, 1875.0, 3286.0, 6322.0, 11629.0, 24062.0, 53268.0, 143683.0, 456685.0, 212900.0, 69291.0, 30353.0, 14707.0, 7318.0, 3838.0, 2244.0, 1362.0, 876.0, 550.0, 337.0, 218.0, 134.0, 96.0, 72.0, 65.0, 28.0, 23.0, 11.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 5.0], "bins": [-9.7109375, -9.43853759765625, -9.1661376953125, -8.89373779296875, -8.621337890625, -8.34893798828125, -8.0765380859375, -7.80413818359375, -7.53173828125, -7.25933837890625, -6.9869384765625, -6.71453857421875, -6.442138671875, -6.16973876953125, -5.8973388671875, -5.62493896484375, -5.3525390625, -5.08013916015625, -4.8077392578125, -4.53533935546875, -4.262939453125, -3.99053955078125, -3.7181396484375, -3.44573974609375, -3.17333984375, -2.90093994140625, -2.6285400390625, -2.35614013671875, -2.083740234375, -1.81134033203125, -1.5389404296875, -1.26654052734375, -0.994140625, -0.72174072265625, -0.4493408203125, -0.17694091796875, 0.095458984375, 0.36785888671875, 0.6402587890625, 0.91265869140625, 1.18505859375, 1.45745849609375, 1.7298583984375, 2.00225830078125, 2.274658203125, 2.54705810546875, 2.8194580078125, 3.09185791015625, 3.3642578125, 3.63665771484375, 3.9090576171875, 4.18145751953125, 4.453857421875, 4.72625732421875, 4.9986572265625, 5.27105712890625, 5.54345703125, 5.81585693359375, 6.0882568359375, 6.36065673828125, 6.633056640625, 6.90545654296875, 7.1778564453125, 7.45025634765625, 7.72265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 4.0, 6.0, 11.0, 11.0, 11.0, 20.0, 14.0, 22.0, 26.0, 25.0, 38.0, 29.0, 30.0, 38.0, 58.0, 48.0, 45.0, 56.0, 56.0, 50.0, 47.0, 47.0, 51.0, 35.0, 29.0, 31.0, 32.0, 26.0, 24.0, 14.0, 12.0, 9.0, 10.0, 11.0, 5.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.177734375, -3.075439453125, -2.97314453125, -2.870849609375, -2.7685546875, -2.666259765625, -2.56396484375, -2.461669921875, -2.359375, -2.257080078125, -2.15478515625, -2.052490234375, -1.9501953125, -1.847900390625, -1.74560546875, -1.643310546875, -1.541015625, -1.438720703125, -1.33642578125, -1.234130859375, -1.1318359375, -1.029541015625, -0.92724609375, -0.824951171875, -0.72265625, -0.620361328125, -0.51806640625, -0.415771484375, -0.3134765625, -0.211181640625, -0.10888671875, -0.006591796875, 0.095703125, 0.197998046875, 0.30029296875, 0.402587890625, 0.5048828125, 0.607177734375, 0.70947265625, 0.811767578125, 0.9140625, 1.016357421875, 1.11865234375, 1.220947265625, 1.3232421875, 1.425537109375, 1.52783203125, 1.630126953125, 1.732421875, 1.834716796875, 1.93701171875, 2.039306640625, 2.1416015625, 2.243896484375, 2.34619140625, 2.448486328125, 2.55078125, 2.653076171875, 2.75537109375, 2.857666015625, 2.9599609375, 3.062255859375, 3.16455078125, 3.266845703125, 3.369140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 10.0, 5.0, 16.0, 15.0, 16.0, 42.0, 86.0, 153.0, 309.0, 622.0, 2035.0, 11464.0, 717565.0, 304807.0, 8576.0, 1686.0, 584.0, 248.0, 121.0, 64.0, 38.0, 36.0, 26.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.82470703125, -37.6806640625, -36.53662109375, -35.392578125, -34.24853515625, -33.1044921875, -31.96044921875, -30.81640625, -29.67236328125, -28.5283203125, -27.38427734375, -26.240234375, -25.09619140625, -23.9521484375, -22.80810546875, -21.6640625, -20.52001953125, -19.3759765625, -18.23193359375, -17.087890625, -15.94384765625, -14.7998046875, -13.65576171875, -12.51171875, -11.36767578125, -10.2236328125, -9.07958984375, -7.935546875, -6.79150390625, -5.6474609375, -4.50341796875, -3.359375, -2.21533203125, -1.0712890625, 0.07275390625, 1.216796875, 2.36083984375, 3.5048828125, 4.64892578125, 5.79296875, 6.93701171875, 8.0810546875, 9.22509765625, 10.369140625, 11.51318359375, 12.6572265625, 13.80126953125, 14.9453125, 16.08935546875, 17.2333984375, 18.37744140625, 19.521484375, 20.66552734375, 21.8095703125, 22.95361328125, 24.09765625, 25.24169921875, 26.3857421875, 27.52978515625, 28.673828125, 29.81787109375, 30.9619140625, 32.10595703125, 33.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 7.0, 6.0, 9.0, 17.0, 20.0, 17.0, 16.0, 27.0, 29.0, 50.0, 53.0, 40.0, 56.0, 53.0, 67.0, 66.0, 51.0, 83.0, 63.0, 42.0, 41.0, 22.0, 39.0, 21.0, 19.0, 18.0, 12.0, 10.0, 8.0, 4.0, 7.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.852783203125, -17.23681640625, -16.620849609375, -16.0048828125, -15.388916015625, -14.77294921875, -14.156982421875, -13.541015625, -12.925048828125, -12.30908203125, -11.693115234375, -11.0771484375, -10.461181640625, -9.84521484375, -9.229248046875, -8.61328125, -7.997314453125, -7.38134765625, -6.765380859375, -6.1494140625, -5.533447265625, -4.91748046875, -4.301513671875, -3.685546875, -3.069580078125, -2.45361328125, -1.837646484375, -1.2216796875, -0.605712890625, 0.01025390625, 0.626220703125, 1.2421875, 1.858154296875, 2.47412109375, 3.090087890625, 3.7060546875, 4.322021484375, 4.93798828125, 5.553955078125, 6.169921875, 6.785888671875, 7.40185546875, 8.017822265625, 8.6337890625, 9.249755859375, 9.86572265625, 10.481689453125, 11.09765625, 11.713623046875, 12.32958984375, 12.945556640625, 13.5615234375, 14.177490234375, 14.79345703125, 15.409423828125, 16.025390625, 16.641357421875, 17.25732421875, 17.873291015625, 18.4892578125, 19.105224609375, 19.72119140625, 20.337158203125, 20.953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 5.0, 9.0, 15.0, 17.0, 26.0, 37.0, 48.0, 85.0, 142.0, 256.0, 513.0, 1247.0, 3888.0, 18458.0, 214825.0, 755241.0, 43458.0, 6835.0, 1860.0, 724.0, 325.0, 195.0, 93.0, 65.0, 54.0, 36.0, 20.0, 19.0, 16.0, 7.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.703125, -8.39453125, -8.0859375, -7.77734375, -7.46875, -7.16015625, -6.8515625, -6.54296875, -6.234375, -5.92578125, -5.6171875, -5.30859375, -5.0, -4.69140625, -4.3828125, -4.07421875, -3.765625, -3.45703125, -3.1484375, -2.83984375, -2.53125, -2.22265625, -1.9140625, -1.60546875, -1.296875, -0.98828125, -0.6796875, -0.37109375, -0.0625, 0.24609375, 0.5546875, 0.86328125, 1.171875, 1.48046875, 1.7890625, 2.09765625, 2.40625, 2.71484375, 3.0234375, 3.33203125, 3.640625, 3.94921875, 4.2578125, 4.56640625, 4.875, 5.18359375, 5.4921875, 5.80078125, 6.109375, 6.41796875, 6.7265625, 7.03515625, 7.34375, 7.65234375, 7.9609375, 8.26953125, 8.578125, 8.88671875, 9.1953125, 9.50390625, 9.8125, 10.12109375, 10.4296875, 10.73828125, 11.046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 9.0, 7.0, 10.0, 13.0, 21.0, 27.0, 45.0, 62.0, 87.0, 156.0, 206.0, 108.0, 73.0, 27.0, 37.0, 24.0, 19.0, 13.0, 11.0, 11.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011615753173828125, -0.0011154413223266602, -0.0010693073272705078, -0.0010231733322143555, -0.0009770393371582031, -0.0009309053421020508, -0.0008847713470458984, -0.0008386373519897461, -0.0007925033569335938, -0.0007463693618774414, -0.0007002353668212891, -0.0006541013717651367, -0.0006079673767089844, -0.000561833381652832, -0.0005156993865966797, -0.00046956539154052734, -0.000423431396484375, -0.00037729740142822266, -0.0003311634063720703, -0.00028502941131591797, -0.00023889541625976562, -0.00019276142120361328, -0.00014662742614746094, -0.0001004934310913086, -5.435943603515625e-05, -8.225440979003906e-06, 3.790855407714844e-05, 8.404254913330078e-05, 0.00013017654418945312, 0.00017631053924560547, 0.0002224445343017578, 0.00026857852935791016, 0.0003147125244140625, 0.00036084651947021484, 0.0004069805145263672, 0.00045311450958251953, 0.0004992485046386719, 0.0005453824996948242, 0.0005915164947509766, 0.0006376504898071289, 0.0006837844848632812, 0.0007299184799194336, 0.0007760524749755859, 0.0008221864700317383, 0.0008683204650878906, 0.000914454460144043, 0.0009605884552001953, 0.0010067224502563477, 0.0010528564453125, 0.0010989904403686523, 0.0011451244354248047, 0.001191258430480957, 0.0012373924255371094, 0.0012835264205932617, 0.001329660415649414, 0.0013757944107055664, 0.0014219284057617188, 0.001468062400817871, 0.0015141963958740234, 0.0015603303909301758, 0.0016064643859863281, 0.0016525983810424805, 0.0016987323760986328, 0.0017448663711547852, 0.0017910003662109375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 9.0, 7.0, 11.0, 18.0, 41.0, 51.0, 86.0, 207.0, 449.0, 1240.0, 4962.0, 54431.0, 918077.0, 61073.0, 5605.0, 1371.0, 472.0, 222.0, 98.0, 47.0, 30.0, 22.0, 14.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.7415771484375, -10.303466796875, -9.8653564453125, -9.42724609375, -8.9891357421875, -8.551025390625, -8.1129150390625, -7.6748046875, -7.2366943359375, -6.798583984375, -6.3604736328125, -5.92236328125, -5.4842529296875, -5.046142578125, -4.6080322265625, -4.169921875, -3.7318115234375, -3.293701171875, -2.8555908203125, -2.41748046875, -1.9793701171875, -1.541259765625, -1.1031494140625, -0.6650390625, -0.2269287109375, 0.211181640625, 0.6492919921875, 1.08740234375, 1.5255126953125, 1.963623046875, 2.4017333984375, 2.83984375, 3.2779541015625, 3.716064453125, 4.1541748046875, 4.59228515625, 5.0303955078125, 5.468505859375, 5.9066162109375, 6.3447265625, 6.7828369140625, 7.220947265625, 7.6590576171875, 8.09716796875, 8.5352783203125, 8.973388671875, 9.4114990234375, 9.849609375, 10.2877197265625, 10.725830078125, 11.1639404296875, 11.60205078125, 12.0401611328125, 12.478271484375, 12.9163818359375, 13.3544921875, 13.7926025390625, 14.230712890625, 14.6688232421875, 15.10693359375, 15.5450439453125, 15.983154296875, 16.4212646484375, 16.859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 7.0, 9.0, 20.0, 12.0, 26.0, 36.0, 25.0, 49.0, 54.0, 70.0, 65.0, 89.0, 92.0, 84.0, 60.0, 67.0, 46.0, 42.0, 28.0, 19.0, 22.0, 18.0, 8.0, 9.0, 9.0, 2.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.57421875, -6.39154052734375, -6.2088623046875, -6.02618408203125, -5.843505859375, -5.66082763671875, -5.4781494140625, -5.29547119140625, -5.11279296875, -4.93011474609375, -4.7474365234375, -4.56475830078125, -4.382080078125, -4.19940185546875, -4.0167236328125, -3.83404541015625, -3.6513671875, -3.46868896484375, -3.2860107421875, -3.10333251953125, -2.920654296875, -2.73797607421875, -2.5552978515625, -2.37261962890625, -2.18994140625, -2.00726318359375, -1.8245849609375, -1.64190673828125, -1.459228515625, -1.27655029296875, -1.0938720703125, -0.91119384765625, -0.728515625, -0.54583740234375, -0.3631591796875, -0.18048095703125, 0.002197265625, 0.18487548828125, 0.3675537109375, 0.55023193359375, 0.73291015625, 0.91558837890625, 1.0982666015625, 1.28094482421875, 1.463623046875, 1.64630126953125, 1.8289794921875, 2.01165771484375, 2.1943359375, 2.37701416015625, 2.5596923828125, 2.74237060546875, 2.925048828125, 3.10772705078125, 3.2904052734375, 3.47308349609375, 3.65576171875, 3.83843994140625, 4.0211181640625, 4.20379638671875, 4.386474609375, 4.56915283203125, 4.7518310546875, 4.93450927734375, 5.1171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 7.0, 19.0, 34.0, 58.0, 87.0, 125.0, 190.0, 166.0, 125.0, 65.0, 48.0, 28.0, 14.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-128.66168212890625, -125.17101287841797, -121.68035125732422, -118.18968200683594, -114.69902038574219, -111.2083511352539, -107.71768188476562, -104.22702026367188, -100.73635864257812, -97.24568939208984, -93.7550277709961, -90.26435852050781, -86.77369689941406, -83.28302764892578, -79.7923583984375, -76.30169677734375, -72.81102752685547, -69.32035827636719, -65.82969665527344, -62.339027404785156, -58.848365783691406, -55.357696533203125, -51.86703109741211, -48.376365661621094, -44.88570022583008, -41.39503479003906, -37.90436935424805, -34.41370391845703, -30.923036575317383, -27.432371139526367, -23.94170379638672, -20.451038360595703, -16.960372924804688, -13.469707489013672, -9.97904109954834, -6.488374710083008, -2.997709274291992, 0.49295616149902344, 3.983623504638672, 7.4742889404296875, 10.964954376220703, 14.455619812011719, 17.946285247802734, 21.436952590942383, 24.9276180267334, 28.418283462524414, 31.908950805664062, 35.39961624145508, 38.890281677246094, 42.38094711303711, 45.871612548828125, 49.362281799316406, 52.852943420410156, 56.34361267089844, 59.83427810668945, 63.32494354248047, 66.81561279296875, 70.30628204345703, 73.79694366455078, 77.28761291503906, 80.77827453613281, 84.2689437866211, 87.75961303710938, 91.25027465820312, 94.74093627929688]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 10.0, 10.0, 18.0, 12.0, 19.0, 34.0, 36.0, 44.0, 38.0, 32.0, 29.0, 50.0, 56.0, 65.0, 70.0, 44.0, 63.0, 49.0, 38.0, 24.0, 43.0, 34.0, 24.0, 19.0, 22.0, 14.0, 19.0, 19.0, 13.0, 8.0, 5.0, 7.0, 9.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.23706817626953, -46.19571304321289, -44.15435791015625, -42.11300277709961, -40.07164764404297, -38.03029251098633, -35.98893737792969, -33.94758224487305, -31.906227111816406, -29.864871978759766, -27.823516845703125, -25.782161712646484, -23.740806579589844, -21.699451446533203, -19.658096313476562, -17.616741180419922, -15.575386047363281, -13.53403091430664, -11.49267578125, -9.45132064819336, -7.409965515136719, -5.368610382080078, -3.3272552490234375, -1.2859001159667969, 0.7554550170898438, 2.7968101501464844, 4.838165283203125, 6.879520416259766, 8.920875549316406, 10.962230682373047, 13.003585815429688, 15.044940948486328, 17.0863037109375, 19.12765884399414, 21.16901397705078, 23.210369110107422, 25.251724243164062, 27.293079376220703, 29.334434509277344, 31.375789642333984, 33.417144775390625, 35.458499908447266, 37.499855041503906, 39.54121017456055, 41.58256530761719, 43.62392044067383, 45.66527557373047, 47.70663070678711, 49.74798583984375, 51.78934097290039, 53.83069610595703, 55.87205123901367, 57.91340637207031, 59.95476150512695, 61.996116638183594, 64.0374755859375, 66.07882690429688, 68.12017822265625, 70.16153717041016, 72.20289611816406, 74.24424743652344, 76.28559875488281, 78.32695770263672, 80.36831665039062, 82.40966796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 8.0, 9.0, 14.0, 21.0, 36.0, 59.0, 64.0, 107.0, 202.0, 399.0, 802.0, 2049.0, 6321.0, 30338.0, 916508.0, 3180082.0, 44208.0, 8368.0, 2635.0, 988.0, 449.0, 245.0, 121.0, 80.0, 57.0, 25.0, 17.0, 14.0, 16.0, 10.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.171875, -14.650390625, -14.12890625, -13.607421875, -13.0859375, -12.564453125, -12.04296875, -11.521484375, -11.0, -10.478515625, -9.95703125, -9.435546875, -8.9140625, -8.392578125, -7.87109375, -7.349609375, -6.828125, -6.306640625, -5.78515625, -5.263671875, -4.7421875, -4.220703125, -3.69921875, -3.177734375, -2.65625, -2.134765625, -1.61328125, -1.091796875, -0.5703125, -0.048828125, 0.47265625, 0.994140625, 1.515625, 2.037109375, 2.55859375, 3.080078125, 3.6015625, 4.123046875, 4.64453125, 5.166015625, 5.6875, 6.208984375, 6.73046875, 7.251953125, 7.7734375, 8.294921875, 8.81640625, 9.337890625, 9.859375, 10.380859375, 10.90234375, 11.423828125, 11.9453125, 12.466796875, 12.98828125, 13.509765625, 14.03125, 14.552734375, 15.07421875, 15.595703125, 16.1171875, 16.638671875, 17.16015625, 17.681640625, 18.203125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 6.0, 1.0, 4.0, 10.0, 16.0, 22.0, 24.0, 17.0, 39.0, 40.0, 45.0, 52.0, 57.0, 63.0, 60.0, 54.0, 76.0, 54.0, 63.0, 50.0, 52.0, 28.0, 42.0, 31.0, 27.0, 17.0, 19.0, 10.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.301727294921875, -2.17962646484375, -2.057525634765625, -1.9354248046875, -1.813323974609375, -1.69122314453125, -1.569122314453125, -1.447021484375, -1.324920654296875, -1.20281982421875, -1.080718994140625, -0.9586181640625, -0.836517333984375, -0.71441650390625, -0.592315673828125, -0.47021484375, -0.348114013671875, -0.22601318359375, -0.103912353515625, 0.0181884765625, 0.140289306640625, 0.26239013671875, 0.384490966796875, 0.506591796875, 0.628692626953125, 0.75079345703125, 0.872894287109375, 0.9949951171875, 1.117095947265625, 1.23919677734375, 1.361297607421875, 1.4833984375, 1.605499267578125, 1.72760009765625, 1.849700927734375, 1.9718017578125, 2.093902587890625, 2.21600341796875, 2.338104248046875, 2.460205078125, 2.582305908203125, 2.70440673828125, 2.826507568359375, 2.9486083984375, 3.070709228515625, 3.19281005859375, 3.314910888671875, 3.43701171875, 3.559112548828125, 3.68121337890625, 3.803314208984375, 3.9254150390625, 4.047515869140625, 4.16961669921875, 4.291717529296875, 4.413818359375, 4.535919189453125, 4.65802001953125, 4.780120849609375, 4.9022216796875, 5.024322509765625, 5.14642333984375, 5.268524169921875, 5.390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 9.0, 2.0, 13.0, 26.0, 23.0, 41.0, 50.0, 72.0, 92.0, 166.0, 260.0, 403.0, 733.0, 1528.0, 3726.0, 10568.0, 39804.0, 274940.0, 3601730.0, 211619.0, 33501.0, 8906.0, 3012.0, 1312.0, 619.0, 343.0, 208.0, 138.0, 122.0, 78.0, 57.0, 42.0, 40.0, 23.0, 19.0, 12.0, 6.0, 5.0, 7.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-13.0625, -12.6719970703125, -12.281494140625, -11.8909912109375, -11.50048828125, -11.1099853515625, -10.719482421875, -10.3289794921875, -9.9384765625, -9.5479736328125, -9.157470703125, -8.7669677734375, -8.37646484375, -7.9859619140625, -7.595458984375, -7.2049560546875, -6.814453125, -6.4239501953125, -6.033447265625, -5.6429443359375, -5.25244140625, -4.8619384765625, -4.471435546875, -4.0809326171875, -3.6904296875, -3.2999267578125, -2.909423828125, -2.5189208984375, -2.12841796875, -1.7379150390625, -1.347412109375, -0.9569091796875, -0.56640625, -0.1759033203125, 0.214599609375, 0.6051025390625, 0.99560546875, 1.3861083984375, 1.776611328125, 2.1671142578125, 2.5576171875, 2.9481201171875, 3.338623046875, 3.7291259765625, 4.11962890625, 4.5101318359375, 4.900634765625, 5.2911376953125, 5.681640625, 6.0721435546875, 6.462646484375, 6.8531494140625, 7.24365234375, 7.6341552734375, 8.024658203125, 8.4151611328125, 8.8056640625, 9.1961669921875, 9.586669921875, 9.9771728515625, 10.36767578125, 10.7581787109375, 11.148681640625, 11.5391845703125, 11.9296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 13.0, 27.0, 42.0, 73.0, 113.0, 323.0, 1356.0, 1451.0, 369.0, 118.0, 69.0, 38.0, 34.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.1832275390625, -13.593017578125, -13.0028076171875, -12.41259765625, -11.8223876953125, -11.232177734375, -10.6419677734375, -10.0517578125, -9.4615478515625, -8.871337890625, -8.2811279296875, -7.69091796875, -7.1007080078125, -6.510498046875, -5.9202880859375, -5.330078125, -4.7398681640625, -4.149658203125, -3.5594482421875, -2.96923828125, -2.3790283203125, -1.788818359375, -1.1986083984375, -0.6083984375, -0.0181884765625, 0.572021484375, 1.1622314453125, 1.75244140625, 2.3426513671875, 2.932861328125, 3.5230712890625, 4.11328125, 4.7034912109375, 5.293701171875, 5.8839111328125, 6.47412109375, 7.0643310546875, 7.654541015625, 8.2447509765625, 8.8349609375, 9.4251708984375, 10.015380859375, 10.6055908203125, 11.19580078125, 11.7860107421875, 12.376220703125, 12.9664306640625, 13.556640625, 14.1468505859375, 14.737060546875, 15.3272705078125, 15.91748046875, 16.5076904296875, 17.097900390625, 17.6881103515625, 18.2783203125, 18.8685302734375, 19.458740234375, 20.0489501953125, 20.63916015625, 21.2293701171875, 21.819580078125, 22.4097900390625, 23.0]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 12.0, 18.0, 23.0, 45.0, 74.0, 122.0, 169.0, 147.0, 136.0, 85.0, 49.0, 36.0, 28.0, 11.0, 5.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.79319763183594, -78.28009033203125, -75.76698303222656, -73.2538833618164, -70.74077606201172, -68.22766876220703, -65.71456909179688, -63.20146179199219, -60.6883544921875, -58.17524719238281, -55.66214370727539, -53.14904022216797, -50.63593292236328, -48.122825622558594, -45.60972213745117, -43.09661865234375, -40.58351135253906, -38.070404052734375, -35.55730056762695, -33.04419708251953, -30.531089782714844, -28.01798439025879, -25.504878997802734, -22.99177360534668, -20.478668212890625, -17.96556282043457, -15.452457427978516, -12.939352035522461, -10.426246643066406, -7.913141250610352, -5.400035858154297, -2.886930465698242, -0.3738250732421875, 2.139280319213867, 4.652385711669922, 7.165491104125977, 9.678596496582031, 12.191701889038086, 14.70480728149414, 17.217912673950195, 19.73101806640625, 22.244123458862305, 24.75722885131836, 27.270334243774414, 29.78343963623047, 32.296546936035156, 34.80965042114258, 37.32275390625, 39.83586120605469, 42.348968505859375, 44.8620719909668, 47.37517547607422, 49.888282775878906, 52.401390075683594, 54.914493560791016, 57.42759704589844, 59.940704345703125, 62.45381164550781, 64.9669189453125, 67.48001861572266, 69.99312591552734, 72.50623321533203, 75.01933288574219, 77.53244018554688, 80.04554748535156]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 16.0, 12.0, 14.0, 18.0, 25.0, 11.0, 27.0, 19.0, 33.0, 27.0, 26.0, 42.0, 36.0, 41.0, 33.0, 47.0, 47.0, 37.0, 42.0, 34.0, 52.0, 35.0, 35.0, 35.0, 28.0, 36.0, 28.0, 29.0, 17.0, 15.0, 15.0, 21.0, 8.0, 5.0, 10.0, 6.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-39.75970458984375, -38.49917221069336, -37.23863983154297, -35.97810745239258, -34.71757507324219, -33.45703887939453, -32.19650650024414, -30.93597412109375, -29.67544174194336, -28.41490936279297, -27.154376983642578, -25.893842697143555, -24.633310317993164, -23.372777938842773, -22.11224365234375, -20.85171127319336, -19.59117889404297, -18.330646514892578, -17.070114135742188, -15.809579849243164, -14.549047470092773, -13.288515090942383, -12.027981758117676, -10.767448425292969, -9.506916046142578, -8.246383666992188, -6.9858503341674805, -5.725317478179932, -4.464784622192383, -3.204251766204834, -1.9437189102172852, -0.6831855773925781, 0.5773429870605469, 1.8378758430480957, 3.0984086990356445, 4.358941555023193, 5.619474411010742, 6.880007266998291, 8.14054012298584, 9.401073455810547, 10.661605834960938, 11.922138214111328, 13.182671546936035, 14.443204879760742, 15.703737258911133, 16.964269638061523, 18.224803924560547, 19.485336303710938, 20.745868682861328, 22.00640106201172, 23.26693344116211, 24.527467727661133, 25.788000106811523, 27.048532485961914, 28.309066772460938, 29.569599151611328, 30.83013153076172, 32.09066390991211, 33.3511962890625, 34.61172866821289, 35.87226104736328, 37.13279724121094, 38.39332962036133, 39.65386199951172, 40.91439437866211]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 8.0, 26.0, 10.0, 23.0, 29.0, 38.0, 55.0, 81.0, 113.0, 156.0, 260.0, 363.0, 517.0, 802.0, 1232.0, 2096.0, 3628.0, 6242.0, 12328.0, 25775.0, 61815.0, 204085.0, 463544.0, 163962.0, 53112.0, 22853.0, 11116.0, 5714.0, 3226.0, 1889.0, 1190.0, 739.0, 486.0, 295.0, 217.0, 143.0, 102.0, 55.0, 62.0, 45.0, 34.0, 17.0, 16.0, 14.0, 7.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.51171875, -7.27264404296875, -7.0335693359375, -6.79449462890625, -6.555419921875, -6.31634521484375, -6.0772705078125, -5.83819580078125, -5.59912109375, -5.36004638671875, -5.1209716796875, -4.88189697265625, -4.642822265625, -4.40374755859375, -4.1646728515625, -3.92559814453125, -3.6865234375, -3.44744873046875, -3.2083740234375, -2.96929931640625, -2.730224609375, -2.49114990234375, -2.2520751953125, -2.01300048828125, -1.77392578125, -1.53485107421875, -1.2957763671875, -1.05670166015625, -0.817626953125, -0.57855224609375, -0.3394775390625, -0.10040283203125, 0.138671875, 0.37774658203125, 0.6168212890625, 0.85589599609375, 1.094970703125, 1.33404541015625, 1.5731201171875, 1.81219482421875, 2.05126953125, 2.29034423828125, 2.5294189453125, 2.76849365234375, 3.007568359375, 3.24664306640625, 3.4857177734375, 3.72479248046875, 3.9638671875, 4.20294189453125, 4.4420166015625, 4.68109130859375, 4.920166015625, 5.15924072265625, 5.3983154296875, 5.63739013671875, 5.87646484375, 6.11553955078125, 6.3546142578125, 6.59368896484375, 6.832763671875, 7.07183837890625, 7.3109130859375, 7.54998779296875, 7.7890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 9.0, 6.0, 17.0, 8.0, 19.0, 23.0, 33.0, 26.0, 36.0, 43.0, 41.0, 40.0, 43.0, 66.0, 60.0, 62.0, 55.0, 49.0, 53.0, 26.0, 49.0, 47.0, 33.0, 27.0, 26.0, 19.0, 21.0, 16.0, 7.0, 11.0, 9.0, 6.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.708984375, -3.591705322265625, -3.47442626953125, -3.357147216796875, -3.2398681640625, -3.122589111328125, -3.00531005859375, -2.888031005859375, -2.770751953125, -2.653472900390625, -2.53619384765625, -2.418914794921875, -2.3016357421875, -2.184356689453125, -2.06707763671875, -1.949798583984375, -1.83251953125, -1.715240478515625, -1.59796142578125, -1.480682373046875, -1.3634033203125, -1.246124267578125, -1.12884521484375, -1.011566162109375, -0.894287109375, -0.777008056640625, -0.65972900390625, -0.542449951171875, -0.4251708984375, -0.307891845703125, -0.19061279296875, -0.073333740234375, 0.0439453125, 0.161224365234375, 0.27850341796875, 0.395782470703125, 0.5130615234375, 0.630340576171875, 0.74761962890625, 0.864898681640625, 0.982177734375, 1.099456787109375, 1.21673583984375, 1.334014892578125, 1.4512939453125, 1.568572998046875, 1.68585205078125, 1.803131103515625, 1.92041015625, 2.037689208984375, 2.15496826171875, 2.272247314453125, 2.3895263671875, 2.506805419921875, 2.62408447265625, 2.741363525390625, 2.858642578125, 2.975921630859375, 3.09320068359375, 3.210479736328125, 3.3277587890625, 3.445037841796875, 3.56231689453125, 3.679595947265625, 3.796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 8.0, 7.0, 10.0, 9.0, 13.0, 24.0, 25.0, 53.0, 54.0, 96.0, 144.0, 216.0, 457.0, 903.0, 2237.0, 6727.0, 31980.0, 409245.0, 548731.0, 35757.0, 7311.0, 2359.0, 1014.0, 456.0, 284.0, 148.0, 86.0, 57.0, 38.0, 32.0, 15.0, 18.0, 6.0, 11.0, 6.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.0430908203125, -12.500244140625, -11.9573974609375, -11.41455078125, -10.8717041015625, -10.328857421875, -9.7860107421875, -9.2431640625, -8.7003173828125, -8.157470703125, -7.6146240234375, -7.07177734375, -6.5289306640625, -5.986083984375, -5.4432373046875, -4.900390625, -4.3575439453125, -3.814697265625, -3.2718505859375, -2.72900390625, -2.1861572265625, -1.643310546875, -1.1004638671875, -0.5576171875, -0.0147705078125, 0.528076171875, 1.0709228515625, 1.61376953125, 2.1566162109375, 2.699462890625, 3.2423095703125, 3.78515625, 4.3280029296875, 4.870849609375, 5.4136962890625, 5.95654296875, 6.4993896484375, 7.042236328125, 7.5850830078125, 8.1279296875, 8.6707763671875, 9.213623046875, 9.7564697265625, 10.29931640625, 10.8421630859375, 11.385009765625, 11.9278564453125, 12.470703125, 13.0135498046875, 13.556396484375, 14.0992431640625, 14.64208984375, 15.1849365234375, 15.727783203125, 16.2706298828125, 16.8134765625, 17.3563232421875, 17.899169921875, 18.4420166015625, 18.98486328125, 19.5277099609375, 20.070556640625, 20.6134033203125, 21.15625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 13.0, 29.0, 23.0, 34.0, 42.0, 40.0, 51.0, 85.0, 68.0, 76.0, 64.0, 60.0, 57.0, 57.0, 58.0, 62.0, 31.0, 25.0, 20.0, 23.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.96875, -22.340087890625, -21.71142578125, -21.082763671875, -20.4541015625, -19.825439453125, -19.19677734375, -18.568115234375, -17.939453125, -17.310791015625, -16.68212890625, -16.053466796875, -15.4248046875, -14.796142578125, -14.16748046875, -13.538818359375, -12.91015625, -12.281494140625, -11.65283203125, -11.024169921875, -10.3955078125, -9.766845703125, -9.13818359375, -8.509521484375, -7.880859375, -7.252197265625, -6.62353515625, -5.994873046875, -5.3662109375, -4.737548828125, -4.10888671875, -3.480224609375, -2.8515625, -2.222900390625, -1.59423828125, -0.965576171875, -0.3369140625, 0.291748046875, 0.92041015625, 1.549072265625, 2.177734375, 2.806396484375, 3.43505859375, 4.063720703125, 4.6923828125, 5.321044921875, 5.94970703125, 6.578369140625, 7.20703125, 7.835693359375, 8.46435546875, 9.093017578125, 9.7216796875, 10.350341796875, 10.97900390625, 11.607666015625, 12.236328125, 12.864990234375, 13.49365234375, 14.122314453125, 14.7509765625, 15.379638671875, 16.00830078125, 16.636962890625, 17.265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 12.0, 20.0, 25.0, 46.0, 97.0, 182.0, 386.0, 1147.0, 4659.0, 36248.0, 791188.0, 197872.0, 13000.0, 2340.0, 734.0, 266.0, 128.0, 66.0, 32.0, 17.0, 7.0, 12.0, 11.0, 4.0, 5.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.6875, -11.3514404296875, -11.015380859375, -10.6793212890625, -10.34326171875, -10.0072021484375, -9.671142578125, -9.3350830078125, -8.9990234375, -8.6629638671875, -8.326904296875, -7.9908447265625, -7.65478515625, -7.3187255859375, -6.982666015625, -6.6466064453125, -6.310546875, -5.9744873046875, -5.638427734375, -5.3023681640625, -4.96630859375, -4.6302490234375, -4.294189453125, -3.9581298828125, -3.6220703125, -3.2860107421875, -2.949951171875, -2.6138916015625, -2.27783203125, -1.9417724609375, -1.605712890625, -1.2696533203125, -0.93359375, -0.5975341796875, -0.261474609375, 0.0745849609375, 0.41064453125, 0.7467041015625, 1.082763671875, 1.4188232421875, 1.7548828125, 2.0909423828125, 2.427001953125, 2.7630615234375, 3.09912109375, 3.4351806640625, 3.771240234375, 4.1072998046875, 4.443359375, 4.7794189453125, 5.115478515625, 5.4515380859375, 5.78759765625, 6.1236572265625, 6.459716796875, 6.7957763671875, 7.1318359375, 7.4678955078125, 7.803955078125, 8.1400146484375, 8.47607421875, 8.8121337890625, 9.148193359375, 9.4842529296875, 9.8203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 7.0, 9.0, 18.0, 11.0, 29.0, 30.0, 61.0, 69.0, 111.0, 143.0, 158.0, 105.0, 60.0, 46.0, 33.0, 21.0, 12.0, 14.0, 7.0, 8.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011653900146484375, -0.0011276155710220337, -0.0010898411273956299, -0.001052066683769226, -0.0010142922401428223, -0.0009765177965164185, -0.0009387433528900146, -0.0009009689092636108, -0.000863194465637207, -0.0008254200220108032, -0.0007876455783843994, -0.0007498711347579956, -0.0007120966911315918, -0.000674322247505188, -0.0006365478038787842, -0.0005987733602523804, -0.0005609989166259766, -0.0005232244729995728, -0.00048545002937316895, -0.00044767558574676514, -0.00040990114212036133, -0.0003721266984939575, -0.0003343522548675537, -0.0002965778112411499, -0.0002588033676147461, -0.00022102892398834229, -0.00018325448036193848, -0.00014548003673553467, -0.00010770559310913086, -6.993114948272705e-05, -3.215670585632324e-05, 5.617737770080566e-06, 4.3392181396484375e-05, 8.116662502288818e-05, 0.00011894106864929199, 0.0001567155122756958, 0.0001944899559020996, 0.00023226439952850342, 0.0002700388431549072, 0.00030781328678131104, 0.00034558773040771484, 0.00038336217403411865, 0.00042113661766052246, 0.00045891106128692627, 0.0004966855049133301, 0.0005344599485397339, 0.0005722343921661377, 0.0006100088357925415, 0.0006477832794189453, 0.0006855577230453491, 0.0007233321666717529, 0.0007611066102981567, 0.0007988810539245605, 0.0008366554975509644, 0.0008744299411773682, 0.000912204384803772, 0.0009499788284301758, 0.0009877532720565796, 0.0010255277156829834, 0.0010633021593093872, 0.001101076602935791, 0.0011388510465621948, 0.0011766254901885986, 0.0012143999338150024, 0.0012521743774414062]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 3.0, 5.0, 6.0, 16.0, 15.0, 14.0, 25.0, 34.0, 56.0, 116.0, 249.0, 509.0, 1264.0, 3366.0, 14333.0, 137041.0, 800234.0, 76605.0, 9931.0, 2722.0, 1028.0, 463.0, 220.0, 110.0, 50.0, 34.0, 25.0, 18.0, 15.0, 9.0, 6.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.72265625, -6.47723388671875, -6.2318115234375, -5.98638916015625, -5.740966796875, -5.49554443359375, -5.2501220703125, -5.00469970703125, -4.75927734375, -4.51385498046875, -4.2684326171875, -4.02301025390625, -3.777587890625, -3.53216552734375, -3.2867431640625, -3.04132080078125, -2.7958984375, -2.55047607421875, -2.3050537109375, -2.05963134765625, -1.814208984375, -1.56878662109375, -1.3233642578125, -1.07794189453125, -0.83251953125, -0.58709716796875, -0.3416748046875, -0.09625244140625, 0.149169921875, 0.39459228515625, 0.6400146484375, 0.88543701171875, 1.130859375, 1.37628173828125, 1.6217041015625, 1.86712646484375, 2.112548828125, 2.35797119140625, 2.6033935546875, 2.84881591796875, 3.09423828125, 3.33966064453125, 3.5850830078125, 3.83050537109375, 4.075927734375, 4.32135009765625, 4.5667724609375, 4.81219482421875, 5.0576171875, 5.30303955078125, 5.5484619140625, 5.79388427734375, 6.039306640625, 6.28472900390625, 6.5301513671875, 6.77557373046875, 7.02099609375, 7.26641845703125, 7.5118408203125, 7.75726318359375, 8.002685546875, 8.24810791015625, 8.4935302734375, 8.73895263671875, 8.984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 8.0, 8.0, 16.0, 26.0, 22.0, 47.0, 51.0, 64.0, 71.0, 93.0, 99.0, 103.0, 69.0, 79.0, 47.0, 42.0, 33.0, 32.0, 21.0, 15.0, 15.0, 4.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.962890625, -3.789337158203125, -3.61578369140625, -3.442230224609375, -3.2686767578125, -3.095123291015625, -2.92156982421875, -2.748016357421875, -2.574462890625, -2.400909423828125, -2.22735595703125, -2.053802490234375, -1.8802490234375, -1.706695556640625, -1.53314208984375, -1.359588623046875, -1.18603515625, -1.012481689453125, -0.83892822265625, -0.665374755859375, -0.4918212890625, -0.318267822265625, -0.14471435546875, 0.028839111328125, 0.202392578125, 0.375946044921875, 0.54949951171875, 0.723052978515625, 0.8966064453125, 1.070159912109375, 1.24371337890625, 1.417266845703125, 1.5908203125, 1.764373779296875, 1.93792724609375, 2.111480712890625, 2.2850341796875, 2.458587646484375, 2.63214111328125, 2.805694580078125, 2.979248046875, 3.152801513671875, 3.32635498046875, 3.499908447265625, 3.6734619140625, 3.847015380859375, 4.02056884765625, 4.194122314453125, 4.36767578125, 4.541229248046875, 4.71478271484375, 4.888336181640625, 5.0618896484375, 5.235443115234375, 5.40899658203125, 5.582550048828125, 5.756103515625, 5.929656982421875, 6.10321044921875, 6.276763916015625, 6.4503173828125, 6.623870849609375, 6.79742431640625, 6.970977783203125, 7.14453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 9.0, 15.0, 44.0, 96.0, 219.0, 335.0, 179.0, 71.0, 17.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.24664306640625, -228.4665069580078, -222.68637084960938, -216.90621948242188, -211.12608337402344, -205.345947265625, -199.56581115722656, -193.78567504882812, -188.0055389404297, -182.22540283203125, -176.4452667236328, -170.66513061523438, -164.88497924804688, -159.10484313964844, -153.32470703125, -147.54457092285156, -141.76443481445312, -135.9842987060547, -130.20416259765625, -124.42401885986328, -118.64388275146484, -112.86373901367188, -107.08360290527344, -101.303466796875, -95.5233154296875, -89.74317932128906, -83.9630355834961, -78.18289947509766, -72.40276336669922, -66.62261962890625, -60.84248352050781, -55.062347412109375, -49.28221130371094, -43.502071380615234, -37.7219352722168, -31.941795349121094, -26.161657333374023, -20.381519317626953, -14.60137939453125, -8.821243286132812, -3.0411033630371094, 2.739035129547119, 8.519173622131348, 14.299312591552734, 20.079450607299805, 25.859588623046875, 31.639728546142578, 37.419864654541016, 43.20000457763672, 48.98014450073242, 54.76028060913086, 60.54042053222656, 66.320556640625, 72.10069274902344, 77.8808364868164, 83.66097259521484, 89.44111633300781, 95.22125244140625, 101.00139617919922, 106.78153228759766, 112.5616683959961, 118.34181213378906, 124.1219482421875, 129.90208435058594, 135.68222045898438]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 10.0, 4.0, 4.0, 4.0, 6.0, 10.0, 8.0, 13.0, 26.0, 32.0, 32.0, 33.0, 32.0, 35.0, 49.0, 49.0, 66.0, 55.0, 77.0, 61.0, 64.0, 48.0, 41.0, 35.0, 31.0, 25.0, 24.0, 25.0, 25.0, 18.0, 9.0, 11.0, 13.0, 7.0, 0.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.64801025390625, -57.46404266357422, -55.28007888793945, -53.09611129760742, -50.912147521972656, -48.728179931640625, -46.544212341308594, -44.36024475097656, -42.1762809753418, -39.992313385009766, -37.808349609375, -35.62438201904297, -33.44041442871094, -31.256450653076172, -29.07248306274414, -26.888517379760742, -24.704551696777344, -22.520586013793945, -20.336620330810547, -18.152652740478516, -15.968687057495117, -13.784721374511719, -11.600754737854004, -9.416788101196289, -7.232822418212891, -5.048856258392334, -2.8648900985717773, -0.6809239387512207, 1.503042221069336, 3.6870079040527344, 5.870974540710449, 8.054941177368164, 10.238906860351562, 12.422872543334961, 14.606839179992676, 16.79080581665039, 18.97477149963379, 21.158737182617188, 23.34270477294922, 25.526670455932617, 27.710636138916016, 29.894601821899414, 32.07856750488281, 34.262535095214844, 36.446502685546875, 38.63046646118164, 40.81443405151367, 42.99839782714844, 45.18236541748047, 47.3663330078125, 49.550296783447266, 51.7342643737793, 53.91822814941406, 56.102195739746094, 58.286163330078125, 60.470130920410156, 62.65409469604492, 64.83805847167969, 67.02202606201172, 69.20599365234375, 71.38996124267578, 73.57392883300781, 75.75788879394531, 77.94185638427734, 80.12582397460938]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 12.0, 14.0, 30.0, 42.0, 88.0, 148.0, 251.0, 502.0, 989.0, 2021.0, 4454.0, 10705.0, 28305.0, 92702.0, 569149.0, 2851610.0, 504811.0, 85018.0, 25598.0, 9552.0, 4172.0, 1957.0, 874.0, 521.0, 266.0, 167.0, 128.0, 61.0, 31.0, 32.0, 13.0, 15.0, 9.0, 5.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.0592041015625, -4.860595703125, -4.6619873046875, -4.46337890625, -4.2647705078125, -4.066162109375, -3.8675537109375, -3.6689453125, -3.4703369140625, -3.271728515625, -3.0731201171875, -2.87451171875, -2.6759033203125, -2.477294921875, -2.2786865234375, -2.080078125, -1.8814697265625, -1.682861328125, -1.4842529296875, -1.28564453125, -1.0870361328125, -0.888427734375, -0.6898193359375, -0.4912109375, -0.2926025390625, -0.093994140625, 0.1046142578125, 0.30322265625, 0.5018310546875, 0.700439453125, 0.8990478515625, 1.09765625, 1.2962646484375, 1.494873046875, 1.6934814453125, 1.89208984375, 2.0906982421875, 2.289306640625, 2.4879150390625, 2.6865234375, 2.8851318359375, 3.083740234375, 3.2823486328125, 3.48095703125, 3.6795654296875, 3.878173828125, 4.0767822265625, 4.275390625, 4.4739990234375, 4.672607421875, 4.8712158203125, 5.06982421875, 5.2684326171875, 5.467041015625, 5.6656494140625, 5.8642578125, 6.0628662109375, 6.261474609375, 6.4600830078125, 6.65869140625, 6.8572998046875, 7.055908203125, 7.2545166015625, 7.453125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 9.0, 4.0, 13.0, 28.0, 28.0, 49.0, 80.0, 97.0, 94.0, 115.0, 112.0, 92.0, 86.0, 61.0, 35.0, 38.0, 39.0, 15.0, 11.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.606414794921875, -2.39056396484375, -2.174713134765625, -1.9588623046875, -1.743011474609375, -1.52716064453125, -1.311309814453125, -1.095458984375, -0.879608154296875, -0.66375732421875, -0.447906494140625, -0.2320556640625, -0.016204833984375, 0.19964599609375, 0.415496826171875, 0.63134765625, 0.847198486328125, 1.06304931640625, 1.278900146484375, 1.4947509765625, 1.710601806640625, 1.92645263671875, 2.142303466796875, 2.358154296875, 2.574005126953125, 2.78985595703125, 3.005706787109375, 3.2215576171875, 3.437408447265625, 3.65325927734375, 3.869110107421875, 4.0849609375, 4.300811767578125, 4.51666259765625, 4.732513427734375, 4.9483642578125, 5.164215087890625, 5.38006591796875, 5.595916748046875, 5.811767578125, 6.027618408203125, 6.24346923828125, 6.459320068359375, 6.6751708984375, 6.891021728515625, 7.10687255859375, 7.322723388671875, 7.53857421875, 7.754425048828125, 7.97027587890625, 8.186126708984375, 8.4019775390625, 8.617828369140625, 8.83367919921875, 9.049530029296875, 9.265380859375, 9.481231689453125, 9.69708251953125, 9.912933349609375, 10.1287841796875, 10.344635009765625, 10.56048583984375, 10.776336669921875, 10.9921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 5.0, 5.0, 15.0, 17.0, 47.0, 75.0, 109.0, 189.0, 446.0, 855.0, 2538.0, 11336.0, 91600.0, 3369357.0, 672162.0, 36851.0, 5927.0, 1524.0, 600.0, 271.0, 154.0, 83.0, 44.0, 22.0, 17.0, 13.0, 4.0, 4.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.234375, -13.722412109375, -13.21044921875, -12.698486328125, -12.1865234375, -11.674560546875, -11.16259765625, -10.650634765625, -10.138671875, -9.626708984375, -9.11474609375, -8.602783203125, -8.0908203125, -7.578857421875, -7.06689453125, -6.554931640625, -6.04296875, -5.531005859375, -5.01904296875, -4.507080078125, -3.9951171875, -3.483154296875, -2.97119140625, -2.459228515625, -1.947265625, -1.435302734375, -0.92333984375, -0.411376953125, 0.1005859375, 0.612548828125, 1.12451171875, 1.636474609375, 2.1484375, 2.660400390625, 3.17236328125, 3.684326171875, 4.1962890625, 4.708251953125, 5.22021484375, 5.732177734375, 6.244140625, 6.756103515625, 7.26806640625, 7.780029296875, 8.2919921875, 8.803955078125, 9.31591796875, 9.827880859375, 10.33984375, 10.851806640625, 11.36376953125, 11.875732421875, 12.3876953125, 12.899658203125, 13.41162109375, 13.923583984375, 14.435546875, 14.947509765625, 15.45947265625, 15.971435546875, 16.4833984375, 16.995361328125, 17.50732421875, 18.019287109375, 18.53125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 12.0, 17.0, 16.0, 32.0, 68.0, 131.0, 211.0, 466.0, 1125.0, 1090.0, 420.0, 195.0, 115.0, 53.0, 37.0, 32.0, 22.0, 13.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.71875, -18.133544921875, -17.54833984375, -16.963134765625, -16.3779296875, -15.792724609375, -15.20751953125, -14.622314453125, -14.037109375, -13.451904296875, -12.86669921875, -12.281494140625, -11.6962890625, -11.111083984375, -10.52587890625, -9.940673828125, -9.35546875, -8.770263671875, -8.18505859375, -7.599853515625, -7.0146484375, -6.429443359375, -5.84423828125, -5.259033203125, -4.673828125, -4.088623046875, -3.50341796875, -2.918212890625, -2.3330078125, -1.747802734375, -1.16259765625, -0.577392578125, 0.0078125, 0.593017578125, 1.17822265625, 1.763427734375, 2.3486328125, 2.933837890625, 3.51904296875, 4.104248046875, 4.689453125, 5.274658203125, 5.85986328125, 6.445068359375, 7.0302734375, 7.615478515625, 8.20068359375, 8.785888671875, 9.37109375, 9.956298828125, 10.54150390625, 11.126708984375, 11.7119140625, 12.297119140625, 12.88232421875, 13.467529296875, 14.052734375, 14.637939453125, 15.22314453125, 15.808349609375, 16.3935546875, 16.978759765625, 17.56396484375, 18.149169921875, 18.734375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 12.0, 43.0, 133.0, 295.0, 311.0, 112.0, 50.0, 13.0, 11.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-214.93740844726562, -208.78524780273438, -202.63308715820312, -196.48092651367188, -190.32876586914062, -184.17660522460938, -178.02444458007812, -171.87228393554688, -165.72012329101562, -159.56796264648438, -153.41580200195312, -147.26364135742188, -141.11148071289062, -134.95932006835938, -128.80715942382812, -122.65499114990234, -116.50282287597656, -110.35066223144531, -104.19850158691406, -98.04634094238281, -91.89418029785156, -85.74201965332031, -79.58985137939453, -73.43769073486328, -67.28553009033203, -61.13336944580078, -54.98120880126953, -48.829044342041016, -42.676883697509766, -36.524723052978516, -30.37255859375, -24.22039794921875, -18.0682373046875, -11.916075706481934, -5.763914108276367, 0.3882484436035156, 6.540409088134766, 12.692569732666016, 18.84473419189453, 24.99689483642578, 31.14905548095703, 37.30121612548828, 43.45337677001953, 49.60554122924805, 55.7577018737793, 61.90986251831055, 68.06202697753906, 74.21418762207031, 80.36634826660156, 86.51850891113281, 92.67066955566406, 98.82283020019531, 104.97499084472656, 111.12715148925781, 117.2793197631836, 123.43148040771484, 129.58364868164062, 135.73580932617188, 141.88796997070312, 148.04013061523438, 154.19229125976562, 160.34445190429688, 166.49661254882812, 172.64877319335938, 178.80093383789062]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 10.0, 11.0, 15.0, 37.0, 33.0, 43.0, 47.0, 69.0, 75.0, 65.0, 58.0, 52.0, 64.0, 82.0, 59.0, 54.0, 45.0, 37.0, 22.0, 28.0, 23.0, 19.0, 14.0, 8.0, 8.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.04048156738281, -96.5303726196289, -94.020263671875, -91.5101547241211, -89.00004577636719, -86.48994445800781, -83.9798355102539, -81.4697265625, -78.9596176147461, -76.44950866699219, -73.93939971923828, -71.42929077148438, -68.919189453125, -66.4090805053711, -63.89897155761719, -61.38886260986328, -58.878753662109375, -56.36864471435547, -53.85853576660156, -51.34843063354492, -48.838321685791016, -46.32821273803711, -43.81810760498047, -41.30799865722656, -38.797889709472656, -36.28778076171875, -33.777671813964844, -31.267566680908203, -28.757457733154297, -26.24734878540039, -23.737241744995117, -21.227134704589844, -18.717018127441406, -16.2069091796875, -13.696802139282227, -11.186694145202637, -8.676586151123047, -6.166478157043457, -3.656370162963867, -1.1462631225585938, 1.3638458251953125, 3.8739538192749023, 6.384061813354492, 8.894169807434082, 11.404277801513672, 13.914385795593262, 16.42449378967285, 18.934600830078125, 21.44470977783203, 23.954818725585938, 26.46492576599121, 28.975032806396484, 31.48514175415039, 33.9952507019043, 36.50535583496094, 39.015464782714844, 41.52557373046875, 44.035682678222656, 46.54579162597656, 49.0558967590332, 51.56600570678711, 54.076114654541016, 56.586219787597656, 59.09632873535156, 61.60643768310547]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 14.0, 12.0, 22.0, 39.0, 53.0, 85.0, 133.0, 210.0, 320.0, 567.0, 1009.0, 1676.0, 2940.0, 5426.0, 10750.0, 22005.0, 47491.0, 110430.0, 292029.0, 326554.0, 123956.0, 52736.0, 24566.0, 12042.0, 5999.0, 3115.0, 1753.0, 1051.0, 560.0, 360.0, 252.0, 125.0, 79.0, 58.0, 56.0, 24.0, 10.0, 12.0, 7.0, 7.0, 5.0, 6.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.66839599609375, -5.4422607421875, -5.21612548828125, -4.989990234375, -4.76385498046875, -4.5377197265625, -4.31158447265625, -4.08544921875, -3.85931396484375, -3.6331787109375, -3.40704345703125, -3.180908203125, -2.95477294921875, -2.7286376953125, -2.50250244140625, -2.2763671875, -2.05023193359375, -1.8240966796875, -1.59796142578125, -1.371826171875, -1.14569091796875, -0.9195556640625, -0.69342041015625, -0.46728515625, -0.24114990234375, -0.0150146484375, 0.21112060546875, 0.437255859375, 0.66339111328125, 0.8895263671875, 1.11566162109375, 1.341796875, 1.56793212890625, 1.7940673828125, 2.02020263671875, 2.246337890625, 2.47247314453125, 2.6986083984375, 2.92474365234375, 3.15087890625, 3.37701416015625, 3.6031494140625, 3.82928466796875, 4.055419921875, 4.28155517578125, 4.5076904296875, 4.73382568359375, 4.9599609375, 5.18609619140625, 5.4122314453125, 5.63836669921875, 5.864501953125, 6.09063720703125, 6.3167724609375, 6.54290771484375, 6.76904296875, 6.99517822265625, 7.2213134765625, 7.44744873046875, 7.673583984375, 7.89971923828125, 8.1258544921875, 8.35198974609375, 8.578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 8.0, 7.0, 4.0, 13.0, 10.0, 19.0, 19.0, 20.0, 18.0, 25.0, 24.0, 29.0, 25.0, 23.0, 30.0, 39.0, 45.0, 34.0, 44.0, 34.0, 35.0, 29.0, 45.0, 40.0, 24.0, 35.0, 23.0, 31.0, 33.0, 24.0, 16.0, 33.0, 22.0, 16.0, 17.0, 13.0, 17.0, 16.0, 10.0, 6.0, 4.0, 8.0, 3.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.4698486328125, -2.386962890625, -2.3040771484375, -2.22119140625, -2.1383056640625, -2.055419921875, -1.9725341796875, -1.8896484375, -1.8067626953125, -1.723876953125, -1.6409912109375, -1.55810546875, -1.4752197265625, -1.392333984375, -1.3094482421875, -1.2265625, -1.1436767578125, -1.060791015625, -0.9779052734375, -0.89501953125, -0.8121337890625, -0.729248046875, -0.6463623046875, -0.5634765625, -0.4805908203125, -0.397705078125, -0.3148193359375, -0.23193359375, -0.1490478515625, -0.066162109375, 0.0167236328125, 0.099609375, 0.1824951171875, 0.265380859375, 0.3482666015625, 0.43115234375, 0.5140380859375, 0.596923828125, 0.6798095703125, 0.7626953125, 0.8455810546875, 0.928466796875, 1.0113525390625, 1.09423828125, 1.1771240234375, 1.260009765625, 1.3428955078125, 1.42578125, 1.5086669921875, 1.591552734375, 1.6744384765625, 1.75732421875, 1.8402099609375, 1.923095703125, 2.0059814453125, 2.0888671875, 2.1717529296875, 2.254638671875, 2.3375244140625, 2.42041015625, 2.5032958984375, 2.586181640625, 2.6690673828125, 2.751953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 7.0, 4.0, 11.0, 11.0, 16.0, 28.0, 36.0, 67.0, 90.0, 130.0, 211.0, 328.0, 623.0, 1183.0, 2971.0, 10959.0, 109572.0, 851580.0, 58479.0, 7585.0, 2337.0, 1010.0, 505.0, 286.0, 187.0, 102.0, 71.0, 56.0, 30.0, 22.0, 21.0, 11.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.28125, -23.5751953125, -22.869140625, -22.1630859375, -21.45703125, -20.7509765625, -20.044921875, -19.3388671875, -18.6328125, -17.9267578125, -17.220703125, -16.5146484375, -15.80859375, -15.1025390625, -14.396484375, -13.6904296875, -12.984375, -12.2783203125, -11.572265625, -10.8662109375, -10.16015625, -9.4541015625, -8.748046875, -8.0419921875, -7.3359375, -6.6298828125, -5.923828125, -5.2177734375, -4.51171875, -3.8056640625, -3.099609375, -2.3935546875, -1.6875, -0.9814453125, -0.275390625, 0.4306640625, 1.13671875, 1.8427734375, 2.548828125, 3.2548828125, 3.9609375, 4.6669921875, 5.373046875, 6.0791015625, 6.78515625, 7.4912109375, 8.197265625, 8.9033203125, 9.609375, 10.3154296875, 11.021484375, 11.7275390625, 12.43359375, 13.1396484375, 13.845703125, 14.5517578125, 15.2578125, 15.9638671875, 16.669921875, 17.3759765625, 18.08203125, 18.7880859375, 19.494140625, 20.2001953125, 20.90625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 10.0, 6.0, 13.0, 10.0, 15.0, 18.0, 25.0, 21.0, 20.0, 23.0, 42.0, 41.0, 39.0, 53.0, 56.0, 59.0, 57.0, 44.0, 49.0, 49.0, 43.0, 44.0, 30.0, 38.0, 28.0, 21.0, 31.0, 18.0, 23.0, 15.0, 8.0, 6.0, 15.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.921875, -18.38720703125, -17.8525390625, -17.31787109375, -16.783203125, -16.24853515625, -15.7138671875, -15.17919921875, -14.64453125, -14.10986328125, -13.5751953125, -13.04052734375, -12.505859375, -11.97119140625, -11.4365234375, -10.90185546875, -10.3671875, -9.83251953125, -9.2978515625, -8.76318359375, -8.228515625, -7.69384765625, -7.1591796875, -6.62451171875, -6.08984375, -5.55517578125, -5.0205078125, -4.48583984375, -3.951171875, -3.41650390625, -2.8818359375, -2.34716796875, -1.8125, -1.27783203125, -0.7431640625, -0.20849609375, 0.326171875, 0.86083984375, 1.3955078125, 1.93017578125, 2.46484375, 2.99951171875, 3.5341796875, 4.06884765625, 4.603515625, 5.13818359375, 5.6728515625, 6.20751953125, 6.7421875, 7.27685546875, 7.8115234375, 8.34619140625, 8.880859375, 9.41552734375, 9.9501953125, 10.48486328125, 11.01953125, 11.55419921875, 12.0888671875, 12.62353515625, 13.158203125, 13.69287109375, 14.2275390625, 14.76220703125, 15.296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 10.0, 13.0, 26.0, 27.0, 60.0, 85.0, 150.0, 280.0, 609.0, 1892.0, 8872.0, 82681.0, 827930.0, 111314.0, 10952.0, 2247.0, 671.0, 308.0, 152.0, 99.0, 60.0, 36.0, 21.0, 23.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.78515625, -6.54754638671875, -6.3099365234375, -6.07232666015625, -5.834716796875, -5.59710693359375, -5.3594970703125, -5.12188720703125, -4.88427734375, -4.64666748046875, -4.4090576171875, -4.17144775390625, -3.933837890625, -3.69622802734375, -3.4586181640625, -3.22100830078125, -2.9833984375, -2.74578857421875, -2.5081787109375, -2.27056884765625, -2.032958984375, -1.79534912109375, -1.5577392578125, -1.32012939453125, -1.08251953125, -0.84490966796875, -0.6072998046875, -0.36968994140625, -0.132080078125, 0.10552978515625, 0.3431396484375, 0.58074951171875, 0.818359375, 1.05596923828125, 1.2935791015625, 1.53118896484375, 1.768798828125, 2.00640869140625, 2.2440185546875, 2.48162841796875, 2.71923828125, 2.95684814453125, 3.1944580078125, 3.43206787109375, 3.669677734375, 3.90728759765625, 4.1448974609375, 4.38250732421875, 4.6201171875, 4.85772705078125, 5.0953369140625, 5.33294677734375, 5.570556640625, 5.80816650390625, 6.0457763671875, 6.28338623046875, 6.52099609375, 6.75860595703125, 6.9962158203125, 7.23382568359375, 7.471435546875, 7.70904541015625, 7.9466552734375, 8.18426513671875, 8.421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 2.0, 9.0, 7.0, 11.0, 10.0, 15.0, 14.0, 20.0, 30.0, 30.0, 31.0, 38.0, 72.0, 86.0, 99.0, 106.0, 88.0, 62.0, 42.0, 35.0, 34.0, 28.0, 20.0, 17.0, 19.0, 15.0, 6.0, 10.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008945465087890625, -0.0008629709482192993, -0.0008313953876495361, -0.000799819827079773, -0.0007682442665100098, -0.0007366687059402466, -0.0007050931453704834, -0.0006735175848007202, -0.000641942024230957, -0.0006103664636611938, -0.0005787909030914307, -0.0005472153425216675, -0.0005156397819519043, -0.0004840642213821411, -0.00045248866081237793, -0.00042091310024261475, -0.00038933753967285156, -0.0003577619791030884, -0.0003261864185333252, -0.000294610857963562, -0.00026303529739379883, -0.00023145973682403564, -0.00019988417625427246, -0.00016830861568450928, -0.0001367330551147461, -0.00010515749454498291, -7.358193397521973e-05, -4.200637340545654e-05, -1.043081283569336e-05, 2.1144747734069824e-05, 5.272030830383301e-05, 8.429586887359619e-05, 0.00011587142944335938, 0.00014744699001312256, 0.00017902255058288574, 0.00021059811115264893, 0.0002421736717224121, 0.0002737492322921753, 0.0003053247928619385, 0.00033690035343170166, 0.00036847591400146484, 0.00040005147457122803, 0.0004316270351409912, 0.0004632025957107544, 0.0004947781562805176, 0.0005263537168502808, 0.0005579292774200439, 0.0005895048379898071, 0.0006210803985595703, 0.0006526559591293335, 0.0006842315196990967, 0.0007158070802688599, 0.000747382640838623, 0.0007789582014083862, 0.0008105337619781494, 0.0008421093225479126, 0.0008736848831176758, 0.000905260443687439, 0.0009368360042572021, 0.0009684115648269653, 0.0009999871253967285, 0.0010315626859664917, 0.0010631382465362549, 0.001094713807106018, 0.0011262893676757812]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 8.0, 14.0, 12.0, 12.0, 14.0, 35.0, 51.0, 52.0, 96.0, 103.0, 179.0, 299.0, 489.0, 883.0, 1857.0, 4744.0, 15436.0, 88161.0, 713737.0, 184628.0, 25778.0, 6611.0, 2524.0, 1183.0, 600.0, 383.0, 213.0, 147.0, 87.0, 54.0, 48.0, 34.0, 29.0, 19.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.37109375, -4.2186279296875, -4.066162109375, -3.9136962890625, -3.76123046875, -3.6087646484375, -3.456298828125, -3.3038330078125, -3.1513671875, -2.9989013671875, -2.846435546875, -2.6939697265625, -2.54150390625, -2.3890380859375, -2.236572265625, -2.0841064453125, -1.931640625, -1.7791748046875, -1.626708984375, -1.4742431640625, -1.32177734375, -1.1693115234375, -1.016845703125, -0.8643798828125, -0.7119140625, -0.5594482421875, -0.406982421875, -0.2545166015625, -0.10205078125, 0.0504150390625, 0.202880859375, 0.3553466796875, 0.5078125, 0.6602783203125, 0.812744140625, 0.9652099609375, 1.11767578125, 1.2701416015625, 1.422607421875, 1.5750732421875, 1.7275390625, 1.8800048828125, 2.032470703125, 2.1849365234375, 2.33740234375, 2.4898681640625, 2.642333984375, 2.7947998046875, 2.947265625, 3.0997314453125, 3.252197265625, 3.4046630859375, 3.55712890625, 3.7095947265625, 3.862060546875, 4.0145263671875, 4.1669921875, 4.3194580078125, 4.471923828125, 4.6243896484375, 4.77685546875, 4.9293212890625, 5.081787109375, 5.2342529296875, 5.38671875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 6.0, 2.0, 12.0, 9.0, 5.0, 11.0, 17.0, 10.0, 25.0, 26.0, 31.0, 29.0, 36.0, 31.0, 61.0, 55.0, 68.0, 67.0, 67.0, 55.0, 59.0, 54.0, 56.0, 38.0, 28.0, 28.0, 18.0, 18.0, 15.0, 12.0, 9.0, 7.0, 7.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.20703125, -4.084075927734375, -3.96112060546875, -3.838165283203125, -3.7152099609375, -3.592254638671875, -3.46929931640625, -3.346343994140625, -3.223388671875, -3.100433349609375, -2.97747802734375, -2.854522705078125, -2.7315673828125, -2.608612060546875, -2.48565673828125, -2.362701416015625, -2.23974609375, -2.116790771484375, -1.99383544921875, -1.870880126953125, -1.7479248046875, -1.624969482421875, -1.50201416015625, -1.379058837890625, -1.256103515625, -1.133148193359375, -1.01019287109375, -0.887237548828125, -0.7642822265625, -0.641326904296875, -0.51837158203125, -0.395416259765625, -0.2724609375, -0.149505615234375, -0.02655029296875, 0.096405029296875, 0.2193603515625, 0.342315673828125, 0.46527099609375, 0.588226318359375, 0.711181640625, 0.834136962890625, 0.95709228515625, 1.080047607421875, 1.2030029296875, 1.325958251953125, 1.44891357421875, 1.571868896484375, 1.69482421875, 1.817779541015625, 1.94073486328125, 2.063690185546875, 2.1866455078125, 2.309600830078125, 2.43255615234375, 2.555511474609375, 2.678466796875, 2.801422119140625, 2.92437744140625, 3.047332763671875, 3.1702880859375, 3.293243408203125, 3.41619873046875, 3.539154052734375, 3.662109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 23.0, 66.0, 203.0, 355.0, 185.0, 103.0, 28.0, 16.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.56884765625, -135.01531982421875, -129.46180725097656, -123.90828704833984, -118.35476684570312, -112.8012466430664, -107.24772644042969, -101.69420623779297, -96.14068603515625, -90.58716583251953, -85.03364562988281, -79.4801254272461, -73.92660522460938, -68.37308502197266, -62.81956481933594, -57.26604461669922, -51.7125244140625, -46.15900421142578, -40.60548400878906, -35.051963806152344, -29.498443603515625, -23.944923400878906, -18.391403198242188, -12.837882995605469, -7.28436279296875, -1.7308425903320312, 3.8226776123046875, 9.376197814941406, 14.929718017578125, 20.483238220214844, 26.036758422851562, 31.59027862548828, 37.143798828125, 42.69731903076172, 48.25083923339844, 53.804359436035156, 59.357879638671875, 64.9113998413086, 70.46492004394531, 76.01844024658203, 81.57196044921875, 87.12548065185547, 92.67900085449219, 98.2325210571289, 103.78604125976562, 109.33956146240234, 114.89308166503906, 120.44660186767578, 126.0001220703125, 131.55364990234375, 137.10716247558594, 142.66067504882812, 148.21420288085938, 153.76773071289062, 159.3212432861328, 164.874755859375, 170.42828369140625, 175.9818115234375, 181.5353240966797, 187.08883666992188, 192.64236450195312, 198.19589233398438, 203.74940490722656, 209.30291748046875, 214.8564453125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 10.0, 8.0, 12.0, 11.0, 15.0, 10.0, 18.0, 18.0, 16.0, 32.0, 30.0, 21.0, 34.0, 38.0, 33.0, 53.0, 54.0, 52.0, 49.0, 55.0, 58.0, 42.0, 38.0, 29.0, 30.0, 35.0, 27.0, 24.0, 17.0, 28.0, 17.0, 13.0, 9.0, 10.0, 9.0, 5.0, 11.0, 6.0, 2.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.46921920776367, -54.72515869140625, -52.98109817504883, -51.237037658691406, -49.492977142333984, -47.74891662597656, -46.004852294921875, -44.26079559326172, -42.51673126220703, -40.77267074584961, -39.02861022949219, -37.284549713134766, -35.540489196777344, -33.79642868041992, -32.0523681640625, -30.308305740356445, -28.564247131347656, -26.820186614990234, -25.076126098632812, -23.33206558227539, -21.58800506591797, -19.843944549560547, -18.099882125854492, -16.35582160949707, -14.611761093139648, -12.867700576782227, -11.123640060424805, -9.379578590393066, -7.6355180740356445, -5.891457557678223, -4.147396087646484, -2.4033355712890625, -0.6592750549316406, 1.0847856998443604, 2.8288464546203613, 4.572907447814941, 6.316967964172363, 8.061028480529785, 9.805089950561523, 11.549150466918945, 13.293210983276367, 15.037271499633789, 16.78133201599121, 18.525394439697266, 20.269454956054688, 22.01351547241211, 23.75757598876953, 25.501636505126953, 27.245697021484375, 28.989757537841797, 30.73381805419922, 32.47787857055664, 34.22193908691406, 35.965999603271484, 37.710060119628906, 39.454124450683594, 41.19818115234375, 42.94224166870117, 44.686302185058594, 46.430362701416016, 48.17442321777344, 49.91848373413086, 51.66254425048828, 53.40660858154297, 55.15066909790039]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 15.0, 13.0, 37.0, 52.0, 86.0, 155.0, 285.0, 509.0, 964.0, 2096.0, 4545.0, 10853.0, 28997.0, 98919.0, 592660.0, 2691754.0, 615803.0, 98426.0, 28333.0, 10653.0, 4687.0, 2135.0, 1032.0, 499.0, 288.0, 173.0, 90.0, 68.0, 47.0, 20.0, 17.0, 16.0, 12.0, 10.0, 4.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.0174560546875, -4.847412109375, -4.6773681640625, -4.50732421875, -4.3372802734375, -4.167236328125, -3.9971923828125, -3.8271484375, -3.6571044921875, -3.487060546875, -3.3170166015625, -3.14697265625, -2.9769287109375, -2.806884765625, -2.6368408203125, -2.466796875, -2.2967529296875, -2.126708984375, -1.9566650390625, -1.78662109375, -1.6165771484375, -1.446533203125, -1.2764892578125, -1.1064453125, -0.9364013671875, -0.766357421875, -0.5963134765625, -0.42626953125, -0.2562255859375, -0.086181640625, 0.0838623046875, 0.25390625, 0.4239501953125, 0.593994140625, 0.7640380859375, 0.93408203125, 1.1041259765625, 1.274169921875, 1.4442138671875, 1.6142578125, 1.7843017578125, 1.954345703125, 2.1243896484375, 2.29443359375, 2.4644775390625, 2.634521484375, 2.8045654296875, 2.974609375, 3.1446533203125, 3.314697265625, 3.4847412109375, 3.65478515625, 3.8248291015625, 3.994873046875, 4.1649169921875, 4.3349609375, 4.5050048828125, 4.675048828125, 4.8450927734375, 5.01513671875, 5.1851806640625, 5.355224609375, 5.5252685546875, 5.6953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 4.0, 13.0, 10.0, 18.0, 14.0, 15.0, 25.0, 30.0, 35.0, 26.0, 39.0, 46.0, 54.0, 36.0, 57.0, 52.0, 61.0, 59.0, 55.0, 49.0, 36.0, 28.0, 34.0, 36.0, 27.0, 27.0, 22.0, 16.0, 17.0, 17.0, 10.0, 7.0, 8.0, 1.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.6634521484375, -2.549560546875, -2.4356689453125, -2.32177734375, -2.2078857421875, -2.093994140625, -1.9801025390625, -1.8662109375, -1.7523193359375, -1.638427734375, -1.5245361328125, -1.41064453125, -1.2967529296875, -1.182861328125, -1.0689697265625, -0.955078125, -0.8411865234375, -0.727294921875, -0.6134033203125, -0.49951171875, -0.3856201171875, -0.271728515625, -0.1578369140625, -0.0439453125, 0.0699462890625, 0.183837890625, 0.2977294921875, 0.41162109375, 0.5255126953125, 0.639404296875, 0.7532958984375, 0.8671875, 0.9810791015625, 1.094970703125, 1.2088623046875, 1.32275390625, 1.4366455078125, 1.550537109375, 1.6644287109375, 1.7783203125, 1.8922119140625, 2.006103515625, 2.1199951171875, 2.23388671875, 2.3477783203125, 2.461669921875, 2.5755615234375, 2.689453125, 2.8033447265625, 2.917236328125, 3.0311279296875, 3.14501953125, 3.2589111328125, 3.372802734375, 3.4866943359375, 3.6005859375, 3.7144775390625, 3.828369140625, 3.9422607421875, 4.05615234375, 4.1700439453125, 4.283935546875, 4.3978271484375, 4.51171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 12.0, 21.0, 35.0, 47.0, 57.0, 119.0, 166.0, 310.0, 610.0, 1340.0, 3130.0, 9332.0, 35758.0, 233057.0, 3249080.0, 574432.0, 64277.0, 14615.0, 4417.0, 1697.0, 754.0, 387.0, 231.0, 137.0, 87.0, 49.0, 36.0, 21.0, 22.0, 12.0, 4.0, 3.0, 7.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7635498046875, -9.464599609375, -9.1656494140625, -8.86669921875, -8.5677490234375, -8.268798828125, -7.9698486328125, -7.6708984375, -7.3719482421875, -7.072998046875, -6.7740478515625, -6.47509765625, -6.1761474609375, -5.877197265625, -5.5782470703125, -5.279296875, -4.9803466796875, -4.681396484375, -4.3824462890625, -4.08349609375, -3.7845458984375, -3.485595703125, -3.1866455078125, -2.8876953125, -2.5887451171875, -2.289794921875, -1.9908447265625, -1.69189453125, -1.3929443359375, -1.093994140625, -0.7950439453125, -0.49609375, -0.1971435546875, 0.101806640625, 0.4007568359375, 0.69970703125, 0.9986572265625, 1.297607421875, 1.5965576171875, 1.8955078125, 2.1944580078125, 2.493408203125, 2.7923583984375, 3.09130859375, 3.3902587890625, 3.689208984375, 3.9881591796875, 4.287109375, 4.5860595703125, 4.885009765625, 5.1839599609375, 5.48291015625, 5.7818603515625, 6.080810546875, 6.3797607421875, 6.6787109375, 6.9776611328125, 7.276611328125, 7.5755615234375, 7.87451171875, 8.1734619140625, 8.472412109375, 8.7713623046875, 9.0703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 20.0, 17.0, 22.0, 32.0, 52.0, 84.0, 138.0, 245.0, 532.0, 995.0, 819.0, 456.0, 260.0, 133.0, 90.0, 58.0, 33.0, 20.0, 15.0, 11.0, 8.0, 4.0, 11.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.26123046875, -11.8505859375, -11.43994140625, -11.029296875, -10.61865234375, -10.2080078125, -9.79736328125, -9.38671875, -8.97607421875, -8.5654296875, -8.15478515625, -7.744140625, -7.33349609375, -6.9228515625, -6.51220703125, -6.1015625, -5.69091796875, -5.2802734375, -4.86962890625, -4.458984375, -4.04833984375, -3.6376953125, -3.22705078125, -2.81640625, -2.40576171875, -1.9951171875, -1.58447265625, -1.173828125, -0.76318359375, -0.3525390625, 0.05810546875, 0.46875, 0.87939453125, 1.2900390625, 1.70068359375, 2.111328125, 2.52197265625, 2.9326171875, 3.34326171875, 3.75390625, 4.16455078125, 4.5751953125, 4.98583984375, 5.396484375, 5.80712890625, 6.2177734375, 6.62841796875, 7.0390625, 7.44970703125, 7.8603515625, 8.27099609375, 8.681640625, 9.09228515625, 9.5029296875, 9.91357421875, 10.32421875, 10.73486328125, 11.1455078125, 11.55615234375, 11.966796875, 12.37744140625, 12.7880859375, 13.19873046875, 13.609375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 18.0, 62.0, 101.0, 241.0, 225.0, 165.0, 89.0, 34.0, 7.0, 8.0, 8.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.14408874511719, -86.53569793701172, -82.92730712890625, -79.31891632080078, -75.71052551269531, -72.10213470458984, -68.49374389648438, -64.8853530883789, -61.27696228027344, -57.66857147216797, -54.0601806640625, -50.45178985595703, -46.84339904785156, -43.235008239746094, -39.626617431640625, -36.018226623535156, -32.40983200073242, -28.801441192626953, -25.193050384521484, -21.584659576416016, -17.976268768310547, -14.367876052856445, -10.759485244750977, -7.151094436645508, -3.542703628540039, 0.06568741798400879, 3.6740784645080566, 7.282469749450684, 10.890860557556152, 14.499252319335938, 18.107643127441406, 21.716033935546875, 25.324424743652344, 28.932815551757812, 32.54120635986328, 36.14959716796875, 39.75798797607422, 43.36637878417969, 46.974769592285156, 50.583160400390625, 54.191551208496094, 57.79994201660156, 61.40833282470703, 65.0167236328125, 68.62511444091797, 72.23350524902344, 75.8418960571289, 79.45028686523438, 83.05868530273438, 86.66707611083984, 90.27546691894531, 93.88385772705078, 97.49224853515625, 101.10063934326172, 104.70903015136719, 108.31742095947266, 111.92581176757812, 115.5342025756836, 119.14259338378906, 122.75098419189453, 126.359375, 129.9677734375, 133.57615661621094, 137.18455505371094, 140.79293823242188]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 12.0, 8.0, 23.0, 19.0, 21.0, 29.0, 38.0, 39.0, 35.0, 58.0, 56.0, 46.0, 47.0, 45.0, 59.0, 44.0, 50.0, 54.0, 47.0, 33.0, 34.0, 36.0, 24.0, 16.0, 13.0, 22.0, 18.0, 11.0, 9.0, 7.0, 10.0, 4.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.31983184814453, -50.75276184082031, -49.18569564819336, -47.61862564086914, -46.05155563354492, -44.48448944091797, -42.91741943359375, -41.35034942626953, -39.78327941894531, -38.216209411621094, -36.64914321899414, -35.08207321166992, -33.5150032043457, -31.947935104370117, -30.38086700439453, -28.813796997070312, -27.24673080444336, -25.679662704467773, -24.112592697143555, -22.54552459716797, -20.97845458984375, -19.411386489868164, -17.844318389892578, -16.27724838256836, -14.710180282592773, -13.143111228942871, -11.576042175292969, -10.008974075317383, -8.44190502166748, -6.874835968017578, -5.307767868041992, -3.74069881439209, -2.1736297607421875, -0.6065609455108643, 0.960507869720459, 2.527576446533203, 4.0946455001831055, 5.661714553833008, 7.228782653808594, 8.795851707458496, 10.362920761108398, 11.9299898147583, 13.497058868408203, 15.064126968383789, 16.631195068359375, 18.198265075683594, 19.76533317565918, 21.332401275634766, 22.899471282958984, 24.46653938293457, 26.03360939025879, 27.600677490234375, 29.167747497558594, 30.73481559753418, 32.301883697509766, 33.868953704833984, 35.43601989746094, 37.003089904785156, 38.57015609741211, 40.13722610473633, 41.70429611206055, 43.2713623046875, 44.83843231201172, 46.40550231933594, 47.972572326660156]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 9.0, 5.0, 10.0, 13.0, 24.0, 42.0, 49.0, 99.0, 166.0, 303.0, 539.0, 963.0, 1938.0, 3914.0, 9318.0, 23635.0, 73959.0, 326905.0, 451395.0, 103098.0, 31086.0, 11461.0, 4696.0, 2258.0, 1136.0, 643.0, 366.0, 227.0, 136.0, 62.0, 38.0, 21.0, 13.0, 13.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.7349853515625, -8.454345703125, -8.1737060546875, -7.89306640625, -7.6124267578125, -7.331787109375, -7.0511474609375, -6.7705078125, -6.4898681640625, -6.209228515625, -5.9285888671875, -5.64794921875, -5.3673095703125, -5.086669921875, -4.8060302734375, -4.525390625, -4.2447509765625, -3.964111328125, -3.6834716796875, -3.40283203125, -3.1221923828125, -2.841552734375, -2.5609130859375, -2.2802734375, -1.9996337890625, -1.718994140625, -1.4383544921875, -1.15771484375, -0.8770751953125, -0.596435546875, -0.3157958984375, -0.03515625, 0.2454833984375, 0.526123046875, 0.8067626953125, 1.08740234375, 1.3680419921875, 1.648681640625, 1.9293212890625, 2.2099609375, 2.4906005859375, 2.771240234375, 3.0518798828125, 3.33251953125, 3.6131591796875, 3.893798828125, 4.1744384765625, 4.455078125, 4.7357177734375, 5.016357421875, 5.2969970703125, 5.57763671875, 5.8582763671875, 6.138916015625, 6.4195556640625, 6.7001953125, 6.9808349609375, 7.261474609375, 7.5421142578125, 7.82275390625, 8.1033935546875, 8.384033203125, 8.6646728515625, 8.9453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 4.0, 4.0, 6.0, 7.0, 25.0, 21.0, 22.0, 28.0, 35.0, 41.0, 62.0, 53.0, 82.0, 70.0, 64.0, 62.0, 66.0, 62.0, 60.0, 59.0, 29.0, 33.0, 23.0, 32.0, 26.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71484375, -3.5579833984375, -3.401123046875, -3.2442626953125, -3.08740234375, -2.9305419921875, -2.773681640625, -2.6168212890625, -2.4599609375, -2.3031005859375, -2.146240234375, -1.9893798828125, -1.83251953125, -1.6756591796875, -1.518798828125, -1.3619384765625, -1.205078125, -1.0482177734375, -0.891357421875, -0.7344970703125, -0.57763671875, -0.4207763671875, -0.263916015625, -0.1070556640625, 0.0498046875, 0.2066650390625, 0.363525390625, 0.5203857421875, 0.67724609375, 0.8341064453125, 0.990966796875, 1.1478271484375, 1.3046875, 1.4615478515625, 1.618408203125, 1.7752685546875, 1.93212890625, 2.0889892578125, 2.245849609375, 2.4027099609375, 2.5595703125, 2.7164306640625, 2.873291015625, 3.0301513671875, 3.18701171875, 3.3438720703125, 3.500732421875, 3.6575927734375, 3.814453125, 3.9713134765625, 4.128173828125, 4.2850341796875, 4.44189453125, 4.5987548828125, 4.755615234375, 4.9124755859375, 5.0693359375, 5.2261962890625, 5.383056640625, 5.5399169921875, 5.69677734375, 5.8536376953125, 6.010498046875, 6.1673583984375, 6.32421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 9.0, 12.0, 19.0, 30.0, 36.0, 69.0, 100.0, 130.0, 291.0, 493.0, 1209.0, 3704.0, 21123.0, 702440.0, 298882.0, 14843.0, 2936.0, 1027.0, 497.0, 238.0, 162.0, 91.0, 68.0, 38.0, 28.0, 18.0, 15.0, 10.0, 12.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.970947265625, -20.27001953125, -19.569091796875, -18.8681640625, -18.167236328125, -17.46630859375, -16.765380859375, -16.064453125, -15.363525390625, -14.66259765625, -13.961669921875, -13.2607421875, -12.559814453125, -11.85888671875, -11.157958984375, -10.45703125, -9.756103515625, -9.05517578125, -8.354248046875, -7.6533203125, -6.952392578125, -6.25146484375, -5.550537109375, -4.849609375, -4.148681640625, -3.44775390625, -2.746826171875, -2.0458984375, -1.344970703125, -0.64404296875, 0.056884765625, 0.7578125, 1.458740234375, 2.15966796875, 2.860595703125, 3.5615234375, 4.262451171875, 4.96337890625, 5.664306640625, 6.365234375, 7.066162109375, 7.76708984375, 8.468017578125, 9.1689453125, 9.869873046875, 10.57080078125, 11.271728515625, 11.97265625, 12.673583984375, 13.37451171875, 14.075439453125, 14.7763671875, 15.477294921875, 16.17822265625, 16.879150390625, 17.580078125, 18.281005859375, 18.98193359375, 19.682861328125, 20.3837890625, 21.084716796875, 21.78564453125, 22.486572265625, 23.1875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 4.0, 14.0, 11.0, 20.0, 24.0, 34.0, 35.0, 57.0, 73.0, 88.0, 96.0, 76.0, 84.0, 92.0, 68.0, 60.0, 46.0, 32.0, 24.0, 18.0, 11.0, 5.0, 10.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.15576171875, -16.3896484375, -15.62353515625, -14.857421875, -14.09130859375, -13.3251953125, -12.55908203125, -11.79296875, -11.02685546875, -10.2607421875, -9.49462890625, -8.728515625, -7.96240234375, -7.1962890625, -6.43017578125, -5.6640625, -4.89794921875, -4.1318359375, -3.36572265625, -2.599609375, -1.83349609375, -1.0673828125, -0.30126953125, 0.46484375, 1.23095703125, 1.9970703125, 2.76318359375, 3.529296875, 4.29541015625, 5.0615234375, 5.82763671875, 6.59375, 7.35986328125, 8.1259765625, 8.89208984375, 9.658203125, 10.42431640625, 11.1904296875, 11.95654296875, 12.72265625, 13.48876953125, 14.2548828125, 15.02099609375, 15.787109375, 16.55322265625, 17.3193359375, 18.08544921875, 18.8515625, 19.61767578125, 20.3837890625, 21.14990234375, 21.916015625, 22.68212890625, 23.4482421875, 24.21435546875, 24.98046875, 25.74658203125, 26.5126953125, 27.27880859375, 28.044921875, 28.81103515625, 29.5771484375, 30.34326171875, 31.109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 7.0, 6.0, 11.0, 15.0, 24.0, 32.0, 37.0, 56.0, 65.0, 129.0, 238.0, 400.0, 1067.0, 3548.0, 18887.0, 233111.0, 743539.0, 38639.0, 5954.0, 1504.0, 555.0, 249.0, 129.0, 97.0, 65.0, 47.0, 35.0, 20.0, 11.0, 17.0, 13.0, 5.0, 4.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.63671875, -6.4425048828125, -6.248291015625, -6.0540771484375, -5.85986328125, -5.6656494140625, -5.471435546875, -5.2772216796875, -5.0830078125, -4.8887939453125, -4.694580078125, -4.5003662109375, -4.30615234375, -4.1119384765625, -3.917724609375, -3.7235107421875, -3.529296875, -3.3350830078125, -3.140869140625, -2.9466552734375, -2.75244140625, -2.5582275390625, -2.364013671875, -2.1697998046875, -1.9755859375, -1.7813720703125, -1.587158203125, -1.3929443359375, -1.19873046875, -1.0045166015625, -0.810302734375, -0.6160888671875, -0.421875, -0.2276611328125, -0.033447265625, 0.1607666015625, 0.35498046875, 0.5491943359375, 0.743408203125, 0.9376220703125, 1.1318359375, 1.3260498046875, 1.520263671875, 1.7144775390625, 1.90869140625, 2.1029052734375, 2.297119140625, 2.4913330078125, 2.685546875, 2.8797607421875, 3.073974609375, 3.2681884765625, 3.46240234375, 3.6566162109375, 3.850830078125, 4.0450439453125, 4.2392578125, 4.4334716796875, 4.627685546875, 4.8218994140625, 5.01611328125, 5.2103271484375, 5.404541015625, 5.5987548828125, 5.79296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 6.0, 6.0, 11.0, 17.0, 18.0, 33.0, 25.0, 54.0, 89.0, 151.0, 147.0, 139.0, 93.0, 42.0, 45.0, 35.0, 17.0, 12.0, 14.0, 6.0, 5.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012617111206054688, -0.001224130392074585, -0.0011865496635437012, -0.0011489689350128174, -0.0011113882064819336, -0.0010738074779510498, -0.001036226749420166, -0.0009986460208892822, -0.0009610652923583984, -0.0009234845638275146, -0.0008859038352966309, -0.0008483231067657471, -0.0008107423782348633, -0.0007731616497039795, -0.0007355809211730957, -0.0006980001926422119, -0.0006604194641113281, -0.0006228387355804443, -0.0005852580070495605, -0.0005476772785186768, -0.000510096549987793, -0.0004725158214569092, -0.0004349350929260254, -0.0003973543643951416, -0.0003597736358642578, -0.000322192907333374, -0.00028461217880249023, -0.00024703145027160645, -0.00020945072174072266, -0.00017186999320983887, -0.00013428926467895508, -9.670853614807129e-05, -5.91278076171875e-05, -2.154707908630371e-05, 1.6033649444580078e-05, 5.361437797546387e-05, 9.119510650634766e-05, 0.00012877583503723145, 0.00016635656356811523, 0.00020393729209899902, 0.0002415180206298828, 0.0002790987491607666, 0.0003166794776916504, 0.0003542602062225342, 0.00039184093475341797, 0.00042942166328430176, 0.00046700239181518555, 0.0005045831203460693, 0.0005421638488769531, 0.0005797445774078369, 0.0006173253059387207, 0.0006549060344696045, 0.0006924867630004883, 0.0007300674915313721, 0.0007676482200622559, 0.0008052289485931396, 0.0008428096771240234, 0.0008803904056549072, 0.000917971134185791, 0.0009555518627166748, 0.0009931325912475586, 0.0010307133197784424, 0.0010682940483093262, 0.00110587477684021, 0.0011434555053710938]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 2.0, 9.0, 12.0, 6.0, 23.0, 23.0, 34.0, 54.0, 60.0, 124.0, 152.0, 261.0, 500.0, 968.0, 2076.0, 6174.0, 26110.0, 214900.0, 708464.0, 69918.0, 12088.0, 3412.0, 1420.0, 721.0, 378.0, 232.0, 123.0, 86.0, 63.0, 57.0, 27.0, 22.0, 13.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.935546875, -3.81353759765625, -3.6915283203125, -3.56951904296875, -3.447509765625, -3.32550048828125, -3.2034912109375, -3.08148193359375, -2.95947265625, -2.83746337890625, -2.7154541015625, -2.59344482421875, -2.471435546875, -2.34942626953125, -2.2274169921875, -2.10540771484375, -1.9833984375, -1.86138916015625, -1.7393798828125, -1.61737060546875, -1.495361328125, -1.37335205078125, -1.2513427734375, -1.12933349609375, -1.00732421875, -0.88531494140625, -0.7633056640625, -0.64129638671875, -0.519287109375, -0.39727783203125, -0.2752685546875, -0.15325927734375, -0.03125, 0.09075927734375, 0.2127685546875, 0.33477783203125, 0.456787109375, 0.57879638671875, 0.7008056640625, 0.82281494140625, 0.94482421875, 1.06683349609375, 1.1888427734375, 1.31085205078125, 1.432861328125, 1.55487060546875, 1.6768798828125, 1.79888916015625, 1.9208984375, 2.04290771484375, 2.1649169921875, 2.28692626953125, 2.408935546875, 2.53094482421875, 2.6529541015625, 2.77496337890625, 2.89697265625, 3.01898193359375, 3.1409912109375, 3.26300048828125, 3.385009765625, 3.50701904296875, 3.6290283203125, 3.75103759765625, 3.873046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 4.0, 7.0, 4.0, 13.0, 18.0, 21.0, 33.0, 33.0, 42.0, 55.0, 71.0, 96.0, 89.0, 79.0, 80.0, 77.0, 60.0, 52.0, 35.0, 29.0, 23.0, 20.0, 10.0, 12.0, 4.0, 4.0, 7.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.8125, -3.697662353515625, -3.58282470703125, -3.467987060546875, -3.3531494140625, -3.238311767578125, -3.12347412109375, -3.008636474609375, -2.893798828125, -2.778961181640625, -2.66412353515625, -2.549285888671875, -2.4344482421875, -2.319610595703125, -2.20477294921875, -2.089935302734375, -1.97509765625, -1.860260009765625, -1.74542236328125, -1.630584716796875, -1.5157470703125, -1.400909423828125, -1.28607177734375, -1.171234130859375, -1.056396484375, -0.941558837890625, -0.82672119140625, -0.711883544921875, -0.5970458984375, -0.482208251953125, -0.36737060546875, -0.252532958984375, -0.1376953125, -0.022857666015625, 0.09197998046875, 0.206817626953125, 0.3216552734375, 0.436492919921875, 0.55133056640625, 0.666168212890625, 0.781005859375, 0.895843505859375, 1.01068115234375, 1.125518798828125, 1.2403564453125, 1.355194091796875, 1.47003173828125, 1.584869384765625, 1.69970703125, 1.814544677734375, 1.92938232421875, 2.044219970703125, 2.1590576171875, 2.273895263671875, 2.38873291015625, 2.503570556640625, 2.618408203125, 2.733245849609375, 2.84808349609375, 2.962921142578125, 3.0777587890625, 3.192596435546875, 3.30743408203125, 3.422271728515625, 3.537109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 3.0, 6.0, 3.0, 13.0, 37.0, 107.0, 275.0, 305.0, 139.0, 60.0, 23.0, 13.0, 3.0, 8.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.72006225585938, -82.39778137207031, -78.07550048828125, -73.75321960449219, -69.43093872070312, -65.10865783691406, -60.78636932373047, -56.464088439941406, -52.141807556152344, -47.81952667236328, -43.49724578857422, -39.17496109008789, -34.85268020629883, -30.530399322509766, -26.20811653137207, -21.885833740234375, -17.563552856445312, -13.241271018981934, -8.918989181518555, -4.596707344055176, -0.2744255065917969, 4.047855377197266, 8.370138168334961, 12.692420959472656, 17.01470184326172, 21.33698272705078, 25.659265518188477, 29.981548309326172, 34.303829193115234, 38.6261100769043, 42.948394775390625, 47.27067565917969, 51.59295654296875, 55.91523742675781, 60.237518310546875, 64.55979919433594, 68.882080078125, 73.20436096191406, 77.52664947509766, 81.84893035888672, 86.17121124267578, 90.49349212646484, 94.8157730102539, 99.13805389404297, 103.46034240722656, 107.78262329101562, 112.10490417480469, 116.42718505859375, 120.74946594238281, 125.07174682617188, 129.39402770996094, 133.71630859375, 138.03858947753906, 142.36087036132812, 146.6831512451172, 151.00543212890625, 155.32772827148438, 159.65000915527344, 163.9722900390625, 168.29457092285156, 172.61685180664062, 176.9391326904297, 181.26141357421875, 185.58370971679688, 189.90597534179688]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 6.0, 1.0, 5.0, 10.0, 9.0, 17.0, 15.0, 12.0, 19.0, 20.0, 23.0, 34.0, 27.0, 30.0, 41.0, 28.0, 48.0, 51.0, 67.0, 77.0, 67.0, 56.0, 45.0, 27.0, 37.0, 33.0, 20.0, 45.0, 15.0, 18.0, 23.0, 16.0, 15.0, 8.0, 3.0, 6.0, 10.0, 12.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-64.0519790649414, -62.28700637817383, -60.52203369140625, -58.757057189941406, -56.99208450317383, -55.22711181640625, -53.46213912963867, -51.697166442871094, -49.93218994140625, -48.16721725463867, -46.402244567871094, -44.63726806640625, -42.87229537963867, -41.107322692871094, -39.342350006103516, -37.57737731933594, -35.81240463256836, -34.04743194580078, -32.2824592590332, -30.517484664916992, -28.75251007080078, -26.987537384033203, -25.222564697265625, -23.457592010498047, -21.692617416381836, -19.927644729614258, -18.162670135498047, -16.39769744873047, -14.632723808288574, -12.86775016784668, -11.102777481079102, -9.337803840637207, -7.5728302001953125, -5.807856559753418, -4.042883396148682, -2.2779102325439453, -0.5129365921020508, 1.2520370483398438, 3.017009735107422, 4.781983375549316, 6.546957015991211, 8.311930656433105, 10.076904296875, 11.841876983642578, 13.606850624084473, 15.371824264526367, 17.136796951293945, 18.901771545410156, 20.666744232177734, 22.431716918945312, 24.196691513061523, 25.9616641998291, 27.726638793945312, 29.49161148071289, 31.25658416748047, 33.02155685424805, 34.786529541015625, 36.5515022277832, 38.31647491455078, 40.081451416015625, 41.8464241027832, 43.61139678955078, 45.37636947631836, 47.14134216308594, 48.90631866455078]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 4.0, 13.0, 23.0, 28.0, 34.0, 55.0, 100.0, 192.0, 326.0, 581.0, 1183.0, 2685.0, 6827.0, 20780.0, 94070.0, 905391.0, 2795009.0, 301132.0, 45262.0, 12275.0, 4372.0, 1950.0, 906.0, 475.0, 248.0, 148.0, 75.0, 48.0, 26.0, 14.0, 14.0, 13.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.984375, -4.81414794921875, -4.6439208984375, -4.47369384765625, -4.303466796875, -4.13323974609375, -3.9630126953125, -3.79278564453125, -3.62255859375, -3.45233154296875, -3.2821044921875, -3.11187744140625, -2.941650390625, -2.77142333984375, -2.6011962890625, -2.43096923828125, -2.2607421875, -2.09051513671875, -1.9202880859375, -1.75006103515625, -1.579833984375, -1.40960693359375, -1.2393798828125, -1.06915283203125, -0.89892578125, -0.72869873046875, -0.5584716796875, -0.38824462890625, -0.218017578125, -0.04779052734375, 0.1224365234375, 0.29266357421875, 0.462890625, 0.63311767578125, 0.8033447265625, 0.97357177734375, 1.143798828125, 1.31402587890625, 1.4842529296875, 1.65447998046875, 1.82470703125, 1.99493408203125, 2.1651611328125, 2.33538818359375, 2.505615234375, 2.67584228515625, 2.8460693359375, 3.01629638671875, 3.1865234375, 3.35675048828125, 3.5269775390625, 3.69720458984375, 3.867431640625, 4.03765869140625, 4.2078857421875, 4.37811279296875, 4.54833984375, 4.71856689453125, 4.8887939453125, 5.05902099609375, 5.229248046875, 5.39947509765625, 5.5697021484375, 5.73992919921875, 5.91015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 8.0, 10.0, 13.0, 9.0, 9.0, 10.0, 19.0, 20.0, 41.0, 28.0, 32.0, 43.0, 40.0, 40.0, 46.0, 52.0, 49.0, 52.0, 57.0, 51.0, 40.0, 46.0, 41.0, 41.0, 39.0, 30.0, 11.0, 21.0, 15.0, 23.0, 11.0, 13.0, 10.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.94921875, -3.84332275390625, -3.7374267578125, -3.63153076171875, -3.525634765625, -3.41973876953125, -3.3138427734375, -3.20794677734375, -3.10205078125, -2.99615478515625, -2.8902587890625, -2.78436279296875, -2.678466796875, -2.57257080078125, -2.4666748046875, -2.36077880859375, -2.2548828125, -2.14898681640625, -2.0430908203125, -1.93719482421875, -1.831298828125, -1.72540283203125, -1.6195068359375, -1.51361083984375, -1.40771484375, -1.30181884765625, -1.1959228515625, -1.09002685546875, -0.984130859375, -0.87823486328125, -0.7723388671875, -0.66644287109375, -0.560546875, -0.45465087890625, -0.3487548828125, -0.24285888671875, -0.136962890625, -0.03106689453125, 0.0748291015625, 0.18072509765625, 0.28662109375, 0.39251708984375, 0.4984130859375, 0.60430908203125, 0.710205078125, 0.81610107421875, 0.9219970703125, 1.02789306640625, 1.1337890625, 1.23968505859375, 1.3455810546875, 1.45147705078125, 1.557373046875, 1.66326904296875, 1.7691650390625, 1.87506103515625, 1.98095703125, 2.08685302734375, 2.1927490234375, 2.29864501953125, 2.404541015625, 2.51043701171875, 2.6163330078125, 2.72222900390625, 2.828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 8.0, 13.0, 13.0, 22.0, 25.0, 61.0, 87.0, 146.0, 320.0, 665.0, 1431.0, 3634.0, 14015.0, 108638.0, 3608972.0, 418615.0, 28067.0, 5833.0, 1936.0, 872.0, 399.0, 204.0, 109.0, 76.0, 33.0, 32.0, 10.0, 13.0, 8.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.6798095703125, -8.328369140625, -7.9769287109375, -7.62548828125, -7.2740478515625, -6.922607421875, -6.5711669921875, -6.2197265625, -5.8682861328125, -5.516845703125, -5.1654052734375, -4.81396484375, -4.4625244140625, -4.111083984375, -3.7596435546875, -3.408203125, -3.0567626953125, -2.705322265625, -2.3538818359375, -2.00244140625, -1.6510009765625, -1.299560546875, -0.9481201171875, -0.5966796875, -0.2452392578125, 0.106201171875, 0.4576416015625, 0.80908203125, 1.1605224609375, 1.511962890625, 1.8634033203125, 2.21484375, 2.5662841796875, 2.917724609375, 3.2691650390625, 3.62060546875, 3.9720458984375, 4.323486328125, 4.6749267578125, 5.0263671875, 5.3778076171875, 5.729248046875, 6.0806884765625, 6.43212890625, 6.7835693359375, 7.135009765625, 7.4864501953125, 7.837890625, 8.1893310546875, 8.540771484375, 8.8922119140625, 9.24365234375, 9.5950927734375, 9.946533203125, 10.2979736328125, 10.6494140625, 11.0008544921875, 11.352294921875, 11.7037353515625, 12.05517578125, 12.4066162109375, 12.758056640625, 13.1094970703125, 13.4609375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 10.0, 18.0, 21.0, 32.0, 50.0, 56.0, 127.0, 246.0, 570.0, 1029.0, 903.0, 482.0, 198.0, 104.0, 59.0, 59.0, 32.0, 13.0, 11.0, 8.0, 9.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.098876953125, -9.76025390625, -9.421630859375, -9.0830078125, -8.744384765625, -8.40576171875, -8.067138671875, -7.728515625, -7.389892578125, -7.05126953125, -6.712646484375, -6.3740234375, -6.035400390625, -5.69677734375, -5.358154296875, -5.01953125, -4.680908203125, -4.34228515625, -4.003662109375, -3.6650390625, -3.326416015625, -2.98779296875, -2.649169921875, -2.310546875, -1.971923828125, -1.63330078125, -1.294677734375, -0.9560546875, -0.617431640625, -0.27880859375, 0.059814453125, 0.3984375, 0.737060546875, 1.07568359375, 1.414306640625, 1.7529296875, 2.091552734375, 2.43017578125, 2.768798828125, 3.107421875, 3.446044921875, 3.78466796875, 4.123291015625, 4.4619140625, 4.800537109375, 5.13916015625, 5.477783203125, 5.81640625, 6.155029296875, 6.49365234375, 6.832275390625, 7.1708984375, 7.509521484375, 7.84814453125, 8.186767578125, 8.525390625, 8.864013671875, 9.20263671875, 9.541259765625, 9.8798828125, 10.218505859375, 10.55712890625, 10.895751953125, 11.234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 17.0, 39.0, 127.0, 266.0, 287.0, 157.0, 48.0, 12.0, 10.0, 7.0, 6.0, 5.0, 4.0, 6.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.03190612792969, -89.43699645996094, -85.84209442138672, -82.24718475341797, -78.65228271484375, -75.057373046875, -71.46247100830078, -67.86756134033203, -64.27265930175781, -60.67775344848633, -57.082847595214844, -53.48794174194336, -49.893035888671875, -46.298126220703125, -42.703224182128906, -39.108314514160156, -35.51340866088867, -31.918502807617188, -28.323596954345703, -24.72869110107422, -21.133785247802734, -17.538877487182617, -13.943971633911133, -10.349065780639648, -6.754159927368164, -3.1592538356781006, 0.4356522560119629, 4.0305585861206055, 7.62546443939209, 11.22037124633789, 14.815277099609375, 18.41018295288086, 22.005088806152344, 25.599994659423828, 29.194900512695312, 32.7898063659668, 36.38471221923828, 39.97962188720703, 43.57452392578125, 47.16943359375, 50.76433563232422, 54.3592414855957, 57.95414733886719, 61.54905319213867, 65.14395904541016, 68.7388687133789, 72.33377075195312, 75.92868041992188, 79.52359008789062, 83.11849975585938, 86.7134017944336, 90.30831146240234, 93.90321350097656, 97.49812316894531, 101.09302520751953, 104.68793487548828, 108.2828369140625, 111.87774658203125, 115.47264862060547, 119.06755828857422, 122.66246032714844, 126.25736999511719, 129.85227966308594, 133.44717407226562, 137.04208374023438]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 9.0, 25.0, 23.0, 22.0, 42.0, 44.0, 48.0, 43.0, 49.0, 66.0, 73.0, 53.0, 52.0, 68.0, 62.0, 47.0, 40.0, 46.0, 41.0, 30.0, 20.0, 26.0, 12.0, 10.0, 11.0, 7.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.86661911010742, -55.2278938293457, -53.58916473388672, -51.950439453125, -50.31171417236328, -48.6729850769043, -47.03425979614258, -45.395530700683594, -43.756805419921875, -42.118080139160156, -40.47935104370117, -38.84062576293945, -37.20189666748047, -35.56317138671875, -33.92444610595703, -32.28572082519531, -30.646991729736328, -29.008264541625977, -27.369537353515625, -25.730812072753906, -24.092084884643555, -22.453357696533203, -20.814632415771484, -19.175905227661133, -17.53717803955078, -15.89845085144043, -14.259724617004395, -12.62099838256836, -10.982271194458008, -9.343544006347656, -7.704817771911621, -6.066091537475586, -4.427364349365234, -2.788637638092041, -1.1499109268188477, 0.4888157844543457, 2.127542495727539, 3.7662696838378906, 5.404995918273926, 7.043722152709961, 8.682449340820312, 10.321176528930664, 11.9599027633667, 13.598628997802734, 15.237356185913086, 16.876083374023438, 18.514808654785156, 20.153535842895508, 21.79226303100586, 23.43099021911621, 25.069717407226562, 26.70844268798828, 28.347169876098633, 29.985897064208984, 31.624622344970703, 33.26335144042969, 34.902076721191406, 36.540802001953125, 38.17953109741211, 39.81825637817383, 41.45698547363281, 43.09571075439453, 44.73443603515625, 46.37316131591797, 48.01189041137695]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 13.0, 9.0, 14.0, 21.0, 40.0, 62.0, 110.0, 177.0, 347.0, 623.0, 1110.0, 2380.0, 5499.0, 15915.0, 60931.0, 301920.0, 491636.0, 124513.0, 27797.0, 8771.0, 3349.0, 1458.0, 801.0, 440.0, 232.0, 146.0, 82.0, 51.0, 37.0, 27.0, 14.0, 13.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.7109375, -7.5037841796875, -7.296630859375, -7.0894775390625, -6.88232421875, -6.6751708984375, -6.468017578125, -6.2608642578125, -6.0537109375, -5.8465576171875, -5.639404296875, -5.4322509765625, -5.22509765625, -5.0179443359375, -4.810791015625, -4.6036376953125, -4.396484375, -4.1893310546875, -3.982177734375, -3.7750244140625, -3.56787109375, -3.3607177734375, -3.153564453125, -2.9464111328125, -2.7392578125, -2.5321044921875, -2.324951171875, -2.1177978515625, -1.91064453125, -1.7034912109375, -1.496337890625, -1.2891845703125, -1.08203125, -0.8748779296875, -0.667724609375, -0.4605712890625, -0.25341796875, -0.0462646484375, 0.160888671875, 0.3680419921875, 0.5751953125, 0.7823486328125, 0.989501953125, 1.1966552734375, 1.40380859375, 1.6109619140625, 1.818115234375, 2.0252685546875, 2.232421875, 2.4395751953125, 2.646728515625, 2.8538818359375, 3.06103515625, 3.2681884765625, 3.475341796875, 3.6824951171875, 3.8896484375, 4.0968017578125, 4.303955078125, 4.5111083984375, 4.71826171875, 4.9254150390625, 5.132568359375, 5.3397216796875, 5.546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 10.0, 14.0, 7.0, 14.0, 20.0, 16.0, 20.0, 21.0, 19.0, 29.0, 32.0, 39.0, 31.0, 36.0, 52.0, 43.0, 36.0, 44.0, 44.0, 50.0, 48.0, 38.0, 40.0, 35.0, 33.0, 21.0, 30.0, 33.0, 19.0, 9.0, 22.0, 17.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.375, -3.27484130859375, -3.1746826171875, -3.07452392578125, -2.974365234375, -2.87420654296875, -2.7740478515625, -2.67388916015625, -2.57373046875, -2.47357177734375, -2.3734130859375, -2.27325439453125, -2.173095703125, -2.07293701171875, -1.9727783203125, -1.87261962890625, -1.7724609375, -1.67230224609375, -1.5721435546875, -1.47198486328125, -1.371826171875, -1.27166748046875, -1.1715087890625, -1.07135009765625, -0.97119140625, -0.87103271484375, -0.7708740234375, -0.67071533203125, -0.570556640625, -0.47039794921875, -0.3702392578125, -0.27008056640625, -0.169921875, -0.06976318359375, 0.0303955078125, 0.13055419921875, 0.230712890625, 0.33087158203125, 0.4310302734375, 0.53118896484375, 0.63134765625, 0.73150634765625, 0.8316650390625, 0.93182373046875, 1.031982421875, 1.13214111328125, 1.2322998046875, 1.33245849609375, 1.4326171875, 1.53277587890625, 1.6329345703125, 1.73309326171875, 1.833251953125, 1.93341064453125, 2.0335693359375, 2.13372802734375, 2.23388671875, 2.33404541015625, 2.4342041015625, 2.53436279296875, 2.634521484375, 2.73468017578125, 2.8348388671875, 2.93499755859375, 3.03515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 14.0, 23.0, 28.0, 68.0, 69.0, 147.0, 276.0, 780.0, 2353.0, 12651.0, 187751.0, 794059.0, 42947.0, 5175.0, 1279.0, 465.0, 196.0, 90.0, 62.0, 34.0, 30.0, 10.0, 13.0, 6.0, 10.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3671875, -9.98681640625, -9.6064453125, -9.22607421875, -8.845703125, -8.46533203125, -8.0849609375, -7.70458984375, -7.32421875, -6.94384765625, -6.5634765625, -6.18310546875, -5.802734375, -5.42236328125, -5.0419921875, -4.66162109375, -4.28125, -3.90087890625, -3.5205078125, -3.14013671875, -2.759765625, -2.37939453125, -1.9990234375, -1.61865234375, -1.23828125, -0.85791015625, -0.4775390625, -0.09716796875, 0.283203125, 0.66357421875, 1.0439453125, 1.42431640625, 1.8046875, 2.18505859375, 2.5654296875, 2.94580078125, 3.326171875, 3.70654296875, 4.0869140625, 4.46728515625, 4.84765625, 5.22802734375, 5.6083984375, 5.98876953125, 6.369140625, 6.74951171875, 7.1298828125, 7.51025390625, 7.890625, 8.27099609375, 8.6513671875, 9.03173828125, 9.412109375, 9.79248046875, 10.1728515625, 10.55322265625, 10.93359375, 11.31396484375, 11.6943359375, 12.07470703125, 12.455078125, 12.83544921875, 13.2158203125, 13.59619140625, 13.9765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 2.0, 3.0, 10.0, 5.0, 27.0, 11.0, 15.0, 37.0, 45.0, 55.0, 47.0, 63.0, 63.0, 70.0, 70.0, 65.0, 67.0, 50.0, 50.0, 50.0, 42.0, 29.0, 32.0, 13.0, 25.0, 14.0, 10.0, 10.0, 3.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.015625, -15.509521484375, -15.00341796875, -14.497314453125, -13.9912109375, -13.485107421875, -12.97900390625, -12.472900390625, -11.966796875, -11.460693359375, -10.95458984375, -10.448486328125, -9.9423828125, -9.436279296875, -8.93017578125, -8.424072265625, -7.91796875, -7.411865234375, -6.90576171875, -6.399658203125, -5.8935546875, -5.387451171875, -4.88134765625, -4.375244140625, -3.869140625, -3.363037109375, -2.85693359375, -2.350830078125, -1.8447265625, -1.338623046875, -0.83251953125, -0.326416015625, 0.1796875, 0.685791015625, 1.19189453125, 1.697998046875, 2.2041015625, 2.710205078125, 3.21630859375, 3.722412109375, 4.228515625, 4.734619140625, 5.24072265625, 5.746826171875, 6.2529296875, 6.759033203125, 7.26513671875, 7.771240234375, 8.27734375, 8.783447265625, 9.28955078125, 9.795654296875, 10.3017578125, 10.807861328125, 11.31396484375, 11.820068359375, 12.326171875, 12.832275390625, 13.33837890625, 13.844482421875, 14.3505859375, 14.856689453125, 15.36279296875, 15.868896484375, 16.375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 9.0, 10.0, 4.0, 18.0, 25.0, 35.0, 49.0, 57.0, 93.0, 161.0, 285.0, 490.0, 957.0, 2164.0, 4957.0, 13492.0, 42091.0, 153916.0, 579715.0, 176849.0, 47716.0, 15248.0, 5590.0, 2276.0, 1021.0, 518.0, 276.0, 169.0, 105.0, 73.0, 65.0, 30.0, 27.0, 12.0, 10.0, 15.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.486328125, -1.42816162109375, -1.3699951171875, -1.31182861328125, -1.253662109375, -1.19549560546875, -1.1373291015625, -1.07916259765625, -1.02099609375, -0.96282958984375, -0.9046630859375, -0.84649658203125, -0.788330078125, -0.73016357421875, -0.6719970703125, -0.61383056640625, -0.5556640625, -0.49749755859375, -0.4393310546875, -0.38116455078125, -0.322998046875, -0.26483154296875, -0.2066650390625, -0.14849853515625, -0.09033203125, -0.03216552734375, 0.0260009765625, 0.08416748046875, 0.142333984375, 0.20050048828125, 0.2586669921875, 0.31683349609375, 0.375, 0.43316650390625, 0.4913330078125, 0.54949951171875, 0.607666015625, 0.66583251953125, 0.7239990234375, 0.78216552734375, 0.84033203125, 0.89849853515625, 0.9566650390625, 1.01483154296875, 1.072998046875, 1.13116455078125, 1.1893310546875, 1.24749755859375, 1.3056640625, 1.36383056640625, 1.4219970703125, 1.48016357421875, 1.538330078125, 1.59649658203125, 1.6546630859375, 1.71282958984375, 1.77099609375, 1.82916259765625, 1.8873291015625, 1.94549560546875, 2.003662109375, 2.06182861328125, 2.1199951171875, 2.17816162109375, 2.236328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 13.0, 16.0, 22.0, 28.0, 57.0, 80.0, 103.0, 130.0, 145.0, 131.0, 87.0, 59.0, 44.0, 24.0, 19.0, 9.0, 6.0, 6.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007472038269042969, -0.0007223561406135559, -0.0006975084543228149, -0.000672660768032074, -0.000647813081741333, -0.000622965395450592, -0.0005981177091598511, -0.0005732700228691101, -0.0005484223365783691, -0.0005235746502876282, -0.0004987269639968872, -0.00047387927770614624, -0.0004490315914154053, -0.0004241839051246643, -0.00039933621883392334, -0.0003744885325431824, -0.0003496408462524414, -0.00032479315996170044, -0.00029994547367095947, -0.0002750977873802185, -0.00025025010108947754, -0.00022540241479873657, -0.0002005547285079956, -0.00017570704221725464, -0.00015085935592651367, -0.0001260116696357727, -0.00010116398334503174, -7.631629705429077e-05, -5.1468610763549805e-05, -2.6620924472808838e-05, -1.773238182067871e-06, 2.3074448108673096e-05, 4.792213439941406e-05, 7.276982069015503e-05, 9.7617506980896e-05, 0.00012246519327163696, 0.00014731287956237793, 0.0001721605658531189, 0.00019700825214385986, 0.00022185593843460083, 0.0002467036247253418, 0.00027155131101608276, 0.00029639899730682373, 0.0003212466835975647, 0.00034609436988830566, 0.00037094205617904663, 0.0003957897424697876, 0.00042063742876052856, 0.00044548511505126953, 0.0004703328013420105, 0.0004951804876327515, 0.0005200281739234924, 0.0005448758602142334, 0.0005697235465049744, 0.0005945712327957153, 0.0006194189190864563, 0.0006442666053771973, 0.0006691142916679382, 0.0006939619779586792, 0.0007188096642494202, 0.0007436573505401611, 0.0007685050368309021, 0.0007933527231216431, 0.000818200409412384, 0.000843048095703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 7.0, 11.0, 6.0, 17.0, 33.0, 42.0, 58.0, 89.0, 180.0, 304.0, 554.0, 1329.0, 3225.0, 10565.0, 45271.0, 251628.0, 616627.0, 91090.0, 18711.0, 5153.0, 1885.0, 761.0, 437.0, 217.0, 130.0, 75.0, 55.0, 20.0, 16.0, 14.0, 14.0, 7.0, 8.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.259765625, -2.179656982421875, -2.09954833984375, -2.019439697265625, -1.9393310546875, -1.859222412109375, -1.77911376953125, -1.699005126953125, -1.618896484375, -1.538787841796875, -1.45867919921875, -1.378570556640625, -1.2984619140625, -1.218353271484375, -1.13824462890625, -1.058135986328125, -0.97802734375, -0.897918701171875, -0.81781005859375, -0.737701416015625, -0.6575927734375, -0.577484130859375, -0.49737548828125, -0.417266845703125, -0.337158203125, -0.257049560546875, -0.17694091796875, -0.096832275390625, -0.0167236328125, 0.063385009765625, 0.14349365234375, 0.223602294921875, 0.3037109375, 0.383819580078125, 0.46392822265625, 0.544036865234375, 0.6241455078125, 0.704254150390625, 0.78436279296875, 0.864471435546875, 0.944580078125, 1.024688720703125, 1.10479736328125, 1.184906005859375, 1.2650146484375, 1.345123291015625, 1.42523193359375, 1.505340576171875, 1.58544921875, 1.665557861328125, 1.74566650390625, 1.825775146484375, 1.9058837890625, 1.985992431640625, 2.06610107421875, 2.146209716796875, 2.226318359375, 2.306427001953125, 2.38653564453125, 2.466644287109375, 2.5467529296875, 2.626861572265625, 2.70697021484375, 2.787078857421875, 2.8671875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 13.0, 16.0, 16.0, 31.0, 45.0, 73.0, 82.0, 69.0, 104.0, 117.0, 99.0, 92.0, 76.0, 48.0, 32.0, 19.0, 15.0, 14.0, 7.0, 5.0, 4.0, 4.0, 1.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -2.996826171875, -2.89404296875, -2.791259765625, -2.6884765625, -2.585693359375, -2.48291015625, -2.380126953125, -2.27734375, -2.174560546875, -2.07177734375, -1.968994140625, -1.8662109375, -1.763427734375, -1.66064453125, -1.557861328125, -1.455078125, -1.352294921875, -1.24951171875, -1.146728515625, -1.0439453125, -0.941162109375, -0.83837890625, -0.735595703125, -0.6328125, -0.530029296875, -0.42724609375, -0.324462890625, -0.2216796875, -0.118896484375, -0.01611328125, 0.086669921875, 0.189453125, 0.292236328125, 0.39501953125, 0.497802734375, 0.6005859375, 0.703369140625, 0.80615234375, 0.908935546875, 1.01171875, 1.114501953125, 1.21728515625, 1.320068359375, 1.4228515625, 1.525634765625, 1.62841796875, 1.731201171875, 1.833984375, 1.936767578125, 2.03955078125, 2.142333984375, 2.2451171875, 2.347900390625, 2.45068359375, 2.553466796875, 2.65625, 2.759033203125, 2.86181640625, 2.964599609375, 3.0673828125, 3.170166015625, 3.27294921875, 3.375732421875, 3.478515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 9.0, 6.0, 3.0, 9.0, 22.0, 34.0, 65.0, 160.0, 263.0, 201.0, 108.0, 61.0, 30.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.27042388916016, -74.00942993164062, -71.7484359741211, -69.48744201660156, -67.22644805908203, -64.9654541015625, -62.704463958740234, -60.4434700012207, -58.18247604370117, -55.92148208618164, -53.66048812866211, -51.39949417114258, -49.13850402832031, -46.87751007080078, -44.61651611328125, -42.35552215576172, -40.09452819824219, -37.833534240722656, -35.572540283203125, -33.311546325683594, -31.050554275512695, -28.789560317993164, -26.528568267822266, -24.267574310302734, -22.006580352783203, -19.745586395263672, -17.48459243774414, -15.223600387573242, -12.962606430053711, -10.70161247253418, -8.440619468688965, -6.17962646484375, -3.91864013671875, -1.657646656036377, 0.6033468246459961, 2.864340305328369, 5.125333786010742, 7.386327743530273, 9.647320747375488, 11.908313751220703, 14.169307708740234, 16.430301666259766, 18.691295623779297, 20.952287673950195, 23.213281631469727, 25.474275588989258, 27.735267639160156, 29.996261596679688, 32.25725555419922, 34.51824951171875, 36.77924346923828, 39.04023742675781, 41.301231384277344, 43.562225341796875, 45.82321548461914, 48.08420944213867, 50.3452033996582, 52.606197357177734, 54.867191314697266, 57.1281852722168, 59.38917541503906, 61.650169372558594, 63.911163330078125, 66.17215728759766, 68.43315124511719]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 5.0, 4.0, 8.0, 17.0, 12.0, 9.0, 19.0, 21.0, 20.0, 24.0, 28.0, 22.0, 36.0, 24.0, 50.0, 52.0, 59.0, 81.0, 89.0, 69.0, 49.0, 35.0, 36.0, 33.0, 35.0, 26.0, 29.0, 15.0, 13.0, 17.0, 11.0, 15.0, 11.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.819374084472656, -53.17552185058594, -51.53166580200195, -49.887813568115234, -48.24395751953125, -46.60010528564453, -44.95625305175781, -43.31239700317383, -41.668540954589844, -40.024688720703125, -38.38083267211914, -36.73698043823242, -35.09312438964844, -33.44927215576172, -31.805418014526367, -30.161563873291016, -28.517711639404297, -26.873857498168945, -25.230003356933594, -23.586151123046875, -21.94229507446289, -20.298442840576172, -18.65458869934082, -17.01073455810547, -15.366880416870117, -13.723026275634766, -12.079172134399414, -10.435318946838379, -8.791464805603027, -7.147610664367676, -5.503757476806641, -3.859903335571289, -2.2160491943359375, -0.572195291519165, 1.0716586112976074, 2.715512275695801, 4.359366416931152, 6.003220558166504, 7.647073745727539, 9.29092788696289, 10.934782028198242, 12.578636169433594, 14.222490310668945, 15.86634349822998, 17.510196685791016, 19.154052734375, 20.79790496826172, 22.44175910949707, 24.085613250732422, 25.729467391967773, 27.373321533203125, 29.017173767089844, 30.661029815673828, 32.30488204956055, 33.94873809814453, 35.59259033203125, 37.23644256591797, 38.88029479980469, 40.52415084838867, 42.16800308227539, 43.811859130859375, 45.455711364746094, 47.09956359863281, 48.7434196472168, 50.38727569580078]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 3.0, 11.0, 4.0, 14.0, 18.0, 22.0, 41.0, 49.0, 79.0, 119.0, 158.0, 237.0, 378.0, 659.0, 1367.0, 2708.0, 6245.0, 17440.0, 74898.0, 581385.0, 2852027.0, 551391.0, 75544.0, 17428.0, 6172.0, 2673.0, 1337.0, 686.0, 421.0, 249.0, 144.0, 103.0, 91.0, 54.0, 34.0, 22.0, 23.0, 15.0, 5.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.82061767578125, -3.6763916015625, -3.53216552734375, -3.387939453125, -3.24371337890625, -3.0994873046875, -2.95526123046875, -2.81103515625, -2.66680908203125, -2.5225830078125, -2.37835693359375, -2.234130859375, -2.08990478515625, -1.9456787109375, -1.80145263671875, -1.6572265625, -1.51300048828125, -1.3687744140625, -1.22454833984375, -1.080322265625, -0.93609619140625, -0.7918701171875, -0.64764404296875, -0.50341796875, -0.35919189453125, -0.2149658203125, -0.07073974609375, 0.073486328125, 0.21771240234375, 0.3619384765625, 0.50616455078125, 0.650390625, 0.79461669921875, 0.9388427734375, 1.08306884765625, 1.227294921875, 1.37152099609375, 1.5157470703125, 1.65997314453125, 1.80419921875, 1.94842529296875, 2.0926513671875, 2.23687744140625, 2.381103515625, 2.52532958984375, 2.6695556640625, 2.81378173828125, 2.9580078125, 3.10223388671875, 3.2464599609375, 3.39068603515625, 3.534912109375, 3.67913818359375, 3.8233642578125, 3.96759033203125, 4.11181640625, 4.25604248046875, 4.4002685546875, 4.54449462890625, 4.688720703125, 4.83294677734375, 4.9771728515625, 5.12139892578125, 5.265625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 7.0, 5.0, 7.0, 7.0, 8.0, 14.0, 10.0, 21.0, 21.0, 20.0, 22.0, 40.0, 38.0, 28.0, 49.0, 49.0, 44.0, 41.0, 43.0, 46.0, 58.0, 41.0, 43.0, 47.0, 39.0, 39.0, 33.0, 30.0, 23.0, 27.0, 20.0, 10.0, 13.0, 13.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435546875, -3.334075927734375, -3.23260498046875, -3.131134033203125, -3.0296630859375, -2.928192138671875, -2.82672119140625, -2.725250244140625, -2.623779296875, -2.522308349609375, -2.42083740234375, -2.319366455078125, -2.2178955078125, -2.116424560546875, -2.01495361328125, -1.913482666015625, -1.81201171875, -1.710540771484375, -1.60906982421875, -1.507598876953125, -1.4061279296875, -1.304656982421875, -1.20318603515625, -1.101715087890625, -1.000244140625, -0.898773193359375, -0.79730224609375, -0.695831298828125, -0.5943603515625, -0.492889404296875, -0.39141845703125, -0.289947509765625, -0.1884765625, -0.087005615234375, 0.01446533203125, 0.115936279296875, 0.2174072265625, 0.318878173828125, 0.42034912109375, 0.521820068359375, 0.623291015625, 0.724761962890625, 0.82623291015625, 0.927703857421875, 1.0291748046875, 1.130645751953125, 1.23211669921875, 1.333587646484375, 1.43505859375, 1.536529541015625, 1.63800048828125, 1.739471435546875, 1.8409423828125, 1.942413330078125, 2.04388427734375, 2.145355224609375, 2.246826171875, 2.348297119140625, 2.44976806640625, 2.551239013671875, 2.6527099609375, 2.754180908203125, 2.85565185546875, 2.957122802734375, 3.05859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 14.0, 15.0, 27.0, 43.0, 106.0, 285.0, 710.0, 3428.0, 53955.0, 3957608.0, 170313.0, 6009.0, 1081.0, 368.0, 143.0, 91.0, 31.0, 20.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.5625, -13.1197509765625, -12.677001953125, -12.2342529296875, -11.79150390625, -11.3487548828125, -10.906005859375, -10.4632568359375, -10.0205078125, -9.5777587890625, -9.135009765625, -8.6922607421875, -8.24951171875, -7.8067626953125, -7.364013671875, -6.9212646484375, -6.478515625, -6.0357666015625, -5.593017578125, -5.1502685546875, -4.70751953125, -4.2647705078125, -3.822021484375, -3.3792724609375, -2.9365234375, -2.4937744140625, -2.051025390625, -1.6082763671875, -1.16552734375, -0.7227783203125, -0.280029296875, 0.1627197265625, 0.60546875, 1.0482177734375, 1.490966796875, 1.9337158203125, 2.37646484375, 2.8192138671875, 3.261962890625, 3.7047119140625, 4.1474609375, 4.5902099609375, 5.032958984375, 5.4757080078125, 5.91845703125, 6.3612060546875, 6.803955078125, 7.2467041015625, 7.689453125, 8.1322021484375, 8.574951171875, 9.0177001953125, 9.46044921875, 9.9031982421875, 10.345947265625, 10.7886962890625, 11.2314453125, 11.6741943359375, 12.116943359375, 12.5596923828125, 13.00244140625, 13.4451904296875, 13.887939453125, 14.3306884765625, 14.7734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 10.0, 18.0, 25.0, 46.0, 60.0, 91.0, 173.0, 297.0, 671.0, 1030.0, 767.0, 382.0, 193.0, 118.0, 74.0, 39.0, 21.0, 16.0, 12.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.62890625, -6.36029052734375, -6.0916748046875, -5.82305908203125, -5.554443359375, -5.28582763671875, -5.0172119140625, -4.74859619140625, -4.47998046875, -4.21136474609375, -3.9427490234375, -3.67413330078125, -3.405517578125, -3.13690185546875, -2.8682861328125, -2.59967041015625, -2.3310546875, -2.06243896484375, -1.7938232421875, -1.52520751953125, -1.256591796875, -0.98797607421875, -0.7193603515625, -0.45074462890625, -0.18212890625, 0.08648681640625, 0.3551025390625, 0.62371826171875, 0.892333984375, 1.16094970703125, 1.4295654296875, 1.69818115234375, 1.966796875, 2.23541259765625, 2.5040283203125, 2.77264404296875, 3.041259765625, 3.30987548828125, 3.5784912109375, 3.84710693359375, 4.11572265625, 4.38433837890625, 4.6529541015625, 4.92156982421875, 5.190185546875, 5.45880126953125, 5.7274169921875, 5.99603271484375, 6.2646484375, 6.53326416015625, 6.8018798828125, 7.07049560546875, 7.339111328125, 7.60772705078125, 7.8763427734375, 8.14495849609375, 8.41357421875, 8.68218994140625, 8.9508056640625, 9.21942138671875, 9.488037109375, 9.75665283203125, 10.0252685546875, 10.29388427734375, 10.5625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 28.0, 107.0, 278.0, 356.0, 149.0, 45.0, 21.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.39299011230469, -103.18627166748047, -99.97955322265625, -96.7728271484375, -93.56610870361328, -90.35939025878906, -87.15266418457031, -83.9459457397461, -80.73922729492188, -77.53250885009766, -74.32579040527344, -71.11906433105469, -67.91234588623047, -64.70562744140625, -61.498905181884766, -58.29218292236328, -55.08546447753906, -51.878746032714844, -48.67202377319336, -45.465301513671875, -42.258583068847656, -39.05186462402344, -35.84514236450195, -32.63842010498047, -29.43170166015625, -26.2249813079834, -23.018260955810547, -19.811540603637695, -16.604820251464844, -13.398099899291992, -10.19137954711914, -6.984659194946289, -3.7779388427734375, -0.5712184906005859, 2.6355018615722656, 5.842222213745117, 9.048942565917969, 12.25566291809082, 15.462383270263672, 18.669103622436523, 21.875823974609375, 25.082544326782227, 28.289264678955078, 31.49598503112793, 34.70270538330078, 37.909423828125, 41.116146087646484, 44.32286834716797, 47.52958679199219, 50.736305236816406, 53.94302749633789, 57.149749755859375, 60.356468200683594, 63.56318664550781, 66.76991271972656, 69.97663116455078, 73.183349609375, 76.39006805419922, 79.59678649902344, 82.80351257324219, 86.0102310180664, 89.21694946289062, 92.42367553710938, 95.6303939819336, 98.83711242675781]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 10.0, 15.0, 15.0, 21.0, 16.0, 29.0, 16.0, 30.0, 30.0, 42.0, 34.0, 44.0, 40.0, 43.0, 45.0, 45.0, 49.0, 53.0, 51.0, 30.0, 38.0, 38.0, 29.0, 29.0, 29.0, 17.0, 23.0, 12.0, 12.0, 18.0, 19.0, 8.0, 11.0, 13.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.48458480834961, -24.652755737304688, -23.820926666259766, -22.989097595214844, -22.15726661682129, -21.325437545776367, -20.493608474731445, -19.661779403686523, -18.82994842529297, -17.998119354248047, -17.166290283203125, -16.334461212158203, -15.502630233764648, -14.670801162719727, -13.838972091674805, -13.007143020629883, -12.175313949584961, -11.343484878540039, -10.5116548538208, -9.679825782775879, -8.84799575805664, -8.016166687011719, -7.184337615966797, -6.352508068084717, -5.520678520202637, -4.688848972320557, -3.8570196628570557, -3.0251903533935547, -2.1933608055114746, -1.3615312576293945, -0.5297021865844727, 0.3021273612976074, 1.1339569091796875, 1.965786337852478, 2.7976157665252686, 3.6294450759887695, 4.46127462387085, 5.29310417175293, 6.124933242797852, 6.956762790679932, 7.788592338562012, 8.620421409606934, 9.452251434326172, 10.284080505371094, 11.115909576416016, 11.947739601135254, 12.779568672180176, 13.611398696899414, 14.443227767944336, 15.275056838989258, 16.10688591003418, 16.938716888427734, 17.770545959472656, 18.602375030517578, 19.4342041015625, 20.266033172607422, 21.097862243652344, 21.929691314697266, 22.761520385742188, 23.59334945678711, 24.425180435180664, 25.257009506225586, 26.088838577270508, 26.92066764831543, 27.752498626708984]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 13.0, 10.0, 19.0, 35.0, 48.0, 78.0, 111.0, 219.0, 357.0, 607.0, 1086.0, 2148.0, 4704.0, 12009.0, 35750.0, 135023.0, 468929.0, 283968.0, 68618.0, 20598.0, 7492.0, 3191.0, 1519.0, 792.0, 437.0, 304.0, 177.0, 122.0, 62.0, 45.0, 28.0, 17.0, 10.0, 7.0, 3.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.51171875, -4.34918212890625, -4.1866455078125, -4.02410888671875, -3.861572265625, -3.69903564453125, -3.5364990234375, -3.37396240234375, -3.21142578125, -3.04888916015625, -2.8863525390625, -2.72381591796875, -2.561279296875, -2.39874267578125, -2.2362060546875, -2.07366943359375, -1.9111328125, -1.74859619140625, -1.5860595703125, -1.42352294921875, -1.260986328125, -1.09844970703125, -0.9359130859375, -0.77337646484375, -0.61083984375, -0.44830322265625, -0.2857666015625, -0.12322998046875, 0.039306640625, 0.20184326171875, 0.3643798828125, 0.52691650390625, 0.689453125, 0.85198974609375, 1.0145263671875, 1.17706298828125, 1.339599609375, 1.50213623046875, 1.6646728515625, 1.82720947265625, 1.98974609375, 2.15228271484375, 2.3148193359375, 2.47735595703125, 2.639892578125, 2.80242919921875, 2.9649658203125, 3.12750244140625, 3.2900390625, 3.45257568359375, 3.6151123046875, 3.77764892578125, 3.940185546875, 4.10272216796875, 4.2652587890625, 4.42779541015625, 4.59033203125, 4.75286865234375, 4.9154052734375, 5.07794189453125, 5.240478515625, 5.40301513671875, 5.5655517578125, 5.72808837890625, 5.890625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 5.0, 10.0, 8.0, 13.0, 6.0, 16.0, 11.0, 13.0, 19.0, 18.0, 20.0, 31.0, 30.0, 41.0, 31.0, 31.0, 57.0, 34.0, 38.0, 45.0, 42.0, 41.0, 48.0, 31.0, 46.0, 41.0, 33.0, 28.0, 31.0, 25.0, 27.0, 21.0, 18.0, 15.0, 8.0, 15.0, 6.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.22265625, -3.13018798828125, -3.0377197265625, -2.94525146484375, -2.852783203125, -2.76031494140625, -2.6678466796875, -2.57537841796875, -2.48291015625, -2.39044189453125, -2.2979736328125, -2.20550537109375, -2.113037109375, -2.02056884765625, -1.9281005859375, -1.83563232421875, -1.7431640625, -1.65069580078125, -1.5582275390625, -1.46575927734375, -1.373291015625, -1.28082275390625, -1.1883544921875, -1.09588623046875, -1.00341796875, -0.91094970703125, -0.8184814453125, -0.72601318359375, -0.633544921875, -0.54107666015625, -0.4486083984375, -0.35614013671875, -0.263671875, -0.17120361328125, -0.0787353515625, 0.01373291015625, 0.106201171875, 0.19866943359375, 0.2911376953125, 0.38360595703125, 0.47607421875, 0.56854248046875, 0.6610107421875, 0.75347900390625, 0.845947265625, 0.93841552734375, 1.0308837890625, 1.12335205078125, 1.2158203125, 1.30828857421875, 1.4007568359375, 1.49322509765625, 1.585693359375, 1.67816162109375, 1.7706298828125, 1.86309814453125, 1.95556640625, 2.04803466796875, 2.1405029296875, 2.23297119140625, 2.325439453125, 2.41790771484375, 2.5103759765625, 2.60284423828125, 2.6953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 6.0, 6.0, 5.0, 23.0, 19.0, 38.0, 46.0, 59.0, 113.0, 157.0, 220.0, 438.0, 908.0, 2264.0, 8427.0, 59158.0, 795210.0, 159661.0, 15755.0, 3485.0, 1176.0, 529.0, 297.0, 193.0, 107.0, 73.0, 38.0, 36.0, 25.0, 23.0, 10.0, 6.0, 10.0, 8.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.6121826171875, -9.318115234375, -9.0240478515625, -8.72998046875, -8.4359130859375, -8.141845703125, -7.8477783203125, -7.5537109375, -7.2596435546875, -6.965576171875, -6.6715087890625, -6.37744140625, -6.0833740234375, -5.789306640625, -5.4952392578125, -5.201171875, -4.9071044921875, -4.613037109375, -4.3189697265625, -4.02490234375, -3.7308349609375, -3.436767578125, -3.1427001953125, -2.8486328125, -2.5545654296875, -2.260498046875, -1.9664306640625, -1.67236328125, -1.3782958984375, -1.084228515625, -0.7901611328125, -0.49609375, -0.2020263671875, 0.092041015625, 0.3861083984375, 0.68017578125, 0.9742431640625, 1.268310546875, 1.5623779296875, 1.8564453125, 2.1505126953125, 2.444580078125, 2.7386474609375, 3.03271484375, 3.3267822265625, 3.620849609375, 3.9149169921875, 4.208984375, 4.5030517578125, 4.797119140625, 5.0911865234375, 5.38525390625, 5.6793212890625, 5.973388671875, 6.2674560546875, 6.5615234375, 6.8555908203125, 7.149658203125, 7.4437255859375, 7.73779296875, 8.0318603515625, 8.325927734375, 8.6199951171875, 8.9140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 1.0, 5.0, 5.0, 4.0, 8.0, 13.0, 11.0, 18.0, 34.0, 45.0, 45.0, 54.0, 57.0, 70.0, 80.0, 73.0, 82.0, 76.0, 65.0, 72.0, 56.0, 36.0, 29.0, 22.0, 14.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.40478515625, -18.8251953125, -18.24560546875, -17.666015625, -17.08642578125, -16.5068359375, -15.92724609375, -15.34765625, -14.76806640625, -14.1884765625, -13.60888671875, -13.029296875, -12.44970703125, -11.8701171875, -11.29052734375, -10.7109375, -10.13134765625, -9.5517578125, -8.97216796875, -8.392578125, -7.81298828125, -7.2333984375, -6.65380859375, -6.07421875, -5.49462890625, -4.9150390625, -4.33544921875, -3.755859375, -3.17626953125, -2.5966796875, -2.01708984375, -1.4375, -0.85791015625, -0.2783203125, 0.30126953125, 0.880859375, 1.46044921875, 2.0400390625, 2.61962890625, 3.19921875, 3.77880859375, 4.3583984375, 4.93798828125, 5.517578125, 6.09716796875, 6.6767578125, 7.25634765625, 7.8359375, 8.41552734375, 8.9951171875, 9.57470703125, 10.154296875, 10.73388671875, 11.3134765625, 11.89306640625, 12.47265625, 13.05224609375, 13.6318359375, 14.21142578125, 14.791015625, 15.37060546875, 15.9501953125, 16.52978515625, 17.109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 10.0, 7.0, 6.0, 12.0, 23.0, 21.0, 18.0, 35.0, 45.0, 84.0, 131.0, 185.0, 303.0, 530.0, 991.0, 1914.0, 4073.0, 10177.0, 29993.0, 123310.0, 688766.0, 136442.0, 31969.0, 10761.0, 4357.0, 1974.0, 971.0, 521.0, 301.0, 182.0, 140.0, 65.0, 76.0, 36.0, 27.0, 20.0, 22.0, 11.0, 10.0, 8.0, 8.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.732421875, -1.6774749755859375, -1.622528076171875, -1.5675811767578125, -1.51263427734375, -1.4576873779296875, -1.402740478515625, -1.3477935791015625, -1.2928466796875, -1.2378997802734375, -1.182952880859375, -1.1280059814453125, -1.07305908203125, -1.0181121826171875, -0.963165283203125, -0.9082183837890625, -0.853271484375, -0.7983245849609375, -0.743377685546875, -0.6884307861328125, -0.63348388671875, -0.5785369873046875, -0.523590087890625, -0.4686431884765625, -0.4136962890625, -0.3587493896484375, -0.303802490234375, -0.2488555908203125, -0.19390869140625, -0.1389617919921875, -0.084014892578125, -0.0290679931640625, 0.02587890625, 0.0808258056640625, 0.135772705078125, 0.1907196044921875, 0.24566650390625, 0.3006134033203125, 0.355560302734375, 0.4105072021484375, 0.4654541015625, 0.5204010009765625, 0.575347900390625, 0.6302947998046875, 0.68524169921875, 0.7401885986328125, 0.795135498046875, 0.8500823974609375, 0.905029296875, 0.9599761962890625, 1.014923095703125, 1.0698699951171875, 1.12481689453125, 1.1797637939453125, 1.234710693359375, 1.2896575927734375, 1.3446044921875, 1.3995513916015625, 1.454498291015625, 1.5094451904296875, 1.56439208984375, 1.6193389892578125, 1.674285888671875, 1.7292327880859375, 1.7841796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 8.0, 8.0, 10.0, 17.0, 30.0, 36.0, 54.0, 93.0, 113.0, 151.0, 140.0, 104.0, 68.0, 43.0, 26.0, 25.0, 10.0, 9.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005807876586914062, -0.0005630403757095337, -0.0005452930927276611, -0.0005275458097457886, -0.000509798526763916, -0.0004920512437820435, -0.0004743039608001709, -0.00045655667781829834, -0.0004388093948364258, -0.0004210621118545532, -0.00040331482887268066, -0.0003855675458908081, -0.00036782026290893555, -0.000350072979927063, -0.00033232569694519043, -0.00031457841396331787, -0.0002968311309814453, -0.00027908384799957275, -0.0002613365650177002, -0.00024358928203582764, -0.00022584199905395508, -0.00020809471607208252, -0.00019034743309020996, -0.0001726001501083374, -0.00015485286712646484, -0.00013710558414459229, -0.00011935830116271973, -0.00010161101818084717, -8.386373519897461e-05, -6.611645221710205e-05, -4.836916923522949e-05, -3.0621886253356934e-05, -1.2874603271484375e-05, 4.872679710388184e-06, 2.2619962692260742e-05, 4.03672456741333e-05, 5.811452865600586e-05, 7.586181163787842e-05, 9.360909461975098e-05, 0.00011135637760162354, 0.0001291036605834961, 0.00014685094356536865, 0.0001645982265472412, 0.00018234550952911377, 0.00020009279251098633, 0.0002178400754928589, 0.00023558735847473145, 0.000253334641456604, 0.00027108192443847656, 0.0002888292074203491, 0.0003065764904022217, 0.00032432377338409424, 0.0003420710563659668, 0.00035981833934783936, 0.0003775656223297119, 0.00039531290531158447, 0.00041306018829345703, 0.0004308074712753296, 0.00044855475425720215, 0.0004663020372390747, 0.00048404932022094727, 0.0005017966032028198, 0.0005195438861846924, 0.0005372911691665649, 0.0005550384521484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 9.0, 8.0, 11.0, 19.0, 20.0, 29.0, 58.0, 90.0, 148.0, 196.0, 439.0, 858.0, 1985.0, 5276.0, 18732.0, 95930.0, 740941.0, 146893.0, 25521.0, 6720.0, 2477.0, 1047.0, 470.0, 271.0, 157.0, 86.0, 59.0, 33.0, 22.0, 18.0, 8.0, 10.0, 2.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.205291748046875, -2.13323974609375, -2.061187744140625, -1.9891357421875, -1.917083740234375, -1.84503173828125, -1.772979736328125, -1.700927734375, -1.628875732421875, -1.55682373046875, -1.484771728515625, -1.4127197265625, -1.340667724609375, -1.26861572265625, -1.196563720703125, -1.12451171875, -1.052459716796875, -0.98040771484375, -0.908355712890625, -0.8363037109375, -0.764251708984375, -0.69219970703125, -0.620147705078125, -0.548095703125, -0.476043701171875, -0.40399169921875, -0.331939697265625, -0.2598876953125, -0.187835693359375, -0.11578369140625, -0.043731689453125, 0.0283203125, 0.100372314453125, 0.17242431640625, 0.244476318359375, 0.3165283203125, 0.388580322265625, 0.46063232421875, 0.532684326171875, 0.604736328125, 0.676788330078125, 0.74884033203125, 0.820892333984375, 0.8929443359375, 0.964996337890625, 1.03704833984375, 1.109100341796875, 1.18115234375, 1.253204345703125, 1.32525634765625, 1.397308349609375, 1.4693603515625, 1.541412353515625, 1.61346435546875, 1.685516357421875, 1.757568359375, 1.829620361328125, 1.90167236328125, 1.973724365234375, 2.0457763671875, 2.117828369140625, 2.18988037109375, 2.261932373046875, 2.333984375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 14.0, 11.0, 14.0, 23.0, 28.0, 35.0, 47.0, 63.0, 73.0, 108.0, 123.0, 102.0, 83.0, 64.0, 55.0, 41.0, 22.0, 21.0, 8.0, 12.0, 6.0, 7.0, 2.0, 3.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.987823486328125, -1.91314697265625, -1.838470458984375, -1.7637939453125, -1.689117431640625, -1.61444091796875, -1.539764404296875, -1.465087890625, -1.390411376953125, -1.31573486328125, -1.241058349609375, -1.1663818359375, -1.091705322265625, -1.01702880859375, -0.942352294921875, -0.86767578125, -0.792999267578125, -0.71832275390625, -0.643646240234375, -0.5689697265625, -0.494293212890625, -0.41961669921875, -0.344940185546875, -0.270263671875, -0.195587158203125, -0.12091064453125, -0.046234130859375, 0.0284423828125, 0.103118896484375, 0.17779541015625, 0.252471923828125, 0.3271484375, 0.401824951171875, 0.47650146484375, 0.551177978515625, 0.6258544921875, 0.700531005859375, 0.77520751953125, 0.849884033203125, 0.924560546875, 0.999237060546875, 1.07391357421875, 1.148590087890625, 1.2232666015625, 1.297943115234375, 1.37261962890625, 1.447296142578125, 1.52197265625, 1.596649169921875, 1.67132568359375, 1.746002197265625, 1.8206787109375, 1.895355224609375, 1.97003173828125, 2.044708251953125, 2.119384765625, 2.194061279296875, 2.26873779296875, 2.343414306640625, 2.4180908203125, 2.492767333984375, 2.56744384765625, 2.642120361328125, 2.716796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 7.0, 8.0, 17.0, 23.0, 48.0, 87.0, 135.0, 365.0, 149.0, 70.0, 45.0, 22.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.878021240234375, -48.964630126953125, -47.051239013671875, -45.137847900390625, -43.224456787109375, -41.311065673828125, -39.397674560546875, -37.484283447265625, -35.570892333984375, -33.657501220703125, -31.744110107421875, -29.830718994140625, -27.917327880859375, -26.003936767578125, -24.090543746948242, -22.177152633666992, -20.26375961303711, -18.35036849975586, -16.43697738647461, -14.523585319519043, -12.610194206237793, -10.696803092956543, -8.783411026000977, -6.870019912719727, -4.956628799438477, -3.0432374477386475, -1.1298460960388184, 0.7835454940795898, 2.69693660736084, 4.61032772064209, 6.523719787597656, 8.437110900878906, 10.350502014160156, 12.263893127441406, 14.177284240722656, 16.090675354003906, 18.004066467285156, 19.917457580566406, 21.83085060119629, 23.74424171447754, 25.65763282775879, 27.57102394104004, 29.48441505432129, 31.397808074951172, 33.31119918823242, 35.22459030151367, 37.13798141479492, 39.05137252807617, 40.96476364135742, 42.87815475463867, 44.79154586791992, 46.70493698120117, 48.61832809448242, 50.53171920776367, 52.44511413574219, 54.35850524902344, 56.27189636230469, 58.18528747558594, 60.09867858886719, 62.01206970214844, 63.92546081542969, 65.83885192871094, 67.75224304199219, 69.66563415527344, 71.57902526855469]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 5.0, 8.0, 2.0, 8.0, 11.0, 15.0, 14.0, 18.0, 12.0, 21.0, 23.0, 15.0, 27.0, 25.0, 23.0, 31.0, 45.0, 42.0, 70.0, 81.0, 77.0, 53.0, 45.0, 35.0, 40.0, 36.0, 22.0, 27.0, 27.0, 15.0, 22.0, 19.0, 6.0, 8.0, 8.0, 8.0, 7.0, 7.0, 6.0, 6.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-41.45472717285156, -40.26729965209961, -39.079872131347656, -37.8924446105957, -36.70501708984375, -35.51758575439453, -34.33015823364258, -33.142730712890625, -31.955303192138672, -30.76787567138672, -29.580448150634766, -28.39301872253418, -27.205591201782227, -26.018163681030273, -24.830734252929688, -23.643306732177734, -22.45587921142578, -21.268451690673828, -20.081024169921875, -18.89359474182129, -17.706167221069336, -16.518739700317383, -15.331311225891113, -14.143882751464844, -12.95645523071289, -11.769027709960938, -10.581599235534668, -9.394170761108398, -8.206743240356445, -7.019315242767334, -5.831887245178223, -4.644458770751953, -3.4570274353027344, -2.269599437713623, -1.0821714401245117, 0.10525655746459961, 1.292684555053711, 2.4801125526428223, 3.6675405502319336, 4.854969024658203, 6.042396545410156, 7.229824542999268, 8.417252540588379, 9.604681015014648, 10.792108535766602, 11.979536056518555, 13.166964530944824, 14.354393005371094, 15.541820526123047, 16.729248046875, 17.916675567626953, 19.10410499572754, 20.291532516479492, 21.478960037231445, 22.66638946533203, 23.853816986083984, 25.041244506835938, 26.22867202758789, 27.416099548339844, 28.60352897644043, 29.790956497192383, 30.978384017944336, 32.16581344604492, 33.353240966796875, 34.54066848754883]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 12.0, 19.0, 21.0, 32.0, 49.0, 72.0, 111.0, 173.0, 355.0, 560.0, 1036.0, 2198.0, 4707.0, 11793.0, 37841.0, 174205.0, 1059639.0, 2294813.0, 479073.0, 89445.0, 23049.0, 7939.0, 3517.0, 1683.0, 813.0, 444.0, 253.0, 153.0, 95.0, 60.0, 27.0, 30.0, 22.0, 15.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76171875, -3.63751220703125, -3.5133056640625, -3.38909912109375, -3.264892578125, -3.14068603515625, -3.0164794921875, -2.89227294921875, -2.76806640625, -2.64385986328125, -2.5196533203125, -2.39544677734375, -2.271240234375, -2.14703369140625, -2.0228271484375, -1.89862060546875, -1.7744140625, -1.65020751953125, -1.5260009765625, -1.40179443359375, -1.277587890625, -1.15338134765625, -1.0291748046875, -0.90496826171875, -0.78076171875, -0.65655517578125, -0.5323486328125, -0.40814208984375, -0.283935546875, -0.15972900390625, -0.0355224609375, 0.08868408203125, 0.212890625, 0.33709716796875, 0.4613037109375, 0.58551025390625, 0.709716796875, 0.83392333984375, 0.9581298828125, 1.08233642578125, 1.20654296875, 1.33074951171875, 1.4549560546875, 1.57916259765625, 1.703369140625, 1.82757568359375, 1.9517822265625, 2.07598876953125, 2.2001953125, 2.32440185546875, 2.4486083984375, 2.57281494140625, 2.697021484375, 2.82122802734375, 2.9454345703125, 3.06964111328125, 3.19384765625, 3.31805419921875, 3.4422607421875, 3.56646728515625, 3.690673828125, 3.81488037109375, 3.9390869140625, 4.06329345703125, 4.1875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 11.0, 8.0, 8.0, 16.0, 10.0, 20.0, 23.0, 20.0, 18.0, 32.0, 25.0, 38.0, 42.0, 38.0, 42.0, 43.0, 39.0, 44.0, 48.0, 35.0, 51.0, 45.0, 30.0, 38.0, 35.0, 33.0, 29.0, 27.0, 27.0, 12.0, 14.0, 10.0, 15.0, 10.0, 9.0, 11.0, 8.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.197265625, -3.105224609375, -3.01318359375, -2.921142578125, -2.8291015625, -2.737060546875, -2.64501953125, -2.552978515625, -2.4609375, -2.368896484375, -2.27685546875, -2.184814453125, -2.0927734375, -2.000732421875, -1.90869140625, -1.816650390625, -1.724609375, -1.632568359375, -1.54052734375, -1.448486328125, -1.3564453125, -1.264404296875, -1.17236328125, -1.080322265625, -0.98828125, -0.896240234375, -0.80419921875, -0.712158203125, -0.6201171875, -0.528076171875, -0.43603515625, -0.343994140625, -0.251953125, -0.159912109375, -0.06787109375, 0.024169921875, 0.1162109375, 0.208251953125, 0.30029296875, 0.392333984375, 0.484375, 0.576416015625, 0.66845703125, 0.760498046875, 0.8525390625, 0.944580078125, 1.03662109375, 1.128662109375, 1.220703125, 1.312744140625, 1.40478515625, 1.496826171875, 1.5888671875, 1.680908203125, 1.77294921875, 1.864990234375, 1.95703125, 2.049072265625, 2.14111328125, 2.233154296875, 2.3251953125, 2.417236328125, 2.50927734375, 2.601318359375, 2.693359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 12.0, 23.0, 23.0, 35.0, 53.0, 99.0, 202.0, 436.0, 1085.0, 3628.0, 19768.0, 302343.0, 3692132.0, 156177.0, 13740.0, 2815.0, 822.0, 333.0, 194.0, 100.0, 73.0, 41.0, 29.0, 24.0, 10.0, 10.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.78125, -7.50732421875, -7.2333984375, -6.95947265625, -6.685546875, -6.41162109375, -6.1376953125, -5.86376953125, -5.58984375, -5.31591796875, -5.0419921875, -4.76806640625, -4.494140625, -4.22021484375, -3.9462890625, -3.67236328125, -3.3984375, -3.12451171875, -2.8505859375, -2.57666015625, -2.302734375, -2.02880859375, -1.7548828125, -1.48095703125, -1.20703125, -0.93310546875, -0.6591796875, -0.38525390625, -0.111328125, 0.16259765625, 0.4365234375, 0.71044921875, 0.984375, 1.25830078125, 1.5322265625, 1.80615234375, 2.080078125, 2.35400390625, 2.6279296875, 2.90185546875, 3.17578125, 3.44970703125, 3.7236328125, 3.99755859375, 4.271484375, 4.54541015625, 4.8193359375, 5.09326171875, 5.3671875, 5.64111328125, 5.9150390625, 6.18896484375, 6.462890625, 6.73681640625, 7.0107421875, 7.28466796875, 7.55859375, 7.83251953125, 8.1064453125, 8.38037109375, 8.654296875, 8.92822265625, 9.2021484375, 9.47607421875, 9.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 11.0, 4.0, 4.0, 9.0, 15.0, 24.0, 26.0, 44.0, 47.0, 66.0, 125.0, 155.0, 235.0, 405.0, 598.0, 693.0, 528.0, 355.0, 213.0, 154.0, 106.0, 60.0, 50.0, 40.0, 21.0, 17.0, 15.0, 6.0, 11.0, 5.0, 6.0, 3.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -4.9573974609375, -4.762451171875, -4.5675048828125, -4.37255859375, -4.1776123046875, -3.982666015625, -3.7877197265625, -3.5927734375, -3.3978271484375, -3.202880859375, -3.0079345703125, -2.81298828125, -2.6180419921875, -2.423095703125, -2.2281494140625, -2.033203125, -1.8382568359375, -1.643310546875, -1.4483642578125, -1.25341796875, -1.0584716796875, -0.863525390625, -0.6685791015625, -0.4736328125, -0.2786865234375, -0.083740234375, 0.1112060546875, 0.30615234375, 0.5010986328125, 0.696044921875, 0.8909912109375, 1.0859375, 1.2808837890625, 1.475830078125, 1.6707763671875, 1.86572265625, 2.0606689453125, 2.255615234375, 2.4505615234375, 2.6455078125, 2.8404541015625, 3.035400390625, 3.2303466796875, 3.42529296875, 3.6202392578125, 3.815185546875, 4.0101318359375, 4.205078125, 4.4000244140625, 4.594970703125, 4.7899169921875, 4.98486328125, 5.1798095703125, 5.374755859375, 5.5697021484375, 5.7646484375, 5.9595947265625, 6.154541015625, 6.3494873046875, 6.54443359375, 6.7393798828125, 6.934326171875, 7.1292724609375, 7.32421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 10.0, 19.0, 70.0, 281.0, 411.0, 166.0, 33.0, 11.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.41714477539062, -78.56761932373047, -74.71809387207031, -70.86856079101562, -67.01903533935547, -63.16950988769531, -59.31998062133789, -55.47045135498047, -51.62092590332031, -47.771400451660156, -43.921871185302734, -40.07234191894531, -36.222816467285156, -32.373291015625, -28.523761749267578, -24.67423439025879, -20.82470703125, -16.97517967224121, -13.125652313232422, -9.276124954223633, -5.426597595214844, -1.5770702362060547, 2.2724571228027344, 6.121984481811523, 9.971511840820312, 13.821039199829102, 17.67056655883789, 21.52009391784668, 25.36962127685547, 29.219148635864258, 33.06867599487305, 36.91820526123047, 40.767730712890625, 44.61725616455078, 48.4667854309082, 52.316314697265625, 56.16584014892578, 60.01536560058594, 63.86489486694336, 67.71442413330078, 71.56394958496094, 75.4134750366211, 79.26300048828125, 83.11253356933594, 86.9620590209961, 90.81158447265625, 94.66111755371094, 98.5106430053711, 102.36016845703125, 106.2096939086914, 110.05921936035156, 113.90875244140625, 117.7582778930664, 121.60780334472656, 125.45733642578125, 129.30685424804688, 133.15638732910156, 137.00592041015625, 140.85543823242188, 144.70497131347656, 148.55450439453125, 152.40402221679688, 156.25355529785156, 160.1030731201172, 163.95260620117188]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 7.0, 13.0, 11.0, 7.0, 14.0, 30.0, 17.0, 24.0, 41.0, 46.0, 43.0, 59.0, 50.0, 63.0, 61.0, 55.0, 64.0, 58.0, 62.0, 42.0, 31.0, 30.0, 24.0, 34.0, 26.0, 16.0, 17.0, 14.0, 7.0, 10.0, 9.0, 1.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.14480972290039, -43.93681335449219, -42.728816986083984, -41.52082061767578, -40.312828063964844, -39.10483169555664, -37.89683532714844, -36.688838958740234, -35.48084259033203, -34.27284622192383, -33.064849853515625, -31.856855392456055, -30.64885902404785, -29.44086265563965, -28.232868194580078, -27.024871826171875, -25.816875457763672, -24.60887908935547, -23.400882720947266, -22.192888259887695, -20.984891891479492, -19.77689552307129, -18.56890106201172, -17.360904693603516, -16.152908325195312, -14.94491195678711, -13.736916542053223, -12.528921127319336, -11.320924758911133, -10.11292839050293, -8.904932975769043, -7.696937561035156, -6.488941192626953, -5.280945301055908, -4.072949409484863, -2.8649535179138184, -1.6569576263427734, -0.4489617347717285, 0.7590341567993164, 1.9670295715332031, 3.1750259399414062, 4.383021831512451, 5.591017723083496, 6.799013614654541, 8.007009506225586, 9.215005874633789, 10.423001289367676, 11.630996704101562, 12.838993072509766, 14.046989440917969, 15.254984855651855, 16.462980270385742, 17.670976638793945, 18.87897300720215, 20.08696746826172, 21.294963836669922, 22.502960205078125, 23.710956573486328, 24.91895294189453, 26.1269474029541, 27.334943771362305, 28.542940139770508, 29.750934600830078, 30.95893096923828, 32.166927337646484]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 12.0, 14.0, 16.0, 28.0, 47.0, 67.0, 103.0, 148.0, 258.0, 532.0, 974.0, 1848.0, 3800.0, 8312.0, 20703.0, 59817.0, 216713.0, 485102.0, 169284.0, 49036.0, 17577.0, 7256.0, 3317.0, 1617.0, 847.0, 450.0, 257.0, 141.0, 102.0, 63.0, 38.0, 19.0, 15.0, 3.0, 9.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.6756591796875, -5.515380859375, -5.3551025390625, -5.19482421875, -5.0345458984375, -4.874267578125, -4.7139892578125, -4.5537109375, -4.3934326171875, -4.233154296875, -4.0728759765625, -3.91259765625, -3.7523193359375, -3.592041015625, -3.4317626953125, -3.271484375, -3.1112060546875, -2.950927734375, -2.7906494140625, -2.63037109375, -2.4700927734375, -2.309814453125, -2.1495361328125, -1.9892578125, -1.8289794921875, -1.668701171875, -1.5084228515625, -1.34814453125, -1.1878662109375, -1.027587890625, -0.8673095703125, -0.70703125, -0.5467529296875, -0.386474609375, -0.2261962890625, -0.06591796875, 0.0943603515625, 0.254638671875, 0.4149169921875, 0.5751953125, 0.7354736328125, 0.895751953125, 1.0560302734375, 1.21630859375, 1.3765869140625, 1.536865234375, 1.6971435546875, 1.857421875, 2.0177001953125, 2.177978515625, 2.3382568359375, 2.49853515625, 2.6588134765625, 2.819091796875, 2.9793701171875, 3.1396484375, 3.2999267578125, 3.460205078125, 3.6204833984375, 3.78076171875, 3.9410400390625, 4.101318359375, 4.2615966796875, 4.421875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 9.0, 14.0, 16.0, 14.0, 12.0, 19.0, 30.0, 23.0, 21.0, 25.0, 40.0, 41.0, 36.0, 35.0, 47.0, 33.0, 47.0, 55.0, 43.0, 44.0, 51.0, 39.0, 48.0, 35.0, 23.0, 33.0, 19.0, 21.0, 20.0, 16.0, 16.0, 12.0, 8.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.453125, -3.354034423828125, -3.25494384765625, -3.155853271484375, -3.0567626953125, -2.957672119140625, -2.85858154296875, -2.759490966796875, -2.660400390625, -2.561309814453125, -2.46221923828125, -2.363128662109375, -2.2640380859375, -2.164947509765625, -2.06585693359375, -1.966766357421875, -1.86767578125, -1.768585205078125, -1.66949462890625, -1.570404052734375, -1.4713134765625, -1.372222900390625, -1.27313232421875, -1.174041748046875, -1.074951171875, -0.975860595703125, -0.87677001953125, -0.777679443359375, -0.6785888671875, -0.579498291015625, -0.48040771484375, -0.381317138671875, -0.2822265625, -0.183135986328125, -0.08404541015625, 0.015045166015625, 0.1141357421875, 0.213226318359375, 0.31231689453125, 0.411407470703125, 0.510498046875, 0.609588623046875, 0.70867919921875, 0.807769775390625, 0.9068603515625, 1.005950927734375, 1.10504150390625, 1.204132080078125, 1.30322265625, 1.402313232421875, 1.50140380859375, 1.600494384765625, 1.6995849609375, 1.798675537109375, 1.89776611328125, 1.996856689453125, 2.095947265625, 2.195037841796875, 2.29412841796875, 2.393218994140625, 2.4923095703125, 2.591400146484375, 2.69049072265625, 2.789581298828125, 2.888671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 13.0, 5.0, 17.0, 9.0, 20.0, 29.0, 34.0, 52.0, 64.0, 116.0, 162.0, 246.0, 391.0, 638.0, 1117.0, 2570.0, 7325.0, 33760.0, 624872.0, 334560.0, 30522.0, 6795.0, 2417.0, 1166.0, 573.0, 353.0, 208.0, 140.0, 113.0, 65.0, 37.0, 52.0, 27.0, 18.0, 14.0, 8.0, 11.0, 11.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.6134033203125, -8.343994140625, -8.0745849609375, -7.80517578125, -7.5357666015625, -7.266357421875, -6.9969482421875, -6.7275390625, -6.4581298828125, -6.188720703125, -5.9193115234375, -5.64990234375, -5.3804931640625, -5.111083984375, -4.8416748046875, -4.572265625, -4.3028564453125, -4.033447265625, -3.7640380859375, -3.49462890625, -3.2252197265625, -2.955810546875, -2.6864013671875, -2.4169921875, -2.1475830078125, -1.878173828125, -1.6087646484375, -1.33935546875, -1.0699462890625, -0.800537109375, -0.5311279296875, -0.26171875, 0.0076904296875, 0.277099609375, 0.5465087890625, 0.81591796875, 1.0853271484375, 1.354736328125, 1.6241455078125, 1.8935546875, 2.1629638671875, 2.432373046875, 2.7017822265625, 2.97119140625, 3.2406005859375, 3.510009765625, 3.7794189453125, 4.048828125, 4.3182373046875, 4.587646484375, 4.8570556640625, 5.12646484375, 5.3958740234375, 5.665283203125, 5.9346923828125, 6.2041015625, 6.4735107421875, 6.742919921875, 7.0123291015625, 7.28173828125, 7.5511474609375, 7.820556640625, 8.0899658203125, 8.359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 9.0, 17.0, 10.0, 19.0, 15.0, 24.0, 29.0, 33.0, 47.0, 42.0, 49.0, 51.0, 80.0, 82.0, 52.0, 64.0, 46.0, 47.0, 40.0, 46.0, 29.0, 32.0, 19.0, 27.0, 13.0, 17.0, 7.0, 9.0, 8.0, 5.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4296875, -14.0040283203125, -13.578369140625, -13.1527099609375, -12.72705078125, -12.3013916015625, -11.875732421875, -11.4500732421875, -11.0244140625, -10.5987548828125, -10.173095703125, -9.7474365234375, -9.32177734375, -8.8961181640625, -8.470458984375, -8.0447998046875, -7.619140625, -7.1934814453125, -6.767822265625, -6.3421630859375, -5.91650390625, -5.4908447265625, -5.065185546875, -4.6395263671875, -4.2138671875, -3.7882080078125, -3.362548828125, -2.9368896484375, -2.51123046875, -2.0855712890625, -1.659912109375, -1.2342529296875, -0.80859375, -0.3829345703125, 0.042724609375, 0.4683837890625, 0.89404296875, 1.3197021484375, 1.745361328125, 2.1710205078125, 2.5966796875, 3.0223388671875, 3.447998046875, 3.8736572265625, 4.29931640625, 4.7249755859375, 5.150634765625, 5.5762939453125, 6.001953125, 6.4276123046875, 6.853271484375, 7.2789306640625, 7.70458984375, 8.1302490234375, 8.555908203125, 8.9815673828125, 9.4072265625, 9.8328857421875, 10.258544921875, 10.6842041015625, 11.10986328125, 11.5355224609375, 11.961181640625, 12.3868408203125, 12.8125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 7.0, 10.0, 7.0, 14.0, 14.0, 25.0, 24.0, 30.0, 38.0, 54.0, 61.0, 104.0, 157.0, 294.0, 550.0, 1244.0, 3383.0, 11295.0, 65746.0, 844508.0, 99093.0, 14698.0, 4165.0, 1529.0, 642.0, 327.0, 156.0, 109.0, 63.0, 47.0, 33.0, 25.0, 15.0, 16.0, 15.0, 12.0, 9.0, 6.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.61328125, -2.5330810546875, -2.452880859375, -2.3726806640625, -2.29248046875, -2.2122802734375, -2.132080078125, -2.0518798828125, -1.9716796875, -1.8914794921875, -1.811279296875, -1.7310791015625, -1.65087890625, -1.5706787109375, -1.490478515625, -1.4102783203125, -1.330078125, -1.2498779296875, -1.169677734375, -1.0894775390625, -1.00927734375, -0.9290771484375, -0.848876953125, -0.7686767578125, -0.6884765625, -0.6082763671875, -0.528076171875, -0.4478759765625, -0.36767578125, -0.2874755859375, -0.207275390625, -0.1270751953125, -0.046875, 0.0333251953125, 0.113525390625, 0.1937255859375, 0.27392578125, 0.3541259765625, 0.434326171875, 0.5145263671875, 0.5947265625, 0.6749267578125, 0.755126953125, 0.8353271484375, 0.91552734375, 0.9957275390625, 1.075927734375, 1.1561279296875, 1.236328125, 1.3165283203125, 1.396728515625, 1.4769287109375, 1.55712890625, 1.6373291015625, 1.717529296875, 1.7977294921875, 1.8779296875, 1.9581298828125, 2.038330078125, 2.1185302734375, 2.19873046875, 2.2789306640625, 2.359130859375, 2.4393310546875, 2.51953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 12.0, 2.0, 4.0, 5.0, 9.0, 18.0, 13.0, 26.0, 35.0, 86.0, 107.0, 218.0, 159.0, 94.0, 70.0, 37.0, 30.0, 17.0, 18.0, 10.0, 6.0, 10.0, 6.0, 2.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008029937744140625, -0.0007805302739143372, -0.0007580667734146118, -0.0007356032729148865, -0.0007131397724151611, -0.0006906762719154358, -0.0006682127714157104, -0.0006457492709159851, -0.0006232857704162598, -0.0006008222699165344, -0.0005783587694168091, -0.0005558952689170837, -0.0005334317684173584, -0.0005109682679176331, -0.0004885047674179077, -0.0004660412669181824, -0.00044357776641845703, -0.0004211142659187317, -0.00039865076541900635, -0.000376187264919281, -0.00035372376441955566, -0.0003312602639198303, -0.000308796763420105, -0.00028633326292037964, -0.0002638697624206543, -0.00024140626192092896, -0.0002189427614212036, -0.00019647926092147827, -0.00017401576042175293, -0.0001515522599220276, -0.00012908875942230225, -0.0001066252589225769, -8.416175842285156e-05, -6.169825792312622e-05, -3.923475742340088e-05, -1.6771256923675537e-05, 5.692243576049805e-06, 2.8155744075775146e-05, 5.061924457550049e-05, 7.308274507522583e-05, 9.554624557495117e-05, 0.00011800974607467651, 0.00014047324657440186, 0.0001629367470741272, 0.00018540024757385254, 0.00020786374807357788, 0.00023032724857330322, 0.00025279074907302856, 0.0002752542495727539, 0.00029771775007247925, 0.0003201812505722046, 0.00034264475107192993, 0.0003651082515716553, 0.0003875717520713806, 0.00041003525257110596, 0.0004324987530708313, 0.00045496225357055664, 0.000477425754070282, 0.0004998892545700073, 0.0005223527550697327, 0.000544816255569458, 0.0005672797560691833, 0.0005897432565689087, 0.000612206757068634, 0.0006346702575683594]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 15.0, 12.0, 20.0, 18.0, 26.0, 43.0, 66.0, 74.0, 164.0, 194.0, 384.0, 697.0, 1390.0, 2961.0, 7240.0, 26456.0, 221800.0, 721860.0, 46991.0, 10337.0, 3872.0, 1799.0, 903.0, 444.0, 261.0, 165.0, 120.0, 67.0, 49.0, 50.0, 25.0, 13.0, 11.0, 10.0, 13.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.014892578125, -1.94580078125, -1.876708984375, -1.8076171875, -1.738525390625, -1.66943359375, -1.600341796875, -1.53125, -1.462158203125, -1.39306640625, -1.323974609375, -1.2548828125, -1.185791015625, -1.11669921875, -1.047607421875, -0.978515625, -0.909423828125, -0.84033203125, -0.771240234375, -0.7021484375, -0.633056640625, -0.56396484375, -0.494873046875, -0.42578125, -0.356689453125, -0.28759765625, -0.218505859375, -0.1494140625, -0.080322265625, -0.01123046875, 0.057861328125, 0.126953125, 0.196044921875, 0.26513671875, 0.334228515625, 0.4033203125, 0.472412109375, 0.54150390625, 0.610595703125, 0.6796875, 0.748779296875, 0.81787109375, 0.886962890625, 0.9560546875, 1.025146484375, 1.09423828125, 1.163330078125, 1.232421875, 1.301513671875, 1.37060546875, 1.439697265625, 1.5087890625, 1.577880859375, 1.64697265625, 1.716064453125, 1.78515625, 1.854248046875, 1.92333984375, 1.992431640625, 2.0615234375, 2.130615234375, 2.19970703125, 2.268798828125, 2.337890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 5.0, 10.0, 9.0, 13.0, 23.0, 30.0, 32.0, 38.0, 47.0, 66.0, 110.0, 117.0, 111.0, 90.0, 62.0, 60.0, 39.0, 41.0, 21.0, 16.0, 12.0, 9.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.3294677734375, -2.260498046875, -2.1915283203125, -2.12255859375, -2.0535888671875, -1.984619140625, -1.9156494140625, -1.8466796875, -1.7777099609375, -1.708740234375, -1.6397705078125, -1.57080078125, -1.5018310546875, -1.432861328125, -1.3638916015625, -1.294921875, -1.2259521484375, -1.156982421875, -1.0880126953125, -1.01904296875, -0.9500732421875, -0.881103515625, -0.8121337890625, -0.7431640625, -0.6741943359375, -0.605224609375, -0.5362548828125, -0.46728515625, -0.3983154296875, -0.329345703125, -0.2603759765625, -0.19140625, -0.1224365234375, -0.053466796875, 0.0155029296875, 0.08447265625, 0.1534423828125, 0.222412109375, 0.2913818359375, 0.3603515625, 0.4293212890625, 0.498291015625, 0.5672607421875, 0.63623046875, 0.7052001953125, 0.774169921875, 0.8431396484375, 0.912109375, 0.9810791015625, 1.050048828125, 1.1190185546875, 1.18798828125, 1.2569580078125, 1.325927734375, 1.3948974609375, 1.4638671875, 1.5328369140625, 1.601806640625, 1.6707763671875, 1.73974609375, 1.8087158203125, 1.877685546875, 1.9466552734375, 2.015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 4.0, 9.0, 10.0, 16.0, 42.0, 148.0, 452.0, 236.0, 58.0, 13.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.41390991210938, -126.9677963256836, -123.52168273925781, -120.07557678222656, -116.62946319580078, -113.183349609375, -109.73723602294922, -106.29112243652344, -102.84501647949219, -99.3989028930664, -95.95278930664062, -92.50668334960938, -89.0605697631836, -85.61445617675781, -82.16834259033203, -78.72222900390625, -75.27611541748047, -71.83000183105469, -68.3838882446289, -64.93777465820312, -61.491668701171875, -58.045555114746094, -54.59944152832031, -51.15332794189453, -47.707218170166016, -44.261104583740234, -40.81499481201172, -37.36888122558594, -33.922767639160156, -30.47665786743164, -27.03054428100586, -23.58443260192871, -20.138320922851562, -16.692209243774414, -13.24609661102295, -9.799983978271484, -6.353872299194336, -2.9077606201171875, 0.5383529663085938, 3.984464645385742, 7.430576324462891, 10.876688003540039, 14.322800636291504, 17.76891326904297, 21.215024948120117, 24.661136627197266, 28.107250213623047, 31.553361892700195, 34.999473571777344, 38.445587158203125, 41.89169692993164, 45.33781051635742, 48.78392028808594, 52.23003387451172, 55.6761474609375, 59.12226104736328, 62.5683708190918, 66.01448059082031, 69.4605941772461, 72.90670776367188, 76.35282135009766, 79.79893493652344, 83.24504089355469, 86.69115447998047, 90.13726806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 11.0, 21.0, 12.0, 19.0, 29.0, 22.0, 23.0, 43.0, 39.0, 47.0, 51.0, 93.0, 145.0, 109.0, 61.0, 42.0, 37.0, 41.0, 23.0, 25.0, 18.0, 16.0, 15.0, 15.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.756980895996094, -56.95661926269531, -55.156253814697266, -53.35588836669922, -51.55552673339844, -49.755165100097656, -47.95479965209961, -46.15443420410156, -44.35407257080078, -42.5537109375, -40.75334548950195, -38.952980041503906, -37.152618408203125, -35.352256774902344, -33.5518913269043, -31.751527786254883, -29.95116424560547, -28.150800704956055, -26.35043716430664, -24.550073623657227, -22.749710083007812, -20.9493465423584, -19.148983001708984, -17.34861946105957, -15.548255920410156, -13.747892379760742, -11.947528839111328, -10.147165298461914, -8.3468017578125, -6.546438217163086, -4.746074676513672, -2.945711135864258, -1.1453437805175781, 0.6550197601318359, 2.45538330078125, 4.255746841430664, 6.056110382080078, 7.856473922729492, 9.656837463378906, 11.45720100402832, 13.257564544677734, 15.057928085327148, 16.858291625976562, 18.658655166625977, 20.45901870727539, 22.259382247924805, 24.05974578857422, 25.860109329223633, 27.660472869873047, 29.46083641052246, 31.261199951171875, 33.061561584472656, 34.8619270324707, 36.66229248046875, 38.46265411376953, 40.26301574707031, 42.06338119506836, 43.863746643066406, 45.66410827636719, 47.46446990966797, 49.264835357666016, 51.06520080566406, 52.865562438964844, 54.665924072265625, 56.46628952026367]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 3.0, 6.0, 1.0, 8.0, 9.0, 12.0, 14.0, 24.0, 17.0, 44.0, 53.0, 86.0, 97.0, 179.0, 279.0, 454.0, 798.0, 1431.0, 3028.0, 6902.0, 19815.0, 94522.0, 782103.0, 2502940.0, 664820.0, 85765.0, 18638.0, 6243.0, 2848.0, 1304.0, 690.0, 428.0, 247.0, 149.0, 105.0, 70.0, 42.0, 23.0, 27.0, 23.0, 16.0, 8.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.97265625, -6.77032470703125, -6.5679931640625, -6.36566162109375, -6.163330078125, -5.96099853515625, -5.7586669921875, -5.55633544921875, -5.35400390625, -5.15167236328125, -4.9493408203125, -4.74700927734375, -4.544677734375, -4.34234619140625, -4.1400146484375, -3.93768310546875, -3.7353515625, -3.53302001953125, -3.3306884765625, -3.12835693359375, -2.926025390625, -2.72369384765625, -2.5213623046875, -2.31903076171875, -2.11669921875, -1.91436767578125, -1.7120361328125, -1.50970458984375, -1.307373046875, -1.10504150390625, -0.9027099609375, -0.70037841796875, -0.498046875, -0.29571533203125, -0.0933837890625, 0.10894775390625, 0.311279296875, 0.51361083984375, 0.7159423828125, 0.91827392578125, 1.12060546875, 1.32293701171875, 1.5252685546875, 1.72760009765625, 1.929931640625, 2.13226318359375, 2.3345947265625, 2.53692626953125, 2.7392578125, 2.94158935546875, 3.1439208984375, 3.34625244140625, 3.548583984375, 3.75091552734375, 3.9532470703125, 4.15557861328125, 4.35791015625, 4.56024169921875, 4.7625732421875, 4.96490478515625, 5.167236328125, 5.36956787109375, 5.5718994140625, 5.77423095703125, 5.9765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 2.0, 7.0, 11.0, 15.0, 10.0, 15.0, 14.0, 27.0, 30.0, 33.0, 29.0, 42.0, 37.0, 38.0, 37.0, 41.0, 37.0, 41.0, 46.0, 65.0, 34.0, 47.0, 41.0, 48.0, 41.0, 39.0, 21.0, 21.0, 25.0, 20.0, 9.0, 23.0, 9.0, 10.0, 5.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.302734375, -3.205535888671875, -3.10833740234375, -3.011138916015625, -2.9139404296875, -2.816741943359375, -2.71954345703125, -2.622344970703125, -2.525146484375, -2.427947998046875, -2.33074951171875, -2.233551025390625, -2.1363525390625, -2.039154052734375, -1.94195556640625, -1.844757080078125, -1.74755859375, -1.650360107421875, -1.55316162109375, -1.455963134765625, -1.3587646484375, -1.261566162109375, -1.16436767578125, -1.067169189453125, -0.969970703125, -0.872772216796875, -0.77557373046875, -0.678375244140625, -0.5811767578125, -0.483978271484375, -0.38677978515625, -0.289581298828125, -0.1923828125, -0.095184326171875, 0.00201416015625, 0.099212646484375, 0.1964111328125, 0.293609619140625, 0.39080810546875, 0.488006591796875, 0.585205078125, 0.682403564453125, 0.77960205078125, 0.876800537109375, 0.9739990234375, 1.071197509765625, 1.16839599609375, 1.265594482421875, 1.36279296875, 1.459991455078125, 1.55718994140625, 1.654388427734375, 1.7515869140625, 1.848785400390625, 1.94598388671875, 2.043182373046875, 2.140380859375, 2.237579345703125, 2.33477783203125, 2.431976318359375, 2.5291748046875, 2.626373291015625, 2.72357177734375, 2.820770263671875, 2.91796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 10.0, 16.0, 30.0, 49.0, 83.0, 150.0, 302.0, 600.0, 1792.0, 11133.0, 2683297.0, 1484557.0, 9444.0, 1641.0, 578.0, 269.0, 135.0, 76.0, 39.0, 22.0, 16.0, 12.0, 9.0, 7.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.6875, -28.94482421875, -28.2021484375, -27.45947265625, -26.716796875, -25.97412109375, -25.2314453125, -24.48876953125, -23.74609375, -23.00341796875, -22.2607421875, -21.51806640625, -20.775390625, -20.03271484375, -19.2900390625, -18.54736328125, -17.8046875, -17.06201171875, -16.3193359375, -15.57666015625, -14.833984375, -14.09130859375, -13.3486328125, -12.60595703125, -11.86328125, -11.12060546875, -10.3779296875, -9.63525390625, -8.892578125, -8.14990234375, -7.4072265625, -6.66455078125, -5.921875, -5.17919921875, -4.4365234375, -3.69384765625, -2.951171875, -2.20849609375, -1.4658203125, -0.72314453125, 0.01953125, 0.76220703125, 1.5048828125, 2.24755859375, 2.990234375, 3.73291015625, 4.4755859375, 5.21826171875, 5.9609375, 6.70361328125, 7.4462890625, 8.18896484375, 8.931640625, 9.67431640625, 10.4169921875, 11.15966796875, 11.90234375, 12.64501953125, 13.3876953125, 14.13037109375, 14.873046875, 15.61572265625, 16.3583984375, 17.10107421875, 17.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 5.0, 10.0, 12.0, 17.0, 38.0, 39.0, 61.0, 88.0, 125.0, 205.0, 382.0, 622.0, 823.0, 618.0, 396.0, 226.0, 136.0, 90.0, 51.0, 43.0, 26.0, 21.0, 11.0, 11.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.150634765625, -8.76220703125, -8.373779296875, -7.9853515625, -7.596923828125, -7.20849609375, -6.820068359375, -6.431640625, -6.043212890625, -5.65478515625, -5.266357421875, -4.8779296875, -4.489501953125, -4.10107421875, -3.712646484375, -3.32421875, -2.935791015625, -2.54736328125, -2.158935546875, -1.7705078125, -1.382080078125, -0.99365234375, -0.605224609375, -0.216796875, 0.171630859375, 0.56005859375, 0.948486328125, 1.3369140625, 1.725341796875, 2.11376953125, 2.502197265625, 2.890625, 3.279052734375, 3.66748046875, 4.055908203125, 4.4443359375, 4.832763671875, 5.22119140625, 5.609619140625, 5.998046875, 6.386474609375, 6.77490234375, 7.163330078125, 7.5517578125, 7.940185546875, 8.32861328125, 8.717041015625, 9.10546875, 9.493896484375, 9.88232421875, 10.270751953125, 10.6591796875, 11.047607421875, 11.43603515625, 11.824462890625, 12.212890625, 12.601318359375, 12.98974609375, 13.378173828125, 13.7666015625, 14.155029296875, 14.54345703125, 14.931884765625, 15.3203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 10.0, 12.0, 24.0, 34.0, 71.0, 132.0, 203.0, 188.0, 131.0, 77.0, 31.0, 19.0, 17.0, 6.0, 4.0, 8.0, 7.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-128.28350830078125, -124.50596618652344, -120.7284164428711, -116.95087432861328, -113.17332458496094, -109.39578247070312, -105.61823272705078, -101.84069061279297, -98.06314086914062, -94.28559875488281, -90.50804901123047, -86.73050689697266, -82.95295715332031, -79.1754150390625, -75.39786529541016, -71.62032318115234, -67.8427734375, -64.06523132324219, -60.287681579589844, -56.510135650634766, -52.73258972167969, -48.955047607421875, -45.17749786376953, -41.39995574951172, -37.622413635253906, -33.84486770629883, -30.06732177734375, -26.289775848388672, -22.512229919433594, -18.73468589782715, -14.95713996887207, -11.179594039916992, -7.402046203613281, -3.6245005130767822, 0.1530451774597168, 3.9305906295776367, 7.708136558532715, 11.485681533813477, 15.263227462768555, 19.040773391723633, 22.81831932067871, 26.59586524963379, 30.373411178588867, 34.15095520019531, 37.92850112915039, 41.70604705810547, 45.48359298706055, 49.261138916015625, 53.0386848449707, 56.81623077392578, 60.59377670288086, 64.37132263183594, 68.14886474609375, 71.9264144897461, 75.7039566040039, 79.48150634765625, 83.25904846191406, 87.03659057617188, 90.81414031982422, 94.59168243408203, 98.36923217773438, 102.14677429199219, 105.92432403564453, 109.70186614990234, 113.47941589355469]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 10.0, 12.0, 20.0, 27.0, 35.0, 33.0, 61.0, 35.0, 68.0, 85.0, 75.0, 87.0, 73.0, 57.0, 60.0, 65.0, 39.0, 35.0, 30.0, 24.0, 22.0, 10.0, 8.0, 13.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.88571166992188, -93.31988525390625, -90.75405883789062, -88.188232421875, -85.62240600585938, -83.05657196044922, -80.4907455444336, -77.92491912841797, -75.35909271240234, -72.79326629638672, -70.2274398803711, -67.66161346435547, -65.09577941894531, -62.52995681762695, -59.96412658691406, -57.39830017089844, -54.83247375488281, -52.26664733886719, -49.70082092285156, -47.13499069213867, -44.56916427612305, -42.00333786010742, -39.43750762939453, -36.871681213378906, -34.30585479736328, -31.740028381347656, -29.1742000579834, -26.60837173461914, -24.042545318603516, -21.47671890258789, -18.910890579223633, -16.345062255859375, -13.77923583984375, -11.213408470153809, -8.647581100463867, -6.081753730773926, -3.5159263610839844, -0.950098991394043, 1.6157283782958984, 4.181556701660156, 6.747383117675781, 9.313210487365723, 11.879037857055664, 14.444865226745605, 17.010692596435547, 19.576519012451172, 22.14234733581543, 24.708175659179688, 27.274002075195312, 29.839828491210938, 32.40565490722656, 34.97148513793945, 37.53731155395508, 40.1031379699707, 42.668968200683594, 45.23479461669922, 47.800621032714844, 50.36644744873047, 52.932273864746094, 55.498104095458984, 58.06393051147461, 60.629756927490234, 63.195587158203125, 65.76141357421875, 68.32723999023438]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0, 10.0, 16.0, 22.0, 28.0, 35.0, 54.0, 99.0, 162.0, 243.0, 425.0, 775.0, 1491.0, 3080.0, 7074.0, 18977.0, 61848.0, 298965.0, 527453.0, 85705.0, 25184.0, 9157.0, 3756.0, 1799.0, 934.0, 518.0, 272.0, 164.0, 106.0, 71.0, 31.0, 24.0, 29.0, 18.0, 7.0, 8.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.1304931640625, -3.983642578125, -3.8367919921875, -3.68994140625, -3.5430908203125, -3.396240234375, -3.2493896484375, -3.1025390625, -2.9556884765625, -2.808837890625, -2.6619873046875, -2.51513671875, -2.3682861328125, -2.221435546875, -2.0745849609375, -1.927734375, -1.7808837890625, -1.634033203125, -1.4871826171875, -1.34033203125, -1.1934814453125, -1.046630859375, -0.8997802734375, -0.7529296875, -0.6060791015625, -0.459228515625, -0.3123779296875, -0.16552734375, -0.0186767578125, 0.128173828125, 0.2750244140625, 0.421875, 0.5687255859375, 0.715576171875, 0.8624267578125, 1.00927734375, 1.1561279296875, 1.302978515625, 1.4498291015625, 1.5966796875, 1.7435302734375, 1.890380859375, 2.0372314453125, 2.18408203125, 2.3309326171875, 2.477783203125, 2.6246337890625, 2.771484375, 2.9183349609375, 3.065185546875, 3.2120361328125, 3.35888671875, 3.5057373046875, 3.652587890625, 3.7994384765625, 3.9462890625, 4.0931396484375, 4.239990234375, 4.3868408203125, 4.53369140625, 4.6805419921875, 4.827392578125, 4.9742431640625, 5.12109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 10.0, 16.0, 21.0, 23.0, 29.0, 24.0, 28.0, 37.0, 51.0, 51.0, 53.0, 67.0, 65.0, 61.0, 54.0, 58.0, 56.0, 60.0, 42.0, 48.0, 36.0, 25.0, 21.0, 17.0, 13.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.32501220703125, -5.1773681640625, -5.02972412109375, -4.882080078125, -4.73443603515625, -4.5867919921875, -4.43914794921875, -4.29150390625, -4.14385986328125, -3.9962158203125, -3.84857177734375, -3.700927734375, -3.55328369140625, -3.4056396484375, -3.25799560546875, -3.1103515625, -2.96270751953125, -2.8150634765625, -2.66741943359375, -2.519775390625, -2.37213134765625, -2.2244873046875, -2.07684326171875, -1.92919921875, -1.78155517578125, -1.6339111328125, -1.48626708984375, -1.338623046875, -1.19097900390625, -1.0433349609375, -0.89569091796875, -0.748046875, -0.60040283203125, -0.4527587890625, -0.30511474609375, -0.157470703125, -0.00982666015625, 0.1378173828125, 0.28546142578125, 0.43310546875, 0.58074951171875, 0.7283935546875, 0.87603759765625, 1.023681640625, 1.17132568359375, 1.3189697265625, 1.46661376953125, 1.6142578125, 1.76190185546875, 1.9095458984375, 2.05718994140625, 2.204833984375, 2.35247802734375, 2.5001220703125, 2.64776611328125, 2.79541015625, 2.94305419921875, 3.0906982421875, 3.23834228515625, 3.385986328125, 3.53363037109375, 3.6812744140625, 3.82891845703125, 3.9765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 7.0, 6.0, 5.0, 16.0, 11.0, 14.0, 23.0, 23.0, 33.0, 65.0, 83.0, 131.0, 185.0, 287.0, 555.0, 1322.0, 3822.0, 20121.0, 773752.0, 226586.0, 15722.0, 3284.0, 1140.0, 523.0, 308.0, 177.0, 117.0, 70.0, 34.0, 32.0, 20.0, 20.0, 14.0, 13.0, 9.0, 7.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.014404296875, -7.75537109375, -7.496337890625, -7.2373046875, -6.978271484375, -6.71923828125, -6.460205078125, -6.201171875, -5.942138671875, -5.68310546875, -5.424072265625, -5.1650390625, -4.906005859375, -4.64697265625, -4.387939453125, -4.12890625, -3.869873046875, -3.61083984375, -3.351806640625, -3.0927734375, -2.833740234375, -2.57470703125, -2.315673828125, -2.056640625, -1.797607421875, -1.53857421875, -1.279541015625, -1.0205078125, -0.761474609375, -0.50244140625, -0.243408203125, 0.015625, 0.274658203125, 0.53369140625, 0.792724609375, 1.0517578125, 1.310791015625, 1.56982421875, 1.828857421875, 2.087890625, 2.346923828125, 2.60595703125, 2.864990234375, 3.1240234375, 3.383056640625, 3.64208984375, 3.901123046875, 4.16015625, 4.419189453125, 4.67822265625, 4.937255859375, 5.1962890625, 5.455322265625, 5.71435546875, 5.973388671875, 6.232421875, 6.491455078125, 6.75048828125, 7.009521484375, 7.2685546875, 7.527587890625, 7.78662109375, 8.045654296875, 8.3046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 6.0, 9.0, 8.0, 9.0, 5.0, 11.0, 18.0, 11.0, 22.0, 25.0, 32.0, 33.0, 41.0, 47.0, 42.0, 70.0, 54.0, 79.0, 55.0, 54.0, 59.0, 38.0, 35.0, 34.0, 33.0, 21.0, 21.0, 13.0, 12.0, 10.0, 12.0, 13.0, 6.0, 7.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.5091552734375, -13.065185546875, -12.6212158203125, -12.17724609375, -11.7332763671875, -11.289306640625, -10.8453369140625, -10.4013671875, -9.9573974609375, -9.513427734375, -9.0694580078125, -8.62548828125, -8.1815185546875, -7.737548828125, -7.2935791015625, -6.849609375, -6.4056396484375, -5.961669921875, -5.5177001953125, -5.07373046875, -4.6297607421875, -4.185791015625, -3.7418212890625, -3.2978515625, -2.8538818359375, -2.409912109375, -1.9659423828125, -1.52197265625, -1.0780029296875, -0.634033203125, -0.1900634765625, 0.25390625, 0.6978759765625, 1.141845703125, 1.5858154296875, 2.02978515625, 2.4737548828125, 2.917724609375, 3.3616943359375, 3.8056640625, 4.2496337890625, 4.693603515625, 5.1375732421875, 5.58154296875, 6.0255126953125, 6.469482421875, 6.9134521484375, 7.357421875, 7.8013916015625, 8.245361328125, 8.6893310546875, 9.13330078125, 9.5772705078125, 10.021240234375, 10.4652099609375, 10.9091796875, 11.3531494140625, 11.797119140625, 12.2410888671875, 12.68505859375, 13.1290283203125, 13.572998046875, 14.0169677734375, 14.4609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 10.0, 12.0, 18.0, 31.0, 60.0, 97.0, 137.0, 300.0, 634.0, 1529.0, 4730.0, 22001.0, 210471.0, 770124.0, 29185.0, 5911.0, 1871.0, 682.0, 310.0, 172.0, 77.0, 58.0, 27.0, 23.0, 20.0, 9.0, 6.0, 5.0, 4.0, 5.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.4671478271484375, -1.426483154296875, -1.3858184814453125, -1.34515380859375, -1.3044891357421875, -1.263824462890625, -1.2231597900390625, -1.1824951171875, -1.1418304443359375, -1.101165771484375, -1.0605010986328125, -1.01983642578125, -0.9791717529296875, -0.938507080078125, -0.8978424072265625, -0.857177734375, -0.8165130615234375, -0.775848388671875, -0.7351837158203125, -0.69451904296875, -0.6538543701171875, -0.613189697265625, -0.5725250244140625, -0.5318603515625, -0.4911956787109375, -0.450531005859375, -0.4098663330078125, -0.36920166015625, -0.3285369873046875, -0.287872314453125, -0.2472076416015625, -0.20654296875, -0.1658782958984375, -0.125213623046875, -0.0845489501953125, -0.04388427734375, -0.0032196044921875, 0.037445068359375, 0.0781097412109375, 0.1187744140625, 0.1594390869140625, 0.200103759765625, 0.2407684326171875, 0.28143310546875, 0.3220977783203125, 0.362762451171875, 0.4034271240234375, 0.444091796875, 0.4847564697265625, 0.525421142578125, 0.5660858154296875, 0.60675048828125, 0.6474151611328125, 0.688079833984375, 0.7287445068359375, 0.7694091796875, 0.8100738525390625, 0.850738525390625, 0.8914031982421875, 0.93206787109375, 0.9727325439453125, 1.013397216796875, 1.0540618896484375, 1.0947265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 11.0, 13.0, 13.0, 16.0, 21.0, 29.0, 42.0, 51.0, 56.0, 78.0, 102.0, 105.0, 96.0, 63.0, 64.0, 50.0, 38.0, 33.0, 19.0, 16.0, 6.0, 9.0, 9.0, 6.0, 11.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00025963783264160156, -0.00025184638798236847, -0.00024405494332313538, -0.00023626349866390228, -0.0002284720540046692, -0.0002206806093454361, -0.000212889164686203, -0.0002050977200269699, -0.00019730627536773682, -0.00018951483070850372, -0.00018172338604927063, -0.00017393194139003754, -0.00016614049673080444, -0.00015834905207157135, -0.00015055760741233826, -0.00014276616275310516, -0.00013497471809387207, -0.00012718327343463898, -0.00011939182877540588, -0.00011160038411617279, -0.0001038089394569397, -9.60174947977066e-05, -8.822605013847351e-05, -8.043460547924042e-05, -7.264316082000732e-05, -6.485171616077423e-05, -5.706027150154114e-05, -4.9268826842308044e-05, -4.147738218307495e-05, -3.368593752384186e-05, -2.5894492864608765e-05, -1.810304820537567e-05, -1.0311603546142578e-05, -2.520158886909485e-06, 5.271285772323608e-06, 1.3062730431556702e-05, 2.0854175090789795e-05, 2.8645619750022888e-05, 3.643706440925598e-05, 4.4228509068489075e-05, 5.201995372772217e-05, 5.981139838695526e-05, 6.760284304618835e-05, 7.539428770542145e-05, 8.318573236465454e-05, 9.097717702388763e-05, 9.876862168312073e-05, 0.00010656006634235382, 0.00011435151100158691, 0.00012214295566082, 0.0001299344003200531, 0.0001377258449792862, 0.0001455172896385193, 0.00015330873429775238, 0.00016110017895698547, 0.00016889162361621857, 0.00017668306827545166, 0.00018447451293468475, 0.00019226595759391785, 0.00020005740225315094, 0.00020784884691238403, 0.00021564029157161713, 0.00022343173623085022, 0.0002312231808900833, 0.0002390146255493164]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 11.0, 8.0, 13.0, 12.0, 21.0, 28.0, 39.0, 44.0, 56.0, 83.0, 134.0, 214.0, 295.0, 549.0, 853.0, 1579.0, 2876.0, 5884.0, 13756.0, 37500.0, 165431.0, 722881.0, 61109.0, 19013.0, 7754.0, 3666.0, 2004.0, 1030.0, 641.0, 374.0, 222.0, 134.0, 88.0, 70.0, 35.0, 32.0, 31.0, 24.0, 19.0, 14.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.791015625, -0.7678756713867188, -0.7447357177734375, -0.7215957641601562, -0.698455810546875, -0.6753158569335938, -0.6521759033203125, -0.6290359497070312, -0.60589599609375, -0.5827560424804688, -0.5596160888671875, -0.5364761352539062, -0.513336181640625, -0.49019622802734375, -0.4670562744140625, -0.44391632080078125, -0.4207763671875, -0.39763641357421875, -0.3744964599609375, -0.35135650634765625, -0.328216552734375, -0.30507659912109375, -0.2819366455078125, -0.25879669189453125, -0.23565673828125, -0.21251678466796875, -0.1893768310546875, -0.16623687744140625, -0.143096923828125, -0.11995697021484375, -0.0968170166015625, -0.07367706298828125, -0.050537109375, -0.02739715576171875, -0.0042572021484375, 0.01888275146484375, 0.042022705078125, 0.06516265869140625, 0.0883026123046875, 0.11144256591796875, 0.13458251953125, 0.15772247314453125, 0.1808624267578125, 0.20400238037109375, 0.227142333984375, 0.25028228759765625, 0.2734222412109375, 0.29656219482421875, 0.3197021484375, 0.34284210205078125, 0.3659820556640625, 0.38912200927734375, 0.412261962890625, 0.43540191650390625, 0.4585418701171875, 0.48168182373046875, 0.50482177734375, 0.5279617309570312, 0.5511016845703125, 0.5742416381835938, 0.597381591796875, 0.6205215454101562, 0.6436614990234375, 0.6668014526367188, 0.68994140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 7.0, 5.0, 5.0, 10.0, 6.0, 19.0, 10.0, 23.0, 21.0, 24.0, 32.0, 45.0, 51.0, 83.0, 90.0, 92.0, 80.0, 88.0, 57.0, 46.0, 38.0, 28.0, 30.0, 20.0, 15.0, 12.0, 11.0, 10.0, 9.0, 5.0, 8.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9384765625, -0.9088973999023438, -0.8793182373046875, -0.8497390747070312, -0.820159912109375, -0.7905807495117188, -0.7610015869140625, -0.7314224243164062, -0.70184326171875, -0.6722640991210938, -0.6426849365234375, -0.6131057739257812, -0.583526611328125, -0.5539474487304688, -0.5243682861328125, -0.49478912353515625, -0.4652099609375, -0.43563079833984375, -0.4060516357421875, -0.37647247314453125, -0.346893310546875, -0.31731414794921875, -0.2877349853515625, -0.25815582275390625, -0.22857666015625, -0.19899749755859375, -0.1694183349609375, -0.13983917236328125, -0.110260009765625, -0.08068084716796875, -0.0511016845703125, -0.02152252197265625, 0.008056640625, 0.03763580322265625, 0.0672149658203125, 0.09679412841796875, 0.126373291015625, 0.15595245361328125, 0.1855316162109375, 0.21511077880859375, 0.24468994140625, 0.27426910400390625, 0.3038482666015625, 0.33342742919921875, 0.363006591796875, 0.39258575439453125, 0.4221649169921875, 0.45174407958984375, 0.4813232421875, 0.5109024047851562, 0.5404815673828125, 0.5700607299804688, 0.599639892578125, 0.6292190551757812, 0.6587982177734375, 0.6883773803710938, 0.71795654296875, 0.7475357055664062, 0.7771148681640625, 0.8066940307617188, 0.836273193359375, 0.8658523559570312, 0.8954315185546875, 0.9250106811523438, 0.95458984375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 9.0, 14.0, 16.0, 25.0, 46.0, 99.0, 328.0, 274.0, 77.0, 42.0, 26.0, 12.0, 9.0, 6.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.80644226074219, -63.92009353637695, -62.03374481201172, -60.147396087646484, -58.26104736328125, -56.37469482421875, -54.48834991455078, -52.60199737548828, -50.71564865112305, -48.82929992675781, -46.94295120239258, -45.056602478027344, -43.17025375366211, -41.283905029296875, -39.397552490234375, -37.51120376586914, -35.624855041503906, -33.73850631713867, -31.852157592773438, -29.965808868408203, -28.079458236694336, -26.1931095123291, -24.306760787963867, -22.42041015625, -20.53406524658203, -18.647716522216797, -16.761367797851562, -14.875018119812012, -12.988668441772461, -11.102319717407227, -9.215970993041992, -7.329621315002441, -5.443271636962891, -3.556922435760498, -1.6705734729766846, 0.2157754898071289, 2.1021246910095215, 3.988473892211914, 5.874822616577148, 7.761172294616699, 9.647521018981934, 11.533869743347168, 13.420219421386719, 15.306568145751953, 17.192916870117188, 19.079265594482422, 20.965614318847656, 22.851964950561523, 24.738313674926758, 26.624662399291992, 28.511011123657227, 30.397361755371094, 32.28371047973633, 34.17005920410156, 36.0564079284668, 37.94275665283203, 39.829105377197266, 41.7154541015625, 43.601802825927734, 45.48815155029297, 47.3745002746582, 49.26084899902344, 51.14720153808594, 53.03355026245117, 54.919898986816406]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 2.0, 3.0, 5.0, 11.0, 3.0, 6.0, 2.0, 6.0, 4.0, 9.0, 12.0, 17.0, 21.0, 22.0, 26.0, 37.0, 56.0, 72.0, 79.0, 126.0, 133.0, 89.0, 58.0, 39.0, 27.0, 26.0, 24.0, 22.0, 10.0, 8.0, 9.0, 10.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.97613525390625, -45.54729461669922, -44.11845397949219, -42.689613342285156, -41.260772705078125, -39.831932067871094, -38.40309143066406, -36.97425079345703, -35.54541015625, -34.11656951904297, -32.68772888183594, -31.258888244628906, -29.830047607421875, -28.401206970214844, -26.972366333007812, -25.54352569580078, -24.114686965942383, -22.68584632873535, -21.25700569152832, -19.82816505432129, -18.399324417114258, -16.970483779907227, -15.541644096374512, -14.11280345916748, -12.68396282196045, -11.255122184753418, -9.826281547546387, -8.397441864013672, -6.968600749969482, -5.539760112762451, -4.110919952392578, -2.682079315185547, -1.2532386779785156, 0.17560184001922607, 1.6044423580169678, 3.03328275680542, 4.462123394012451, 5.890964031219482, 7.3198041915893555, 8.748644828796387, 10.177485466003418, 11.60632610321045, 13.03516674041748, 14.464006423950195, 15.892847061157227, 17.321687698364258, 18.75052833557129, 20.17936897277832, 21.60820960998535, 23.037050247192383, 24.465890884399414, 25.894731521606445, 27.323572158813477, 28.752412796020508, 30.181251525878906, 31.610092163085938, 33.03893280029297, 34.4677734375, 35.89661407470703, 37.32545471191406, 38.754295349121094, 40.183135986328125, 41.611976623535156, 43.04081726074219, 44.46965789794922]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 12.0, 12.0, 8.0, 5.0, 20.0, 17.0, 26.0, 31.0, 47.0, 35.0, 49.0, 113.0, 297.0, 70.0, 50.0, 34.0, 28.0, 26.0, 29.0, 24.0, 19.0, 11.0, 9.0, 8.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.729827880859375, -3.58270263671875, -3.435577392578125, -3.2884521484375, -3.141326904296875, -2.99420166015625, -2.847076416015625, -2.699951171875, -2.552825927734375, -2.40570068359375, -2.258575439453125, -2.1114501953125, -1.964324951171875, -1.81719970703125, -1.670074462890625, -1.52294921875, -1.375823974609375, -1.22869873046875, -1.081573486328125, -0.9344482421875, -0.787322998046875, -0.64019775390625, -0.493072509765625, -0.345947265625, -0.198822021484375, -0.05169677734375, 0.095428466796875, 0.2425537109375, 0.389678955078125, 0.53680419921875, 0.683929443359375, 0.8310546875, 0.978179931640625, 1.12530517578125, 1.272430419921875, 1.4195556640625, 1.566680908203125, 1.71380615234375, 1.860931396484375, 2.008056640625, 2.155181884765625, 2.30230712890625, 2.449432373046875, 2.5965576171875, 2.743682861328125, 2.89080810546875, 3.037933349609375, 3.18505859375, 3.332183837890625, 3.47930908203125, 3.626434326171875, 3.7735595703125, 3.920684814453125, 4.06781005859375, 4.214935302734375, 4.362060546875, 4.509185791015625, 4.65631103515625, 4.803436279296875, 4.9505615234375, 5.097686767578125, 5.24481201171875, 5.391937255859375, 5.5390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 10.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 10.0, 6.0, 17.0, 14.0, 67.0, 73.0, 123.0, 347.0, 1031.0, 5457.0, 8306426.0, 70183.0, 3499.0, 763.0, 267.0, 103.0, 65.0, 43.0, 18.0, 11.0, 12.0, 7.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.20458221435547, -57.68196105957031, -56.15933609008789, -54.636714935302734, -53.11408996582031, -51.591468811035156, -50.06884765625, -48.54622268676758, -47.023597717285156, -45.5009765625, -43.97835159301758, -42.45573043823242, -40.93310546875, -39.410484313964844, -37.88786315917969, -36.365238189697266, -34.84261703491211, -33.31999588012695, -31.79737091064453, -30.274749755859375, -28.752124786376953, -27.229503631591797, -25.706880569458008, -24.18425750732422, -22.66163444519043, -21.13901138305664, -19.61638832092285, -18.093765258789062, -16.571144104003906, -15.0485200881958, -13.525897979736328, -12.003274917602539, -10.480655670166016, -8.958032608032227, -7.435410022735596, -5.912787437438965, -4.390164375305176, -2.8675413131713867, -1.344919204711914, 0.177703857421875, 1.700326919555664, 3.222949743270874, 4.745572566986084, 6.268195152282715, 7.790818214416504, 9.313441276550293, 10.836063385009766, 12.358686447143555, 13.881309509277344, 15.403932571411133, 16.926555633544922, 18.449176788330078, 19.9718017578125, 21.494422912597656, 23.017045974731445, 24.539669036865234, 26.062292098999023, 27.584915161132812, 29.1075382232666, 30.63016128540039, 32.15278244018555, 33.67540740966797, 35.198028564453125, 36.72064971923828, 38.2432746887207]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 3.0, 4.0, 7.0, 10.0, 6.0, 3.0, 5.0, 7.0, 7.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-107.35186767578125, -104.48748016357422, -101.62309265136719, -98.75870513916016, -95.89431762695312, -93.02992248535156, -90.16553497314453, -87.3011474609375, -84.43675994873047, -81.57237243652344, -78.7079849243164, -75.84359741210938, -72.97920227050781, -70.11481475830078, -67.25042724609375, -64.38603973388672, -61.52165222167969, -58.657264709472656, -55.792877197265625, -52.92848587036133, -50.0640983581543, -47.199710845947266, -44.33531951904297, -41.47093200683594, -38.606544494628906, -35.742156982421875, -32.877769470214844, -30.013378143310547, -27.148990631103516, -24.284603118896484, -21.42021369934082, -18.555824279785156, -15.691444396972656, -12.827055931091309, -9.962667465209961, -7.098278999328613, -4.233890533447266, -1.369502067565918, 1.4948863983154297, 4.359275817871094, 7.223663330078125, 10.088051795959473, 12.95244026184082, 15.816828727722168, 18.681217193603516, 21.545604705810547, 24.40999412536621, 27.274383544921875, 30.138771057128906, 33.00315856933594, 35.86754608154297, 38.731937408447266, 41.5963249206543, 44.46071243286133, 47.325103759765625, 50.189491271972656, 53.05387878417969, 55.91826629638672, 58.78265380859375, 61.64704513549805, 64.51142883300781, 67.37582397460938, 70.2402114868164, 73.10459899902344, 75.96898651123047]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 6.0, 10.0, 10.0, 16.0, 23.0, 34.0, 54.0, 81.0, 149.0, 260.0, 535.0, 1337.0, 3662.0, 11824.0, 41584.0, 152312.0, 216419.0, 68254.0, 18636.0, 5702.0, 1893.0, 686.0, 297.0, 164.0, 116.0, 66.0, 43.0, 25.0, 14.0, 15.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0625, -31.00048828125, -29.9384765625, -28.87646484375, -27.814453125, -26.75244140625, -25.6904296875, -24.62841796875, -23.56640625, -22.50439453125, -21.4423828125, -20.38037109375, -19.318359375, -18.25634765625, -17.1943359375, -16.13232421875, -15.0703125, -14.00830078125, -12.9462890625, -11.88427734375, -10.822265625, -9.76025390625, -8.6982421875, -7.63623046875, -6.57421875, -5.51220703125, -4.4501953125, -3.38818359375, -2.326171875, -1.26416015625, -0.2021484375, 0.85986328125, 1.921875, 2.98388671875, 4.0458984375, 5.10791015625, 6.169921875, 7.23193359375, 8.2939453125, 9.35595703125, 10.41796875, 11.47998046875, 12.5419921875, 13.60400390625, 14.666015625, 15.72802734375, 16.7900390625, 17.85205078125, 18.9140625, 19.97607421875, 21.0380859375, 22.10009765625, 23.162109375, 24.22412109375, 25.2861328125, 26.34814453125, 27.41015625, 28.47216796875, 29.5341796875, 30.59619140625, 31.658203125, 32.72021484375, 33.7822265625, 34.84423828125, 35.90625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 13.0, 10.0, 10.0, 13.0, 20.0, 26.0, 40.0, 35.0, 52.0, 60.0, 75.0, 69.0, 85.0, 72.0, 81.0, 54.0, 43.0, 50.0, 52.0, 18.0, 18.0, 23.0, 15.0, 17.0, 10.0, 6.0, 10.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.640625, -5.491943359375, -5.34326171875, -5.194580078125, -5.0458984375, -4.897216796875, -4.74853515625, -4.599853515625, -4.451171875, -4.302490234375, -4.15380859375, -4.005126953125, -3.8564453125, -3.707763671875, -3.55908203125, -3.410400390625, -3.26171875, -3.113037109375, -2.96435546875, -2.815673828125, -2.6669921875, -2.518310546875, -2.36962890625, -2.220947265625, -2.072265625, -1.923583984375, -1.77490234375, -1.626220703125, -1.4775390625, -1.328857421875, -1.18017578125, -1.031494140625, -0.8828125, -0.734130859375, -0.58544921875, -0.436767578125, -0.2880859375, -0.139404296875, 0.00927734375, 0.157958984375, 0.306640625, 0.455322265625, 0.60400390625, 0.752685546875, 0.9013671875, 1.050048828125, 1.19873046875, 1.347412109375, 1.49609375, 1.644775390625, 1.79345703125, 1.942138671875, 2.0908203125, 2.239501953125, 2.38818359375, 2.536865234375, 2.685546875, 2.834228515625, 2.98291015625, 3.131591796875, 3.2802734375, 3.428955078125, 3.57763671875, 3.726318359375, 3.875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 12.0, 17.0, 28.0, 57.0, 90.0, 98.0, 50.0, 53.0, 24.0, 16.0, 10.0, 5.0, 5.0, 3.0, 6.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.900714874267578, -27.722326278686523, -26.54393768310547, -25.365549087524414, -24.18716049194336, -23.008771896362305, -21.83038330078125, -20.651992797851562, -19.47360610961914, -18.295217514038086, -17.11682891845703, -15.938440322875977, -14.760051727294922, -13.581663131713867, -12.403273582458496, -11.224884986877441, -10.04649543762207, -8.868106842041016, -7.689718246459961, -6.511329174041748, -5.332940578460693, -4.154551982879639, -2.976162910461426, -1.797774314880371, -0.6193857192993164, 0.5590029954910278, 1.737391710281372, 2.915780544281006, 4.0941691398620605, 5.272557735443115, 6.450946807861328, 7.629335403442383, 8.807723999023438, 9.986112594604492, 11.164501190185547, 12.342889785766602, 13.521278381347656, 14.699666976928711, 15.878056526184082, 17.056446075439453, 18.234832763671875, 19.41322135925293, 20.591609954833984, 21.76999855041504, 22.948387145996094, 24.12677574157715, 25.305164337158203, 26.48355484008789, 27.661943435668945, 28.84033203125, 30.018720626831055, 31.19710922241211, 32.3754997253418, 33.55388641357422, 34.732276916503906, 35.91066360473633, 37.089054107666016, 38.2674446105957, 39.445831298828125, 40.62422180175781, 41.802608489990234, 42.98099899291992, 44.159385681152344, 45.33777618408203, 46.51616287231445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 6.0, 5.0, 8.0, 12.0, 54.0, 70.0, 108.0, 63.0, 50.0, 25.0, 13.0, 11.0, 2.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.38745880126953, -19.598468780517578, -18.809478759765625, -18.020488739013672, -17.23149871826172, -16.442508697509766, -15.653518676757812, -14.86452865600586, -14.075538635253906, -13.286548614501953, -12.49755859375, -11.708568572998047, -10.919578552246094, -10.13058853149414, -9.341598510742188, -8.552608489990234, -7.763617515563965, -6.974627494812012, -6.185637474060059, -5.3966474533081055, -4.607657432556152, -3.81866717338562, -3.029676914215088, -2.2406868934631348, -1.4516968727111816, -0.6627067923545837, 0.12628328800201416, 0.9152734279632568, 1.70426344871521, 2.493253469467163, 3.2822437286376953, 4.071233749389648, 4.860223770141602, 5.649213790893555, 6.438203811645508, 7.227193832397461, 8.016183853149414, 8.805173873901367, 9.59416389465332, 10.383153915405273, 11.172143936157227, 11.96113395690918, 12.750123977661133, 13.539113998413086, 14.328104019165039, 15.117094039916992, 15.906084060668945, 16.6950740814209, 17.484066009521484, 18.273056030273438, 19.06204605102539, 19.851036071777344, 20.640026092529297, 21.42901611328125, 22.218006134033203, 23.006996154785156, 23.79598617553711, 24.584976196289062, 25.373966217041016, 26.16295623779297, 26.951946258544922, 27.740936279296875, 28.529926300048828, 29.31891632080078, 30.107906341552734]}, "eval/loss": 1.6450167894363403, "eval/wer": 1.1136850456168188, "eval/runtime": 1264.9501, "eval/samples_per_second": 2.089, "eval/steps_per_second": 0.262} \ No newline at end of file +{"train/loss": 0.0292, "train/learning_rate": 6.143111638954869e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 47224, "_timestamp": 1647144994, "_step": 7502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 8.0, 9.0, 21.0, 29.0, 32.0, 47.0, 59.0, 64.0, 130.0, 143.0, 124.0, 108.0, 60.0, 46.0, 31.0, 33.0, 25.0, 15.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78019905090332, -10.362777709960938, -9.945357322692871, -9.527935981750488, -9.110515594482422, -8.693094253540039, -8.275672912597656, -7.85825252532959, -7.440831661224365, -7.023410797119141, -6.605989933013916, -6.188569068908691, -5.771147727966309, -5.353727340698242, -4.936305999755859, -4.518885135650635, -4.10146427154541, -3.6840434074401855, -3.266622543334961, -2.8492014408111572, -2.4317805767059326, -2.014359712600708, -1.5969386100769043, -1.1795177459716797, -0.7620968818664551, -0.3446759581565857, 0.07274496555328369, 0.49016594886779785, 0.9075868129730225, 1.325007677078247, 1.7424287796020508, 2.1598496437072754, 2.5772695541381836, 2.994690418243408, 3.412111282348633, 3.8295323848724365, 4.246953010559082, 4.664374351501465, 5.0817952156066895, 5.499216079711914, 5.916636943817139, 6.334057807922363, 6.751478672027588, 7.1688995361328125, 7.586320877075195, 8.003741264343262, 8.421162605285645, 8.838582992553711, 9.256004333496094, 9.673425674438477, 10.090846061706543, 10.508267402648926, 10.925687789916992, 11.343109130859375, 11.760530471801758, 12.177950859069824, 12.59537124633789, 13.012792587280273, 13.43021297454834, 13.847634315490723, 14.265054702758789, 14.682476043701172, 15.099897384643555, 15.517317771911621, 15.934739112854004]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 14.0, 21.0, 14.0, 22.0, 26.0, 36.0, 45.0, 46.0, 53.0, 68.0, 71.0, 67.0, 67.0, 63.0, 56.0, 58.0, 47.0, 41.0, 44.0, 31.0, 22.0, 18.0, 16.0, 13.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.285859107971191, -8.977399826049805, -8.668941497802734, -8.360483169555664, -8.052023887634277, -7.743565082550049, -7.43510627746582, -7.126647472381592, -6.818188667297363, -6.509729862213135, -6.201271057128906, -5.892812252044678, -5.584353446960449, -5.275894641876221, -4.967435836791992, -4.658977031707764, -4.350518226623535, -4.042059421539307, -3.733600616455078, -3.4251418113708496, -3.116683006286621, -2.8082242012023926, -2.499765396118164, -2.1913065910339355, -1.882847785949707, -1.5743889808654785, -1.26593017578125, -0.9574713706970215, -0.649012565612793, -0.34055376052856445, -0.03209495544433594, 0.2763638496398926, 0.5848236083984375, 0.893282413482666, 1.2017412185668945, 1.510200023651123, 1.8186588287353516, 2.12711763381958, 2.4355764389038086, 2.744035243988037, 3.0524940490722656, 3.360952854156494, 3.6694116592407227, 3.977870464324951, 4.28632926940918, 4.594788074493408, 4.903246879577637, 5.211705684661865, 5.520164489746094, 5.828623294830322, 6.137082099914551, 6.445540904998779, 6.753999710083008, 7.062458515167236, 7.370917320251465, 7.679376125335693, 7.987834930419922, 8.296293258666992, 8.604752540588379, 8.913211822509766, 9.221670150756836, 9.530128479003906, 9.838587760925293, 10.14704704284668, 10.45550537109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 11.0, 15.0, 20.0, 11.0, 24.0, 22.0, 31.0, 39.0, 36.0, 44.0, 60.0, 56.0, 63.0, 56.0, 62.0, 48.0, 48.0, 49.0, 48.0, 45.0, 38.0, 35.0, 22.0, 21.0, 21.0, 14.0, 16.0, 5.0, 4.0, 7.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80908203125, -0.7820053100585938, -0.7549285888671875, -0.7278518676757812, -0.700775146484375, -0.6736984252929688, -0.6466217041015625, -0.6195449829101562, -0.59246826171875, -0.5653915405273438, -0.5383148193359375, -0.5112380981445312, -0.484161376953125, -0.45708465576171875, -0.4300079345703125, -0.40293121337890625, -0.3758544921875, -0.34877777099609375, -0.3217010498046875, -0.29462432861328125, -0.267547607421875, -0.24047088623046875, -0.2133941650390625, -0.18631744384765625, -0.15924072265625, -0.13216400146484375, -0.1050872802734375, -0.07801055908203125, -0.050933837890625, -0.02385711669921875, 0.0032196044921875, 0.03029632568359375, 0.057373046875, 0.08444976806640625, 0.1115264892578125, 0.13860321044921875, 0.165679931640625, 0.19275665283203125, 0.2198333740234375, 0.24691009521484375, 0.27398681640625, 0.30106353759765625, 0.3281402587890625, 0.35521697998046875, 0.382293701171875, 0.40937042236328125, 0.4364471435546875, 0.46352386474609375, 0.4906005859375, 0.5176773071289062, 0.5447540283203125, 0.5718307495117188, 0.598907470703125, 0.6259841918945312, 0.6530609130859375, 0.6801376342773438, 0.70721435546875, 0.7342910766601562, 0.7613677978515625, 0.7884445190429688, 0.815521240234375, 0.8425979614257812, 0.8696746826171875, 0.8967514038085938, 0.923828125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 13.0, 24.0, 23.0, 31.0, 41.0, 63.0, 85.0, 109.0, 145.0, 196.0, 325.0, 487.0, 937.0, 1950.0, 5657.0, 22670.0, 221184.0, 3851321.0, 69690.0, 12309.0, 3541.0, 1380.0, 717.0, 429.0, 267.0, 213.0, 117.0, 76.0, 55.0, 60.0, 46.0, 24.0, 16.0, 18.0, 13.0, 13.0, 5.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.984375, -8.677734375, -8.37109375, -8.064453125, -7.7578125, -7.451171875, -7.14453125, -6.837890625, -6.53125, -6.224609375, -5.91796875, -5.611328125, -5.3046875, -4.998046875, -4.69140625, -4.384765625, -4.078125, -3.771484375, -3.46484375, -3.158203125, -2.8515625, -2.544921875, -2.23828125, -1.931640625, -1.625, -1.318359375, -1.01171875, -0.705078125, -0.3984375, -0.091796875, 0.21484375, 0.521484375, 0.828125, 1.134765625, 1.44140625, 1.748046875, 2.0546875, 2.361328125, 2.66796875, 2.974609375, 3.28125, 3.587890625, 3.89453125, 4.201171875, 4.5078125, 4.814453125, 5.12109375, 5.427734375, 5.734375, 6.041015625, 6.34765625, 6.654296875, 6.9609375, 7.267578125, 7.57421875, 7.880859375, 8.1875, 8.494140625, 8.80078125, 9.107421875, 9.4140625, 9.720703125, 10.02734375, 10.333984375, 10.640625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 11.0, 23.0, 42.0, 68.0, 115.0, 244.0, 715.0, 1703.0, 604.0, 239.0, 121.0, 56.0, 49.0, 21.0, 19.0, 10.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.30059814453125, -4.1168212890625, -3.93304443359375, -3.749267578125, -3.56549072265625, -3.3817138671875, -3.19793701171875, -3.01416015625, -2.83038330078125, -2.6466064453125, -2.46282958984375, -2.279052734375, -2.09527587890625, -1.9114990234375, -1.72772216796875, -1.5439453125, -1.36016845703125, -1.1763916015625, -0.99261474609375, -0.808837890625, -0.62506103515625, -0.4412841796875, -0.25750732421875, -0.07373046875, 0.11004638671875, 0.2938232421875, 0.47760009765625, 0.661376953125, 0.84515380859375, 1.0289306640625, 1.21270751953125, 1.396484375, 1.58026123046875, 1.7640380859375, 1.94781494140625, 2.131591796875, 2.31536865234375, 2.4991455078125, 2.68292236328125, 2.86669921875, 3.05047607421875, 3.2342529296875, 3.41802978515625, 3.601806640625, 3.78558349609375, 3.9693603515625, 4.15313720703125, 4.3369140625, 4.52069091796875, 4.7044677734375, 4.88824462890625, 5.072021484375, 5.25579833984375, 5.4395751953125, 5.62335205078125, 5.80712890625, 5.99090576171875, 6.1746826171875, 6.35845947265625, 6.542236328125, 6.72601318359375, 6.9097900390625, 7.09356689453125, 7.27734375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 17.0, 22.0, 24.0, 44.0, 87.0, 128.0, 243.0, 549.0, 1298.0, 4529.0, 21606.0, 218621.0, 3763442.0, 159373.0, 18056.0, 3975.0, 1245.0, 471.0, 222.0, 128.0, 75.0, 46.0, 31.0, 20.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.7421875, -13.2755126953125, -12.808837890625, -12.3421630859375, -11.87548828125, -11.4088134765625, -10.942138671875, -10.4754638671875, -10.0087890625, -9.5421142578125, -9.075439453125, -8.6087646484375, -8.14208984375, -7.6754150390625, -7.208740234375, -6.7420654296875, -6.275390625, -5.8087158203125, -5.342041015625, -4.8753662109375, -4.40869140625, -3.9420166015625, -3.475341796875, -3.0086669921875, -2.5419921875, -2.0753173828125, -1.608642578125, -1.1419677734375, -0.67529296875, -0.2086181640625, 0.258056640625, 0.7247314453125, 1.19140625, 1.6580810546875, 2.124755859375, 2.5914306640625, 3.05810546875, 3.5247802734375, 3.991455078125, 4.4581298828125, 4.9248046875, 5.3914794921875, 5.858154296875, 6.3248291015625, 6.79150390625, 7.2581787109375, 7.724853515625, 8.1915283203125, 8.658203125, 9.1248779296875, 9.591552734375, 10.0582275390625, 10.52490234375, 10.9915771484375, 11.458251953125, 11.9249267578125, 12.3916015625, 12.8582763671875, 13.324951171875, 13.7916259765625, 14.25830078125, 14.7249755859375, 15.191650390625, 15.6583251953125, 16.125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 17.0, 22.0, 36.0, 66.0, 149.0, 177.0, 226.0, 149.0, 87.0, 41.0, 22.0, 12.0, 4.0, 1.0, 3.0], "bins": [-45.231937408447266, -44.40984344482422, -43.58774948120117, -42.76565933227539, -41.943565368652344, -41.1214714050293, -40.29937744140625, -39.47728729248047, -38.65519332885742, -37.833099365234375, -37.01100540161133, -36.18891525268555, -35.3668212890625, -34.54472732543945, -33.722633361816406, -32.900543212890625, -32.07844543457031, -31.256351470947266, -30.43425941467285, -29.612165451049805, -28.79007339477539, -27.967979431152344, -27.145885467529297, -26.323793411254883, -25.50170135498047, -24.679607391357422, -23.857515335083008, -23.03542137145996, -22.213329315185547, -21.3912353515625, -20.569141387939453, -19.74704933166504, -18.924957275390625, -18.102863311767578, -17.280771255493164, -16.458677291870117, -15.636585235595703, -14.814491271972656, -13.992398262023926, -13.170305252075195, -12.348211288452148, -11.526118278503418, -10.704025268554688, -9.88193130493164, -9.059839248657227, -8.23774528503418, -7.415652275085449, -6.593559265136719, -5.7714667320251465, -4.949373722076416, -4.127280235290527, -3.305187225341797, -2.4830942153930664, -1.661001205444336, -0.8389077186584473, -0.016814708709716797, 0.8052783012390137, 1.6273714303970337, 2.4494645595550537, 3.2715578079223633, 4.093650817871094, 4.915743827819824, 5.737837314605713, 6.559930324554443, 7.382023334503174]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 7.0, 11.0, 9.0, 14.0, 15.0, 15.0, 21.0, 29.0, 37.0, 29.0, 42.0, 37.0, 53.0, 55.0, 54.0, 44.0, 52.0, 48.0, 62.0, 49.0, 41.0, 50.0, 33.0, 35.0, 21.0, 33.0, 16.0, 22.0, 14.0, 12.0, 9.0, 8.0, 7.0, 2.0, 3.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.963400840759277, -9.571216583251953, -9.179031372070312, -8.786847114562988, -8.394662857055664, -8.00247859954834, -7.610293865203857, -7.218109130859375, -6.825924873352051, -6.433740615844727, -6.041555881500244, -5.649371147155762, -5.2571868896484375, -4.865002632141113, -4.472817897796631, -4.080633163452148, -3.688448905944824, -3.296264410018921, -2.9040799140930176, -2.5118954181671143, -2.119710922241211, -1.7275264263153076, -1.3353419303894043, -0.943157434463501, -0.5509729385375977, -0.15878844261169434, 0.23339605331420898, 0.6255805492401123, 1.0177650451660156, 1.409949541091919, 1.8021340370178223, 2.1943185329437256, 2.586503028869629, 2.9786875247955322, 3.3708720207214355, 3.763056516647339, 4.155241012573242, 4.547425270080566, 4.939610004425049, 5.331794738769531, 5.7239789962768555, 6.11616325378418, 6.508347988128662, 6.9005327224731445, 7.292716979980469, 7.684901237487793, 8.077085494995117, 8.469270706176758, 8.861454963684082, 9.253639221191406, 9.645824432373047, 10.038008689880371, 10.430192947387695, 10.82237720489502, 11.214561462402344, 11.606746673583984, 11.998930931091309, 12.391115188598633, 12.783300399780273, 13.175484657287598, 13.567668914794922, 13.959853172302246, 14.35203742980957, 14.744222640991211, 15.136406898498535]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 5.0, 10.0, 13.0, 14.0, 9.0, 12.0, 20.0, 18.0, 20.0, 26.0, 33.0, 32.0, 30.0, 38.0, 40.0, 32.0, 43.0, 44.0, 41.0, 38.0, 46.0, 34.0, 43.0, 39.0, 37.0, 36.0, 22.0, 27.0, 31.0, 26.0, 24.0, 20.0, 7.0, 15.0, 13.0, 8.0, 12.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72216796875, -0.7009429931640625, -0.679718017578125, -0.6584930419921875, -0.63726806640625, -0.6160430908203125, -0.594818115234375, -0.5735931396484375, -0.5523681640625, -0.5311431884765625, -0.509918212890625, -0.4886932373046875, -0.46746826171875, -0.4462432861328125, -0.425018310546875, -0.4037933349609375, -0.382568359375, -0.3613433837890625, -0.340118408203125, -0.3188934326171875, -0.29766845703125, -0.2764434814453125, -0.255218505859375, -0.2339935302734375, -0.2127685546875, -0.1915435791015625, -0.170318603515625, -0.1490936279296875, -0.12786865234375, -0.1066436767578125, -0.085418701171875, -0.0641937255859375, -0.04296875, -0.0217437744140625, -0.000518798828125, 0.0207061767578125, 0.04193115234375, 0.0631561279296875, 0.084381103515625, 0.1056060791015625, 0.1268310546875, 0.1480560302734375, 0.169281005859375, 0.1905059814453125, 0.21173095703125, 0.2329559326171875, 0.254180908203125, 0.2754058837890625, 0.296630859375, 0.3178558349609375, 0.339080810546875, 0.3603057861328125, 0.38153076171875, 0.4027557373046875, 0.423980712890625, 0.4452056884765625, 0.4664306640625, 0.4876556396484375, 0.508880615234375, 0.5301055908203125, 0.55133056640625, 0.5725555419921875, 0.593780517578125, 0.6150054931640625, 0.63623046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 10.0, 26.0, 30.0, 49.0, 69.0, 93.0, 174.0, 243.0, 333.0, 482.0, 756.0, 1139.0, 1836.0, 2814.0, 4398.0, 6930.0, 11100.0, 18216.0, 30394.0, 51802.0, 94167.0, 186684.0, 272608.0, 162711.0, 83196.0, 46374.0, 27221.0, 16467.0, 10301.0, 6395.0, 3976.0, 2607.0, 1675.0, 1092.0, 716.0, 444.0, 319.0, 194.0, 166.0, 104.0, 65.0, 54.0, 36.0, 25.0, 14.0, 12.0, 7.0, 6.0, 4.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82275390625, -0.7956924438476562, -0.7686309814453125, -0.7415695190429688, -0.714508056640625, -0.6874465942382812, -0.6603851318359375, -0.6333236694335938, -0.60626220703125, -0.5792007446289062, -0.5521392822265625, -0.5250778198242188, -0.498016357421875, -0.47095489501953125, -0.4438934326171875, -0.41683197021484375, -0.3897705078125, -0.36270904541015625, -0.3356475830078125, -0.30858612060546875, -0.281524658203125, -0.25446319580078125, -0.2274017333984375, -0.20034027099609375, -0.17327880859375, -0.14621734619140625, -0.1191558837890625, -0.09209442138671875, -0.065032958984375, -0.03797149658203125, -0.0109100341796875, 0.01615142822265625, 0.043212890625, 0.07027435302734375, 0.0973358154296875, 0.12439727783203125, 0.151458740234375, 0.17852020263671875, 0.2055816650390625, 0.23264312744140625, 0.25970458984375, 0.28676605224609375, 0.3138275146484375, 0.34088897705078125, 0.367950439453125, 0.39501190185546875, 0.4220733642578125, 0.44913482666015625, 0.4761962890625, 0.5032577514648438, 0.5303192138671875, 0.5573806762695312, 0.584442138671875, 0.6115036010742188, 0.6385650634765625, 0.6656265258789062, 0.69268798828125, 0.7197494506835938, 0.7468109130859375, 0.7738723754882812, 0.800933837890625, 0.8279953002929688, 0.8550567626953125, 0.8821182250976562, 0.9091796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 11.0, 10.0, 16.0, 10.0, 18.0, 19.0, 20.0, 19.0, 21.0, 22.0, 24.0, 33.0, 41.0, 37.0, 29.0, 31.0, 37.0, 45.0, 1057.0, 39.0, 50.0, 44.0, 46.0, 25.0, 32.0, 36.0, 28.0, 19.0, 37.0, 29.0, 9.0, 26.0, 17.0, 12.0, 11.0, 12.0, 4.0, 6.0, 4.0, 6.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6252899169921875, -0.605072021484375, -0.5848541259765625, -0.56463623046875, -0.5444183349609375, -0.524200439453125, -0.5039825439453125, -0.4837646484375, -0.4635467529296875, -0.443328857421875, -0.4231109619140625, -0.40289306640625, -0.3826751708984375, -0.362457275390625, -0.3422393798828125, -0.322021484375, -0.3018035888671875, -0.281585693359375, -0.2613677978515625, -0.24114990234375, -0.2209320068359375, -0.200714111328125, -0.1804962158203125, -0.1602783203125, -0.1400604248046875, -0.119842529296875, -0.0996246337890625, -0.07940673828125, -0.0591888427734375, -0.038970947265625, -0.0187530517578125, 0.00146484375, 0.0216827392578125, 0.041900634765625, 0.0621185302734375, 0.08233642578125, 0.1025543212890625, 0.122772216796875, 0.1429901123046875, 0.1632080078125, 0.1834259033203125, 0.203643798828125, 0.2238616943359375, 0.24407958984375, 0.2642974853515625, 0.284515380859375, 0.3047332763671875, 0.324951171875, 0.3451690673828125, 0.365386962890625, 0.3856048583984375, 0.40582275390625, 0.4260406494140625, 0.446258544921875, 0.4664764404296875, 0.4866943359375, 0.5069122314453125, 0.527130126953125, 0.5473480224609375, 0.56756591796875, 0.5877838134765625, 0.608001708984375, 0.6282196044921875, 0.6484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 10.0, 12.0, 11.0, 17.0, 29.0, 25.0, 47.0, 67.0, 109.0, 145.0, 241.0, 357.0, 437.0, 718.0, 1118.0, 1736.0, 2896.0, 4723.0, 8930.0, 17903.0, 48363.0, 1380453.0, 548820.0, 43144.0, 16617.0, 8079.0, 4562.0, 2647.0, 1690.0, 1108.0, 676.0, 424.0, 328.0, 207.0, 148.0, 88.0, 71.0, 51.0, 32.0, 40.0, 13.0, 10.0, 9.0, 8.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98974609375, -0.958770751953125, -0.92779541015625, -0.896820068359375, -0.8658447265625, -0.834869384765625, -0.80389404296875, -0.772918701171875, -0.741943359375, -0.710968017578125, -0.67999267578125, -0.649017333984375, -0.6180419921875, -0.587066650390625, -0.55609130859375, -0.525115966796875, -0.494140625, -0.463165283203125, -0.43218994140625, -0.401214599609375, -0.3702392578125, -0.339263916015625, -0.30828857421875, -0.277313232421875, -0.246337890625, -0.215362548828125, -0.18438720703125, -0.153411865234375, -0.1224365234375, -0.091461181640625, -0.06048583984375, -0.029510498046875, 0.00146484375, 0.032440185546875, 0.06341552734375, 0.094390869140625, 0.1253662109375, 0.156341552734375, 0.18731689453125, 0.218292236328125, 0.249267578125, 0.280242919921875, 0.31121826171875, 0.342193603515625, 0.3731689453125, 0.404144287109375, 0.43511962890625, 0.466094970703125, 0.4970703125, 0.528045654296875, 0.55902099609375, 0.589996337890625, 0.6209716796875, 0.651947021484375, 0.68292236328125, 0.713897705078125, 0.744873046875, 0.775848388671875, 0.80682373046875, 0.837799072265625, 0.8687744140625, 0.899749755859375, 0.93072509765625, 0.961700439453125, 0.99267578125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 17.0, 14.0, 23.0, 32.0, 27.0, 36.0, 40.0, 62.0, 91.0, 112.0, 130.0, 79.0, 59.0, 54.0, 31.0, 20.0, 17.0, 14.0, 23.0, 12.0, 6.0, 9.0, 4.0, 8.0, 4.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1048583984375, -0.10085296630859375, -0.0968475341796875, -0.09284210205078125, -0.088836669921875, -0.08483123779296875, -0.0808258056640625, -0.07682037353515625, -0.07281494140625, -0.06880950927734375, -0.0648040771484375, -0.06079864501953125, -0.056793212890625, -0.05278778076171875, -0.0487823486328125, -0.04477691650390625, -0.040771484375, -0.03676605224609375, -0.0327606201171875, -0.02875518798828125, -0.024749755859375, -0.02074432373046875, -0.0167388916015625, -0.01273345947265625, -0.00872802734375, -0.00472259521484375, -0.0007171630859375, 0.00328826904296875, 0.007293701171875, 0.01129913330078125, 0.0153045654296875, 0.01930999755859375, 0.0233154296875, 0.02732086181640625, 0.0313262939453125, 0.03533172607421875, 0.039337158203125, 0.04334259033203125, 0.0473480224609375, 0.05135345458984375, 0.05535888671875, 0.05936431884765625, 0.0633697509765625, 0.06737518310546875, 0.071380615234375, 0.07538604736328125, 0.0793914794921875, 0.08339691162109375, 0.08740234375, 0.09140777587890625, 0.0954132080078125, 0.09941864013671875, 0.103424072265625, 0.10742950439453125, 0.1114349365234375, 0.11544036865234375, 0.11944580078125, 0.12345123291015625, 0.1274566650390625, 0.13146209716796875, 0.135467529296875, 0.13947296142578125, 0.1434783935546875, 0.14748382568359375, 0.1514892578125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 7.0, 11.0, 17.0, 18.0, 27.0, 32.0, 33.0, 54.0, 81.0, 112.0, 148.0, 266.0, 576.0, 1933.0, 11767.0, 403569.0, 612200.0, 14210.0, 2102.0, 551.0, 230.0, 139.0, 98.0, 71.0, 73.0, 31.0, 40.0, 22.0, 19.0, 16.0, 15.0, 13.0, 15.0, 12.0, 5.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.638671875, -1.580230712890625, -1.52178955078125, -1.463348388671875, -1.4049072265625, -1.346466064453125, -1.28802490234375, -1.229583740234375, -1.171142578125, -1.112701416015625, -1.05426025390625, -0.995819091796875, -0.9373779296875, -0.878936767578125, -0.82049560546875, -0.762054443359375, -0.70361328125, -0.645172119140625, -0.58673095703125, -0.528289794921875, -0.4698486328125, -0.411407470703125, -0.35296630859375, -0.294525146484375, -0.236083984375, -0.177642822265625, -0.11920166015625, -0.060760498046875, -0.0023193359375, 0.056121826171875, 0.11456298828125, 0.173004150390625, 0.2314453125, 0.289886474609375, 0.34832763671875, 0.406768798828125, 0.4652099609375, 0.523651123046875, 0.58209228515625, 0.640533447265625, 0.698974609375, 0.757415771484375, 0.81585693359375, 0.874298095703125, 0.9327392578125, 0.991180419921875, 1.04962158203125, 1.108062744140625, 1.16650390625, 1.224945068359375, 1.28338623046875, 1.341827392578125, 1.4002685546875, 1.458709716796875, 1.51715087890625, 1.575592041015625, 1.634033203125, 1.692474365234375, 1.75091552734375, 1.809356689453125, 1.8677978515625, 1.926239013671875, 1.98468017578125, 2.043121337890625, 2.1015625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 12.0, 15.0, 12.0, 24.0, 47.0, 60.0, 90.0, 115.0, 177.0, 123.0, 105.0, 71.0, 50.0, 29.0, 17.0, 16.0, 14.0, 8.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4762885868549347, -0.45195645093917847, -0.42762428522109985, -0.40329214930534363, -0.3789600133895874, -0.3546278476715088, -0.33029571175575256, -0.30596357583999634, -0.2816314101219177, -0.2572992742061615, -0.23296710848808289, -0.20863497257232666, -0.18430282175540924, -0.15997067093849182, -0.1356385350227356, -0.11130638420581818, -0.08697423338890076, -0.06264208257198334, -0.038309939205646515, -0.013977795839309692, 0.010354354977607727, 0.034686505794525146, 0.05901864171028137, 0.08335079252719879, 0.10768294334411621, 0.13201509416103363, 0.15634724497795105, 0.18067938089370728, 0.2050115317106247, 0.22934368252754211, 0.25367581844329834, 0.27800798416137695, 0.30234014987945557, 0.3266722857952118, 0.3510044515132904, 0.37533658742904663, 0.39966875314712524, 0.42400088906288147, 0.4483330249786377, 0.4726651906967163, 0.49699732661247253, 0.5213294625282288, 0.5456616282463074, 0.5699937343597412, 0.5943259000778198, 0.6186580657958984, 0.642990231513977, 0.6673223376274109, 0.6916545033454895, 0.7159866690635681, 0.740318775177002, 0.7646509408950806, 0.7889831066131592, 0.8133152723312378, 0.8376473784446716, 0.8619795441627502, 0.8863116502761841, 0.9106438159942627, 0.9349759221076965, 0.9593080878257751, 0.9836402535438538, 1.0079723596572876, 1.0323045253753662, 1.0566366910934448, 1.0809688568115234]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 0.0, 4.0, 6.0, 10.0, 11.0, 16.0, 15.0, 17.0, 36.0, 22.0, 32.0, 45.0, 28.0, 55.0, 55.0, 44.0, 54.0, 57.0, 53.0, 52.0, 56.0, 37.0, 47.0, 37.0, 35.0, 31.0, 35.0, 22.0, 23.0, 20.0, 17.0, 9.0, 1.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.34772950410842896, -0.33804401755332947, -0.32835856080055237, -0.3186730742454529, -0.3089876174926758, -0.2993021309375763, -0.2896166741847992, -0.2799311876296997, -0.2702457308769226, -0.2605602443218231, -0.250874787569046, -0.24118931591510773, -0.23150384426116943, -0.22181835770606995, -0.21213288605213165, -0.20244741439819336, -0.19276192784309387, -0.18307645618915558, -0.17339098453521729, -0.163705512881279, -0.1540200412273407, -0.1443345546722412, -0.13464908301830292, -0.12496361136436462, -0.11527813971042633, -0.10559266805648804, -0.09590719640254974, -0.08622171729803085, -0.07653624564409256, -0.06685077399015427, -0.057165298610925674, -0.04747982323169708, -0.03779435157775879, -0.028108878061175346, -0.018423404544591904, -0.008737931028008461, 0.0009475424885749817, 0.010633014142513275, 0.020318489521741867, 0.03000396490097046, 0.03968943655490875, 0.049374908208847046, 0.05906038358807564, 0.06874585896730423, 0.07843133062124252, 0.08811680227518082, 0.09780228137969971, 0.107487753033638, 0.1171732246875763, 0.1268586963415146, 0.13654416799545288, 0.14622963964939117, 0.15591511130332947, 0.16560059785842896, 0.17528606951236725, 0.18497154116630554, 0.19465701282024384, 0.20434248447418213, 0.21402795612812042, 0.22371342778205872, 0.2333989143371582, 0.2430843710899353, 0.2527698576450348, 0.2624553442001343, 0.2721408009529114]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 1.0, 7.0, 5.0, 10.0, 14.0, 12.0, 11.0, 11.0, 23.0, 15.0, 23.0, 24.0, 33.0, 34.0, 32.0, 34.0, 42.0, 35.0, 36.0, 47.0, 42.0, 42.0, 48.0, 29.0, 45.0, 38.0, 34.0, 36.0, 25.0, 29.0, 28.0, 27.0, 23.0, 17.0, 10.0, 14.0, 11.0, 9.0, 13.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72412109375, -0.7027664184570312, -0.6814117431640625, -0.6600570678710938, -0.638702392578125, -0.6173477172851562, -0.5959930419921875, -0.5746383666992188, -0.55328369140625, -0.5319290161132812, -0.5105743408203125, -0.48921966552734375, -0.467864990234375, -0.44651031494140625, -0.4251556396484375, -0.40380096435546875, -0.3824462890625, -0.36109161376953125, -0.3397369384765625, -0.31838226318359375, -0.297027587890625, -0.27567291259765625, -0.2543182373046875, -0.23296356201171875, -0.21160888671875, -0.19025421142578125, -0.1688995361328125, -0.14754486083984375, -0.126190185546875, -0.10483551025390625, -0.0834808349609375, -0.06212615966796875, -0.040771484375, -0.01941680908203125, 0.0019378662109375, 0.02329254150390625, 0.044647216796875, 0.06600189208984375, 0.0873565673828125, 0.10871124267578125, 0.13006591796875, 0.15142059326171875, 0.1727752685546875, 0.19412994384765625, 0.215484619140625, 0.23683929443359375, 0.2581939697265625, 0.27954864501953125, 0.3009033203125, 0.32225799560546875, 0.3436126708984375, 0.36496734619140625, 0.386322021484375, 0.40767669677734375, 0.4290313720703125, 0.45038604736328125, 0.47174072265625, 0.49309539794921875, 0.5144500732421875, 0.5358047485351562, 0.557159423828125, 0.5785140991210938, 0.5998687744140625, 0.6212234497070312, 0.642578125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 17.0, 16.0, 21.0, 25.0, 29.0, 58.0, 89.0, 156.0, 203.0, 317.0, 457.0, 724.0, 1101.0, 1774.0, 2879.0, 4892.0, 8673.0, 15938.0, 32433.0, 73020.0, 197471.0, 409946.0, 169675.0, 64685.0, 29405.0, 14530.0, 7944.0, 4594.0, 2699.0, 1648.0, 1135.0, 662.0, 455.0, 312.0, 188.0, 117.0, 91.0, 50.0, 36.0, 27.0, 21.0, 15.0, 16.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.26953125, -2.19732666015625, -2.1251220703125, -2.05291748046875, -1.980712890625, -1.90850830078125, -1.8363037109375, -1.76409912109375, -1.69189453125, -1.61968994140625, -1.5474853515625, -1.47528076171875, -1.403076171875, -1.33087158203125, -1.2586669921875, -1.18646240234375, -1.1142578125, -1.04205322265625, -0.9698486328125, -0.89764404296875, -0.825439453125, -0.75323486328125, -0.6810302734375, -0.60882568359375, -0.53662109375, -0.46441650390625, -0.3922119140625, -0.32000732421875, -0.247802734375, -0.17559814453125, -0.1033935546875, -0.03118896484375, 0.041015625, 0.11322021484375, 0.1854248046875, 0.25762939453125, 0.329833984375, 0.40203857421875, 0.4742431640625, 0.54644775390625, 0.61865234375, 0.69085693359375, 0.7630615234375, 0.83526611328125, 0.907470703125, 0.97967529296875, 1.0518798828125, 1.12408447265625, 1.1962890625, 1.26849365234375, 1.3406982421875, 1.41290283203125, 1.485107421875, 1.55731201171875, 1.6295166015625, 1.70172119140625, 1.77392578125, 1.84613037109375, 1.9183349609375, 1.99053955078125, 2.062744140625, 2.13494873046875, 2.2071533203125, 2.27935791015625, 2.3515625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 15.0, 8.0, 16.0, 23.0, 18.0, 23.0, 32.0, 29.0, 33.0, 50.0, 79.0, 101.0, 139.0, 196.0, 1324.0, 208.0, 187.0, 110.0, 70.0, 66.0, 56.0, 50.0, 33.0, 30.0, 23.0, 17.0, 19.0, 13.0, 19.0, 13.0, 5.0, 4.0, 5.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.68475341796875, -2.5999755859375, -2.51519775390625, -2.430419921875, -2.34564208984375, -2.2608642578125, -2.17608642578125, -2.09130859375, -2.00653076171875, -1.9217529296875, -1.83697509765625, -1.752197265625, -1.66741943359375, -1.5826416015625, -1.49786376953125, -1.4130859375, -1.32830810546875, -1.2435302734375, -1.15875244140625, -1.073974609375, -0.98919677734375, -0.9044189453125, -0.81964111328125, -0.73486328125, -0.65008544921875, -0.5653076171875, -0.48052978515625, -0.395751953125, -0.31097412109375, -0.2261962890625, -0.14141845703125, -0.056640625, 0.02813720703125, 0.1129150390625, 0.19769287109375, 0.282470703125, 0.36724853515625, 0.4520263671875, 0.53680419921875, 0.62158203125, 0.70635986328125, 0.7911376953125, 0.87591552734375, 0.960693359375, 1.04547119140625, 1.1302490234375, 1.21502685546875, 1.2998046875, 1.38458251953125, 1.4693603515625, 1.55413818359375, 1.638916015625, 1.72369384765625, 1.8084716796875, 1.89324951171875, 1.97802734375, 2.06280517578125, 2.1475830078125, 2.23236083984375, 2.317138671875, 2.40191650390625, 2.4866943359375, 2.57147216796875, 2.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 16.0, 12.0, 16.0, 19.0, 20.0, 31.0, 33.0, 63.0, 106.0, 261.0, 1005.0, 7329.0, 307661.0, 2798809.0, 27239.0, 2278.0, 411.0, 138.0, 72.0, 42.0, 34.0, 21.0, 12.0, 18.0, 13.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.8955078125, -11.501953125, -11.1083984375, -10.71484375, -10.3212890625, -9.927734375, -9.5341796875, -9.140625, -8.7470703125, -8.353515625, -7.9599609375, -7.56640625, -7.1728515625, -6.779296875, -6.3857421875, -5.9921875, -5.5986328125, -5.205078125, -4.8115234375, -4.41796875, -4.0244140625, -3.630859375, -3.2373046875, -2.84375, -2.4501953125, -2.056640625, -1.6630859375, -1.26953125, -0.8759765625, -0.482421875, -0.0888671875, 0.3046875, 0.6982421875, 1.091796875, 1.4853515625, 1.87890625, 2.2724609375, 2.666015625, 3.0595703125, 3.453125, 3.8466796875, 4.240234375, 4.6337890625, 5.02734375, 5.4208984375, 5.814453125, 6.2080078125, 6.6015625, 6.9951171875, 7.388671875, 7.7822265625, 8.17578125, 8.5693359375, 8.962890625, 9.3564453125, 9.75, 10.1435546875, 10.537109375, 10.9306640625, 11.32421875, 11.7177734375, 12.111328125, 12.5048828125, 12.8984375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 44.0, 329.0, 502.0, 125.0, 14.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.377891540527344, -32.19456481933594, -31.011234283447266, -29.827905654907227, -28.644577026367188, -27.46125030517578, -26.277921676635742, -25.094593048095703, -23.911264419555664, -22.727935791015625, -21.544607162475586, -20.361278533935547, -19.17795181274414, -17.99462127685547, -16.811294555664062, -15.627965927124023, -14.444637298583984, -13.261308670043945, -12.077980041503906, -10.894652366638184, -9.711323738098145, -8.527995109558105, -7.344666957855225, -6.161338806152344, -4.978010177612305, -3.7946817874908447, -2.6113533973693848, -1.4280250072479248, -0.24469661712646484, 0.9386320114135742, 2.121960163116455, 3.305288314819336, 4.488616943359375, 5.671945571899414, 6.855273723602295, 8.038601875305176, 9.221930503845215, 10.405259132385254, 11.588586807250977, 12.771915435791016, 13.955244064331055, 15.138572692871094, 16.321901321411133, 17.505229949951172, 18.688556671142578, 19.87188720703125, 21.055213928222656, 22.238542556762695, 23.421871185302734, 24.605199813842773, 25.788528442382812, 26.97185707092285, 28.15518569946289, 29.338512420654297, 30.521841049194336, 31.705169677734375, 32.88849639892578, 34.07182312011719, 35.25515365600586, 36.438480377197266, 37.62181091308594, 38.805137634277344, 39.988468170166016, 41.17179489135742, 42.355125427246094]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 4.0, 6.0, 8.0, 6.0, 19.0, 15.0, 9.0, 19.0, 17.0, 19.0, 20.0, 25.0, 31.0, 38.0, 42.0, 27.0, 31.0, 36.0, 38.0, 37.0, 35.0, 34.0, 38.0, 46.0, 40.0, 25.0, 40.0, 42.0, 22.0, 27.0, 24.0, 20.0, 25.0, 19.0, 19.0, 16.0, 15.0, 10.0, 7.0, 8.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.416872024536133, -8.174131393432617, -7.931390762329102, -7.688650131225586, -7.44590950012207, -7.203168869018555, -6.960428714752197, -6.717688083648682, -6.474947452545166, -6.23220682144165, -5.989466190338135, -5.746725559234619, -5.503985404968262, -5.261244773864746, -5.0185041427612305, -4.775763511657715, -4.533022880554199, -4.290282249450684, -4.047541618347168, -3.8048012256622314, -3.562060594558716, -3.3193199634552, -3.0765795707702637, -2.833838939666748, -2.5910983085632324, -2.348357677459717, -2.105617046356201, -1.8628766536712646, -1.620136022567749, -1.3773953914642334, -1.1346548795700073, -0.8919143676757812, -0.6491737365722656, -0.4064331650733948, -0.16369259357452393, 0.07904797792434692, 0.3217885494232178, 0.5645291805267334, 0.8072696924209595, 1.0500102043151855, 1.2927508354187012, 1.5354914665222168, 1.7782319784164429, 2.020972490310669, 2.2637131214141846, 2.5064537525177, 2.7491941452026367, 2.9919347763061523, 3.234675407409668, 3.4774160385131836, 3.720156669616699, 3.9628970623016357, 4.2056379318237305, 4.448378562927246, 4.6911187171936035, 4.933859348297119, 5.176599979400635, 5.41934061050415, 5.662081241607666, 5.904821872711182, 6.147562026977539, 6.390302658081055, 6.63304328918457, 6.875783920288086, 7.118524551391602]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 5.0, 7.0, 3.0, 8.0, 11.0, 7.0, 14.0, 14.0, 22.0, 19.0, 25.0, 23.0, 26.0, 31.0, 34.0, 30.0, 31.0, 36.0, 43.0, 37.0, 38.0, 45.0, 47.0, 44.0, 40.0, 41.0, 38.0, 27.0, 34.0, 20.0, 33.0, 22.0, 25.0, 19.0, 19.0, 11.0, 15.0, 8.0, 16.0, 9.0, 5.0, 4.0, 4.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.779296875, -0.7560958862304688, -0.7328948974609375, -0.7096939086914062, -0.686492919921875, -0.6632919311523438, -0.6400909423828125, -0.6168899536132812, -0.59368896484375, -0.5704879760742188, -0.5472869873046875, -0.5240859985351562, -0.500885009765625, -0.47768402099609375, -0.4544830322265625, -0.43128204345703125, -0.4080810546875, -0.38488006591796875, -0.3616790771484375, -0.33847808837890625, -0.315277099609375, -0.29207611083984375, -0.2688751220703125, -0.24567413330078125, -0.22247314453125, -0.19927215576171875, -0.1760711669921875, -0.15287017822265625, -0.129669189453125, -0.10646820068359375, -0.0832672119140625, -0.06006622314453125, -0.036865234375, -0.01366424560546875, 0.0095367431640625, 0.03273773193359375, 0.055938720703125, 0.07913970947265625, 0.1023406982421875, 0.12554168701171875, 0.14874267578125, 0.17194366455078125, 0.1951446533203125, 0.21834564208984375, 0.241546630859375, 0.26474761962890625, 0.2879486083984375, 0.31114959716796875, 0.3343505859375, 0.35755157470703125, 0.3807525634765625, 0.40395355224609375, 0.427154541015625, 0.45035552978515625, 0.4735565185546875, 0.49675750732421875, 0.51995849609375, 0.5431594848632812, 0.5663604736328125, 0.5895614624023438, 0.612762451171875, 0.6359634399414062, 0.6591644287109375, 0.6823654174804688, 0.70556640625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 9.0, 9.0, 18.0, 30.0, 39.0, 45.0, 65.0, 90.0, 145.0, 216.0, 338.0, 499.0, 759.0, 1124.0, 1766.0, 2695.0, 4356.0, 7296.0, 12410.0, 22168.0, 43114.0, 109576.0, 556884.0, 2660365.0, 561061.0, 111727.0, 44289.0, 22187.0, 12138.0, 7119.0, 4372.0, 2723.0, 1638.0, 997.0, 681.0, 432.0, 288.0, 205.0, 143.0, 76.0, 58.0, 29.0, 29.0, 25.0, 13.0, 16.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.35546875, -2.28515625, -2.21484375, -2.14453125, -2.07421875, -2.00390625, -1.93359375, -1.86328125, -1.79296875, -1.72265625, -1.65234375, -1.58203125, -1.51171875, -1.44140625, -1.37109375, -1.30078125, -1.23046875, -1.16015625, -1.08984375, -1.01953125, -0.94921875, -0.87890625, -0.80859375, -0.73828125, -0.66796875, -0.59765625, -0.52734375, -0.45703125, -0.38671875, -0.31640625, -0.24609375, -0.17578125, -0.10546875, -0.03515625, 0.03515625, 0.10546875, 0.17578125, 0.24609375, 0.31640625, 0.38671875, 0.45703125, 0.52734375, 0.59765625, 0.66796875, 0.73828125, 0.80859375, 0.87890625, 0.94921875, 1.01953125, 1.08984375, 1.16015625, 1.23046875, 1.30078125, 1.37109375, 1.44140625, 1.51171875, 1.58203125, 1.65234375, 1.72265625, 1.79296875, 1.86328125, 1.93359375, 2.00390625, 2.07421875, 2.14453125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 8.0, 12.0, 19.0, 25.0, 34.0, 43.0, 78.0, 94.0, 157.0, 284.0, 552.0, 972.0, 745.0, 409.0, 211.0, 140.0, 99.0, 55.0, 33.0, 34.0, 17.0, 8.0, 9.0, 13.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.6845703125, -4.560546875, -4.4365234375, -4.3125, -4.1884765625, -4.064453125, -3.9404296875, -3.81640625, -3.6923828125, -3.568359375, -3.4443359375, -3.3203125, -3.1962890625, -3.072265625, -2.9482421875, -2.82421875, -2.7001953125, -2.576171875, -2.4521484375, -2.328125, -2.2041015625, -2.080078125, -1.9560546875, -1.83203125, -1.7080078125, -1.583984375, -1.4599609375, -1.3359375, -1.2119140625, -1.087890625, -0.9638671875, -0.83984375, -0.7158203125, -0.591796875, -0.4677734375, -0.34375, -0.2197265625, -0.095703125, 0.0283203125, 0.15234375, 0.2763671875, 0.400390625, 0.5244140625, 0.6484375, 0.7724609375, 0.896484375, 1.0205078125, 1.14453125, 1.2685546875, 1.392578125, 1.5166015625, 1.640625, 1.7646484375, 1.888671875, 2.0126953125, 2.13671875, 2.2607421875, 2.384765625, 2.5087890625, 2.6328125, 2.7568359375, 2.880859375, 3.0048828125, 3.12890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 3.0, 10.0, 16.0, 23.0, 22.0, 26.0, 44.0, 71.0, 120.0, 239.0, 515.0, 1293.0, 3578.0, 11493.0, 46695.0, 277244.0, 3242846.0, 518310.0, 67819.0, 16159.0, 4691.0, 1710.0, 664.0, 295.0, 143.0, 83.0, 52.0, 29.0, 24.0, 22.0, 10.0, 16.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.328125, -9.08660888671875, -8.8450927734375, -8.60357666015625, -8.362060546875, -8.12054443359375, -7.8790283203125, -7.63751220703125, -7.39599609375, -7.15447998046875, -6.9129638671875, -6.67144775390625, -6.429931640625, -6.18841552734375, -5.9468994140625, -5.70538330078125, -5.4638671875, -5.22235107421875, -4.9808349609375, -4.73931884765625, -4.497802734375, -4.25628662109375, -4.0147705078125, -3.77325439453125, -3.53173828125, -3.29022216796875, -3.0487060546875, -2.80718994140625, -2.565673828125, -2.32415771484375, -2.0826416015625, -1.84112548828125, -1.599609375, -1.35809326171875, -1.1165771484375, -0.87506103515625, -0.633544921875, -0.39202880859375, -0.1505126953125, 0.09100341796875, 0.33251953125, 0.57403564453125, 0.8155517578125, 1.05706787109375, 1.298583984375, 1.54010009765625, 1.7816162109375, 2.02313232421875, 2.2646484375, 2.50616455078125, 2.7476806640625, 2.98919677734375, 3.230712890625, 3.47222900390625, 3.7137451171875, 3.95526123046875, 4.19677734375, 4.43829345703125, 4.6798095703125, 4.92132568359375, 5.162841796875, 5.40435791015625, 5.6458740234375, 5.88739013671875, 6.12890625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 12.0, 23.0, 51.0, 81.0, 164.0, 210.0, 217.0, 125.0, 63.0, 36.0, 15.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.495407104492188, -15.705595970153809, -14.91578483581543, -14.12597370147705, -13.336162567138672, -12.546351432800293, -11.756540298461914, -10.966729164123535, -10.176918029785156, -9.387106895446777, -8.597295761108398, -7.8074846267700195, -7.017673492431641, -6.227862358093262, -5.438051223754883, -4.648240089416504, -3.858428955078125, -3.068617820739746, -2.278806686401367, -1.4889955520629883, -0.6991844177246094, 0.09062671661376953, 0.8804378509521484, 1.6702489852905273, 2.4600601196289062, 3.249871253967285, 4.039682388305664, 4.829493522644043, 5.619304656982422, 6.409115791320801, 7.19892692565918, 7.988738059997559, 8.778549194335938, 9.568360328674316, 10.358171463012695, 11.147982597351074, 11.937793731689453, 12.727604866027832, 13.517416000366211, 14.30722713470459, 15.097038269042969, 15.886849403381348, 16.676660537719727, 17.466472625732422, 18.256282806396484, 19.046092987060547, 19.835905075073242, 20.625717163085938, 21.41552734375, 22.205337524414062, 22.995149612426758, 23.784961700439453, 24.574771881103516, 25.364582061767578, 26.154394149780273, 26.94420623779297, 27.73401641845703, 28.523826599121094, 29.31363868713379, 30.103450775146484, 30.893260955810547, 31.68307113647461, 32.47288513183594, 33.2626953125, 34.05250549316406]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 6.0, 6.0, 9.0, 9.0, 16.0, 21.0, 13.0, 18.0, 20.0, 23.0, 20.0, 29.0, 32.0, 36.0, 40.0, 38.0, 31.0, 33.0, 43.0, 36.0, 40.0, 36.0, 44.0, 30.0, 52.0, 28.0, 37.0, 33.0, 32.0, 27.0, 29.0, 21.0, 22.0, 14.0, 10.0, 10.0, 13.0, 6.0, 6.0, 6.0, 9.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.426960468292236, -7.167996406555176, -6.909032344818115, -6.650068283081055, -6.391103744506836, -6.132139682769775, -5.873175621032715, -5.614211559295654, -5.355247497558594, -5.096283435821533, -4.837319374084473, -4.578354835510254, -4.319390773773193, -4.060426712036133, -3.8014626502990723, -3.5424985885620117, -3.283534049987793, -3.0245699882507324, -2.7656056880950928, -2.5066416263580322, -2.2476773262023926, -1.988713264465332, -1.7297492027282715, -1.4707850217819214, -1.2118208408355713, -0.9528566598892212, -0.6938925385475159, -0.43492841720581055, -0.17596423625946045, 0.08299994468688965, 0.3419640064239502, 0.6009281873703003, 0.8598918914794922, 1.1188560724258423, 1.3778202533721924, 1.636784315109253, 1.895748496055603, 2.154712677001953, 2.4136767387390137, 2.672640800476074, 2.931605100631714, 3.1905691623687744, 3.449533462524414, 3.7084975242614746, 3.967461585998535, 4.226426124572754, 4.485389709472656, 4.744354248046875, 5.0033183097839355, 5.262282371520996, 5.521246433258057, 5.780210494995117, 6.039175033569336, 6.2981390953063965, 6.557103157043457, 6.816067218780518, 7.075031280517578, 7.333995342254639, 7.592959403991699, 7.851923942565918, 8.11088752746582, 8.369852066040039, 8.628816604614258, 8.88778018951416, 9.146744728088379]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 3.0, 3.0, 7.0, 18.0, 15.0, 11.0, 23.0, 23.0, 36.0, 33.0, 28.0, 21.0, 37.0, 31.0, 42.0, 43.0, 42.0, 43.0, 39.0, 45.0, 50.0, 48.0, 43.0, 36.0, 36.0, 33.0, 20.0, 32.0, 26.0, 23.0, 18.0, 21.0, 17.0, 17.0, 8.0, 8.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88330078125, -0.8570327758789062, -0.8307647705078125, -0.8044967651367188, -0.778228759765625, -0.7519607543945312, -0.7256927490234375, -0.6994247436523438, -0.67315673828125, -0.6468887329101562, -0.6206207275390625, -0.5943527221679688, -0.568084716796875, -0.5418167114257812, -0.5155487060546875, -0.48928070068359375, -0.4630126953125, -0.43674468994140625, -0.4104766845703125, -0.38420867919921875, -0.357940673828125, -0.33167266845703125, -0.3054046630859375, -0.27913665771484375, -0.25286865234375, -0.22660064697265625, -0.2003326416015625, -0.17406463623046875, -0.147796630859375, -0.12152862548828125, -0.0952606201171875, -0.06899261474609375, -0.042724609375, -0.01645660400390625, 0.0098114013671875, 0.03607940673828125, 0.062347412109375, 0.08861541748046875, 0.1148834228515625, 0.14115142822265625, 0.16741943359375, 0.19368743896484375, 0.2199554443359375, 0.24622344970703125, 0.272491455078125, 0.29875946044921875, 0.3250274658203125, 0.35129547119140625, 0.3775634765625, 0.40383148193359375, 0.4300994873046875, 0.45636749267578125, 0.482635498046875, 0.5089035034179688, 0.5351715087890625, 0.5614395141601562, 0.58770751953125, 0.6139755249023438, 0.6402435302734375, 0.6665115356445312, 0.692779541015625, 0.7190475463867188, 0.7453155517578125, 0.7715835571289062, 0.7978515625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 7.0, 2.0, 12.0, 13.0, 17.0, 20.0, 30.0, 40.0, 52.0, 78.0, 117.0, 160.0, 267.0, 348.0, 506.0, 786.0, 1150.0, 1713.0, 2691.0, 4131.0, 6620.0, 10245.0, 16160.0, 25545.0, 40597.0, 64044.0, 99015.0, 142613.0, 172737.0, 153327.0, 109498.0, 71417.0, 45452.0, 28841.0, 18088.0, 11523.0, 7321.0, 4574.0, 3012.0, 1910.0, 1222.0, 823.0, 581.0, 402.0, 286.0, 192.0, 103.0, 79.0, 48.0, 45.0, 27.0, 23.0, 23.0, 9.0, 7.0, 6.0, 7.0, 2.0, 4.0, 2.0], "bins": [-0.74169921875, -0.718963623046875, -0.69622802734375, -0.673492431640625, -0.6507568359375, -0.628021240234375, -0.60528564453125, -0.582550048828125, -0.559814453125, -0.537078857421875, -0.51434326171875, -0.491607666015625, -0.4688720703125, -0.446136474609375, -0.42340087890625, -0.400665283203125, -0.3779296875, -0.355194091796875, -0.33245849609375, -0.309722900390625, -0.2869873046875, -0.264251708984375, -0.24151611328125, -0.218780517578125, -0.196044921875, -0.173309326171875, -0.15057373046875, -0.127838134765625, -0.1051025390625, -0.082366943359375, -0.05963134765625, -0.036895751953125, -0.01416015625, 0.008575439453125, 0.03131103515625, 0.054046630859375, 0.0767822265625, 0.099517822265625, 0.12225341796875, 0.144989013671875, 0.167724609375, 0.190460205078125, 0.21319580078125, 0.235931396484375, 0.2586669921875, 0.281402587890625, 0.30413818359375, 0.326873779296875, 0.349609375, 0.372344970703125, 0.39508056640625, 0.417816162109375, 0.4405517578125, 0.463287353515625, 0.48602294921875, 0.508758544921875, 0.531494140625, 0.554229736328125, 0.57696533203125, 0.599700927734375, 0.6224365234375, 0.645172119140625, 0.66790771484375, 0.690643310546875, 0.71337890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 9.0, 6.0, 4.0, 10.0, 10.0, 19.0, 20.0, 14.0, 17.0, 33.0, 25.0, 27.0, 28.0, 25.0, 45.0, 37.0, 45.0, 39.0, 43.0, 40.0, 1064.0, 36.0, 37.0, 45.0, 48.0, 41.0, 33.0, 28.0, 24.0, 28.0, 20.0, 23.0, 17.0, 18.0, 12.0, 10.0, 12.0, 9.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.93359375, -0.9053115844726562, -0.8770294189453125, -0.8487472534179688, -0.820465087890625, -0.7921829223632812, -0.7639007568359375, -0.7356185913085938, -0.70733642578125, -0.6790542602539062, -0.6507720947265625, -0.6224899291992188, -0.594207763671875, -0.5659255981445312, -0.5376434326171875, -0.5093612670898438, -0.4810791015625, -0.45279693603515625, -0.4245147705078125, -0.39623260498046875, -0.367950439453125, -0.33966827392578125, -0.3113861083984375, -0.28310394287109375, -0.25482177734375, -0.22653961181640625, -0.1982574462890625, -0.16997528076171875, -0.141693115234375, -0.11341094970703125, -0.0851287841796875, -0.05684661865234375, -0.028564453125, -0.00028228759765625, 0.0279998779296875, 0.05628204345703125, 0.084564208984375, 0.11284637451171875, 0.1411285400390625, 0.16941070556640625, 0.19769287109375, 0.22597503662109375, 0.2542572021484375, 0.28253936767578125, 0.310821533203125, 0.33910369873046875, 0.3673858642578125, 0.39566802978515625, 0.4239501953125, 0.45223236083984375, 0.4805145263671875, 0.5087966918945312, 0.537078857421875, 0.5653610229492188, 0.5936431884765625, 0.6219253540039062, 0.65020751953125, 0.6784896850585938, 0.7067718505859375, 0.7350540161132812, 0.763336181640625, 0.7916183471679688, 0.8199005126953125, 0.8481826782226562, 0.87646484375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 3.0, 10.0, 11.0, 19.0, 19.0, 27.0, 44.0, 44.0, 82.0, 100.0, 149.0, 192.0, 338.0, 480.0, 671.0, 1025.0, 1674.0, 2670.0, 4419.0, 7205.0, 12983.0, 24589.0, 58422.0, 720037.0, 1141399.0, 62033.0, 25541.0, 13235.0, 7499.0, 4461.0, 2682.0, 1718.0, 1105.0, 692.0, 443.0, 344.0, 232.0, 139.0, 117.0, 76.0, 56.0, 42.0, 26.0, 16.0, 19.0, 11.0, 9.0, 6.0, 5.0, 3.0, 7.0, 2.0, 1.0, 1.0], "bins": [-1.15625, -1.1222686767578125, -1.088287353515625, -1.0543060302734375, -1.02032470703125, -0.9863433837890625, -0.952362060546875, -0.9183807373046875, -0.8843994140625, -0.8504180908203125, -0.816436767578125, -0.7824554443359375, -0.74847412109375, -0.7144927978515625, -0.680511474609375, -0.6465301513671875, -0.612548828125, -0.5785675048828125, -0.544586181640625, -0.5106048583984375, -0.47662353515625, -0.4426422119140625, -0.408660888671875, -0.3746795654296875, -0.3406982421875, -0.3067169189453125, -0.272735595703125, -0.2387542724609375, -0.20477294921875, -0.1707916259765625, -0.136810302734375, -0.1028289794921875, -0.06884765625, -0.0348663330078125, -0.000885009765625, 0.0330963134765625, 0.06707763671875, 0.1010589599609375, 0.135040283203125, 0.1690216064453125, 0.2030029296875, 0.2369842529296875, 0.270965576171875, 0.3049468994140625, 0.33892822265625, 0.3729095458984375, 0.406890869140625, 0.4408721923828125, 0.474853515625, 0.5088348388671875, 0.542816162109375, 0.5767974853515625, 0.61077880859375, 0.6447601318359375, 0.678741455078125, 0.7127227783203125, 0.7467041015625, 0.7806854248046875, 0.814666748046875, 0.8486480712890625, 0.88262939453125, 0.9166107177734375, 0.950592041015625, 0.9845733642578125, 1.0185546875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 2.0, 2.0, 7.0, 5.0, 9.0, 5.0, 15.0, 7.0, 28.0, 18.0, 36.0, 38.0, 56.0, 67.0, 81.0, 93.0, 94.0, 63.0, 77.0, 46.0, 37.0, 28.0, 31.0, 28.0, 23.0, 21.0, 11.0, 18.0, 6.0, 8.0, 6.0, 3.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.16455078125, -0.1590747833251953, -0.15359878540039062, -0.14812278747558594, -0.14264678955078125, -0.13717079162597656, -0.13169479370117188, -0.1262187957763672, -0.1207427978515625, -0.11526679992675781, -0.10979080200195312, -0.10431480407714844, -0.09883880615234375, -0.09336280822753906, -0.08788681030273438, -0.08241081237792969, -0.076934814453125, -0.07145881652832031, -0.06598281860351562, -0.06050682067871094, -0.05503082275390625, -0.04955482482910156, -0.044078826904296875, -0.03860282897949219, -0.0331268310546875, -0.027650833129882812, -0.022174835205078125, -0.016698837280273438, -0.01122283935546875, -0.0057468414306640625, -0.000270843505859375, 0.0052051544189453125, 0.01068115234375, 0.016157150268554688, 0.021633148193359375, 0.027109146118164062, 0.03258514404296875, 0.03806114196777344, 0.043537139892578125, 0.04901313781738281, 0.0544891357421875, 0.05996513366699219, 0.06544113159179688, 0.07091712951660156, 0.07639312744140625, 0.08186912536621094, 0.08734512329101562, 0.09282112121582031, 0.098297119140625, 0.10377311706542969, 0.10924911499023438, 0.11472511291503906, 0.12020111083984375, 0.12567710876464844, 0.13115310668945312, 0.1366291046142578, 0.1421051025390625, 0.1475811004638672, 0.15305709838867188, 0.15853309631347656, 0.16400909423828125, 0.16948509216308594, 0.17496109008789062, 0.1804370880126953, 0.1859130859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 8.0, 13.0, 7.0, 15.0, 12.0, 11.0, 24.0, 29.0, 38.0, 45.0, 57.0, 78.0, 119.0, 136.0, 223.0, 528.0, 2720.0, 33955.0, 940414.0, 64676.0, 3777.0, 673.0, 251.0, 147.0, 120.0, 94.0, 67.0, 68.0, 40.0, 41.0, 27.0, 11.0, 25.0, 13.0, 11.0, 12.0, 6.0, 8.0, 5.0, 7.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.498046875, -2.4163818359375, -2.334716796875, -2.2530517578125, -2.17138671875, -2.0897216796875, -2.008056640625, -1.9263916015625, -1.8447265625, -1.7630615234375, -1.681396484375, -1.5997314453125, -1.51806640625, -1.4364013671875, -1.354736328125, -1.2730712890625, -1.19140625, -1.1097412109375, -1.028076171875, -0.9464111328125, -0.86474609375, -0.7830810546875, -0.701416015625, -0.6197509765625, -0.5380859375, -0.4564208984375, -0.374755859375, -0.2930908203125, -0.21142578125, -0.1297607421875, -0.048095703125, 0.0335693359375, 0.115234375, 0.1968994140625, 0.278564453125, 0.3602294921875, 0.44189453125, 0.5235595703125, 0.605224609375, 0.6868896484375, 0.7685546875, 0.8502197265625, 0.931884765625, 1.0135498046875, 1.09521484375, 1.1768798828125, 1.258544921875, 1.3402099609375, 1.421875, 1.5035400390625, 1.585205078125, 1.6668701171875, 1.74853515625, 1.8302001953125, 1.911865234375, 1.9935302734375, 2.0751953125, 2.1568603515625, 2.238525390625, 2.3201904296875, 2.40185546875, 2.4835205078125, 2.565185546875, 2.6468505859375, 2.728515625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 34.0, 341.0, 566.0, 65.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4697303771972656, -3.278604507446289, -3.0874786376953125, -2.896353006362915, -2.7052271366119385, -2.514101266860962, -2.3229756355285645, -2.131849765777588, -1.9407238960266113, -1.7495980262756348, -1.5584722757339478, -1.3673465251922607, -1.1762206554412842, -0.9850948452949524, -0.7939690351486206, -0.6028432846069336, -0.41171741485595703, -0.22059160470962524, -0.029465794563293457, 0.16166001558303833, 0.3527858257293701, 0.5439116358757019, 0.7350374460220337, 0.9261631965637207, 1.1172890663146973, 1.3084149360656738, 1.4995406866073608, 1.6906664371490479, 1.8817923069000244, 2.072918176651001, 2.2640438079833984, 2.455169677734375, 2.6462955474853516, 2.837421417236328, 3.0285472869873047, 3.219672918319702, 3.4107987880706787, 3.6019246578216553, 3.7930502891540527, 3.9841761589050293, 4.175302028656006, 4.366427898406982, 4.557553768157959, 4.7486796379089355, 4.939805030822754, 5.1309309005737305, 5.322056770324707, 5.513182640075684, 5.70430850982666, 5.895434379577637, 6.086560249328613, 6.27768611907959, 6.468811988830566, 6.659937381744385, 6.851063251495361, 7.042189121246338, 7.2333149909973145, 7.424440860748291, 7.615566730499268, 7.806692600250244, 7.9978179931640625, 8.188943862915039, 8.380069732666016, 8.571195602416992, 8.762321472167969]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 8.0, 11.0, 17.0, 21.0, 15.0, 33.0, 21.0, 38.0, 36.0, 43.0, 47.0, 55.0, 62.0, 54.0, 57.0, 81.0, 67.0, 53.0, 36.0, 41.0, 34.0, 33.0, 27.0, 25.0, 22.0, 11.0, 8.0, 14.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.015175461769104, -0.9890737533569336, -0.9629720449447632, -0.9368703365325928, -0.9107686281204224, -0.884666919708252, -0.8585652709007263, -0.8324635624885559, -0.8063618540763855, -0.7802601456642151, -0.7541584372520447, -0.7280567288398743, -0.7019550800323486, -0.6758533716201782, -0.6497516632080078, -0.6236499547958374, -0.597548246383667, -0.5714465379714966, -0.5453448295593262, -0.5192431211471558, -0.49314144253730774, -0.46703973412513733, -0.4409380555152893, -0.4148363471031189, -0.3887346386909485, -0.3626329302787781, -0.33653122186660767, -0.31042954325675964, -0.28432783484458923, -0.2582261264324188, -0.2321244329214096, -0.2060227394104004, -0.17992109060287476, -0.15381938219070435, -0.12771768867969513, -0.10161598771810532, -0.0755142867565155, -0.04941257834434509, -0.023310884833335876, 0.00279080867767334, 0.02889251708984375, 0.05499421805143356, 0.08109591901302338, 0.10719761997461319, 0.133299320936203, 0.1594010293483734, 0.18550272285938263, 0.21160441637039185, 0.23770612478256226, 0.26380783319473267, 0.2899095416069031, 0.3160112202167511, 0.3421129286289215, 0.3682146370410919, 0.39431631565093994, 0.42041802406311035, 0.44651973247528076, 0.47262144088745117, 0.4987231492996216, 0.524824857711792, 0.5509265661239624, 0.5770282745361328, 0.6031299233436584, 0.6292316317558289, 0.6553333401679993]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 11.0, 15.0, 17.0, 12.0, 19.0, 26.0, 27.0, 41.0, 29.0, 20.0, 35.0, 29.0, 49.0, 40.0, 37.0, 44.0, 46.0, 48.0, 45.0, 51.0, 43.0, 38.0, 26.0, 37.0, 27.0, 27.0, 27.0, 21.0, 19.0, 19.0, 22.0, 12.0, 9.0, 9.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88623046875, -0.8598175048828125, -0.833404541015625, -0.8069915771484375, -0.78057861328125, -0.7541656494140625, -0.727752685546875, -0.7013397216796875, -0.6749267578125, -0.6485137939453125, -0.622100830078125, -0.5956878662109375, -0.56927490234375, -0.5428619384765625, -0.516448974609375, -0.4900360107421875, -0.463623046875, -0.4372100830078125, -0.410797119140625, -0.3843841552734375, -0.35797119140625, -0.3315582275390625, -0.305145263671875, -0.2787322998046875, -0.2523193359375, -0.2259063720703125, -0.199493408203125, -0.1730804443359375, -0.14666748046875, -0.1202545166015625, -0.093841552734375, -0.0674285888671875, -0.041015625, -0.0146026611328125, 0.011810302734375, 0.0382232666015625, 0.06463623046875, 0.0910491943359375, 0.117462158203125, 0.1438751220703125, 0.1702880859375, 0.1967010498046875, 0.223114013671875, 0.2495269775390625, 0.27593994140625, 0.3023529052734375, 0.328765869140625, 0.3551788330078125, 0.381591796875, 0.4080047607421875, 0.434417724609375, 0.4608306884765625, 0.48724365234375, 0.5136566162109375, 0.540069580078125, 0.5664825439453125, 0.5928955078125, 0.6193084716796875, 0.645721435546875, 0.6721343994140625, 0.69854736328125, 0.7249603271484375, 0.751373291015625, 0.7777862548828125, 0.80419921875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 11.0, 16.0, 14.0, 31.0, 28.0, 38.0, 61.0, 70.0, 89.0, 141.0, 206.0, 300.0, 378.0, 560.0, 698.0, 1064.0, 1531.0, 2319.0, 3488.0, 5608.0, 9898.0, 21723.0, 73722.0, 562130.0, 280217.0, 45607.0, 16196.0, 7976.0, 4741.0, 2994.0, 1922.0, 1389.0, 1005.0, 669.0, 479.0, 319.0, 239.0, 181.0, 144.0, 100.0, 72.0, 42.0, 45.0, 21.0, 17.0, 14.0, 7.0, 10.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.891357421875, -2.79443359375, -2.697509765625, -2.6005859375, -2.503662109375, -2.40673828125, -2.309814453125, -2.212890625, -2.115966796875, -2.01904296875, -1.922119140625, -1.8251953125, -1.728271484375, -1.63134765625, -1.534423828125, -1.4375, -1.340576171875, -1.24365234375, -1.146728515625, -1.0498046875, -0.952880859375, -0.85595703125, -0.759033203125, -0.662109375, -0.565185546875, -0.46826171875, -0.371337890625, -0.2744140625, -0.177490234375, -0.08056640625, 0.016357421875, 0.11328125, 0.210205078125, 0.30712890625, 0.404052734375, 0.5009765625, 0.597900390625, 0.69482421875, 0.791748046875, 0.888671875, 0.985595703125, 1.08251953125, 1.179443359375, 1.2763671875, 1.373291015625, 1.47021484375, 1.567138671875, 1.6640625, 1.760986328125, 1.85791015625, 1.954833984375, 2.0517578125, 2.148681640625, 2.24560546875, 2.342529296875, 2.439453125, 2.536376953125, 2.63330078125, 2.730224609375, 2.8271484375, 2.924072265625, 3.02099609375, 3.117919921875, 3.21484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 8.0, 6.0, 2.0, 3.0, 11.0, 11.0, 13.0, 18.0, 17.0, 28.0, 23.0, 19.0, 26.0, 31.0, 36.0, 41.0, 46.0, 79.0, 92.0, 130.0, 262.0, 1381.0, 222.0, 103.0, 74.0, 43.0, 48.0, 32.0, 33.0, 36.0, 32.0, 25.0, 13.0, 22.0, 14.0, 16.0, 4.0, 11.0, 6.0, 6.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.771484375, -2.680206298828125, -2.58892822265625, -2.497650146484375, -2.4063720703125, -2.315093994140625, -2.22381591796875, -2.132537841796875, -2.041259765625, -1.949981689453125, -1.85870361328125, -1.767425537109375, -1.6761474609375, -1.584869384765625, -1.49359130859375, -1.402313232421875, -1.31103515625, -1.219757080078125, -1.12847900390625, -1.037200927734375, -0.9459228515625, -0.854644775390625, -0.76336669921875, -0.672088623046875, -0.580810546875, -0.489532470703125, -0.39825439453125, -0.306976318359375, -0.2156982421875, -0.124420166015625, -0.03314208984375, 0.058135986328125, 0.1494140625, 0.240692138671875, 0.33197021484375, 0.423248291015625, 0.5145263671875, 0.605804443359375, 0.69708251953125, 0.788360595703125, 0.879638671875, 0.970916748046875, 1.06219482421875, 1.153472900390625, 1.2447509765625, 1.336029052734375, 1.42730712890625, 1.518585205078125, 1.60986328125, 1.701141357421875, 1.79241943359375, 1.883697509765625, 1.9749755859375, 2.066253662109375, 2.15753173828125, 2.248809814453125, 2.340087890625, 2.431365966796875, 2.52264404296875, 2.613922119140625, 2.7052001953125, 2.796478271484375, 2.88775634765625, 2.979034423828125, 3.0703125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 4.0, 9.0, 8.0, 7.0, 7.0, 9.0, 12.0, 20.0, 30.0, 60.0, 87.0, 129.0, 258.0, 409.0, 796.0, 1488.0, 3019.0, 6799.0, 20361.0, 97858.0, 1790573.0, 1118804.0, 75464.0, 17396.0, 6227.0, 2797.0, 1332.0, 688.0, 413.0, 223.0, 133.0, 67.0, 72.0, 32.0, 19.0, 25.0, 15.0, 8.0, 12.0, 5.0, 7.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.69287109375, -4.5458984375, -4.39892578125, -4.251953125, -4.10498046875, -3.9580078125, -3.81103515625, -3.6640625, -3.51708984375, -3.3701171875, -3.22314453125, -3.076171875, -2.92919921875, -2.7822265625, -2.63525390625, -2.48828125, -2.34130859375, -2.1943359375, -2.04736328125, -1.900390625, -1.75341796875, -1.6064453125, -1.45947265625, -1.3125, -1.16552734375, -1.0185546875, -0.87158203125, -0.724609375, -0.57763671875, -0.4306640625, -0.28369140625, -0.13671875, 0.01025390625, 0.1572265625, 0.30419921875, 0.451171875, 0.59814453125, 0.7451171875, 0.89208984375, 1.0390625, 1.18603515625, 1.3330078125, 1.47998046875, 1.626953125, 1.77392578125, 1.9208984375, 2.06787109375, 2.21484375, 2.36181640625, 2.5087890625, 2.65576171875, 2.802734375, 2.94970703125, 3.0966796875, 3.24365234375, 3.390625, 3.53759765625, 3.6845703125, 3.83154296875, 3.978515625, 4.12548828125, 4.2724609375, 4.41943359375, 4.56640625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 13.0, 20.0, 64.0, 163.0, 272.0, 223.0, 136.0, 60.0, 33.0, 10.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.305017471313477, -25.777816772460938, -25.25061798095703, -24.723417282104492, -24.196218490600586, -23.669017791748047, -23.14181900024414, -22.6146183013916, -22.087417602539062, -21.560216903686523, -21.033018112182617, -20.505817413330078, -19.978618621826172, -19.451417922973633, -18.924219131469727, -18.397018432617188, -17.86981964111328, -17.342618942260742, -16.815420150756836, -16.288219451904297, -15.76102066040039, -15.233819961547852, -14.706620216369629, -14.179420471191406, -13.652220726013184, -13.125020980834961, -12.597821235656738, -12.070621490478516, -11.543420791625977, -11.01622200012207, -10.489021301269531, -9.961821556091309, -9.434621810913086, -8.907422065734863, -8.38022232055664, -7.85302209854126, -7.325822353363037, -6.7986226081848145, -6.271422386169434, -5.744222640991211, -5.21702241897583, -4.689822673797607, -4.162622451782227, -3.635422706604004, -3.1082229614257812, -2.5810232162475586, -2.053823232650757, -1.526623249053955, -0.9994235038757324, -0.4722236394882202, 0.05497622489929199, 0.5821760892868042, 1.1093759536743164, 1.636575698852539, 2.163775682449341, 2.6909756660461426, 3.2181754112243652, 3.745375156402588, 4.272575378417969, 4.799775123596191, 5.326974868774414, 5.854174613952637, 6.381374359130859, 6.90857458114624, 7.435774326324463]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 11.0, 6.0, 9.0, 8.0, 14.0, 18.0, 20.0, 18.0, 22.0, 30.0, 27.0, 35.0, 31.0, 39.0, 33.0, 45.0, 42.0, 37.0, 43.0, 43.0, 53.0, 42.0, 27.0, 41.0, 35.0, 31.0, 26.0, 36.0, 21.0, 20.0, 16.0, 23.0, 17.0, 16.0, 15.0, 12.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.989239692687988, -9.696913719177246, -9.404586791992188, -9.112260818481445, -8.819934844970703, -8.527607917785645, -8.235281944274902, -7.942955493927002, -7.650629043579102, -7.358302593231201, -7.065976142883301, -6.773650169372559, -6.481323719024658, -6.188997268676758, -5.896671295166016, -5.604344844818115, -5.312018394470215, -5.0196919441223145, -4.727365493774414, -4.435039520263672, -4.1427130699157715, -3.850386619567871, -3.55806040763855, -3.2657341957092285, -2.973407745361328, -2.6810812950134277, -2.3887550830841064, -2.096428871154785, -1.8041024208068848, -1.511776089668274, -1.219449758529663, -0.9271235466003418, -0.6347980499267578, -0.342471718788147, -0.05014538764953613, 0.2421809434890747, 0.5345072746276855, 0.8268336057662964, 1.1191599369049072, 1.4114861488342285, 1.703812599182129, 1.9961389303207397, 2.2884652614593506, 2.580791473388672, 2.8731179237365723, 3.1654443740844727, 3.457770586013794, 3.7500967979431152, 4.042423248291016, 4.334749698638916, 4.627076148986816, 4.919402122497559, 5.211728572845459, 5.504055023193359, 5.796380996704102, 6.088707447052002, 6.381033897399902, 6.673360347747803, 6.965686798095703, 7.258012771606445, 7.550339221954346, 7.842665672302246, 8.134991645812988, 8.427318572998047, 8.719644546508789]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 14.0, 8.0, 18.0, 11.0, 15.0, 17.0, 21.0, 28.0, 30.0, 30.0, 34.0, 32.0, 38.0, 30.0, 35.0, 49.0, 41.0, 45.0, 40.0, 60.0, 37.0, 38.0, 38.0, 34.0, 35.0, 24.0, 26.0, 18.0, 27.0, 21.0, 19.0, 19.0, 11.0, 14.0, 15.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9338226318359375, -0.906219482421875, -0.8786163330078125, -0.85101318359375, -0.8234100341796875, -0.795806884765625, -0.7682037353515625, -0.7406005859375, -0.7129974365234375, -0.685394287109375, -0.6577911376953125, -0.63018798828125, -0.6025848388671875, -0.574981689453125, -0.5473785400390625, -0.519775390625, -0.4921722412109375, -0.464569091796875, -0.4369659423828125, -0.40936279296875, -0.3817596435546875, -0.354156494140625, -0.3265533447265625, -0.2989501953125, -0.2713470458984375, -0.243743896484375, -0.2161407470703125, -0.18853759765625, -0.1609344482421875, -0.133331298828125, -0.1057281494140625, -0.078125, -0.0505218505859375, -0.022918701171875, 0.0046844482421875, 0.03228759765625, 0.0598907470703125, 0.087493896484375, 0.1150970458984375, 0.1427001953125, 0.1703033447265625, 0.197906494140625, 0.2255096435546875, 0.25311279296875, 0.2807159423828125, 0.308319091796875, 0.3359222412109375, 0.363525390625, 0.3911285400390625, 0.418731689453125, 0.4463348388671875, 0.47393798828125, 0.5015411376953125, 0.529144287109375, 0.5567474365234375, 0.5843505859375, 0.6119537353515625, 0.639556884765625, 0.6671600341796875, 0.69476318359375, 0.7223663330078125, 0.749969482421875, 0.7775726318359375, 0.80517578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 11.0, 8.0, 10.0, 15.0, 13.0, 25.0, 32.0, 48.0, 69.0, 94.0, 142.0, 278.0, 543.0, 1094.0, 2150.0, 5282.0, 14647.0, 50849.0, 423021.0, 3438755.0, 201607.0, 36017.0, 11442.0, 4241.0, 1850.0, 898.0, 433.0, 235.0, 141.0, 90.0, 60.0, 37.0, 37.0, 20.0, 14.0, 12.0, 15.0, 13.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.5, -4.36517333984375, -4.2303466796875, -4.09552001953125, -3.960693359375, -3.82586669921875, -3.6910400390625, -3.55621337890625, -3.42138671875, -3.28656005859375, -3.1517333984375, -3.01690673828125, -2.882080078125, -2.74725341796875, -2.6124267578125, -2.47760009765625, -2.3427734375, -2.20794677734375, -2.0731201171875, -1.93829345703125, -1.803466796875, -1.66864013671875, -1.5338134765625, -1.39898681640625, -1.26416015625, -1.12933349609375, -0.9945068359375, -0.85968017578125, -0.724853515625, -0.59002685546875, -0.4552001953125, -0.32037353515625, -0.185546875, -0.05072021484375, 0.0841064453125, 0.21893310546875, 0.353759765625, 0.48858642578125, 0.6234130859375, 0.75823974609375, 0.89306640625, 1.02789306640625, 1.1627197265625, 1.29754638671875, 1.432373046875, 1.56719970703125, 1.7020263671875, 1.83685302734375, 1.9716796875, 2.10650634765625, 2.2413330078125, 2.37615966796875, 2.510986328125, 2.64581298828125, 2.7806396484375, 2.91546630859375, 3.05029296875, 3.18511962890625, 3.3199462890625, 3.45477294921875, 3.589599609375, 3.72442626953125, 3.8592529296875, 3.99407958984375, 4.12890625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 13.0, 23.0, 27.0, 25.0, 28.0, 45.0, 56.0, 106.0, 137.0, 230.0, 370.0, 707.0, 830.0, 515.0, 306.0, 191.0, 114.0, 91.0, 49.0, 40.0, 36.0, 37.0, 22.0, 16.0, 4.0, 8.0, 10.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.267822265625, -2.17041015625, -2.072998046875, -1.9755859375, -1.878173828125, -1.78076171875, -1.683349609375, -1.5859375, -1.488525390625, -1.39111328125, -1.293701171875, -1.1962890625, -1.098876953125, -1.00146484375, -0.904052734375, -0.806640625, -0.709228515625, -0.61181640625, -0.514404296875, -0.4169921875, -0.319580078125, -0.22216796875, -0.124755859375, -0.02734375, 0.070068359375, 0.16748046875, 0.264892578125, 0.3623046875, 0.459716796875, 0.55712890625, 0.654541015625, 0.751953125, 0.849365234375, 0.94677734375, 1.044189453125, 1.1416015625, 1.239013671875, 1.33642578125, 1.433837890625, 1.53125, 1.628662109375, 1.72607421875, 1.823486328125, 1.9208984375, 2.018310546875, 2.11572265625, 2.213134765625, 2.310546875, 2.407958984375, 2.50537109375, 2.602783203125, 2.7001953125, 2.797607421875, 2.89501953125, 2.992431640625, 3.08984375, 3.187255859375, 3.28466796875, 3.382080078125, 3.4794921875, 3.576904296875, 3.67431640625, 3.771728515625, 3.869140625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 11.0, 9.0, 15.0, 28.0, 46.0, 82.0, 148.0, 270.0, 514.0, 1083.0, 2546.0, 7194.0, 21353.0, 80293.0, 511697.0, 3124455.0, 352550.0, 63799.0, 17665.0, 6133.0, 2329.0, 1006.0, 486.0, 222.0, 131.0, 69.0, 54.0, 28.0, 30.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.671630859375, -4.47216796875, -4.272705078125, -4.0732421875, -3.873779296875, -3.67431640625, -3.474853515625, -3.275390625, -3.075927734375, -2.87646484375, -2.677001953125, -2.4775390625, -2.278076171875, -2.07861328125, -1.879150390625, -1.6796875, -1.480224609375, -1.28076171875, -1.081298828125, -0.8818359375, -0.682373046875, -0.48291015625, -0.283447265625, -0.083984375, 0.115478515625, 0.31494140625, 0.514404296875, 0.7138671875, 0.913330078125, 1.11279296875, 1.312255859375, 1.51171875, 1.711181640625, 1.91064453125, 2.110107421875, 2.3095703125, 2.509033203125, 2.70849609375, 2.907958984375, 3.107421875, 3.306884765625, 3.50634765625, 3.705810546875, 3.9052734375, 4.104736328125, 4.30419921875, 4.503662109375, 4.703125, 4.902587890625, 5.10205078125, 5.301513671875, 5.5009765625, 5.700439453125, 5.89990234375, 6.099365234375, 6.298828125, 6.498291015625, 6.69775390625, 6.897216796875, 7.0966796875, 7.296142578125, 7.49560546875, 7.695068359375, 7.89453125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 13.0, 6.0, 11.0, 29.0, 35.0, 47.0, 61.0, 71.0, 87.0, 96.0, 80.0, 93.0, 68.0, 76.0, 50.0, 37.0, 29.0, 18.0, 23.0, 13.0, 15.0, 9.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.152830123901367, -11.774765014648438, -11.396700859069824, -11.018635749816895, -10.640571594238281, -10.262506484985352, -9.884441375732422, -9.506377220153809, -9.128312110900879, -8.75024700164795, -8.372182846069336, -7.994117736816406, -7.616053104400635, -7.237988471984863, -6.859923839569092, -6.48185920715332, -6.103794574737549, -5.725729942321777, -5.347665309906006, -4.969600677490234, -4.591535568237305, -4.213470935821533, -3.8354063034057617, -3.457341432571411, -3.0792768001556396, -2.701212167739868, -2.3231472969055176, -1.945082664489746, -1.567017912864685, -1.188953161239624, -0.8108885288238525, -0.43282365798950195, -0.05475902557373047, 0.3233056962490082, 0.7013704180717468, 1.079435110092163, 1.4574998617172241, 1.8355646133422852, 2.2136292457580566, 2.5916941165924072, 2.9697587490081787, 3.34782338142395, 3.725888252258301, 4.103952884674072, 4.482017517089844, 4.860082626342773, 5.238146781921387, 5.616211891174316, 5.994276523590088, 6.372341156005859, 6.750405788421631, 7.128470420837402, 7.506535530090332, 7.8846001625061035, 8.262664794921875, 8.640729904174805, 9.018794059753418, 9.396859169006348, 9.774923324584961, 10.15298843383789, 10.531052589416504, 10.909117698669434, 11.287181854248047, 11.665246963500977, 12.043312072753906]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 15.0, 15.0, 12.0, 17.0, 19.0, 19.0, 39.0, 31.0, 25.0, 39.0, 25.0, 56.0, 49.0, 39.0, 41.0, 45.0, 41.0, 39.0, 37.0, 46.0, 23.0, 30.0, 33.0, 39.0, 23.0, 31.0, 28.0, 31.0, 16.0, 15.0, 14.0, 7.0, 15.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-9.760139465332031, -9.491737365722656, -9.223335266113281, -8.954933166503906, -8.686531066894531, -8.418128967285156, -8.149726867675781, -7.8813252449035645, -7.6129231452941895, -7.3445210456848145, -7.0761189460754395, -6.8077168464660645, -6.539315223693848, -6.270913124084473, -6.002511024475098, -5.734108924865723, -5.465706825256348, -5.197304725646973, -4.928902626037598, -4.660500526428223, -4.392098426818848, -4.123696327209473, -3.855294704437256, -3.586892604827881, -3.318490505218506, -3.050088405609131, -2.781686305999756, -2.51328444480896, -2.244882345199585, -1.97648024559021, -1.7080782651901245, -1.439676284790039, -1.1712732315063477, -0.9028711915016174, -0.6344691514968872, -0.366067111492157, -0.09766507148742676, 0.17073702812194824, 0.4391390085220337, 0.7075409889221191, 0.9759430885314941, 1.2443451881408691, 1.5127471685409546, 1.78114914894104, 2.049551248550415, 2.31795334815979, 2.586355209350586, 2.854757308959961, 3.123159408569336, 3.391561508178711, 3.659963607788086, 3.928365468978882, 4.196767807006836, 4.465169906616211, 4.733571529388428, 5.001973628997803, 5.270375728607178, 5.538777828216553, 5.807179927825928, 6.075582027435303, 6.3439836502075195, 6.6123857498168945, 6.8807878494262695, 7.1491899490356445, 7.4175920486450195]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 8.0, 9.0, 11.0, 7.0, 6.0, 21.0, 8.0, 24.0, 28.0, 25.0, 25.0, 31.0, 36.0, 30.0, 37.0, 44.0, 37.0, 45.0, 55.0, 47.0, 45.0, 43.0, 39.0, 54.0, 39.0, 33.0, 30.0, 20.0, 33.0, 21.0, 18.0, 21.0, 16.0, 17.0, 7.0, 6.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.10546875, -1.0757369995117188, -1.0460052490234375, -1.0162734985351562, -0.986541748046875, -0.9568099975585938, -0.9270782470703125, -0.8973464965820312, -0.86761474609375, -0.8378829956054688, -0.8081512451171875, -0.7784194946289062, -0.748687744140625, -0.7189559936523438, -0.6892242431640625, -0.6594924926757812, -0.6297607421875, -0.6000289916992188, -0.5702972412109375, -0.5405654907226562, -0.510833740234375, -0.48110198974609375, -0.4513702392578125, -0.42163848876953125, -0.39190673828125, -0.36217498779296875, -0.3324432373046875, -0.30271148681640625, -0.272979736328125, -0.24324798583984375, -0.2135162353515625, -0.18378448486328125, -0.154052734375, -0.12432098388671875, -0.0945892333984375, -0.06485748291015625, -0.035125732421875, -0.00539398193359375, 0.0243377685546875, 0.05406951904296875, 0.08380126953125, 0.11353302001953125, 0.1432647705078125, 0.17299652099609375, 0.202728271484375, 0.23246002197265625, 0.2621917724609375, 0.29192352294921875, 0.3216552734375, 0.35138702392578125, 0.3811187744140625, 0.41085052490234375, 0.440582275390625, 0.47031402587890625, 0.5000457763671875, 0.5297775268554688, 0.55950927734375, 0.5892410278320312, 0.6189727783203125, 0.6487045288085938, 0.678436279296875, 0.7081680297851562, 0.7378997802734375, 0.7676315307617188, 0.79736328125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 8.0, 17.0, 23.0, 31.0, 43.0, 89.0, 104.0, 181.0, 314.0, 430.0, 685.0, 1172.0, 1843.0, 2902.0, 4625.0, 7421.0, 12137.0, 19365.0, 31280.0, 49464.0, 74814.0, 107718.0, 148652.0, 195672.0, 126908.0, 92515.0, 62637.0, 40292.0, 25555.0, 15650.0, 9886.0, 6122.0, 3708.0, 2284.0, 1389.0, 946.0, 561.0, 390.0, 242.0, 168.0, 97.0, 70.0, 49.0, 30.0, 23.0, 14.0, 5.0, 4.0, 0.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.9072265625, -0.879119873046875, -0.85101318359375, -0.822906494140625, -0.7947998046875, -0.766693115234375, -0.73858642578125, -0.710479736328125, -0.682373046875, -0.654266357421875, -0.62615966796875, -0.598052978515625, -0.5699462890625, -0.541839599609375, -0.51373291015625, -0.485626220703125, -0.45751953125, -0.429412841796875, -0.40130615234375, -0.373199462890625, -0.3450927734375, -0.316986083984375, -0.28887939453125, -0.260772705078125, -0.232666015625, -0.204559326171875, -0.17645263671875, -0.148345947265625, -0.1202392578125, -0.092132568359375, -0.06402587890625, -0.035919189453125, -0.0078125, 0.020294189453125, 0.04840087890625, 0.076507568359375, 0.1046142578125, 0.132720947265625, 0.16082763671875, 0.188934326171875, 0.217041015625, 0.245147705078125, 0.27325439453125, 0.301361083984375, 0.3294677734375, 0.357574462890625, 0.38568115234375, 0.413787841796875, 0.44189453125, 0.470001220703125, 0.49810791015625, 0.526214599609375, 0.5543212890625, 0.582427978515625, 0.61053466796875, 0.638641357421875, 0.666748046875, 0.694854736328125, 0.72296142578125, 0.751068115234375, 0.7791748046875, 0.807281494140625, 0.83538818359375, 0.863494873046875, 0.8916015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 10.0, 18.0, 11.0, 18.0, 19.0, 32.0, 26.0, 36.0, 37.0, 37.0, 37.0, 54.0, 48.0, 50.0, 46.0, 1081.0, 50.0, 37.0, 33.0, 47.0, 46.0, 34.0, 34.0, 31.0, 26.0, 23.0, 9.0, 18.0, 8.0, 9.0, 9.0, 7.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.976043701171875, -0.93939208984375, -0.902740478515625, -0.8660888671875, -0.829437255859375, -0.79278564453125, -0.756134033203125, -0.719482421875, -0.682830810546875, -0.64617919921875, -0.609527587890625, -0.5728759765625, -0.536224365234375, -0.49957275390625, -0.462921142578125, -0.42626953125, -0.389617919921875, -0.35296630859375, -0.316314697265625, -0.2796630859375, -0.243011474609375, -0.20635986328125, -0.169708251953125, -0.133056640625, -0.096405029296875, -0.05975341796875, -0.023101806640625, 0.0135498046875, 0.050201416015625, 0.08685302734375, 0.123504638671875, 0.16015625, 0.196807861328125, 0.23345947265625, 0.270111083984375, 0.3067626953125, 0.343414306640625, 0.38006591796875, 0.416717529296875, 0.453369140625, 0.490020751953125, 0.52667236328125, 0.563323974609375, 0.5999755859375, 0.636627197265625, 0.67327880859375, 0.709930419921875, 0.74658203125, 0.783233642578125, 0.81988525390625, 0.856536865234375, 0.8931884765625, 0.929840087890625, 0.96649169921875, 1.003143310546875, 1.039794921875, 1.076446533203125, 1.11309814453125, 1.149749755859375, 1.1864013671875, 1.223052978515625, 1.25970458984375, 1.296356201171875, 1.3330078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 6.0, 7.0, 6.0, 13.0, 13.0, 42.0, 32.0, 53.0, 85.0, 110.0, 164.0, 243.0, 331.0, 544.0, 798.0, 1262.0, 1990.0, 3165.0, 5100.0, 8452.0, 14573.0, 26293.0, 53553.0, 317347.0, 1497728.0, 85011.0, 34341.0, 18424.0, 10572.0, 6316.0, 3865.0, 2374.0, 1499.0, 953.0, 578.0, 358.0, 289.0, 205.0, 127.0, 94.0, 70.0, 36.0, 35.0, 15.0, 14.0, 9.0, 9.0, 11.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.16387939453125, -1.1265869140625, -1.08929443359375, -1.052001953125, -1.01470947265625, -0.9774169921875, -0.94012451171875, -0.90283203125, -0.86553955078125, -0.8282470703125, -0.79095458984375, -0.753662109375, -0.71636962890625, -0.6790771484375, -0.64178466796875, -0.6044921875, -0.56719970703125, -0.5299072265625, -0.49261474609375, -0.455322265625, -0.41802978515625, -0.3807373046875, -0.34344482421875, -0.30615234375, -0.26885986328125, -0.2315673828125, -0.19427490234375, -0.156982421875, -0.11968994140625, -0.0823974609375, -0.04510498046875, -0.0078125, 0.02947998046875, 0.0667724609375, 0.10406494140625, 0.141357421875, 0.17864990234375, 0.2159423828125, 0.25323486328125, 0.29052734375, 0.32781982421875, 0.3651123046875, 0.40240478515625, 0.439697265625, 0.47698974609375, 0.5142822265625, 0.55157470703125, 0.5888671875, 0.62615966796875, 0.6634521484375, 0.70074462890625, 0.738037109375, 0.77532958984375, 0.8126220703125, 0.84991455078125, 0.88720703125, 0.92449951171875, 0.9617919921875, 0.99908447265625, 1.036376953125, 1.07366943359375, 1.1109619140625, 1.14825439453125, 1.185546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 5.0, 4.0, 6.0, 8.0, 8.0, 9.0, 11.0, 20.0, 19.0, 29.0, 30.0, 31.0, 29.0, 48.0, 58.0, 64.0, 66.0, 124.0, 60.0, 59.0, 53.0, 42.0, 34.0, 35.0, 28.0, 15.0, 19.0, 25.0, 6.0, 6.0, 12.0, 5.0, 8.0, 4.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2259521484375, -0.2189464569091797, -0.21194076538085938, -0.20493507385253906, -0.19792938232421875, -0.19092369079589844, -0.18391799926757812, -0.1769123077392578, -0.1699066162109375, -0.1629009246826172, -0.15589523315429688, -0.14888954162597656, -0.14188385009765625, -0.13487815856933594, -0.12787246704101562, -0.12086677551269531, -0.113861083984375, -0.10685539245605469, -0.09984970092773438, -0.09284400939941406, -0.08583831787109375, -0.07883262634277344, -0.07182693481445312, -0.06482124328613281, -0.0578155517578125, -0.05080986022949219, -0.043804168701171875, -0.03679847717285156, -0.02979278564453125, -0.022787094116210938, -0.015781402587890625, -0.008775711059570312, -0.00177001953125, 0.0052356719970703125, 0.012241363525390625, 0.019247055053710938, 0.02625274658203125, 0.03325843811035156, 0.040264129638671875, 0.04726982116699219, 0.0542755126953125, 0.06128120422363281, 0.06828689575195312, 0.07529258728027344, 0.08229827880859375, 0.08930397033691406, 0.09630966186523438, 0.10331535339355469, 0.110321044921875, 0.11732673645019531, 0.12433242797851562, 0.13133811950683594, 0.13834381103515625, 0.14534950256347656, 0.15235519409179688, 0.1593608856201172, 0.1663665771484375, 0.1733722686767578, 0.18037796020507812, 0.18738365173339844, 0.19438934326171875, 0.20139503479003906, 0.20840072631835938, 0.2154064178466797, 0.222412109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 7.0, 6.0, 2.0, 4.0, 9.0, 17.0, 17.0, 15.0, 22.0, 21.0, 31.0, 42.0, 70.0, 70.0, 97.0, 121.0, 171.0, 297.0, 737.0, 2923.0, 18591.0, 231046.0, 732401.0, 52921.0, 6372.0, 1240.0, 436.0, 203.0, 139.0, 117.0, 85.0, 62.0, 44.0, 48.0, 24.0, 26.0, 13.0, 14.0, 16.0, 15.0, 16.0, 8.0, 7.0, 5.0, 4.0, 1.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.646484375, -2.561737060546875, -2.47698974609375, -2.392242431640625, -2.3074951171875, -2.222747802734375, -2.13800048828125, -2.053253173828125, -1.968505859375, -1.883758544921875, -1.79901123046875, -1.714263916015625, -1.6295166015625, -1.544769287109375, -1.46002197265625, -1.375274658203125, -1.29052734375, -1.205780029296875, -1.12103271484375, -1.036285400390625, -0.9515380859375, -0.866790771484375, -0.78204345703125, -0.697296142578125, -0.612548828125, -0.527801513671875, -0.44305419921875, -0.358306884765625, -0.2735595703125, -0.188812255859375, -0.10406494140625, -0.019317626953125, 0.0654296875, 0.150177001953125, 0.23492431640625, 0.319671630859375, 0.4044189453125, 0.489166259765625, 0.57391357421875, 0.658660888671875, 0.743408203125, 0.828155517578125, 0.91290283203125, 0.997650146484375, 1.0823974609375, 1.167144775390625, 1.25189208984375, 1.336639404296875, 1.42138671875, 1.506134033203125, 1.59088134765625, 1.675628662109375, 1.7603759765625, 1.845123291015625, 1.92987060546875, 2.014617919921875, 2.099365234375, 2.184112548828125, 2.26885986328125, 2.353607177734375, 2.4383544921875, 2.523101806640625, 2.60784912109375, 2.692596435546875, 2.77734375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 28.0, 180.0, 560.0, 191.0, 37.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8764781951904297, -3.626852035522461, -3.377225637435913, -3.1275992393493652, -2.8779730796813965, -2.6283469200134277, -2.37872052192688, -2.129094123840332, -1.8794679641723633, -1.629841685295105, -1.3802154064178467, -1.1305891275405884, -0.8809628486633301, -0.6313365697860718, -0.3817102909088135, -0.13208401203155518, 0.11754226684570312, 0.3671685457229614, 0.6167948246002197, 0.866421103477478, 1.1160473823547363, 1.3656736612319946, 1.615299940109253, 1.8649262189865112, 2.1145524978637695, 2.3641786575317383, 2.613805055618286, 2.863431453704834, 3.1130576133728027, 3.3626837730407715, 3.6123101711273193, 3.861936569213867, 4.111562728881836, 4.361188888549805, 4.610815048217773, 4.8604416847229, 5.110067844390869, 5.359694004058838, 5.609320640563965, 5.858946800231934, 6.108572959899902, 6.358199119567871, 6.60782527923584, 6.857451915740967, 7.1070780754089355, 7.356704235076904, 7.606330871582031, 7.85595703125, 8.105583190917969, 8.355209350585938, 8.604835510253906, 8.854461669921875, 9.104087829589844, 9.353714942932129, 9.603341102600098, 9.852967262268066, 10.102593421936035, 10.352219581604004, 10.601845741271973, 10.851471900939941, 11.101099014282227, 11.350725173950195, 11.600351333618164, 11.849977493286133, 12.099603652954102]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 10.0, 12.0, 7.0, 8.0, 11.0, 21.0, 21.0, 26.0, 38.0, 43.0, 47.0, 47.0, 47.0, 51.0, 54.0, 69.0, 55.0, 50.0, 52.0, 35.0, 65.0, 38.0, 30.0, 25.0, 32.0, 29.0, 25.0, 15.0, 9.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9749481081962585, -0.9441759586334229, -0.9134038686752319, -0.8826317191123962, -0.8518596291542053, -0.8210874795913696, -0.7903153896331787, -0.759543240070343, -0.7287710905075073, -0.6979989409446716, -0.6672268509864807, -0.636454701423645, -0.6056826114654541, -0.5749104619026184, -0.5441383123397827, -0.5133662223815918, -0.4825941324234009, -0.4518220126628876, -0.42104989290237427, -0.3902777433395386, -0.35950565338134766, -0.32873350381851196, -0.29796138405799866, -0.26718926429748535, -0.23641714453697205, -0.20564502477645874, -0.17487290501594543, -0.14410077035427094, -0.11332865059375763, -0.08255653083324432, -0.051784396171569824, -0.02101227641105652, 0.009759843349456787, 0.04053196683526039, 0.071304090321064, 0.1020762175321579, 0.1328483372926712, 0.1636204570531845, 0.194392591714859, 0.22516471147537231, 0.2559368312358856, 0.2867089509963989, 0.31748107075691223, 0.34825319051742554, 0.37902534008026123, 0.40979743003845215, 0.44056957960128784, 0.47134169936180115, 0.5021138191223145, 0.5328859686851501, 0.5636580586433411, 0.5944302082061768, 0.6252022981643677, 0.6559744477272034, 0.6867465972900391, 0.71751868724823, 0.7482907772064209, 0.7790629267692566, 0.8098350167274475, 0.8406071662902832, 0.8713792562484741, 0.9021514058113098, 0.9329235553741455, 0.9636956453323364, 0.9944677948951721]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 8.0, 11.0, 11.0, 4.0, 12.0, 14.0, 15.0, 25.0, 28.0, 28.0, 26.0, 35.0, 30.0, 31.0, 41.0, 36.0, 48.0, 50.0, 46.0, 46.0, 46.0, 45.0, 41.0, 42.0, 44.0, 33.0, 25.0, 26.0, 25.0, 22.0, 19.0, 22.0, 17.0, 13.0, 6.0, 5.0, 8.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.103515625, -1.073577880859375, -1.04364013671875, -1.013702392578125, -0.9837646484375, -0.953826904296875, -0.92388916015625, -0.893951416015625, -0.864013671875, -0.834075927734375, -0.80413818359375, -0.774200439453125, -0.7442626953125, -0.714324951171875, -0.68438720703125, -0.654449462890625, -0.62451171875, -0.594573974609375, -0.56463623046875, -0.534698486328125, -0.5047607421875, -0.474822998046875, -0.44488525390625, -0.414947509765625, -0.385009765625, -0.355072021484375, -0.32513427734375, -0.295196533203125, -0.2652587890625, -0.235321044921875, -0.20538330078125, -0.175445556640625, -0.1455078125, -0.115570068359375, -0.08563232421875, -0.055694580078125, -0.0257568359375, 0.004180908203125, 0.03411865234375, 0.064056396484375, 0.093994140625, 0.123931884765625, 0.15386962890625, 0.183807373046875, 0.2137451171875, 0.243682861328125, 0.27362060546875, 0.303558349609375, 0.33349609375, 0.363433837890625, 0.39337158203125, 0.423309326171875, 0.4532470703125, 0.483184814453125, 0.51312255859375, 0.543060302734375, 0.572998046875, 0.602935791015625, 0.63287353515625, 0.662811279296875, 0.6927490234375, 0.722686767578125, 0.75262451171875, 0.782562255859375, 0.8125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 10.0, 4.0, 10.0, 14.0, 26.0, 30.0, 33.0, 67.0, 81.0, 130.0, 290.0, 522.0, 1013.0, 2153.0, 4763.0, 12446.0, 40175.0, 238868.0, 642057.0, 73802.0, 19055.0, 7091.0, 2921.0, 1430.0, 651.0, 342.0, 181.0, 105.0, 76.0, 47.0, 40.0, 23.0, 12.0, 20.0, 9.0, 13.0, 6.0, 5.0, 0.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.256591796875, -4.11083984375, -3.965087890625, -3.8193359375, -3.673583984375, -3.52783203125, -3.382080078125, -3.236328125, -3.090576171875, -2.94482421875, -2.799072265625, -2.6533203125, -2.507568359375, -2.36181640625, -2.216064453125, -2.0703125, -1.924560546875, -1.77880859375, -1.633056640625, -1.4873046875, -1.341552734375, -1.19580078125, -1.050048828125, -0.904296875, -0.758544921875, -0.61279296875, -0.467041015625, -0.3212890625, -0.175537109375, -0.02978515625, 0.115966796875, 0.26171875, 0.407470703125, 0.55322265625, 0.698974609375, 0.8447265625, 0.990478515625, 1.13623046875, 1.281982421875, 1.427734375, 1.573486328125, 1.71923828125, 1.864990234375, 2.0107421875, 2.156494140625, 2.30224609375, 2.447998046875, 2.59375, 2.739501953125, 2.88525390625, 3.031005859375, 3.1767578125, 3.322509765625, 3.46826171875, 3.614013671875, 3.759765625, 3.905517578125, 4.05126953125, 4.197021484375, 4.3427734375, 4.488525390625, 4.63427734375, 4.780029296875, 4.92578125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 13.0, 17.0, 19.0, 25.0, 25.0, 39.0, 33.0, 46.0, 57.0, 66.0, 81.0, 112.0, 149.0, 206.0, 1316.0, 174.0, 115.0, 83.0, 83.0, 61.0, 45.0, 45.0, 49.0, 24.0, 31.0, 18.0, 18.0, 16.0, 14.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.895538330078125, -2.78521728515625, -2.674896240234375, -2.5645751953125, -2.454254150390625, -2.34393310546875, -2.233612060546875, -2.123291015625, -2.012969970703125, -1.90264892578125, -1.792327880859375, -1.6820068359375, -1.571685791015625, -1.46136474609375, -1.351043701171875, -1.24072265625, -1.130401611328125, -1.02008056640625, -0.909759521484375, -0.7994384765625, -0.689117431640625, -0.57879638671875, -0.468475341796875, -0.358154296875, -0.247833251953125, -0.13751220703125, -0.027191162109375, 0.0831298828125, 0.193450927734375, 0.30377197265625, 0.414093017578125, 0.5244140625, 0.634735107421875, 0.74505615234375, 0.855377197265625, 0.9656982421875, 1.076019287109375, 1.18634033203125, 1.296661376953125, 1.406982421875, 1.517303466796875, 1.62762451171875, 1.737945556640625, 1.8482666015625, 1.958587646484375, 2.06890869140625, 2.179229736328125, 2.28955078125, 2.399871826171875, 2.51019287109375, 2.620513916015625, 2.7308349609375, 2.841156005859375, 2.95147705078125, 3.061798095703125, 3.172119140625, 3.282440185546875, 3.39276123046875, 3.503082275390625, 3.6134033203125, 3.723724365234375, 3.83404541015625, 3.944366455078125, 4.0546875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 14.0, 12.0, 23.0, 19.0, 38.0, 68.0, 112.0, 144.0, 207.0, 343.0, 651.0, 1180.0, 2278.0, 4752.0, 11281.0, 31355.0, 109309.0, 636560.0, 2008735.0, 247397.0, 57611.0, 18838.0, 7457.0, 3350.0, 1686.0, 889.0, 525.0, 313.0, 188.0, 100.0, 86.0, 46.0, 39.0, 30.0, 18.0, 16.0, 4.0, 7.0, 5.0, 2.0, 7.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0546875, -4.89801025390625, -4.7413330078125, -4.58465576171875, -4.427978515625, -4.27130126953125, -4.1146240234375, -3.95794677734375, -3.80126953125, -3.64459228515625, -3.4879150390625, -3.33123779296875, -3.174560546875, -3.01788330078125, -2.8612060546875, -2.70452880859375, -2.5478515625, -2.39117431640625, -2.2344970703125, -2.07781982421875, -1.921142578125, -1.76446533203125, -1.6077880859375, -1.45111083984375, -1.29443359375, -1.13775634765625, -0.9810791015625, -0.82440185546875, -0.667724609375, -0.51104736328125, -0.3543701171875, -0.19769287109375, -0.041015625, 0.11566162109375, 0.2723388671875, 0.42901611328125, 0.585693359375, 0.74237060546875, 0.8990478515625, 1.05572509765625, 1.21240234375, 1.36907958984375, 1.5257568359375, 1.68243408203125, 1.839111328125, 1.99578857421875, 2.1524658203125, 2.30914306640625, 2.4658203125, 2.62249755859375, 2.7791748046875, 2.93585205078125, 3.092529296875, 3.24920654296875, 3.4058837890625, 3.56256103515625, 3.71923828125, 3.87591552734375, 4.0325927734375, 4.18927001953125, 4.345947265625, 4.50262451171875, 4.6593017578125, 4.81597900390625, 4.97265625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [9.0, 68.0, 501.0, 377.0, 54.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.694783687591553, -4.406377792358398, -2.1179723739624023, 0.17043352127075195, 2.458838939666748, 4.747244358062744, 7.035650730133057, 9.324054718017578, 11.61246109008789, 13.900866508483887, 16.189271926879883, 18.477678298950195, 20.766082763671875, 23.054489135742188, 25.3428955078125, 27.63129997253418, 29.919706344604492, 32.20811080932617, 34.496517181396484, 36.7849235534668, 39.07332992553711, 41.361732482910156, 43.65013885498047, 45.93854522705078, 48.226951599121094, 50.515357971191406, 52.80376434326172, 55.09217071533203, 57.38057327270508, 59.66897964477539, 61.9573860168457, 64.24578857421875, 66.5342025756836, 68.8226089477539, 71.11101531982422, 73.39942169189453, 75.68782806396484, 77.97622680664062, 80.26463317871094, 82.55303955078125, 84.84144592285156, 87.12985229492188, 89.41825866699219, 91.7066650390625, 93.99507141113281, 96.28347778320312, 98.57188415527344, 100.86028289794922, 103.14869689941406, 105.43710327148438, 107.72550964355469, 110.013916015625, 112.30232238769531, 114.59072875976562, 116.87913513183594, 119.16753387451172, 121.45594024658203, 123.74434661865234, 126.03275299072266, 128.32115173339844, 130.60955810546875, 132.89796447753906, 135.18637084960938, 137.4747772216797, 139.76318359375]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 10.0, 11.0, 14.0, 12.0, 21.0, 15.0, 22.0, 25.0, 25.0, 30.0, 31.0, 29.0, 35.0, 31.0, 39.0, 35.0, 27.0, 35.0, 28.0, 40.0, 40.0, 34.0, 41.0, 34.0, 31.0, 26.0, 28.0, 25.0, 27.0, 22.0, 17.0, 21.0, 10.0, 18.0, 10.0, 10.0, 13.0, 12.0, 9.0, 11.0, 8.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-10.278423309326172, -9.961944580078125, -9.645464897155762, -9.328985214233398, -9.012506484985352, -8.696027755737305, -8.379548072814941, -8.063068389892578, -7.746589660644531, -7.430110454559326, -7.113631248474121, -6.797152042388916, -6.480672836303711, -6.164193630218506, -5.847714424133301, -5.531235218048096, -5.214756011962891, -4.8982768058776855, -4.5817975997924805, -4.265318393707275, -3.9488391876220703, -3.6323599815368652, -3.31588077545166, -2.999401569366455, -2.68292236328125, -2.366443157196045, -2.04996395111084, -1.7334847450256348, -1.4170055389404297, -1.1005263328552246, -0.7840471267700195, -0.46756792068481445, -0.15108871459960938, 0.1653904914855957, 0.4818696975708008, 0.7983489036560059, 1.114828109741211, 1.431307315826416, 1.747786521911621, 2.064265727996826, 2.3807449340820312, 2.6972241401672363, 3.0137033462524414, 3.3301825523376465, 3.6466617584228516, 3.9631409645080566, 4.279620170593262, 4.596099376678467, 4.912578582763672, 5.229057788848877, 5.545536994934082, 5.862016201019287, 6.178495407104492, 6.494974613189697, 6.811453819274902, 7.127933025360107, 7.4444122314453125, 7.760891437530518, 8.077370643615723, 8.393850326538086, 8.710329055786133, 9.02680778503418, 9.343287467956543, 9.659767150878906, 9.976245880126953]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 9.0, 7.0, 8.0, 6.0, 14.0, 13.0, 24.0, 17.0, 25.0, 26.0, 23.0, 31.0, 41.0, 33.0, 35.0, 40.0, 52.0, 50.0, 60.0, 43.0, 54.0, 38.0, 44.0, 33.0, 31.0, 36.0, 31.0, 32.0, 24.0, 18.0, 21.0, 11.0, 16.0, 11.0, 11.0, 9.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.199554443359375, -1.16571044921875, -1.131866455078125, -1.0980224609375, -1.064178466796875, -1.03033447265625, -0.996490478515625, -0.962646484375, -0.928802490234375, -0.89495849609375, -0.861114501953125, -0.8272705078125, -0.793426513671875, -0.75958251953125, -0.725738525390625, -0.69189453125, -0.658050537109375, -0.62420654296875, -0.590362548828125, -0.5565185546875, -0.522674560546875, -0.48883056640625, -0.454986572265625, -0.421142578125, -0.387298583984375, -0.35345458984375, -0.319610595703125, -0.2857666015625, -0.251922607421875, -0.21807861328125, -0.184234619140625, -0.150390625, -0.116546630859375, -0.08270263671875, -0.048858642578125, -0.0150146484375, 0.018829345703125, 0.05267333984375, 0.086517333984375, 0.120361328125, 0.154205322265625, 0.18804931640625, 0.221893310546875, 0.2557373046875, 0.289581298828125, 0.32342529296875, 0.357269287109375, 0.39111328125, 0.424957275390625, 0.45880126953125, 0.492645263671875, 0.5264892578125, 0.560333251953125, 0.59417724609375, 0.628021240234375, 0.661865234375, 0.695709228515625, 0.72955322265625, 0.763397216796875, 0.7972412109375, 0.831085205078125, 0.86492919921875, 0.898773193359375, 0.9326171875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 7.0, 11.0, 22.0, 16.0, 35.0, 43.0, 48.0, 59.0, 101.0, 117.0, 235.0, 305.0, 488.0, 733.0, 1311.0, 2395.0, 4509.0, 9074.0, 20468.0, 59986.0, 455154.0, 3209905.0, 339874.0, 52815.0, 18745.0, 8295.0, 4037.0, 2162.0, 1199.0, 758.0, 448.0, 245.0, 193.0, 150.0, 100.0, 64.0, 40.0, 42.0, 20.0, 23.0, 17.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-3.947265625, -3.84185791015625, -3.7364501953125, -3.63104248046875, -3.525634765625, -3.42022705078125, -3.3148193359375, -3.20941162109375, -3.10400390625, -2.99859619140625, -2.8931884765625, -2.78778076171875, -2.682373046875, -2.57696533203125, -2.4715576171875, -2.36614990234375, -2.2607421875, -2.15533447265625, -2.0499267578125, -1.94451904296875, -1.839111328125, -1.73370361328125, -1.6282958984375, -1.52288818359375, -1.41748046875, -1.31207275390625, -1.2066650390625, -1.10125732421875, -0.995849609375, -0.89044189453125, -0.7850341796875, -0.67962646484375, -0.57421875, -0.46881103515625, -0.3634033203125, -0.25799560546875, -0.152587890625, -0.04718017578125, 0.0582275390625, 0.16363525390625, 0.26904296875, 0.37445068359375, 0.4798583984375, 0.58526611328125, 0.690673828125, 0.79608154296875, 0.9014892578125, 1.00689697265625, 1.1123046875, 1.21771240234375, 1.3231201171875, 1.42852783203125, 1.533935546875, 1.63934326171875, 1.7447509765625, 1.85015869140625, 1.95556640625, 2.06097412109375, 2.1663818359375, 2.27178955078125, 2.377197265625, 2.48260498046875, 2.5880126953125, 2.69342041015625, 2.798828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 15.0, 26.0, 48.0, 77.0, 104.0, 238.0, 708.0, 1514.0, 796.0, 259.0, 107.0, 71.0, 38.0, 21.0, 13.0, 9.0, 11.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -7.06298828125, -6.8642578125, -6.66552734375, -6.466796875, -6.26806640625, -6.0693359375, -5.87060546875, -5.671875, -5.47314453125, -5.2744140625, -5.07568359375, -4.876953125, -4.67822265625, -4.4794921875, -4.28076171875, -4.08203125, -3.88330078125, -3.6845703125, -3.48583984375, -3.287109375, -3.08837890625, -2.8896484375, -2.69091796875, -2.4921875, -2.29345703125, -2.0947265625, -1.89599609375, -1.697265625, -1.49853515625, -1.2998046875, -1.10107421875, -0.90234375, -0.70361328125, -0.5048828125, -0.30615234375, -0.107421875, 0.09130859375, 0.2900390625, 0.48876953125, 0.6875, 0.88623046875, 1.0849609375, 1.28369140625, 1.482421875, 1.68115234375, 1.8798828125, 2.07861328125, 2.27734375, 2.47607421875, 2.6748046875, 2.87353515625, 3.072265625, 3.27099609375, 3.4697265625, 3.66845703125, 3.8671875, 4.06591796875, 4.2646484375, 4.46337890625, 4.662109375, 4.86083984375, 5.0595703125, 5.25830078125, 5.45703125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 14.0, 10.0, 18.0, 28.0, 46.0, 58.0, 77.0, 111.0, 240.0, 535.0, 1477.0, 5669.0, 28172.0, 300458.0, 3679577.0, 152474.0, 18986.0, 4114.0, 1189.0, 455.0, 175.0, 121.0, 83.0, 58.0, 35.0, 26.0, 27.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -10.9859619140625, -10.635986328125, -10.2860107421875, -9.93603515625, -9.5860595703125, -9.236083984375, -8.8861083984375, -8.5361328125, -8.1861572265625, -7.836181640625, -7.4862060546875, -7.13623046875, -6.7862548828125, -6.436279296875, -6.0863037109375, -5.736328125, -5.3863525390625, -5.036376953125, -4.6864013671875, -4.33642578125, -3.9864501953125, -3.636474609375, -3.2864990234375, -2.9365234375, -2.5865478515625, -2.236572265625, -1.8865966796875, -1.53662109375, -1.1866455078125, -0.836669921875, -0.4866943359375, -0.13671875, 0.2132568359375, 0.563232421875, 0.9132080078125, 1.26318359375, 1.6131591796875, 1.963134765625, 2.3131103515625, 2.6630859375, 3.0130615234375, 3.363037109375, 3.7130126953125, 4.06298828125, 4.4129638671875, 4.762939453125, 5.1129150390625, 5.462890625, 5.8128662109375, 6.162841796875, 6.5128173828125, 6.86279296875, 7.2127685546875, 7.562744140625, 7.9127197265625, 8.2626953125, 8.6126708984375, 8.962646484375, 9.3126220703125, 9.66259765625, 10.0125732421875, 10.362548828125, 10.7125244140625, 11.0625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 8.0, 18.0, 52.0, 180.0, 291.0, 252.0, 128.0, 48.0, 23.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.790937423706055, -26.39804458618164, -25.005151748657227, -23.612258911132812, -22.219364166259766, -20.826473236083984, -19.433578491210938, -18.040685653686523, -16.64779281616211, -15.254899978637695, -13.862007141113281, -12.46911334991455, -11.076220512390137, -9.683327674865723, -8.290433883666992, -6.897541046142578, -5.504648208618164, -4.11175537109375, -2.7188620567321777, -1.3259687423706055, 0.0669240951538086, 1.4598169326782227, 2.852710723876953, 4.245603561401367, 5.638496398925781, 7.031389236450195, 8.42428207397461, 9.81717586517334, 11.210068702697754, 12.602961540222168, 13.995855331420898, 15.388748168945312, 16.781639099121094, 18.174531936645508, 19.567424774169922, 20.96031951904297, 22.35321044921875, 23.746105194091797, 25.13899803161621, 26.531890869140625, 27.92478370666504, 29.317676544189453, 30.710569381713867, 32.10346221923828, 33.49635696411133, 34.88924789428711, 36.282142639160156, 37.67503356933594, 39.067928314208984, 40.46082305908203, 41.85371398925781, 43.24660873413086, 44.63949966430664, 46.03239440917969, 47.42528533935547, 48.818180084228516, 50.21107482910156, 51.60396957397461, 52.99686050415039, 54.38975524902344, 55.78264617919922, 57.175540924072266, 58.56843566894531, 59.961326599121094, 61.354217529296875]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 12.0, 4.0, 14.0, 10.0, 16.0, 14.0, 24.0, 17.0, 31.0, 23.0, 27.0, 23.0, 26.0, 41.0, 39.0, 39.0, 45.0, 40.0, 51.0, 48.0, 41.0, 44.0, 48.0, 31.0, 39.0, 32.0, 25.0, 30.0, 23.0, 29.0, 24.0, 17.0, 10.0, 17.0, 14.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.748716354370117, -9.43023681640625, -9.111756324768066, -8.7932767868042, -8.474796295166016, -8.156316757202148, -7.837836742401123, -7.519356727600098, -7.2008771896362305, -6.882397174835205, -6.56391716003418, -6.2454376220703125, -5.926957607269287, -5.608477592468262, -5.289997577667236, -4.971517562866211, -4.6530375480651855, -4.33455753326416, -4.016077518463135, -3.6975977420806885, -3.379117965698242, -3.060637950897217, -2.7421579360961914, -2.423678159713745, -2.1051981449127197, -1.7867182493209839, -1.468238353729248, -1.1497583389282227, -0.8312784433364868, -0.512798547744751, -0.19431853294372559, 0.1241612434387207, 0.4426412582397461, 0.7611211538314819, 1.0796010494232178, 1.3980810642242432, 1.716560959815979, 2.035040855407715, 2.3535208702087402, 2.6720006465911865, 2.990480661392212, 3.3089606761932373, 3.6274404525756836, 3.945920467376709, 4.264400482177734, 4.582880020141602, 4.901360511779785, 5.219840049743652, 5.538320064544678, 5.856800079345703, 6.1752800941467285, 6.493760108947754, 6.812239646911621, 7.1307196617126465, 7.449199676513672, 7.767679214477539, 8.086159706115723, 8.40463924407959, 8.723119735717773, 9.04159927368164, 9.360079765319824, 9.678559303283691, 9.997039794921875, 10.315519332885742, 10.63399887084961]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 2.0, 4.0, 6.0, 4.0, 15.0, 14.0, 8.0, 11.0, 16.0, 16.0, 11.0, 15.0, 17.0, 26.0, 21.0, 25.0, 26.0, 31.0, 41.0, 23.0, 42.0, 39.0, 41.0, 42.0, 43.0, 56.0, 39.0, 39.0, 38.0, 36.0, 33.0, 21.0, 19.0, 21.0, 28.0, 19.0, 24.0, 14.0, 12.0, 13.0, 7.0, 9.0, 10.0, 5.0, 9.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9825286865234375, -0.952362060546875, -0.9221954345703125, -0.89202880859375, -0.8618621826171875, -0.831695556640625, -0.8015289306640625, -0.7713623046875, -0.7411956787109375, -0.711029052734375, -0.6808624267578125, -0.65069580078125, -0.6205291748046875, -0.590362548828125, -0.5601959228515625, -0.530029296875, -0.4998626708984375, -0.469696044921875, -0.4395294189453125, -0.40936279296875, -0.3791961669921875, -0.349029541015625, -0.3188629150390625, -0.2886962890625, -0.2585296630859375, -0.228363037109375, -0.1981964111328125, -0.16802978515625, -0.1378631591796875, -0.107696533203125, -0.0775299072265625, -0.04736328125, -0.0171966552734375, 0.012969970703125, 0.0431365966796875, 0.07330322265625, 0.1034698486328125, 0.133636474609375, 0.1638031005859375, 0.1939697265625, 0.2241363525390625, 0.254302978515625, 0.2844696044921875, 0.31463623046875, 0.3448028564453125, 0.374969482421875, 0.4051361083984375, 0.435302734375, 0.4654693603515625, 0.495635986328125, 0.5258026123046875, 0.55596923828125, 0.5861358642578125, 0.616302490234375, 0.6464691162109375, 0.6766357421875, 0.7068023681640625, 0.736968994140625, 0.7671356201171875, 0.79730224609375, 0.8274688720703125, 0.857635498046875, 0.8878021240234375, 0.91796875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 16.0, 14.0, 21.0, 34.0, 63.0, 81.0, 124.0, 193.0, 306.0, 465.0, 640.0, 1102.0, 1717.0, 2681.0, 4323.0, 7105.0, 11372.0, 18143.0, 29084.0, 46267.0, 70594.0, 103092.0, 136321.0, 153326.0, 140579.0, 109728.0, 76212.0, 50125.0, 31931.0, 20074.0, 12266.0, 7691.0, 4796.0, 2864.0, 1878.0, 1185.0, 777.0, 460.0, 320.0, 211.0, 118.0, 96.0, 63.0, 27.0, 19.0, 13.0, 13.0, 5.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.966796875, -0.9361953735351562, -0.9055938720703125, -0.8749923706054688, -0.844390869140625, -0.8137893676757812, -0.7831878662109375, -0.7525863647460938, -0.72198486328125, -0.6913833618164062, -0.6607818603515625, -0.6301803588867188, -0.599578857421875, -0.5689773559570312, -0.5383758544921875, -0.5077743530273438, -0.4771728515625, -0.44657135009765625, -0.4159698486328125, -0.38536834716796875, -0.354766845703125, -0.32416534423828125, -0.2935638427734375, -0.26296234130859375, -0.23236083984375, -0.20175933837890625, -0.1711578369140625, -0.14055633544921875, -0.109954833984375, -0.07935333251953125, -0.0487518310546875, -0.01815032958984375, 0.012451171875, 0.04305267333984375, 0.0736541748046875, 0.10425567626953125, 0.134857177734375, 0.16545867919921875, 0.1960601806640625, 0.22666168212890625, 0.25726318359375, 0.28786468505859375, 0.3184661865234375, 0.34906768798828125, 0.379669189453125, 0.41027069091796875, 0.4408721923828125, 0.47147369384765625, 0.5020751953125, 0.5326766967773438, 0.5632781982421875, 0.5938796997070312, 0.624481201171875, 0.6550827026367188, 0.6856842041015625, 0.7162857055664062, 0.74688720703125, 0.7774887084960938, 0.8080902099609375, 0.8386917114257812, 0.869293212890625, 0.8998947143554688, 0.9304962158203125, 0.9610977172851562, 0.99169921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 7.0, 7.0, 7.0, 11.0, 13.0, 11.0, 15.0, 23.0, 28.0, 19.0, 26.0, 30.0, 40.0, 21.0, 43.0, 46.0, 36.0, 46.0, 45.0, 1064.0, 26.0, 46.0, 41.0, 35.0, 43.0, 35.0, 30.0, 20.0, 36.0, 27.0, 25.0, 17.0, 12.0, 16.0, 21.0, 8.0, 9.0, 12.0, 5.0, 4.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.376953125, -1.338043212890625, -1.29913330078125, -1.260223388671875, -1.2213134765625, -1.182403564453125, -1.14349365234375, -1.104583740234375, -1.065673828125, -1.026763916015625, -0.98785400390625, -0.948944091796875, -0.9100341796875, -0.871124267578125, -0.83221435546875, -0.793304443359375, -0.75439453125, -0.715484619140625, -0.67657470703125, -0.637664794921875, -0.5987548828125, -0.559844970703125, -0.52093505859375, -0.482025146484375, -0.443115234375, -0.404205322265625, -0.36529541015625, -0.326385498046875, -0.2874755859375, -0.248565673828125, -0.20965576171875, -0.170745849609375, -0.1318359375, -0.092926025390625, -0.05401611328125, -0.015106201171875, 0.0238037109375, 0.062713623046875, 0.10162353515625, 0.140533447265625, 0.179443359375, 0.218353271484375, 0.25726318359375, 0.296173095703125, 0.3350830078125, 0.373992919921875, 0.41290283203125, 0.451812744140625, 0.49072265625, 0.529632568359375, 0.56854248046875, 0.607452392578125, 0.6463623046875, 0.685272216796875, 0.72418212890625, 0.763092041015625, 0.802001953125, 0.840911865234375, 0.87982177734375, 0.918731689453125, 0.9576416015625, 0.996551513671875, 1.03546142578125, 1.074371337890625, 1.11328125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 12.0, 14.0, 18.0, 21.0, 31.0, 41.0, 55.0, 74.0, 106.0, 170.0, 229.0, 311.0, 422.0, 637.0, 932.0, 1394.0, 2276.0, 3701.0, 5986.0, 10286.0, 18443.0, 35803.0, 90865.0, 1493145.0, 313906.0, 55925.0, 26445.0, 14400.0, 8128.0, 4764.0, 2895.0, 1873.0, 1213.0, 753.0, 531.0, 373.0, 270.0, 173.0, 137.0, 102.0, 75.0, 56.0, 39.0, 33.0, 23.0, 19.0, 13.0, 7.0, 3.0, 2.0, 2.0, 3.0], "bins": [-1.8955078125, -1.842529296875, -1.78955078125, -1.736572265625, -1.68359375, -1.630615234375, -1.57763671875, -1.524658203125, -1.4716796875, -1.418701171875, -1.36572265625, -1.312744140625, -1.259765625, -1.206787109375, -1.15380859375, -1.100830078125, -1.0478515625, -0.994873046875, -0.94189453125, -0.888916015625, -0.8359375, -0.782958984375, -0.72998046875, -0.677001953125, -0.6240234375, -0.571044921875, -0.51806640625, -0.465087890625, -0.412109375, -0.359130859375, -0.30615234375, -0.253173828125, -0.2001953125, -0.147216796875, -0.09423828125, -0.041259765625, 0.01171875, 0.064697265625, 0.11767578125, 0.170654296875, 0.2236328125, 0.276611328125, 0.32958984375, 0.382568359375, 0.435546875, 0.488525390625, 0.54150390625, 0.594482421875, 0.6474609375, 0.700439453125, 0.75341796875, 0.806396484375, 0.859375, 0.912353515625, 0.96533203125, 1.018310546875, 1.0712890625, 1.124267578125, 1.17724609375, 1.230224609375, 1.283203125, 1.336181640625, 1.38916015625, 1.442138671875, 1.4951171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 3.0, 7.0, 6.0, 5.0, 4.0, 6.0, 13.0, 12.0, 10.0, 26.0, 25.0, 31.0, 43.0, 40.0, 62.0, 81.0, 130.0, 106.0, 67.0, 57.0, 47.0, 40.0, 30.0, 24.0, 24.0, 17.0, 12.0, 16.0, 12.0, 6.0, 10.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47216796875, -0.45635986328125, -0.4405517578125, -0.42474365234375, -0.408935546875, -0.39312744140625, -0.3773193359375, -0.36151123046875, -0.345703125, -0.32989501953125, -0.3140869140625, -0.29827880859375, -0.282470703125, -0.26666259765625, -0.2508544921875, -0.23504638671875, -0.21923828125, -0.20343017578125, -0.1876220703125, -0.17181396484375, -0.156005859375, -0.14019775390625, -0.1243896484375, -0.10858154296875, -0.0927734375, -0.07696533203125, -0.0611572265625, -0.04534912109375, -0.029541015625, -0.01373291015625, 0.0020751953125, 0.01788330078125, 0.03369140625, 0.04949951171875, 0.0653076171875, 0.08111572265625, 0.096923828125, 0.11273193359375, 0.1285400390625, 0.14434814453125, 0.16015625, 0.17596435546875, 0.1917724609375, 0.20758056640625, 0.223388671875, 0.23919677734375, 0.2550048828125, 0.27081298828125, 0.28662109375, 0.30242919921875, 0.3182373046875, 0.33404541015625, 0.349853515625, 0.36566162109375, 0.3814697265625, 0.39727783203125, 0.4130859375, 0.42889404296875, 0.4447021484375, 0.46051025390625, 0.476318359375, 0.49212646484375, 0.5079345703125, 0.52374267578125, 0.53955078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 14.0, 11.0, 16.0, 19.0, 24.0, 33.0, 38.0, 41.0, 51.0, 72.0, 89.0, 144.0, 267.0, 724.0, 4328.0, 44440.0, 883217.0, 104907.0, 7940.0, 1148.0, 331.0, 191.0, 105.0, 98.0, 55.0, 56.0, 39.0, 31.0, 26.0, 21.0, 15.0, 23.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.92578125, -6.71990966796875, -6.5140380859375, -6.30816650390625, -6.102294921875, -5.89642333984375, -5.6905517578125, -5.48468017578125, -5.27880859375, -5.07293701171875, -4.8670654296875, -4.66119384765625, -4.455322265625, -4.24945068359375, -4.0435791015625, -3.83770751953125, -3.6318359375, -3.42596435546875, -3.2200927734375, -3.01422119140625, -2.808349609375, -2.60247802734375, -2.3966064453125, -2.19073486328125, -1.98486328125, -1.77899169921875, -1.5731201171875, -1.36724853515625, -1.161376953125, -0.95550537109375, -0.7496337890625, -0.54376220703125, -0.337890625, -0.13201904296875, 0.0738525390625, 0.27972412109375, 0.485595703125, 0.69146728515625, 0.8973388671875, 1.10321044921875, 1.30908203125, 1.51495361328125, 1.7208251953125, 1.92669677734375, 2.132568359375, 2.33843994140625, 2.5443115234375, 2.75018310546875, 2.9560546875, 3.16192626953125, 3.3677978515625, 3.57366943359375, 3.779541015625, 3.98541259765625, 4.1912841796875, 4.39715576171875, 4.60302734375, 4.80889892578125, 5.0147705078125, 5.22064208984375, 5.426513671875, 5.63238525390625, 5.8382568359375, 6.04412841796875, 6.25]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 31.0, 292.0, 622.0, 54.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.248943328857422, -21.431180953979492, -20.613420486450195, -19.795658111572266, -18.977895736694336, -18.160133361816406, -17.34237289428711, -16.52461051940918, -15.706849098205566, -14.889087677001953, -14.071325302124023, -13.25356388092041, -12.435802459716797, -11.618040084838867, -10.800278663635254, -9.98251724243164, -9.164754867553711, -8.346993446350098, -7.529231071472168, -6.711469650268555, -5.893707752227783, -5.075945854187012, -4.258184432983398, -3.440422534942627, -2.6226606369018555, -1.8048988580703735, -0.9871370792388916, -0.16937541961669922, 0.6483864784240723, 1.4661483764648438, 2.283909797668457, 3.1016716957092285, 3.919431686401367, 4.737193584442139, 5.55495548248291, 6.372716903686523, 7.190478801727295, 8.008240699768066, 8.82600212097168, 9.64376449584961, 10.461525917053223, 11.279287338256836, 12.097049713134766, 12.914811134338379, 13.732572555541992, 14.550334930419922, 15.368096351623535, 16.18585777282715, 17.003620147705078, 17.821382522583008, 18.639142990112305, 19.456905364990234, 20.274667739868164, 21.092430114746094, 21.91019058227539, 22.72795295715332, 23.54571533203125, 24.36347770690918, 25.181238174438477, 25.999000549316406, 26.816762924194336, 27.634525299072266, 28.452285766601562, 29.270048141479492, 30.08780860900879]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 9.0, 13.0, 16.0, 21.0, 23.0, 17.0, 31.0, 40.0, 40.0, 43.0, 37.0, 50.0, 53.0, 58.0, 59.0, 54.0, 61.0, 57.0, 41.0, 46.0, 36.0, 19.0, 25.0, 31.0, 27.0, 18.0, 20.0, 9.0, 12.0, 7.0, 9.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.67937970161438, -3.5866241455078125, -3.493868827819824, -3.401113510131836, -3.3083579540252686, -3.215602397918701, -3.122847080230713, -3.0300917625427246, -2.9373362064361572, -2.84458065032959, -2.7518253326416016, -2.6590700149536133, -2.566314458847046, -2.4735589027404785, -2.3808035850524902, -2.288048267364502, -2.1952927112579346, -2.102537155151367, -2.009781837463379, -1.917026400566101, -1.8242709636688232, -1.7315155267715454, -1.6387600898742676, -1.5460046529769897, -1.453249216079712, -1.360493779182434, -1.2677383422851562, -1.1749829053878784, -1.0822274684906006, -0.9894720315933228, -0.8967165946960449, -0.8039611577987671, -0.7112054824829102, -0.6184500455856323, -0.5256946086883545, -0.43293917179107666, -0.34018373489379883, -0.247428297996521, -0.15467286109924316, -0.06191742420196533, 0.0308380126953125, 0.12359344959259033, 0.21634888648986816, 0.309104323387146, 0.40185976028442383, 0.49461519718170166, 0.5873706340789795, 0.6801260709762573, 0.7728815078735352, 0.865636944770813, 0.9583923816680908, 1.0511478185653687, 1.1439032554626465, 1.2366586923599243, 1.3294141292572021, 1.42216956615448, 1.5149250030517578, 1.6076804399490356, 1.7004358768463135, 1.7931913137435913, 1.8859467506408691, 1.978702187538147, 2.071457624435425, 2.164213180541992, 2.2569684982299805]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 4.0, 13.0, 1.0, 7.0, 10.0, 8.0, 16.0, 18.0, 15.0, 9.0, 20.0, 28.0, 15.0, 17.0, 28.0, 33.0, 30.0, 30.0, 31.0, 44.0, 23.0, 40.0, 31.0, 43.0, 41.0, 54.0, 39.0, 50.0, 32.0, 29.0, 32.0, 25.0, 24.0, 19.0, 23.0, 14.0, 18.0, 16.0, 8.0, 12.0, 6.0, 8.0, 8.0, 13.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0224609375, -0.9921493530273438, -0.9618377685546875, -0.9315261840820312, -0.901214599609375, -0.8709030151367188, -0.8405914306640625, -0.8102798461914062, -0.77996826171875, -0.7496566772460938, -0.7193450927734375, -0.6890335083007812, -0.658721923828125, -0.6284103393554688, -0.5980987548828125, -0.5677871704101562, -0.5374755859375, -0.5071640014648438, -0.4768524169921875, -0.44654083251953125, -0.416229248046875, -0.38591766357421875, -0.3556060791015625, -0.32529449462890625, -0.29498291015625, -0.26467132568359375, -0.2343597412109375, -0.20404815673828125, -0.173736572265625, -0.14342498779296875, -0.1131134033203125, -0.08280181884765625, -0.052490234375, -0.02217864990234375, 0.0081329345703125, 0.03844451904296875, 0.068756103515625, 0.09906768798828125, 0.1293792724609375, 0.15969085693359375, 0.19000244140625, 0.22031402587890625, 0.2506256103515625, 0.28093719482421875, 0.311248779296875, 0.34156036376953125, 0.3718719482421875, 0.40218353271484375, 0.4324951171875, 0.46280670166015625, 0.4931182861328125, 0.5234298706054688, 0.553741455078125, 0.5840530395507812, 0.6143646240234375, 0.6446762084960938, 0.67498779296875, 0.7052993774414062, 0.7356109619140625, 0.7659225463867188, 0.796234130859375, 0.8265457153320312, 0.8568572998046875, 0.8871688842773438, 0.91748046875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 15.0, 15.0, 20.0, 20.0, 37.0, 44.0, 45.0, 52.0, 76.0, 111.0, 163.0, 215.0, 289.0, 435.0, 548.0, 747.0, 1105.0, 1567.0, 2395.0, 3704.0, 6017.0, 11394.0, 26240.0, 110227.0, 730959.0, 98590.0, 24986.0, 11272.0, 5962.0, 3563.0, 2316.0, 1547.0, 1029.0, 764.0, 546.0, 433.0, 280.0, 205.0, 154.0, 115.0, 74.0, 56.0, 51.0, 42.0, 31.0, 18.0, 19.0, 17.0, 11.0, 9.0, 9.0, 4.0, 0.0, 4.0, 2.0, 1.0], "bins": [-3.73828125, -3.6231689453125, -3.508056640625, -3.3929443359375, -3.27783203125, -3.1627197265625, -3.047607421875, -2.9324951171875, -2.8173828125, -2.7022705078125, -2.587158203125, -2.4720458984375, -2.35693359375, -2.2418212890625, -2.126708984375, -2.0115966796875, -1.896484375, -1.7813720703125, -1.666259765625, -1.5511474609375, -1.43603515625, -1.3209228515625, -1.205810546875, -1.0906982421875, -0.9755859375, -0.8604736328125, -0.745361328125, -0.6302490234375, -0.51513671875, -0.4000244140625, -0.284912109375, -0.1697998046875, -0.0546875, 0.0604248046875, 0.175537109375, 0.2906494140625, 0.40576171875, 0.5208740234375, 0.635986328125, 0.7510986328125, 0.8662109375, 0.9813232421875, 1.096435546875, 1.2115478515625, 1.32666015625, 1.4417724609375, 1.556884765625, 1.6719970703125, 1.787109375, 1.9022216796875, 2.017333984375, 2.1324462890625, 2.24755859375, 2.3626708984375, 2.477783203125, 2.5928955078125, 2.7080078125, 2.8231201171875, 2.938232421875, 3.0533447265625, 3.16845703125, 3.2835693359375, 3.398681640625, 3.5137939453125, 3.62890625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 2.0, 4.0, 4.0, 4.0, 14.0, 12.0, 11.0, 18.0, 19.0, 22.0, 23.0, 22.0, 27.0, 28.0, 22.0, 39.0, 39.0, 53.0, 68.0, 66.0, 108.0, 216.0, 1386.0, 231.0, 137.0, 75.0, 56.0, 49.0, 41.0, 34.0, 36.0, 26.0, 20.0, 23.0, 21.0, 12.0, 15.0, 10.0, 9.0, 8.0, 12.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6484375, -3.53973388671875, -3.4310302734375, -3.32232666015625, -3.213623046875, -3.10491943359375, -2.9962158203125, -2.88751220703125, -2.77880859375, -2.67010498046875, -2.5614013671875, -2.45269775390625, -2.343994140625, -2.23529052734375, -2.1265869140625, -2.01788330078125, -1.9091796875, -1.80047607421875, -1.6917724609375, -1.58306884765625, -1.474365234375, -1.36566162109375, -1.2569580078125, -1.14825439453125, -1.03955078125, -0.93084716796875, -0.8221435546875, -0.71343994140625, -0.604736328125, -0.49603271484375, -0.3873291015625, -0.27862548828125, -0.169921875, -0.06121826171875, 0.0474853515625, 0.15618896484375, 0.264892578125, 0.37359619140625, 0.4822998046875, 0.59100341796875, 0.69970703125, 0.80841064453125, 0.9171142578125, 1.02581787109375, 1.134521484375, 1.24322509765625, 1.3519287109375, 1.46063232421875, 1.5693359375, 1.67803955078125, 1.7867431640625, 1.89544677734375, 2.004150390625, 2.11285400390625, 2.2215576171875, 2.33026123046875, 2.43896484375, 2.54766845703125, 2.6563720703125, 2.76507568359375, 2.873779296875, 2.98248291015625, 3.0911865234375, 3.19989013671875, 3.30859375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 7.0, 11.0, 18.0, 33.0, 25.0, 42.0, 74.0, 110.0, 148.0, 225.0, 409.0, 712.0, 1293.0, 2400.0, 4623.0, 10012.0, 25507.0, 99297.0, 1846564.0, 1038038.0, 76303.0, 21841.0, 8767.0, 4135.0, 2169.0, 1151.0, 669.0, 381.0, 252.0, 154.0, 118.0, 57.0, 53.0, 31.0, 16.0, 20.0, 11.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.5709228515625, -4.423095703125, -4.2752685546875, -4.12744140625, -3.9796142578125, -3.831787109375, -3.6839599609375, -3.5361328125, -3.3883056640625, -3.240478515625, -3.0926513671875, -2.94482421875, -2.7969970703125, -2.649169921875, -2.5013427734375, -2.353515625, -2.2056884765625, -2.057861328125, -1.9100341796875, -1.76220703125, -1.6143798828125, -1.466552734375, -1.3187255859375, -1.1708984375, -1.0230712890625, -0.875244140625, -0.7274169921875, -0.57958984375, -0.4317626953125, -0.283935546875, -0.1361083984375, 0.01171875, 0.1595458984375, 0.307373046875, 0.4552001953125, 0.60302734375, 0.7508544921875, 0.898681640625, 1.0465087890625, 1.1943359375, 1.3421630859375, 1.489990234375, 1.6378173828125, 1.78564453125, 1.9334716796875, 2.081298828125, 2.2291259765625, 2.376953125, 2.5247802734375, 2.672607421875, 2.8204345703125, 2.96826171875, 3.1160888671875, 3.263916015625, 3.4117431640625, 3.5595703125, 3.7073974609375, 3.855224609375, 4.0030517578125, 4.15087890625, 4.2987060546875, 4.446533203125, 4.5943603515625, 4.7421875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 34.0, 123.0, 350.0, 358.0, 108.0, 22.0, 10.0, 3.0, 2.0], "bins": [-72.24443817138672, -70.99794006347656, -69.7514419555664, -68.50494384765625, -67.25843811035156, -66.0119400024414, -64.76544189453125, -63.518943786621094, -62.27244567871094, -61.02594757080078, -59.779449462890625, -58.5329475402832, -57.28644943237305, -56.03995132446289, -54.79344940185547, -53.54695129394531, -52.300453186035156, -51.053955078125, -49.807456970214844, -48.56095504760742, -47.314456939697266, -46.06795883178711, -44.82145690917969, -43.57495880126953, -42.328460693359375, -41.08196258544922, -39.83546447753906, -38.58896255493164, -37.342464447021484, -36.09596633911133, -34.849464416503906, -33.60296630859375, -32.356468200683594, -31.109970092773438, -29.86347007751465, -28.61697006225586, -27.370471954345703, -26.123973846435547, -24.877473831176758, -23.63097381591797, -22.38447380065918, -21.13797378540039, -19.891475677490234, -18.644977569580078, -17.39847755432129, -16.1519775390625, -14.905479431152344, -13.658980369567871, -12.412481307983398, -11.165982246398926, -9.919483184814453, -8.67298412322998, -7.426485061645508, -6.179986000061035, -4.9334869384765625, -3.68698787689209, -2.4404892921447754, -1.1939902305603027, 0.05250883102416992, 1.2990078926086426, 2.5455069541931152, 3.792006015777588, 5.0385050773620605, 6.285004138946533, 7.531503200531006]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 1.0, 7.0, 6.0, 17.0, 9.0, 9.0, 12.0, 19.0, 15.0, 20.0, 22.0, 25.0, 17.0, 34.0, 32.0, 35.0, 42.0, 45.0, 41.0, 33.0, 40.0, 42.0, 44.0, 40.0, 39.0, 43.0, 41.0, 39.0, 33.0, 33.0, 20.0, 24.0, 24.0, 19.0, 19.0, 13.0, 10.0, 4.0, 8.0, 4.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.02138614654541, -11.629741668701172, -11.238097190856934, -10.846452713012695, -10.45480728149414, -10.063162803649902, -9.671518325805664, -9.279873847961426, -8.888229370117188, -8.49658489227295, -8.104940414428711, -7.7132954597473145, -7.321650981903076, -6.930006504058838, -6.538361549377441, -6.146717071533203, -5.755072593688965, -5.363428115844727, -4.971783638000488, -4.580138683319092, -4.1884942054748535, -3.7968497276306152, -3.405205011367798, -3.0135602951049805, -2.621915817260742, -2.230271339416504, -1.8386266231536865, -1.4469820261001587, -1.0553374290466309, -0.663692831993103, -0.2720482349395752, 0.11959648132324219, 0.5112400054931641, 0.9028846025466919, 1.2945291996002197, 1.6861737966537476, 2.0778183937072754, 2.4694628715515137, 2.861107587814331, 3.2527523040771484, 3.6443967819213867, 4.036041259765625, 4.427685737609863, 4.81933069229126, 5.210975170135498, 5.602619647979736, 5.994264602661133, 6.385909080505371, 6.777553558349609, 7.169198036193848, 7.560842514038086, 7.952487468719482, 8.344131469726562, 8.735776901245117, 9.127421379089355, 9.519065856933594, 9.910710334777832, 10.30235481262207, 10.693999290466309, 11.085643768310547, 11.477289199829102, 11.86893367767334, 12.260578155517578, 12.652222633361816, 13.043867111206055]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 2.0, 3.0, 6.0, 11.0, 10.0, 9.0, 17.0, 15.0, 15.0, 19.0, 17.0, 15.0, 27.0, 19.0, 18.0, 27.0, 25.0, 29.0, 33.0, 33.0, 35.0, 38.0, 35.0, 44.0, 37.0, 26.0, 34.0, 44.0, 32.0, 37.0, 32.0, 26.0, 28.0, 23.0, 20.0, 24.0, 19.0, 23.0, 12.0, 11.0, 10.0, 9.0, 9.0, 5.0, 8.0, 9.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9708404541015625, -0.940704345703125, -0.9105682373046875, -0.88043212890625, -0.8502960205078125, -0.820159912109375, -0.7900238037109375, -0.7598876953125, -0.7297515869140625, -0.699615478515625, -0.6694793701171875, -0.63934326171875, -0.6092071533203125, -0.579071044921875, -0.5489349365234375, -0.518798828125, -0.4886627197265625, -0.458526611328125, -0.4283905029296875, -0.39825439453125, -0.3681182861328125, -0.337982177734375, -0.3078460693359375, -0.2777099609375, -0.2475738525390625, -0.217437744140625, -0.1873016357421875, -0.15716552734375, -0.1270294189453125, -0.096893310546875, -0.0667572021484375, -0.03662109375, -0.0064849853515625, 0.023651123046875, 0.0537872314453125, 0.08392333984375, 0.1140594482421875, 0.144195556640625, 0.1743316650390625, 0.2044677734375, 0.2346038818359375, 0.264739990234375, 0.2948760986328125, 0.32501220703125, 0.3551483154296875, 0.385284423828125, 0.4154205322265625, 0.445556640625, 0.4756927490234375, 0.505828857421875, 0.5359649658203125, 0.56610107421875, 0.5962371826171875, 0.626373291015625, 0.6565093994140625, 0.6866455078125, 0.7167816162109375, 0.746917724609375, 0.7770538330078125, 0.80718994140625, 0.8373260498046875, 0.867462158203125, 0.8975982666015625, 0.927734375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 8.0, 14.0, 15.0, 20.0, 38.0, 35.0, 69.0, 86.0, 139.0, 196.0, 265.0, 372.0, 595.0, 816.0, 1263.0, 1889.0, 2741.0, 4199.0, 6800.0, 11255.0, 20484.0, 42756.0, 121439.0, 733040.0, 2543229.0, 520695.0, 98092.0, 37246.0, 18411.0, 10267.0, 6158.0, 3770.0, 2519.0, 1704.0, 1070.0, 755.0, 549.0, 379.0, 232.0, 207.0, 146.0, 93.0, 65.0, 48.0, 34.0, 16.0, 11.0, 21.0, 12.0, 7.0, 1.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.157135009765625, -2.08380126953125, -2.010467529296875, -1.9371337890625, -1.863800048828125, -1.79046630859375, -1.717132568359375, -1.643798828125, -1.570465087890625, -1.49713134765625, -1.423797607421875, -1.3504638671875, -1.277130126953125, -1.20379638671875, -1.130462646484375, -1.05712890625, -0.983795166015625, -0.91046142578125, -0.837127685546875, -0.7637939453125, -0.690460205078125, -0.61712646484375, -0.543792724609375, -0.470458984375, -0.397125244140625, -0.32379150390625, -0.250457763671875, -0.1771240234375, -0.103790283203125, -0.03045654296875, 0.042877197265625, 0.1162109375, 0.189544677734375, 0.26287841796875, 0.336212158203125, 0.4095458984375, 0.482879638671875, 0.55621337890625, 0.629547119140625, 0.702880859375, 0.776214599609375, 0.84954833984375, 0.922882080078125, 0.9962158203125, 1.069549560546875, 1.14288330078125, 1.216217041015625, 1.28955078125, 1.362884521484375, 1.43621826171875, 1.509552001953125, 1.5828857421875, 1.656219482421875, 1.72955322265625, 1.802886962890625, 1.876220703125, 1.949554443359375, 2.02288818359375, 2.096221923828125, 2.1695556640625, 2.242889404296875, 2.31622314453125, 2.389556884765625, 2.462890625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 5.0, 5.0, 8.0, 12.0, 17.0, 29.0, 28.0, 38.0, 48.0, 73.0, 111.0, 210.0, 328.0, 708.0, 886.0, 626.0, 359.0, 180.0, 145.0, 64.0, 40.0, 37.0, 37.0, 18.0, 11.0, 7.0, 8.0, 11.0, 9.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.828125, -3.709991455078125, -3.59185791015625, -3.473724365234375, -3.3555908203125, -3.237457275390625, -3.11932373046875, -3.001190185546875, -2.883056640625, -2.764923095703125, -2.64678955078125, -2.528656005859375, -2.4105224609375, -2.292388916015625, -2.17425537109375, -2.056121826171875, -1.93798828125, -1.819854736328125, -1.70172119140625, -1.583587646484375, -1.4654541015625, -1.347320556640625, -1.22918701171875, -1.111053466796875, -0.992919921875, -0.874786376953125, -0.75665283203125, -0.638519287109375, -0.5203857421875, -0.402252197265625, -0.28411865234375, -0.165985107421875, -0.0478515625, 0.070281982421875, 0.18841552734375, 0.306549072265625, 0.4246826171875, 0.542816162109375, 0.66094970703125, 0.779083251953125, 0.897216796875, 1.015350341796875, 1.13348388671875, 1.251617431640625, 1.3697509765625, 1.487884521484375, 1.60601806640625, 1.724151611328125, 1.84228515625, 1.960418701171875, 2.07855224609375, 2.196685791015625, 2.3148193359375, 2.432952880859375, 2.55108642578125, 2.669219970703125, 2.787353515625, 2.905487060546875, 3.02362060546875, 3.141754150390625, 3.2598876953125, 3.378021240234375, 3.49615478515625, 3.614288330078125, 3.732421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 2.0, 5.0, 10.0, 11.0, 17.0, 18.0, 25.0, 33.0, 49.0, 55.0, 86.0, 123.0, 175.0, 282.0, 371.0, 640.0, 1074.0, 1851.0, 3578.0, 7134.0, 15054.0, 34008.0, 89453.0, 371077.0, 2656998.0, 789236.0, 137141.0, 46209.0, 19787.0, 9347.0, 4492.0, 2371.0, 1348.0, 796.0, 470.0, 309.0, 208.0, 126.0, 83.0, 62.0, 56.0, 32.0, 14.0, 19.0, 12.0, 11.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.34765625, -4.2059326171875, -4.064208984375, -3.9224853515625, -3.78076171875, -3.6390380859375, -3.497314453125, -3.3555908203125, -3.2138671875, -3.0721435546875, -2.930419921875, -2.7886962890625, -2.64697265625, -2.5052490234375, -2.363525390625, -2.2218017578125, -2.080078125, -1.9383544921875, -1.796630859375, -1.6549072265625, -1.51318359375, -1.3714599609375, -1.229736328125, -1.0880126953125, -0.9462890625, -0.8045654296875, -0.662841796875, -0.5211181640625, -0.37939453125, -0.2376708984375, -0.095947265625, 0.0457763671875, 0.1875, 0.3292236328125, 0.470947265625, 0.6126708984375, 0.75439453125, 0.8961181640625, 1.037841796875, 1.1795654296875, 1.3212890625, 1.4630126953125, 1.604736328125, 1.7464599609375, 1.88818359375, 2.0299072265625, 2.171630859375, 2.3133544921875, 2.455078125, 2.5968017578125, 2.738525390625, 2.8802490234375, 3.02197265625, 3.1636962890625, 3.305419921875, 3.4471435546875, 3.5888671875, 3.7305908203125, 3.872314453125, 4.0140380859375, 4.15576171875, 4.2974853515625, 4.439208984375, 4.5809326171875, 4.72265625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 12.0, 9.0, 22.0, 54.0, 80.0, 140.0, 206.0, 193.0, 129.0, 81.0, 46.0, 22.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-51.85649108886719, -50.85857009887695, -49.86064529418945, -48.86272430419922, -47.864803314208984, -46.866878509521484, -45.86895751953125, -44.871036529541016, -43.873111724853516, -42.87519073486328, -41.87726593017578, -40.87934494018555, -39.88142395019531, -38.88349914550781, -37.88557815551758, -36.887657165527344, -35.88973617553711, -34.891815185546875, -33.893890380859375, -32.89596939086914, -31.898046493530273, -30.90012550354004, -29.902202606201172, -28.904281616210938, -27.906356811523438, -26.90843391418457, -25.910512924194336, -24.91259002685547, -23.9146671295166, -22.916746139526367, -21.9188232421875, -20.920902252197266, -19.922977447509766, -18.9250545501709, -17.927133560180664, -16.929210662841797, -15.931288719177246, -14.933366775512695, -13.935443878173828, -12.937521934509277, -11.939599990844727, -10.941678047180176, -9.943755149841309, -8.945833206176758, -7.947911262512207, -6.949988842010498, -5.952066421508789, -4.954144477844238, -3.9562225341796875, -2.9583003520965576, -1.9603780508041382, -0.9624557495117188, 0.03546643257141113, 1.033388614654541, 2.03131103515625, 3.029232978820801, 4.02715539932251, 5.025077819824219, 6.0229997634887695, 7.0209221839904785, 8.018844604492188, 9.016766548156738, 10.014688491821289, 11.012611389160156, 12.010533332824707]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 16.0, 14.0, 13.0, 19.0, 17.0, 25.0, 29.0, 19.0, 38.0, 21.0, 25.0, 32.0, 40.0, 36.0, 39.0, 49.0, 42.0, 36.0, 52.0, 38.0, 41.0, 42.0, 31.0, 40.0, 34.0, 19.0, 24.0, 12.0, 31.0, 27.0, 15.0, 11.0, 19.0, 9.0, 7.0, 6.0, 2.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.947196960449219, -9.633197784423828, -9.319198608398438, -9.00519847869873, -8.69119930267334, -8.37720012664795, -8.063200950622559, -7.749201774597168, -7.435202121734619, -7.1212029457092285, -6.80720329284668, -6.493204116821289, -6.179204940795898, -5.86520528793335, -5.551206111907959, -5.23720645904541, -4.9232072830200195, -4.609208106994629, -4.29520845413208, -3.9812092781066895, -3.6672098636627197, -3.35321044921875, -3.0392112731933594, -2.7252118587493896, -2.41121244430542, -2.09721302986145, -1.78321373462677, -1.4692144393920898, -1.1552150249481201, -0.8412156105041504, -0.5272163152694702, -0.21321702003479004, 0.10078239440917969, 0.41478174924850464, 0.7287811040878296, 1.0427803993225098, 1.3567798137664795, 1.6707792282104492, 1.9847785234451294, 2.2987778186798096, 2.6127772331237793, 2.926776647567749, 3.2407760620117188, 3.5547752380371094, 3.868774652481079, 4.182774066925049, 4.4967732429504395, 4.810772895812988, 5.124772071838379, 5.4387712478637695, 5.752770900726318, 6.066770076751709, 6.380769729614258, 6.694768905639648, 7.008768081665039, 7.32276725769043, 7.6367669105529785, 7.950766086578369, 8.264765739440918, 8.578764915466309, 8.8927640914917, 9.206764221191406, 9.520763397216797, 9.834762573242188, 10.148761749267578]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 13.0, 12.0, 5.0, 11.0, 9.0, 17.0, 13.0, 18.0, 23.0, 10.0, 26.0, 22.0, 30.0, 21.0, 14.0, 23.0, 36.0, 37.0, 33.0, 25.0, 39.0, 42.0, 34.0, 34.0, 46.0, 38.0, 36.0, 25.0, 38.0, 31.0, 32.0, 21.0, 17.0, 24.0, 26.0, 13.0, 13.0, 18.0, 12.0, 10.0, 9.0, 8.0, 3.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.017578125, -0.9871063232421875, -0.956634521484375, -0.9261627197265625, -0.89569091796875, -0.8652191162109375, -0.834747314453125, -0.8042755126953125, -0.7738037109375, -0.7433319091796875, -0.712860107421875, -0.6823883056640625, -0.65191650390625, -0.6214447021484375, -0.590972900390625, -0.5605010986328125, -0.530029296875, -0.4995574951171875, -0.469085693359375, -0.4386138916015625, -0.40814208984375, -0.3776702880859375, -0.347198486328125, -0.3167266845703125, -0.2862548828125, -0.2557830810546875, -0.225311279296875, -0.1948394775390625, -0.16436767578125, -0.1338958740234375, -0.103424072265625, -0.0729522705078125, -0.04248046875, -0.0120086669921875, 0.018463134765625, 0.0489349365234375, 0.07940673828125, 0.1098785400390625, 0.140350341796875, 0.1708221435546875, 0.2012939453125, 0.2317657470703125, 0.262237548828125, 0.2927093505859375, 0.32318115234375, 0.3536529541015625, 0.384124755859375, 0.4145965576171875, 0.445068359375, 0.4755401611328125, 0.506011962890625, 0.5364837646484375, 0.56695556640625, 0.5974273681640625, 0.627899169921875, 0.6583709716796875, 0.6888427734375, 0.7193145751953125, 0.749786376953125, 0.7802581787109375, 0.81072998046875, 0.8412017822265625, 0.871673583984375, 0.9021453857421875, 0.9326171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 19.0, 22.0, 42.0, 55.0, 83.0, 152.0, 205.0, 347.0, 544.0, 752.0, 1322.0, 2062.0, 3334.0, 5254.0, 8839.0, 13935.0, 22381.0, 36261.0, 57583.0, 87170.0, 123307.0, 153072.0, 154973.0, 125801.0, 90336.0, 60313.0, 37905.0, 23699.0, 14856.0, 9147.0, 5591.0, 3376.0, 2054.0, 1419.0, 834.0, 545.0, 337.0, 208.0, 147.0, 95.0, 51.0, 42.0, 23.0, 16.0, 16.0, 7.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.09375, -1.0606536865234375, -1.027557373046875, -0.9944610595703125, -0.96136474609375, -0.9282684326171875, -0.895172119140625, -0.8620758056640625, -0.8289794921875, -0.7958831787109375, -0.762786865234375, -0.7296905517578125, -0.69659423828125, -0.6634979248046875, -0.630401611328125, -0.5973052978515625, -0.564208984375, -0.5311126708984375, -0.498016357421875, -0.4649200439453125, -0.43182373046875, -0.3987274169921875, -0.365631103515625, -0.3325347900390625, -0.2994384765625, -0.2663421630859375, -0.233245849609375, -0.2001495361328125, -0.16705322265625, -0.1339569091796875, -0.100860595703125, -0.0677642822265625, -0.03466796875, -0.0015716552734375, 0.031524658203125, 0.0646209716796875, 0.09771728515625, 0.1308135986328125, 0.163909912109375, 0.1970062255859375, 0.2301025390625, 0.2631988525390625, 0.296295166015625, 0.3293914794921875, 0.36248779296875, 0.3955841064453125, 0.428680419921875, 0.4617767333984375, 0.494873046875, 0.5279693603515625, 0.561065673828125, 0.5941619873046875, 0.62725830078125, 0.6603546142578125, 0.693450927734375, 0.7265472412109375, 0.7596435546875, 0.7927398681640625, 0.825836181640625, 0.8589324951171875, 0.89202880859375, 0.9251251220703125, 0.958221435546875, 0.9913177490234375, 1.0244140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 10.0, 11.0, 8.0, 10.0, 13.0, 11.0, 20.0, 16.0, 20.0, 22.0, 23.0, 29.0, 37.0, 30.0, 45.0, 43.0, 29.0, 40.0, 47.0, 37.0, 1061.0, 45.0, 32.0, 39.0, 35.0, 40.0, 30.0, 30.0, 25.0, 21.0, 29.0, 27.0, 21.0, 11.0, 18.0, 7.0, 12.0, 11.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9259567260742188, -0.8904876708984375, -0.8550186157226562, -0.819549560546875, -0.7840805053710938, -0.7486114501953125, -0.7131423950195312, -0.67767333984375, -0.6422042846679688, -0.6067352294921875, -0.5712661743164062, -0.535797119140625, -0.5003280639648438, -0.4648590087890625, -0.42938995361328125, -0.3939208984375, -0.35845184326171875, -0.3229827880859375, -0.28751373291015625, -0.252044677734375, -0.21657562255859375, -0.1811065673828125, -0.14563751220703125, -0.11016845703125, -0.07469940185546875, -0.0392303466796875, -0.00376129150390625, 0.031707763671875, 0.06717681884765625, 0.1026458740234375, 0.13811492919921875, 0.173583984375, 0.20905303955078125, 0.2445220947265625, 0.27999114990234375, 0.315460205078125, 0.35092926025390625, 0.3863983154296875, 0.42186737060546875, 0.45733642578125, 0.49280548095703125, 0.5282745361328125, 0.5637435913085938, 0.599212646484375, 0.6346817016601562, 0.6701507568359375, 0.7056198120117188, 0.7410888671875, 0.7765579223632812, 0.8120269775390625, 0.8474960327148438, 0.882965087890625, 0.9184341430664062, 0.9539031982421875, 0.9893722534179688, 1.02484130859375, 1.0603103637695312, 1.0957794189453125, 1.1312484741210938, 1.166717529296875, 1.2021865844726562, 1.2376556396484375, 1.2731246948242188, 1.30859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 14.0, 16.0, 19.0, 28.0, 31.0, 49.0, 66.0, 106.0, 133.0, 231.0, 315.0, 486.0, 745.0, 1212.0, 2004.0, 3104.0, 5301.0, 9080.0, 15543.0, 29226.0, 64533.0, 820457.0, 1010356.0, 65734.0, 29464.0, 15888.0, 9130.0, 5262.0, 3150.0, 1907.0, 1208.0, 786.0, 483.0, 352.0, 225.0, 134.0, 102.0, 59.0, 64.0, 30.0, 17.0, 17.0, 18.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.37890625, -1.3313751220703125, -1.283843994140625, -1.2363128662109375, -1.18878173828125, -1.1412506103515625, -1.093719482421875, -1.0461883544921875, -0.9986572265625, -0.9511260986328125, -0.903594970703125, -0.8560638427734375, -0.80853271484375, -0.7610015869140625, -0.713470458984375, -0.6659393310546875, -0.618408203125, -0.5708770751953125, -0.523345947265625, -0.4758148193359375, -0.42828369140625, -0.3807525634765625, -0.333221435546875, -0.2856903076171875, -0.2381591796875, -0.1906280517578125, -0.143096923828125, -0.0955657958984375, -0.04803466796875, -0.0005035400390625, 0.047027587890625, 0.0945587158203125, 0.14208984375, 0.1896209716796875, 0.237152099609375, 0.2846832275390625, 0.33221435546875, 0.3797454833984375, 0.427276611328125, 0.4748077392578125, 0.5223388671875, 0.5698699951171875, 0.617401123046875, 0.6649322509765625, 0.71246337890625, 0.7599945068359375, 0.807525634765625, 0.8550567626953125, 0.902587890625, 0.9501190185546875, 0.997650146484375, 1.0451812744140625, 1.09271240234375, 1.1402435302734375, 1.187774658203125, 1.2353057861328125, 1.2828369140625, 1.3303680419921875, 1.377899169921875, 1.4254302978515625, 1.47296142578125, 1.5204925537109375, 1.568023681640625, 1.6155548095703125, 1.6630859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 6.0, 8.0, 6.0, 15.0, 12.0, 12.0, 13.0, 14.0, 26.0, 22.0, 30.0, 50.0, 45.0, 36.0, 49.0, 56.0, 68.0, 86.0, 51.0, 55.0, 51.0, 42.0, 37.0, 27.0, 31.0, 19.0, 26.0, 12.0, 14.0, 10.0, 9.0, 9.0, 8.0, 9.0, 9.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2032470703125, -0.19728469848632812, -0.19132232666015625, -0.18535995483398438, -0.1793975830078125, -0.17343521118164062, -0.16747283935546875, -0.16151046752929688, -0.155548095703125, -0.14958572387695312, -0.14362335205078125, -0.13766098022460938, -0.1316986083984375, -0.12573623657226562, -0.11977386474609375, -0.11381149291992188, -0.10784912109375, -0.10188674926757812, -0.09592437744140625, -0.08996200561523438, -0.0839996337890625, -0.07803726196289062, -0.07207489013671875, -0.06611251831054688, -0.060150146484375, -0.054187774658203125, -0.04822540283203125, -0.042263031005859375, -0.0363006591796875, -0.030338287353515625, -0.02437591552734375, -0.018413543701171875, -0.012451171875, -0.006488800048828125, -0.00052642822265625, 0.005435943603515625, 0.0113983154296875, 0.017360687255859375, 0.02332305908203125, 0.029285430908203125, 0.035247802734375, 0.041210174560546875, 0.04717254638671875, 0.053134918212890625, 0.0590972900390625, 0.06505966186523438, 0.07102203369140625, 0.07698440551757812, 0.08294677734375, 0.08890914916992188, 0.09487152099609375, 0.10083389282226562, 0.1067962646484375, 0.11275863647460938, 0.11872100830078125, 0.12468338012695312, 0.130645751953125, 0.13660812377929688, 0.14257049560546875, 0.14853286743164062, 0.1544952392578125, 0.16045761108398438, 0.16641998291015625, 0.17238235473632812, 0.1783447265625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 7.0, 6.0, 12.0, 11.0, 24.0, 22.0, 28.0, 43.0, 53.0, 73.0, 88.0, 129.0, 144.0, 245.0, 594.0, 3288.0, 32972.0, 642607.0, 344705.0, 19942.0, 2252.0, 452.0, 206.0, 149.0, 98.0, 86.0, 68.0, 62.0, 46.0, 23.0, 31.0, 22.0, 10.0, 11.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.646484375, -2.554901123046875, -2.46331787109375, -2.371734619140625, -2.2801513671875, -2.188568115234375, -2.09698486328125, -2.005401611328125, -1.913818359375, -1.822235107421875, -1.73065185546875, -1.639068603515625, -1.5474853515625, -1.455902099609375, -1.36431884765625, -1.272735595703125, -1.18115234375, -1.089569091796875, -0.99798583984375, -0.906402587890625, -0.8148193359375, -0.723236083984375, -0.63165283203125, -0.540069580078125, -0.448486328125, -0.356903076171875, -0.26531982421875, -0.173736572265625, -0.0821533203125, 0.009429931640625, 0.10101318359375, 0.192596435546875, 0.2841796875, 0.375762939453125, 0.46734619140625, 0.558929443359375, 0.6505126953125, 0.742095947265625, 0.83367919921875, 0.925262451171875, 1.016845703125, 1.108428955078125, 1.20001220703125, 1.291595458984375, 1.3831787109375, 1.474761962890625, 1.56634521484375, 1.657928466796875, 1.74951171875, 1.841094970703125, 1.93267822265625, 2.024261474609375, 2.1158447265625, 2.207427978515625, 2.29901123046875, 2.390594482421875, 2.482177734375, 2.573760986328125, 2.66534423828125, 2.756927490234375, 2.8485107421875, 2.940093994140625, 3.03167724609375, 3.123260498046875, 3.21484375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 12.0, 78.0, 611.0, 290.0, 28.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.790554523468018, -5.4465227127075195, -5.102490425109863, -4.758458137512207, -4.414426326751709, -4.070394515991211, -3.7263622283935547, -3.3823301792144775, -3.0382981300354004, -2.6942660808563232, -2.350234031677246, -2.006201982498169, -1.6621699333190918, -1.3181378841400146, -0.9741058349609375, -0.6300737857818604, -0.2860417366027832, 0.057990312576293945, 0.4020223617553711, 0.7460544109344482, 1.0900864601135254, 1.4341185092926025, 1.7781505584716797, 2.122182607650757, 2.466214656829834, 2.810246706008911, 3.1542787551879883, 3.4983108043670654, 3.8423428535461426, 4.186374664306641, 4.530406951904297, 4.874439239501953, 5.218471527099609, 5.562503814697266, 5.906535625457764, 6.250567436218262, 6.594599723815918, 6.938632011413574, 7.282663822174072, 7.62669563293457, 7.970727920532227, 8.314760208129883, 8.658792495727539, 9.002823829650879, 9.346856117248535, 9.690888404846191, 10.034919738769531, 10.378952026367188, 10.722984313964844, 11.0670166015625, 11.411048889160156, 11.755080223083496, 12.099112510681152, 12.443144798278809, 12.787176132202148, 13.131208419799805, 13.475240707397461, 13.819272994995117, 14.163305282592773, 14.507336616516113, 14.85136890411377, 15.195401191711426, 15.539432525634766, 15.883464813232422, 16.227497100830078]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 9.0, 13.0, 14.0, 25.0, 28.0, 34.0, 41.0, 47.0, 42.0, 47.0, 64.0, 51.0, 63.0, 66.0, 52.0, 51.0, 45.0, 45.0, 34.0, 46.0, 29.0, 38.0, 19.0, 12.0, 14.0, 18.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3719418048858643, -1.3376210927963257, -1.303300380706787, -1.268979549407959, -1.2346588373184204, -1.2003381252288818, -1.1660174131393433, -1.1316967010498047, -1.0973759889602661, -1.0630552768707275, -1.028734564781189, -0.9944137930870056, -0.960093080997467, -0.9257723093032837, -0.8914515972137451, -0.8571308851242065, -0.8228101134300232, -0.7884894013404846, -0.7541686296463013, -0.7198479175567627, -0.6855272054672241, -0.6512064933776855, -0.6168857216835022, -0.5825650095939636, -0.5482442378997803, -0.5139235258102417, -0.47960278391838074, -0.4452820420265198, -0.4109613299369812, -0.37664058804512024, -0.3423198461532593, -0.3079991340637207, -0.27367836236953735, -0.23935763537883759, -0.20503690838813782, -0.17071616649627686, -0.1363954395055771, -0.10207471251487732, -0.06775397062301636, -0.03343324363231659, 0.0008874833583831787, 0.035208214074373245, 0.06952894479036331, 0.10384967923164368, 0.13817040622234344, 0.1724911332130432, 0.20681187510490417, 0.24113260209560394, 0.2754533290863037, 0.3097740709781647, 0.34409478306770325, 0.3784155249595642, 0.4127362370491028, 0.44705697894096375, 0.4813777208328247, 0.5156984329223633, 0.5500191450119019, 0.5843398571014404, 0.6186606287956238, 0.6529813408851624, 0.6873020529747009, 0.7216228246688843, 0.7559435367584229, 0.7902642488479614, 0.8245850205421448]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 9.0, 11.0, 8.0, 9.0, 13.0, 6.0, 13.0, 18.0, 24.0, 17.0, 16.0, 25.0, 21.0, 19.0, 24.0, 16.0, 21.0, 33.0, 38.0, 30.0, 25.0, 37.0, 41.0, 35.0, 30.0, 45.0, 34.0, 41.0, 26.0, 25.0, 38.0, 35.0, 21.0, 22.0, 22.0, 21.0, 20.0, 17.0, 15.0, 11.0, 12.0, 13.0, 6.0, 4.0, 6.0, 4.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.0126953125, -0.9825820922851562, -0.9524688720703125, -0.9223556518554688, -0.892242431640625, -0.8621292114257812, -0.8320159912109375, -0.8019027709960938, -0.77178955078125, -0.7416763305664062, -0.7115631103515625, -0.6814498901367188, -0.651336669921875, -0.6212234497070312, -0.5911102294921875, -0.5609970092773438, -0.5308837890625, -0.5007705688476562, -0.4706573486328125, -0.44054412841796875, -0.410430908203125, -0.38031768798828125, -0.3502044677734375, -0.32009124755859375, -0.28997802734375, -0.25986480712890625, -0.2297515869140625, -0.19963836669921875, -0.169525146484375, -0.13941192626953125, -0.1092987060546875, -0.07918548583984375, -0.049072265625, -0.01895904541015625, 0.0111541748046875, 0.04126739501953125, 0.071380615234375, 0.10149383544921875, 0.1316070556640625, 0.16172027587890625, 0.19183349609375, 0.22194671630859375, 0.2520599365234375, 0.28217315673828125, 0.312286376953125, 0.34239959716796875, 0.3725128173828125, 0.40262603759765625, 0.4327392578125, 0.46285247802734375, 0.4929656982421875, 0.5230789184570312, 0.553192138671875, 0.5833053588867188, 0.6134185791015625, 0.6435317993164062, 0.67364501953125, 0.7037582397460938, 0.7338714599609375, 0.7639846801757812, 0.794097900390625, 0.8242111206054688, 0.8543243408203125, 0.8844375610351562, 0.91455078125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 2.0, 4.0, 14.0, 15.0, 20.0, 36.0, 49.0, 54.0, 77.0, 110.0, 144.0, 191.0, 319.0, 424.0, 569.0, 849.0, 1349.0, 2190.0, 3424.0, 6493.0, 12530.0, 30915.0, 107188.0, 617116.0, 187065.0, 41982.0, 16184.0, 7710.0, 4206.0, 2580.0, 1515.0, 973.0, 714.0, 448.0, 332.0, 201.0, 147.0, 113.0, 102.0, 71.0, 35.0, 23.0, 20.0, 13.0, 12.0, 11.0, 4.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.6953125, -2.617523193359375, -2.53973388671875, -2.461944580078125, -2.3841552734375, -2.306365966796875, -2.22857666015625, -2.150787353515625, -2.072998046875, -1.995208740234375, -1.91741943359375, -1.839630126953125, -1.7618408203125, -1.684051513671875, -1.60626220703125, -1.528472900390625, -1.45068359375, -1.372894287109375, -1.29510498046875, -1.217315673828125, -1.1395263671875, -1.061737060546875, -0.98394775390625, -0.906158447265625, -0.828369140625, -0.750579833984375, -0.67279052734375, -0.595001220703125, -0.5172119140625, -0.439422607421875, -0.36163330078125, -0.283843994140625, -0.2060546875, -0.128265380859375, -0.05047607421875, 0.027313232421875, 0.1051025390625, 0.182891845703125, 0.26068115234375, 0.338470458984375, 0.416259765625, 0.494049072265625, 0.57183837890625, 0.649627685546875, 0.7274169921875, 0.805206298828125, 0.88299560546875, 0.960784912109375, 1.03857421875, 1.116363525390625, 1.19415283203125, 1.271942138671875, 1.3497314453125, 1.427520751953125, 1.50531005859375, 1.583099365234375, 1.660888671875, 1.738677978515625, 1.81646728515625, 1.894256591796875, 1.9720458984375, 2.049835205078125, 2.12762451171875, 2.205413818359375, 2.283203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 6.0, 6.0, 17.0, 18.0, 12.0, 22.0, 30.0, 33.0, 40.0, 44.0, 63.0, 56.0, 83.0, 134.0, 245.0, 1557.0, 183.0, 90.0, 64.0, 62.0, 46.0, 36.0, 38.0, 39.0, 22.0, 18.0, 24.0, 13.0, 6.0, 12.0, 6.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.15625, -4.99212646484375, -4.8280029296875, -4.66387939453125, -4.499755859375, -4.33563232421875, -4.1715087890625, -4.00738525390625, -3.84326171875, -3.67913818359375, -3.5150146484375, -3.35089111328125, -3.186767578125, -3.02264404296875, -2.8585205078125, -2.69439697265625, -2.5302734375, -2.36614990234375, -2.2020263671875, -2.03790283203125, -1.873779296875, -1.70965576171875, -1.5455322265625, -1.38140869140625, -1.21728515625, -1.05316162109375, -0.8890380859375, -0.72491455078125, -0.560791015625, -0.39666748046875, -0.2325439453125, -0.06842041015625, 0.095703125, 0.25982666015625, 0.4239501953125, 0.58807373046875, 0.752197265625, 0.91632080078125, 1.0804443359375, 1.24456787109375, 1.40869140625, 1.57281494140625, 1.7369384765625, 1.90106201171875, 2.065185546875, 2.22930908203125, 2.3934326171875, 2.55755615234375, 2.7216796875, 2.88580322265625, 3.0499267578125, 3.21405029296875, 3.378173828125, 3.54229736328125, 3.7064208984375, 3.87054443359375, 4.03466796875, 4.19879150390625, 4.3629150390625, 4.52703857421875, 4.691162109375, 4.85528564453125, 5.0194091796875, 5.18353271484375, 5.34765625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 6.0, 11.0, 15.0, 21.0, 26.0, 23.0, 42.0, 47.0, 63.0, 116.0, 124.0, 224.0, 393.0, 647.0, 1272.0, 2518.0, 5252.0, 12721.0, 42126.0, 389563.0, 2525054.0, 123962.0, 24384.0, 8791.0, 3935.0, 1900.0, 968.0, 560.0, 321.0, 203.0, 135.0, 69.0, 58.0, 37.0, 28.0, 19.0, 16.0, 10.0, 15.0, 13.0, 3.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.0859375, -5.90313720703125, -5.7203369140625, -5.53753662109375, -5.354736328125, -5.17193603515625, -4.9891357421875, -4.80633544921875, -4.62353515625, -4.44073486328125, -4.2579345703125, -4.07513427734375, -3.892333984375, -3.70953369140625, -3.5267333984375, -3.34393310546875, -3.1611328125, -2.97833251953125, -2.7955322265625, -2.61273193359375, -2.429931640625, -2.24713134765625, -2.0643310546875, -1.88153076171875, -1.69873046875, -1.51593017578125, -1.3331298828125, -1.15032958984375, -0.967529296875, -0.78472900390625, -0.6019287109375, -0.41912841796875, -0.236328125, -0.05352783203125, 0.1292724609375, 0.31207275390625, 0.494873046875, 0.67767333984375, 0.8604736328125, 1.04327392578125, 1.22607421875, 1.40887451171875, 1.5916748046875, 1.77447509765625, 1.957275390625, 2.14007568359375, 2.3228759765625, 2.50567626953125, 2.6884765625, 2.87127685546875, 3.0540771484375, 3.23687744140625, 3.419677734375, 3.60247802734375, 3.7852783203125, 3.96807861328125, 4.15087890625, 4.33367919921875, 4.5164794921875, 4.69927978515625, 4.882080078125, 5.06488037109375, 5.2476806640625, 5.43048095703125, 5.61328125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 31.0, 711.0, 270.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.779240608215332, -5.650929927825928, -2.5226192474365234, 0.6056909561157227, 3.734002113342285, 6.862313270568848, 9.990622520446777, 13.11893367767334, 16.24724578857422, 19.37555694580078, 22.503868103027344, 25.632177352905273, 28.760488510131836, 31.8887996673584, 35.01710891723633, 38.14542007446289, 41.27373123168945, 44.402042388916016, 47.53035354614258, 50.658660888671875, 53.78697204589844, 56.915283203125, 60.04359436035156, 63.171905517578125, 66.30021667480469, 69.42852783203125, 72.55683898925781, 75.68515014648438, 78.81346130371094, 81.9417724609375, 85.07008361816406, 88.19839477539062, 91.32670593261719, 94.45501708984375, 97.58332824707031, 100.71163940429688, 103.83995056152344, 106.96826171875, 110.09657287597656, 113.22488403320312, 116.35319519042969, 119.48150634765625, 122.60981750488281, 125.73812866210938, 128.86643981933594, 131.9947509765625, 135.12306213378906, 138.25137329101562, 141.37966918945312, 144.5079803466797, 147.63629150390625, 150.7646026611328, 153.89291381835938, 157.02122497558594, 160.1495361328125, 163.27784729003906, 166.40615844726562, 169.5344696044922, 172.66278076171875, 175.7910919189453, 178.91940307617188, 182.04771423339844, 185.176025390625, 188.30433654785156, 191.43264770507812]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 5.0, 4.0, 5.0, 14.0, 14.0, 21.0, 24.0, 13.0, 19.0, 28.0, 34.0, 32.0, 29.0, 25.0, 34.0, 30.0, 39.0, 44.0, 48.0, 38.0, 36.0, 37.0, 34.0, 38.0, 35.0, 47.0, 36.0, 32.0, 26.0, 29.0, 25.0, 21.0, 19.0, 13.0, 14.0, 9.0, 11.0, 9.0, 8.0, 9.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.959578514099121, -11.564936637878418, -11.170294761657715, -10.775652885437012, -10.381011962890625, -9.986370086669922, -9.591728210449219, -9.197086334228516, -8.802444458007812, -8.40780258178711, -8.013160705566406, -7.618519306182861, -7.223877429962158, -6.829235553741455, -6.43459415435791, -6.039952278137207, -5.645310401916504, -5.250668525695801, -4.856026649475098, -4.461385250091553, -4.06674337387085, -3.6721014976501465, -3.2774598598480225, -2.8828182220458984, -2.4881763458251953, -2.093534469604492, -1.6988928318023682, -1.3042510747909546, -0.909609317779541, -0.5149675607681274, -0.12032580375671387, 0.27431583404541016, 0.6689586639404297, 1.0636004209518433, 1.4582421779632568, 1.8528839349746704, 2.247525691986084, 2.642167568206787, 3.036809206008911, 3.431450843811035, 3.8260927200317383, 4.220734596252441, 4.6153764724731445, 5.0100178718566895, 5.404659748077393, 5.799301624298096, 6.193943023681641, 6.588584899902344, 6.983226776123047, 7.37786865234375, 7.772510528564453, 8.167152404785156, 8.56179428100586, 8.956435203552246, 9.35107707977295, 9.745718955993652, 10.140360832214355, 10.535002708435059, 10.929644584655762, 11.324286460876465, 11.718927383422852, 12.113569259643555, 12.508211135864258, 12.902853012084961, 13.297494888305664]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 4.0, 6.0, 7.0, 7.0, 12.0, 7.0, 13.0, 20.0, 20.0, 20.0, 18.0, 25.0, 21.0, 22.0, 17.0, 24.0, 36.0, 30.0, 29.0, 31.0, 42.0, 37.0, 38.0, 28.0, 41.0, 44.0, 35.0, 35.0, 39.0, 33.0, 29.0, 31.0, 30.0, 30.0, 28.0, 16.0, 10.0, 19.0, 11.0, 7.0, 12.0, 4.0, 5.0, 4.0, 5.0, 5.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.115234375, -1.0810546875, -1.046875, -1.0126953125, -0.978515625, -0.9443359375, -0.91015625, -0.8759765625, -0.841796875, -0.8076171875, -0.7734375, -0.7392578125, -0.705078125, -0.6708984375, -0.63671875, -0.6025390625, -0.568359375, -0.5341796875, -0.5, -0.4658203125, -0.431640625, -0.3974609375, -0.36328125, -0.3291015625, -0.294921875, -0.2607421875, -0.2265625, -0.1923828125, -0.158203125, -0.1240234375, -0.08984375, -0.0556640625, -0.021484375, 0.0126953125, 0.046875, 0.0810546875, 0.115234375, 0.1494140625, 0.18359375, 0.2177734375, 0.251953125, 0.2861328125, 0.3203125, 0.3544921875, 0.388671875, 0.4228515625, 0.45703125, 0.4912109375, 0.525390625, 0.5595703125, 0.59375, 0.6279296875, 0.662109375, 0.6962890625, 0.73046875, 0.7646484375, 0.798828125, 0.8330078125, 0.8671875, 0.9013671875, 0.935546875, 0.9697265625, 1.00390625, 1.0380859375, 1.072265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 18.0, 21.0, 22.0, 36.0, 50.0, 67.0, 100.0, 153.0, 237.0, 407.0, 709.0, 1101.0, 1915.0, 3415.0, 6237.0, 12006.0, 25318.0, 62304.0, 257985.0, 2232833.0, 1338215.0, 161807.0, 48062.0, 20319.0, 9502.0, 4969.0, 2727.0, 1448.0, 843.0, 519.0, 347.0, 200.0, 131.0, 83.0, 55.0, 34.0, 26.0, 17.0, 6.0, 9.0, 13.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6328125, -2.541595458984375, -2.45037841796875, -2.359161376953125, -2.2679443359375, -2.176727294921875, -2.08551025390625, -1.994293212890625, -1.903076171875, -1.811859130859375, -1.72064208984375, -1.629425048828125, -1.5382080078125, -1.446990966796875, -1.35577392578125, -1.264556884765625, -1.17333984375, -1.082122802734375, -0.99090576171875, -0.899688720703125, -0.8084716796875, -0.717254638671875, -0.62603759765625, -0.534820556640625, -0.443603515625, -0.352386474609375, -0.26116943359375, -0.169952392578125, -0.0787353515625, 0.012481689453125, 0.10369873046875, 0.194915771484375, 0.2861328125, 0.377349853515625, 0.46856689453125, 0.559783935546875, 0.6510009765625, 0.742218017578125, 0.83343505859375, 0.924652099609375, 1.015869140625, 1.107086181640625, 1.19830322265625, 1.289520263671875, 1.3807373046875, 1.471954345703125, 1.56317138671875, 1.654388427734375, 1.74560546875, 1.836822509765625, 1.92803955078125, 2.019256591796875, 2.1104736328125, 2.201690673828125, 2.29290771484375, 2.384124755859375, 2.475341796875, 2.566558837890625, 2.65777587890625, 2.748992919921875, 2.8402099609375, 2.931427001953125, 3.02264404296875, 3.113861083984375, 3.205078125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 7.0, 7.0, 10.0, 10.0, 18.0, 21.0, 28.0, 30.0, 55.0, 68.0, 134.0, 220.0, 418.0, 792.0, 958.0, 561.0, 271.0, 168.0, 76.0, 73.0, 52.0, 24.0, 18.0, 11.0, 16.0, 11.0, 5.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.010009765625, -2.86767578125, -2.725341796875, -2.5830078125, -2.440673828125, -2.29833984375, -2.156005859375, -2.013671875, -1.871337890625, -1.72900390625, -1.586669921875, -1.4443359375, -1.302001953125, -1.15966796875, -1.017333984375, -0.875, -0.732666015625, -0.59033203125, -0.447998046875, -0.3056640625, -0.163330078125, -0.02099609375, 0.121337890625, 0.263671875, 0.406005859375, 0.54833984375, 0.690673828125, 0.8330078125, 0.975341796875, 1.11767578125, 1.260009765625, 1.40234375, 1.544677734375, 1.68701171875, 1.829345703125, 1.9716796875, 2.114013671875, 2.25634765625, 2.398681640625, 2.541015625, 2.683349609375, 2.82568359375, 2.968017578125, 3.1103515625, 3.252685546875, 3.39501953125, 3.537353515625, 3.6796875, 3.822021484375, 3.96435546875, 4.106689453125, 4.2490234375, 4.391357421875, 4.53369140625, 4.676025390625, 4.818359375, 4.960693359375, 5.10302734375, 5.245361328125, 5.3876953125, 5.530029296875, 5.67236328125, 5.814697265625, 5.95703125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 12.0, 8.0, 10.0, 16.0, 32.0, 56.0, 103.0, 191.0, 303.0, 624.0, 1252.0, 2748.0, 6245.0, 15824.0, 48085.0, 212270.0, 2655812.0, 1077699.0, 120332.0, 32532.0, 11296.0, 4577.0, 2083.0, 1040.0, 483.0, 263.0, 162.0, 85.0, 51.0, 30.0, 26.0, 10.0, 5.0, 6.0, 3.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25, -6.05364990234375, -5.8572998046875, -5.66094970703125, -5.464599609375, -5.26824951171875, -5.0718994140625, -4.87554931640625, -4.67919921875, -4.48284912109375, -4.2864990234375, -4.09014892578125, -3.893798828125, -3.69744873046875, -3.5010986328125, -3.30474853515625, -3.1083984375, -2.91204833984375, -2.7156982421875, -2.51934814453125, -2.322998046875, -2.12664794921875, -1.9302978515625, -1.73394775390625, -1.53759765625, -1.34124755859375, -1.1448974609375, -0.94854736328125, -0.752197265625, -0.55584716796875, -0.3594970703125, -0.16314697265625, 0.033203125, 0.22955322265625, 0.4259033203125, 0.62225341796875, 0.818603515625, 1.01495361328125, 1.2113037109375, 1.40765380859375, 1.60400390625, 1.80035400390625, 1.9967041015625, 2.19305419921875, 2.389404296875, 2.58575439453125, 2.7821044921875, 2.97845458984375, 3.1748046875, 3.37115478515625, 3.5675048828125, 3.76385498046875, 3.960205078125, 4.15655517578125, 4.3529052734375, 4.54925537109375, 4.74560546875, 4.94195556640625, 5.1383056640625, 5.33465576171875, 5.531005859375, 5.72735595703125, 5.9237060546875, 6.12005615234375, 6.31640625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 13.0, 9.0, 9.0, 20.0, 31.0, 50.0, 50.0, 74.0, 93.0, 115.0, 86.0, 99.0, 79.0, 74.0, 51.0, 41.0, 23.0, 25.0, 16.0, 13.0, 12.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75844955444336, -10.231993675231934, -9.705536842346191, -9.179080963134766, -8.652624130249023, -8.126168251037598, -7.599712371826172, -7.073256015777588, -6.546799659729004, -6.02034330368042, -5.493886947631836, -4.96743106842041, -4.440974712371826, -3.914518356323242, -3.3880622386932373, -2.8616061210632324, -2.3351497650146484, -1.808693528175354, -1.2822372913360596, -0.7557810544967651, -0.2293248176574707, 0.2971315383911133, 0.8235876560211182, 1.350043773651123, 1.876500129699707, 2.402956485748291, 2.929412603378296, 3.455868721008301, 3.9823250770568848, 4.508781433105469, 5.0352373123168945, 5.5616936683654785, 6.0881500244140625, 6.6146063804626465, 7.1410627365112305, 7.667518615722656, 8.193975448608398, 8.720431327819824, 9.24688720703125, 9.773344039916992, 10.299799919128418, 10.826255798339844, 11.352712631225586, 11.879168510437012, 12.405624389648438, 12.93208122253418, 13.458537101745605, 13.984992980957031, 14.511449813842773, 15.0379056930542, 15.564362525939941, 16.090818405151367, 16.61727523803711, 17.14373016357422, 17.67018699645996, 18.196643829345703, 18.723098754882812, 19.249555587768555, 19.776010513305664, 20.302467346191406, 20.82892417907715, 21.35538101196289, 21.8818359375, 22.408292770385742, 22.934749603271484]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 10.0, 5.0, 7.0, 15.0, 21.0, 15.0, 15.0, 25.0, 17.0, 25.0, 27.0, 41.0, 26.0, 37.0, 30.0, 51.0, 31.0, 36.0, 42.0, 40.0, 47.0, 31.0, 44.0, 33.0, 41.0, 35.0, 35.0, 33.0, 29.0, 30.0, 21.0, 11.0, 12.0, 7.0, 18.0, 10.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.877226829528809, -9.562623023986816, -9.248018264770508, -8.933414459228516, -8.618810653686523, -8.304206848144531, -7.989602088928223, -7.6749982833862305, -7.36039400100708, -7.04578971862793, -6.7311859130859375, -6.416581630706787, -6.101977348327637, -5.7873735427856445, -5.472769260406494, -5.158164978027344, -4.843561172485352, -4.528956890106201, -4.214353084564209, -3.8997488021850586, -3.5851447582244873, -3.270540714263916, -2.9559364318847656, -2.6413323879241943, -2.326728343963623, -2.0121243000030518, -1.697520136833191, -1.38291597366333, -1.0683119297027588, -0.7537078857421875, -0.43910372257232666, -0.12449955940246582, 0.19010353088378906, 0.5047076344490051, 0.8193117380142212, 1.133915901184082, 1.4485199451446533, 1.7631239891052246, 2.077728271484375, 2.3923323154449463, 2.7069363594055176, 3.021540403366089, 3.33614444732666, 3.6507487297058105, 3.965352773666382, 4.279956817626953, 4.5945611000061035, 4.909165382385254, 5.223769187927246, 5.5383734703063965, 5.852977275848389, 6.167581558227539, 6.482185363769531, 6.796789646148682, 7.111393928527832, 7.425997734069824, 7.740602016448975, 8.055206298828125, 8.369810104370117, 8.68441390991211, 8.999018669128418, 9.31362247467041, 9.628226280212402, 9.942831039428711, 10.257434844970703]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 2.0, 7.0, 8.0, 8.0, 8.0, 4.0, 9.0, 16.0, 12.0, 21.0, 21.0, 14.0, 23.0, 21.0, 31.0, 37.0, 21.0, 24.0, 39.0, 22.0, 36.0, 35.0, 34.0, 36.0, 39.0, 34.0, 52.0, 37.0, 38.0, 28.0, 32.0, 34.0, 24.0, 32.0, 17.0, 21.0, 22.0, 18.0, 19.0, 14.0, 7.0, 8.0, 10.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.0712890625, -1.0371856689453125, -1.003082275390625, -0.9689788818359375, -0.93487548828125, -0.9007720947265625, -0.866668701171875, -0.8325653076171875, -0.7984619140625, -0.7643585205078125, -0.730255126953125, -0.6961517333984375, -0.66204833984375, -0.6279449462890625, -0.593841552734375, -0.5597381591796875, -0.525634765625, -0.4915313720703125, -0.457427978515625, -0.4233245849609375, -0.38922119140625, -0.3551177978515625, -0.321014404296875, -0.2869110107421875, -0.2528076171875, -0.2187042236328125, -0.184600830078125, -0.1504974365234375, -0.11639404296875, -0.0822906494140625, -0.048187255859375, -0.0140838623046875, 0.02001953125, 0.0541229248046875, 0.088226318359375, 0.1223297119140625, 0.15643310546875, 0.1905364990234375, 0.224639892578125, 0.2587432861328125, 0.2928466796875, 0.3269500732421875, 0.361053466796875, 0.3951568603515625, 0.42926025390625, 0.4633636474609375, 0.497467041015625, 0.5315704345703125, 0.565673828125, 0.5997772216796875, 0.633880615234375, 0.6679840087890625, 0.70208740234375, 0.7361907958984375, 0.770294189453125, 0.8043975830078125, 0.8385009765625, 0.8726043701171875, 0.906707763671875, 0.9408111572265625, 0.97491455078125, 1.0090179443359375, 1.043121337890625, 1.0772247314453125, 1.111328125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 14.0, 11.0, 27.0, 28.0, 61.0, 110.0, 144.0, 193.0, 358.0, 564.0, 914.0, 1344.0, 2298.0, 3520.0, 5824.0, 9194.0, 14746.0, 23420.0, 37104.0, 57330.0, 84447.0, 116825.0, 142081.0, 146592.0, 126067.0, 94608.0, 65370.0, 42533.0, 27227.0, 17181.0, 10774.0, 6657.0, 4104.0, 2556.0, 1615.0, 978.0, 590.0, 433.0, 266.0, 152.0, 110.0, 71.0, 35.0, 29.0, 22.0, 10.0, 4.0, 8.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9627532958984375, -0.931854248046875, -0.9009552001953125, -0.87005615234375, -0.8391571044921875, -0.808258056640625, -0.7773590087890625, -0.7464599609375, -0.7155609130859375, -0.684661865234375, -0.6537628173828125, -0.62286376953125, -0.5919647216796875, -0.561065673828125, -0.5301666259765625, -0.499267578125, -0.4683685302734375, -0.437469482421875, -0.4065704345703125, -0.37567138671875, -0.3447723388671875, -0.313873291015625, -0.2829742431640625, -0.2520751953125, -0.2211761474609375, -0.190277099609375, -0.1593780517578125, -0.12847900390625, -0.0975799560546875, -0.066680908203125, -0.0357818603515625, -0.0048828125, 0.0260162353515625, 0.056915283203125, 0.0878143310546875, 0.11871337890625, 0.1496124267578125, 0.180511474609375, 0.2114105224609375, 0.2423095703125, 0.2732086181640625, 0.304107666015625, 0.3350067138671875, 0.36590576171875, 0.3968048095703125, 0.427703857421875, 0.4586029052734375, 0.489501953125, 0.5204010009765625, 0.551300048828125, 0.5821990966796875, 0.61309814453125, 0.6439971923828125, 0.674896240234375, 0.7057952880859375, 0.7366943359375, 0.7675933837890625, 0.798492431640625, 0.8293914794921875, 0.86029052734375, 0.8911895751953125, 0.922088623046875, 0.9529876708984375, 0.98388671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 10.0, 8.0, 12.0, 15.0, 12.0, 16.0, 19.0, 21.0, 26.0, 21.0, 34.0, 21.0, 35.0, 44.0, 40.0, 38.0, 39.0, 44.0, 1070.0, 39.0, 42.0, 33.0, 48.0, 40.0, 32.0, 35.0, 28.0, 33.0, 26.0, 23.0, 17.0, 22.0, 12.0, 14.0, 11.0, 7.0, 9.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.990386962890625, -0.95147705078125, -0.912567138671875, -0.8736572265625, -0.834747314453125, -0.79583740234375, -0.756927490234375, -0.718017578125, -0.679107666015625, -0.64019775390625, -0.601287841796875, -0.5623779296875, -0.523468017578125, -0.48455810546875, -0.445648193359375, -0.40673828125, -0.367828369140625, -0.32891845703125, -0.290008544921875, -0.2510986328125, -0.212188720703125, -0.17327880859375, -0.134368896484375, -0.095458984375, -0.056549072265625, -0.01763916015625, 0.021270751953125, 0.0601806640625, 0.099090576171875, 0.13800048828125, 0.176910400390625, 0.2158203125, 0.254730224609375, 0.29364013671875, 0.332550048828125, 0.3714599609375, 0.410369873046875, 0.44927978515625, 0.488189697265625, 0.527099609375, 0.566009521484375, 0.60491943359375, 0.643829345703125, 0.6827392578125, 0.721649169921875, 0.76055908203125, 0.799468994140625, 0.83837890625, 0.877288818359375, 0.91619873046875, 0.955108642578125, 0.9940185546875, 1.032928466796875, 1.07183837890625, 1.110748291015625, 1.149658203125, 1.188568115234375, 1.22747802734375, 1.266387939453125, 1.3052978515625, 1.344207763671875, 1.38311767578125, 1.422027587890625, 1.4609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 11.0, 19.0, 12.0, 25.0, 29.0, 49.0, 72.0, 85.0, 131.0, 199.0, 297.0, 407.0, 657.0, 902.0, 1468.0, 2301.0, 3766.0, 6147.0, 10414.0, 17908.0, 32579.0, 77876.0, 1379714.0, 437594.0, 57744.0, 27414.0, 15594.0, 9001.0, 5325.0, 3283.0, 2090.0, 1313.0, 799.0, 582.0, 424.0, 252.0, 174.0, 130.0, 115.0, 47.0, 50.0, 32.0, 20.0, 18.0, 13.0, 8.0, 8.0, 8.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.54296875, -1.4945526123046875, -1.446136474609375, -1.3977203369140625, -1.34930419921875, -1.3008880615234375, -1.252471923828125, -1.2040557861328125, -1.1556396484375, -1.1072235107421875, -1.058807373046875, -1.0103912353515625, -0.96197509765625, -0.9135589599609375, -0.865142822265625, -0.8167266845703125, -0.768310546875, -0.7198944091796875, -0.671478271484375, -0.6230621337890625, -0.57464599609375, -0.5262298583984375, -0.477813720703125, -0.4293975830078125, -0.3809814453125, -0.3325653076171875, -0.284149169921875, -0.2357330322265625, -0.18731689453125, -0.1389007568359375, -0.090484619140625, -0.0420684814453125, 0.00634765625, 0.0547637939453125, 0.103179931640625, 0.1515960693359375, 0.20001220703125, 0.2484283447265625, 0.296844482421875, 0.3452606201171875, 0.3936767578125, 0.4420928955078125, 0.490509033203125, 0.5389251708984375, 0.58734130859375, 0.6357574462890625, 0.684173583984375, 0.7325897216796875, 0.781005859375, 0.8294219970703125, 0.877838134765625, 0.9262542724609375, 0.97467041015625, 1.0230865478515625, 1.071502685546875, 1.1199188232421875, 1.1683349609375, 1.2167510986328125, 1.265167236328125, 1.3135833740234375, 1.36199951171875, 1.4104156494140625, 1.458831787109375, 1.5072479248046875, 1.5556640625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 16.0, 10.0, 7.0, 12.0, 15.0, 20.0, 20.0, 33.0, 33.0, 33.0, 48.0, 64.0, 62.0, 66.0, 70.0, 74.0, 55.0, 73.0, 48.0, 43.0, 46.0, 23.0, 19.0, 20.0, 13.0, 12.0, 11.0, 13.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.207763671875, -0.20156478881835938, -0.19536590576171875, -0.18916702270507812, -0.1829681396484375, -0.17676925659179688, -0.17057037353515625, -0.16437149047851562, -0.158172607421875, -0.15197372436523438, -0.14577484130859375, -0.13957595825195312, -0.1333770751953125, -0.12717819213867188, -0.12097930908203125, -0.11478042602539062, -0.10858154296875, -0.10238265991210938, -0.09618377685546875, -0.08998489379882812, -0.0837860107421875, -0.07758712768554688, -0.07138824462890625, -0.06518936157226562, -0.058990478515625, -0.052791595458984375, -0.04659271240234375, -0.040393829345703125, -0.0341949462890625, -0.027996063232421875, -0.02179718017578125, -0.015598297119140625, -0.0093994140625, -0.003200531005859375, 0.00299835205078125, 0.009197235107421875, 0.0153961181640625, 0.021595001220703125, 0.02779388427734375, 0.033992767333984375, 0.040191650390625, 0.046390533447265625, 0.05258941650390625, 0.058788299560546875, 0.0649871826171875, 0.07118606567382812, 0.07738494873046875, 0.08358383178710938, 0.08978271484375, 0.09598159790039062, 0.10218048095703125, 0.10837936401367188, 0.1145782470703125, 0.12077713012695312, 0.12697601318359375, 0.13317489624023438, 0.139373779296875, 0.14557266235351562, 0.15177154541015625, 0.15797042846679688, 0.1641693115234375, 0.17036819458007812, 0.17656707763671875, 0.18276596069335938, 0.18896484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 10.0, 10.0, 6.0, 27.0, 24.0, 27.0, 62.0, 65.0, 98.0, 179.0, 291.0, 793.0, 4923.0, 61990.0, 883064.0, 89193.0, 5911.0, 1042.0, 304.0, 175.0, 96.0, 56.0, 60.0, 28.0, 25.0, 18.0, 17.0, 19.0, 6.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.01171875, -2.91314697265625, -2.8145751953125, -2.71600341796875, -2.617431640625, -2.51885986328125, -2.4202880859375, -2.32171630859375, -2.22314453125, -2.12457275390625, -2.0260009765625, -1.92742919921875, -1.828857421875, -1.73028564453125, -1.6317138671875, -1.53314208984375, -1.4345703125, -1.33599853515625, -1.2374267578125, -1.13885498046875, -1.040283203125, -0.94171142578125, -0.8431396484375, -0.74456787109375, -0.64599609375, -0.54742431640625, -0.4488525390625, -0.35028076171875, -0.251708984375, -0.15313720703125, -0.0545654296875, 0.04400634765625, 0.142578125, 0.24114990234375, 0.3397216796875, 0.43829345703125, 0.536865234375, 0.63543701171875, 0.7340087890625, 0.83258056640625, 0.93115234375, 1.02972412109375, 1.1282958984375, 1.22686767578125, 1.325439453125, 1.42401123046875, 1.5225830078125, 1.62115478515625, 1.7197265625, 1.81829833984375, 1.9168701171875, 2.01544189453125, 2.114013671875, 2.21258544921875, 2.3111572265625, 2.40972900390625, 2.50830078125, 2.60687255859375, 2.7054443359375, 2.80401611328125, 2.902587890625, 3.00115966796875, 3.0997314453125, 3.19830322265625, 3.296875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 12.0, 50.0, 174.0, 517.0, 211.0, 44.0, 9.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.010072946548462, -1.8363933563232422, -1.662713885307312, -1.4890342950820923, -1.315354824066162, -1.1416752338409424, -0.9679956436157227, -0.7943161725997925, -0.6206365823745728, -0.4469570517539978, -0.27327749133110046, -0.09959793090820312, 0.07408159971237183, 0.24776113033294678, 0.4214407205581665, 0.5951201915740967, 0.7687997817993164, 0.9424793124198914, 1.1161588430404663, 1.289838433265686, 1.4635179042816162, 1.637197494506836, 1.8108770847320557, 1.9845565557479858, 2.158236026763916, 2.3319156169891357, 2.5055952072143555, 2.679274559020996, 2.852954149246216, 3.0266337394714355, 3.2003133296966553, 3.373992919921875, 3.547672748565674, 3.7213523387908936, 3.8950319290161133, 4.068711280822754, 4.242391109466553, 4.416070461273193, 4.589750289916992, 4.763429641723633, 4.937108993530273, 5.110788345336914, 5.284468173980713, 5.4581475257873535, 5.631827354431152, 5.805506706237793, 5.979186058044434, 6.152865886688232, 6.326545715332031, 6.500225067138672, 6.673904895782471, 6.847584247589111, 7.02126407623291, 7.194943428039551, 7.368622779846191, 7.54230260848999, 7.715981960296631, 7.8896613121032715, 8.06334114074707, 8.237020492553711, 8.410699844360352, 8.584379196166992, 8.75805950164795, 8.93173885345459, 9.10541820526123]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 13.0, 18.0, 24.0, 22.0, 31.0, 25.0, 40.0, 41.0, 41.0, 50.0, 51.0, 47.0, 41.0, 50.0, 61.0, 68.0, 44.0, 46.0, 49.0, 42.0, 33.0, 38.0, 26.0, 16.0, 16.0, 12.0, 10.0, 11.0, 4.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6182995438575745, -0.6007850170135498, -0.5832705497741699, -0.5657560229301453, -0.5482415556907654, -0.5307270288467407, -0.5132125616073608, -0.4956980347633362, -0.4781835079193115, -0.46066901087760925, -0.443154513835907, -0.4256399869918823, -0.40812548995018005, -0.3906109929084778, -0.3730964958667755, -0.35558199882507324, -0.33806750178337097, -0.3205530047416687, -0.30303850769996643, -0.28552401065826416, -0.2680094838142395, -0.25049498677253723, -0.23298048973083496, -0.2154659926891327, -0.19795148074626923, -0.18043698370456696, -0.1629224717617035, -0.14540797472000122, -0.12789347767829895, -0.11037896573543549, -0.09286446869373322, -0.07534996420145035, -0.05783545970916748, -0.04032095521688461, -0.022806454449892044, -0.005291953682899475, 0.012222550809383392, 0.02973705530166626, 0.04725155234336853, 0.0647660568356514, 0.08228056132793427, 0.09979506582021713, 0.1173095703125, 0.13482406735420227, 0.15233856439590454, 0.169853076338768, 0.18736757338047028, 0.20488208532333374, 0.222396582365036, 0.23991107940673828, 0.25742557644844055, 0.2749400734901428, 0.2924546003341675, 0.30996909737586975, 0.327483594417572, 0.3449980914592743, 0.36251258850097656, 0.38002708554267883, 0.3975415825843811, 0.41505610942840576, 0.43257060647010803, 0.4500851035118103, 0.4675996005535126, 0.48511409759521484, 0.5026286244392395]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 6.0, 8.0, 5.0, 7.0, 13.0, 16.0, 15.0, 22.0, 18.0, 21.0, 21.0, 22.0, 39.0, 31.0, 16.0, 38.0, 24.0, 31.0, 44.0, 26.0, 39.0, 33.0, 31.0, 52.0, 49.0, 25.0, 39.0, 26.0, 44.0, 25.0, 29.0, 21.0, 22.0, 16.0, 19.0, 19.0, 21.0, 8.0, 3.0, 13.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.0947265625, -1.060333251953125, -1.02593994140625, -0.991546630859375, -0.9571533203125, -0.922760009765625, -0.88836669921875, -0.853973388671875, -0.819580078125, -0.785186767578125, -0.75079345703125, -0.716400146484375, -0.6820068359375, -0.647613525390625, -0.61322021484375, -0.578826904296875, -0.54443359375, -0.510040283203125, -0.47564697265625, -0.441253662109375, -0.4068603515625, -0.372467041015625, -0.33807373046875, -0.303680419921875, -0.269287109375, -0.234893798828125, -0.20050048828125, -0.166107177734375, -0.1317138671875, -0.097320556640625, -0.06292724609375, -0.028533935546875, 0.005859375, 0.040252685546875, 0.07464599609375, 0.109039306640625, 0.1434326171875, 0.177825927734375, 0.21221923828125, 0.246612548828125, 0.281005859375, 0.315399169921875, 0.34979248046875, 0.384185791015625, 0.4185791015625, 0.452972412109375, 0.48736572265625, 0.521759033203125, 0.55615234375, 0.590545654296875, 0.62493896484375, 0.659332275390625, 0.6937255859375, 0.728118896484375, 0.76251220703125, 0.796905517578125, 0.831298828125, 0.865692138671875, 0.90008544921875, 0.934478759765625, 0.9688720703125, 1.003265380859375, 1.03765869140625, 1.072052001953125, 1.1064453125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 14.0, 13.0, 25.0, 26.0, 37.0, 52.0, 101.0, 143.0, 192.0, 261.0, 374.0, 572.0, 772.0, 1172.0, 1753.0, 2577.0, 3863.0, 5877.0, 9213.0, 14620.0, 23513.0, 40028.0, 76889.0, 218920.0, 392526.0, 119633.0, 53741.0, 30106.0, 18337.0, 11211.0, 7322.0, 4690.0, 3260.0, 2182.0, 1374.0, 1023.0, 691.0, 423.0, 315.0, 244.0, 130.0, 121.0, 76.0, 41.0, 36.0, 23.0, 24.0, 8.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0], "bins": [-1.6982421875, -1.648651123046875, -1.59906005859375, -1.549468994140625, -1.4998779296875, -1.450286865234375, -1.40069580078125, -1.351104736328125, -1.301513671875, -1.251922607421875, -1.20233154296875, -1.152740478515625, -1.1031494140625, -1.053558349609375, -1.00396728515625, -0.954376220703125, -0.90478515625, -0.855194091796875, -0.80560302734375, -0.756011962890625, -0.7064208984375, -0.656829833984375, -0.60723876953125, -0.557647705078125, -0.508056640625, -0.458465576171875, -0.40887451171875, -0.359283447265625, -0.3096923828125, -0.260101318359375, -0.21051025390625, -0.160919189453125, -0.111328125, -0.061737060546875, -0.01214599609375, 0.037445068359375, 0.0870361328125, 0.136627197265625, 0.18621826171875, 0.235809326171875, 0.285400390625, 0.334991455078125, 0.38458251953125, 0.434173583984375, 0.4837646484375, 0.533355712890625, 0.58294677734375, 0.632537841796875, 0.68212890625, 0.731719970703125, 0.78131103515625, 0.830902099609375, 0.8804931640625, 0.930084228515625, 0.97967529296875, 1.029266357421875, 1.078857421875, 1.128448486328125, 1.17803955078125, 1.227630615234375, 1.2772216796875, 1.326812744140625, 1.37640380859375, 1.425994873046875, 1.4755859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 11.0, 10.0, 16.0, 9.0, 12.0, 20.0, 19.0, 32.0, 36.0, 32.0, 43.0, 42.0, 54.0, 72.0, 124.0, 202.0, 1536.0, 186.0, 126.0, 91.0, 43.0, 50.0, 47.0, 31.0, 28.0, 28.0, 22.0, 24.0, 22.0, 19.0, 13.0, 5.0, 7.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.185302734375, -4.03857421875, -3.891845703125, -3.7451171875, -3.598388671875, -3.45166015625, -3.304931640625, -3.158203125, -3.011474609375, -2.86474609375, -2.718017578125, -2.5712890625, -2.424560546875, -2.27783203125, -2.131103515625, -1.984375, -1.837646484375, -1.69091796875, -1.544189453125, -1.3974609375, -1.250732421875, -1.10400390625, -0.957275390625, -0.810546875, -0.663818359375, -0.51708984375, -0.370361328125, -0.2236328125, -0.076904296875, 0.06982421875, 0.216552734375, 0.36328125, 0.510009765625, 0.65673828125, 0.803466796875, 0.9501953125, 1.096923828125, 1.24365234375, 1.390380859375, 1.537109375, 1.683837890625, 1.83056640625, 1.977294921875, 2.1240234375, 2.270751953125, 2.41748046875, 2.564208984375, 2.7109375, 2.857666015625, 3.00439453125, 3.151123046875, 3.2978515625, 3.444580078125, 3.59130859375, 3.738037109375, 3.884765625, 4.031494140625, 4.17822265625, 4.324951171875, 4.4716796875, 4.618408203125, 4.76513671875, 4.911865234375, 5.05859375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 5.0, 9.0, 11.0, 20.0, 48.0, 58.0, 85.0, 121.0, 215.0, 407.0, 854.0, 2291.0, 8420.0, 55672.0, 2157525.0, 869707.0, 39858.0, 6791.0, 1950.0, 741.0, 350.0, 218.0, 92.0, 71.0, 66.0, 24.0, 30.0, 13.0, 11.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.1015625, -8.84820556640625, -8.5948486328125, -8.34149169921875, -8.088134765625, -7.83477783203125, -7.5814208984375, -7.32806396484375, -7.07470703125, -6.82135009765625, -6.5679931640625, -6.31463623046875, -6.061279296875, -5.80792236328125, -5.5545654296875, -5.30120849609375, -5.0478515625, -4.79449462890625, -4.5411376953125, -4.28778076171875, -4.034423828125, -3.78106689453125, -3.5277099609375, -3.27435302734375, -3.02099609375, -2.76763916015625, -2.5142822265625, -2.26092529296875, -2.007568359375, -1.75421142578125, -1.5008544921875, -1.24749755859375, -0.994140625, -0.74078369140625, -0.4874267578125, -0.23406982421875, 0.019287109375, 0.27264404296875, 0.5260009765625, 0.77935791015625, 1.03271484375, 1.28607177734375, 1.5394287109375, 1.79278564453125, 2.046142578125, 2.29949951171875, 2.5528564453125, 2.80621337890625, 3.0595703125, 3.31292724609375, 3.5662841796875, 3.81964111328125, 4.072998046875, 4.32635498046875, 4.5797119140625, 4.83306884765625, 5.08642578125, 5.33978271484375, 5.5931396484375, 5.84649658203125, 6.099853515625, 6.35321044921875, 6.6065673828125, 6.85992431640625, 7.11328125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [3.0, 39.0, 184.0, 444.0, 273.0, 65.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015747547149658, -3.6580281257629395, -2.3003089427948, -0.9425897598266602, 0.4151296615600586, 1.7728490829467773, 3.130568027496338, 4.488287448883057, 5.846006870269775, 7.203726291656494, 8.561445236206055, 9.919164657592773, 11.276884078979492, 12.634603500366211, 13.99232292175293, 15.350042343139648, 16.707761764526367, 18.065481185913086, 19.423200607299805, 20.780920028686523, 22.138639450073242, 23.49635887145996, 24.854076385498047, 26.211795806884766, 27.569515228271484, 28.927234649658203, 30.284954071044922, 31.64267349243164, 33.00039291381836, 34.35811233520508, 35.7158317565918, 37.073551177978516, 38.431270599365234, 39.78899002075195, 41.14670944213867, 42.50442886352539, 43.86214828491211, 45.21986770629883, 46.57758712768555, 47.935306549072266, 49.293025970458984, 50.6507453918457, 52.00846481323242, 53.36618423461914, 54.72390365600586, 56.08162307739258, 57.4393424987793, 58.797061920166016, 60.15477752685547, 61.51249694824219, 62.870216369628906, 64.22793579101562, 65.58565521240234, 66.94337463378906, 68.30109405517578, 69.6588134765625, 71.01653289794922, 72.37425231933594, 73.73197174072266, 75.08969116210938, 76.4474105834961, 77.80513000488281, 79.16284942626953, 80.52056884765625, 81.87828826904297]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 10.0, 7.0, 5.0, 11.0, 16.0, 12.0, 21.0, 18.0, 20.0, 27.0, 23.0, 40.0, 25.0, 30.0, 40.0, 43.0, 41.0, 53.0, 34.0, 41.0, 39.0, 49.0, 35.0, 34.0, 46.0, 42.0, 43.0, 30.0, 27.0, 21.0, 25.0, 17.0, 14.0, 13.0, 8.0, 13.0, 8.0, 2.0, 1.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.714778900146484, -12.293701171875, -11.8726224899292, -11.451544761657715, -11.030466079711914, -10.60938835144043, -10.188310623168945, -9.767231941223145, -9.346153259277344, -8.92507553100586, -8.503996849060059, -8.082919120788574, -7.661840438842773, -7.240762710571289, -6.8196845054626465, -6.398606300354004, -5.9775285720825195, -5.556450366973877, -5.135372161865234, -4.71429443359375, -4.293215751647949, -3.8721377849578857, -3.4510598182678223, -3.0299816131591797, -2.608903408050537, -2.1878252029418945, -1.7667471170425415, -1.3456690311431885, -0.9245908260345459, -0.5035126209259033, -0.08243465423583984, 0.33864355087280273, 0.7597208023071289, 1.1807990074157715, 1.6018770933151245, 2.0229551792144775, 2.44403338432312, 2.8651115894317627, 3.286189556121826, 3.7072677612304688, 4.128345966339111, 4.549424171447754, 4.9705023765563965, 5.391580581665039, 5.812658309936523, 6.233736991882324, 6.654814720153809, 7.075892925262451, 7.496971130371094, 7.918049335479736, 8.339127540588379, 8.760205268859863, 9.181283950805664, 9.602361679077148, 10.023439407348633, 10.444518089294434, 10.865596771240234, 11.286674499511719, 11.70775318145752, 12.128830909729004, 12.549909591674805, 12.970987319946289, 13.392065048217773, 13.813143730163574, 14.234221458435059]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 5.0, 7.0, 12.0, 7.0, 10.0, 19.0, 18.0, 15.0, 17.0, 22.0, 28.0, 26.0, 25.0, 22.0, 30.0, 30.0, 43.0, 30.0, 43.0, 37.0, 49.0, 39.0, 40.0, 42.0, 39.0, 44.0, 28.0, 27.0, 33.0, 27.0, 20.0, 30.0, 20.0, 16.0, 14.0, 19.0, 11.0, 10.0, 4.0, 13.0, 5.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.173828125, -1.1363067626953125, -1.098785400390625, -1.0612640380859375, -1.02374267578125, -0.9862213134765625, -0.948699951171875, -0.9111785888671875, -0.8736572265625, -0.8361358642578125, -0.798614501953125, -0.7610931396484375, -0.72357177734375, -0.6860504150390625, -0.648529052734375, -0.6110076904296875, -0.573486328125, -0.5359649658203125, -0.498443603515625, -0.4609222412109375, -0.42340087890625, -0.3858795166015625, -0.348358154296875, -0.3108367919921875, -0.2733154296875, -0.2357940673828125, -0.198272705078125, -0.1607513427734375, -0.12322998046875, -0.0857086181640625, -0.048187255859375, -0.0106658935546875, 0.02685546875, 0.0643768310546875, 0.101898193359375, 0.1394195556640625, 0.17694091796875, 0.2144622802734375, 0.251983642578125, 0.2895050048828125, 0.3270263671875, 0.3645477294921875, 0.402069091796875, 0.4395904541015625, 0.47711181640625, 0.5146331787109375, 0.552154541015625, 0.5896759033203125, 0.627197265625, 0.6647186279296875, 0.702239990234375, 0.7397613525390625, 0.77728271484375, 0.8148040771484375, 0.852325439453125, 0.8898468017578125, 0.9273681640625, 0.9648895263671875, 1.002410888671875, 1.0399322509765625, 1.07745361328125, 1.1149749755859375, 1.152496337890625, 1.1900177001953125, 1.2275390625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 8.0, 13.0, 19.0, 40.0, 39.0, 59.0, 95.0, 133.0, 211.0, 251.0, 351.0, 476.0, 671.0, 877.0, 1333.0, 1896.0, 2631.0, 3830.0, 5723.0, 8581.0, 13730.0, 23330.0, 43374.0, 97585.0, 312309.0, 1263556.0, 1664951.0, 485894.0, 135938.0, 53487.0, 27642.0, 15915.0, 9702.0, 6137.0, 4047.0, 2809.0, 1956.0, 1306.0, 976.0, 725.0, 473.0, 321.0, 276.0, 168.0, 130.0, 101.0, 57.0, 57.0, 31.0, 22.0, 14.0, 11.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0], "bins": [-1.8017578125, -1.7457122802734375, -1.689666748046875, -1.6336212158203125, -1.57757568359375, -1.5215301513671875, -1.465484619140625, -1.4094390869140625, -1.3533935546875, -1.2973480224609375, -1.241302490234375, -1.1852569580078125, -1.12921142578125, -1.0731658935546875, -1.017120361328125, -0.9610748291015625, -0.905029296875, -0.8489837646484375, -0.792938232421875, -0.7368927001953125, -0.68084716796875, -0.6248016357421875, -0.568756103515625, -0.5127105712890625, -0.4566650390625, -0.4006195068359375, -0.344573974609375, -0.2885284423828125, -0.23248291015625, -0.1764373779296875, -0.120391845703125, -0.0643463134765625, -0.00830078125, 0.0477447509765625, 0.103790283203125, 0.1598358154296875, 0.21588134765625, 0.2719268798828125, 0.327972412109375, 0.3840179443359375, 0.4400634765625, 0.4961090087890625, 0.552154541015625, 0.6082000732421875, 0.66424560546875, 0.7202911376953125, 0.776336669921875, 0.8323822021484375, 0.888427734375, 0.9444732666015625, 1.000518798828125, 1.0565643310546875, 1.11260986328125, 1.1686553955078125, 1.224700927734375, 1.2807464599609375, 1.3367919921875, 1.3928375244140625, 1.448883056640625, 1.5049285888671875, 1.56097412109375, 1.6170196533203125, 1.673065185546875, 1.7291107177734375, 1.78515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 12.0, 18.0, 35.0, 45.0, 64.0, 104.0, 218.0, 418.0, 859.0, 1099.0, 569.0, 264.0, 113.0, 92.0, 53.0, 31.0, 24.0, 18.0, 10.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.63421630859375, -4.4637451171875, -4.29327392578125, -4.122802734375, -3.95233154296875, -3.7818603515625, -3.61138916015625, -3.44091796875, -3.27044677734375, -3.0999755859375, -2.92950439453125, -2.759033203125, -2.58856201171875, -2.4180908203125, -2.24761962890625, -2.0771484375, -1.90667724609375, -1.7362060546875, -1.56573486328125, -1.395263671875, -1.22479248046875, -1.0543212890625, -0.88385009765625, -0.71337890625, -0.54290771484375, -0.3724365234375, -0.20196533203125, -0.031494140625, 0.13897705078125, 0.3094482421875, 0.47991943359375, 0.650390625, 0.82086181640625, 0.9913330078125, 1.16180419921875, 1.332275390625, 1.50274658203125, 1.6732177734375, 1.84368896484375, 2.01416015625, 2.18463134765625, 2.3551025390625, 2.52557373046875, 2.696044921875, 2.86651611328125, 3.0369873046875, 3.20745849609375, 3.3779296875, 3.54840087890625, 3.7188720703125, 3.88934326171875, 4.059814453125, 4.23028564453125, 4.4007568359375, 4.57122802734375, 4.74169921875, 4.91217041015625, 5.0826416015625, 5.25311279296875, 5.423583984375, 5.59405517578125, 5.7645263671875, 5.93499755859375, 6.10546875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 15.0, 14.0, 16.0, 25.0, 36.0, 43.0, 66.0, 87.0, 187.0, 266.0, 488.0, 925.0, 1787.0, 4056.0, 9336.0, 24053.0, 69879.0, 309575.0, 2708482.0, 874004.0, 126974.0, 38220.0, 14393.0, 5899.0, 2649.0, 1283.0, 621.0, 336.0, 201.0, 118.0, 72.0, 63.0, 37.0, 24.0, 22.0, 16.0, 13.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.04351806640625, -3.8800048828125, -3.71649169921875, -3.552978515625, -3.38946533203125, -3.2259521484375, -3.06243896484375, -2.89892578125, -2.73541259765625, -2.5718994140625, -2.40838623046875, -2.244873046875, -2.08135986328125, -1.9178466796875, -1.75433349609375, -1.5908203125, -1.42730712890625, -1.2637939453125, -1.10028076171875, -0.936767578125, -0.77325439453125, -0.6097412109375, -0.44622802734375, -0.28271484375, -0.11920166015625, 0.0443115234375, 0.20782470703125, 0.371337890625, 0.53485107421875, 0.6983642578125, 0.86187744140625, 1.025390625, 1.18890380859375, 1.3524169921875, 1.51593017578125, 1.679443359375, 1.84295654296875, 2.0064697265625, 2.16998291015625, 2.33349609375, 2.49700927734375, 2.6605224609375, 2.82403564453125, 2.987548828125, 3.15106201171875, 3.3145751953125, 3.47808837890625, 3.6416015625, 3.80511474609375, 3.9686279296875, 4.13214111328125, 4.295654296875, 4.45916748046875, 4.6226806640625, 4.78619384765625, 4.94970703125, 5.11322021484375, 5.2767333984375, 5.44024658203125, 5.603759765625, 5.76727294921875, 5.9307861328125, 6.09429931640625, 6.2578125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 19.0, 45.0, 91.0, 163.0, 221.0, 208.0, 125.0, 78.0, 28.0, 12.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.979034423828125, -45.797183990478516, -44.615333557128906, -43.43348693847656, -42.25163650512695, -41.069786071777344, -39.887935638427734, -38.706085205078125, -37.52423858642578, -36.34238815307617, -35.16053771972656, -33.97869110107422, -32.79684066772461, -31.614990234375, -30.43313980102539, -29.251291275024414, -28.069440841674805, -26.887590408325195, -25.70574188232422, -24.52389144897461, -23.342042922973633, -22.160192489624023, -20.978343963623047, -19.796493530273438, -18.614643096923828, -17.43279266357422, -16.250944137573242, -15.069093704223633, -13.887245178222656, -12.705394744873047, -11.523545265197754, -10.341695785522461, -9.159849166870117, -7.977999687194824, -6.796150207519531, -5.61430025100708, -4.432450771331787, -3.250601291656494, -2.068751335144043, -0.88690185546875, 0.29494762420654297, 1.4767972230911255, 2.658646821975708, 3.84049654006958, 5.022346019744873, 6.204195499420166, 7.386045455932617, 8.56789493560791, 9.749744415283203, 10.931593894958496, 12.113443374633789, 13.295293807983398, 14.477142333984375, 15.658992767333984, 16.840843200683594, 18.02269172668457, 19.204540252685547, 20.386390686035156, 21.568239212036133, 22.750089645385742, 23.93193817138672, 25.113788604736328, 26.295639038085938, 27.477487564086914, 28.659337997436523]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 7.0, 14.0, 9.0, 12.0, 14.0, 18.0, 24.0, 32.0, 21.0, 22.0, 28.0, 26.0, 42.0, 30.0, 29.0, 35.0, 41.0, 35.0, 44.0, 45.0, 47.0, 35.0, 35.0, 32.0, 38.0, 28.0, 31.0, 29.0, 28.0, 33.0, 14.0, 20.0, 10.0, 19.0, 14.0, 15.0, 5.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.825056076049805, -9.511898040771484, -9.19874095916748, -8.88558292388916, -8.57242488861084, -8.25926685333252, -7.946109771728516, -7.632951736450195, -7.319793701171875, -7.006636142730713, -6.693478107452393, -6.3803205490112305, -6.06716251373291, -5.754004955291748, -5.440847396850586, -5.127689361572266, -4.8145318031311035, -4.501374244689941, -4.188216209411621, -3.875058650970459, -3.5619006156921387, -3.2487430572509766, -2.9355852603912354, -2.622427463531494, -2.309269666671753, -1.9961118698120117, -1.6829540729522705, -1.3697963953018188, -1.0566385984420776, -0.7434808015823364, -0.43032312393188477, -0.11716532707214355, 0.19599246978759766, 0.5091502666473389, 0.8223080039024353, 1.1354657411575317, 1.448623538017273, 1.7617813348770142, 2.074939012527466, 2.388096809387207, 2.7012546062469482, 3.0144124031066895, 3.3275701999664307, 3.640727996826172, 3.953885555267334, 4.267043590545654, 4.580201148986816, 4.893359184265137, 5.206516742706299, 5.519674301147461, 5.832832336425781, 6.145989894866943, 6.459147930145264, 6.772305488586426, 7.085463523864746, 7.398621082305908, 7.71177864074707, 8.02493667602539, 8.338093757629395, 8.651251792907715, 8.964409828186035, 9.277567863464355, 9.59072494506836, 9.90388298034668, 10.217041015625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 11.0, 13.0, 13.0, 5.0, 18.0, 20.0, 22.0, 25.0, 21.0, 29.0, 36.0, 20.0, 44.0, 28.0, 31.0, 46.0, 39.0, 36.0, 41.0, 47.0, 43.0, 41.0, 39.0, 30.0, 36.0, 27.0, 38.0, 28.0, 31.0, 14.0, 19.0, 17.0, 15.0, 10.0, 5.0, 6.0, 11.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1708984375, -1.13165283203125, -1.0924072265625, -1.05316162109375, -1.013916015625, -0.97467041015625, -0.9354248046875, -0.89617919921875, -0.85693359375, -0.81768798828125, -0.7784423828125, -0.73919677734375, -0.699951171875, -0.66070556640625, -0.6214599609375, -0.58221435546875, -0.54296875, -0.50372314453125, -0.4644775390625, -0.42523193359375, -0.385986328125, -0.34674072265625, -0.3074951171875, -0.26824951171875, -0.22900390625, -0.18975830078125, -0.1505126953125, -0.11126708984375, -0.072021484375, -0.03277587890625, 0.0064697265625, 0.04571533203125, 0.0849609375, 0.12420654296875, 0.1634521484375, 0.20269775390625, 0.241943359375, 0.28118896484375, 0.3204345703125, 0.35968017578125, 0.39892578125, 0.43817138671875, 0.4774169921875, 0.51666259765625, 0.555908203125, 0.59515380859375, 0.6343994140625, 0.67364501953125, 0.712890625, 0.75213623046875, 0.7913818359375, 0.83062744140625, 0.869873046875, 0.90911865234375, 0.9483642578125, 0.98760986328125, 1.02685546875, 1.06610107421875, 1.1053466796875, 1.14459228515625, 1.183837890625, 1.22308349609375, 1.2623291015625, 1.30157470703125, 1.3408203125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 9.0, 6.0, 4.0, 12.0, 19.0, 23.0, 49.0, 63.0, 82.0, 148.0, 237.0, 309.0, 530.0, 774.0, 1186.0, 1758.0, 2810.0, 4005.0, 6091.0, 8980.0, 13366.0, 19674.0, 27818.0, 40030.0, 54967.0, 72709.0, 90955.0, 108241.0, 115005.0, 110864.0, 95789.0, 76540.0, 57882.0, 42581.0, 30043.0, 21054.0, 14480.0, 9824.0, 6562.0, 4366.0, 3002.0, 1934.0, 1331.0, 845.0, 537.0, 386.0, 238.0, 169.0, 107.0, 60.0, 33.0, 28.0, 16.0, 13.0, 8.0, 6.0, 2.0, 4.0, 3.0], "bins": [-0.8251953125, -0.8006362915039062, -0.7760772705078125, -0.7515182495117188, -0.726959228515625, -0.7024002075195312, -0.6778411865234375, -0.6532821655273438, -0.62872314453125, -0.6041641235351562, -0.5796051025390625, -0.5550460815429688, -0.530487060546875, -0.5059280395507812, -0.4813690185546875, -0.45680999755859375, -0.4322509765625, -0.40769195556640625, -0.3831329345703125, -0.35857391357421875, -0.334014892578125, -0.30945587158203125, -0.2848968505859375, -0.26033782958984375, -0.23577880859375, -0.21121978759765625, -0.1866607666015625, -0.16210174560546875, -0.137542724609375, -0.11298370361328125, -0.0884246826171875, -0.06386566162109375, -0.039306640625, -0.01474761962890625, 0.0098114013671875, 0.03437042236328125, 0.058929443359375, 0.08348846435546875, 0.1080474853515625, 0.13260650634765625, 0.15716552734375, 0.18172454833984375, 0.2062835693359375, 0.23084259033203125, 0.255401611328125, 0.27996063232421875, 0.3045196533203125, 0.32907867431640625, 0.3536376953125, 0.37819671630859375, 0.4027557373046875, 0.42731475830078125, 0.451873779296875, 0.47643280029296875, 0.5009918212890625, 0.5255508422851562, 0.55010986328125, 0.5746688842773438, 0.5992279052734375, 0.6237869262695312, 0.648345947265625, 0.6729049682617188, 0.6974639892578125, 0.7220230102539062, 0.74658203125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 7.0, 9.0, 10.0, 11.0, 18.0, 22.0, 18.0, 18.0, 20.0, 29.0, 27.0, 26.0, 38.0, 48.0, 29.0, 46.0, 46.0, 43.0, 1069.0, 43.0, 38.0, 32.0, 40.0, 28.0, 29.0, 25.0, 24.0, 21.0, 21.0, 26.0, 28.0, 19.0, 13.0, 17.0, 13.0, 7.0, 11.0, 11.0, 10.0, 9.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 3.0], "bins": [-1.2294921875, -1.1950759887695312, -1.1606597900390625, -1.1262435913085938, -1.091827392578125, -1.0574111938476562, -1.0229949951171875, -0.9885787963867188, -0.95416259765625, -0.9197463989257812, -0.8853302001953125, -0.8509140014648438, -0.816497802734375, -0.7820816040039062, -0.7476654052734375, -0.7132492065429688, -0.6788330078125, -0.6444168090820312, -0.6100006103515625, -0.5755844116210938, -0.541168212890625, -0.5067520141601562, -0.4723358154296875, -0.43791961669921875, -0.40350341796875, -0.36908721923828125, -0.3346710205078125, -0.30025482177734375, -0.265838623046875, -0.23142242431640625, -0.1970062255859375, -0.16259002685546875, -0.128173828125, -0.09375762939453125, -0.0593414306640625, -0.02492523193359375, 0.009490966796875, 0.04390716552734375, 0.0783233642578125, 0.11273956298828125, 0.14715576171875, 0.18157196044921875, 0.2159881591796875, 0.25040435791015625, 0.284820556640625, 0.31923675537109375, 0.3536529541015625, 0.38806915283203125, 0.4224853515625, 0.45690155029296875, 0.4913177490234375, 0.5257339477539062, 0.560150146484375, 0.5945663452148438, 0.6289825439453125, 0.6633987426757812, 0.69781494140625, 0.7322311401367188, 0.7666473388671875, 0.8010635375976562, 0.835479736328125, 0.8698959350585938, 0.9043121337890625, 0.9387283325195312, 0.97314453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 13.0, 7.0, 12.0, 17.0, 26.0, 41.0, 37.0, 74.0, 88.0, 142.0, 226.0, 310.0, 481.0, 743.0, 1217.0, 2190.0, 3265.0, 5810.0, 9554.0, 16881.0, 31860.0, 81336.0, 1502258.0, 330293.0, 52264.0, 24483.0, 13580.0, 7836.0, 4626.0, 2749.0, 1704.0, 1048.0, 662.0, 426.0, 269.0, 181.0, 139.0, 72.0, 56.0, 46.0, 37.0, 21.0, 12.0, 9.0, 8.0, 3.0, 5.0, 1.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.427734375, -1.382843017578125, -1.33795166015625, -1.293060302734375, -1.2481689453125, -1.203277587890625, -1.15838623046875, -1.113494873046875, -1.068603515625, -1.023712158203125, -0.97882080078125, -0.933929443359375, -0.8890380859375, -0.844146728515625, -0.79925537109375, -0.754364013671875, -0.70947265625, -0.664581298828125, -0.61968994140625, -0.574798583984375, -0.5299072265625, -0.485015869140625, -0.44012451171875, -0.395233154296875, -0.350341796875, -0.305450439453125, -0.26055908203125, -0.215667724609375, -0.1707763671875, -0.125885009765625, -0.08099365234375, -0.036102294921875, 0.0087890625, 0.053680419921875, 0.09857177734375, 0.143463134765625, 0.1883544921875, 0.233245849609375, 0.27813720703125, 0.323028564453125, 0.367919921875, 0.412811279296875, 0.45770263671875, 0.502593994140625, 0.5474853515625, 0.592376708984375, 0.63726806640625, 0.682159423828125, 0.72705078125, 0.771942138671875, 0.81683349609375, 0.861724853515625, 0.9066162109375, 0.951507568359375, 0.99639892578125, 1.041290283203125, 1.086181640625, 1.131072998046875, 1.17596435546875, 1.220855712890625, 1.2657470703125, 1.310638427734375, 1.35552978515625, 1.400421142578125, 1.4453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 9.0, 5.0, 8.0, 13.0, 10.0, 13.0, 19.0, 17.0, 34.0, 39.0, 44.0, 54.0, 33.0, 59.0, 50.0, 67.0, 80.0, 69.0, 56.0, 52.0, 37.0, 32.0, 40.0, 35.0, 30.0, 14.0, 23.0, 10.0, 15.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1824951171875, -0.1775188446044922, -0.17254257202148438, -0.16756629943847656, -0.16259002685546875, -0.15761375427246094, -0.15263748168945312, -0.1476612091064453, -0.1426849365234375, -0.1377086639404297, -0.13273239135742188, -0.12775611877441406, -0.12277984619140625, -0.11780357360839844, -0.11282730102539062, -0.10785102844238281, -0.102874755859375, -0.09789848327636719, -0.09292221069335938, -0.08794593811035156, -0.08296966552734375, -0.07799339294433594, -0.07301712036132812, -0.06804084777832031, -0.0630645751953125, -0.05808830261230469, -0.053112030029296875, -0.04813575744628906, -0.04315948486328125, -0.03818321228027344, -0.033206939697265625, -0.028230667114257812, -0.02325439453125, -0.018278121948242188, -0.013301849365234375, -0.008325576782226562, -0.00334930419921875, 0.0016269683837890625, 0.006603240966796875, 0.011579513549804688, 0.0165557861328125, 0.021532058715820312, 0.026508331298828125, 0.03148460388183594, 0.03646087646484375, 0.04143714904785156, 0.046413421630859375, 0.05138969421386719, 0.056365966796875, 0.06134223937988281, 0.06631851196289062, 0.07129478454589844, 0.07627105712890625, 0.08124732971191406, 0.08622360229492188, 0.09119987487792969, 0.0961761474609375, 0.10115242004394531, 0.10612869262695312, 0.11110496520996094, 0.11608123779296875, 0.12105751037597656, 0.12603378295898438, 0.1310100555419922, 0.135986328125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 5.0, 10.0, 7.0, 10.0, 10.0, 22.0, 17.0, 32.0, 49.0, 56.0, 62.0, 69.0, 127.0, 214.0, 456.0, 1069.0, 3674.0, 21573.0, 256672.0, 687994.0, 65106.0, 7774.0, 1885.0, 722.0, 341.0, 200.0, 116.0, 72.0, 53.0, 35.0, 31.0, 20.0, 16.0, 9.0, 6.0, 4.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.728515625, -1.669403076171875, -1.61029052734375, -1.551177978515625, -1.4920654296875, -1.432952880859375, -1.37384033203125, -1.314727783203125, -1.255615234375, -1.196502685546875, -1.13739013671875, -1.078277587890625, -1.0191650390625, -0.960052490234375, -0.90093994140625, -0.841827392578125, -0.78271484375, -0.723602294921875, -0.66448974609375, -0.605377197265625, -0.5462646484375, -0.487152099609375, -0.42803955078125, -0.368927001953125, -0.309814453125, -0.250701904296875, -0.19158935546875, -0.132476806640625, -0.0733642578125, -0.014251708984375, 0.04486083984375, 0.103973388671875, 0.1630859375, 0.222198486328125, 0.28131103515625, 0.340423583984375, 0.3995361328125, 0.458648681640625, 0.51776123046875, 0.576873779296875, 0.635986328125, 0.695098876953125, 0.75421142578125, 0.813323974609375, 0.8724365234375, 0.931549072265625, 0.99066162109375, 1.049774169921875, 1.10888671875, 1.167999267578125, 1.22711181640625, 1.286224365234375, 1.3453369140625, 1.404449462890625, 1.46356201171875, 1.522674560546875, 1.581787109375, 1.640899658203125, 1.70001220703125, 1.759124755859375, 1.8182373046875, 1.877349853515625, 1.93646240234375, 1.995574951171875, 2.0546875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 12.0, 16.0, 56.0, 122.0, 272.0, 326.0, 130.0, 57.0, 17.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2162940502166748, -1.1155431270599365, -1.0147920846939087, -0.9140411615371704, -0.8132901787757874, -0.7125391960144043, -0.611788272857666, -0.511037290096283, -0.4102863073348999, -0.30953532457351685, -0.20878437161445618, -0.10803341865539551, -0.007282435894012451, 0.0934685468673706, 0.1942194700241089, 0.29497045278549194, 0.395721435546875, 0.49647241830825806, 0.5972234010696411, 0.6979743242263794, 0.7987253069877625, 0.8994762897491455, 1.0002272129058838, 1.100978136062622, 1.20172917842865, 1.3024801015853882, 1.403231143951416, 1.5039820671081543, 1.6047329902648926, 1.7054840326309204, 1.8062349557876587, 1.9069859981536865, 2.0077366828918457, 2.108487606048584, 2.2092385292053223, 2.3099894523620605, 2.410740613937378, 2.511491537094116, 2.6122424602508545, 2.7129933834075928, 2.81374454498291, 2.9144954681396484, 3.0152463912963867, 3.115997314453125, 3.2167484760284424, 3.3174993991851807, 3.418250322341919, 3.5190012454986572, 3.6197521686553955, 3.720503091812134, 3.821254014968872, 3.9220051765441895, 4.022756099700928, 4.123507022857666, 4.224257946014404, 4.325008869171143, 4.425759792327881, 4.526510715484619, 4.627261638641357, 4.728012561798096, 4.828763484954834, 4.9295148849487305, 5.030265808105469, 5.131016731262207, 5.231767654418945]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 4.0, 5.0, 12.0, 9.0, 10.0, 14.0, 14.0, 24.0, 29.0, 38.0, 36.0, 41.0, 32.0, 34.0, 44.0, 56.0, 47.0, 56.0, 42.0, 57.0, 47.0, 46.0, 46.0, 51.0, 40.0, 31.0, 21.0, 19.0, 29.0, 15.0, 8.0, 9.0, 5.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4896050691604614, -0.4722776412963867, -0.454950213432312, -0.4376228153705597, -0.420295387506485, -0.4029679596424103, -0.38564056158065796, -0.36831313371658325, -0.35098570585250854, -0.33365827798843384, -0.31633085012435913, -0.2990034520626068, -0.2816760241985321, -0.2643485963344574, -0.24702118337154388, -0.22969377040863037, -0.21236634254455566, -0.19503891468048096, -0.17771150171756744, -0.16038408875465393, -0.14305666089057922, -0.12572923302650452, -0.108401820063591, -0.0910743996500969, -0.07374697923660278, -0.05641955882310867, -0.03909213840961456, -0.021764717996120453, -0.004437297582626343, 0.012890122830867767, 0.030217543244361877, 0.04754496365785599, 0.06487232446670532, 0.08219974488019943, 0.09952716529369354, 0.11685458570718765, 0.13418200612068176, 0.15150943398475647, 0.16883684694766998, 0.1861642599105835, 0.2034916877746582, 0.2208191156387329, 0.23814652860164642, 0.25547394156455994, 0.27280136942863464, 0.29012879729270935, 0.30745619535446167, 0.3247836232185364, 0.3421110510826111, 0.3594384789466858, 0.3767659068107605, 0.3940933048725128, 0.4114207327365875, 0.42874816060066223, 0.44607555866241455, 0.46340298652648926, 0.48073041439056396, 0.49805784225463867, 0.5153852701187134, 0.5327126979827881, 0.5500401258468628, 0.5673674941062927, 0.5846949219703674, 0.6020223498344421, 0.6193497776985168]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 7.0, 4.0, 8.0, 5.0, 9.0, 15.0, 12.0, 9.0, 16.0, 13.0, 21.0, 22.0, 23.0, 24.0, 40.0, 29.0, 31.0, 34.0, 31.0, 34.0, 47.0, 36.0, 38.0, 47.0, 45.0, 40.0, 42.0, 34.0, 29.0, 35.0, 38.0, 29.0, 26.0, 26.0, 18.0, 12.0, 20.0, 12.0, 7.0, 6.0, 9.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1605987548828125, -1.121002197265625, -1.0814056396484375, -1.04180908203125, -1.0022125244140625, -0.962615966796875, -0.9230194091796875, -0.8834228515625, -0.8438262939453125, -0.804229736328125, -0.7646331787109375, -0.72503662109375, -0.6854400634765625, -0.645843505859375, -0.6062469482421875, -0.566650390625, -0.5270538330078125, -0.487457275390625, -0.4478607177734375, -0.40826416015625, -0.3686676025390625, -0.329071044921875, -0.2894744873046875, -0.2498779296875, -0.2102813720703125, -0.170684814453125, -0.1310882568359375, -0.09149169921875, -0.0518951416015625, -0.012298583984375, 0.0272979736328125, 0.06689453125, 0.1064910888671875, 0.146087646484375, 0.1856842041015625, 0.22528076171875, 0.2648773193359375, 0.304473876953125, 0.3440704345703125, 0.3836669921875, 0.4232635498046875, 0.462860107421875, 0.5024566650390625, 0.54205322265625, 0.5816497802734375, 0.621246337890625, 0.6608428955078125, 0.700439453125, 0.7400360107421875, 0.779632568359375, 0.8192291259765625, 0.85882568359375, 0.8984222412109375, 0.938018798828125, 0.9776153564453125, 1.0172119140625, 1.0568084716796875, 1.096405029296875, 1.1360015869140625, 1.17559814453125, 1.2151947021484375, 1.254791259765625, 1.2943878173828125, 1.333984375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 4.0, 13.0, 16.0, 33.0, 36.0, 58.0, 87.0, 113.0, 135.0, 176.0, 248.0, 319.0, 535.0, 736.0, 1054.0, 1549.0, 2425.0, 4148.0, 7298.0, 13810.0, 29861.0, 81582.0, 507256.0, 287017.0, 58656.0, 23526.0, 11422.0, 6189.0, 3436.0, 2200.0, 1361.0, 911.0, 685.0, 463.0, 341.0, 227.0, 178.0, 122.0, 94.0, 78.0, 40.0, 34.0, 21.0, 19.0, 13.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.396484375, -2.32354736328125, -2.2506103515625, -2.17767333984375, -2.104736328125, -2.03179931640625, -1.9588623046875, -1.88592529296875, -1.81298828125, -1.74005126953125, -1.6671142578125, -1.59417724609375, -1.521240234375, -1.44830322265625, -1.3753662109375, -1.30242919921875, -1.2294921875, -1.15655517578125, -1.0836181640625, -1.01068115234375, -0.937744140625, -0.86480712890625, -0.7918701171875, -0.71893310546875, -0.64599609375, -0.57305908203125, -0.5001220703125, -0.42718505859375, -0.354248046875, -0.28131103515625, -0.2083740234375, -0.13543701171875, -0.0625, 0.01043701171875, 0.0833740234375, 0.15631103515625, 0.229248046875, 0.30218505859375, 0.3751220703125, 0.44805908203125, 0.52099609375, 0.59393310546875, 0.6668701171875, 0.73980712890625, 0.812744140625, 0.88568115234375, 0.9586181640625, 1.03155517578125, 1.1044921875, 1.17742919921875, 1.2503662109375, 1.32330322265625, 1.396240234375, 1.46917724609375, 1.5421142578125, 1.61505126953125, 1.68798828125, 1.76092529296875, 1.8338623046875, 1.90679931640625, 1.979736328125, 2.05267333984375, 2.1256103515625, 2.19854736328125, 2.271484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 5.0, 11.0, 8.0, 9.0, 11.0, 20.0, 25.0, 19.0, 16.0, 27.0, 31.0, 47.0, 50.0, 53.0, 45.0, 68.0, 106.0, 358.0, 1562.0, 124.0, 62.0, 46.0, 41.0, 32.0, 46.0, 44.0, 33.0, 20.0, 17.0, 14.0, 19.0, 17.0, 15.0, 9.0, 7.0, 6.0, 6.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.92388916015625, -4.7657470703125, -4.60760498046875, -4.449462890625, -4.29132080078125, -4.1331787109375, -3.97503662109375, -3.81689453125, -3.65875244140625, -3.5006103515625, -3.34246826171875, -3.184326171875, -3.02618408203125, -2.8680419921875, -2.70989990234375, -2.5517578125, -2.39361572265625, -2.2354736328125, -2.07733154296875, -1.919189453125, -1.76104736328125, -1.6029052734375, -1.44476318359375, -1.28662109375, -1.12847900390625, -0.9703369140625, -0.81219482421875, -0.654052734375, -0.49591064453125, -0.3377685546875, -0.17962646484375, -0.021484375, 0.13665771484375, 0.2947998046875, 0.45294189453125, 0.611083984375, 0.76922607421875, 0.9273681640625, 1.08551025390625, 1.24365234375, 1.40179443359375, 1.5599365234375, 1.71807861328125, 1.876220703125, 2.03436279296875, 2.1925048828125, 2.35064697265625, 2.5087890625, 2.66693115234375, 2.8250732421875, 2.98321533203125, 3.141357421875, 3.29949951171875, 3.4576416015625, 3.61578369140625, 3.77392578125, 3.93206787109375, 4.0902099609375, 4.24835205078125, 4.406494140625, 4.56463623046875, 4.7227783203125, 4.88092041015625, 5.0390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 12.0, 7.0, 9.0, 34.0, 27.0, 30.0, 56.0, 95.0, 172.0, 266.0, 562.0, 1771.0, 10484.0, 221686.0, 2871414.0, 33350.0, 3819.0, 965.0, 379.0, 212.0, 121.0, 67.0, 53.0, 38.0, 20.0, 14.0, 16.0, 10.0, 10.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.1937255859375, -9.832763671875, -9.4718017578125, -9.11083984375, -8.7498779296875, -8.388916015625, -8.0279541015625, -7.6669921875, -7.3060302734375, -6.945068359375, -6.5841064453125, -6.22314453125, -5.8621826171875, -5.501220703125, -5.1402587890625, -4.779296875, -4.4183349609375, -4.057373046875, -3.6964111328125, -3.33544921875, -2.9744873046875, -2.613525390625, -2.2525634765625, -1.8916015625, -1.5306396484375, -1.169677734375, -0.8087158203125, -0.44775390625, -0.0867919921875, 0.274169921875, 0.6351318359375, 0.99609375, 1.3570556640625, 1.718017578125, 2.0789794921875, 2.43994140625, 2.8009033203125, 3.161865234375, 3.5228271484375, 3.8837890625, 4.2447509765625, 4.605712890625, 4.9666748046875, 5.32763671875, 5.6885986328125, 6.049560546875, 6.4105224609375, 6.771484375, 7.1324462890625, 7.493408203125, 7.8543701171875, 8.21533203125, 8.5762939453125, 8.937255859375, 9.2982177734375, 9.6591796875, 10.0201416015625, 10.381103515625, 10.7420654296875, 11.10302734375, 11.4639892578125, 11.824951171875, 12.1859130859375, 12.546875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [13.0, 96.0, 466.0, 385.0, 53.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4695868492126465, -2.908106565475464, -1.3466262817382812, 0.21485376358032227, 1.776334285736084, 3.3378148078918457, 4.899294376373291, 6.460774898529053, 8.022254943847656, 9.583735466003418, 11.14521598815918, 12.706695556640625, 14.268176078796387, 15.829656600952148, 17.391136169433594, 18.952617645263672, 20.514097213745117, 22.075576782226562, 23.63705825805664, 25.198537826538086, 26.76001739501953, 28.32149887084961, 29.882978439331055, 31.4444580078125, 33.00593948364258, 34.567420959472656, 36.12889862060547, 37.69038009643555, 39.251861572265625, 40.81333923339844, 42.374820709228516, 43.936302185058594, 45.497779846191406, 47.059261322021484, 48.6207389831543, 50.182220458984375, 51.74370193481445, 53.30518341064453, 54.866661071777344, 56.42814254760742, 57.9896240234375, 59.55110549926758, 61.11258316040039, 62.67406463623047, 64.23554229736328, 65.79702758789062, 67.35850524902344, 68.91998291015625, 70.48146057128906, 72.04293823242188, 73.60442352294922, 75.16590118408203, 76.72737884521484, 78.28886413574219, 79.850341796875, 81.41181945800781, 82.97330474853516, 84.53478240966797, 86.09626770019531, 87.65774536132812, 89.21922302246094, 90.78070831298828, 92.3421859741211, 93.9036636352539, 95.46514892578125]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 11.0, 7.0, 12.0, 11.0, 15.0, 21.0, 15.0, 26.0, 21.0, 34.0, 28.0, 41.0, 35.0, 42.0, 34.0, 47.0, 39.0, 51.0, 31.0, 43.0, 44.0, 44.0, 36.0, 23.0, 41.0, 26.0, 36.0, 21.0, 28.0, 16.0, 20.0, 17.0, 19.0, 13.0, 8.0, 14.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.224444389343262, -9.825515747070312, -9.426587104797363, -9.027658462524414, -8.628729820251465, -8.229801177978516, -7.830872058868408, -7.431943416595459, -7.03301477432251, -6.6340861320495605, -6.235157489776611, -5.836228370666504, -5.437299728393555, -5.0383710861206055, -4.639442443847656, -4.240513801574707, -3.841585159301758, -3.4426565170288086, -3.0437278747558594, -2.644798994064331, -2.245870351791382, -1.8469417095184326, -1.4480128288269043, -1.049084186553955, -0.6501555442810059, -0.25122684240341187, 0.14770185947418213, 0.5466306209564209, 0.9455592632293701, 1.3444879055023193, 1.7434167861938477, 2.142345428466797, 2.5412750244140625, 2.9402036666870117, 3.339132308959961, 3.7380611896514893, 4.136989593505859, 4.535918235778809, 4.934847354888916, 5.333775997161865, 5.7327046394348145, 6.131633281707764, 6.530561923980713, 6.92949104309082, 7.3284196853637695, 7.727348327636719, 8.126276969909668, 8.525205612182617, 8.924134254455566, 9.323062896728516, 9.721991539001465, 10.120920181274414, 10.519848823547363, 10.918777465820312, 11.317707061767578, 11.716634750366211, 12.115564346313477, 12.514492988586426, 12.913421630859375, 13.312350273132324, 13.711278915405273, 14.110207557678223, 14.509136199951172, 14.908065795898438, 15.30699348449707]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 9.0, 9.0, 9.0, 9.0, 19.0, 17.0, 17.0, 17.0, 23.0, 19.0, 35.0, 31.0, 30.0, 32.0, 48.0, 31.0, 34.0, 35.0, 41.0, 47.0, 39.0, 46.0, 49.0, 24.0, 27.0, 35.0, 34.0, 41.0, 31.0, 30.0, 29.0, 16.0, 12.0, 10.0, 9.0, 13.0, 9.0, 8.0, 6.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.205078125, -1.1639862060546875, -1.122894287109375, -1.0818023681640625, -1.04071044921875, -0.9996185302734375, -0.958526611328125, -0.9174346923828125, -0.8763427734375, -0.8352508544921875, -0.794158935546875, -0.7530670166015625, -0.71197509765625, -0.6708831787109375, -0.629791259765625, -0.5886993408203125, -0.547607421875, -0.5065155029296875, -0.465423583984375, -0.4243316650390625, -0.38323974609375, -0.3421478271484375, -0.301055908203125, -0.2599639892578125, -0.2188720703125, -0.1777801513671875, -0.136688232421875, -0.0955963134765625, -0.05450439453125, -0.0134124755859375, 0.027679443359375, 0.0687713623046875, 0.10986328125, 0.1509552001953125, 0.192047119140625, 0.2331390380859375, 0.27423095703125, 0.3153228759765625, 0.356414794921875, 0.3975067138671875, 0.4385986328125, 0.4796905517578125, 0.520782470703125, 0.5618743896484375, 0.60296630859375, 0.6440582275390625, 0.685150146484375, 0.7262420654296875, 0.767333984375, 0.8084259033203125, 0.849517822265625, 0.8906097412109375, 0.93170166015625, 0.9727935791015625, 1.013885498046875, 1.0549774169921875, 1.0960693359375, 1.1371612548828125, 1.178253173828125, 1.2193450927734375, 1.26043701171875, 1.3015289306640625, 1.342620849609375, 1.3837127685546875, 1.4248046875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 13.0, 8.0, 15.0, 18.0, 40.0, 50.0, 62.0, 95.0, 163.0, 262.0, 521.0, 838.0, 1509.0, 2932.0, 6066.0, 13158.0, 32105.0, 102605.0, 806589.0, 2765611.0, 352263.0, 65652.0, 23328.0, 10066.0, 4743.0, 2450.0, 1236.0, 724.0, 408.0, 260.0, 173.0, 95.0, 67.0, 50.0, 29.0, 24.0, 15.0, 11.0, 8.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.037109375, -2.921783447265625, -2.80645751953125, -2.691131591796875, -2.5758056640625, -2.460479736328125, -2.34515380859375, -2.229827880859375, -2.114501953125, -1.999176025390625, -1.88385009765625, -1.768524169921875, -1.6531982421875, -1.537872314453125, -1.42254638671875, -1.307220458984375, -1.19189453125, -1.076568603515625, -0.96124267578125, -0.845916748046875, -0.7305908203125, -0.615264892578125, -0.49993896484375, -0.384613037109375, -0.269287109375, -0.153961181640625, -0.03863525390625, 0.076690673828125, 0.1920166015625, 0.307342529296875, 0.42266845703125, 0.537994384765625, 0.6533203125, 0.768646240234375, 0.88397216796875, 0.999298095703125, 1.1146240234375, 1.229949951171875, 1.34527587890625, 1.460601806640625, 1.575927734375, 1.691253662109375, 1.80657958984375, 1.921905517578125, 2.0372314453125, 2.152557373046875, 2.26788330078125, 2.383209228515625, 2.49853515625, 2.613861083984375, 2.72918701171875, 2.844512939453125, 2.9598388671875, 3.075164794921875, 3.19049072265625, 3.305816650390625, 3.421142578125, 3.536468505859375, 3.65179443359375, 3.767120361328125, 3.8824462890625, 3.997772216796875, 4.11309814453125, 4.228424072265625, 4.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 18.0, 22.0, 26.0, 33.0, 67.0, 99.0, 134.0, 260.0, 491.0, 952.0, 790.0, 503.0, 218.0, 157.0, 88.0, 47.0, 51.0, 26.0, 23.0, 12.0, 12.0, 7.0, 8.0, 9.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.65625, -5.51104736328125, -5.3658447265625, -5.22064208984375, -5.075439453125, -4.93023681640625, -4.7850341796875, -4.63983154296875, -4.49462890625, -4.34942626953125, -4.2042236328125, -4.05902099609375, -3.913818359375, -3.76861572265625, -3.6234130859375, -3.47821044921875, -3.3330078125, -3.18780517578125, -3.0426025390625, -2.89739990234375, -2.752197265625, -2.60699462890625, -2.4617919921875, -2.31658935546875, -2.17138671875, -2.02618408203125, -1.8809814453125, -1.73577880859375, -1.590576171875, -1.44537353515625, -1.3001708984375, -1.15496826171875, -1.009765625, -0.86456298828125, -0.7193603515625, -0.57415771484375, -0.428955078125, -0.28375244140625, -0.1385498046875, 0.00665283203125, 0.15185546875, 0.29705810546875, 0.4422607421875, 0.58746337890625, 0.732666015625, 0.87786865234375, 1.0230712890625, 1.16827392578125, 1.3134765625, 1.45867919921875, 1.6038818359375, 1.74908447265625, 1.894287109375, 2.03948974609375, 2.1846923828125, 2.32989501953125, 2.47509765625, 2.62030029296875, 2.7655029296875, 2.91070556640625, 3.055908203125, 3.20111083984375, 3.3463134765625, 3.49151611328125, 3.63671875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 5.0, 8.0, 10.0, 18.0, 29.0, 60.0, 122.0, 245.0, 634.0, 2174.0, 9261.0, 56423.0, 1144241.0, 2871917.0, 91575.0, 13297.0, 2891.0, 825.0, 294.0, 118.0, 69.0, 28.0, 19.0, 14.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.7401123046875, -8.417724609375, -8.0953369140625, -7.77294921875, -7.4505615234375, -7.128173828125, -6.8057861328125, -6.4833984375, -6.1610107421875, -5.838623046875, -5.5162353515625, -5.19384765625, -4.8714599609375, -4.549072265625, -4.2266845703125, -3.904296875, -3.5819091796875, -3.259521484375, -2.9371337890625, -2.61474609375, -2.2923583984375, -1.969970703125, -1.6475830078125, -1.3251953125, -1.0028076171875, -0.680419921875, -0.3580322265625, -0.03564453125, 0.2867431640625, 0.609130859375, 0.9315185546875, 1.25390625, 1.5762939453125, 1.898681640625, 2.2210693359375, 2.54345703125, 2.8658447265625, 3.188232421875, 3.5106201171875, 3.8330078125, 4.1553955078125, 4.477783203125, 4.8001708984375, 5.12255859375, 5.4449462890625, 5.767333984375, 6.0897216796875, 6.412109375, 6.7344970703125, 7.056884765625, 7.3792724609375, 7.70166015625, 8.0240478515625, 8.346435546875, 8.6688232421875, 8.9912109375, 9.3135986328125, 9.635986328125, 9.9583740234375, 10.28076171875, 10.6031494140625, 10.925537109375, 11.2479248046875, 11.5703125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 14.0, 41.0, 41.0, 85.0, 141.0, 186.0, 183.0, 136.0, 89.0, 47.0, 31.0, 12.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.65752410888672, -32.635066986083984, -31.612611770629883, -30.59015464782715, -29.567699432373047, -28.545242309570312, -27.522785186767578, -26.500329971313477, -25.477874755859375, -24.45541763305664, -23.43296241760254, -22.410505294799805, -21.388050079345703, -20.36559295654297, -19.343135833740234, -18.320680618286133, -17.2982234954834, -16.275766372680664, -15.253311157226562, -14.230854034423828, -13.208398818969727, -12.185941696166992, -11.163485527038574, -10.141029357910156, -9.118573188781738, -8.09611701965332, -7.073660850524902, -6.051204204559326, -5.028748035430908, -4.00629186630249, -2.983835220336914, -1.961379051208496, -0.9389209747314453, 0.08353531360626221, 1.1059916019439697, 2.128448009490967, 3.1509041786193848, 4.173360347747803, 5.195816993713379, 6.218273162841797, 7.240729331970215, 8.263185501098633, 9.28564167022705, 10.308097839355469, 11.330554962158203, 12.353010177612305, 13.375467300415039, 14.397923469543457, 15.420379638671875, 16.44283676147461, 17.46529197692871, 18.487749099731445, 19.510204315185547, 20.53266143798828, 21.555118560791016, 22.577573776245117, 23.60002899169922, 24.622486114501953, 25.644941329956055, 26.66739845275879, 27.68985366821289, 28.712310791015625, 29.73476791381836, 30.75722312927246, 31.779680252075195]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 7.0, 2.0, 4.0, 7.0, 7.0, 10.0, 12.0, 5.0, 11.0, 12.0, 14.0, 13.0, 23.0, 21.0, 15.0, 26.0, 27.0, 24.0, 36.0, 41.0, 47.0, 37.0, 39.0, 43.0, 29.0, 30.0, 29.0, 47.0, 36.0, 30.0, 30.0, 36.0, 38.0, 23.0, 21.0, 31.0, 25.0, 13.0, 12.0, 13.0, 10.0, 13.0, 14.0, 13.0, 10.0, 5.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.73436450958252, -8.430671691894531, -8.126978874206543, -7.8232855796813965, -7.51959228515625, -7.215899467468262, -6.912206649780273, -6.608513832092285, -6.304820537567139, -6.00112771987915, -5.697434425354004, -5.393741607666016, -5.090048789978027, -4.786355495452881, -4.482662677764893, -4.178969383239746, -3.875276565551758, -3.5715835094451904, -3.267890453338623, -2.9641976356506348, -2.6605045795440674, -2.3568115234375, -2.0531187057495117, -1.7494256496429443, -1.445732593536377, -1.1420395374298096, -0.8383466005325317, -0.5346536040306091, -0.23096060752868652, 0.07273244857788086, 0.3764253854751587, 0.6801183223724365, 0.9838123321533203, 1.2875053882598877, 1.5911983251571655, 1.8948912620544434, 2.1985843181610107, 2.502277374267578, 2.8059701919555664, 3.109663248062134, 3.413356304168701, 3.7170493602752686, 4.020742416381836, 4.324435234069824, 4.6281280517578125, 4.931821346282959, 5.235514163970947, 5.539207458496094, 5.842900276184082, 6.14659309387207, 6.450286388397217, 6.753979206085205, 7.057672500610352, 7.36136531829834, 7.665058135986328, 7.968750953674316, 8.272443771362305, 8.576136589050293, 8.879829406738281, 9.183523178100586, 9.487215995788574, 9.790908813476562, 10.09460163116455, 10.398294448852539, 10.701988220214844]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 1.0, 3.0, 10.0, 3.0, 11.0, 12.0, 18.0, 19.0, 17.0, 21.0, 23.0, 23.0, 45.0, 37.0, 23.0, 34.0, 43.0, 38.0, 43.0, 44.0, 44.0, 49.0, 41.0, 54.0, 39.0, 41.0, 37.0, 34.0, 27.0, 31.0, 22.0, 15.0, 27.0, 15.0, 9.0, 9.0, 13.0, 8.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.210479736328125, -1.16607666015625, -1.121673583984375, -1.0772705078125, -1.032867431640625, -0.98846435546875, -0.944061279296875, -0.899658203125, -0.855255126953125, -0.81085205078125, -0.766448974609375, -0.7220458984375, -0.677642822265625, -0.63323974609375, -0.588836669921875, -0.54443359375, -0.500030517578125, -0.45562744140625, -0.411224365234375, -0.3668212890625, -0.322418212890625, -0.27801513671875, -0.233612060546875, -0.189208984375, -0.144805908203125, -0.10040283203125, -0.055999755859375, -0.0115966796875, 0.032806396484375, 0.07720947265625, 0.121612548828125, 0.166015625, 0.210418701171875, 0.25482177734375, 0.299224853515625, 0.3436279296875, 0.388031005859375, 0.43243408203125, 0.476837158203125, 0.521240234375, 0.565643310546875, 0.61004638671875, 0.654449462890625, 0.6988525390625, 0.743255615234375, 0.78765869140625, 0.832061767578125, 0.87646484375, 0.920867919921875, 0.96527099609375, 1.009674072265625, 1.0540771484375, 1.098480224609375, 1.14288330078125, 1.187286376953125, 1.231689453125, 1.276092529296875, 1.32049560546875, 1.364898681640625, 1.4093017578125, 1.453704833984375, 1.49810791015625, 1.542510986328125, 1.5869140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 9.0, 21.0, 32.0, 25.0, 46.0, 71.0, 108.0, 167.0, 278.0, 398.0, 652.0, 988.0, 1513.0, 2268.0, 3633.0, 5691.0, 8935.0, 13843.0, 21307.0, 31935.0, 46982.0, 68256.0, 110059.0, 294261.0, 181770.0, 84054.0, 56925.0, 39345.0, 26438.0, 17308.0, 11301.0, 7186.0, 4565.0, 2927.0, 1776.0, 1213.0, 756.0, 535.0, 361.0, 209.0, 136.0, 101.0, 57.0, 42.0, 22.0, 13.0, 13.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.80517578125, -0.7798233032226562, -0.7544708251953125, -0.7291183471679688, -0.703765869140625, -0.6784133911132812, -0.6530609130859375, -0.6277084350585938, -0.60235595703125, -0.5770034790039062, -0.5516510009765625, -0.5262985229492188, -0.500946044921875, -0.47559356689453125, -0.4502410888671875, -0.42488861083984375, -0.3995361328125, -0.37418365478515625, -0.3488311767578125, -0.32347869873046875, -0.298126220703125, -0.27277374267578125, -0.2474212646484375, -0.22206878662109375, -0.19671630859375, -0.17136383056640625, -0.1460113525390625, -0.12065887451171875, -0.095306396484375, -0.06995391845703125, -0.0446014404296875, -0.01924896240234375, 0.006103515625, 0.03145599365234375, 0.0568084716796875, 0.08216094970703125, 0.107513427734375, 0.13286590576171875, 0.1582183837890625, 0.18357086181640625, 0.20892333984375, 0.23427581787109375, 0.2596282958984375, 0.28498077392578125, 0.310333251953125, 0.33568572998046875, 0.3610382080078125, 0.38639068603515625, 0.4117431640625, 0.43709564208984375, 0.4624481201171875, 0.48780059814453125, 0.513153076171875, 0.5385055541992188, 0.5638580322265625, 0.5892105102539062, 0.61456298828125, 0.6399154663085938, 0.6652679443359375, 0.6906204223632812, 0.715972900390625, 0.7413253784179688, 0.7666778564453125, 0.7920303344726562, 0.8173828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 11.0, 13.0, 14.0, 7.0, 12.0, 24.0, 24.0, 27.0, 30.0, 28.0, 43.0, 41.0, 38.0, 37.0, 55.0, 43.0, 43.0, 1066.0, 51.0, 49.0, 42.0, 45.0, 42.0, 31.0, 35.0, 30.0, 25.0, 17.0, 26.0, 15.0, 9.0, 17.0, 6.0, 5.0, 10.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.275634765625, -1.23583984375, -1.196044921875, -1.15625, -1.116455078125, -1.07666015625, -1.036865234375, -0.9970703125, -0.957275390625, -0.91748046875, -0.877685546875, -0.837890625, -0.798095703125, -0.75830078125, -0.718505859375, -0.6787109375, -0.638916015625, -0.59912109375, -0.559326171875, -0.51953125, -0.479736328125, -0.43994140625, -0.400146484375, -0.3603515625, -0.320556640625, -0.28076171875, -0.240966796875, -0.201171875, -0.161376953125, -0.12158203125, -0.081787109375, -0.0419921875, -0.002197265625, 0.03759765625, 0.077392578125, 0.1171875, 0.156982421875, 0.19677734375, 0.236572265625, 0.2763671875, 0.316162109375, 0.35595703125, 0.395751953125, 0.435546875, 0.475341796875, 0.51513671875, 0.554931640625, 0.5947265625, 0.634521484375, 0.67431640625, 0.714111328125, 0.75390625, 0.793701171875, 0.83349609375, 0.873291015625, 0.9130859375, 0.952880859375, 0.99267578125, 1.032470703125, 1.072265625, 1.112060546875, 1.15185546875, 1.191650390625, 1.2314453125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 11.0, 9.0, 13.0, 25.0, 31.0, 47.0, 63.0, 81.0, 99.0, 182.0, 209.0, 329.0, 560.0, 864.0, 1340.0, 2057.0, 3296.0, 5254.0, 8762.0, 15705.0, 33174.0, 183838.0, 1716074.0, 70746.0, 23377.0, 12128.0, 7080.0, 4200.0, 2667.0, 1685.0, 1112.0, 702.0, 455.0, 270.0, 196.0, 138.0, 94.0, 68.0, 59.0, 31.0, 25.0, 19.0, 12.0, 12.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2781219482421875, -1.235931396484375, -1.1937408447265625, -1.15155029296875, -1.1093597412109375, -1.067169189453125, -1.0249786376953125, -0.9827880859375, -0.9405975341796875, -0.898406982421875, -0.8562164306640625, -0.81402587890625, -0.7718353271484375, -0.729644775390625, -0.6874542236328125, -0.645263671875, -0.6030731201171875, -0.560882568359375, -0.5186920166015625, -0.47650146484375, -0.4343109130859375, -0.392120361328125, -0.3499298095703125, -0.3077392578125, -0.2655487060546875, -0.223358154296875, -0.1811676025390625, -0.13897705078125, -0.0967864990234375, -0.054595947265625, -0.0124053955078125, 0.02978515625, 0.0719757080078125, 0.114166259765625, 0.1563568115234375, 0.19854736328125, 0.2407379150390625, 0.282928466796875, 0.3251190185546875, 0.3673095703125, 0.4095001220703125, 0.451690673828125, 0.4938812255859375, 0.53607177734375, 0.5782623291015625, 0.620452880859375, 0.6626434326171875, 0.704833984375, 0.7470245361328125, 0.789215087890625, 0.8314056396484375, 0.87359619140625, 0.9157867431640625, 0.957977294921875, 1.0001678466796875, 1.0423583984375, 1.0845489501953125, 1.126739501953125, 1.1689300537109375, 1.21112060546875, 1.2533111572265625, 1.295501708984375, 1.3376922607421875, 1.3798828125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 1.0, 7.0, 4.0, 7.0, 3.0, 7.0, 11.0, 9.0, 11.0, 15.0, 17.0, 20.0, 24.0, 29.0, 27.0, 36.0, 44.0, 99.0, 146.0, 113.0, 68.0, 57.0, 32.0, 23.0, 22.0, 28.0, 17.0, 17.0, 13.0, 18.0, 13.0, 12.0, 9.0, 8.0, 1.0, 7.0, 7.0, 3.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0999755859375, -0.09701728820800781, -0.09405899047851562, -0.09110069274902344, -0.08814239501953125, -0.08518409729003906, -0.08222579956054688, -0.07926750183105469, -0.0763092041015625, -0.07335090637207031, -0.07039260864257812, -0.06743431091308594, -0.06447601318359375, -0.06151771545410156, -0.058559417724609375, -0.05560111999511719, -0.052642822265625, -0.04968452453613281, -0.046726226806640625, -0.04376792907714844, -0.04080963134765625, -0.03785133361816406, -0.034893035888671875, -0.03193473815917969, -0.0289764404296875, -0.026018142700195312, -0.023059844970703125, -0.020101547241210938, -0.01714324951171875, -0.014184951782226562, -0.011226654052734375, -0.008268356323242188, -0.00531005859375, -0.0023517608642578125, 0.000606536865234375, 0.0035648345947265625, 0.00652313232421875, 0.009481430053710938, 0.012439727783203125, 0.015398025512695312, 0.0183563232421875, 0.021314620971679688, 0.024272918701171875, 0.027231216430664062, 0.03018951416015625, 0.03314781188964844, 0.036106109619140625, 0.03906440734863281, 0.042022705078125, 0.04498100280761719, 0.047939300537109375, 0.05089759826660156, 0.05385589599609375, 0.05681419372558594, 0.059772491455078125, 0.06273078918457031, 0.0656890869140625, 0.06864738464355469, 0.07160568237304688, 0.07456398010253906, 0.07752227783203125, 0.08048057556152344, 0.08343887329101562, 0.08639717102050781, 0.08935546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 9.0, 6.0, 10.0, 17.0, 11.0, 20.0, 27.0, 48.0, 39.0, 66.0, 71.0, 113.0, 241.0, 740.0, 3079.0, 18078.0, 177466.0, 790770.0, 48400.0, 6890.0, 1473.0, 404.0, 162.0, 110.0, 63.0, 52.0, 38.0, 40.0, 30.0, 17.0, 17.0, 7.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2216796875, -1.1825714111328125, -1.143463134765625, -1.1043548583984375, -1.06524658203125, -1.0261383056640625, -0.987030029296875, -0.9479217529296875, -0.9088134765625, -0.8697052001953125, -0.830596923828125, -0.7914886474609375, -0.75238037109375, -0.7132720947265625, -0.674163818359375, -0.6350555419921875, -0.595947265625, -0.5568389892578125, -0.517730712890625, -0.4786224365234375, -0.43951416015625, -0.4004058837890625, -0.361297607421875, -0.3221893310546875, -0.2830810546875, -0.2439727783203125, -0.204864501953125, -0.1657562255859375, -0.12664794921875, -0.0875396728515625, -0.048431396484375, -0.0093231201171875, 0.02978515625, 0.0688934326171875, 0.108001708984375, 0.1471099853515625, 0.18621826171875, 0.2253265380859375, 0.264434814453125, 0.3035430908203125, 0.3426513671875, 0.3817596435546875, 0.420867919921875, 0.4599761962890625, 0.49908447265625, 0.5381927490234375, 0.577301025390625, 0.6164093017578125, 0.655517578125, 0.6946258544921875, 0.733734130859375, 0.7728424072265625, 0.81195068359375, 0.8510589599609375, 0.890167236328125, 0.9292755126953125, 0.9683837890625, 1.0074920654296875, 1.046600341796875, 1.0857086181640625, 1.12481689453125, 1.1639251708984375, 1.203033447265625, 1.2421417236328125, 1.28125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 9.0, 18.0, 37.0, 76.0, 181.0, 266.0, 212.0, 127.0, 42.0, 29.0, 6.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6000566482543945, -1.5565357208251953, -1.513014793395996, -1.4694938659667969, -1.4259730577468872, -1.382452130317688, -1.3389312028884888, -1.2954102754592896, -1.2518894672393799, -1.2083685398101807, -1.1648476123809814, -1.1213266849517822, -1.0778058767318726, -1.0342849493026733, -0.9907640218734741, -0.9472430944442749, -0.9037221670150757, -0.8602012395858765, -0.816680371761322, -0.7731594443321228, -0.7296385765075684, -0.6861176490783691, -0.6425967216491699, -0.5990757942199707, -0.5555549263954163, -0.512033998966217, -0.4685131311416626, -0.4249922037124634, -0.38147130608558655, -0.3379504084587097, -0.2944294810295105, -0.25090858340263367, -0.20738756656646729, -0.16386666893959045, -0.12034575641155243, -0.0768248438835144, -0.03330394625663757, 0.010216951370239258, 0.05373787879943848, 0.09725877642631531, 0.14077967405319214, 0.18430057168006897, 0.227821484208107, 0.271342396736145, 0.31486329436302185, 0.3583841919898987, 0.4019051194190979, 0.44542601704597473, 0.48894691467285156, 0.5324678421020508, 0.5759887099266052, 0.6195096373558044, 0.6630305051803589, 0.7065514326095581, 0.7500723600387573, 0.7935932874679565, 0.837114155292511, 0.8806350827217102, 0.9241559505462646, 0.9676768779754639, 1.011197805404663, 1.0547187328338623, 1.0982396602630615, 1.1417604684829712, 1.1852813959121704]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 9.0, 1.0, 8.0, 7.0, 8.0, 11.0, 20.0, 19.0, 25.0, 21.0, 23.0, 26.0, 28.0, 31.0, 27.0, 38.0, 34.0, 38.0, 48.0, 39.0, 42.0, 40.0, 31.0, 50.0, 42.0, 49.0, 37.0, 36.0, 25.0, 30.0, 27.0, 22.0, 12.0, 14.0, 15.0, 11.0, 12.0, 10.0, 14.0, 12.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.35726022720336914, -0.3468080163002014, -0.3363558053970337, -0.32590359449386597, -0.31545135378837585, -0.30499914288520813, -0.2945469319820404, -0.2840947210788727, -0.27364251017570496, -0.26319029927253723, -0.2527380883693695, -0.2422858625650406, -0.23183365166187286, -0.22138142585754395, -0.21092921495437622, -0.2004770040512085, -0.19002477824687958, -0.17957256734371185, -0.16912034153938293, -0.1586681306362152, -0.14821591973304749, -0.13776370882987976, -0.12731148302555084, -0.11685927212238312, -0.1064070537686348, -0.09595483541488647, -0.08550262451171875, -0.07505040615797043, -0.0645981878042221, -0.05414597690105438, -0.04369375854730606, -0.033241547644138336, -0.022789329290390015, -0.012337113730609417, -0.0018848981708288193, 0.008567318320274353, 0.019019532948732376, 0.0294717475771904, 0.03992396593093872, 0.050376176834106445, 0.06082839518785477, 0.07128061354160309, 0.08173282444477081, 0.09218504279851913, 0.10263726115226746, 0.11308947205543518, 0.1235416904091835, 0.13399389386177063, 0.14444611966609955, 0.15489833056926727, 0.1653505563735962, 0.17580276727676392, 0.18625497817993164, 0.19670718908309937, 0.20715941488742828, 0.217611625790596, 0.22806385159492493, 0.23851606249809265, 0.24896828830242157, 0.2594205141067505, 0.2698727250099182, 0.28032493591308594, 0.29077714681625366, 0.3012293577194214, 0.3116815686225891]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 12.0, 17.0, 16.0, 18.0, 22.0, 25.0, 21.0, 30.0, 44.0, 33.0, 24.0, 34.0, 49.0, 39.0, 48.0, 38.0, 52.0, 46.0, 45.0, 46.0, 39.0, 33.0, 37.0, 33.0, 32.0, 23.0, 17.0, 27.0, 17.0, 11.0, 10.0, 13.0, 7.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.231903076171875, -1.18743896484375, -1.142974853515625, -1.0985107421875, -1.054046630859375, -1.00958251953125, -0.965118408203125, -0.920654296875, -0.876190185546875, -0.83172607421875, -0.787261962890625, -0.7427978515625, -0.698333740234375, -0.65386962890625, -0.609405517578125, -0.56494140625, -0.520477294921875, -0.47601318359375, -0.431549072265625, -0.3870849609375, -0.342620849609375, -0.29815673828125, -0.253692626953125, -0.209228515625, -0.164764404296875, -0.12030029296875, -0.075836181640625, -0.0313720703125, 0.013092041015625, 0.05755615234375, 0.102020263671875, 0.146484375, 0.190948486328125, 0.23541259765625, 0.279876708984375, 0.3243408203125, 0.368804931640625, 0.41326904296875, 0.457733154296875, 0.502197265625, 0.546661376953125, 0.59112548828125, 0.635589599609375, 0.6800537109375, 0.724517822265625, 0.76898193359375, 0.813446044921875, 0.85791015625, 0.902374267578125, 0.94683837890625, 0.991302490234375, 1.0357666015625, 1.080230712890625, 1.12469482421875, 1.169158935546875, 1.213623046875, 1.258087158203125, 1.30255126953125, 1.347015380859375, 1.3914794921875, 1.435943603515625, 1.48040771484375, 1.524871826171875, 1.5693359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 8.0, 21.0, 36.0, 27.0, 64.0, 99.0, 145.0, 229.0, 320.0, 467.0, 754.0, 1160.0, 1829.0, 3023.0, 5459.0, 10462.0, 22576.0, 57743.0, 207450.0, 515768.0, 138098.0, 44332.0, 18251.0, 8430.0, 4556.0, 2630.0, 1609.0, 1032.0, 691.0, 417.0, 287.0, 191.0, 138.0, 76.0, 54.0, 38.0, 22.0, 13.0, 12.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.6695556640625, -2.575439453125, -2.4813232421875, -2.38720703125, -2.2930908203125, -2.198974609375, -2.1048583984375, -2.0107421875, -1.9166259765625, -1.822509765625, -1.7283935546875, -1.63427734375, -1.5401611328125, -1.446044921875, -1.3519287109375, -1.2578125, -1.1636962890625, -1.069580078125, -0.9754638671875, -0.88134765625, -0.7872314453125, -0.693115234375, -0.5989990234375, -0.5048828125, -0.4107666015625, -0.316650390625, -0.2225341796875, -0.12841796875, -0.0343017578125, 0.059814453125, 0.1539306640625, 0.248046875, 0.3421630859375, 0.436279296875, 0.5303955078125, 0.62451171875, 0.7186279296875, 0.812744140625, 0.9068603515625, 1.0009765625, 1.0950927734375, 1.189208984375, 1.2833251953125, 1.37744140625, 1.4715576171875, 1.565673828125, 1.6597900390625, 1.75390625, 1.8480224609375, 1.942138671875, 2.0362548828125, 2.13037109375, 2.2244873046875, 2.318603515625, 2.4127197265625, 2.5068359375, 2.6009521484375, 2.695068359375, 2.7891845703125, 2.88330078125, 2.9774169921875, 3.071533203125, 3.1656494140625, 3.259765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 10.0, 11.0, 17.0, 9.0, 8.0, 18.0, 14.0, 32.0, 33.0, 29.0, 29.0, 37.0, 44.0, 57.0, 65.0, 83.0, 128.0, 240.0, 1386.0, 216.0, 117.0, 68.0, 47.0, 45.0, 29.0, 44.0, 40.0, 32.0, 24.0, 20.0, 20.0, 11.0, 13.0, 9.0, 12.0, 13.0, 8.0, 8.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.7890625, -4.65020751953125, -4.5113525390625, -4.37249755859375, -4.233642578125, -4.09478759765625, -3.9559326171875, -3.81707763671875, -3.67822265625, -3.53936767578125, -3.4005126953125, -3.26165771484375, -3.122802734375, -2.98394775390625, -2.8450927734375, -2.70623779296875, -2.5673828125, -2.42852783203125, -2.2896728515625, -2.15081787109375, -2.011962890625, -1.87310791015625, -1.7342529296875, -1.59539794921875, -1.45654296875, -1.31768798828125, -1.1788330078125, -1.03997802734375, -0.901123046875, -0.76226806640625, -0.6234130859375, -0.48455810546875, -0.345703125, -0.20684814453125, -0.0679931640625, 0.07086181640625, 0.209716796875, 0.34857177734375, 0.4874267578125, 0.62628173828125, 0.76513671875, 0.90399169921875, 1.0428466796875, 1.18170166015625, 1.320556640625, 1.45941162109375, 1.5982666015625, 1.73712158203125, 1.8759765625, 2.01483154296875, 2.1536865234375, 2.29254150390625, 2.431396484375, 2.57025146484375, 2.7091064453125, 2.84796142578125, 2.98681640625, 3.12567138671875, 3.2645263671875, 3.40338134765625, 3.542236328125, 3.68109130859375, 3.8199462890625, 3.95880126953125, 4.09765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 8.0, 18.0, 19.0, 26.0, 37.0, 49.0, 67.0, 94.0, 181.0, 291.0, 543.0, 1367.0, 4417.0, 24407.0, 376772.0, 2610556.0, 110046.0, 11929.0, 2795.0, 948.0, 411.0, 210.0, 144.0, 100.0, 68.0, 45.0, 32.0, 19.0, 30.0, 12.0, 15.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1953125, -6.941162109375, -6.68701171875, -6.432861328125, -6.1787109375, -5.924560546875, -5.67041015625, -5.416259765625, -5.162109375, -4.907958984375, -4.65380859375, -4.399658203125, -4.1455078125, -3.891357421875, -3.63720703125, -3.383056640625, -3.12890625, -2.874755859375, -2.62060546875, -2.366455078125, -2.1123046875, -1.858154296875, -1.60400390625, -1.349853515625, -1.095703125, -0.841552734375, -0.58740234375, -0.333251953125, -0.0791015625, 0.175048828125, 0.42919921875, 0.683349609375, 0.9375, 1.191650390625, 1.44580078125, 1.699951171875, 1.9541015625, 2.208251953125, 2.46240234375, 2.716552734375, 2.970703125, 3.224853515625, 3.47900390625, 3.733154296875, 3.9873046875, 4.241455078125, 4.49560546875, 4.749755859375, 5.00390625, 5.258056640625, 5.51220703125, 5.766357421875, 6.0205078125, 6.274658203125, 6.52880859375, 6.782958984375, 7.037109375, 7.291259765625, 7.54541015625, 7.799560546875, 8.0537109375, 8.307861328125, 8.56201171875, 8.816162109375, 9.0703125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 34.0, 77.0, 132.0, 209.0, 211.0, 176.0, 103.0, 33.0, 16.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.6903076171875, -25.95026206970215, -25.21021842956543, -24.470172882080078, -23.730127334594727, -22.990081787109375, -22.250038146972656, -21.509992599487305, -20.769947052001953, -20.0299015045166, -19.289857864379883, -18.54981231689453, -17.80976676940918, -17.069721221923828, -16.32967758178711, -15.589632034301758, -14.849587440490723, -14.109542846679688, -13.369497299194336, -12.6294527053833, -11.88940715789795, -11.149362564086914, -10.409317016601562, -9.669272422790527, -8.929227828979492, -8.189183235168457, -7.4491376876831055, -6.70909309387207, -5.969047546386719, -5.229002952575684, -4.48895788192749, -3.748912811279297, -3.0088672637939453, -2.268822193145752, -1.5287772417068481, -0.7887322902679443, -0.04868721961975098, 0.6913578510284424, 1.4314026832580566, 2.17144775390625, 2.9114928245544434, 3.6515378952026367, 4.39158296585083, 5.131628036499023, 5.871672630310059, 6.61171817779541, 7.351762771606445, 8.091808319091797, 8.831852912902832, 9.571897506713867, 10.311943054199219, 11.051987648010254, 11.792033195495605, 12.53207778930664, 13.272123336791992, 14.012167930603027, 14.752212524414062, 15.492257118225098, 16.232301712036133, 16.972347259521484, 17.712392807006836, 18.452438354492188, 19.192481994628906, 19.932527542114258, 20.67257308959961]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 12.0, 12.0, 12.0, 15.0, 22.0, 22.0, 35.0, 24.0, 29.0, 36.0, 38.0, 31.0, 36.0, 38.0, 49.0, 47.0, 45.0, 39.0, 43.0, 37.0, 47.0, 46.0, 28.0, 38.0, 18.0, 29.0, 20.0, 21.0, 21.0, 23.0, 16.0, 8.0, 8.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.457600593566895, -14.023017883300781, -13.588436126708984, -13.153853416442871, -12.719270706176758, -12.284688949584961, -11.850106239318848, -11.415523529052734, -10.980941772460938, -10.546359062194824, -10.111777305603027, -9.677194595336914, -9.2426118850708, -8.808029174804688, -8.37344741821289, -7.938864707946777, -7.504281997680664, -7.069699764251709, -6.635117053985596, -6.200534820556641, -5.765952110290527, -5.331369876861572, -4.896787643432617, -4.462204933166504, -4.027622699737549, -3.5930402278900146, -3.1584577560424805, -2.7238755226135254, -2.289293050765991, -1.854710578918457, -1.420128345489502, -0.9855458736419678, -0.5509624481201172, -0.11638003587722778, 0.3182023763656616, 0.7527847290039062, 1.1873672008514404, 1.6219496726989746, 2.0565319061279297, 2.491114377975464, 2.925696849822998, 3.3602793216705322, 3.7948617935180664, 4.2294440269470215, 4.664026260375977, 5.09860897064209, 5.533191204071045, 5.9677734375, 6.402356147766113, 6.836938381195068, 7.271521091461182, 7.706103324890137, 8.14068603515625, 8.575267791748047, 9.00985050201416, 9.444433212280273, 9.87901496887207, 10.313597679138184, 10.74817943572998, 11.182762145996094, 11.617344856262207, 12.05192756652832, 12.486509323120117, 12.92109203338623, 13.355674743652344]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 9.0, 11.0, 7.0, 11.0, 22.0, 12.0, 22.0, 30.0, 21.0, 30.0, 31.0, 37.0, 41.0, 40.0, 35.0, 38.0, 51.0, 41.0, 47.0, 55.0, 47.0, 37.0, 32.0, 33.0, 30.0, 41.0, 34.0, 23.0, 24.0, 20.0, 12.0, 19.0, 12.0, 4.0, 8.0, 3.0, 3.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.42559814453125, -1.3775634765625, -1.32952880859375, -1.281494140625, -1.23345947265625, -1.1854248046875, -1.13739013671875, -1.08935546875, -1.04132080078125, -0.9932861328125, -0.94525146484375, -0.897216796875, -0.84918212890625, -0.8011474609375, -0.75311279296875, -0.705078125, -0.65704345703125, -0.6090087890625, -0.56097412109375, -0.512939453125, -0.46490478515625, -0.4168701171875, -0.36883544921875, -0.32080078125, -0.27276611328125, -0.2247314453125, -0.17669677734375, -0.128662109375, -0.08062744140625, -0.0325927734375, 0.01544189453125, 0.0634765625, 0.11151123046875, 0.1595458984375, 0.20758056640625, 0.255615234375, 0.30364990234375, 0.3516845703125, 0.39971923828125, 0.44775390625, 0.49578857421875, 0.5438232421875, 0.59185791015625, 0.639892578125, 0.68792724609375, 0.7359619140625, 0.78399658203125, 0.83203125, 0.88006591796875, 0.9281005859375, 0.97613525390625, 1.024169921875, 1.07220458984375, 1.1202392578125, 1.16827392578125, 1.21630859375, 1.26434326171875, 1.3123779296875, 1.36041259765625, 1.408447265625, 1.45648193359375, 1.5045166015625, 1.55255126953125, 1.6005859375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 6.0, 9.0, 23.0, 20.0, 37.0, 63.0, 92.0, 142.0, 179.0, 299.0, 421.0, 636.0, 963.0, 1476.0, 2283.0, 3481.0, 5621.0, 9655.0, 17034.0, 32100.0, 73799.0, 236599.0, 1056474.0, 1927918.0, 577120.0, 137619.0, 50355.0, 24654.0, 13610.0, 7946.0, 4713.0, 2998.0, 1977.0, 1290.0, 839.0, 589.0, 431.0, 266.0, 168.0, 125.0, 88.0, 61.0, 31.0, 22.0, 20.0, 18.0, 9.0, 9.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9189453125, -1.8486480712890625, -1.778350830078125, -1.7080535888671875, -1.63775634765625, -1.5674591064453125, -1.497161865234375, -1.4268646240234375, -1.3565673828125, -1.2862701416015625, -1.215972900390625, -1.1456756591796875, -1.07537841796875, -1.0050811767578125, -0.934783935546875, -0.8644866943359375, -0.794189453125, -0.7238922119140625, -0.653594970703125, -0.5832977294921875, -0.51300048828125, -0.4427032470703125, -0.372406005859375, -0.3021087646484375, -0.2318115234375, -0.1615142822265625, -0.091217041015625, -0.0209197998046875, 0.04937744140625, 0.1196746826171875, 0.189971923828125, 0.2602691650390625, 0.33056640625, 0.4008636474609375, 0.471160888671875, 0.5414581298828125, 0.61175537109375, 0.6820526123046875, 0.752349853515625, 0.8226470947265625, 0.8929443359375, 0.9632415771484375, 1.033538818359375, 1.1038360595703125, 1.17413330078125, 1.2444305419921875, 1.314727783203125, 1.3850250244140625, 1.455322265625, 1.5256195068359375, 1.595916748046875, 1.6662139892578125, 1.73651123046875, 1.8068084716796875, 1.877105712890625, 1.9474029541015625, 2.0177001953125, 2.0879974365234375, 2.158294677734375, 2.2285919189453125, 2.29888916015625, 2.3691864013671875, 2.439483642578125, 2.5097808837890625, 2.580078125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 13.0, 15.0, 25.0, 25.0, 53.0, 86.0, 127.0, 317.0, 639.0, 1054.0, 822.0, 389.0, 175.0, 121.0, 69.0, 42.0, 29.0, 30.0, 11.0, 3.0, 11.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.98828125, -7.809417724609375, -7.63055419921875, -7.451690673828125, -7.2728271484375, -7.093963623046875, -6.91510009765625, -6.736236572265625, -6.557373046875, -6.378509521484375, -6.19964599609375, -6.020782470703125, -5.8419189453125, -5.663055419921875, -5.48419189453125, -5.305328369140625, -5.12646484375, -4.947601318359375, -4.76873779296875, -4.589874267578125, -4.4110107421875, -4.232147216796875, -4.05328369140625, -3.874420166015625, -3.695556640625, -3.516693115234375, -3.33782958984375, -3.158966064453125, -2.9801025390625, -2.801239013671875, -2.62237548828125, -2.443511962890625, -2.2646484375, -2.085784912109375, -1.90692138671875, -1.728057861328125, -1.5491943359375, -1.370330810546875, -1.19146728515625, -1.012603759765625, -0.833740234375, -0.654876708984375, -0.47601318359375, -0.297149658203125, -0.1182861328125, 0.060577392578125, 0.23944091796875, 0.418304443359375, 0.59716796875, 0.776031494140625, 0.95489501953125, 1.133758544921875, 1.3126220703125, 1.491485595703125, 1.67034912109375, 1.849212646484375, 2.028076171875, 2.206939697265625, 2.38580322265625, 2.564666748046875, 2.7435302734375, 2.922393798828125, 3.10125732421875, 3.280120849609375, 3.458984375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 14.0, 21.0, 37.0, 38.0, 57.0, 105.0, 228.0, 498.0, 1251.0, 3293.0, 10060.0, 38334.0, 235046.0, 3150489.0, 659394.0, 71126.0, 16326.0, 4944.0, 1681.0, 660.0, 313.0, 151.0, 73.0, 45.0, 32.0, 14.0, 12.0, 15.0, 1.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.87890625, -4.64312744140625, -4.4073486328125, -4.17156982421875, -3.935791015625, -3.70001220703125, -3.4642333984375, -3.22845458984375, -2.99267578125, -2.75689697265625, -2.5211181640625, -2.28533935546875, -2.049560546875, -1.81378173828125, -1.5780029296875, -1.34222412109375, -1.1064453125, -0.87066650390625, -0.6348876953125, -0.39910888671875, -0.163330078125, 0.07244873046875, 0.3082275390625, 0.54400634765625, 0.77978515625, 1.01556396484375, 1.2513427734375, 1.48712158203125, 1.722900390625, 1.95867919921875, 2.1944580078125, 2.43023681640625, 2.666015625, 2.90179443359375, 3.1375732421875, 3.37335205078125, 3.609130859375, 3.84490966796875, 4.0806884765625, 4.31646728515625, 4.55224609375, 4.78802490234375, 5.0238037109375, 5.25958251953125, 5.495361328125, 5.73114013671875, 5.9669189453125, 6.20269775390625, 6.4384765625, 6.67425537109375, 6.9100341796875, 7.14581298828125, 7.381591796875, 7.61737060546875, 7.8531494140625, 8.08892822265625, 8.32470703125, 8.56048583984375, 8.7962646484375, 9.03204345703125, 9.267822265625, 9.50360107421875, 9.7393798828125, 9.97515869140625, 10.2109375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 7.0, 10.0, 12.0, 16.0, 24.0, 25.0, 52.0, 62.0, 67.0, 86.0, 94.0, 96.0, 99.0, 77.0, 61.0, 54.0, 45.0, 35.0, 19.0, 20.0, 12.0, 9.0, 6.0, 6.0, 2.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.634004592895508, -19.108203887939453, -18.582401275634766, -18.05660057067871, -17.530799865722656, -17.0049991607666, -16.479198455810547, -15.95339584350586, -15.427595138549805, -14.90179443359375, -14.375992774963379, -13.850191116333008, -13.324390411376953, -12.798589706420898, -12.272788047790527, -11.746986389160156, -11.221185684204102, -10.695384979248047, -10.169583320617676, -9.643781661987305, -9.11798095703125, -8.592180252075195, -8.066378593444824, -7.540577411651611, -7.014776229858398, -6.4889750480651855, -5.963173866271973, -5.43737268447876, -4.911571502685547, -4.385770320892334, -3.859969139099121, -3.334167957305908, -2.808368682861328, -2.2825675010681152, -1.7567663192749023, -1.2309651374816895, -0.7051639556884766, -0.17936277389526367, 0.3464384078979492, 0.8722395896911621, 1.398040771484375, 1.923841953277588, 2.449643135070801, 2.9754443168640137, 3.5012454986572266, 4.0270466804504395, 4.552847862243652, 5.078649044036865, 5.604450225830078, 6.130251407623291, 6.656052589416504, 7.181853771209717, 7.70765495300293, 8.233455657958984, 8.759257316589355, 9.285058975219727, 9.810859680175781, 10.336660385131836, 10.862462043762207, 11.388263702392578, 11.914064407348633, 12.439865112304688, 12.965666770935059, 13.49146842956543, 14.017269134521484]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 2.0, 5.0, 10.0, 13.0, 11.0, 14.0, 14.0, 19.0, 24.0, 18.0, 27.0, 23.0, 28.0, 29.0, 34.0, 36.0, 40.0, 38.0, 46.0, 45.0, 36.0, 37.0, 35.0, 28.0, 31.0, 43.0, 31.0, 35.0, 33.0, 28.0, 29.0, 18.0, 22.0, 19.0, 14.0, 9.0, 15.0, 15.0, 12.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0], "bins": [-12.02035903930664, -11.666400909423828, -11.312442779541016, -10.958484649658203, -10.60452651977539, -10.250568389892578, -9.896610260009766, -9.542652130126953, -9.18869400024414, -8.834735870361328, -8.480777740478516, -8.126819610595703, -7.772861480712891, -7.418903350830078, -7.064945220947266, -6.710987091064453, -6.357029438018799, -6.003071308135986, -5.649113178253174, -5.295155048370361, -4.941196918487549, -4.587238788604736, -4.233281135559082, -3.8793227672576904, -3.525364637374878, -3.1714065074920654, -2.817448377609253, -2.4634904861450195, -2.109532356262207, -1.755574107170105, -1.401616096496582, -1.0476579666137695, -0.693699836730957, -0.3397417366504669, 0.014216363430023193, 0.3681744337081909, 0.7221325635910034, 1.076090693473816, 1.4300487041473389, 1.7840068340301514, 2.137964963912964, 2.4919230937957764, 2.845881223678589, 3.1998391151428223, 3.5537972450256348, 3.9077553749084473, 4.26171350479126, 4.615671634674072, 4.969629764556885, 5.323587894439697, 5.67754602432251, 6.031504154205322, 6.385462284088135, 6.739420413970947, 7.093378067016602, 7.447336196899414, 7.801294326782227, 8.155252456665039, 8.509210586547852, 8.863168716430664, 9.217126846313477, 9.571084976196289, 9.925043106079102, 10.279001235961914, 10.632959365844727]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 13.0, 15.0, 9.0, 15.0, 18.0, 22.0, 21.0, 18.0, 19.0, 42.0, 26.0, 37.0, 33.0, 56.0, 51.0, 51.0, 55.0, 45.0, 39.0, 50.0, 45.0, 35.0, 28.0, 46.0, 33.0, 34.0, 29.0, 19.0, 20.0, 17.0, 12.0, 12.0, 9.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.329681396484375, -1.27850341796875, -1.227325439453125, -1.1761474609375, -1.124969482421875, -1.07379150390625, -1.022613525390625, -0.971435546875, -0.920257568359375, -0.86907958984375, -0.817901611328125, -0.7667236328125, -0.715545654296875, -0.66436767578125, -0.613189697265625, -0.56201171875, -0.510833740234375, -0.45965576171875, -0.408477783203125, -0.3572998046875, -0.306121826171875, -0.25494384765625, -0.203765869140625, -0.152587890625, -0.101409912109375, -0.05023193359375, 0.000946044921875, 0.0521240234375, 0.103302001953125, 0.15447998046875, 0.205657958984375, 0.2568359375, 0.308013916015625, 0.35919189453125, 0.410369873046875, 0.4615478515625, 0.512725830078125, 0.56390380859375, 0.615081787109375, 0.666259765625, 0.717437744140625, 0.76861572265625, 0.819793701171875, 0.8709716796875, 0.922149658203125, 0.97332763671875, 1.024505615234375, 1.07568359375, 1.126861572265625, 1.17803955078125, 1.229217529296875, 1.2803955078125, 1.331573486328125, 1.38275146484375, 1.433929443359375, 1.485107421875, 1.536285400390625, 1.58746337890625, 1.638641357421875, 1.6898193359375, 1.740997314453125, 1.79217529296875, 1.843353271484375, 1.89453125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 12.0, 17.0, 33.0, 45.0, 64.0, 115.0, 170.0, 268.0, 424.0, 642.0, 1179.0, 1783.0, 2728.0, 4443.0, 7185.0, 11353.0, 18228.0, 28306.0, 43716.0, 66041.0, 95533.0, 125158.0, 145626.0, 140568.0, 113758.0, 83039.0, 56612.0, 37164.0, 24000.0, 15121.0, 9522.0, 5864.0, 3684.0, 2341.0, 1448.0, 866.0, 556.0, 358.0, 207.0, 128.0, 76.0, 61.0, 37.0, 22.0, 10.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.84716796875, -0.8213424682617188, -0.7955169677734375, -0.7696914672851562, -0.743865966796875, -0.7180404663085938, -0.6922149658203125, -0.6663894653320312, -0.64056396484375, -0.6147384643554688, -0.5889129638671875, -0.5630874633789062, -0.537261962890625, -0.5114364624023438, -0.4856109619140625, -0.45978546142578125, -0.4339599609375, -0.40813446044921875, -0.3823089599609375, -0.35648345947265625, -0.330657958984375, -0.30483245849609375, -0.2790069580078125, -0.25318145751953125, -0.22735595703125, -0.20153045654296875, -0.1757049560546875, -0.14987945556640625, -0.124053955078125, -0.09822845458984375, -0.0724029541015625, -0.04657745361328125, -0.020751953125, 0.00507354736328125, 0.0308990478515625, 0.05672454833984375, 0.082550048828125, 0.10837554931640625, 0.1342010498046875, 0.16002655029296875, 0.18585205078125, 0.21167755126953125, 0.2375030517578125, 0.26332855224609375, 0.289154052734375, 0.31497955322265625, 0.3408050537109375, 0.36663055419921875, 0.3924560546875, 0.41828155517578125, 0.4441070556640625, 0.46993255615234375, 0.495758056640625, 0.5215835571289062, 0.5474090576171875, 0.5732345581054688, 0.59906005859375, 0.6248855590820312, 0.6507110595703125, 0.6765365600585938, 0.702362060546875, 0.7281875610351562, 0.7540130615234375, 0.7798385620117188, 0.8056640625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 10.0, 12.0, 15.0, 23.0, 26.0, 22.0, 22.0, 18.0, 31.0, 44.0, 42.0, 45.0, 44.0, 48.0, 42.0, 1071.0, 64.0, 43.0, 40.0, 43.0, 35.0, 43.0, 31.0, 30.0, 18.0, 23.0, 24.0, 18.0, 19.0, 13.0, 7.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25, -1.2099609375, -1.169921875, -1.1298828125, -1.08984375, -1.0498046875, -1.009765625, -0.9697265625, -0.9296875, -0.8896484375, -0.849609375, -0.8095703125, -0.76953125, -0.7294921875, -0.689453125, -0.6494140625, -0.609375, -0.5693359375, -0.529296875, -0.4892578125, -0.44921875, -0.4091796875, -0.369140625, -0.3291015625, -0.2890625, -0.2490234375, -0.208984375, -0.1689453125, -0.12890625, -0.0888671875, -0.048828125, -0.0087890625, 0.03125, 0.0712890625, 0.111328125, 0.1513671875, 0.19140625, 0.2314453125, 0.271484375, 0.3115234375, 0.3515625, 0.3916015625, 0.431640625, 0.4716796875, 0.51171875, 0.5517578125, 0.591796875, 0.6318359375, 0.671875, 0.7119140625, 0.751953125, 0.7919921875, 0.83203125, 0.8720703125, 0.912109375, 0.9521484375, 0.9921875, 1.0322265625, 1.072265625, 1.1123046875, 1.15234375, 1.1923828125, 1.232421875, 1.2724609375, 1.3125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 9.0, 12.0, 14.0, 27.0, 44.0, 56.0, 75.0, 129.0, 213.0, 347.0, 495.0, 897.0, 1525.0, 2673.0, 4550.0, 7767.0, 13991.0, 27233.0, 81960.0, 1700649.0, 179070.0, 35533.0, 17084.0, 9382.0, 5480.0, 3251.0, 1803.0, 1080.0, 661.0, 441.0, 223.0, 151.0, 81.0, 59.0, 39.0, 29.0, 30.0, 16.0, 10.0, 10.0, 7.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.716796875, -1.665802001953125, -1.61480712890625, -1.563812255859375, -1.5128173828125, -1.461822509765625, -1.41082763671875, -1.359832763671875, -1.308837890625, -1.257843017578125, -1.20684814453125, -1.155853271484375, -1.1048583984375, -1.053863525390625, -1.00286865234375, -0.951873779296875, -0.90087890625, -0.849884033203125, -0.79888916015625, -0.747894287109375, -0.6968994140625, -0.645904541015625, -0.59490966796875, -0.543914794921875, -0.492919921875, -0.441925048828125, -0.39093017578125, -0.339935302734375, -0.2889404296875, -0.237945556640625, -0.18695068359375, -0.135955810546875, -0.0849609375, -0.033966064453125, 0.01702880859375, 0.068023681640625, 0.1190185546875, 0.170013427734375, 0.22100830078125, 0.272003173828125, 0.322998046875, 0.373992919921875, 0.42498779296875, 0.475982666015625, 0.5269775390625, 0.577972412109375, 0.62896728515625, 0.679962158203125, 0.73095703125, 0.781951904296875, 0.83294677734375, 0.883941650390625, 0.9349365234375, 0.985931396484375, 1.03692626953125, 1.087921142578125, 1.138916015625, 1.189910888671875, 1.24090576171875, 1.291900634765625, 1.3428955078125, 1.393890380859375, 1.44488525390625, 1.495880126953125, 1.546875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 5.0, 4.0, 9.0, 12.0, 10.0, 15.0, 26.0, 42.0, 55.0, 59.0, 44.0, 65.0, 71.0, 64.0, 92.0, 69.0, 76.0, 47.0, 53.0, 36.0, 30.0, 22.0, 25.0, 10.0, 9.0, 13.0, 4.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.10906982421875, -0.10601615905761719, -0.10296249389648438, -0.09990882873535156, -0.09685516357421875, -0.09380149841308594, -0.09074783325195312, -0.08769416809082031, -0.0846405029296875, -0.08158683776855469, -0.07853317260742188, -0.07547950744628906, -0.07242584228515625, -0.06937217712402344, -0.06631851196289062, -0.06326484680175781, -0.060211181640625, -0.05715751647949219, -0.054103851318359375, -0.05105018615722656, -0.04799652099609375, -0.04494285583496094, -0.041889190673828125, -0.03883552551269531, -0.0357818603515625, -0.03272819519042969, -0.029674530029296875, -0.026620864868164062, -0.02356719970703125, -0.020513534545898438, -0.017459869384765625, -0.014406204223632812, -0.0113525390625, -0.008298873901367188, -0.005245208740234375, -0.0021915435791015625, 0.00086212158203125, 0.0039157867431640625, 0.006969451904296875, 0.010023117065429688, 0.0130767822265625, 0.016130447387695312, 0.019184112548828125, 0.022237777709960938, 0.02529144287109375, 0.028345108032226562, 0.031398773193359375, 0.03445243835449219, 0.037506103515625, 0.04055976867675781, 0.043613433837890625, 0.04666709899902344, 0.04972076416015625, 0.05277442932128906, 0.055828094482421875, 0.05888175964355469, 0.0619354248046875, 0.06498908996582031, 0.06804275512695312, 0.07109642028808594, 0.07415008544921875, 0.07720375061035156, 0.08025741577148438, 0.08331108093261719, 0.08636474609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 7.0, 3.0, 8.0, 8.0, 10.0, 14.0, 9.0, 18.0, 29.0, 50.0, 47.0, 79.0, 125.0, 246.0, 607.0, 1416.0, 5546.0, 57407.0, 782809.0, 185193.0, 11090.0, 2203.0, 757.0, 343.0, 173.0, 95.0, 61.0, 37.0, 33.0, 30.0, 22.0, 13.0, 11.0, 9.0, 11.0, 3.0, 4.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.03125, -0.9965057373046875, -0.961761474609375, -0.9270172119140625, -0.89227294921875, -0.8575286865234375, -0.822784423828125, -0.7880401611328125, -0.7532958984375, -0.7185516357421875, -0.683807373046875, -0.6490631103515625, -0.61431884765625, -0.5795745849609375, -0.544830322265625, -0.5100860595703125, -0.475341796875, -0.4405975341796875, -0.405853271484375, -0.3711090087890625, -0.33636474609375, -0.3016204833984375, -0.266876220703125, -0.2321319580078125, -0.1973876953125, -0.1626434326171875, -0.127899169921875, -0.0931549072265625, -0.05841064453125, -0.0236663818359375, 0.011077880859375, 0.0458221435546875, 0.08056640625, 0.1153106689453125, 0.150054931640625, 0.1847991943359375, 0.21954345703125, 0.2542877197265625, 0.289031982421875, 0.3237762451171875, 0.3585205078125, 0.3932647705078125, 0.428009033203125, 0.4627532958984375, 0.49749755859375, 0.5322418212890625, 0.566986083984375, 0.6017303466796875, 0.636474609375, 0.6712188720703125, 0.705963134765625, 0.7407073974609375, 0.77545166015625, 0.8101959228515625, 0.844940185546875, 0.8796844482421875, 0.9144287109375, 0.9491729736328125, 0.983917236328125, 1.0186614990234375, 1.05340576171875, 1.0881500244140625, 1.122894287109375, 1.1576385498046875, 1.1923828125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 10.0, 15.0, 27.0, 46.0, 62.0, 110.0, 145.0, 174.0, 148.0, 107.0, 68.0, 38.0, 19.0, 12.0, 10.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3726251721382141, -0.3487432599067688, -0.3248613476753235, -0.30097946524620056, -0.27709755301475525, -0.25321564078330994, -0.22933374345302582, -0.2054518461227417, -0.1815699338912964, -0.15768802165985107, -0.13380612432956696, -0.10992421954870224, -0.08604231476783752, -0.06216040998697281, -0.03827850520610809, -0.014396607875823975, 0.009485304355621338, 0.03336720913648605, 0.05724911391735077, 0.08113101869821548, 0.1050129234790802, 0.1288948357105255, 0.15277673304080963, 0.17665863037109375, 0.20054054260253906, 0.22442245483398438, 0.2483043521642685, 0.2721862494945526, 0.2960681617259979, 0.31995007395744324, 0.34383195638656616, 0.3677138686180115, 0.391595721244812, 0.4154776334762573, 0.43935954570770264, 0.46324142813682556, 0.4871233403682709, 0.5110052227973938, 0.5348871350288391, 0.5587690472602844, 0.5826509594917297, 0.606532871723175, 0.6304147839546204, 0.6542966961860657, 0.6781785488128662, 0.7020604610443115, 0.7259423732757568, 0.7498242855072021, 0.7737061977386475, 0.7975881099700928, 0.8214700222015381, 0.8453519344329834, 0.8692338466644287, 0.8931156992912292, 0.9169976115226746, 0.9408795237541199, 0.9647614359855652, 0.9886433482170105, 1.012525200843811, 1.0364071130752563, 1.0602890253067017, 1.084170937538147, 1.1080528497695923, 1.1319347620010376, 1.155816674232483]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 16.0, 15.0, 20.0, 20.0, 19.0, 24.0, 41.0, 34.0, 51.0, 56.0, 57.0, 49.0, 48.0, 72.0, 69.0, 46.0, 55.0, 41.0, 41.0, 37.0, 41.0, 28.0, 22.0, 25.0, 13.0, 11.0, 10.0, 8.0, 9.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3286868929862976, -0.3152666985988617, -0.3018464744091034, -0.2884262800216675, -0.2750060558319092, -0.26158586144447327, -0.24816566705703735, -0.23474545776844025, -0.22132524847984314, -0.20790503919124603, -0.19448482990264893, -0.181064635515213, -0.1676444262266159, -0.1542242169380188, -0.14080402255058289, -0.12738381326198578, -0.11396360397338867, -0.10054339468479156, -0.08712319284677505, -0.07370299100875854, -0.06028278172016144, -0.04686257243156433, -0.03344237059354782, -0.02002216875553131, -0.006601959466934204, 0.006818246096372604, 0.020238451659679413, 0.03365865722298622, 0.04707886278629303, 0.06049907207489014, 0.07391927391290665, 0.08733947575092316, 0.10075968503952026, 0.11417989432811737, 0.12760010361671448, 0.1410202980041504, 0.1544405072927475, 0.1678607165813446, 0.18128091096878052, 0.19470112025737762, 0.20812132954597473, 0.22154153883457184, 0.23496174812316895, 0.24838194251060486, 0.26180213689804077, 0.2752223610877991, 0.288642555475235, 0.3020627498626709, 0.3154829740524292, 0.3289031684398651, 0.3423233926296234, 0.3557435870170593, 0.3691638112068176, 0.38258400559425354, 0.39600419998168945, 0.40942442417144775, 0.42284461855888367, 0.4362648129463196, 0.4496850371360779, 0.4631052315235138, 0.4765254259109497, 0.489945650100708, 0.5033658742904663, 0.5167860388755798, 0.5302062630653381]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 9.0, 13.0, 15.0, 14.0, 14.0, 23.0, 22.0, 17.0, 24.0, 32.0, 30.0, 43.0, 34.0, 50.0, 55.0, 54.0, 48.0, 47.0, 40.0, 55.0, 45.0, 34.0, 28.0, 48.0, 30.0, 32.0, 29.0, 19.0, 20.0, 20.0, 10.0, 12.0, 9.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3896484375, -1.338134765625, -1.28662109375, -1.235107421875, -1.18359375, -1.132080078125, -1.08056640625, -1.029052734375, -0.9775390625, -0.926025390625, -0.87451171875, -0.822998046875, -0.771484375, -0.719970703125, -0.66845703125, -0.616943359375, -0.5654296875, -0.513916015625, -0.46240234375, -0.410888671875, -0.359375, -0.307861328125, -0.25634765625, -0.204833984375, -0.1533203125, -0.101806640625, -0.05029296875, 0.001220703125, 0.052734375, 0.104248046875, 0.15576171875, 0.207275390625, 0.2587890625, 0.310302734375, 0.36181640625, 0.413330078125, 0.46484375, 0.516357421875, 0.56787109375, 0.619384765625, 0.6708984375, 0.722412109375, 0.77392578125, 0.825439453125, 0.876953125, 0.928466796875, 0.97998046875, 1.031494140625, 1.0830078125, 1.134521484375, 1.18603515625, 1.237548828125, 1.2890625, 1.340576171875, 1.39208984375, 1.443603515625, 1.4951171875, 1.546630859375, 1.59814453125, 1.649658203125, 1.701171875, 1.752685546875, 1.80419921875, 1.855712890625, 1.9072265625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 9.0, 14.0, 10.0, 18.0, 39.0, 47.0, 51.0, 88.0, 149.0, 227.0, 333.0, 499.0, 892.0, 1455.0, 2661.0, 4749.0, 9133.0, 18663.0, 40279.0, 96347.0, 470892.0, 265905.0, 72490.0, 31943.0, 14750.0, 7446.0, 4036.0, 2095.0, 1256.0, 751.0, 462.0, 308.0, 189.0, 131.0, 76.0, 54.0, 31.0, 28.0, 24.0, 7.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.10546875, -2.99395751953125, -2.8824462890625, -2.77093505859375, -2.659423828125, -2.54791259765625, -2.4364013671875, -2.32489013671875, -2.21337890625, -2.10186767578125, -1.9903564453125, -1.87884521484375, -1.767333984375, -1.65582275390625, -1.5443115234375, -1.43280029296875, -1.3212890625, -1.20977783203125, -1.0982666015625, -0.98675537109375, -0.875244140625, -0.76373291015625, -0.6522216796875, -0.54071044921875, -0.42919921875, -0.31768798828125, -0.2061767578125, -0.09466552734375, 0.016845703125, 0.12835693359375, 0.2398681640625, 0.35137939453125, 0.462890625, 0.57440185546875, 0.6859130859375, 0.79742431640625, 0.908935546875, 1.02044677734375, 1.1319580078125, 1.24346923828125, 1.35498046875, 1.46649169921875, 1.5780029296875, 1.68951416015625, 1.801025390625, 1.91253662109375, 2.0240478515625, 2.13555908203125, 2.2470703125, 2.35858154296875, 2.4700927734375, 2.58160400390625, 2.693115234375, 2.80462646484375, 2.9161376953125, 3.02764892578125, 3.13916015625, 3.25067138671875, 3.3621826171875, 3.47369384765625, 3.585205078125, 3.69671630859375, 3.8082275390625, 3.91973876953125, 4.03125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 13.0, 7.0, 8.0, 14.0, 16.0, 19.0, 15.0, 17.0, 24.0, 32.0, 31.0, 44.0, 46.0, 61.0, 71.0, 92.0, 157.0, 202.0, 1366.0, 173.0, 105.0, 94.0, 75.0, 58.0, 43.0, 30.0, 32.0, 33.0, 23.0, 25.0, 25.0, 19.0, 9.0, 7.0, 9.0, 8.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0], "bins": [-5.640625, -5.4852294921875, -5.329833984375, -5.1744384765625, -5.01904296875, -4.8636474609375, -4.708251953125, -4.5528564453125, -4.3974609375, -4.2420654296875, -4.086669921875, -3.9312744140625, -3.77587890625, -3.6204833984375, -3.465087890625, -3.3096923828125, -3.154296875, -2.9989013671875, -2.843505859375, -2.6881103515625, -2.53271484375, -2.3773193359375, -2.221923828125, -2.0665283203125, -1.9111328125, -1.7557373046875, -1.600341796875, -1.4449462890625, -1.28955078125, -1.1341552734375, -0.978759765625, -0.8233642578125, -0.66796875, -0.5125732421875, -0.357177734375, -0.2017822265625, -0.04638671875, 0.1090087890625, 0.264404296875, 0.4197998046875, 0.5751953125, 0.7305908203125, 0.885986328125, 1.0413818359375, 1.19677734375, 1.3521728515625, 1.507568359375, 1.6629638671875, 1.818359375, 1.9737548828125, 2.129150390625, 2.2845458984375, 2.43994140625, 2.5953369140625, 2.750732421875, 2.9061279296875, 3.0615234375, 3.2169189453125, 3.372314453125, 3.5277099609375, 3.68310546875, 3.8385009765625, 3.993896484375, 4.1492919921875, 4.3046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 12.0, 16.0, 20.0, 32.0, 39.0, 46.0, 66.0, 82.0, 142.0, 205.0, 389.0, 714.0, 1830.0, 6748.0, 33875.0, 283088.0, 2528270.0, 249475.0, 30835.0, 6218.0, 1809.0, 725.0, 341.0, 199.0, 134.0, 69.0, 65.0, 54.0, 40.0, 27.0, 28.0, 21.0, 13.0, 11.0, 5.0, 9.0, 4.0, 7.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.19921875, -6.93719482421875, -6.6751708984375, -6.41314697265625, -6.151123046875, -5.88909912109375, -5.6270751953125, -5.36505126953125, -5.10302734375, -4.84100341796875, -4.5789794921875, -4.31695556640625, -4.054931640625, -3.79290771484375, -3.5308837890625, -3.26885986328125, -3.0068359375, -2.74481201171875, -2.4827880859375, -2.22076416015625, -1.958740234375, -1.69671630859375, -1.4346923828125, -1.17266845703125, -0.91064453125, -0.64862060546875, -0.3865966796875, -0.12457275390625, 0.137451171875, 0.39947509765625, 0.6614990234375, 0.92352294921875, 1.185546875, 1.44757080078125, 1.7095947265625, 1.97161865234375, 2.233642578125, 2.49566650390625, 2.7576904296875, 3.01971435546875, 3.28173828125, 3.54376220703125, 3.8057861328125, 4.06781005859375, 4.329833984375, 4.59185791015625, 4.8538818359375, 5.11590576171875, 5.3779296875, 5.63995361328125, 5.9019775390625, 6.16400146484375, 6.426025390625, 6.68804931640625, 6.9500732421875, 7.21209716796875, 7.47412109375, 7.73614501953125, 7.9981689453125, 8.26019287109375, 8.522216796875, 8.78424072265625, 9.0462646484375, 9.30828857421875, 9.5703125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 11.0, 34.0, 96.0, 210.0, 268.0, 215.0, 113.0, 34.0, 19.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34949493408203, -32.29011917114258, -31.230743408203125, -30.171369552612305, -29.11199378967285, -28.0526180267334, -26.993244171142578, -25.933868408203125, -24.874492645263672, -23.81511688232422, -22.755741119384766, -21.696367263793945, -20.636991500854492, -19.57761573791504, -18.51824188232422, -17.458866119384766, -16.399490356445312, -15.34011459350586, -14.280739784240723, -13.221364974975586, -12.161989212036133, -11.10261344909668, -10.043238639831543, -8.983863830566406, -7.924488067626953, -6.865112781524658, -5.805737495422363, -4.746362209320068, -3.6869869232177734, -2.6276116371154785, -1.5682363510131836, -0.5088610649108887, 0.5505142211914062, 1.6098895072937012, 2.669264793395996, 3.728640079498291, 4.788015365600586, 5.847390651702881, 6.906765937805176, 7.966141223907471, 9.025516510009766, 10.084892272949219, 11.144267082214355, 12.203641891479492, 13.263017654418945, 14.322393417358398, 15.381768226623535, 16.441143035888672, 17.500518798828125, 18.559894561767578, 19.61927032470703, 20.67864418029785, 21.738019943237305, 22.797395706176758, 23.856769561767578, 24.91614532470703, 25.975521087646484, 27.034896850585938, 28.09427261352539, 29.15364646911621, 30.213022232055664, 31.272397994995117, 32.33177185058594, 33.39114761352539, 34.450523376464844]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 2.0, 9.0, 6.0, 4.0, 13.0, 14.0, 10.0, 18.0, 16.0, 17.0, 16.0, 24.0, 16.0, 30.0, 26.0, 30.0, 25.0, 33.0, 34.0, 46.0, 36.0, 37.0, 42.0, 35.0, 42.0, 38.0, 30.0, 34.0, 35.0, 38.0, 35.0, 24.0, 26.0, 20.0, 14.0, 15.0, 17.0, 15.0, 10.0, 18.0, 8.0, 6.0, 8.0, 5.0, 6.0, 7.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-11.146112442016602, -10.79095458984375, -10.435797691345215, -10.080639839172363, -9.725481986999512, -9.370325088500977, -9.015167236328125, -8.660009384155273, -8.304851531982422, -7.9496941566467285, -7.594536304473877, -7.239378929138184, -6.884221076965332, -6.529063701629639, -6.173906326293945, -5.818748474121094, -5.463591575622559, -5.108434200286865, -4.753276348114014, -4.39811897277832, -4.042961120605469, -3.6878037452697754, -3.332646369934082, -2.9774887561798096, -2.622331142425537, -2.2671735286712646, -1.9120160341262817, -1.5568585395812988, -1.2017009258270264, -0.8465433120727539, -0.49138593673706055, -0.13622832298278809, 0.21893024444580078, 0.5740877985954285, 0.9292453527450562, 1.284402847290039, 1.6395604610443115, 1.994718074798584, 2.3498754501342773, 2.70503306388855, 3.0601906776428223, 3.4153482913970947, 3.770505905151367, 4.1256632804870605, 4.480820655822754, 4.8359785079956055, 5.191135883331299, 5.546293258666992, 5.901451110839844, 6.256608486175537, 6.611766338348389, 6.966923713684082, 7.322081565856934, 7.677238941192627, 8.03239631652832, 8.387554168701172, 8.742712020874023, 9.097869873046875, 9.45302677154541, 9.808184623718262, 10.163342475891113, 10.518499374389648, 10.8736572265625, 11.228815078735352, 11.583971977233887]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 9.0, 16.0, 12.0, 17.0, 23.0, 16.0, 20.0, 24.0, 33.0, 23.0, 41.0, 38.0, 51.0, 44.0, 53.0, 40.0, 53.0, 43.0, 53.0, 40.0, 40.0, 47.0, 37.0, 30.0, 23.0, 25.0, 24.0, 18.0, 17.0, 20.0, 12.0, 12.0, 7.0, 3.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3385467529296875, -1.285491943359375, -1.2324371337890625, -1.17938232421875, -1.1263275146484375, -1.073272705078125, -1.0202178955078125, -0.9671630859375, -0.9141082763671875, -0.861053466796875, -0.8079986572265625, -0.75494384765625, -0.7018890380859375, -0.648834228515625, -0.5957794189453125, -0.542724609375, -0.4896697998046875, -0.436614990234375, -0.3835601806640625, -0.33050537109375, -0.2774505615234375, -0.224395751953125, -0.1713409423828125, -0.1182861328125, -0.0652313232421875, -0.012176513671875, 0.0408782958984375, 0.09393310546875, 0.1469879150390625, 0.200042724609375, 0.2530975341796875, 0.30615234375, 0.3592071533203125, 0.412261962890625, 0.4653167724609375, 0.51837158203125, 0.5714263916015625, 0.624481201171875, 0.6775360107421875, 0.7305908203125, 0.7836456298828125, 0.836700439453125, 0.8897552490234375, 0.94281005859375, 0.9958648681640625, 1.048919677734375, 1.1019744873046875, 1.155029296875, 1.2080841064453125, 1.261138916015625, 1.3141937255859375, 1.36724853515625, 1.4203033447265625, 1.473358154296875, 1.5264129638671875, 1.5794677734375, 1.6325225830078125, 1.685577392578125, 1.7386322021484375, 1.79168701171875, 1.8447418212890625, 1.897796630859375, 1.9508514404296875, 2.00390625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 8.0, 4.0, 10.0, 6.0, 14.0, 14.0, 27.0, 27.0, 37.0, 43.0, 61.0, 121.0, 173.0, 312.0, 708.0, 1464.0, 3489.0, 9086.0, 26920.0, 106358.0, 1195358.0, 2590538.0, 195525.0, 41035.0, 13364.0, 5107.0, 2198.0, 1011.0, 508.0, 266.0, 150.0, 110.0, 66.0, 38.0, 35.0, 19.0, 14.0, 15.0, 15.0, 4.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.2327880859375, -4.071044921875, -3.9093017578125, -3.74755859375, -3.5858154296875, -3.424072265625, -3.2623291015625, -3.1005859375, -2.9388427734375, -2.777099609375, -2.6153564453125, -2.45361328125, -2.2918701171875, -2.130126953125, -1.9683837890625, -1.806640625, -1.6448974609375, -1.483154296875, -1.3214111328125, -1.15966796875, -0.9979248046875, -0.836181640625, -0.6744384765625, -0.5126953125, -0.3509521484375, -0.189208984375, -0.0274658203125, 0.13427734375, 0.2960205078125, 0.457763671875, 0.6195068359375, 0.78125, 0.9429931640625, 1.104736328125, 1.2664794921875, 1.42822265625, 1.5899658203125, 1.751708984375, 1.9134521484375, 2.0751953125, 2.2369384765625, 2.398681640625, 2.5604248046875, 2.72216796875, 2.8839111328125, 3.045654296875, 3.2073974609375, 3.369140625, 3.5308837890625, 3.692626953125, 3.8543701171875, 4.01611328125, 4.1778564453125, 4.339599609375, 4.5013427734375, 4.6630859375, 4.8248291015625, 4.986572265625, 5.1483154296875, 5.31005859375, 5.4718017578125, 5.633544921875, 5.7952880859375, 5.95703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 16.0, 20.0, 32.0, 30.0, 41.0, 54.0, 97.0, 138.0, 208.0, 286.0, 493.0, 697.0, 674.0, 471.0, 258.0, 168.0, 97.0, 80.0, 45.0, 40.0, 33.0, 19.0, 16.0, 12.0, 15.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.0858154296875, -2.956787109375, -2.8277587890625, -2.69873046875, -2.5697021484375, -2.440673828125, -2.3116455078125, -2.1826171875, -2.0535888671875, -1.924560546875, -1.7955322265625, -1.66650390625, -1.5374755859375, -1.408447265625, -1.2794189453125, -1.150390625, -1.0213623046875, -0.892333984375, -0.7633056640625, -0.63427734375, -0.5052490234375, -0.376220703125, -0.2471923828125, -0.1181640625, 0.0108642578125, 0.139892578125, 0.2689208984375, 0.39794921875, 0.5269775390625, 0.656005859375, 0.7850341796875, 0.9140625, 1.0430908203125, 1.172119140625, 1.3011474609375, 1.43017578125, 1.5592041015625, 1.688232421875, 1.8172607421875, 1.9462890625, 2.0753173828125, 2.204345703125, 2.3333740234375, 2.46240234375, 2.5914306640625, 2.720458984375, 2.8494873046875, 2.978515625, 3.1075439453125, 3.236572265625, 3.3656005859375, 3.49462890625, 3.6236572265625, 3.752685546875, 3.8817138671875, 4.0107421875, 4.1397705078125, 4.268798828125, 4.3978271484375, 4.52685546875, 4.6558837890625, 4.784912109375, 4.9139404296875, 5.04296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 19.0, 14.0, 20.0, 40.0, 66.0, 104.0, 177.0, 328.0, 675.0, 1584.0, 3993.0, 11160.0, 36666.0, 158010.0, 1522006.0, 2189891.0, 203026.0, 45077.0, 13206.0, 4713.0, 1851.0, 773.0, 394.0, 204.0, 111.0, 66.0, 33.0, 29.0, 10.0, 10.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.1875, -7.9881591796875, -7.788818359375, -7.5894775390625, -7.39013671875, -7.1907958984375, -6.991455078125, -6.7921142578125, -6.5927734375, -6.3934326171875, -6.194091796875, -5.9947509765625, -5.79541015625, -5.5960693359375, -5.396728515625, -5.1973876953125, -4.998046875, -4.7987060546875, -4.599365234375, -4.4000244140625, -4.20068359375, -4.0013427734375, -3.802001953125, -3.6026611328125, -3.4033203125, -3.2039794921875, -3.004638671875, -2.8052978515625, -2.60595703125, -2.4066162109375, -2.207275390625, -2.0079345703125, -1.80859375, -1.6092529296875, -1.409912109375, -1.2105712890625, -1.01123046875, -0.8118896484375, -0.612548828125, -0.4132080078125, -0.2138671875, -0.0145263671875, 0.184814453125, 0.3841552734375, 0.58349609375, 0.7828369140625, 0.982177734375, 1.1815185546875, 1.380859375, 1.5802001953125, 1.779541015625, 1.9788818359375, 2.17822265625, 2.3775634765625, 2.576904296875, 2.7762451171875, 2.9755859375, 3.1749267578125, 3.374267578125, 3.5736083984375, 3.77294921875, 3.9722900390625, 4.171630859375, 4.3709716796875, 4.5703125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 5.0, 19.0, 40.0, 56.0, 74.0, 102.0, 124.0, 125.0, 139.0, 92.0, 81.0, 47.0, 34.0, 18.0, 14.0, 4.0, 3.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.363386154174805, -22.61882972717285, -21.874271392822266, -21.129714965820312, -20.38515853881836, -19.640602111816406, -18.896045684814453, -18.151487350463867, -17.406930923461914, -16.66237449645996, -15.917817115783691, -15.173259735107422, -14.428703308105469, -13.684146881103516, -12.939589500427246, -12.195032119750977, -11.450475692749023, -10.70591926574707, -9.9613618850708, -9.216804504394531, -8.472248077392578, -7.727691173553467, -6.9831342697143555, -6.238577365875244, -5.494020462036133, -4.7494635581970215, -4.00490665435791, -3.260349750518799, -2.5157928466796875, -1.7712359428405762, -1.0266790390014648, -0.2821221351623535, 0.4624366760253906, 1.206993579864502, 1.9515504837036133, 2.6961073875427246, 3.440664291381836, 4.185221195220947, 4.929778099060059, 5.67433500289917, 6.418891906738281, 7.163448810577393, 7.908005714416504, 8.652563095092773, 9.397119522094727, 10.14167594909668, 10.88623332977295, 11.630790710449219, 12.375347137451172, 13.119903564453125, 13.864460945129395, 14.609018325805664, 15.353574752807617, 16.09813117980957, 16.842689514160156, 17.58724594116211, 18.331802368164062, 19.076358795166016, 19.82091522216797, 20.565473556518555, 21.310029983520508, 22.05458641052246, 22.799144744873047, 23.543701171875, 24.288257598876953]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 7.0, 19.0, 26.0, 24.0, 25.0, 35.0, 28.0, 34.0, 34.0, 35.0, 25.0, 46.0, 51.0, 46.0, 37.0, 37.0, 47.0, 48.0, 32.0, 45.0, 43.0, 34.0, 32.0, 20.0, 30.0, 28.0, 22.0, 20.0, 16.0, 10.0, 15.0, 4.0, 8.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.996298789978027, -9.623560905456543, -9.250822067260742, -8.878084182739258, -8.505346298217773, -8.132608413696289, -7.759869575500488, -7.387131690979004, -7.014393329620361, -6.641654968261719, -6.268917083740234, -5.896178722381592, -5.523440361022949, -5.150702476501465, -4.777964115142822, -4.40522575378418, -4.032487869262695, -3.659749746322632, -3.2870116233825684, -2.914273262023926, -2.5415351390838623, -2.168797016143799, -1.7960586547851562, -1.4233205318450928, -1.0505824089050293, -0.677844226360321, -0.3051060438156128, 0.06763219833374023, 0.4403703212738037, 0.8131084442138672, 1.1858468055725098, 1.5585849285125732, 1.9313220977783203, 2.304060220718384, 2.6767983436584473, 3.04953670501709, 3.4222748279571533, 3.795012950897217, 4.167751312255859, 4.540489196777344, 4.913227558135986, 5.285965919494629, 5.658703804016113, 6.031442165374756, 6.404180526733398, 6.776918411254883, 7.149656772613525, 7.522395133972168, 7.895133018493652, 8.267870903015137, 8.640609741210938, 9.013347625732422, 9.386085510253906, 9.75882339477539, 10.131562232971191, 10.504300117492676, 10.877038955688477, 11.249776840209961, 11.622515678405762, 11.995253562927246, 12.36799144744873, 12.740730285644531, 13.113468170166016, 13.4862060546875, 13.858943939208984]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 6.0, 6.0, 3.0, 5.0, 10.0, 12.0, 13.0, 15.0, 14.0, 19.0, 12.0, 27.0, 26.0, 23.0, 18.0, 29.0, 24.0, 39.0, 40.0, 50.0, 46.0, 29.0, 58.0, 33.0, 27.0, 37.0, 38.0, 41.0, 34.0, 34.0, 27.0, 26.0, 26.0, 15.0, 18.0, 14.0, 19.0, 19.0, 10.0, 12.0, 12.0, 5.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2880859375, -1.2441253662109375, -1.200164794921875, -1.1562042236328125, -1.11224365234375, -1.0682830810546875, -1.024322509765625, -0.9803619384765625, -0.9364013671875, -0.8924407958984375, -0.848480224609375, -0.8045196533203125, -0.76055908203125, -0.7165985107421875, -0.672637939453125, -0.6286773681640625, -0.584716796875, -0.5407562255859375, -0.496795654296875, -0.4528350830078125, -0.40887451171875, -0.3649139404296875, -0.320953369140625, -0.2769927978515625, -0.2330322265625, -0.1890716552734375, -0.145111083984375, -0.1011505126953125, -0.05718994140625, -0.0132293701171875, 0.030731201171875, 0.0746917724609375, 0.11865234375, 0.1626129150390625, 0.206573486328125, 0.2505340576171875, 0.29449462890625, 0.3384552001953125, 0.382415771484375, 0.4263763427734375, 0.4703369140625, 0.5142974853515625, 0.558258056640625, 0.6022186279296875, 0.64617919921875, 0.6901397705078125, 0.734100341796875, 0.7780609130859375, 0.822021484375, 0.8659820556640625, 0.909942626953125, 0.9539031982421875, 0.99786376953125, 1.0418243408203125, 1.085784912109375, 1.1297454833984375, 1.1737060546875, 1.2176666259765625, 1.261627197265625, 1.3055877685546875, 1.34954833984375, 1.3935089111328125, 1.437469482421875, 1.4814300537109375, 1.525390625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 23.0, 36.0, 59.0, 84.0, 126.0, 207.0, 322.0, 560.0, 838.0, 1476.0, 2337.0, 3965.0, 6542.0, 10749.0, 18494.0, 32096.0, 56312.0, 107879.0, 279497.0, 282712.0, 109012.0, 56829.0, 32202.0, 18786.0, 10882.0, 6489.0, 3934.0, 2322.0, 1433.0, 945.0, 549.0, 310.0, 184.0, 111.0, 65.0, 53.0, 28.0, 41.0, 15.0, 11.0, 10.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.68157958984375, -0.6580810546875, -0.63458251953125, -0.611083984375, -0.58758544921875, -0.5640869140625, -0.54058837890625, -0.51708984375, -0.49359130859375, -0.4700927734375, -0.44659423828125, -0.423095703125, -0.39959716796875, -0.3760986328125, -0.35260009765625, -0.3291015625, -0.30560302734375, -0.2821044921875, -0.25860595703125, -0.235107421875, -0.21160888671875, -0.1881103515625, -0.16461181640625, -0.14111328125, -0.11761474609375, -0.0941162109375, -0.07061767578125, -0.047119140625, -0.02362060546875, -0.0001220703125, 0.02337646484375, 0.046875, 0.07037353515625, 0.0938720703125, 0.11737060546875, 0.140869140625, 0.16436767578125, 0.1878662109375, 0.21136474609375, 0.23486328125, 0.25836181640625, 0.2818603515625, 0.30535888671875, 0.328857421875, 0.35235595703125, 0.3758544921875, 0.39935302734375, 0.4228515625, 0.44635009765625, 0.4698486328125, 0.49334716796875, 0.516845703125, 0.54034423828125, 0.5638427734375, 0.58734130859375, 0.61083984375, 0.63433837890625, 0.6578369140625, 0.68133544921875, 0.704833984375, 0.72833251953125, 0.7518310546875, 0.77532958984375, 0.798828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 1.0, 12.0, 8.0, 7.0, 11.0, 10.0, 14.0, 15.0, 23.0, 18.0, 24.0, 17.0, 33.0, 37.0, 32.0, 32.0, 40.0, 30.0, 36.0, 29.0, 53.0, 1073.0, 37.0, 28.0, 31.0, 48.0, 32.0, 34.0, 41.0, 18.0, 27.0, 30.0, 21.0, 15.0, 15.0, 14.0, 16.0, 17.0, 9.0, 7.0, 7.0, 3.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.1748046875, -1.140380859375, -1.10595703125, -1.071533203125, -1.037109375, -1.002685546875, -0.96826171875, -0.933837890625, -0.8994140625, -0.864990234375, -0.83056640625, -0.796142578125, -0.76171875, -0.727294921875, -0.69287109375, -0.658447265625, -0.6240234375, -0.589599609375, -0.55517578125, -0.520751953125, -0.486328125, -0.451904296875, -0.41748046875, -0.383056640625, -0.3486328125, -0.314208984375, -0.27978515625, -0.245361328125, -0.2109375, -0.176513671875, -0.14208984375, -0.107666015625, -0.0732421875, -0.038818359375, -0.00439453125, 0.030029296875, 0.064453125, 0.098876953125, 0.13330078125, 0.167724609375, 0.2021484375, 0.236572265625, 0.27099609375, 0.305419921875, 0.33984375, 0.374267578125, 0.40869140625, 0.443115234375, 0.4775390625, 0.511962890625, 0.54638671875, 0.580810546875, 0.615234375, 0.649658203125, 0.68408203125, 0.718505859375, 0.7529296875, 0.787353515625, 0.82177734375, 0.856201171875, 0.890625, 0.925048828125, 0.95947265625, 0.993896484375, 1.0283203125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 6.0, 7.0, 11.0, 22.0, 35.0, 55.0, 116.0, 245.0, 470.0, 1181.0, 2935.0, 7143.0, 21159.0, 424831.0, 1601662.0, 23917.0, 7957.0, 3072.0, 1283.0, 512.0, 239.0, 117.0, 65.0, 32.0, 22.0, 12.0, 11.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.56170654296875, -2.4925537109375, -2.42340087890625, -2.354248046875, -2.28509521484375, -2.2159423828125, -2.14678955078125, -2.07763671875, -2.00848388671875, -1.9393310546875, -1.87017822265625, -1.801025390625, -1.73187255859375, -1.6627197265625, -1.59356689453125, -1.5244140625, -1.45526123046875, -1.3861083984375, -1.31695556640625, -1.247802734375, -1.17864990234375, -1.1094970703125, -1.04034423828125, -0.97119140625, -0.90203857421875, -0.8328857421875, -0.76373291015625, -0.694580078125, -0.62542724609375, -0.5562744140625, -0.48712158203125, -0.41796875, -0.34881591796875, -0.2796630859375, -0.21051025390625, -0.141357421875, -0.07220458984375, -0.0030517578125, 0.06610107421875, 0.13525390625, 0.20440673828125, 0.2735595703125, 0.34271240234375, 0.411865234375, 0.48101806640625, 0.5501708984375, 0.61932373046875, 0.6884765625, 0.75762939453125, 0.8267822265625, 0.89593505859375, 0.965087890625, 1.03424072265625, 1.1033935546875, 1.17254638671875, 1.24169921875, 1.31085205078125, 1.3800048828125, 1.44915771484375, 1.518310546875, 1.58746337890625, 1.6566162109375, 1.72576904296875, 1.794921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 14.0, 13.0, 21.0, 17.0, 35.0, 38.0, 56.0, 53.0, 69.0, 102.0, 119.0, 109.0, 67.0, 67.0, 48.0, 43.0, 33.0, 18.0, 18.0, 17.0, 15.0, 11.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09295654296875, -0.09048748016357422, -0.08801841735839844, -0.08554935455322266, -0.08308029174804688, -0.0806112289428711, -0.07814216613769531, -0.07567310333251953, -0.07320404052734375, -0.07073497772216797, -0.06826591491699219, -0.0657968521118164, -0.06332778930664062, -0.060858726501464844, -0.05838966369628906, -0.05592060089111328, -0.0534515380859375, -0.05098247528076172, -0.04851341247558594, -0.046044349670410156, -0.043575286865234375, -0.041106224060058594, -0.03863716125488281, -0.03616809844970703, -0.03369903564453125, -0.03122997283935547, -0.028760910034179688, -0.026291847229003906, -0.023822784423828125, -0.021353721618652344, -0.018884658813476562, -0.01641559600830078, -0.013946533203125, -0.011477470397949219, -0.009008407592773438, -0.006539344787597656, -0.004070281982421875, -0.0016012191772460938, 0.0008678436279296875, 0.0033369064331054688, 0.00580596923828125, 0.008275032043457031, 0.010744094848632812, 0.013213157653808594, 0.015682220458984375, 0.018151283264160156, 0.020620346069335938, 0.02308940887451172, 0.0255584716796875, 0.02802753448486328, 0.030496597290039062, 0.032965660095214844, 0.035434722900390625, 0.037903785705566406, 0.04037284851074219, 0.04284191131591797, 0.04531097412109375, 0.04778003692626953, 0.05024909973144531, 0.052718162536621094, 0.055187225341796875, 0.057656288146972656, 0.06012535095214844, 0.06259441375732422, 0.0650634765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 3.0, 8.0, 9.0, 12.0, 32.0, 25.0, 33.0, 57.0, 106.0, 210.0, 500.0, 2548.0, 112091.0, 917762.0, 13437.0, 997.0, 317.0, 141.0, 84.0, 58.0, 30.0, 32.0, 16.0, 7.0, 10.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.916015625, -0.882415771484375, -0.84881591796875, -0.815216064453125, -0.7816162109375, -0.748016357421875, -0.71441650390625, -0.680816650390625, -0.647216796875, -0.613616943359375, -0.58001708984375, -0.546417236328125, -0.5128173828125, -0.479217529296875, -0.44561767578125, -0.412017822265625, -0.37841796875, -0.344818115234375, -0.31121826171875, -0.277618408203125, -0.2440185546875, -0.210418701171875, -0.17681884765625, -0.143218994140625, -0.109619140625, -0.076019287109375, -0.04241943359375, -0.008819580078125, 0.0247802734375, 0.058380126953125, 0.09197998046875, 0.125579833984375, 0.1591796875, 0.192779541015625, 0.22637939453125, 0.259979248046875, 0.2935791015625, 0.327178955078125, 0.36077880859375, 0.394378662109375, 0.427978515625, 0.461578369140625, 0.49517822265625, 0.528778076171875, 0.5623779296875, 0.595977783203125, 0.62957763671875, 0.663177490234375, 0.69677734375, 0.730377197265625, 0.76397705078125, 0.797576904296875, 0.8311767578125, 0.864776611328125, 0.89837646484375, 0.931976318359375, 0.965576171875, 0.999176025390625, 1.03277587890625, 1.066375732421875, 1.0999755859375, 1.133575439453125, 1.16717529296875, 1.200775146484375, 1.234375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 26.0, 87.0, 270.0, 378.0, 167.0, 50.0, 15.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4994397461414337, -0.48177167773246765, -0.4641036093235016, -0.4464355409145355, -0.42876747250556946, -0.4110994040966034, -0.39343130588531494, -0.3757632374763489, -0.3580951690673828, -0.34042710065841675, -0.3227590322494507, -0.3050909638404846, -0.28742289543151855, -0.2697548270225525, -0.2520867586135864, -0.23441867530345917, -0.2167506217956543, -0.19908255338668823, -0.18141448497772217, -0.1637464165687561, -0.14607834815979004, -0.12841027975082397, -0.11074219644069672, -0.09307412803173065, -0.07540605962276459, -0.05773799121379852, -0.04006991907954216, -0.022401846945285797, -0.004733778536319733, 0.012934289872646332, 0.030602365732192993, 0.04827043414115906, 0.06593853235244751, 0.08360660076141357, 0.10127466917037964, 0.1189427450299263, 0.13661080598831177, 0.15427887439727783, 0.1719469577074051, 0.18961502611637115, 0.20728309452533722, 0.22495116293430328, 0.24261923134326935, 0.2602873146533966, 0.27795538306236267, 0.29562345147132874, 0.3132915198802948, 0.33095958828926086, 0.34862765669822693, 0.366295725107193, 0.38396379351615906, 0.4016318619251251, 0.4192999303340912, 0.43696799874305725, 0.4546360969543457, 0.47230416536331177, 0.48997223377227783, 0.5076403021812439, 0.52530837059021, 0.542976438999176, 0.5606445074081421, 0.5783125758171082, 0.5959806442260742, 0.6136487126350403, 0.6313167810440063]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 9.0, 4.0, 8.0, 15.0, 12.0, 16.0, 18.0, 23.0, 26.0, 22.0, 38.0, 51.0, 45.0, 56.0, 43.0, 45.0, 56.0, 41.0, 51.0, 40.0, 51.0, 43.0, 47.0, 40.0, 29.0, 36.0, 29.0, 14.0, 22.0, 18.0, 15.0, 10.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.18680042028427124, -0.18148207664489746, -0.17616373300552368, -0.1708453893661499, -0.16552704572677612, -0.16020870208740234, -0.15489035844802856, -0.14957201480865479, -0.144253671169281, -0.13893532752990723, -0.13361698389053345, -0.12829864025115967, -0.12298029661178589, -0.11766195297241211, -0.11234360933303833, -0.10702526569366455, -0.10170692205429077, -0.09638857841491699, -0.09107023477554321, -0.08575189113616943, -0.08043354749679565, -0.07511520385742188, -0.0697968602180481, -0.06447851657867432, -0.05916017293930054, -0.05384182929992676, -0.04852348566055298, -0.0432051420211792, -0.03788679838180542, -0.03256845474243164, -0.02725011110305786, -0.021931767463684082, -0.016613423824310303, -0.011295080184936523, -0.005976736545562744, -0.0006583929061889648, 0.0046599507331848145, 0.009978294372558594, 0.015296638011932373, 0.020614981651306152, 0.02593332529067993, 0.03125166893005371, 0.03657001256942749, 0.04188835620880127, 0.04720669984817505, 0.05252504348754883, 0.05784338712692261, 0.06316173076629639, 0.06848007440567017, 0.07379841804504395, 0.07911676168441772, 0.0844351053237915, 0.08975344896316528, 0.09507179260253906, 0.10039013624191284, 0.10570847988128662, 0.1110268235206604, 0.11634516716003418, 0.12166351079940796, 0.12698185443878174, 0.13230019807815552, 0.1376185417175293, 0.14293688535690308, 0.14825522899627686, 0.15357357263565063]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 5.0, 5.0, 4.0, 8.0, 12.0, 16.0, 15.0, 14.0, 18.0, 11.0, 25.0, 25.0, 20.0, 24.0, 26.0, 26.0, 33.0, 39.0, 50.0, 48.0, 35.0, 47.0, 38.0, 27.0, 36.0, 40.0, 45.0, 32.0, 31.0, 33.0, 19.0, 29.0, 16.0, 17.0, 18.0, 14.0, 20.0, 13.0, 11.0, 13.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.291015625, -1.247222900390625, -1.20343017578125, -1.159637451171875, -1.1158447265625, -1.072052001953125, -1.02825927734375, -0.984466552734375, -0.940673828125, -0.896881103515625, -0.85308837890625, -0.809295654296875, -0.7655029296875, -0.721710205078125, -0.67791748046875, -0.634124755859375, -0.59033203125, -0.546539306640625, -0.50274658203125, -0.458953857421875, -0.4151611328125, -0.371368408203125, -0.32757568359375, -0.283782958984375, -0.239990234375, -0.196197509765625, -0.15240478515625, -0.108612060546875, -0.0648193359375, -0.021026611328125, 0.02276611328125, 0.066558837890625, 0.1103515625, 0.154144287109375, 0.19793701171875, 0.241729736328125, 0.2855224609375, 0.329315185546875, 0.37310791015625, 0.416900634765625, 0.460693359375, 0.504486083984375, 0.54827880859375, 0.592071533203125, 0.6358642578125, 0.679656982421875, 0.72344970703125, 0.767242431640625, 0.81103515625, 0.854827880859375, 0.89862060546875, 0.942413330078125, 0.9862060546875, 1.029998779296875, 1.07379150390625, 1.117584228515625, 1.161376953125, 1.205169677734375, 1.24896240234375, 1.292755126953125, 1.3365478515625, 1.380340576171875, 1.42413330078125, 1.467926025390625, 1.51171875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 3.0, 8.0, 15.0, 17.0, 23.0, 36.0, 40.0, 95.0, 113.0, 172.0, 251.0, 395.0, 639.0, 1041.0, 1620.0, 2682.0, 4738.0, 8405.0, 15228.0, 29098.0, 64528.0, 181569.0, 421533.0, 185413.0, 65548.0, 29427.0, 15393.0, 8380.0, 4884.0, 2747.0, 1678.0, 1024.0, 612.0, 406.0, 288.0, 164.0, 113.0, 66.0, 56.0, 37.0, 16.0, 13.0, 16.0, 9.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.12109375, -3.02508544921875, -2.9290771484375, -2.83306884765625, -2.737060546875, -2.64105224609375, -2.5450439453125, -2.44903564453125, -2.35302734375, -2.25701904296875, -2.1610107421875, -2.06500244140625, -1.968994140625, -1.87298583984375, -1.7769775390625, -1.68096923828125, -1.5849609375, -1.48895263671875, -1.3929443359375, -1.29693603515625, -1.200927734375, -1.10491943359375, -1.0089111328125, -0.91290283203125, -0.81689453125, -0.72088623046875, -0.6248779296875, -0.52886962890625, -0.432861328125, -0.33685302734375, -0.2408447265625, -0.14483642578125, -0.048828125, 0.04718017578125, 0.1431884765625, 0.23919677734375, 0.335205078125, 0.43121337890625, 0.5272216796875, 0.62322998046875, 0.71923828125, 0.81524658203125, 0.9112548828125, 1.00726318359375, 1.103271484375, 1.19927978515625, 1.2952880859375, 1.39129638671875, 1.4873046875, 1.58331298828125, 1.6793212890625, 1.77532958984375, 1.871337890625, 1.96734619140625, 2.0633544921875, 2.15936279296875, 2.25537109375, 2.35137939453125, 2.4473876953125, 2.54339599609375, 2.639404296875, 2.73541259765625, 2.8314208984375, 2.92742919921875, 3.0234375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 10.0, 9.0, 14.0, 21.0, 25.0, 29.0, 26.0, 31.0, 39.0, 53.0, 64.0, 44.0, 78.0, 89.0, 175.0, 292.0, 1317.0, 155.0, 96.0, 89.0, 62.0, 48.0, 50.0, 42.0, 37.0, 25.0, 19.0, 19.0, 15.0, 13.0, 13.0, 8.0, 9.0, 4.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.484130859375, -5.32763671875, -5.171142578125, -5.0146484375, -4.858154296875, -4.70166015625, -4.545166015625, -4.388671875, -4.232177734375, -4.07568359375, -3.919189453125, -3.7626953125, -3.606201171875, -3.44970703125, -3.293212890625, -3.13671875, -2.980224609375, -2.82373046875, -2.667236328125, -2.5107421875, -2.354248046875, -2.19775390625, -2.041259765625, -1.884765625, -1.728271484375, -1.57177734375, -1.415283203125, -1.2587890625, -1.102294921875, -0.94580078125, -0.789306640625, -0.6328125, -0.476318359375, -0.31982421875, -0.163330078125, -0.0068359375, 0.149658203125, 0.30615234375, 0.462646484375, 0.619140625, 0.775634765625, 0.93212890625, 1.088623046875, 1.2451171875, 1.401611328125, 1.55810546875, 1.714599609375, 1.87109375, 2.027587890625, 2.18408203125, 2.340576171875, 2.4970703125, 2.653564453125, 2.81005859375, 2.966552734375, 3.123046875, 3.279541015625, 3.43603515625, 3.592529296875, 3.7490234375, 3.905517578125, 4.06201171875, 4.218505859375, 4.375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 18.0, 19.0, 21.0, 25.0, 34.0, 39.0, 52.0, 74.0, 131.0, 182.0, 307.0, 708.0, 2585.0, 12046.0, 90586.0, 2142988.0, 835529.0, 49465.0, 7687.0, 1792.0, 599.0, 237.0, 138.0, 99.0, 87.0, 68.0, 41.0, 35.0, 29.0, 21.0, 12.0, 12.0, 8.0, 3.0, 8.0, 2.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.91015625, -7.62628173828125, -7.3424072265625, -7.05853271484375, -6.774658203125, -6.49078369140625, -6.2069091796875, -5.92303466796875, -5.63916015625, -5.35528564453125, -5.0714111328125, -4.78753662109375, -4.503662109375, -4.21978759765625, -3.9359130859375, -3.65203857421875, -3.3681640625, -3.08428955078125, -2.8004150390625, -2.51654052734375, -2.232666015625, -1.94879150390625, -1.6649169921875, -1.38104248046875, -1.09716796875, -0.81329345703125, -0.5294189453125, -0.24554443359375, 0.038330078125, 0.32220458984375, 0.6060791015625, 0.88995361328125, 1.173828125, 1.45770263671875, 1.7415771484375, 2.02545166015625, 2.309326171875, 2.59320068359375, 2.8770751953125, 3.16094970703125, 3.44482421875, 3.72869873046875, 4.0125732421875, 4.29644775390625, 4.580322265625, 4.86419677734375, 5.1480712890625, 5.43194580078125, 5.7158203125, 5.99969482421875, 6.2835693359375, 6.56744384765625, 6.851318359375, 7.13519287109375, 7.4190673828125, 7.70294189453125, 7.98681640625, 8.27069091796875, 8.5545654296875, 8.83843994140625, 9.122314453125, 9.40618896484375, 9.6900634765625, 9.97393798828125, 10.2578125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 211.0, 721.0, 79.0, 4.0, 0.0, 1.0], "bins": [-219.1438751220703, -215.44842529296875, -211.7529754638672, -208.05752563476562, -204.36207580566406, -200.6666259765625, -196.97117614746094, -193.27572631835938, -189.58026123046875, -185.8848114013672, -182.18936157226562, -178.49391174316406, -174.7984619140625, -171.10301208496094, -167.40756225585938, -163.71209716796875, -160.01666259765625, -156.3212127685547, -152.62576293945312, -148.93031311035156, -145.23486328125, -141.53941345214844, -137.84396362304688, -134.14849853515625, -130.45306396484375, -126.75761413574219, -123.06216430664062, -119.36671447753906, -115.6712646484375, -111.97581481933594, -108.28035736083984, -104.58490753173828, -100.88945007324219, -97.19400024414062, -93.49855041503906, -89.8031005859375, -86.10765075683594, -82.41220092773438, -78.71674346923828, -75.02129364013672, -71.32584381103516, -67.6303939819336, -63.93494415283203, -60.2394905090332, -56.54404067993164, -52.84859085083008, -49.15313720703125, -45.45768737792969, -41.762237548828125, -38.06678771972656, -34.371337890625, -30.675884246826172, -26.98043441772461, -23.284984588623047, -19.58953285217285, -15.894081115722656, -12.198631286621094, -8.503180503845215, -4.807729721069336, -1.112278938293457, 2.583171844482422, 6.278621673583984, 9.97407341003418, 13.669525146484375, 17.364974975585938]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 11.0, 16.0, 11.0, 19.0, 26.0, 27.0, 26.0, 26.0, 39.0, 42.0, 47.0, 41.0, 52.0, 64.0, 41.0, 49.0, 57.0, 35.0, 31.0, 40.0, 42.0, 40.0, 25.0, 36.0, 21.0, 14.0, 18.0, 16.0, 16.0, 15.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.19316291809082, -12.701231956481934, -12.20930004119873, -11.717369079589844, -11.22543716430664, -10.733506202697754, -10.24157428741455, -9.749643325805664, -9.257711410522461, -8.765780448913574, -8.273848533630371, -7.781917095184326, -7.289985656738281, -6.7980546951293945, -6.306122779846191, -5.814191818237305, -5.32226037979126, -4.830328941345215, -4.33839750289917, -3.846466064453125, -3.35453462600708, -2.8626034259796143, -2.3706719875335693, -1.8787405490875244, -1.3868091106414795, -0.8948776721954346, -0.4029462933540344, 0.08898508548736572, 0.5809165239334106, 1.072847843170166, 1.564779281616211, 2.056710720062256, 2.548642158508301, 3.0405735969543457, 3.5325050354003906, 4.0244364738464355, 4.5163679122924805, 5.008298873901367, 5.50023078918457, 5.992161750793457, 6.48409366607666, 6.976025104522705, 7.46795654296875, 7.959887981414795, 8.45181941986084, 8.943750381469727, 9.43568229675293, 9.927613258361816, 10.419544219970703, 10.91147518157959, 11.403407096862793, 11.89533805847168, 12.387269973754883, 12.87920093536377, 13.371132850646973, 13.86306381225586, 14.354995727539062, 14.84692668914795, 15.338858604431152, 15.830789566040039, 16.322721481323242, 16.814653396606445, 17.306583404541016, 17.79851531982422, 18.290447235107422]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 4.0, 9.0, 10.0, 13.0, 17.0, 15.0, 30.0, 25.0, 29.0, 38.0, 27.0, 26.0, 39.0, 44.0, 49.0, 39.0, 43.0, 48.0, 35.0, 48.0, 33.0, 33.0, 46.0, 35.0, 41.0, 31.0, 30.0, 19.0, 22.0, 21.0, 14.0, 15.0, 14.0, 6.0, 8.0, 3.0, 5.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4047393798828125, -1.349517822265625, -1.2942962646484375, -1.23907470703125, -1.1838531494140625, -1.128631591796875, -1.0734100341796875, -1.0181884765625, -0.9629669189453125, -0.907745361328125, -0.8525238037109375, -0.79730224609375, -0.7420806884765625, -0.686859130859375, -0.6316375732421875, -0.576416015625, -0.5211944580078125, -0.465972900390625, -0.4107513427734375, -0.35552978515625, -0.3003082275390625, -0.245086669921875, -0.1898651123046875, -0.1346435546875, -0.0794219970703125, -0.024200439453125, 0.0310211181640625, 0.08624267578125, 0.1414642333984375, 0.196685791015625, 0.2519073486328125, 0.30712890625, 0.3623504638671875, 0.417572021484375, 0.4727935791015625, 0.52801513671875, 0.5832366943359375, 0.638458251953125, 0.6936798095703125, 0.7489013671875, 0.8041229248046875, 0.859344482421875, 0.9145660400390625, 0.96978759765625, 1.0250091552734375, 1.080230712890625, 1.1354522705078125, 1.190673828125, 1.2458953857421875, 1.301116943359375, 1.3563385009765625, 1.41156005859375, 1.4667816162109375, 1.522003173828125, 1.5772247314453125, 1.6324462890625, 1.6876678466796875, 1.742889404296875, 1.7981109619140625, 1.85333251953125, 1.9085540771484375, 1.963775634765625, 2.0189971923828125, 2.07421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 15.0, 17.0, 35.0, 38.0, 48.0, 74.0, 116.0, 173.0, 241.0, 348.0, 542.0, 859.0, 1246.0, 1895.0, 2946.0, 4627.0, 7816.0, 13417.0, 25393.0, 51941.0, 132887.0, 495550.0, 1725201.0, 1245348.0, 302835.0, 91271.0, 39330.0, 19943.0, 11146.0, 6648.0, 4137.0, 2743.0, 1693.0, 1173.0, 760.0, 554.0, 382.0, 245.0, 205.0, 132.0, 81.0, 69.0, 44.0, 25.0, 29.0, 16.0, 15.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0], "bins": [-2.521484375, -2.439697265625, -2.35791015625, -2.276123046875, -2.1943359375, -2.112548828125, -2.03076171875, -1.948974609375, -1.8671875, -1.785400390625, -1.70361328125, -1.621826171875, -1.5400390625, -1.458251953125, -1.37646484375, -1.294677734375, -1.212890625, -1.131103515625, -1.04931640625, -0.967529296875, -0.8857421875, -0.803955078125, -0.72216796875, -0.640380859375, -0.55859375, -0.476806640625, -0.39501953125, -0.313232421875, -0.2314453125, -0.149658203125, -0.06787109375, 0.013916015625, 0.095703125, 0.177490234375, 0.25927734375, 0.341064453125, 0.4228515625, 0.504638671875, 0.58642578125, 0.668212890625, 0.75, 0.831787109375, 0.91357421875, 0.995361328125, 1.0771484375, 1.158935546875, 1.24072265625, 1.322509765625, 1.404296875, 1.486083984375, 1.56787109375, 1.649658203125, 1.7314453125, 1.813232421875, 1.89501953125, 1.976806640625, 2.05859375, 2.140380859375, 2.22216796875, 2.303955078125, 2.3857421875, 2.467529296875, 2.54931640625, 2.631103515625, 2.712890625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 7.0, 9.0, 10.0, 10.0, 17.0, 22.0, 26.0, 49.0, 72.0, 81.0, 136.0, 189.0, 279.0, 479.0, 729.0, 676.0, 450.0, 287.0, 187.0, 97.0, 87.0, 49.0, 40.0, 27.0, 15.0, 14.0, 8.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 8.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.48828125, -5.350830078125, -5.21337890625, -5.075927734375, -4.9384765625, -4.801025390625, -4.66357421875, -4.526123046875, -4.388671875, -4.251220703125, -4.11376953125, -3.976318359375, -3.8388671875, -3.701416015625, -3.56396484375, -3.426513671875, -3.2890625, -3.151611328125, -3.01416015625, -2.876708984375, -2.7392578125, -2.601806640625, -2.46435546875, -2.326904296875, -2.189453125, -2.052001953125, -1.91455078125, -1.777099609375, -1.6396484375, -1.502197265625, -1.36474609375, -1.227294921875, -1.08984375, -0.952392578125, -0.81494140625, -0.677490234375, -0.5400390625, -0.402587890625, -0.26513671875, -0.127685546875, 0.009765625, 0.147216796875, 0.28466796875, 0.422119140625, 0.5595703125, 0.697021484375, 0.83447265625, 0.971923828125, 1.109375, 1.246826171875, 1.38427734375, 1.521728515625, 1.6591796875, 1.796630859375, 1.93408203125, 2.071533203125, 2.208984375, 2.346435546875, 2.48388671875, 2.621337890625, 2.7587890625, 2.896240234375, 3.03369140625, 3.171142578125, 3.30859375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 11.0, 16.0, 27.0, 42.0, 45.0, 91.0, 161.0, 291.0, 791.0, 3134.0, 17459.0, 178373.0, 3487431.0, 466664.0, 32503.0, 5065.0, 1192.0, 464.0, 212.0, 103.0, 55.0, 44.0, 26.0, 15.0, 17.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.4549560546875, -9.113037109375, -8.7711181640625, -8.42919921875, -8.0872802734375, -7.745361328125, -7.4034423828125, -7.0615234375, -6.7196044921875, -6.377685546875, -6.0357666015625, -5.69384765625, -5.3519287109375, -5.010009765625, -4.6680908203125, -4.326171875, -3.9842529296875, -3.642333984375, -3.3004150390625, -2.95849609375, -2.6165771484375, -2.274658203125, -1.9327392578125, -1.5908203125, -1.2489013671875, -0.906982421875, -0.5650634765625, -0.22314453125, 0.1187744140625, 0.460693359375, 0.8026123046875, 1.14453125, 1.4864501953125, 1.828369140625, 2.1702880859375, 2.51220703125, 2.8541259765625, 3.196044921875, 3.5379638671875, 3.8798828125, 4.2218017578125, 4.563720703125, 4.9056396484375, 5.24755859375, 5.5894775390625, 5.931396484375, 6.2733154296875, 6.615234375, 6.9571533203125, 7.299072265625, 7.6409912109375, 7.98291015625, 8.3248291015625, 8.666748046875, 9.0086669921875, 9.3505859375, 9.6925048828125, 10.034423828125, 10.3763427734375, 10.71826171875, 11.0601806640625, 11.402099609375, 11.7440185546875, 12.0859375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 17.0, 41.0, 103.0, 210.0, 220.0, 194.0, 115.0, 66.0, 25.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.82265853881836, -46.48038101196289, -45.13810348510742, -43.79582977294922, -42.45355224609375, -41.11127471923828, -39.76899719238281, -38.426719665527344, -37.084442138671875, -35.742164611816406, -34.39988708496094, -33.05760955810547, -31.715335845947266, -30.373058319091797, -29.030780792236328, -27.68850326538086, -26.346229553222656, -25.003952026367188, -23.66167640686035, -22.319398880004883, -20.977123260498047, -19.634845733642578, -18.29256820678711, -16.95029067993164, -15.608015060424805, -14.265738487243652, -12.9234619140625, -11.581184387207031, -10.238907814025879, -8.896631240844727, -7.554353713989258, -6.2120771408081055, -4.869804382324219, -3.5275275707244873, -2.185250759124756, -0.8429737091064453, 0.49930286407470703, 1.8415794372558594, 3.183856964111328, 4.5261335372924805, 5.868410110473633, 7.210686683654785, 8.552963256835938, 9.895240783691406, 11.237517356872559, 12.579793930053711, 13.92207145690918, 15.264348030090332, 16.606624603271484, 17.948902130126953, 19.29117774963379, 20.633455276489258, 21.975730895996094, 23.318008422851562, 24.66028594970703, 26.0025634765625, 27.344839096069336, 28.687116622924805, 30.02939224243164, 31.37166976928711, 32.71394729614258, 34.05622100830078, 35.39849853515625, 36.74077606201172, 38.08305358886719]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 9.0, 13.0, 13.0, 17.0, 17.0, 30.0, 27.0, 19.0, 34.0, 30.0, 28.0, 44.0, 44.0, 39.0, 44.0, 31.0, 46.0, 45.0, 42.0, 44.0, 37.0, 30.0, 31.0, 21.0, 35.0, 28.0, 31.0, 25.0, 29.0, 12.0, 23.0, 7.0, 18.0, 12.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.551460266113281, -12.194915771484375, -11.838371276855469, -11.481827735900879, -11.125283241271973, -10.768738746643066, -10.412195205688477, -10.05565071105957, -9.699106216430664, -9.342561721801758, -8.986017227172852, -8.629473686218262, -8.272929191589355, -7.916384696960449, -7.559840679168701, -7.203296661376953, -6.846752166748047, -6.490207672119141, -6.133663654327393, -5.7771196365356445, -5.420575141906738, -5.064030647277832, -4.707486629486084, -4.350942611694336, -3.9943981170654297, -3.6378538608551025, -3.2813096046447754, -2.9247653484344482, -2.568221092224121, -2.211676836013794, -1.8551325798034668, -1.4985883235931396, -1.142045021057129, -0.7855007648468018, -0.4289565086364746, -0.07241225242614746, 0.2841320037841797, 0.6406762599945068, 0.997220516204834, 1.3537647724151611, 1.7103090286254883, 2.0668532848358154, 2.4233975410461426, 2.7799417972564697, 3.136486053466797, 3.493030309677124, 3.849574565887451, 4.206118583679199, 4.5626630783081055, 4.919207572937012, 5.27575159072876, 5.632295608520508, 5.988840103149414, 6.34538459777832, 6.701928615570068, 7.058472633361816, 7.415017127990723, 7.771561622619629, 8.128105163574219, 8.484649658203125, 8.841194152832031, 9.197738647460938, 9.554283142089844, 9.910826683044434, 10.26737117767334]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 11.0, 13.0, 4.0, 10.0, 12.0, 14.0, 15.0, 20.0, 22.0, 19.0, 31.0, 27.0, 33.0, 29.0, 31.0, 35.0, 39.0, 39.0, 36.0, 30.0, 36.0, 48.0, 36.0, 36.0, 30.0, 43.0, 36.0, 27.0, 27.0, 27.0, 34.0, 22.0, 14.0, 17.0, 15.0, 13.0, 11.0, 10.0, 10.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.40234375, -1.355499267578125, -1.30865478515625, -1.261810302734375, -1.2149658203125, -1.168121337890625, -1.12127685546875, -1.074432373046875, -1.027587890625, -0.980743408203125, -0.93389892578125, -0.887054443359375, -0.8402099609375, -0.793365478515625, -0.74652099609375, -0.699676513671875, -0.65283203125, -0.605987548828125, -0.55914306640625, -0.512298583984375, -0.4654541015625, -0.418609619140625, -0.37176513671875, -0.324920654296875, -0.278076171875, -0.231231689453125, -0.18438720703125, -0.137542724609375, -0.0906982421875, -0.043853759765625, 0.00299072265625, 0.049835205078125, 0.0966796875, 0.143524169921875, 0.19036865234375, 0.237213134765625, 0.2840576171875, 0.330902099609375, 0.37774658203125, 0.424591064453125, 0.471435546875, 0.518280029296875, 0.56512451171875, 0.611968994140625, 0.6588134765625, 0.705657958984375, 0.75250244140625, 0.799346923828125, 0.84619140625, 0.893035888671875, 0.93988037109375, 0.986724853515625, 1.0335693359375, 1.080413818359375, 1.12725830078125, 1.174102783203125, 1.220947265625, 1.267791748046875, 1.31463623046875, 1.361480712890625, 1.4083251953125, 1.455169677734375, 1.50201416015625, 1.548858642578125, 1.595703125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 7.0, 15.0, 30.0, 28.0, 43.0, 62.0, 71.0, 127.0, 165.0, 280.0, 409.0, 594.0, 939.0, 1418.0, 2182.0, 3401.0, 5200.0, 8469.0, 13853.0, 22507.0, 38471.0, 66816.0, 120873.0, 218519.0, 232464.0, 132727.0, 72706.0, 41783.0, 24594.0, 14818.0, 8948.0, 5687.0, 3629.0, 2240.0, 1521.0, 978.0, 618.0, 448.0, 304.0, 196.0, 147.0, 84.0, 62.0, 42.0, 24.0, 6.0, 23.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.471435546875, -0.4562644958496094, -0.44109344482421875, -0.4259223937988281, -0.4107513427734375, -0.3955802917480469, -0.38040924072265625, -0.3652381896972656, -0.350067138671875, -0.3348960876464844, -0.31972503662109375, -0.3045539855957031, -0.2893829345703125, -0.2742118835449219, -0.25904083251953125, -0.24386978149414062, -0.22869873046875, -0.21352767944335938, -0.19835662841796875, -0.18318557739257812, -0.1680145263671875, -0.15284347534179688, -0.13767242431640625, -0.12250137329101562, -0.107330322265625, -0.09215927124023438, -0.07698822021484375, -0.061817169189453125, -0.0466461181640625, -0.031475067138671875, -0.01630401611328125, -0.001132965087890625, 0.0140380859375, 0.029209136962890625, 0.04438018798828125, 0.059551239013671875, 0.0747222900390625, 0.08989334106445312, 0.10506439208984375, 0.12023544311523438, 0.135406494140625, 0.15057754516601562, 0.16574859619140625, 0.18091964721679688, 0.1960906982421875, 0.21126174926757812, 0.22643280029296875, 0.24160385131835938, 0.25677490234375, 0.2719459533691406, 0.28711700439453125, 0.3022880554199219, 0.3174591064453125, 0.3326301574707031, 0.34780120849609375, 0.3629722595214844, 0.378143310546875, 0.3933143615722656, 0.40848541259765625, 0.4236564636230469, 0.4388275146484375, 0.4539985656738281, 0.46916961669921875, 0.4843406677246094, 0.49951171875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 10.0, 6.0, 10.0, 8.0, 12.0, 10.0, 6.0, 12.0, 20.0, 15.0, 22.0, 27.0, 24.0, 25.0, 40.0, 26.0, 42.0, 42.0, 38.0, 42.0, 33.0, 1062.0, 39.0, 48.0, 36.0, 46.0, 37.0, 37.0, 31.0, 34.0, 41.0, 21.0, 27.0, 18.0, 19.0, 16.0, 5.0, 6.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.993438720703125, -0.95660400390625, -0.919769287109375, -0.8829345703125, -0.846099853515625, -0.80926513671875, -0.772430419921875, -0.735595703125, -0.698760986328125, -0.66192626953125, -0.625091552734375, -0.5882568359375, -0.551422119140625, -0.51458740234375, -0.477752685546875, -0.44091796875, -0.404083251953125, -0.36724853515625, -0.330413818359375, -0.2935791015625, -0.256744384765625, -0.21990966796875, -0.183074951171875, -0.146240234375, -0.109405517578125, -0.07257080078125, -0.035736083984375, 0.0010986328125, 0.037933349609375, 0.07476806640625, 0.111602783203125, 0.1484375, 0.185272216796875, 0.22210693359375, 0.258941650390625, 0.2957763671875, 0.332611083984375, 0.36944580078125, 0.406280517578125, 0.443115234375, 0.479949951171875, 0.51678466796875, 0.553619384765625, 0.5904541015625, 0.627288818359375, 0.66412353515625, 0.700958251953125, 0.73779296875, 0.774627685546875, 0.81146240234375, 0.848297119140625, 0.8851318359375, 0.921966552734375, 0.95880126953125, 0.995635986328125, 1.032470703125, 1.069305419921875, 1.10614013671875, 1.142974853515625, 1.1798095703125, 1.216644287109375, 1.25347900390625, 1.290313720703125, 1.3271484375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 5.0, 2.0, 10.0, 10.0, 14.0, 30.0, 39.0, 53.0, 102.0, 220.0, 487.0, 1195.0, 2689.0, 6866.0, 20147.0, 149892.0, 1859847.0, 37280.0, 10983.0, 4097.0, 1714.0, 708.0, 301.0, 176.0, 91.0, 59.0, 31.0, 25.0, 16.0, 10.0, 9.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.98828125, -1.937591552734375, -1.88690185546875, -1.836212158203125, -1.7855224609375, -1.734832763671875, -1.68414306640625, -1.633453369140625, -1.582763671875, -1.532073974609375, -1.48138427734375, -1.430694580078125, -1.3800048828125, -1.329315185546875, -1.27862548828125, -1.227935791015625, -1.17724609375, -1.126556396484375, -1.07586669921875, -1.025177001953125, -0.9744873046875, -0.923797607421875, -0.87310791015625, -0.822418212890625, -0.771728515625, -0.721038818359375, -0.67034912109375, -0.619659423828125, -0.5689697265625, -0.518280029296875, -0.46759033203125, -0.416900634765625, -0.3662109375, -0.315521240234375, -0.26483154296875, -0.214141845703125, -0.1634521484375, -0.112762451171875, -0.06207275390625, -0.011383056640625, 0.039306640625, 0.089996337890625, 0.14068603515625, 0.191375732421875, 0.2420654296875, 0.292755126953125, 0.34344482421875, 0.394134521484375, 0.44482421875, 0.495513916015625, 0.54620361328125, 0.596893310546875, 0.6475830078125, 0.698272705078125, 0.74896240234375, 0.799652099609375, 0.850341796875, 0.901031494140625, 0.95172119140625, 1.002410888671875, 1.0531005859375, 1.103790283203125, 1.15447998046875, 1.205169677734375, 1.255859375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 1.0, 9.0, 10.0, 13.0, 19.0, 31.0, 47.0, 48.0, 65.0, 109.0, 132.0, 128.0, 109.0, 75.0, 56.0, 38.0, 26.0, 26.0, 11.0, 17.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05712890625, -0.0552978515625, -0.053466796875, -0.0516357421875, -0.0498046875, -0.0479736328125, -0.046142578125, -0.0443115234375, -0.04248046875, -0.0406494140625, -0.038818359375, -0.0369873046875, -0.03515625, -0.0333251953125, -0.031494140625, -0.0296630859375, -0.02783203125, -0.0260009765625, -0.024169921875, -0.0223388671875, -0.0205078125, -0.0186767578125, -0.016845703125, -0.0150146484375, -0.01318359375, -0.0113525390625, -0.009521484375, -0.0076904296875, -0.005859375, -0.0040283203125, -0.002197265625, -0.0003662109375, 0.00146484375, 0.0032958984375, 0.005126953125, 0.0069580078125, 0.0087890625, 0.0106201171875, 0.012451171875, 0.0142822265625, 0.01611328125, 0.0179443359375, 0.019775390625, 0.0216064453125, 0.0234375, 0.0252685546875, 0.027099609375, 0.0289306640625, 0.03076171875, 0.0325927734375, 0.034423828125, 0.0362548828125, 0.0380859375, 0.0399169921875, 0.041748046875, 0.0435791015625, 0.04541015625, 0.0472412109375, 0.049072265625, 0.0509033203125, 0.052734375, 0.0545654296875, 0.056396484375, 0.0582275390625, 0.06005859375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 7.0, 12.0, 13.0, 21.0, 31.0, 55.0, 77.0, 166.0, 624.0, 11743.0, 999874.0, 34497.0, 914.0, 226.0, 102.0, 71.0, 44.0, 23.0, 10.0, 7.0, 9.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0431976318359375, -1.011199951171875, -0.9792022705078125, -0.94720458984375, -0.9152069091796875, -0.883209228515625, -0.8512115478515625, -0.8192138671875, -0.7872161865234375, -0.755218505859375, -0.7232208251953125, -0.69122314453125, -0.6592254638671875, -0.627227783203125, -0.5952301025390625, -0.563232421875, -0.5312347412109375, -0.499237060546875, -0.4672393798828125, -0.43524169921875, -0.4032440185546875, -0.371246337890625, -0.3392486572265625, -0.3072509765625, -0.2752532958984375, -0.243255615234375, -0.2112579345703125, -0.17926025390625, -0.1472625732421875, -0.115264892578125, -0.0832672119140625, -0.05126953125, -0.0192718505859375, 0.012725830078125, 0.0447235107421875, 0.07672119140625, 0.1087188720703125, 0.140716552734375, 0.1727142333984375, 0.2047119140625, 0.2367095947265625, 0.268707275390625, 0.3007049560546875, 0.33270263671875, 0.3647003173828125, 0.396697998046875, 0.4286956787109375, 0.460693359375, 0.4926910400390625, 0.524688720703125, 0.5566864013671875, 0.58868408203125, 0.6206817626953125, 0.652679443359375, 0.6846771240234375, 0.7166748046875, 0.7486724853515625, 0.780670166015625, 0.8126678466796875, 0.84466552734375, 0.8766632080078125, 0.908660888671875, 0.9406585693359375, 0.97265625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 35.0, 101.0, 265.0, 304.0, 190.0, 69.0, 31.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09084304422140121, -0.07983092963695526, -0.06881880760192871, -0.05780669301748276, -0.046794578433036804, -0.03578246384859085, -0.0247703418135643, -0.013758227229118347, -0.002746112644672394, 0.008266003802418709, 0.01927812024950981, 0.030290238559246063, 0.04130235314369202, 0.05231446772813797, 0.06332658976316452, 0.07433870434761047, 0.08535081893205643, 0.09636293351650238, 0.10737505555152893, 0.11838717013597488, 0.12939928472042084, 0.1404114067554474, 0.15142351388931274, 0.1624356359243393, 0.17344775795936584, 0.1844598799943924, 0.19547198712825775, 0.2064841091632843, 0.21749621629714966, 0.2285083383321762, 0.23952046036720276, 0.2505325675010681, 0.26154470443725586, 0.2725568115711212, 0.28356894850730896, 0.2945810556411743, 0.3055931627750397, 0.31660526990890503, 0.3276174068450928, 0.33862951397895813, 0.3496416211128235, 0.36065372824668884, 0.3716658651828766, 0.38267797231674194, 0.3936900794506073, 0.40470218658447266, 0.4157143235206604, 0.42672643065452576, 0.4377385675907135, 0.44875067472457886, 0.4597628116607666, 0.47077491879463196, 0.4817870259284973, 0.49279916286468506, 0.503811240196228, 0.5148233771324158, 0.5258355140686035, 0.5368476510047913, 0.5478597283363342, 0.558871865272522, 0.5698840022087097, 0.5808960795402527, 0.5919082164764404, 0.6029203534126282, 0.6139324307441711]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 6.0, 11.0, 17.0, 14.0, 22.0, 16.0, 28.0, 46.0, 27.0, 37.0, 41.0, 43.0, 29.0, 43.0, 45.0, 49.0, 54.0, 52.0, 28.0, 52.0, 38.0, 38.0, 30.0, 36.0, 29.0, 26.0, 19.0, 16.0, 21.0, 14.0, 13.0, 12.0, 6.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0626574158668518, -0.06091519817709923, -0.05917298048734665, -0.05743076652288437, -0.05568854883313179, -0.05394633114337921, -0.05220411717891693, -0.05046189948916435, -0.048719681799411774, -0.046977464109659195, -0.045235246419906616, -0.043493032455444336, -0.04175081476569176, -0.04000859707593918, -0.0382663831114769, -0.03652416542172432, -0.03478194773197174, -0.03303973004221916, -0.03129751235246658, -0.029555298388004303, -0.027813080698251724, -0.026070863008499146, -0.024328647181391716, -0.022586431354284286, -0.020844213664531708, -0.01910199597477913, -0.0173597801476717, -0.015617563389241695, -0.013875346630811691, -0.012133129872381687, -0.010390913113951683, -0.008648696355521679, -0.006906479597091675, -0.005164262838661671, -0.0034220460802316666, -0.0016798293218016624, 6.238743662834167e-05, 0.0018046041950583458, 0.00354682095348835, 0.005289037711918354, 0.007031254470348358, 0.008773471228778362, 0.010515687987208366, 0.01225790474563837, 0.014000121504068375, 0.015742339193820953, 0.017484555020928383, 0.019226770848035812, 0.02096898853778839, 0.02271120622754097, 0.0244534220546484, 0.02619563788175583, 0.027937855571508408, 0.029680073261260986, 0.03142228722572327, 0.033164504915475845, 0.034906722605228424, 0.036648940294981, 0.03839115798473358, 0.04013337194919586, 0.04187558963894844, 0.04361780732870102, 0.0453600212931633, 0.04710223898291588, 0.04884445667266846]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 11.0, 12.0, 6.0, 10.0, 11.0, 14.0, 16.0, 20.0, 20.0, 20.0, 32.0, 26.0, 34.0, 28.0, 30.0, 33.0, 44.0, 36.0, 36.0, 31.0, 36.0, 46.0, 36.0, 35.0, 33.0, 41.0, 35.0, 30.0, 28.0, 23.0, 36.0, 22.0, 13.0, 19.0, 17.0, 11.0, 11.0, 11.0, 9.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.4052734375, -1.3584136962890625, -1.311553955078125, -1.2646942138671875, -1.21783447265625, -1.1709747314453125, -1.124114990234375, -1.0772552490234375, -1.0303955078125, -0.9835357666015625, -0.936676025390625, -0.8898162841796875, -0.84295654296875, -0.7960968017578125, -0.749237060546875, -0.7023773193359375, -0.655517578125, -0.6086578369140625, -0.561798095703125, -0.5149383544921875, -0.46807861328125, -0.4212188720703125, -0.374359130859375, -0.3274993896484375, -0.2806396484375, -0.2337799072265625, -0.186920166015625, -0.1400604248046875, -0.09320068359375, -0.0463409423828125, 0.000518798828125, 0.0473785400390625, 0.09423828125, 0.1410980224609375, 0.187957763671875, 0.2348175048828125, 0.28167724609375, 0.3285369873046875, 0.375396728515625, 0.4222564697265625, 0.4691162109375, 0.5159759521484375, 0.562835693359375, 0.6096954345703125, 0.65655517578125, 0.7034149169921875, 0.750274658203125, 0.7971343994140625, 0.843994140625, 0.8908538818359375, 0.937713623046875, 0.9845733642578125, 1.03143310546875, 1.0782928466796875, 1.125152587890625, 1.1720123291015625, 1.2188720703125, 1.2657318115234375, 1.312591552734375, 1.3594512939453125, 1.40631103515625, 1.4531707763671875, 1.500030517578125, 1.5468902587890625, 1.59375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 6.0, 5.0, 5.0, 7.0, 6.0, 8.0, 20.0, 33.0, 42.0, 49.0, 61.0, 103.0, 140.0, 235.0, 291.0, 424.0, 586.0, 878.0, 1319.0, 1950.0, 2779.0, 4647.0, 7535.0, 12705.0, 22816.0, 47889.0, 130809.0, 408342.0, 246743.0, 80107.0, 33532.0, 17355.0, 10038.0, 5880.0, 3682.0, 2453.0, 1594.0, 1093.0, 737.0, 473.0, 337.0, 246.0, 166.0, 112.0, 95.0, 69.0, 36.0, 35.0, 27.0, 19.0, 15.0, 9.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.5, -2.41876220703125, -2.3375244140625, -2.25628662109375, -2.175048828125, -2.09381103515625, -2.0125732421875, -1.93133544921875, -1.85009765625, -1.76885986328125, -1.6876220703125, -1.60638427734375, -1.525146484375, -1.44390869140625, -1.3626708984375, -1.28143310546875, -1.2001953125, -1.11895751953125, -1.0377197265625, -0.95648193359375, -0.875244140625, -0.79400634765625, -0.7127685546875, -0.63153076171875, -0.55029296875, -0.46905517578125, -0.3878173828125, -0.30657958984375, -0.225341796875, -0.14410400390625, -0.0628662109375, 0.01837158203125, 0.099609375, 0.18084716796875, 0.2620849609375, 0.34332275390625, 0.424560546875, 0.50579833984375, 0.5870361328125, 0.66827392578125, 0.74951171875, 0.83074951171875, 0.9119873046875, 0.99322509765625, 1.074462890625, 1.15570068359375, 1.2369384765625, 1.31817626953125, 1.3994140625, 1.48065185546875, 1.5618896484375, 1.64312744140625, 1.724365234375, 1.80560302734375, 1.8868408203125, 1.96807861328125, 2.04931640625, 2.13055419921875, 2.2117919921875, 2.29302978515625, 2.374267578125, 2.45550537109375, 2.5367431640625, 2.61798095703125, 2.69921875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 6.0, 6.0, 8.0, 7.0, 9.0, 13.0, 13.0, 18.0, 27.0, 18.0, 13.0, 29.0, 35.0, 46.0, 40.0, 55.0, 69.0, 92.0, 139.0, 216.0, 1389.0, 190.0, 122.0, 83.0, 58.0, 46.0, 31.0, 49.0, 31.0, 28.0, 18.0, 29.0, 20.0, 12.0, 11.0, 11.0, 9.0, 11.0, 10.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2890625, -4.1375732421875, -3.986083984375, -3.8345947265625, -3.68310546875, -3.5316162109375, -3.380126953125, -3.2286376953125, -3.0771484375, -2.9256591796875, -2.774169921875, -2.6226806640625, -2.47119140625, -2.3197021484375, -2.168212890625, -2.0167236328125, -1.865234375, -1.7137451171875, -1.562255859375, -1.4107666015625, -1.25927734375, -1.1077880859375, -0.956298828125, -0.8048095703125, -0.6533203125, -0.5018310546875, -0.350341796875, -0.1988525390625, -0.04736328125, 0.1041259765625, 0.255615234375, 0.4071044921875, 0.55859375, 0.7100830078125, 0.861572265625, 1.0130615234375, 1.16455078125, 1.3160400390625, 1.467529296875, 1.6190185546875, 1.7705078125, 1.9219970703125, 2.073486328125, 2.2249755859375, 2.37646484375, 2.5279541015625, 2.679443359375, 2.8309326171875, 2.982421875, 3.1339111328125, 3.285400390625, 3.4368896484375, 3.58837890625, 3.7398681640625, 3.891357421875, 4.0428466796875, 4.1943359375, 4.3458251953125, 4.497314453125, 4.6488037109375, 4.80029296875, 4.9517822265625, 5.103271484375, 5.2547607421875, 5.40625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 10.0, 10.0, 8.0, 8.0, 13.0, 24.0, 27.0, 38.0, 46.0, 62.0, 108.0, 122.0, 230.0, 344.0, 692.0, 2251.0, 12783.0, 190107.0, 2816861.0, 109343.0, 9222.0, 1770.0, 644.0, 353.0, 191.0, 129.0, 81.0, 61.0, 49.0, 39.0, 19.0, 21.0, 15.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.4395751953125, -9.082275390625, -8.7249755859375, -8.36767578125, -8.0103759765625, -7.653076171875, -7.2957763671875, -6.9384765625, -6.5811767578125, -6.223876953125, -5.8665771484375, -5.50927734375, -5.1519775390625, -4.794677734375, -4.4373779296875, -4.080078125, -3.7227783203125, -3.365478515625, -3.0081787109375, -2.65087890625, -2.2935791015625, -1.936279296875, -1.5789794921875, -1.2216796875, -0.8643798828125, -0.507080078125, -0.1497802734375, 0.20751953125, 0.5648193359375, 0.922119140625, 1.2794189453125, 1.63671875, 1.9940185546875, 2.351318359375, 2.7086181640625, 3.06591796875, 3.4232177734375, 3.780517578125, 4.1378173828125, 4.4951171875, 4.8524169921875, 5.209716796875, 5.5670166015625, 5.92431640625, 6.2816162109375, 6.638916015625, 6.9962158203125, 7.353515625, 7.7108154296875, 8.068115234375, 8.4254150390625, 8.78271484375, 9.1400146484375, 9.497314453125, 9.8546142578125, 10.2119140625, 10.5692138671875, 10.926513671875, 11.2838134765625, 11.64111328125, 11.9984130859375, 12.355712890625, 12.7130126953125, 13.0703125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 23.0, 132.0, 387.0, 342.0, 98.0, 24.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.60494232177734, -87.91011047363281, -86.21527099609375, -84.52043914794922, -82.82560729980469, -81.13077545166016, -79.4359359741211, -77.74110412597656, -76.04627227783203, -74.3514404296875, -72.65660095214844, -70.9617691040039, -69.26693725585938, -67.57210540771484, -65.87726593017578, -64.18243408203125, -62.48759841918945, -60.792762756347656, -59.097930908203125, -57.40309524536133, -55.7082633972168, -54.013427734375, -52.31859588623047, -50.62376022338867, -48.928924560546875, -47.23408889770508, -45.53925704956055, -43.84442138671875, -42.14958953857422, -40.45475387573242, -38.759918212890625, -37.065086364746094, -35.37025451660156, -33.675418853759766, -31.980587005615234, -30.285751342773438, -28.590919494628906, -26.89608383178711, -25.201250076293945, -23.50641632080078, -21.81158447265625, -20.116750717163086, -18.421916961669922, -16.727081298828125, -15.032248497009277, -13.337414741516113, -11.642580032348633, -9.947746276855469, -8.252912521362305, -6.558078765869141, -4.863244533538818, -3.168410301208496, -1.473576545715332, 0.22125720977783203, 1.9160919189453125, 3.6109256744384766, 5.305759429931641, 7.000593185424805, 8.695426940917969, 10.39026165008545, 12.085095405578613, 13.779929161071777, 15.474763870239258, 17.169597625732422, 18.864431381225586]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 12.0, 10.0, 11.0, 15.0, 17.0, 19.0, 16.0, 21.0, 27.0, 24.0, 29.0, 30.0, 29.0, 39.0, 50.0, 37.0, 41.0, 28.0, 33.0, 42.0, 48.0, 38.0, 23.0, 35.0, 35.0, 33.0, 27.0, 22.0, 24.0, 20.0, 21.0, 24.0, 16.0, 17.0, 19.0, 14.0, 9.0, 12.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.580638885498047, -12.16757583618164, -11.754511833190918, -11.341448783874512, -10.928384780883789, -10.515321731567383, -10.102258682250977, -9.68919563293457, -9.276131629943848, -8.863068580627441, -8.450004577636719, -8.036941528320312, -7.623878002166748, -7.210814476013184, -6.797751426696777, -6.384687900543213, -5.971624374389648, -5.558560848236084, -5.1454973220825195, -4.732434272766113, -4.319370746612549, -3.9063072204589844, -3.493243932723999, -3.0801806449890137, -2.667117118835449, -2.2540535926818848, -1.8409903049468994, -1.4279268980026245, -1.0148634910583496, -0.6017999649047852, -0.1887366771697998, 0.22432661056518555, 0.63739013671875, 1.050453543663025, 1.4635169506072998, 1.8765803575515747, 2.2896437644958496, 2.702707290649414, 3.1157705783843994, 3.5288338661193848, 3.941897392272949, 4.354960918426514, 4.768024444580078, 5.181087493896484, 5.594151020050049, 6.007214546203613, 6.4202775955200195, 6.833341121673584, 7.246404647827148, 7.659468173980713, 8.072531700134277, 8.485594749450684, 8.898658752441406, 9.311721801757812, 9.724784851074219, 10.137847900390625, 10.550911903381348, 10.963974952697754, 11.377038955688477, 11.790102005004883, 12.203165054321289, 12.616229057312012, 13.029292106628418, 13.44235610961914, 13.855419158935547]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 13.0, 14.0, 12.0, 22.0, 18.0, 19.0, 25.0, 29.0, 38.0, 34.0, 26.0, 38.0, 35.0, 40.0, 41.0, 29.0, 29.0, 42.0, 38.0, 45.0, 31.0, 29.0, 38.0, 42.0, 32.0, 23.0, 32.0, 31.0, 16.0, 15.0, 18.0, 14.0, 8.0, 11.0, 5.0, 6.0, 7.0, 8.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.6806640625, -1.627288818359375, -1.57391357421875, -1.520538330078125, -1.4671630859375, -1.413787841796875, -1.36041259765625, -1.307037353515625, -1.253662109375, -1.200286865234375, -1.14691162109375, -1.093536376953125, -1.0401611328125, -0.986785888671875, -0.93341064453125, -0.880035400390625, -0.82666015625, -0.773284912109375, -0.71990966796875, -0.666534423828125, -0.6131591796875, -0.559783935546875, -0.50640869140625, -0.453033447265625, -0.399658203125, -0.346282958984375, -0.29290771484375, -0.239532470703125, -0.1861572265625, -0.132781982421875, -0.07940673828125, -0.026031494140625, 0.02734375, 0.080718994140625, 0.13409423828125, 0.187469482421875, 0.2408447265625, 0.294219970703125, 0.34759521484375, 0.400970458984375, 0.454345703125, 0.507720947265625, 0.56109619140625, 0.614471435546875, 0.6678466796875, 0.721221923828125, 0.77459716796875, 0.827972412109375, 0.88134765625, 0.934722900390625, 0.98809814453125, 1.041473388671875, 1.0948486328125, 1.148223876953125, 1.20159912109375, 1.254974365234375, 1.308349609375, 1.361724853515625, 1.41510009765625, 1.468475341796875, 1.5218505859375, 1.575225830078125, 1.62860107421875, 1.681976318359375, 1.7353515625]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 11.0, 17.0, 19.0, 15.0, 37.0, 45.0, 70.0, 119.0, 172.0, 227.0, 354.0, 593.0, 914.0, 1638.0, 2937.0, 5397.0, 10322.0, 21858.0, 52736.0, 170015.0, 921887.0, 2207055.0, 597042.0, 121117.0, 41503.0, 18036.0, 8716.0, 4616.0, 2629.0, 1474.0, 934.0, 630.0, 357.0, 239.0, 169.0, 126.0, 67.0, 51.0, 36.0, 30.0, 19.0, 12.0, 5.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.12890625, -3.02239990234375, -2.9158935546875, -2.80938720703125, -2.702880859375, -2.59637451171875, -2.4898681640625, -2.38336181640625, -2.27685546875, -2.17034912109375, -2.0638427734375, -1.95733642578125, -1.850830078125, -1.74432373046875, -1.6378173828125, -1.53131103515625, -1.4248046875, -1.31829833984375, -1.2117919921875, -1.10528564453125, -0.998779296875, -0.89227294921875, -0.7857666015625, -0.67926025390625, -0.57275390625, -0.46624755859375, -0.3597412109375, -0.25323486328125, -0.146728515625, -0.04022216796875, 0.0662841796875, 0.17279052734375, 0.279296875, 0.38580322265625, 0.4923095703125, 0.59881591796875, 0.705322265625, 0.81182861328125, 0.9183349609375, 1.02484130859375, 1.13134765625, 1.23785400390625, 1.3443603515625, 1.45086669921875, 1.557373046875, 1.66387939453125, 1.7703857421875, 1.87689208984375, 1.9833984375, 2.08990478515625, 2.1964111328125, 2.30291748046875, 2.409423828125, 2.51593017578125, 2.6224365234375, 2.72894287109375, 2.83544921875, 2.94195556640625, 3.0484619140625, 3.15496826171875, 3.261474609375, 3.36798095703125, 3.4744873046875, 3.58099365234375, 3.6875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 8.0, 6.0, 8.0, 7.0, 21.0, 33.0, 25.0, 44.0, 52.0, 53.0, 84.0, 92.0, 161.0, 221.0, 323.0, 445.0, 527.0, 522.0, 392.0, 304.0, 195.0, 124.0, 86.0, 70.0, 57.0, 42.0, 38.0, 34.0, 19.0, 10.0, 18.0, 10.0, 6.0, 8.0, 5.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3046875, -3.194061279296875, -3.08343505859375, -2.972808837890625, -2.8621826171875, -2.751556396484375, -2.64093017578125, -2.530303955078125, -2.419677734375, -2.309051513671875, -2.19842529296875, -2.087799072265625, -1.9771728515625, -1.866546630859375, -1.75592041015625, -1.645294189453125, -1.53466796875, -1.424041748046875, -1.31341552734375, -1.202789306640625, -1.0921630859375, -0.981536865234375, -0.87091064453125, -0.760284423828125, -0.649658203125, -0.539031982421875, -0.42840576171875, -0.317779541015625, -0.2071533203125, -0.096527099609375, 0.01409912109375, 0.124725341796875, 0.2353515625, 0.345977783203125, 0.45660400390625, 0.567230224609375, 0.6778564453125, 0.788482666015625, 0.89910888671875, 1.009735107421875, 1.120361328125, 1.230987548828125, 1.34161376953125, 1.452239990234375, 1.5628662109375, 1.673492431640625, 1.78411865234375, 1.894744873046875, 2.00537109375, 2.115997314453125, 2.22662353515625, 2.337249755859375, 2.4478759765625, 2.558502197265625, 2.66912841796875, 2.779754638671875, 2.890380859375, 3.001007080078125, 3.11163330078125, 3.222259521484375, 3.3328857421875, 3.443511962890625, 3.55413818359375, 3.664764404296875, 3.775390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 1.0, 4.0, 3.0, 3.0, 6.0, 5.0, 9.0, 14.0, 16.0, 19.0, 29.0, 38.0, 48.0, 73.0, 105.0, 160.0, 342.0, 791.0, 2420.0, 9215.0, 48144.0, 456075.0, 3306700.0, 320908.0, 37971.0, 7643.0, 1955.0, 755.0, 340.0, 149.0, 84.0, 70.0, 56.0, 25.0, 34.0, 21.0, 22.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.226318359375, -7.93701171875, -7.647705078125, -7.3583984375, -7.069091796875, -6.77978515625, -6.490478515625, -6.201171875, -5.911865234375, -5.62255859375, -5.333251953125, -5.0439453125, -4.754638671875, -4.46533203125, -4.176025390625, -3.88671875, -3.597412109375, -3.30810546875, -3.018798828125, -2.7294921875, -2.440185546875, -2.15087890625, -1.861572265625, -1.572265625, -1.282958984375, -0.99365234375, -0.704345703125, -0.4150390625, -0.125732421875, 0.16357421875, 0.452880859375, 0.7421875, 1.031494140625, 1.32080078125, 1.610107421875, 1.8994140625, 2.188720703125, 2.47802734375, 2.767333984375, 3.056640625, 3.345947265625, 3.63525390625, 3.924560546875, 4.2138671875, 4.503173828125, 4.79248046875, 5.081787109375, 5.37109375, 5.660400390625, 5.94970703125, 6.239013671875, 6.5283203125, 6.817626953125, 7.10693359375, 7.396240234375, 7.685546875, 7.974853515625, 8.26416015625, 8.553466796875, 8.8427734375, 9.132080078125, 9.42138671875, 9.710693359375, 10.0]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 9.0, 9.0, 21.0, 25.0, 29.0, 28.0, 50.0, 61.0, 69.0, 73.0, 81.0, 80.0, 91.0, 65.0, 68.0, 53.0, 42.0, 30.0, 27.0, 20.0, 21.0, 10.0, 9.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.132604598999023, -18.691152572631836, -18.24970054626465, -17.80824851989746, -17.366796493530273, -16.925344467163086, -16.4838924407959, -16.042442321777344, -15.60098934173584, -15.159537315368652, -14.718085289001465, -14.276633262634277, -13.835182189941406, -13.393730163574219, -12.952278137207031, -12.510826110839844, -12.069374084472656, -11.627922058105469, -11.186470031738281, -10.745018005371094, -10.303565979003906, -9.862113952636719, -9.420662879943848, -8.97921085357666, -8.537758827209473, -8.096306800842285, -7.654854774475098, -7.213403224945068, -6.771951198577881, -6.330499172210693, -5.889047622680664, -5.447595596313477, -5.006142616271973, -4.564690589904785, -4.123238563537598, -3.6817870140075684, -3.240334987640381, -2.7988829612731934, -2.357431173324585, -1.9159793853759766, -1.474527359008789, -1.0330754518508911, -0.5916235446929932, -0.15017163753509521, 0.29128026962280273, 0.7327322959899902, 1.1741840839385986, 1.615635871887207, 2.0570878982543945, 2.498539924621582, 2.9399917125701904, 3.381443500518799, 3.8228955268859863, 4.264347553253174, 4.705799102783203, 5.147251129150391, 5.588703155517578, 6.030155181884766, 6.471607208251953, 6.913058757781982, 7.35451078414917, 7.795962810516357, 8.237414360046387, 8.678866386413574, 9.120318412780762]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 9.0, 3.0, 12.0, 10.0, 14.0, 11.0, 17.0, 24.0, 16.0, 20.0, 24.0, 31.0, 26.0, 39.0, 36.0, 30.0, 39.0, 27.0, 40.0, 31.0, 38.0, 39.0, 48.0, 34.0, 40.0, 38.0, 34.0, 37.0, 34.0, 29.0, 22.0, 22.0, 17.0, 21.0, 15.0, 18.0, 15.0, 8.0, 6.0, 3.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-12.023050308227539, -11.662965774536133, -11.302882194519043, -10.942797660827637, -10.58271312713623, -10.22262954711914, -9.862545013427734, -9.502460479736328, -9.142375946044922, -8.782291412353516, -8.422207832336426, -8.06212329864502, -7.702038764953613, -7.341954708099365, -6.981870651245117, -6.621786117553711, -6.261702537536621, -5.901618480682373, -5.541533946990967, -5.181449890136719, -4.8213653564453125, -4.4612812995910645, -4.101197242736816, -3.7411129474639893, -3.381028652191162, -3.020944356918335, -2.660860061645508, -2.3007760047912598, -1.9406917095184326, -1.5806074142456055, -1.2205233573913574, -0.8604390621185303, -0.5003557205200195, -0.14027148485183716, 0.21981275081634521, 0.5798969268798828, 0.93998122215271, 1.300065517425537, 1.6601495742797852, 2.0202338695526123, 2.3803181648254395, 2.7404024600982666, 3.1004867553710938, 3.460570812225342, 3.820655107498169, 4.180739402770996, 4.540823459625244, 4.900907516479492, 5.260992050170898, 5.6210761070251465, 5.981160640716553, 6.341244697570801, 6.701329231262207, 7.061413288116455, 7.421497344970703, 7.781581878662109, 8.141666412353516, 8.501750946044922, 8.861834526062012, 9.221919059753418, 9.582003593444824, 9.942087173461914, 10.30217170715332, 10.662256240844727, 11.022339820861816]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 10.0, 9.0, 11.0, 7.0, 16.0, 22.0, 23.0, 24.0, 21.0, 26.0, 20.0, 30.0, 23.0, 27.0, 42.0, 37.0, 37.0, 43.0, 40.0, 31.0, 55.0, 36.0, 37.0, 41.0, 34.0, 34.0, 39.0, 27.0, 29.0, 30.0, 28.0, 22.0, 14.0, 6.0, 12.0, 6.0, 7.0, 11.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5715789794921875, -1.519134521484375, -1.4666900634765625, -1.41424560546875, -1.3618011474609375, -1.309356689453125, -1.2569122314453125, -1.2044677734375, -1.1520233154296875, -1.099578857421875, -1.0471343994140625, -0.99468994140625, -0.9422454833984375, -0.889801025390625, -0.8373565673828125, -0.784912109375, -0.7324676513671875, -0.680023193359375, -0.6275787353515625, -0.57513427734375, -0.5226898193359375, -0.470245361328125, -0.4178009033203125, -0.3653564453125, -0.3129119873046875, -0.260467529296875, -0.2080230712890625, -0.15557861328125, -0.1031341552734375, -0.050689697265625, 0.0017547607421875, 0.05419921875, 0.1066436767578125, 0.159088134765625, 0.2115325927734375, 0.26397705078125, 0.3164215087890625, 0.368865966796875, 0.4213104248046875, 0.4737548828125, 0.5261993408203125, 0.578643798828125, 0.6310882568359375, 0.68353271484375, 0.7359771728515625, 0.788421630859375, 0.8408660888671875, 0.893310546875, 0.9457550048828125, 0.998199462890625, 1.0506439208984375, 1.10308837890625, 1.1555328369140625, 1.207977294921875, 1.2604217529296875, 1.3128662109375, 1.3653106689453125, 1.417755126953125, 1.4701995849609375, 1.52264404296875, 1.5750885009765625, 1.627532958984375, 1.6799774169921875, 1.732421875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 3.0, 3.0, 10.0, 11.0, 16.0, 30.0, 25.0, 45.0, 55.0, 98.0, 138.0, 194.0, 317.0, 412.0, 677.0, 1078.0, 1706.0, 2680.0, 4596.0, 7754.0, 14516.0, 30406.0, 71817.0, 194401.0, 366899.0, 206871.0, 76348.0, 31609.0, 15292.0, 8172.0, 4624.0, 2716.0, 1737.0, 1156.0, 714.0, 443.0, 308.0, 192.0, 171.0, 107.0, 61.0, 45.0, 41.0, 16.0, 13.0, 11.0, 6.0, 10.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55859375, -0.5408782958984375, -0.523162841796875, -0.5054473876953125, -0.48773193359375, -0.4700164794921875, -0.452301025390625, -0.4345855712890625, -0.4168701171875, -0.3991546630859375, -0.381439208984375, -0.3637237548828125, -0.34600830078125, -0.3282928466796875, -0.310577392578125, -0.2928619384765625, -0.275146484375, -0.2574310302734375, -0.239715576171875, -0.2220001220703125, -0.20428466796875, -0.1865692138671875, -0.168853759765625, -0.1511383056640625, -0.1334228515625, -0.1157073974609375, -0.097991943359375, -0.0802764892578125, -0.06256103515625, -0.0448455810546875, -0.027130126953125, -0.0094146728515625, 0.00830078125, 0.0260162353515625, 0.043731689453125, 0.0614471435546875, 0.07916259765625, 0.0968780517578125, 0.114593505859375, 0.1323089599609375, 0.1500244140625, 0.1677398681640625, 0.185455322265625, 0.2031707763671875, 0.22088623046875, 0.2386016845703125, 0.256317138671875, 0.2740325927734375, 0.291748046875, 0.3094635009765625, 0.327178955078125, 0.3448944091796875, 0.36260986328125, 0.3803253173828125, 0.398040771484375, 0.4157562255859375, 0.4334716796875, 0.4511871337890625, 0.468902587890625, 0.4866180419921875, 0.50433349609375, 0.5220489501953125, 0.539764404296875, 0.5574798583984375, 0.5751953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 12.0, 10.0, 14.0, 14.0, 12.0, 23.0, 21.0, 23.0, 25.0, 21.0, 28.0, 30.0, 42.0, 27.0, 36.0, 38.0, 41.0, 1071.0, 55.0, 49.0, 46.0, 41.0, 36.0, 34.0, 27.0, 36.0, 29.0, 25.0, 16.0, 17.0, 15.0, 21.0, 11.0, 9.0, 11.0, 9.0, 6.0, 2.0, 5.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.326171875, -1.28765869140625, -1.2491455078125, -1.21063232421875, -1.172119140625, -1.13360595703125, -1.0950927734375, -1.05657958984375, -1.01806640625, -0.97955322265625, -0.9410400390625, -0.90252685546875, -0.864013671875, -0.82550048828125, -0.7869873046875, -0.74847412109375, -0.7099609375, -0.67144775390625, -0.6329345703125, -0.59442138671875, -0.555908203125, -0.51739501953125, -0.4788818359375, -0.44036865234375, -0.40185546875, -0.36334228515625, -0.3248291015625, -0.28631591796875, -0.247802734375, -0.20928955078125, -0.1707763671875, -0.13226318359375, -0.09375, -0.05523681640625, -0.0167236328125, 0.02178955078125, 0.060302734375, 0.09881591796875, 0.1373291015625, 0.17584228515625, 0.21435546875, 0.25286865234375, 0.2913818359375, 0.32989501953125, 0.368408203125, 0.40692138671875, 0.4454345703125, 0.48394775390625, 0.5224609375, 0.56097412109375, 0.5994873046875, 0.63800048828125, 0.676513671875, 0.71502685546875, 0.7535400390625, 0.79205322265625, 0.83056640625, 0.86907958984375, 0.9075927734375, 0.94610595703125, 0.984619140625, 1.02313232421875, 1.0616455078125, 1.10015869140625, 1.138671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 13.0, 10.0, 24.0, 29.0, 45.0, 43.0, 98.0, 147.0, 297.0, 502.0, 972.0, 1865.0, 4199.0, 11393.0, 48435.0, 1933643.0, 72312.0, 13620.0, 4883.0, 2132.0, 1111.0, 558.0, 307.0, 180.0, 107.0, 72.0, 37.0, 26.0, 19.0, 13.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.6435546875, -1.6020355224609375, -1.560516357421875, -1.5189971923828125, -1.47747802734375, -1.4359588623046875, -1.394439697265625, -1.3529205322265625, -1.3114013671875, -1.2698822021484375, -1.228363037109375, -1.1868438720703125, -1.14532470703125, -1.1038055419921875, -1.062286376953125, -1.0207672119140625, -0.979248046875, -0.9377288818359375, -0.896209716796875, -0.8546905517578125, -0.81317138671875, -0.7716522216796875, -0.730133056640625, -0.6886138916015625, -0.6470947265625, -0.6055755615234375, -0.564056396484375, -0.5225372314453125, -0.48101806640625, -0.4394989013671875, -0.397979736328125, -0.3564605712890625, -0.31494140625, -0.2734222412109375, -0.231903076171875, -0.1903839111328125, -0.14886474609375, -0.1073455810546875, -0.065826416015625, -0.0243072509765625, 0.0172119140625, 0.0587310791015625, 0.100250244140625, 0.1417694091796875, 0.18328857421875, 0.2248077392578125, 0.266326904296875, 0.3078460693359375, 0.349365234375, 0.3908843994140625, 0.432403564453125, 0.4739227294921875, 0.51544189453125, 0.5569610595703125, 0.598480224609375, 0.6399993896484375, 0.6815185546875, 0.7230377197265625, 0.764556884765625, 0.8060760498046875, 0.84759521484375, 0.8891143798828125, 0.930633544921875, 0.9721527099609375, 1.013671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 12.0, 9.0, 10.0, 27.0, 32.0, 36.0, 35.0, 56.0, 66.0, 99.0, 114.0, 78.0, 80.0, 86.0, 58.0, 43.0, 29.0, 30.0, 23.0, 19.0, 8.0, 13.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0310516357421875, -0.02994084358215332, -0.02883005142211914, -0.02771925926208496, -0.02660846710205078, -0.0254976749420166, -0.024386882781982422, -0.023276090621948242, -0.022165298461914062, -0.021054506301879883, -0.019943714141845703, -0.018832921981811523, -0.017722129821777344, -0.016611337661743164, -0.015500545501708984, -0.014389753341674805, -0.013278961181640625, -0.012168169021606445, -0.011057376861572266, -0.009946584701538086, -0.008835792541503906, -0.0077250003814697266, -0.006614208221435547, -0.005503416061401367, -0.0043926239013671875, -0.003281831741333008, -0.002171039581298828, -0.0010602474212646484, 5.054473876953125e-05, 0.001161336898803711, 0.0022721290588378906, 0.0033829212188720703, 0.00449371337890625, 0.00560450553894043, 0.006715297698974609, 0.007826089859008789, 0.008936882019042969, 0.010047674179077148, 0.011158466339111328, 0.012269258499145508, 0.013380050659179688, 0.014490842819213867, 0.015601634979248047, 0.016712427139282227, 0.017823219299316406, 0.018934011459350586, 0.020044803619384766, 0.021155595779418945, 0.022266387939453125, 0.023377180099487305, 0.024487972259521484, 0.025598764419555664, 0.026709556579589844, 0.027820348739624023, 0.028931140899658203, 0.030041933059692383, 0.031152725219726562, 0.03226351737976074, 0.03337430953979492, 0.0344851016998291, 0.03559589385986328, 0.03670668601989746, 0.03781747817993164, 0.03892827033996582, 0.0400390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 14.0, 20.0, 32.0, 50.0, 94.0, 215.0, 891.0, 60959.0, 980840.0, 4712.0, 401.0, 132.0, 71.0, 41.0, 19.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9075927734375, -0.881103515625, -0.8546142578125, -0.828125, -0.8016357421875, -0.775146484375, -0.7486572265625, -0.72216796875, -0.6956787109375, -0.669189453125, -0.6427001953125, -0.6162109375, -0.5897216796875, -0.563232421875, -0.5367431640625, -0.51025390625, -0.4837646484375, -0.457275390625, -0.4307861328125, -0.404296875, -0.3778076171875, -0.351318359375, -0.3248291015625, -0.29833984375, -0.2718505859375, -0.245361328125, -0.2188720703125, -0.1923828125, -0.1658935546875, -0.139404296875, -0.1129150390625, -0.08642578125, -0.0599365234375, -0.033447265625, -0.0069580078125, 0.01953125, 0.0460205078125, 0.072509765625, 0.0989990234375, 0.12548828125, 0.1519775390625, 0.178466796875, 0.2049560546875, 0.2314453125, 0.2579345703125, 0.284423828125, 0.3109130859375, 0.33740234375, 0.3638916015625, 0.390380859375, 0.4168701171875, 0.443359375, 0.4698486328125, 0.496337890625, 0.5228271484375, 0.54931640625, 0.5758056640625, 0.602294921875, 0.6287841796875, 0.6552734375, 0.6817626953125, 0.708251953125, 0.7347412109375, 0.76123046875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 9.0, 35.0, 162.0, 345.0, 287.0, 107.0, 42.0, 22.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07558318227529526, -0.0670434907078743, -0.058503806591033936, -0.049964115023612976, -0.041424427181482315, -0.032884739339351654, -0.024345047771930695, -0.015805359929800034, -0.0072656720876693726, 0.001274016685783863, 0.009813705459237099, 0.01835339516401291, 0.02689308300614357, 0.03543277084827423, 0.04397246241569519, 0.05251215025782585, 0.06105183809995651, 0.06959152966737747, 0.07813121378421783, 0.0866709053516388, 0.09521059691905975, 0.10375028103590012, 0.11228997260332108, 0.12082965672016144, 0.1293693482875824, 0.13790903985500336, 0.14644873142242432, 0.15498840808868408, 0.16352809965610504, 0.172067791223526, 0.18060748279094696, 0.18914717435836792, 0.19768688082695007, 0.20622657239437103, 0.214766263961792, 0.22330594062805176, 0.23184563219547272, 0.24038532376289368, 0.24892501533031464, 0.2574647068977356, 0.26600438356399536, 0.2745440602302551, 0.2830837666988373, 0.29162344336509705, 0.3001631498336792, 0.30870282649993896, 0.31724250316619873, 0.3257822096347809, 0.33432191610336304, 0.3428615927696228, 0.35140129923820496, 0.3599409759044647, 0.3684806823730469, 0.37702035903930664, 0.3855600357055664, 0.39409974217414856, 0.4026394188404083, 0.4111790955066681, 0.41971880197525024, 0.42825847864151, 0.43679818511009216, 0.44533786177635193, 0.4538775682449341, 0.46241724491119385, 0.4709569215774536]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 2.0, 8.0, 11.0, 8.0, 5.0, 15.0, 19.0, 13.0, 29.0, 25.0, 26.0, 24.0, 32.0, 34.0, 53.0, 45.0, 34.0, 53.0, 42.0, 59.0, 40.0, 36.0, 45.0, 33.0, 42.0, 33.0, 28.0, 31.0, 35.0, 24.0, 17.0, 22.0, 13.0, 13.0, 9.0, 8.0, 8.0, 7.0, 1.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.03874337673187256, -0.0376732312142849, -0.036603085696697235, -0.03553294390439987, -0.03446279838681221, -0.03339265286922455, -0.032322511076927185, -0.03125236555933952, -0.03018222004175186, -0.0291120745241642, -0.028041930869221687, -0.026971787214279175, -0.025901641696691513, -0.02483149617910385, -0.02376135252416134, -0.022691208869218826, -0.021621063351631165, -0.020550917834043503, -0.01948077417910099, -0.018410630524158478, -0.017340485006570816, -0.016270339488983154, -0.015200195834040642, -0.014130051247775555, -0.013059906661510468, -0.01198976207524538, -0.010919617488980293, -0.009849472902715206, -0.008779328316450119, -0.007709183730185032, -0.006639039143919945, -0.005568894557654858, -0.0044987499713897705, -0.0034286053851246834, -0.0023584607988595963, -0.0012883162125945091, -0.000218171626329422, 0.0008519729599356651, 0.0019221175462007523, 0.0029922621324658394, 0.0040624067187309265, 0.005132551304996014, 0.006202695891261101, 0.007272840477526188, 0.008342985063791275, 0.009413129650056362, 0.01048327423632145, 0.011553418822586536, 0.012623563408851624, 0.01369370799511671, 0.014763852581381798, 0.01583399623632431, 0.016904141753911972, 0.017974287271499634, 0.019044430926442146, 0.02011457458138466, 0.02118472009897232, 0.022254865616559982, 0.023325009271502495, 0.024395152926445007, 0.02546529844403267, 0.02653544396162033, 0.027605587616562843, 0.028675731271505356, 0.029745876789093018]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 10.0, 8.0, 12.0, 7.0, 16.0, 22.0, 23.0, 24.0, 20.0, 27.0, 19.0, 31.0, 23.0, 26.0, 42.0, 37.0, 38.0, 41.0, 40.0, 31.0, 56.0, 37.0, 36.0, 42.0, 34.0, 35.0, 38.0, 27.0, 30.0, 29.0, 28.0, 22.0, 14.0, 7.0, 11.0, 6.0, 7.0, 11.0, 5.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.625, -1.5725250244140625, -1.520050048828125, -1.4675750732421875, -1.41510009765625, -1.3626251220703125, -1.310150146484375, -1.2576751708984375, -1.2052001953125, -1.1527252197265625, -1.100250244140625, -1.0477752685546875, -0.99530029296875, -0.9428253173828125, -0.890350341796875, -0.8378753662109375, -0.785400390625, -0.7329254150390625, -0.680450439453125, -0.6279754638671875, -0.57550048828125, -0.5230255126953125, -0.470550537109375, -0.4180755615234375, -0.3656005859375, -0.3131256103515625, -0.260650634765625, -0.2081756591796875, -0.15570068359375, -0.1032257080078125, -0.050750732421875, 0.0017242431640625, 0.05419921875, 0.1066741943359375, 0.159149169921875, 0.2116241455078125, 0.26409912109375, 0.3165740966796875, 0.369049072265625, 0.4215240478515625, 0.4739990234375, 0.5264739990234375, 0.578948974609375, 0.6314239501953125, 0.68389892578125, 0.7363739013671875, 0.788848876953125, 0.8413238525390625, 0.893798828125, 0.9462738037109375, 0.998748779296875, 1.0512237548828125, 1.10369873046875, 1.1561737060546875, 1.208648681640625, 1.2611236572265625, 1.3135986328125, 1.3660736083984375, 1.418548583984375, 1.4710235595703125, 1.52349853515625, 1.5759735107421875, 1.628448486328125, 1.6809234619140625, 1.7333984375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 12.0, 14.0, 31.0, 27.0, 46.0, 68.0, 103.0, 118.0, 220.0, 288.0, 469.0, 732.0, 1070.0, 1598.0, 2555.0, 4050.0, 6787.0, 11726.0, 20497.0, 38334.0, 79585.0, 193553.0, 380963.0, 158246.0, 68589.0, 33702.0, 18264.0, 10291.0, 5997.0, 3731.0, 2373.0, 1506.0, 969.0, 690.0, 429.0, 292.0, 194.0, 129.0, 91.0, 68.0, 46.0, 37.0, 11.0, 14.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.189453125, -2.1258087158203125, -2.062164306640625, -1.9985198974609375, -1.93487548828125, -1.8712310791015625, -1.807586669921875, -1.7439422607421875, -1.6802978515625, -1.6166534423828125, -1.553009033203125, -1.4893646240234375, -1.42572021484375, -1.3620758056640625, -1.298431396484375, -1.2347869873046875, -1.171142578125, -1.1074981689453125, -1.043853759765625, -0.9802093505859375, -0.91656494140625, -0.8529205322265625, -0.789276123046875, -0.7256317138671875, -0.6619873046875, -0.5983428955078125, -0.534698486328125, -0.4710540771484375, -0.40740966796875, -0.3437652587890625, -0.280120849609375, -0.2164764404296875, -0.15283203125, -0.0891876220703125, -0.025543212890625, 0.0381011962890625, 0.10174560546875, 0.1653900146484375, 0.229034423828125, 0.2926788330078125, 0.3563232421875, 0.4199676513671875, 0.483612060546875, 0.5472564697265625, 0.61090087890625, 0.6745452880859375, 0.738189697265625, 0.8018341064453125, 0.865478515625, 0.9291229248046875, 0.992767333984375, 1.0564117431640625, 1.12005615234375, 1.1837005615234375, 1.247344970703125, 1.3109893798828125, 1.3746337890625, 1.4382781982421875, 1.501922607421875, 1.5655670166015625, 1.62921142578125, 1.6928558349609375, 1.756500244140625, 1.8201446533203125, 1.8837890625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 7.0, 2.0, 5.0, 9.0, 6.0, 7.0, 12.0, 13.0, 11.0, 9.0, 15.0, 23.0, 28.0, 30.0, 26.0, 29.0, 38.0, 41.0, 34.0, 84.0, 106.0, 147.0, 280.0, 1393.0, 145.0, 104.0, 78.0, 68.0, 60.0, 41.0, 32.0, 34.0, 25.0, 21.0, 19.0, 17.0, 7.0, 9.0, 10.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.2886962890625, -4.124267578125, -3.9598388671875, -3.79541015625, -3.6309814453125, -3.466552734375, -3.3021240234375, -3.1376953125, -2.9732666015625, -2.808837890625, -2.6444091796875, -2.47998046875, -2.3155517578125, -2.151123046875, -1.9866943359375, -1.822265625, -1.6578369140625, -1.493408203125, -1.3289794921875, -1.16455078125, -1.0001220703125, -0.835693359375, -0.6712646484375, -0.5068359375, -0.3424072265625, -0.177978515625, -0.0135498046875, 0.15087890625, 0.3153076171875, 0.479736328125, 0.6441650390625, 0.80859375, 0.9730224609375, 1.137451171875, 1.3018798828125, 1.46630859375, 1.6307373046875, 1.795166015625, 1.9595947265625, 2.1240234375, 2.2884521484375, 2.452880859375, 2.6173095703125, 2.78173828125, 2.9461669921875, 3.110595703125, 3.2750244140625, 3.439453125, 3.6038818359375, 3.768310546875, 3.9327392578125, 4.09716796875, 4.2615966796875, 4.426025390625, 4.5904541015625, 4.7548828125, 4.9193115234375, 5.083740234375, 5.2481689453125, 5.41259765625, 5.5770263671875, 5.741455078125, 5.9058837890625, 6.0703125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 11.0, 14.0, 28.0, 45.0, 74.0, 148.0, 297.0, 619.0, 2403.0, 60506.0, 3043710.0, 34698.0, 1928.0, 580.0, 298.0, 139.0, 81.0, 39.0, 23.0, 29.0, 13.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.0625, -19.462646484375, -18.86279296875, -18.262939453125, -17.6630859375, -17.063232421875, -16.46337890625, -15.863525390625, -15.263671875, -14.663818359375, -14.06396484375, -13.464111328125, -12.8642578125, -12.264404296875, -11.66455078125, -11.064697265625, -10.46484375, -9.864990234375, -9.26513671875, -8.665283203125, -8.0654296875, -7.465576171875, -6.86572265625, -6.265869140625, -5.666015625, -5.066162109375, -4.46630859375, -3.866455078125, -3.2666015625, -2.666748046875, -2.06689453125, -1.467041015625, -0.8671875, -0.267333984375, 0.33251953125, 0.932373046875, 1.5322265625, 2.132080078125, 2.73193359375, 3.331787109375, 3.931640625, 4.531494140625, 5.13134765625, 5.731201171875, 6.3310546875, 6.930908203125, 7.53076171875, 8.130615234375, 8.73046875, 9.330322265625, 9.93017578125, 10.530029296875, 11.1298828125, 11.729736328125, 12.32958984375, 12.929443359375, 13.529296875, 14.129150390625, 14.72900390625, 15.328857421875, 15.9287109375, 16.528564453125, 17.12841796875, 17.728271484375, 18.328125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 145.0, 818.0, 51.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.058042526245117, -23.397809982299805, -19.737577438354492, -16.077342987060547, -12.41711139678955, -8.756877899169922, -5.096645355224609, -1.4364128112792969, 2.2238197326660156, 5.884052276611328, 9.54428482055664, 13.20451831817627, 16.864749908447266, 20.52498435974121, 24.185216903686523, 27.845449447631836, 31.50568199157715, 35.165916442871094, 38.826148986816406, 42.48638153076172, 46.14661407470703, 49.806846618652344, 53.467079162597656, 57.12731170654297, 60.78754425048828, 64.4477767944336, 68.1080093383789, 71.76824188232422, 75.42847442626953, 79.08870697021484, 82.74893951416016, 86.40917205810547, 90.06940460205078, 93.7296371459961, 97.3898696899414, 101.05010223388672, 104.71033477783203, 108.37056732177734, 112.03079986572266, 115.69103240966797, 119.35126495361328, 123.0114974975586, 126.6717300415039, 130.33197021484375, 133.99220275878906, 137.65243530273438, 141.3126678466797, 144.972900390625, 148.6331329345703, 152.29336547851562, 155.95359802246094, 159.61383056640625, 163.27406311035156, 166.93429565429688, 170.5945281982422, 174.2547607421875, 177.9149932861328, 181.57522583007812, 185.23545837402344, 188.89569091796875, 192.55592346191406, 196.21615600585938, 199.8763885498047, 203.53662109375, 207.1968536376953]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 2.0, 8.0, 6.0, 8.0, 13.0, 13.0, 10.0, 10.0, 22.0, 24.0, 28.0, 26.0, 38.0, 29.0, 31.0, 35.0, 47.0, 32.0, 49.0, 38.0, 45.0, 38.0, 47.0, 44.0, 39.0, 31.0, 40.0, 26.0, 43.0, 30.0, 28.0, 19.0, 18.0, 20.0, 12.0, 12.0, 11.0, 5.0, 5.0, 3.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.62879753112793, -15.188730239868164, -14.748661994934082, -14.30859375, -13.868526458740234, -13.428459167480469, -12.988390922546387, -12.548322677612305, -12.108255386352539, -11.668188095092773, -11.228119850158691, -10.78805160522461, -10.347984313964844, -9.907917022705078, -9.467848777770996, -9.027780532836914, -8.587713241577148, -8.147645950317383, -7.707577705383301, -7.267509937286377, -6.827442169189453, -6.387374401092529, -5.9473066329956055, -5.507238864898682, -5.067171096801758, -4.627103328704834, -4.18703556060791, -3.7469677925109863, -3.3069000244140625, -2.8668322563171387, -2.426764488220215, -1.986696720123291, -1.5466299057006836, -1.1065621376037598, -0.6664943695068359, -0.2264266014099121, 0.21364116668701172, 0.6537089347839355, 1.0937767028808594, 1.5338444709777832, 1.973912239074707, 2.413980007171631, 2.8540477752685547, 3.2941155433654785, 3.7341833114624023, 4.174251079559326, 4.61431884765625, 5.054386615753174, 5.494454383850098, 5.9345221519470215, 6.374589920043945, 6.814657688140869, 7.254725456237793, 7.694793224334717, 8.13486099243164, 8.574928283691406, 9.014996528625488, 9.45506477355957, 9.895132064819336, 10.335199356079102, 10.775267601013184, 11.215335845947266, 11.655403137207031, 12.095470428466797, 12.535538673400879]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 12.0, 9.0, 8.0, 11.0, 8.0, 21.0, 20.0, 13.0, 26.0, 23.0, 21.0, 26.0, 25.0, 27.0, 39.0, 37.0, 35.0, 38.0, 43.0, 37.0, 37.0, 48.0, 32.0, 43.0, 34.0, 21.0, 35.0, 25.0, 32.0, 26.0, 25.0, 26.0, 22.0, 20.0, 20.0, 16.0, 11.0, 8.0, 9.0, 2.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5634765625, -1.51116943359375, -1.4588623046875, -1.40655517578125, -1.354248046875, -1.30194091796875, -1.2496337890625, -1.19732666015625, -1.14501953125, -1.09271240234375, -1.0404052734375, -0.98809814453125, -0.935791015625, -0.88348388671875, -0.8311767578125, -0.77886962890625, -0.7265625, -0.67425537109375, -0.6219482421875, -0.56964111328125, -0.517333984375, -0.46502685546875, -0.4127197265625, -0.36041259765625, -0.30810546875, -0.25579833984375, -0.2034912109375, -0.15118408203125, -0.098876953125, -0.04656982421875, 0.0057373046875, 0.05804443359375, 0.1103515625, 0.16265869140625, 0.2149658203125, 0.26727294921875, 0.319580078125, 0.37188720703125, 0.4241943359375, 0.47650146484375, 0.52880859375, 0.58111572265625, 0.6334228515625, 0.68572998046875, 0.738037109375, 0.79034423828125, 0.8426513671875, 0.89495849609375, 0.947265625, 0.99957275390625, 1.0518798828125, 1.10418701171875, 1.156494140625, 1.20880126953125, 1.2611083984375, 1.31341552734375, 1.36572265625, 1.41802978515625, 1.4703369140625, 1.52264404296875, 1.574951171875, 1.62725830078125, 1.6795654296875, 1.73187255859375, 1.7841796875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 17.0, 22.0, 27.0, 34.0, 56.0, 83.0, 133.0, 194.0, 293.0, 523.0, 893.0, 1573.0, 2949.0, 5754.0, 11828.0, 27413.0, 73984.0, 288832.0, 1672407.0, 1680531.0, 299140.0, 74819.0, 28019.0, 12093.0, 5847.0, 2894.0, 1547.0, 955.0, 536.0, 327.0, 168.0, 127.0, 94.0, 48.0, 30.0, 30.0, 21.0, 11.0, 9.0, 10.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.41015625, -3.3001708984375, -3.190185546875, -3.0802001953125, -2.97021484375, -2.8602294921875, -2.750244140625, -2.6402587890625, -2.5302734375, -2.4202880859375, -2.310302734375, -2.2003173828125, -2.09033203125, -1.9803466796875, -1.870361328125, -1.7603759765625, -1.650390625, -1.5404052734375, -1.430419921875, -1.3204345703125, -1.21044921875, -1.1004638671875, -0.990478515625, -0.8804931640625, -0.7705078125, -0.6605224609375, -0.550537109375, -0.4405517578125, -0.33056640625, -0.2205810546875, -0.110595703125, -0.0006103515625, 0.109375, 0.2193603515625, 0.329345703125, 0.4393310546875, 0.54931640625, 0.6593017578125, 0.769287109375, 0.8792724609375, 0.9892578125, 1.0992431640625, 1.209228515625, 1.3192138671875, 1.42919921875, 1.5391845703125, 1.649169921875, 1.7591552734375, 1.869140625, 1.9791259765625, 2.089111328125, 2.1990966796875, 2.30908203125, 2.4190673828125, 2.529052734375, 2.6390380859375, 2.7490234375, 2.8590087890625, 2.968994140625, 3.0789794921875, 3.18896484375, 3.2989501953125, 3.408935546875, 3.5189208984375, 3.62890625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 10.0, 7.0, 11.0, 11.0, 20.0, 19.0, 25.0, 40.0, 37.0, 57.0, 85.0, 141.0, 142.0, 213.0, 349.0, 503.0, 568.0, 506.0, 373.0, 244.0, 192.0, 127.0, 80.0, 66.0, 49.0, 47.0, 38.0, 25.0, 21.0, 18.0, 13.0, 7.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.392578125, -3.28179931640625, -3.1710205078125, -3.06024169921875, -2.949462890625, -2.83868408203125, -2.7279052734375, -2.61712646484375, -2.50634765625, -2.39556884765625, -2.2847900390625, -2.17401123046875, -2.063232421875, -1.95245361328125, -1.8416748046875, -1.73089599609375, -1.6201171875, -1.50933837890625, -1.3985595703125, -1.28778076171875, -1.177001953125, -1.06622314453125, -0.9554443359375, -0.84466552734375, -0.73388671875, -0.62310791015625, -0.5123291015625, -0.40155029296875, -0.290771484375, -0.17999267578125, -0.0692138671875, 0.04156494140625, 0.15234375, 0.26312255859375, 0.3739013671875, 0.48468017578125, 0.595458984375, 0.70623779296875, 0.8170166015625, 0.92779541015625, 1.03857421875, 1.14935302734375, 1.2601318359375, 1.37091064453125, 1.481689453125, 1.59246826171875, 1.7032470703125, 1.81402587890625, 1.9248046875, 2.03558349609375, 2.1463623046875, 2.25714111328125, 2.367919921875, 2.47869873046875, 2.5894775390625, 2.70025634765625, 2.81103515625, 2.92181396484375, 3.0325927734375, 3.14337158203125, 3.254150390625, 3.36492919921875, 3.4757080078125, 3.58648681640625, 3.697265625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 1.0, 6.0, 10.0, 7.0, 12.0, 15.0, 26.0, 39.0, 31.0, 51.0, 65.0, 73.0, 159.0, 291.0, 1064.0, 7854.0, 126195.0, 3732210.0, 309114.0, 14562.0, 1563.0, 406.0, 170.0, 101.0, 68.0, 52.0, 34.0, 31.0, 17.0, 13.0, 16.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.25, -15.7938232421875, -15.337646484375, -14.8814697265625, -14.42529296875, -13.9691162109375, -13.512939453125, -13.0567626953125, -12.6005859375, -12.1444091796875, -11.688232421875, -11.2320556640625, -10.77587890625, -10.3197021484375, -9.863525390625, -9.4073486328125, -8.951171875, -8.4949951171875, -8.038818359375, -7.5826416015625, -7.12646484375, -6.6702880859375, -6.214111328125, -5.7579345703125, -5.3017578125, -4.8455810546875, -4.389404296875, -3.9332275390625, -3.47705078125, -3.0208740234375, -2.564697265625, -2.1085205078125, -1.65234375, -1.1961669921875, -0.739990234375, -0.2838134765625, 0.17236328125, 0.6285400390625, 1.084716796875, 1.5408935546875, 1.9970703125, 2.4532470703125, 2.909423828125, 3.3656005859375, 3.82177734375, 4.2779541015625, 4.734130859375, 5.1903076171875, 5.646484375, 6.1026611328125, 6.558837890625, 7.0150146484375, 7.47119140625, 7.9273681640625, 8.383544921875, 8.8397216796875, 9.2958984375, 9.7520751953125, 10.208251953125, 10.6644287109375, 11.12060546875, 11.5767822265625, 12.032958984375, 12.4891357421875, 12.9453125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 30.0, 38.0, 94.0, 127.0, 205.0, 173.0, 154.0, 98.0, 39.0, 31.0, 11.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.95746612548828, -24.87469482421875, -23.79192352294922, -22.709152221679688, -21.626380920410156, -20.543609619140625, -19.460840225219727, -18.378068923950195, -17.295297622680664, -16.212526321411133, -15.129755020141602, -14.046984672546387, -12.964213371276855, -11.881442070007324, -10.79867172241211, -9.715900421142578, -8.633129119873047, -7.550357818603516, -6.467586994171143, -5.3848161697387695, -4.302044868469238, -3.219273567199707, -2.136502742767334, -1.053731918334961, 0.029039382934570312, 1.1118104457855225, 2.1945815086364746, 3.2773525714874268, 4.360123634338379, 5.44289493560791, 6.525665760040283, 7.608436584472656, 8.691204071044922, 9.773975372314453, 10.856746673583984, 11.9395170211792, 13.02228832244873, 14.105059623718262, 15.187829971313477, 16.270601272583008, 17.35337257385254, 18.43614387512207, 19.5189151763916, 20.601686477661133, 21.68445587158203, 22.767227172851562, 23.849998474121094, 24.932769775390625, 26.015541076660156, 27.098312377929688, 28.18108367919922, 29.26385498046875, 30.34662628173828, 31.429397583007812, 32.512168884277344, 33.594940185546875, 34.677711486816406, 35.76048278808594, 36.84325408935547, 37.926025390625, 39.00879669189453, 40.09156799316406, 41.174339294433594, 42.257110595703125, 43.33987808227539]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 8.0, 15.0, 9.0, 11.0, 17.0, 20.0, 12.0, 35.0, 27.0, 39.0, 29.0, 27.0, 24.0, 46.0, 38.0, 38.0, 35.0, 46.0, 41.0, 31.0, 48.0, 42.0, 33.0, 28.0, 33.0, 28.0, 29.0, 22.0, 25.0, 21.0, 19.0, 11.0, 17.0, 21.0, 11.0, 8.0, 10.0, 3.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.523058891296387, -9.193673133850098, -8.864287376403809, -8.534900665283203, -8.205514907836914, -7.876129150390625, -7.546743392944336, -7.217357635498047, -6.8879714012146, -6.5585856437683105, -6.229199409484863, -5.899813652038574, -5.570427894592285, -5.241041660308838, -4.911655902862549, -4.582269668579102, -4.2528839111328125, -3.9234979152679443, -3.594111919403076, -3.264726161956787, -2.935340166091919, -2.605954170227051, -2.2765684127807617, -1.9471824169158936, -1.6177964210510254, -1.2884104251861572, -0.9590245485305786, -0.6296386122703552, -0.30025267601013184, 0.029133319854736328, 0.35851919651031494, 0.6879050731658936, 1.0172910690307617, 1.3466770648956299, 1.6760629415512085, 2.005448818206787, 2.3348348140716553, 2.6642208099365234, 2.9936065673828125, 3.3229925632476807, 3.652378559112549, 3.981764554977417, 4.311150550842285, 4.640536308288574, 4.969922065734863, 5.2993083000183105, 5.6286940574646, 5.958080291748047, 6.287466049194336, 6.616851806640625, 6.946238040924072, 7.275623798370361, 7.605010032653809, 7.934395790100098, 8.263781547546387, 8.593167304992676, 8.922554016113281, 9.25193977355957, 9.58132553100586, 9.910712242126465, 10.240097999572754, 10.569483757019043, 10.898869514465332, 11.228255271911621, 11.55764102935791]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 13.0, 11.0, 10.0, 21.0, 11.0, 13.0, 27.0, 24.0, 33.0, 37.0, 28.0, 28.0, 35.0, 35.0, 41.0, 47.0, 54.0, 41.0, 44.0, 49.0, 40.0, 31.0, 38.0, 35.0, 30.0, 28.0, 28.0, 27.0, 19.0, 23.0, 13.0, 16.0, 13.0, 7.0, 13.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.724609375, -1.669158935546875, -1.61370849609375, -1.558258056640625, -1.5028076171875, -1.447357177734375, -1.39190673828125, -1.336456298828125, -1.281005859375, -1.225555419921875, -1.17010498046875, -1.114654541015625, -1.0592041015625, -1.003753662109375, -0.94830322265625, -0.892852783203125, -0.83740234375, -0.781951904296875, -0.72650146484375, -0.671051025390625, -0.6156005859375, -0.560150146484375, -0.50469970703125, -0.449249267578125, -0.393798828125, -0.338348388671875, -0.28289794921875, -0.227447509765625, -0.1719970703125, -0.116546630859375, -0.06109619140625, -0.005645751953125, 0.0498046875, 0.105255126953125, 0.16070556640625, 0.216156005859375, 0.2716064453125, 0.327056884765625, 0.38250732421875, 0.437957763671875, 0.493408203125, 0.548858642578125, 0.60430908203125, 0.659759521484375, 0.7152099609375, 0.770660400390625, 0.82611083984375, 0.881561279296875, 0.93701171875, 0.992462158203125, 1.04791259765625, 1.103363037109375, 1.1588134765625, 1.214263916015625, 1.26971435546875, 1.325164794921875, 1.380615234375, 1.436065673828125, 1.49151611328125, 1.546966552734375, 1.6024169921875, 1.657867431640625, 1.71331787109375, 1.768768310546875, 1.82421875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 13.0, 18.0, 23.0, 37.0, 54.0, 72.0, 116.0, 171.0, 233.0, 373.0, 550.0, 852.0, 1271.0, 1938.0, 2916.0, 4489.0, 6782.0, 10225.0, 15788.0, 24158.0, 37994.0, 58280.0, 90746.0, 135508.0, 173297.0, 158936.0, 113589.0, 74182.0, 47627.0, 30970.0, 19708.0, 12918.0, 8400.0, 5551.0, 3636.0, 2393.0, 1612.0, 1019.0, 695.0, 505.0, 309.0, 210.0, 127.0, 69.0, 66.0, 42.0, 28.0, 15.0, 13.0, 7.0, 7.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.198974609375, -0.19271087646484375, -0.1864471435546875, -0.18018341064453125, -0.173919677734375, -0.16765594482421875, -0.1613922119140625, -0.15512847900390625, -0.14886474609375, -0.14260101318359375, -0.1363372802734375, -0.13007354736328125, -0.123809814453125, -0.11754608154296875, -0.1112823486328125, -0.10501861572265625, -0.0987548828125, -0.09249114990234375, -0.0862274169921875, -0.07996368408203125, -0.073699951171875, -0.06743621826171875, -0.0611724853515625, -0.05490875244140625, -0.04864501953125, -0.04238128662109375, -0.0361175537109375, -0.02985382080078125, -0.023590087890625, -0.01732635498046875, -0.0110626220703125, -0.00479888916015625, 0.00146484375, 0.00772857666015625, 0.0139923095703125, 0.02025604248046875, 0.026519775390625, 0.03278350830078125, 0.0390472412109375, 0.04531097412109375, 0.05157470703125, 0.05783843994140625, 0.0641021728515625, 0.07036590576171875, 0.076629638671875, 0.08289337158203125, 0.0891571044921875, 0.09542083740234375, 0.1016845703125, 0.10794830322265625, 0.1142120361328125, 0.12047576904296875, 0.126739501953125, 0.13300323486328125, 0.1392669677734375, 0.14553070068359375, 0.15179443359375, 0.15805816650390625, 0.1643218994140625, 0.17058563232421875, 0.176849365234375, 0.18311309814453125, 0.1893768310546875, 0.19564056396484375, 0.201904296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 6.0, 8.0, 6.0, 5.0, 7.0, 14.0, 12.0, 17.0, 24.0, 23.0, 31.0, 23.0, 31.0, 27.0, 34.0, 34.0, 37.0, 38.0, 53.0, 45.0, 1069.0, 45.0, 44.0, 40.0, 43.0, 44.0, 24.0, 31.0, 28.0, 29.0, 26.0, 20.0, 26.0, 15.0, 7.0, 13.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3818359375, -1.3421783447265625, -1.302520751953125, -1.2628631591796875, -1.22320556640625, -1.1835479736328125, -1.143890380859375, -1.1042327880859375, -1.0645751953125, -1.0249176025390625, -0.985260009765625, -0.9456024169921875, -0.90594482421875, -0.8662872314453125, -0.826629638671875, -0.7869720458984375, -0.747314453125, -0.7076568603515625, -0.667999267578125, -0.6283416748046875, -0.58868408203125, -0.5490264892578125, -0.509368896484375, -0.4697113037109375, -0.4300537109375, -0.3903961181640625, -0.350738525390625, -0.3110809326171875, -0.27142333984375, -0.2317657470703125, -0.192108154296875, -0.1524505615234375, -0.11279296875, -0.0731353759765625, -0.033477783203125, 0.0061798095703125, 0.04583740234375, 0.0854949951171875, 0.125152587890625, 0.1648101806640625, 0.2044677734375, 0.2441253662109375, 0.283782958984375, 0.3234405517578125, 0.36309814453125, 0.4027557373046875, 0.442413330078125, 0.4820709228515625, 0.521728515625, 0.5613861083984375, 0.601043701171875, 0.6407012939453125, 0.68035888671875, 0.7200164794921875, 0.759674072265625, 0.7993316650390625, 0.8389892578125, 0.8786468505859375, 0.918304443359375, 0.9579620361328125, 0.99761962890625, 1.0372772216796875, 1.076934814453125, 1.1165924072265625, 1.15625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 13.0, 18.0, 28.0, 45.0, 55.0, 89.0, 145.0, 233.0, 368.0, 565.0, 1105.0, 2196.0, 4080.0, 8637.0, 19427.0, 69089.0, 1842138.0, 105462.0, 23280.0, 9997.0, 4661.0, 2441.0, 1280.0, 722.0, 398.0, 216.0, 133.0, 81.0, 54.0, 36.0, 27.0, 20.0, 19.0, 9.0, 5.0, 3.0, 5.0, 8.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.61474609375, -0.59747314453125, -0.5802001953125, -0.56292724609375, -0.545654296875, -0.52838134765625, -0.5111083984375, -0.49383544921875, -0.4765625, -0.45928955078125, -0.4420166015625, -0.42474365234375, -0.407470703125, -0.39019775390625, -0.3729248046875, -0.35565185546875, -0.33837890625, -0.32110595703125, -0.3038330078125, -0.28656005859375, -0.269287109375, -0.25201416015625, -0.2347412109375, -0.21746826171875, -0.2001953125, -0.18292236328125, -0.1656494140625, -0.14837646484375, -0.131103515625, -0.11383056640625, -0.0965576171875, -0.07928466796875, -0.06201171875, -0.04473876953125, -0.0274658203125, -0.01019287109375, 0.007080078125, 0.02435302734375, 0.0416259765625, 0.05889892578125, 0.076171875, 0.09344482421875, 0.1107177734375, 0.12799072265625, 0.145263671875, 0.16253662109375, 0.1798095703125, 0.19708251953125, 0.21435546875, 0.23162841796875, 0.2489013671875, 0.26617431640625, 0.283447265625, 0.30072021484375, 0.3179931640625, 0.33526611328125, 0.3525390625, 0.36981201171875, 0.3870849609375, 0.40435791015625, 0.421630859375, 0.43890380859375, 0.4561767578125, 0.47344970703125, 0.49072265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 16.0, 14.0, 13.0, 17.0, 28.0, 30.0, 44.0, 62.0, 83.0, 53.0, 68.0, 92.0, 81.0, 62.0, 57.0, 56.0, 38.0, 34.0, 29.0, 21.0, 17.0, 21.0, 14.0, 6.0, 8.0, 1.0, 3.0, 7.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0236968994140625, -0.023090600967407227, -0.022484302520751953, -0.02187800407409668, -0.021271705627441406, -0.020665407180786133, -0.02005910873413086, -0.019452810287475586, -0.018846511840820312, -0.01824021339416504, -0.017633914947509766, -0.017027616500854492, -0.01642131805419922, -0.015815019607543945, -0.015208721160888672, -0.014602422714233398, -0.013996124267578125, -0.013389825820922852, -0.012783527374267578, -0.012177228927612305, -0.011570930480957031, -0.010964632034301758, -0.010358333587646484, -0.009752035140991211, -0.009145736694335938, -0.008539438247680664, -0.00793313980102539, -0.007326841354370117, -0.006720542907714844, -0.00611424446105957, -0.005507946014404297, -0.0049016475677490234, -0.00429534912109375, -0.0036890506744384766, -0.003082752227783203, -0.0024764537811279297, -0.0018701553344726562, -0.0012638568878173828, -0.0006575584411621094, -5.125999450683594e-05, 0.0005550384521484375, 0.001161336898803711, 0.0017676353454589844, 0.002373933792114258, 0.0029802322387695312, 0.0035865306854248047, 0.004192829132080078, 0.0047991275787353516, 0.005405426025390625, 0.0060117244720458984, 0.006618022918701172, 0.007224321365356445, 0.007830619812011719, 0.008436918258666992, 0.009043216705322266, 0.009649515151977539, 0.010255813598632812, 0.010862112045288086, 0.01146841049194336, 0.012074708938598633, 0.012681007385253906, 0.01328730583190918, 0.013893604278564453, 0.014499902725219727, 0.015106201171875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 7.0, 3.0, 8.0, 10.0, 15.0, 12.0, 28.0, 26.0, 30.0, 74.0, 122.0, 208.0, 487.0, 2628.0, 461916.0, 578856.0, 3158.0, 462.0, 211.0, 112.0, 63.0, 33.0, 19.0, 17.0, 14.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2890625, -0.2775115966796875, -0.265960693359375, -0.2544097900390625, -0.24285888671875, -0.2313079833984375, -0.219757080078125, -0.2082061767578125, -0.1966552734375, -0.1851043701171875, -0.173553466796875, -0.1620025634765625, -0.15045166015625, -0.1389007568359375, -0.127349853515625, -0.1157989501953125, -0.104248046875, -0.0926971435546875, -0.081146240234375, -0.0695953369140625, -0.05804443359375, -0.0464935302734375, -0.034942626953125, -0.0233917236328125, -0.0118408203125, -0.0002899169921875, 0.011260986328125, 0.0228118896484375, 0.03436279296875, 0.0459136962890625, 0.057464599609375, 0.0690155029296875, 0.08056640625, 0.0921173095703125, 0.103668212890625, 0.1152191162109375, 0.12677001953125, 0.1383209228515625, 0.149871826171875, 0.1614227294921875, 0.1729736328125, 0.1845245361328125, 0.196075439453125, 0.2076263427734375, 0.21917724609375, 0.2307281494140625, 0.242279052734375, 0.2538299560546875, 0.265380859375, 0.2769317626953125, 0.288482666015625, 0.3000335693359375, 0.31158447265625, 0.3231353759765625, 0.334686279296875, 0.3462371826171875, 0.3577880859375, 0.3693389892578125, 0.380889892578125, 0.3924407958984375, 0.40399169921875, 0.4155426025390625, 0.427093505859375, 0.4386444091796875, 0.4501953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 24.0, 110.0, 393.0, 345.0, 92.0, 36.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022047948092222214, -0.01636606454849243, -0.010684180073440075, -0.005002295598387718, 0.0006795879453420639, 0.006361471489071846, 0.012043356895446777, 0.01772524043917656, 0.02340712398290634, 0.029089007526636124, 0.034770891070365906, 0.040452778339385986, 0.04613465815782547, 0.05181654542684555, 0.05749842897057533, 0.06318031251430511, 0.0688621997833252, 0.07454408705234528, 0.08022596687078476, 0.08590785413980484, 0.09158973395824432, 0.0972716212272644, 0.10295350849628448, 0.10863538831472397, 0.11431726813316345, 0.11999915540218353, 0.1256810426712036, 0.1313629150390625, 0.13704480230808258, 0.14272668957710266, 0.14840857684612274, 0.15409046411514282, 0.1597723513841629, 0.16545423865318298, 0.17113612592220306, 0.17681799829006195, 0.18249988555908203, 0.1881817728281021, 0.1938636600971222, 0.19954553246498108, 0.20522741973400116, 0.21090930700302124, 0.21659119427204132, 0.2222730666399002, 0.2279549539089203, 0.23363684117794037, 0.23931872844696045, 0.24500060081481934, 0.2506825029850006, 0.2563643753528595, 0.26204627752304077, 0.26772814989089966, 0.27341005206108093, 0.2790919244289398, 0.2847737967967987, 0.29045569896698, 0.29613757133483887, 0.30181944370269775, 0.30750134587287903, 0.3131832182407379, 0.3188651204109192, 0.3245469927787781, 0.33022886514663696, 0.33591076731681824, 0.3415926396846771]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 7.0, 11.0, 14.0, 13.0, 22.0, 31.0, 24.0, 20.0, 33.0, 30.0, 28.0, 46.0, 38.0, 32.0, 39.0, 52.0, 49.0, 46.0, 42.0, 41.0, 46.0, 30.0, 37.0, 33.0, 26.0, 39.0, 24.0, 23.0, 17.0, 14.0, 19.0, 12.0, 8.0, 9.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.021047592163085938, -0.02042924053966999, -0.019810888916254044, -0.019192537292838097, -0.01857418566942215, -0.017955834046006203, -0.017337482422590256, -0.01671913079917431, -0.016100779175758362, -0.015482427552342415, -0.014864075928926468, -0.014245724305510521, -0.013627372682094574, -0.013009021058678627, -0.01239066943526268, -0.011772317811846733, -0.011153966188430786, -0.01053561456501484, -0.009917262941598892, -0.009298911318182945, -0.008680559694766998, -0.008062208071351051, -0.007443856447935104, -0.006825504824519157, -0.0062071532011032104, -0.0055888015776872635, -0.0049704499542713165, -0.00435209833085537, -0.0037337467074394226, -0.0031153950840234756, -0.0024970434606075287, -0.0018786918371915817, -0.0012603402137756348, -0.0006419885903596878, -2.3636966943740845e-05, 0.0005947146564722061, 0.001213066279888153, 0.0018314179033041, 0.002449769526720047, 0.003068121150135994, 0.003686472773551941, 0.004304824396967888, 0.004923176020383835, 0.005541527643799782, 0.006159879267215729, 0.006778230890631676, 0.007396582514047623, 0.00801493413746357, 0.008633285760879517, 0.009251637384295464, 0.00986998900771141, 0.010488340631127357, 0.011106692254543304, 0.011725043877959251, 0.012343395501375198, 0.012961747124791145, 0.013580098748207092, 0.01419845037162304, 0.014816801995038986, 0.015435153618454933, 0.01605350524187088, 0.016671856865286827, 0.017290208488702774, 0.01790856011211872, 0.018526911735534668]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 12.0, 11.0, 10.0, 21.0, 11.0, 13.0, 28.0, 25.0, 31.0, 37.0, 30.0, 27.0, 34.0, 35.0, 41.0, 47.0, 54.0, 42.0, 44.0, 49.0, 39.0, 32.0, 37.0, 35.0, 30.0, 28.0, 28.0, 27.0, 19.0, 23.0, 13.0, 16.0, 13.0, 8.0, 12.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6681976318359375, -1.612762451171875, -1.5573272705078125, -1.50189208984375, -1.4464569091796875, -1.391021728515625, -1.3355865478515625, -1.2801513671875, -1.2247161865234375, -1.169281005859375, -1.1138458251953125, -1.05841064453125, -1.0029754638671875, -0.947540283203125, -0.8921051025390625, -0.836669921875, -0.7812347412109375, -0.725799560546875, -0.6703643798828125, -0.61492919921875, -0.5594940185546875, -0.504058837890625, -0.4486236572265625, -0.3931884765625, -0.3377532958984375, -0.282318115234375, -0.2268829345703125, -0.17144775390625, -0.1160125732421875, -0.060577392578125, -0.0051422119140625, 0.05029296875, 0.1057281494140625, 0.161163330078125, 0.2165985107421875, 0.27203369140625, 0.3274688720703125, 0.382904052734375, 0.4383392333984375, 0.4937744140625, 0.5492095947265625, 0.604644775390625, 0.6600799560546875, 0.71551513671875, 0.7709503173828125, 0.826385498046875, 0.8818206787109375, 0.937255859375, 0.9926910400390625, 1.048126220703125, 1.1035614013671875, 1.15899658203125, 1.2144317626953125, 1.269866943359375, 1.3253021240234375, 1.3807373046875, 1.4361724853515625, 1.491607666015625, 1.5470428466796875, 1.60247802734375, 1.6579132080078125, 1.713348388671875, 1.7687835693359375, 1.82421875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 6.0, 3.0, 6.0, 10.0, 14.0, 23.0, 37.0, 62.0, 102.0, 136.0, 236.0, 377.0, 633.0, 1129.0, 1963.0, 3385.0, 5866.0, 10310.0, 19469.0, 35860.0, 71265.0, 149652.0, 364029.0, 195464.0, 90397.0, 45279.0, 23659.0, 12652.0, 6983.0, 3981.0, 2250.0, 1339.0, 771.0, 450.0, 278.0, 178.0, 110.0, 67.0, 45.0, 27.0, 17.0, 12.0, 12.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.44921875, -2.374237060546875, -2.29925537109375, -2.224273681640625, -2.1492919921875, -2.074310302734375, -1.99932861328125, -1.924346923828125, -1.849365234375, -1.774383544921875, -1.69940185546875, -1.624420166015625, -1.5494384765625, -1.474456787109375, -1.39947509765625, -1.324493408203125, -1.24951171875, -1.174530029296875, -1.09954833984375, -1.024566650390625, -0.9495849609375, -0.874603271484375, -0.79962158203125, -0.724639892578125, -0.649658203125, -0.574676513671875, -0.49969482421875, -0.424713134765625, -0.3497314453125, -0.274749755859375, -0.19976806640625, -0.124786376953125, -0.0498046875, 0.025177001953125, 0.10015869140625, 0.175140380859375, 0.2501220703125, 0.325103759765625, 0.40008544921875, 0.475067138671875, 0.550048828125, 0.625030517578125, 0.70001220703125, 0.774993896484375, 0.8499755859375, 0.924957275390625, 0.99993896484375, 1.074920654296875, 1.14990234375, 1.224884033203125, 1.29986572265625, 1.374847412109375, 1.4498291015625, 1.524810791015625, 1.59979248046875, 1.674774169921875, 1.749755859375, 1.824737548828125, 1.89971923828125, 1.974700927734375, 2.0496826171875, 2.124664306640625, 2.19964599609375, 2.274627685546875, 2.349609375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 4.0, 5.0, 5.0, 14.0, 14.0, 15.0, 16.0, 32.0, 29.0, 44.0, 31.0, 46.0, 58.0, 75.0, 98.0, 150.0, 267.0, 1373.0, 185.0, 132.0, 83.0, 56.0, 48.0, 54.0, 37.0, 30.0, 34.0, 18.0, 19.0, 19.0, 9.0, 14.0, 9.0, 4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.2734375, -7.0780029296875, -6.882568359375, -6.6871337890625, -6.49169921875, -6.2962646484375, -6.100830078125, -5.9053955078125, -5.7099609375, -5.5145263671875, -5.319091796875, -5.1236572265625, -4.92822265625, -4.7327880859375, -4.537353515625, -4.3419189453125, -4.146484375, -3.9510498046875, -3.755615234375, -3.5601806640625, -3.36474609375, -3.1693115234375, -2.973876953125, -2.7784423828125, -2.5830078125, -2.3875732421875, -2.192138671875, -1.9967041015625, -1.80126953125, -1.6058349609375, -1.410400390625, -1.2149658203125, -1.01953125, -0.8240966796875, -0.628662109375, -0.4332275390625, -0.23779296875, -0.0423583984375, 0.153076171875, 0.3485107421875, 0.5439453125, 0.7393798828125, 0.934814453125, 1.1302490234375, 1.32568359375, 1.5211181640625, 1.716552734375, 1.9119873046875, 2.107421875, 2.3028564453125, 2.498291015625, 2.6937255859375, 2.88916015625, 3.0845947265625, 3.280029296875, 3.4754638671875, 3.6708984375, 3.8663330078125, 4.061767578125, 4.2572021484375, 4.45263671875, 4.6480712890625, 4.843505859375, 5.0389404296875, 5.234375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 12.0, 9.0, 7.0, 10.0, 21.0, 19.0, 29.0, 34.0, 47.0, 73.0, 99.0, 147.0, 259.0, 376.0, 1043.0, 5133.0, 64196.0, 2452289.0, 597970.0, 19940.0, 2411.0, 678.0, 301.0, 170.0, 99.0, 95.0, 69.0, 36.0, 35.0, 26.0, 16.0, 9.0, 14.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.2969970703125, -8.922119140625, -8.5472412109375, -8.17236328125, -7.7974853515625, -7.422607421875, -7.0477294921875, -6.6728515625, -6.2979736328125, -5.923095703125, -5.5482177734375, -5.17333984375, -4.7984619140625, -4.423583984375, -4.0487060546875, -3.673828125, -3.2989501953125, -2.924072265625, -2.5491943359375, -2.17431640625, -1.7994384765625, -1.424560546875, -1.0496826171875, -0.6748046875, -0.2999267578125, 0.074951171875, 0.4498291015625, 0.82470703125, 1.1995849609375, 1.574462890625, 1.9493408203125, 2.32421875, 2.6990966796875, 3.073974609375, 3.4488525390625, 3.82373046875, 4.1986083984375, 4.573486328125, 4.9483642578125, 5.3232421875, 5.6981201171875, 6.072998046875, 6.4478759765625, 6.82275390625, 7.1976318359375, 7.572509765625, 7.9473876953125, 8.322265625, 8.6971435546875, 9.072021484375, 9.4468994140625, 9.82177734375, 10.1966552734375, 10.571533203125, 10.9464111328125, 11.3212890625, 11.6961669921875, 12.071044921875, 12.4459228515625, 12.82080078125, 13.1956787109375, 13.570556640625, 13.9454345703125, 14.3203125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [3.0, 25.0, 942.0, 50.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.661325454711914, -10.20665168762207, -3.751978874206543, 2.7026939392089844, 9.157367706298828, 15.612039566040039, 22.066713333129883, 28.521387100219727, 34.97605895996094, 41.43073272705078, 47.885406494140625, 54.34008026123047, 60.79475402832031, 67.24942016601562, 73.7041015625, 80.15876770019531, 86.61344909667969, 93.06812286376953, 99.52279663085938, 105.97747039794922, 112.43214416503906, 118.88681030273438, 125.34149169921875, 131.79615783691406, 138.25083923339844, 144.70550537109375, 151.16018676757812, 157.61485290527344, 164.0695343017578, 170.52420043945312, 176.9788818359375, 183.4335479736328, 189.8882293701172, 196.3428955078125, 202.79757690429688, 209.2522430419922, 215.70692443847656, 222.16159057617188, 228.61627197265625, 235.07093811035156, 241.52561950683594, 247.98028564453125, 254.43496704101562, 260.8896484375, 267.34429931640625, 273.7989807128906, 280.253662109375, 286.7083435058594, 293.1629943847656, 299.61767578125, 306.07232666015625, 312.5270080566406, 318.981689453125, 325.4363708496094, 331.8910217285156, 338.345703125, 344.8003845214844, 351.25506591796875, 357.709716796875, 364.1643981933594, 370.61907958984375, 377.0737609863281, 383.5284118652344, 389.98309326171875, 396.4377746582031]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 11.0, 9.0, 13.0, 11.0, 12.0, 13.0, 23.0, 14.0, 18.0, 29.0, 28.0, 34.0, 54.0, 40.0, 56.0, 41.0, 58.0, 47.0, 47.0, 56.0, 56.0, 37.0, 34.0, 40.0, 37.0, 30.0, 26.0, 20.0, 18.0, 16.0, 12.0, 14.0, 11.0, 13.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.79469108581543, -16.25420570373535, -15.71371841430664, -15.173232078552246, -14.632745742797852, -14.092260360717773, -13.551774024963379, -13.011287689208984, -12.47080135345459, -11.930315017700195, -11.3898286819458, -10.849342346191406, -10.308856964111328, -9.768369674682617, -9.227884292602539, -8.687397956848145, -8.14691162109375, -7.6064252853393555, -7.065938949584961, -6.525453090667725, -5.98496675491333, -5.4444804191589355, -4.903994560241699, -4.363508224487305, -3.82302188873291, -3.2825355529785156, -2.7420494556427, -2.2015633583068848, -1.6610770225524902, -1.1205906867980957, -0.5801045894622803, -0.039618492126464844, 0.5008659362792969, 1.0413521528244019, 1.5818383693695068, 2.1223244667053223, 2.662810802459717, 3.2032971382141113, 3.7437832355499268, 4.284269332885742, 4.824755668640137, 5.365242004394531, 5.905728340148926, 6.446214199066162, 6.986700534820557, 7.527186870574951, 8.067672729492188, 8.608159065246582, 9.148645401000977, 9.689131736755371, 10.229618072509766, 10.77010440826416, 11.310590744018555, 11.851076126098633, 12.391562461853027, 12.932048797607422, 13.472535133361816, 14.013021469116211, 14.553507804870605, 15.093994140625, 15.634479522705078, 16.17496681213379, 16.715452194213867, 17.255939483642578, 17.796424865722656]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 6.0, 5.0, 5.0, 8.0, 12.0, 12.0, 11.0, 14.0, 16.0, 11.0, 15.0, 21.0, 27.0, 34.0, 34.0, 28.0, 31.0, 40.0, 26.0, 37.0, 45.0, 44.0, 41.0, 46.0, 30.0, 40.0, 47.0, 33.0, 27.0, 28.0, 29.0, 17.0, 23.0, 24.0, 23.0, 24.0, 20.0, 8.0, 14.0, 8.0, 10.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.6551055908203125, -1.600250244140625, -1.5453948974609375, -1.49053955078125, -1.4356842041015625, -1.380828857421875, -1.3259735107421875, -1.2711181640625, -1.2162628173828125, -1.161407470703125, -1.1065521240234375, -1.05169677734375, -0.9968414306640625, -0.941986083984375, -0.8871307373046875, -0.832275390625, -0.7774200439453125, -0.722564697265625, -0.6677093505859375, -0.61285400390625, -0.5579986572265625, -0.503143310546875, -0.4482879638671875, -0.3934326171875, -0.3385772705078125, -0.283721923828125, -0.2288665771484375, -0.17401123046875, -0.1191558837890625, -0.064300537109375, -0.0094451904296875, 0.04541015625, 0.1002655029296875, 0.155120849609375, 0.2099761962890625, 0.26483154296875, 0.3196868896484375, 0.374542236328125, 0.4293975830078125, 0.4842529296875, 0.5391082763671875, 0.593963623046875, 0.6488189697265625, 0.70367431640625, 0.7585296630859375, 0.813385009765625, 0.8682403564453125, 0.923095703125, 0.9779510498046875, 1.032806396484375, 1.0876617431640625, 1.14251708984375, 1.1973724365234375, 1.252227783203125, 1.3070831298828125, 1.3619384765625, 1.4167938232421875, 1.471649169921875, 1.5265045166015625, 1.58135986328125, 1.6362152099609375, 1.691070556640625, 1.7459259033203125, 1.80078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 10.0, 9.0, 18.0, 32.0, 43.0, 78.0, 125.0, 204.0, 368.0, 624.0, 1034.0, 1706.0, 3194.0, 5934.0, 11863.0, 26152.0, 67243.0, 243280.0, 1383413.0, 1919466.0, 376697.0, 90075.0, 32853.0, 14588.0, 6994.0, 3720.0, 1957.0, 1116.0, 607.0, 333.0, 233.0, 131.0, 79.0, 42.0, 29.0, 16.0, 11.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.42578125, -3.31207275390625, -3.1983642578125, -3.08465576171875, -2.970947265625, -2.85723876953125, -2.7435302734375, -2.62982177734375, -2.51611328125, -2.40240478515625, -2.2886962890625, -2.17498779296875, -2.061279296875, -1.94757080078125, -1.8338623046875, -1.72015380859375, -1.6064453125, -1.49273681640625, -1.3790283203125, -1.26531982421875, -1.151611328125, -1.03790283203125, -0.9241943359375, -0.81048583984375, -0.69677734375, -0.58306884765625, -0.4693603515625, -0.35565185546875, -0.241943359375, -0.12823486328125, -0.0145263671875, 0.09918212890625, 0.212890625, 0.32659912109375, 0.4403076171875, 0.55401611328125, 0.667724609375, 0.78143310546875, 0.8951416015625, 1.00885009765625, 1.12255859375, 1.23626708984375, 1.3499755859375, 1.46368408203125, 1.577392578125, 1.69110107421875, 1.8048095703125, 1.91851806640625, 2.0322265625, 2.14593505859375, 2.2596435546875, 2.37335205078125, 2.487060546875, 2.60076904296875, 2.7144775390625, 2.82818603515625, 2.94189453125, 3.05560302734375, 3.1693115234375, 3.28302001953125, 3.396728515625, 3.51043701171875, 3.6241455078125, 3.73785400390625, 3.8515625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 13.0, 10.0, 19.0, 34.0, 31.0, 55.0, 71.0, 91.0, 129.0, 208.0, 307.0, 478.0, 688.0, 591.0, 406.0, 304.0, 194.0, 116.0, 67.0, 62.0, 41.0, 43.0, 23.0, 22.0, 20.0, 8.0, 12.0, 12.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.003143310546875, -2.87152099609375, -2.739898681640625, -2.6082763671875, -2.476654052734375, -2.34503173828125, -2.213409423828125, -2.081787109375, -1.950164794921875, -1.81854248046875, -1.686920166015625, -1.5552978515625, -1.423675537109375, -1.29205322265625, -1.160430908203125, -1.02880859375, -0.897186279296875, -0.76556396484375, -0.633941650390625, -0.5023193359375, -0.370697021484375, -0.23907470703125, -0.107452392578125, 0.024169921875, 0.155792236328125, 0.28741455078125, 0.419036865234375, 0.5506591796875, 0.682281494140625, 0.81390380859375, 0.945526123046875, 1.0771484375, 1.208770751953125, 1.34039306640625, 1.472015380859375, 1.6036376953125, 1.735260009765625, 1.86688232421875, 1.998504638671875, 2.130126953125, 2.261749267578125, 2.39337158203125, 2.524993896484375, 2.6566162109375, 2.788238525390625, 2.91986083984375, 3.051483154296875, 3.18310546875, 3.314727783203125, 3.44635009765625, 3.577972412109375, 3.7095947265625, 3.841217041015625, 3.97283935546875, 4.104461669921875, 4.236083984375, 4.367706298828125, 4.49932861328125, 4.630950927734375, 4.7625732421875, 4.894195556640625, 5.02581787109375, 5.157440185546875, 5.2890625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 11.0, 15.0, 20.0, 27.0, 41.0, 59.0, 73.0, 105.0, 226.0, 515.0, 3023.0, 59373.0, 3642881.0, 474307.0, 11734.0, 1110.0, 294.0, 135.0, 104.0, 55.0, 38.0, 37.0, 29.0, 13.0, 13.0, 7.0, 1.0, 3.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.953125, -21.4144287109375, -20.875732421875, -20.3370361328125, -19.79833984375, -19.2596435546875, -18.720947265625, -18.1822509765625, -17.6435546875, -17.1048583984375, -16.566162109375, -16.0274658203125, -15.48876953125, -14.9500732421875, -14.411376953125, -13.8726806640625, -13.333984375, -12.7952880859375, -12.256591796875, -11.7178955078125, -11.17919921875, -10.6405029296875, -10.101806640625, -9.5631103515625, -9.0244140625, -8.4857177734375, -7.947021484375, -7.4083251953125, -6.86962890625, -6.3309326171875, -5.792236328125, -5.2535400390625, -4.71484375, -4.1761474609375, -3.637451171875, -3.0987548828125, -2.56005859375, -2.0213623046875, -1.482666015625, -0.9439697265625, -0.4052734375, 0.1334228515625, 0.672119140625, 1.2108154296875, 1.74951171875, 2.2882080078125, 2.826904296875, 3.3656005859375, 3.904296875, 4.4429931640625, 4.981689453125, 5.5203857421875, 6.05908203125, 6.5977783203125, 7.136474609375, 7.6751708984375, 8.2138671875, 8.7525634765625, 9.291259765625, 9.8299560546875, 10.36865234375, 10.9073486328125, 11.446044921875, 11.9847412109375, 12.5234375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 14.0, 33.0, 76.0, 163.0, 266.0, 222.0, 132.0, 69.0, 24.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.50320816040039, -39.09246063232422, -37.68170928955078, -36.27096176147461, -34.86021423339844, -33.449462890625, -32.03871536254883, -30.627967834472656, -29.21721839904785, -27.806468963623047, -26.395721435546875, -24.98497200012207, -23.574222564697266, -22.163475036621094, -20.75272560119629, -19.341976165771484, -17.931228637695312, -16.520479202270508, -15.109731674194336, -13.698982238769531, -12.288233757019043, -10.877485275268555, -9.46673583984375, -8.055987358093262, -6.645238876342773, -5.234490394592285, -3.8237414360046387, -2.412992477416992, -1.002243995666504, 0.4085044860839844, 1.819253921508789, 3.2300024032592773, 4.6407470703125, 6.051495552062988, 7.462244510650635, 8.872993469238281, 10.28374195098877, 11.694490432739258, 13.105239868164062, 14.51598834991455, 15.926736831665039, 17.337486267089844, 18.748233795166016, 20.15898323059082, 21.569732666015625, 22.980480194091797, 24.3912296295166, 25.801979064941406, 27.212726593017578, 28.623476028442383, 30.034223556518555, 31.44497299194336, 32.85572052001953, 34.26647186279297, 35.67721939086914, 37.08796691894531, 38.49871826171875, 39.90946578979492, 41.32021713256836, 42.73096466064453, 44.1417121887207, 45.552459716796875, 46.96321105957031, 48.373958587646484, 49.784706115722656]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 12.0, 13.0, 13.0, 11.0, 20.0, 22.0, 19.0, 21.0, 35.0, 30.0, 35.0, 47.0, 52.0, 44.0, 41.0, 35.0, 48.0, 45.0, 37.0, 40.0, 48.0, 54.0, 38.0, 31.0, 28.0, 29.0, 25.0, 22.0, 21.0, 13.0, 16.0, 8.0, 5.0, 6.0, 7.0, 6.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.54681396484375, -13.137932777404785, -12.72905158996582, -12.320170402526855, -11.91128921508789, -11.502408027648926, -11.093526840209961, -10.684645652770996, -10.275764465332031, -9.866883277893066, -9.458002090454102, -9.049120903015137, -8.640239715576172, -8.231358528137207, -7.822477340698242, -7.413596153259277, -7.004715442657471, -6.595834255218506, -6.186953067779541, -5.778071880340576, -5.369190692901611, -4.960309982299805, -4.55142879486084, -4.142547607421875, -3.733666181564331, -3.324784994125366, -2.9159038066864014, -2.5070228576660156, -2.098141670227051, -1.689260482788086, -1.280379295349121, -0.8714981079101562, -0.4626169204711914, -0.05373576283454895, 0.3551453948020935, 0.7640265226364136, 1.1729077100753784, 1.5817887783050537, 1.9906699657440186, 2.3995511531829834, 2.8084323406219482, 3.217313528060913, 3.626194715499878, 4.035075664520264, 4.4439568519592285, 4.852838039398193, 5.261719226837158, 5.670600414276123, 6.079481601715088, 6.488362789154053, 6.897243976593018, 7.306125164031982, 7.715006351470947, 8.123887062072754, 8.532768249511719, 8.941649436950684, 9.350530624389648, 9.759411811828613, 10.168292999267578, 10.577174186706543, 10.986055374145508, 11.394936561584473, 11.803817749023438, 12.212698936462402, 12.621580123901367]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 9.0, 3.0, 5.0, 8.0, 14.0, 14.0, 5.0, 11.0, 14.0, 19.0, 15.0, 21.0, 26.0, 30.0, 19.0, 29.0, 26.0, 30.0, 41.0, 29.0, 56.0, 24.0, 29.0, 37.0, 40.0, 39.0, 42.0, 29.0, 37.0, 24.0, 30.0, 32.0, 25.0, 29.0, 26.0, 16.0, 12.0, 13.0, 21.0, 10.0, 10.0, 7.0, 6.0, 10.0, 10.0, 3.0, 5.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0], "bins": [-1.6240234375, -1.57623291015625, -1.5284423828125, -1.48065185546875, -1.432861328125, -1.38507080078125, -1.3372802734375, -1.28948974609375, -1.24169921875, -1.19390869140625, -1.1461181640625, -1.09832763671875, -1.050537109375, -1.00274658203125, -0.9549560546875, -0.90716552734375, -0.859375, -0.81158447265625, -0.7637939453125, -0.71600341796875, -0.668212890625, -0.62042236328125, -0.5726318359375, -0.52484130859375, -0.47705078125, -0.42926025390625, -0.3814697265625, -0.33367919921875, -0.285888671875, -0.23809814453125, -0.1903076171875, -0.14251708984375, -0.0947265625, -0.04693603515625, 0.0008544921875, 0.04864501953125, 0.096435546875, 0.14422607421875, 0.1920166015625, 0.23980712890625, 0.28759765625, 0.33538818359375, 0.3831787109375, 0.43096923828125, 0.478759765625, 0.52655029296875, 0.5743408203125, 0.62213134765625, 0.669921875, 0.71771240234375, 0.7655029296875, 0.81329345703125, 0.861083984375, 0.90887451171875, 0.9566650390625, 1.00445556640625, 1.05224609375, 1.10003662109375, 1.1478271484375, 1.19561767578125, 1.243408203125, 1.29119873046875, 1.3389892578125, 1.38677978515625, 1.4345703125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 4.0, 8.0, 13.0, 28.0, 36.0, 49.0, 66.0, 99.0, 158.0, 186.0, 325.0, 431.0, 677.0, 858.0, 1231.0, 1803.0, 2596.0, 3581.0, 5248.0, 7630.0, 11273.0, 16803.0, 25141.0, 38675.0, 60168.0, 91528.0, 133259.0, 164025.0, 152347.0, 111508.0, 74422.0, 48419.0, 31591.0, 20581.0, 13681.0, 9079.0, 6307.0, 4457.0, 3014.0, 2121.0, 1519.0, 1106.0, 741.0, 559.0, 383.0, 260.0, 163.0, 127.0, 97.0, 72.0, 39.0, 34.0, 14.0, 12.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.1568603515625, -0.15192031860351562, -0.14698028564453125, -0.14204025268554688, -0.1371002197265625, -0.13216018676757812, -0.12722015380859375, -0.12228012084960938, -0.117340087890625, -0.11240005493164062, -0.10746002197265625, -0.10251998901367188, -0.0975799560546875, -0.09263992309570312, -0.08769989013671875, -0.08275985717773438, -0.07781982421875, -0.07287979125976562, -0.06793975830078125, -0.06299972534179688, -0.0580596923828125, -0.053119659423828125, -0.04817962646484375, -0.043239593505859375, -0.038299560546875, -0.033359527587890625, -0.02841949462890625, -0.023479461669921875, -0.0185394287109375, -0.013599395751953125, -0.00865936279296875, -0.003719329833984375, 0.001220703125, 0.006160736083984375, 0.01110076904296875, 0.016040802001953125, 0.0209808349609375, 0.025920867919921875, 0.03086090087890625, 0.035800933837890625, 0.040740966796875, 0.045680999755859375, 0.05062103271484375, 0.055561065673828125, 0.0605010986328125, 0.06544113159179688, 0.07038116455078125, 0.07532119750976562, 0.08026123046875, 0.08520126342773438, 0.09014129638671875, 0.09508132934570312, 0.1000213623046875, 0.10496139526367188, 0.10990142822265625, 0.11484146118164062, 0.119781494140625, 0.12472152709960938, 0.12966156005859375, 0.13460159301757812, 0.1395416259765625, 0.14448165893554688, 0.14942169189453125, 0.15436172485351562, 0.1593017578125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 17.0, 10.0, 13.0, 20.0, 19.0, 24.0, 26.0, 28.0, 22.0, 24.0, 39.0, 38.0, 41.0, 31.0, 35.0, 44.0, 41.0, 1076.0, 45.0, 43.0, 42.0, 41.0, 35.0, 45.0, 28.0, 37.0, 24.0, 23.0, 19.0, 18.0, 10.0, 17.0, 8.0, 9.0, 7.0, 8.0, 4.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5361328125, -1.49505615234375, -1.4539794921875, -1.41290283203125, -1.371826171875, -1.33074951171875, -1.2896728515625, -1.24859619140625, -1.20751953125, -1.16644287109375, -1.1253662109375, -1.08428955078125, -1.043212890625, -1.00213623046875, -0.9610595703125, -0.91998291015625, -0.87890625, -0.83782958984375, -0.7967529296875, -0.75567626953125, -0.714599609375, -0.67352294921875, -0.6324462890625, -0.59136962890625, -0.55029296875, -0.50921630859375, -0.4681396484375, -0.42706298828125, -0.385986328125, -0.34490966796875, -0.3038330078125, -0.26275634765625, -0.2216796875, -0.18060302734375, -0.1395263671875, -0.09844970703125, -0.057373046875, -0.01629638671875, 0.0247802734375, 0.06585693359375, 0.10693359375, 0.14801025390625, 0.1890869140625, 0.23016357421875, 0.271240234375, 0.31231689453125, 0.3533935546875, 0.39447021484375, 0.435546875, 0.47662353515625, 0.5177001953125, 0.55877685546875, 0.599853515625, 0.64093017578125, 0.6820068359375, 0.72308349609375, 0.76416015625, 0.80523681640625, 0.8463134765625, 0.88739013671875, 0.928466796875, 0.96954345703125, 1.0106201171875, 1.05169677734375, 1.0927734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 9.0, 7.0, 11.0, 16.0, 24.0, 36.0, 45.0, 90.0, 102.0, 176.0, 294.0, 498.0, 875.0, 1670.0, 3442.0, 7420.0, 16764.0, 47296.0, 1759408.0, 207104.0, 28674.0, 11944.0, 5431.0, 2686.0, 1379.0, 706.0, 391.0, 211.0, 137.0, 92.0, 45.0, 42.0, 34.0, 19.0, 18.0, 15.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447509765625, -0.43297576904296875, -0.4184417724609375, -0.40390777587890625, -0.389373779296875, -0.37483978271484375, -0.3603057861328125, -0.34577178955078125, -0.33123779296875, -0.31670379638671875, -0.3021697998046875, -0.28763580322265625, -0.273101806640625, -0.25856781005859375, -0.2440338134765625, -0.22949981689453125, -0.2149658203125, -0.20043182373046875, -0.1858978271484375, -0.17136383056640625, -0.156829833984375, -0.14229583740234375, -0.1277618408203125, -0.11322784423828125, -0.09869384765625, -0.08415985107421875, -0.0696258544921875, -0.05509185791015625, -0.040557861328125, -0.02602386474609375, -0.0114898681640625, 0.00304412841796875, 0.017578125, 0.03211212158203125, 0.0466461181640625, 0.06118011474609375, 0.075714111328125, 0.09024810791015625, 0.1047821044921875, 0.11931610107421875, 0.13385009765625, 0.14838409423828125, 0.1629180908203125, 0.17745208740234375, 0.191986083984375, 0.20652008056640625, 0.2210540771484375, 0.23558807373046875, 0.2501220703125, 0.26465606689453125, 0.2791900634765625, 0.29372406005859375, 0.308258056640625, 0.32279205322265625, 0.3373260498046875, 0.35186004638671875, 0.36639404296875, 0.38092803955078125, 0.3954620361328125, 0.40999603271484375, 0.424530029296875, 0.43906402587890625, 0.4535980224609375, 0.46813201904296875, 0.482666015625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 10.0, 21.0, 14.0, 16.0, 21.0, 22.0, 15.0, 35.0, 34.0, 41.0, 36.0, 42.0, 44.0, 59.0, 52.0, 44.0, 42.0, 58.0, 60.0, 46.0, 45.0, 36.0, 35.0, 33.0, 20.0, 23.0, 13.0, 17.0, 9.0, 7.0, 6.0, 7.0, 6.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01160430908203125, -0.011227965354919434, -0.010851621627807617, -0.0104752779006958, -0.010098934173583984, -0.009722590446472168, -0.009346246719360352, -0.008969902992248535, -0.008593559265136719, -0.008217215538024902, -0.007840871810913086, -0.0074645280838012695, -0.007088184356689453, -0.006711840629577637, -0.00633549690246582, -0.005959153175354004, -0.0055828094482421875, -0.005206465721130371, -0.004830121994018555, -0.004453778266906738, -0.004077434539794922, -0.0037010908126831055, -0.003324747085571289, -0.0029484033584594727, -0.0025720596313476562, -0.00219571590423584, -0.0018193721771240234, -0.001443028450012207, -0.0010666847229003906, -0.0006903409957885742, -0.0003139972686767578, 6.23464584350586e-05, 0.000438690185546875, 0.0008150339126586914, 0.0011913776397705078, 0.0015677213668823242, 0.0019440650939941406, 0.002320408821105957, 0.0026967525482177734, 0.00307309627532959, 0.0034494400024414062, 0.0038257837295532227, 0.004202127456665039, 0.0045784711837768555, 0.004954814910888672, 0.005331158638000488, 0.005707502365112305, 0.006083846092224121, 0.0064601898193359375, 0.006836533546447754, 0.00721287727355957, 0.007589221000671387, 0.007965564727783203, 0.00834190845489502, 0.008718252182006836, 0.009094595909118652, 0.009470939636230469, 0.009847283363342285, 0.010223627090454102, 0.010599970817565918, 0.010976314544677734, 0.01135265827178955, 0.011729001998901367, 0.012105345726013184, 0.012481689453125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 2.0, 3.0, 7.0, 6.0, 16.0, 17.0, 16.0, 19.0, 24.0, 32.0, 46.0, 77.0, 95.0, 170.0, 267.0, 574.0, 4262.0, 276079.0, 750866.0, 14129.0, 902.0, 324.0, 199.0, 115.0, 79.0, 45.0, 35.0, 24.0, 21.0, 17.0, 20.0, 16.0, 11.0, 9.0, 11.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.222412109375, -0.21570587158203125, -0.2089996337890625, -0.20229339599609375, -0.195587158203125, -0.18888092041015625, -0.1821746826171875, -0.17546844482421875, -0.16876220703125, -0.16205596923828125, -0.1553497314453125, -0.14864349365234375, -0.141937255859375, -0.13523101806640625, -0.1285247802734375, -0.12181854248046875, -0.1151123046875, -0.10840606689453125, -0.1016998291015625, -0.09499359130859375, -0.088287353515625, -0.08158111572265625, -0.0748748779296875, -0.06816864013671875, -0.06146240234375, -0.05475616455078125, -0.0480499267578125, -0.04134368896484375, -0.034637451171875, -0.02793121337890625, -0.0212249755859375, -0.01451873779296875, -0.0078125, -0.00110626220703125, 0.0055999755859375, 0.01230621337890625, 0.019012451171875, 0.02571868896484375, 0.0324249267578125, 0.03913116455078125, 0.04583740234375, 0.05254364013671875, 0.0592498779296875, 0.06595611572265625, 0.072662353515625, 0.07936859130859375, 0.0860748291015625, 0.09278106689453125, 0.0994873046875, 0.10619354248046875, 0.1128997802734375, 0.11960601806640625, 0.126312255859375, 0.13301849365234375, 0.1397247314453125, 0.14643096923828125, 0.15313720703125, 0.15984344482421875, 0.1665496826171875, 0.17325592041015625, 0.179962158203125, 0.18666839599609375, 0.1933746337890625, 0.20008087158203125, 0.206787109375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 18.0, 65.0, 186.0, 375.0, 215.0, 85.0, 33.0, 22.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020047765225172043, -0.01696363277733326, -0.013879502192139626, -0.010795369744300842, -0.007711238227784634, -0.004627106711268425, -0.0015429742634296417, 0.0015411563217639923, 0.004625288769602776, 0.007709420286118984, 0.010793551802635193, 0.013877684250473976, 0.01696181669831276, 0.020045947283506393, 0.023130079731345177, 0.02621421031653881, 0.029298342764377594, 0.03238247334957123, 0.03546660766005516, 0.038550738245248795, 0.04163486883044243, 0.04471900314092636, 0.047803133726119995, 0.05088726431131363, 0.05397139489650726, 0.0570555254817009, 0.06013965979218483, 0.06322379410266876, 0.0663079246878624, 0.06939205527305603, 0.07247618585824966, 0.0755603164434433, 0.07864444702863693, 0.08172857761383057, 0.0848127081990242, 0.08789683878421783, 0.09098097681999207, 0.0940651074051857, 0.09714923799037933, 0.10023336857557297, 0.1033174991607666, 0.10640162974596024, 0.10948576033115387, 0.1125698983669281, 0.11565402895212173, 0.11873815953731537, 0.121822290122509, 0.12490642070770264, 0.12799055874347687, 0.1310746967792511, 0.13415881991386414, 0.13724295794963837, 0.1403270810842514, 0.14341121912002563, 0.14649534225463867, 0.1495794802904129, 0.15266360342502594, 0.15574774146080017, 0.1588318645954132, 0.16191600263118744, 0.16500012576580048, 0.1680842638015747, 0.17116838693618774, 0.17425252497196198, 0.1773366630077362]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 4.0, 10.0, 7.0, 21.0, 35.0, 20.0, 32.0, 42.0, 38.0, 56.0, 42.0, 61.0, 65.0, 71.0, 55.0, 70.0, 66.0, 54.0, 50.0, 41.0, 33.0, 36.0, 18.0, 18.0, 12.0, 15.0, 8.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036606669425964355, -0.03565093129873276, -0.03469519317150116, -0.03373945876955986, -0.03278372064232826, -0.031827982515096664, -0.030872246250510216, -0.029916509985923767, -0.02896077185869217, -0.02800503373146057, -0.027049297466874123, -0.026093561202287674, -0.025137823075056076, -0.024182084947824478, -0.02322634868323803, -0.02227061241865158, -0.021314874291419983, -0.020359136164188385, -0.019403399899601936, -0.018447663635015488, -0.01749192550778389, -0.016536187380552292, -0.015580451115965843, -0.01462471392005682, -0.013668976724147797, -0.012713239528238773, -0.01175750233232975, -0.010801765136420727, -0.009846027940511703, -0.00889029074460268, -0.007934553548693657, -0.006978816352784634, -0.00602307915687561, -0.005067341960966587, -0.004111604765057564, -0.0031558675691485405, -0.002200130373239517, -0.001244393177330494, -0.00028865598142147064, 0.0006670812144875526, 0.001622818410396576, 0.002578555606305599, 0.0035342928022146225, 0.004490029998123646, 0.005445767194032669, 0.006401504389941692, 0.007357241585850716, 0.008312978781759739, 0.009268715977668762, 0.010224453173577785, 0.011180190369486809, 0.012135927565395832, 0.013091664761304855, 0.014047401957213879, 0.015003139153122902, 0.01595887541770935, 0.01691461354494095, 0.017870351672172546, 0.018826087936758995, 0.019781824201345444, 0.02073756232857704, 0.02169330045580864, 0.022649036720395088, 0.023604772984981537, 0.024560511112213135]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 10.0, 2.0, 6.0, 7.0, 14.0, 14.0, 5.0, 11.0, 15.0, 18.0, 15.0, 21.0, 27.0, 29.0, 19.0, 29.0, 27.0, 29.0, 41.0, 29.0, 56.0, 23.0, 31.0, 36.0, 41.0, 37.0, 42.0, 30.0, 37.0, 24.0, 30.0, 32.0, 26.0, 28.0, 25.0, 17.0, 12.0, 13.0, 22.0, 9.0, 10.0, 7.0, 6.0, 9.0, 11.0, 3.0, 5.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0], "bins": [-1.623046875, -1.575286865234375, -1.52752685546875, -1.479766845703125, -1.4320068359375, -1.384246826171875, -1.33648681640625, -1.288726806640625, -1.240966796875, -1.193206787109375, -1.14544677734375, -1.097686767578125, -1.0499267578125, -1.002166748046875, -0.95440673828125, -0.906646728515625, -0.85888671875, -0.811126708984375, -0.76336669921875, -0.715606689453125, -0.6678466796875, -0.620086669921875, -0.57232666015625, -0.524566650390625, -0.476806640625, -0.429046630859375, -0.38128662109375, -0.333526611328125, -0.2857666015625, -0.238006591796875, -0.19024658203125, -0.142486572265625, -0.0947265625, -0.046966552734375, 0.00079345703125, 0.048553466796875, 0.0963134765625, 0.144073486328125, 0.19183349609375, 0.239593505859375, 0.287353515625, 0.335113525390625, 0.38287353515625, 0.430633544921875, 0.4783935546875, 0.526153564453125, 0.57391357421875, 0.621673583984375, 0.66943359375, 0.717193603515625, 0.76495361328125, 0.812713623046875, 0.8604736328125, 0.908233642578125, 0.95599365234375, 1.003753662109375, 1.051513671875, 1.099273681640625, 1.14703369140625, 1.194793701171875, 1.2425537109375, 1.290313720703125, 1.33807373046875, 1.385833740234375, 1.43359375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 19.0, 21.0, 29.0, 46.0, 66.0, 93.0, 140.0, 225.0, 334.0, 472.0, 735.0, 1229.0, 2010.0, 3372.0, 6082.0, 10935.0, 21660.0, 47112.0, 110583.0, 299182.0, 327844.0, 117217.0, 49330.0, 22868.0, 11514.0, 6179.0, 3632.0, 2074.0, 1271.0, 799.0, 499.0, 311.0, 216.0, 135.0, 101.0, 58.0, 55.0, 32.0, 20.0, 17.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.31640625, -2.24176025390625, -2.1671142578125, -2.09246826171875, -2.017822265625, -1.94317626953125, -1.8685302734375, -1.79388427734375, -1.71923828125, -1.64459228515625, -1.5699462890625, -1.49530029296875, -1.420654296875, -1.34600830078125, -1.2713623046875, -1.19671630859375, -1.1220703125, -1.04742431640625, -0.9727783203125, -0.89813232421875, -0.823486328125, -0.74884033203125, -0.6741943359375, -0.59954833984375, -0.52490234375, -0.45025634765625, -0.3756103515625, -0.30096435546875, -0.226318359375, -0.15167236328125, -0.0770263671875, -0.00238037109375, 0.072265625, 0.14691162109375, 0.2215576171875, 0.29620361328125, 0.370849609375, 0.44549560546875, 0.5201416015625, 0.59478759765625, 0.66943359375, 0.74407958984375, 0.8187255859375, 0.89337158203125, 0.968017578125, 1.04266357421875, 1.1173095703125, 1.19195556640625, 1.2666015625, 1.34124755859375, 1.4158935546875, 1.49053955078125, 1.565185546875, 1.63983154296875, 1.7144775390625, 1.78912353515625, 1.86376953125, 1.93841552734375, 2.0130615234375, 2.08770751953125, 2.162353515625, 2.23699951171875, 2.3116455078125, 2.38629150390625, 2.4609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 14.0, 9.0, 10.0, 17.0, 6.0, 18.0, 25.0, 34.0, 29.0, 38.0, 25.0, 25.0, 37.0, 35.0, 77.0, 101.0, 178.0, 1412.0, 291.0, 168.0, 98.0, 60.0, 46.0, 32.0, 32.0, 34.0, 38.0, 35.0, 24.0, 16.0, 16.0, 11.0, 13.0, 11.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.328125, -5.160888671875, -4.99365234375, -4.826416015625, -4.6591796875, -4.491943359375, -4.32470703125, -4.157470703125, -3.990234375, -3.822998046875, -3.65576171875, -3.488525390625, -3.3212890625, -3.154052734375, -2.98681640625, -2.819580078125, -2.65234375, -2.485107421875, -2.31787109375, -2.150634765625, -1.9833984375, -1.816162109375, -1.64892578125, -1.481689453125, -1.314453125, -1.147216796875, -0.97998046875, -0.812744140625, -0.6455078125, -0.478271484375, -0.31103515625, -0.143798828125, 0.0234375, 0.190673828125, 0.35791015625, 0.525146484375, 0.6923828125, 0.859619140625, 1.02685546875, 1.194091796875, 1.361328125, 1.528564453125, 1.69580078125, 1.863037109375, 2.0302734375, 2.197509765625, 2.36474609375, 2.531982421875, 2.69921875, 2.866455078125, 3.03369140625, 3.200927734375, 3.3681640625, 3.535400390625, 3.70263671875, 3.869873046875, 4.037109375, 4.204345703125, 4.37158203125, 4.538818359375, 4.7060546875, 4.873291015625, 5.04052734375, 5.207763671875, 5.375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 13.0, 9.0, 11.0, 20.0, 23.0, 27.0, 30.0, 39.0, 40.0, 63.0, 96.0, 124.0, 193.0, 307.0, 576.0, 1048.0, 3109.0, 18052.0, 424485.0, 2612690.0, 73941.0, 7074.0, 1735.0, 756.0, 377.0, 243.0, 137.0, 107.0, 97.0, 57.0, 40.0, 26.0, 34.0, 26.0, 25.0, 13.0, 13.0, 13.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.4921875, -9.197998046875, -8.90380859375, -8.609619140625, -8.3154296875, -8.021240234375, -7.72705078125, -7.432861328125, -7.138671875, -6.844482421875, -6.55029296875, -6.256103515625, -5.9619140625, -5.667724609375, -5.37353515625, -5.079345703125, -4.78515625, -4.490966796875, -4.19677734375, -3.902587890625, -3.6083984375, -3.314208984375, -3.02001953125, -2.725830078125, -2.431640625, -2.137451171875, -1.84326171875, -1.549072265625, -1.2548828125, -0.960693359375, -0.66650390625, -0.372314453125, -0.078125, 0.216064453125, 0.51025390625, 0.804443359375, 1.0986328125, 1.392822265625, 1.68701171875, 1.981201171875, 2.275390625, 2.569580078125, 2.86376953125, 3.157958984375, 3.4521484375, 3.746337890625, 4.04052734375, 4.334716796875, 4.62890625, 4.923095703125, 5.21728515625, 5.511474609375, 5.8056640625, 6.099853515625, 6.39404296875, 6.688232421875, 6.982421875, 7.276611328125, 7.57080078125, 7.864990234375, 8.1591796875, 8.453369140625, 8.74755859375, 9.041748046875, 9.3359375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [2.0, 7.0, 120.0, 519.0, 333.0, 35.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.651029109954834, -4.908016204833984, -3.1650032997131348, -1.4219903945922852, 0.32102251052856445, 2.0640358924865723, 3.8070483207702637, 5.550060749053955, 7.293074131011963, 9.036087036132812, 10.77910041809082, 12.522112846374512, 14.265125274658203, 16.00813865661621, 17.75115203857422, 19.494163513183594, 21.2371768951416, 22.98019027709961, 24.723201751708984, 26.466215133666992, 28.209228515625, 29.952241897583008, 31.695255279541016, 33.43826675415039, 35.18128204345703, 36.924293518066406, 38.66730880737305, 40.41032028198242, 42.15333557128906, 43.89634704589844, 45.63935852050781, 47.38236999511719, 49.12538146972656, 50.86839294433594, 52.61140823364258, 54.35441970825195, 56.097434997558594, 57.84044647216797, 59.583457946777344, 61.32646942138672, 63.06948471069336, 64.8125, 66.55551147460938, 68.29852294921875, 70.04153442382812, 71.7845458984375, 73.5275650024414, 75.27057647705078, 77.01358795166016, 78.75659942626953, 80.4996109008789, 82.24263000488281, 83.98564147949219, 85.72865295410156, 87.47166442871094, 89.21467590332031, 90.95768737792969, 92.70069885253906, 94.44371032714844, 96.18672943115234, 97.92974090576172, 99.6727523803711, 101.41576385498047, 103.15877532958984, 104.90179443359375]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 6.0, 8.0, 6.0, 9.0, 12.0, 13.0, 14.0, 13.0, 19.0, 23.0, 26.0, 27.0, 36.0, 33.0, 38.0, 38.0, 38.0, 41.0, 42.0, 55.0, 45.0, 46.0, 42.0, 41.0, 36.0, 37.0, 40.0, 35.0, 36.0, 21.0, 23.0, 33.0, 8.0, 13.0, 6.0, 5.0, 4.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.230670928955078, -14.74410343170166, -14.257536888122559, -13.77096939086914, -13.284402847290039, -12.797835350036621, -12.311267852783203, -11.824701309204102, -11.338133811950684, -10.851566314697266, -10.364999771118164, -9.878432273864746, -9.391864776611328, -8.905298233032227, -8.418730735778809, -7.932163715362549, -7.445596694946289, -6.959029674530029, -6.4724626541137695, -5.985895156860352, -5.499328136444092, -5.012761116027832, -4.526193618774414, -4.039626598358154, -3.5530595779418945, -3.0664925575256348, -2.579925298690796, -2.093358039855957, -1.6067910194396973, -1.1202239990234375, -0.6336567401885986, -0.14708948135375977, 0.3394784927368164, 0.8260456323623657, 1.312612771987915, 1.7991799116134644, 2.2857470512390137, 2.7723140716552734, 3.2588813304901123, 3.745448589324951, 4.232015609741211, 4.718582630157471, 5.2051496505737305, 5.691717147827148, 6.178284168243408, 6.664851188659668, 7.151418685913086, 7.637985706329346, 8.124552726745605, 8.611120223999023, 9.097686767578125, 9.584254264831543, 10.070821762084961, 10.557388305664062, 11.04395580291748, 11.530523300170898, 12.01708984375, 12.503657341003418, 12.99022388458252, 13.476791381835938, 13.963357925415039, 14.449925422668457, 14.936492919921875, 15.423059463500977, 15.909626960754395]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 6.0, 7.0, 3.0, 9.0, 9.0, 9.0, 12.0, 17.0, 11.0, 14.0, 25.0, 15.0, 19.0, 22.0, 31.0, 25.0, 30.0, 35.0, 37.0, 43.0, 45.0, 43.0, 44.0, 55.0, 29.0, 42.0, 29.0, 34.0, 39.0, 30.0, 29.0, 22.0, 19.0, 23.0, 24.0, 19.0, 17.0, 20.0, 6.0, 12.0, 15.0, 10.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.72265625, -1.6666259765625, -1.610595703125, -1.5545654296875, -1.49853515625, -1.4425048828125, -1.386474609375, -1.3304443359375, -1.2744140625, -1.2183837890625, -1.162353515625, -1.1063232421875, -1.05029296875, -0.9942626953125, -0.938232421875, -0.8822021484375, -0.826171875, -0.7701416015625, -0.714111328125, -0.6580810546875, -0.60205078125, -0.5460205078125, -0.489990234375, -0.4339599609375, -0.3779296875, -0.3218994140625, -0.265869140625, -0.2098388671875, -0.15380859375, -0.0977783203125, -0.041748046875, 0.0142822265625, 0.0703125, 0.1263427734375, 0.182373046875, 0.2384033203125, 0.29443359375, 0.3504638671875, 0.406494140625, 0.4625244140625, 0.5185546875, 0.5745849609375, 0.630615234375, 0.6866455078125, 0.74267578125, 0.7987060546875, 0.854736328125, 0.9107666015625, 0.966796875, 1.0228271484375, 1.078857421875, 1.1348876953125, 1.19091796875, 1.2469482421875, 1.302978515625, 1.3590087890625, 1.4150390625, 1.4710693359375, 1.527099609375, 1.5831298828125, 1.63916015625, 1.6951904296875, 1.751220703125, 1.8072509765625, 1.86328125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 19.0, 20.0, 45.0, 54.0, 70.0, 133.0, 211.0, 311.0, 523.0, 995.0, 1757.0, 3263.0, 6292.0, 13418.0, 31193.0, 86719.0, 369187.0, 1909464.0, 1401798.0, 252754.0, 66828.0, 25618.0, 11599.0, 5543.0, 2836.0, 1483.0, 868.0, 452.0, 314.0, 163.0, 127.0, 61.0, 52.0, 24.0, 20.0, 20.0, 8.0, 6.0, 7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.802734375, -3.6937255859375, -3.584716796875, -3.4757080078125, -3.36669921875, -3.2576904296875, -3.148681640625, -3.0396728515625, -2.9306640625, -2.8216552734375, -2.712646484375, -2.6036376953125, -2.49462890625, -2.3856201171875, -2.276611328125, -2.1676025390625, -2.05859375, -1.9495849609375, -1.840576171875, -1.7315673828125, -1.62255859375, -1.5135498046875, -1.404541015625, -1.2955322265625, -1.1865234375, -1.0775146484375, -0.968505859375, -0.8594970703125, -0.75048828125, -0.6414794921875, -0.532470703125, -0.4234619140625, -0.314453125, -0.2054443359375, -0.096435546875, 0.0125732421875, 0.12158203125, 0.2305908203125, 0.339599609375, 0.4486083984375, 0.5576171875, 0.6666259765625, 0.775634765625, 0.8846435546875, 0.99365234375, 1.1026611328125, 1.211669921875, 1.3206787109375, 1.4296875, 1.5386962890625, 1.647705078125, 1.7567138671875, 1.86572265625, 1.9747314453125, 2.083740234375, 2.1927490234375, 2.3017578125, 2.4107666015625, 2.519775390625, 2.6287841796875, 2.73779296875, 2.8468017578125, 2.955810546875, 3.0648193359375, 3.173828125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 1.0, 8.0, 12.0, 7.0, 9.0, 13.0, 16.0, 24.0, 21.0, 38.0, 46.0, 50.0, 74.0, 105.0, 139.0, 173.0, 281.0, 396.0, 465.0, 510.0, 455.0, 320.0, 215.0, 153.0, 107.0, 88.0, 69.0, 50.0, 44.0, 26.0, 32.0, 23.0, 19.0, 14.0, 15.0, 19.0, 10.0, 2.0, 2.0, 7.0, 4.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.060546875, -2.971405029296875, -2.88226318359375, -2.793121337890625, -2.7039794921875, -2.614837646484375, -2.52569580078125, -2.436553955078125, -2.347412109375, -2.258270263671875, -2.16912841796875, -2.079986572265625, -1.9908447265625, -1.901702880859375, -1.81256103515625, -1.723419189453125, -1.63427734375, -1.545135498046875, -1.45599365234375, -1.366851806640625, -1.2777099609375, -1.188568115234375, -1.09942626953125, -1.010284423828125, -0.921142578125, -0.832000732421875, -0.74285888671875, -0.653717041015625, -0.5645751953125, -0.475433349609375, -0.38629150390625, -0.297149658203125, -0.2080078125, -0.118865966796875, -0.02972412109375, 0.059417724609375, 0.1485595703125, 0.237701416015625, 0.32684326171875, 0.415985107421875, 0.505126953125, 0.594268798828125, 0.68341064453125, 0.772552490234375, 0.8616943359375, 0.950836181640625, 1.03997802734375, 1.129119873046875, 1.21826171875, 1.307403564453125, 1.39654541015625, 1.485687255859375, 1.5748291015625, 1.663970947265625, 1.75311279296875, 1.842254638671875, 1.931396484375, 2.020538330078125, 2.10968017578125, 2.198822021484375, 2.2879638671875, 2.377105712890625, 2.46624755859375, 2.555389404296875, 2.64453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 7.0, 6.0, 1.0, 12.0, 16.0, 17.0, 12.0, 28.0, 18.0, 31.0, 41.0, 53.0, 59.0, 83.0, 109.0, 182.0, 353.0, 2250.0, 33288.0, 2104708.0, 2016927.0, 32756.0, 2247.0, 381.0, 203.0, 131.0, 83.0, 70.0, 51.0, 35.0, 21.0, 13.0, 24.0, 13.0, 11.0, 9.0, 7.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.2840576171875, -12.825927734375, -12.3677978515625, -11.90966796875, -11.4515380859375, -10.993408203125, -10.5352783203125, -10.0771484375, -9.6190185546875, -9.160888671875, -8.7027587890625, -8.24462890625, -7.7864990234375, -7.328369140625, -6.8702392578125, -6.412109375, -5.9539794921875, -5.495849609375, -5.0377197265625, -4.57958984375, -4.1214599609375, -3.663330078125, -3.2052001953125, -2.7470703125, -2.2889404296875, -1.830810546875, -1.3726806640625, -0.91455078125, -0.4564208984375, 0.001708984375, 0.4598388671875, 0.91796875, 1.3760986328125, 1.834228515625, 2.2923583984375, 2.75048828125, 3.2086181640625, 3.666748046875, 4.1248779296875, 4.5830078125, 5.0411376953125, 5.499267578125, 5.9573974609375, 6.41552734375, 6.8736572265625, 7.331787109375, 7.7899169921875, 8.248046875, 8.7061767578125, 9.164306640625, 9.6224365234375, 10.08056640625, 10.5386962890625, 10.996826171875, 11.4549560546875, 11.9130859375, 12.3712158203125, 12.829345703125, 13.2874755859375, 13.74560546875, 14.2037353515625, 14.661865234375, 15.1199951171875, 15.578125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 16.0, 42.0, 79.0, 132.0, 207.0, 199.0, 147.0, 94.0, 51.0, 25.0, 9.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.470516204833984, -11.527605056762695, -10.584693908691406, -9.6417818069458, -8.698870658874512, -7.755959510803223, -6.813047885894775, -5.870136260986328, -4.927225112915039, -3.984313726425171, -3.0414023399353027, -2.0984909534454346, -1.1555795669555664, -0.21266841888427734, 0.7302432060241699, 1.6731548309326172, 2.6160659790039062, 3.5589773654937744, 4.501888751983643, 5.44480037689209, 6.387711524963379, 7.330622673034668, 8.273534774780273, 9.216445922851562, 10.159357070922852, 11.10226821899414, 12.04517936706543, 12.988091468811035, 13.931002616882324, 14.873913764953613, 15.816825866699219, 16.759737014770508, 17.702648162841797, 18.645559310913086, 19.588470458984375, 20.531381607055664, 21.474292755126953, 22.417205810546875, 23.360116958618164, 24.303028106689453, 25.245939254760742, 26.18885040283203, 27.13176155090332, 28.07467269897461, 29.01758575439453, 29.960494995117188, 30.90340805053711, 31.8463191986084, 32.78923034667969, 33.73214340209961, 34.675052642822266, 35.61796569824219, 36.560874938964844, 37.503787994384766, 38.44669723510742, 39.389610290527344, 40.33251953125, 41.27543258666992, 42.21834182739258, 43.1612548828125, 44.104164123535156, 45.04707717895508, 45.989986419677734, 46.932899475097656, 47.87581253051758]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 5.0, 5.0, 8.0, 9.0, 8.0, 14.0, 7.0, 17.0, 17.0, 24.0, 18.0, 18.0, 42.0, 40.0, 35.0, 55.0, 43.0, 43.0, 39.0, 36.0, 46.0, 44.0, 47.0, 42.0, 39.0, 42.0, 36.0, 37.0, 34.0, 23.0, 13.0, 20.0, 13.0, 16.0, 12.0, 13.0, 15.0, 8.0, 10.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.769462585449219, -10.439175605773926, -10.108887672424316, -9.778600692749023, -9.448312759399414, -9.118025779724121, -8.787737846374512, -8.457450866699219, -8.12716293334961, -7.796875476837158, -7.466588020324707, -7.136300563812256, -6.806013107299805, -6.475726127624512, -6.1454386711120605, -5.815151214599609, -5.484864234924316, -5.154576778411865, -4.824289321899414, -4.494001865386963, -4.163714408874512, -3.8334271907806396, -3.5031399726867676, -3.1728525161743164, -2.8425650596618652, -2.512277603149414, -2.181990146636963, -1.8517029285430908, -1.5214154720306396, -1.1911280155181885, -0.8608406782150269, -0.5305533409118652, -0.20026683807373047, 0.13002055883407593, 0.4603079557418823, 0.7905953526496887, 1.1208827495574951, 1.4511702060699463, 1.781457543373108, 2.1117448806762695, 2.4420323371887207, 2.772319793701172, 3.102607250213623, 3.432894468307495, 3.7631819248199463, 4.093469619750977, 4.4237565994262695, 4.754044055938721, 5.084331512451172, 5.414618968963623, 5.744906425476074, 6.075193881988525, 6.405481338500977, 6.7357683181762695, 7.066055774688721, 7.396343231201172, 7.726630687713623, 8.056918144226074, 8.387205123901367, 8.717493057250977, 9.04778003692627, 9.378067970275879, 9.708354949951172, 10.038642883300781, 10.368929862976074]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 6.0, 6.0, 8.0, 15.0, 7.0, 8.0, 13.0, 21.0, 21.0, 21.0, 25.0, 23.0, 39.0, 38.0, 31.0, 36.0, 47.0, 32.0, 41.0, 45.0, 30.0, 41.0, 39.0, 37.0, 30.0, 35.0, 41.0, 26.0, 27.0, 24.0, 14.0, 27.0, 25.0, 27.0, 22.0, 8.0, 12.0, 13.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.744140625, -1.690185546875, -1.63623046875, -1.582275390625, -1.5283203125, -1.474365234375, -1.42041015625, -1.366455078125, -1.3125, -1.258544921875, -1.20458984375, -1.150634765625, -1.0966796875, -1.042724609375, -0.98876953125, -0.934814453125, -0.880859375, -0.826904296875, -0.77294921875, -0.718994140625, -0.6650390625, -0.611083984375, -0.55712890625, -0.503173828125, -0.44921875, -0.395263671875, -0.34130859375, -0.287353515625, -0.2333984375, -0.179443359375, -0.12548828125, -0.071533203125, -0.017578125, 0.036376953125, 0.09033203125, 0.144287109375, 0.1982421875, 0.252197265625, 0.30615234375, 0.360107421875, 0.4140625, 0.468017578125, 0.52197265625, 0.575927734375, 0.6298828125, 0.683837890625, 0.73779296875, 0.791748046875, 0.845703125, 0.899658203125, 0.95361328125, 1.007568359375, 1.0615234375, 1.115478515625, 1.16943359375, 1.223388671875, 1.27734375, 1.331298828125, 1.38525390625, 1.439208984375, 1.4931640625, 1.547119140625, 1.60107421875, 1.655029296875, 1.708984375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 10.0, 8.0, 16.0, 23.0, 34.0, 48.0, 61.0, 89.0, 132.0, 224.0, 323.0, 438.0, 704.0, 923.0, 1389.0, 2120.0, 3118.0, 4636.0, 6974.0, 10230.0, 15201.0, 22774.0, 34378.0, 52215.0, 79451.0, 117475.0, 153626.0, 158930.0, 126089.0, 86722.0, 57245.0, 37492.0, 24843.0, 16688.0, 10882.0, 7448.0, 5075.0, 3358.0, 2326.0, 1522.0, 1092.0, 705.0, 468.0, 333.0, 210.0, 166.0, 101.0, 89.0, 50.0, 24.0, 31.0, 20.0, 13.0, 10.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1495361328125, -0.14487838745117188, -0.14022064208984375, -0.13556289672851562, -0.1309051513671875, -0.12624740600585938, -0.12158966064453125, -0.11693191528320312, -0.112274169921875, -0.10761642456054688, -0.10295867919921875, -0.09830093383789062, -0.0936431884765625, -0.08898544311523438, -0.08432769775390625, -0.07966995239257812, -0.07501220703125, -0.07035446166992188, -0.06569671630859375, -0.061038970947265625, -0.0563812255859375, -0.051723480224609375, -0.04706573486328125, -0.042407989501953125, -0.037750244140625, -0.033092498779296875, -0.02843475341796875, -0.023777008056640625, -0.0191192626953125, -0.014461517333984375, -0.00980377197265625, -0.005146026611328125, -0.00048828125, 0.004169464111328125, 0.00882720947265625, 0.013484954833984375, 0.0181427001953125, 0.022800445556640625, 0.02745819091796875, 0.032115936279296875, 0.036773681640625, 0.041431427001953125, 0.04608917236328125, 0.050746917724609375, 0.0554046630859375, 0.060062408447265625, 0.06472015380859375, 0.06937789916992188, 0.07403564453125, 0.07869338989257812, 0.08335113525390625, 0.08800888061523438, 0.0926666259765625, 0.09732437133789062, 0.10198211669921875, 0.10663986206054688, 0.111297607421875, 0.11595535278320312, 0.12061309814453125, 0.12527084350585938, 0.1299285888671875, 0.13458633422851562, 0.13924407958984375, 0.14390182495117188, 0.1485595703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 10.0, 11.0, 5.0, 12.0, 14.0, 15.0, 18.0, 16.0, 24.0, 20.0, 32.0, 24.0, 28.0, 32.0, 42.0, 35.0, 47.0, 38.0, 47.0, 44.0, 1060.0, 45.0, 42.0, 29.0, 26.0, 38.0, 41.0, 34.0, 15.0, 16.0, 20.0, 17.0, 18.0, 25.0, 14.0, 14.0, 13.0, 13.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0543060302734375, -1.016815185546875, -0.9793243408203125, -0.94183349609375, -0.9043426513671875, -0.866851806640625, -0.8293609619140625, -0.7918701171875, -0.7543792724609375, -0.716888427734375, -0.6793975830078125, -0.64190673828125, -0.6044158935546875, -0.566925048828125, -0.5294342041015625, -0.491943359375, -0.4544525146484375, -0.416961669921875, -0.3794708251953125, -0.34197998046875, -0.3044891357421875, -0.266998291015625, -0.2295074462890625, -0.1920166015625, -0.1545257568359375, -0.117034912109375, -0.0795440673828125, -0.04205322265625, -0.0045623779296875, 0.032928466796875, 0.0704193115234375, 0.10791015625, 0.1454010009765625, 0.182891845703125, 0.2203826904296875, 0.25787353515625, 0.2953643798828125, 0.332855224609375, 0.3703460693359375, 0.4078369140625, 0.4453277587890625, 0.482818603515625, 0.5203094482421875, 0.55780029296875, 0.5952911376953125, 0.632781982421875, 0.6702728271484375, 0.707763671875, 0.7452545166015625, 0.782745361328125, 0.8202362060546875, 0.85772705078125, 0.8952178955078125, 0.932708740234375, 0.9701995849609375, 1.0076904296875, 1.0451812744140625, 1.082672119140625, 1.1201629638671875, 1.15765380859375, 1.1951446533203125, 1.232635498046875, 1.2701263427734375, 1.3076171875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 12.0, 14.0, 23.0, 43.0, 65.0, 80.0, 127.0, 197.0, 367.0, 687.0, 1164.0, 2456.0, 4679.0, 9758.0, 21061.0, 70410.0, 1806528.0, 129761.0, 26138.0, 11652.0, 5715.0, 2805.0, 1432.0, 821.0, 410.0, 251.0, 167.0, 85.0, 57.0, 42.0, 31.0, 30.0, 7.0, 12.0, 8.0, 6.0, 0.0, 8.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370849609375, -0.35912322998046875, -0.3473968505859375, -0.33567047119140625, -0.323944091796875, -0.31221771240234375, -0.3004913330078125, -0.28876495361328125, -0.27703857421875, -0.26531219482421875, -0.2535858154296875, -0.24185943603515625, -0.230133056640625, -0.21840667724609375, -0.2066802978515625, -0.19495391845703125, -0.1832275390625, -0.17150115966796875, -0.1597747802734375, -0.14804840087890625, -0.136322021484375, -0.12459564208984375, -0.1128692626953125, -0.10114288330078125, -0.08941650390625, -0.07769012451171875, -0.0659637451171875, -0.05423736572265625, -0.042510986328125, -0.03078460693359375, -0.0190582275390625, -0.00733184814453125, 0.00439453125, 0.01612091064453125, 0.0278472900390625, 0.03957366943359375, 0.051300048828125, 0.06302642822265625, 0.0747528076171875, 0.08647918701171875, 0.09820556640625, 0.10993194580078125, 0.1216583251953125, 0.13338470458984375, 0.145111083984375, 0.15683746337890625, 0.1685638427734375, 0.18029022216796875, 0.1920166015625, 0.20374298095703125, 0.2154693603515625, 0.22719573974609375, 0.238922119140625, 0.25064849853515625, 0.2623748779296875, 0.27410125732421875, 0.28582763671875, 0.29755401611328125, 0.3092803955078125, 0.32100677490234375, 0.332733154296875, 0.34445953369140625, 0.3561859130859375, 0.36791229248046875, 0.379638671875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 10.0, 6.0, 11.0, 13.0, 21.0, 21.0, 16.0, 39.0, 37.0, 34.0, 52.0, 55.0, 55.0, 53.0, 58.0, 65.0, 47.0, 59.0, 45.0, 53.0, 34.0, 25.0, 26.0, 23.0, 20.0, 20.0, 13.0, 9.0, 10.0, 11.0, 6.0, 4.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00753021240234375, -0.007203340530395508, -0.006876468658447266, -0.0065495967864990234, -0.006222724914550781, -0.005895853042602539, -0.005568981170654297, -0.005242109298706055, -0.0049152374267578125, -0.00458836555480957, -0.004261493682861328, -0.003934621810913086, -0.0036077499389648438, -0.0032808780670166016, -0.0029540061950683594, -0.002627134323120117, -0.002300262451171875, -0.001973390579223633, -0.0016465187072753906, -0.0013196468353271484, -0.0009927749633789062, -0.0006659030914306641, -0.0003390312194824219, -1.2159347534179688e-05, 0.0003147125244140625, 0.0006415843963623047, 0.0009684562683105469, 0.001295328140258789, 0.0016222000122070312, 0.0019490718841552734, 0.0022759437561035156, 0.002602815628051758, 0.0029296875, 0.003256559371948242, 0.0035834312438964844, 0.0039103031158447266, 0.004237174987792969, 0.004564046859741211, 0.004890918731689453, 0.005217790603637695, 0.0055446624755859375, 0.00587153434753418, 0.006198406219482422, 0.006525278091430664, 0.006852149963378906, 0.0071790218353271484, 0.007505893707275391, 0.007832765579223633, 0.008159637451171875, 0.008486509323120117, 0.00881338119506836, 0.009140253067016602, 0.009467124938964844, 0.009793996810913086, 0.010120868682861328, 0.01044774055480957, 0.010774612426757812, 0.011101484298706055, 0.011428356170654297, 0.011755228042602539, 0.012082099914550781, 0.012408971786499023, 0.012735843658447266, 0.013062715530395508, 0.01338958740234375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 11.0, 5.0, 13.0, 9.0, 9.0, 21.0, 25.0, 21.0, 27.0, 48.0, 46.0, 91.0, 145.0, 288.0, 664.0, 7793.0, 531603.0, 498909.0, 7392.0, 662.0, 255.0, 142.0, 94.0, 67.0, 53.0, 34.0, 21.0, 28.0, 11.0, 9.0, 9.0, 12.0, 8.0, 9.0, 1.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.2666015625, -0.2600975036621094, -0.25359344482421875, -0.24708938598632812, -0.2405853271484375, -0.23408126831054688, -0.22757720947265625, -0.22107315063476562, -0.214569091796875, -0.20806503295898438, -0.20156097412109375, -0.19505691528320312, -0.1885528564453125, -0.18204879760742188, -0.17554473876953125, -0.16904067993164062, -0.16253662109375, -0.15603256225585938, -0.14952850341796875, -0.14302444458007812, -0.1365203857421875, -0.13001632690429688, -0.12351226806640625, -0.11700820922851562, -0.110504150390625, -0.10400009155273438, -0.09749603271484375, -0.09099197387695312, -0.0844879150390625, -0.07798385620117188, -0.07147979736328125, -0.06497573852539062, -0.0584716796875, -0.051967620849609375, -0.04546356201171875, -0.038959503173828125, -0.0324554443359375, -0.025951385498046875, -0.01944732666015625, -0.012943267822265625, -0.006439208984375, 6.4849853515625e-05, 0.00656890869140625, 0.013072967529296875, 0.0195770263671875, 0.026081085205078125, 0.03258514404296875, 0.039089202880859375, 0.04559326171875, 0.052097320556640625, 0.05860137939453125, 0.06510543823242188, 0.0716094970703125, 0.07811355590820312, 0.08461761474609375, 0.09112167358398438, 0.097625732421875, 0.10412979125976562, 0.11063385009765625, 0.11713790893554688, 0.1236419677734375, 0.13014602661132812, 0.13665008544921875, 0.14315414428710938, 0.149658203125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 11.0, 38.0, 171.0, 406.0, 247.0, 89.0, 29.0, 12.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01768149994313717, -0.014589086174964905, -0.01149667240679264, -0.008404258638620377, -0.0053118448704481125, -0.0022194311022758484, 0.0008729826658964157, 0.00396539643406868, 0.007057810202240944, 0.010150223970413208, 0.013242637738585472, 0.016335051506757736, 0.01942746527493, 0.022519879043102264, 0.02561229281127453, 0.028704706579446793, 0.03179711848497391, 0.03488953411579132, 0.037981946021318436, 0.04107435792684555, 0.044166773557662964, 0.04725918918848038, 0.05035160109400749, 0.05344401299953461, 0.05653642863035202, 0.059628844261169434, 0.06272125244140625, 0.06581366807222366, 0.06890608370304108, 0.07199849933385849, 0.0750909149646759, 0.07818332314491272, 0.08127574622631073, 0.08436816185712814, 0.08746057748794556, 0.09055298566818237, 0.09364540129899979, 0.0967378169298172, 0.09983022511005402, 0.10292264074087143, 0.10601505637168884, 0.10910747200250626, 0.11219988763332367, 0.11529229581356049, 0.1183847114443779, 0.12147712707519531, 0.12456953525543213, 0.12766195833683014, 0.13075436651706696, 0.13384677469730377, 0.13693919777870178, 0.1400316059589386, 0.14312401413917542, 0.14621643722057343, 0.14930884540081024, 0.15240126848220825, 0.15549367666244507, 0.15858608484268188, 0.1616785079240799, 0.1647709161043167, 0.16786333918571472, 0.17095574736595154, 0.17404815554618835, 0.17714057862758636, 0.18023298680782318]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 6.0, 13.0, 15.0, 13.0, 16.0, 15.0, 20.0, 29.0, 24.0, 27.0, 29.0, 37.0, 33.0, 46.0, 40.0, 36.0, 43.0, 45.0, 37.0, 32.0, 50.0, 40.0, 39.0, 28.0, 29.0, 28.0, 40.0, 32.0, 25.0, 19.0, 18.0, 16.0, 17.0, 12.0, 7.0, 9.0, 5.0, 6.0, 6.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009915947914123535, -0.009606151841580868, -0.0092963557690382, -0.008986559696495533, -0.008676763623952866, -0.008366967551410198, -0.00805717147886753, -0.0077473754063248634, -0.007437579333782196, -0.007127783261239529, -0.006817987188696861, -0.006508191116154194, -0.0061983950436115265, -0.005888598971068859, -0.005578802898526192, -0.005269006825983524, -0.004959210753440857, -0.0046494146808981895, -0.004339618608355522, -0.004029822535812855, -0.0037200264632701874, -0.00341023039072752, -0.0031004343181848526, -0.002790638245642185, -0.002480842173099518, -0.0021710461005568504, -0.001861250028014183, -0.0015514539554715157, -0.0012416578829288483, -0.0009318618103861809, -0.0006220657378435135, -0.0003122696653008461, -2.473592758178711e-06, 0.0003073224797844887, 0.0006171185523271561, 0.0009269146248698235, 0.0012367106974124908, 0.0015465067699551582, 0.0018563028424978256, 0.002166098915040493, 0.0024758949875831604, 0.002785691060125828, 0.003095487132668495, 0.0034052832052111626, 0.00371507927775383, 0.004024875350296497, 0.004334671422839165, 0.004644467495381832, 0.0049542635679244995, 0.005264059640467167, 0.005573855713009834, 0.005883651785552502, 0.006193447858095169, 0.0065032439306378365, 0.006813040003180504, 0.007122836075723171, 0.007432632148265839, 0.007742428220808506, 0.008052224293351173, 0.00836202036589384, 0.008671816438436508, 0.008981612510979176, 0.009291408583521843, 0.00960120465606451, 0.009911000728607178]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 6.0, 6.0, 8.0, 15.0, 7.0, 8.0, 13.0, 21.0, 21.0, 21.0, 25.0, 23.0, 39.0, 38.0, 31.0, 36.0, 47.0, 31.0, 42.0, 46.0, 29.0, 42.0, 37.0, 38.0, 31.0, 33.0, 41.0, 27.0, 27.0, 24.0, 14.0, 27.0, 25.0, 27.0, 23.0, 7.0, 12.0, 12.0, 11.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.744140625, -1.690185546875, -1.63623046875, -1.582275390625, -1.5283203125, -1.474365234375, -1.42041015625, -1.366455078125, -1.3125, -1.258544921875, -1.20458984375, -1.150634765625, -1.0966796875, -1.042724609375, -0.98876953125, -0.934814453125, -0.880859375, -0.826904296875, -0.77294921875, -0.718994140625, -0.6650390625, -0.611083984375, -0.55712890625, -0.503173828125, -0.44921875, -0.395263671875, -0.34130859375, -0.287353515625, -0.2333984375, -0.179443359375, -0.12548828125, -0.071533203125, -0.017578125, 0.036376953125, 0.09033203125, 0.144287109375, 0.1982421875, 0.252197265625, 0.30615234375, 0.360107421875, 0.4140625, 0.468017578125, 0.52197265625, 0.575927734375, 0.6298828125, 0.683837890625, 0.73779296875, 0.791748046875, 0.845703125, 0.899658203125, 0.95361328125, 1.007568359375, 1.0615234375, 1.115478515625, 1.16943359375, 1.223388671875, 1.27734375, 1.331298828125, 1.38525390625, 1.439208984375, 1.4931640625, 1.547119140625, 1.60107421875, 1.655029296875, 1.708984375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 15.0, 19.0, 11.0, 35.0, 41.0, 78.0, 120.0, 179.0, 282.0, 499.0, 916.0, 1526.0, 2787.0, 5159.0, 10269.0, 21441.0, 50359.0, 154443.0, 507581.0, 187336.0, 57589.0, 23811.0, 11380.0, 5611.0, 2963.0, 1748.0, 954.0, 527.0, 340.0, 195.0, 124.0, 60.0, 55.0, 38.0, 28.0, 7.0, 11.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1015625, -3.0118408203125, -2.922119140625, -2.8323974609375, -2.74267578125, -2.6529541015625, -2.563232421875, -2.4735107421875, -2.3837890625, -2.2940673828125, -2.204345703125, -2.1146240234375, -2.02490234375, -1.9351806640625, -1.845458984375, -1.7557373046875, -1.666015625, -1.5762939453125, -1.486572265625, -1.3968505859375, -1.30712890625, -1.2174072265625, -1.127685546875, -1.0379638671875, -0.9482421875, -0.8585205078125, -0.768798828125, -0.6790771484375, -0.58935546875, -0.4996337890625, -0.409912109375, -0.3201904296875, -0.23046875, -0.1407470703125, -0.051025390625, 0.0386962890625, 0.12841796875, 0.2181396484375, 0.307861328125, 0.3975830078125, 0.4873046875, 0.5770263671875, 0.666748046875, 0.7564697265625, 0.84619140625, 0.9359130859375, 1.025634765625, 1.1153564453125, 1.205078125, 1.2947998046875, 1.384521484375, 1.4742431640625, 1.56396484375, 1.6536865234375, 1.743408203125, 1.8331298828125, 1.9228515625, 2.0125732421875, 2.102294921875, 2.1920166015625, 2.28173828125, 2.3714599609375, 2.461181640625, 2.5509033203125, 2.640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 0.0, 7.0, 2.0, 4.0, 4.0, 15.0, 18.0, 12.0, 20.0, 16.0, 18.0, 25.0, 26.0, 40.0, 50.0, 51.0, 53.0, 86.0, 103.0, 265.0, 1460.0, 244.0, 106.0, 80.0, 53.0, 51.0, 33.0, 31.0, 27.0, 26.0, 23.0, 15.0, 20.0, 19.0, 15.0, 8.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.703125, -5.515625, -5.328125, -5.140625, -4.953125, -4.765625, -4.578125, -4.390625, -4.203125, -4.015625, -3.828125, -3.640625, -3.453125, -3.265625, -3.078125, -2.890625, -2.703125, -2.515625, -2.328125, -2.140625, -1.953125, -1.765625, -1.578125, -1.390625, -1.203125, -1.015625, -0.828125, -0.640625, -0.453125, -0.265625, -0.078125, 0.109375, 0.296875, 0.484375, 0.671875, 0.859375, 1.046875, 1.234375, 1.421875, 1.609375, 1.796875, 1.984375, 2.171875, 2.359375, 2.546875, 2.734375, 2.921875, 3.109375, 3.296875, 3.484375, 3.671875, 3.859375, 4.046875, 4.234375, 4.421875, 4.609375, 4.796875, 4.984375, 5.171875, 5.359375, 5.546875, 5.734375, 5.921875, 6.109375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 2.0, 14.0, 15.0, 21.0, 19.0, 30.0, 27.0, 31.0, 58.0, 69.0, 122.0, 200.0, 361.0, 1700.0, 21935.0, 2527905.0, 581021.0, 10165.0, 1122.0, 320.0, 164.0, 96.0, 77.0, 52.0, 25.0, 29.0, 21.0, 17.0, 19.0, 11.0, 13.0, 11.0, 7.0, 4.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.5625, -14.1195068359375, -13.676513671875, -13.2335205078125, -12.79052734375, -12.3475341796875, -11.904541015625, -11.4615478515625, -11.0185546875, -10.5755615234375, -10.132568359375, -9.6895751953125, -9.24658203125, -8.8035888671875, -8.360595703125, -7.9176025390625, -7.474609375, -7.0316162109375, -6.588623046875, -6.1456298828125, -5.70263671875, -5.2596435546875, -4.816650390625, -4.3736572265625, -3.9306640625, -3.4876708984375, -3.044677734375, -2.6016845703125, -2.15869140625, -1.7156982421875, -1.272705078125, -0.8297119140625, -0.38671875, 0.0562744140625, 0.499267578125, 0.9422607421875, 1.38525390625, 1.8282470703125, 2.271240234375, 2.7142333984375, 3.1572265625, 3.6002197265625, 4.043212890625, 4.4862060546875, 4.92919921875, 5.3721923828125, 5.815185546875, 6.2581787109375, 6.701171875, 7.1441650390625, 7.587158203125, 8.0301513671875, 8.47314453125, 8.9161376953125, 9.359130859375, 9.8021240234375, 10.2451171875, 10.6881103515625, 11.131103515625, 11.5740966796875, 12.01708984375, 12.4600830078125, 12.903076171875, 13.3460693359375, 13.7890625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 17.0, 178.0, 447.0, 299.0, 60.0, 9.0, 1.0], "bins": [-77.63846588134766, -76.33688354492188, -75.03530883789062, -73.73372650146484, -72.4321517944336, -71.13056945800781, -69.82899475097656, -68.52741241455078, -67.22583770751953, -65.92425537109375, -64.6226806640625, -63.321102142333984, -62.01952362060547, -60.71794509887695, -59.41636657714844, -58.11478805541992, -56.813209533691406, -55.51163101196289, -54.210052490234375, -52.90847396850586, -51.606895446777344, -50.30531692504883, -49.00373840332031, -47.7021598815918, -46.400577545166016, -45.0989990234375, -43.797420501708984, -42.49584197998047, -41.19426345825195, -39.89268493652344, -38.59110641479492, -37.289527893066406, -35.987953186035156, -34.68637466430664, -33.384796142578125, -32.08321762084961, -30.781639099121094, -29.480060577392578, -28.178482055664062, -26.876903533935547, -25.5753231048584, -24.273744583129883, -22.972166061401367, -21.67058753967285, -20.369009017944336, -19.06743049621582, -17.765850067138672, -16.464271545410156, -15.162694931030273, -13.861116409301758, -12.559537887573242, -11.257959365844727, -9.956380844116211, -8.654802322387695, -7.353222846984863, -6.051644325256348, -4.750065326690674, -3.448486804962158, -2.1469080448150635, -0.8453292846679688, 0.4562492370605469, 1.7578277587890625, 3.0594067573547363, 4.360985279083252, 5.662563800811768]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 5.0, 6.0, 6.0, 8.0, 11.0, 18.0, 18.0, 20.0, 25.0, 22.0, 31.0, 50.0, 40.0, 39.0, 42.0, 48.0, 38.0, 44.0, 45.0, 65.0, 38.0, 42.0, 38.0, 38.0, 42.0, 31.0, 36.0, 31.0, 25.0, 26.0, 6.0, 15.0, 12.0, 8.0, 11.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.133684158325195, -18.570449829101562, -18.00721549987793, -17.44398307800293, -16.880748748779297, -16.317514419555664, -15.754280090332031, -15.191045761108398, -14.627812385559082, -14.06457805633545, -13.501344680786133, -12.9381103515625, -12.374876022338867, -11.81164264678955, -11.248408317565918, -10.685174942016602, -10.121940612792969, -9.558706283569336, -8.99547290802002, -8.432238578796387, -7.869004726409912, -7.3057708740234375, -6.742536544799805, -6.17930269241333, -5.6160688400268555, -5.052834987640381, -4.489601135253906, -3.9263668060302734, -3.363132953643799, -2.799899101257324, -2.2366650104522705, -1.6734309196472168, -1.110198974609375, -0.5469650030136108, 0.01626896858215332, 0.5795029401779175, 1.1427369117736816, 1.7059707641601562, 2.26920485496521, 2.8324389457702637, 3.3956727981567383, 3.958906650543213, 4.5221405029296875, 5.08537483215332, 5.648608684539795, 6.2118425369262695, 6.775076866149902, 7.338310718536377, 7.901544570922852, 8.464778900146484, 9.0280122756958, 9.591246604919434, 10.15447998046875, 10.717714309692383, 11.280948638916016, 11.844182968139648, 12.407416343688965, 12.970650672912598, 13.533884048461914, 14.097118377685547, 14.66035270690918, 15.223586082458496, 15.786820411682129, 16.350053787231445, 16.913288116455078]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 5.0, 4.0, 9.0, 6.0, 8.0, 14.0, 12.0, 15.0, 7.0, 18.0, 22.0, 21.0, 29.0, 23.0, 28.0, 32.0, 35.0, 48.0, 49.0, 39.0, 32.0, 39.0, 37.0, 37.0, 24.0, 35.0, 39.0, 32.0, 32.0, 37.0, 24.0, 30.0, 25.0, 18.0, 15.0, 23.0, 20.0, 14.0, 15.0, 9.0, 5.0, 9.0, 6.0, 4.0, 9.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7607421875, -1.704376220703125, -1.64801025390625, -1.591644287109375, -1.5352783203125, -1.478912353515625, -1.42254638671875, -1.366180419921875, -1.309814453125, -1.253448486328125, -1.19708251953125, -1.140716552734375, -1.0843505859375, -1.027984619140625, -0.97161865234375, -0.915252685546875, -0.85888671875, -0.802520751953125, -0.74615478515625, -0.689788818359375, -0.6334228515625, -0.577056884765625, -0.52069091796875, -0.464324951171875, -0.407958984375, -0.351593017578125, -0.29522705078125, -0.238861083984375, -0.1824951171875, -0.126129150390625, -0.06976318359375, -0.013397216796875, 0.04296875, 0.099334716796875, 0.15570068359375, 0.212066650390625, 0.2684326171875, 0.324798583984375, 0.38116455078125, 0.437530517578125, 0.493896484375, 0.550262451171875, 0.60662841796875, 0.662994384765625, 0.7193603515625, 0.775726318359375, 0.83209228515625, 0.888458251953125, 0.94482421875, 1.001190185546875, 1.05755615234375, 1.113922119140625, 1.1702880859375, 1.226654052734375, 1.28302001953125, 1.339385986328125, 1.395751953125, 1.452117919921875, 1.50848388671875, 1.564849853515625, 1.6212158203125, 1.677581787109375, 1.73394775390625, 1.790313720703125, 1.8466796875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 13.0, 11.0, 22.0, 36.0, 58.0, 87.0, 161.0, 218.0, 373.0, 586.0, 1106.0, 1966.0, 3740.0, 8110.0, 16978.0, 41443.0, 119299.0, 474742.0, 1824234.0, 1276869.0, 285399.0, 81740.0, 30473.0, 13306.0, 6193.0, 3096.0, 1662.0, 950.0, 517.0, 328.0, 213.0, 123.0, 83.0, 53.0, 32.0, 16.0, 16.0, 11.0, 11.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.783203125, -3.674591064453125, -3.56597900390625, -3.457366943359375, -3.3487548828125, -3.240142822265625, -3.13153076171875, -3.022918701171875, -2.914306640625, -2.805694580078125, -2.69708251953125, -2.588470458984375, -2.4798583984375, -2.371246337890625, -2.26263427734375, -2.154022216796875, -2.04541015625, -1.936798095703125, -1.82818603515625, -1.719573974609375, -1.6109619140625, -1.502349853515625, -1.39373779296875, -1.285125732421875, -1.176513671875, -1.067901611328125, -0.95928955078125, -0.850677490234375, -0.7420654296875, -0.633453369140625, -0.52484130859375, -0.416229248046875, -0.3076171875, -0.199005126953125, -0.09039306640625, 0.018218994140625, 0.1268310546875, 0.235443115234375, 0.34405517578125, 0.452667236328125, 0.561279296875, 0.669891357421875, 0.77850341796875, 0.887115478515625, 0.9957275390625, 1.104339599609375, 1.21295166015625, 1.321563720703125, 1.43017578125, 1.538787841796875, 1.64739990234375, 1.756011962890625, 1.8646240234375, 1.973236083984375, 2.08184814453125, 2.190460205078125, 2.299072265625, 2.407684326171875, 2.51629638671875, 2.624908447265625, 2.7335205078125, 2.842132568359375, 2.95074462890625, 3.059356689453125, 3.16796875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 10.0, 6.0, 7.0, 14.0, 21.0, 18.0, 21.0, 30.0, 62.0, 54.0, 80.0, 109.0, 155.0, 152.0, 235.0, 287.0, 368.0, 472.0, 462.0, 400.0, 278.0, 182.0, 158.0, 127.0, 92.0, 57.0, 49.0, 33.0, 27.0, 24.0, 14.0, 16.0, 8.0, 11.0, 13.0, 9.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.25, -3.14801025390625, -3.0460205078125, -2.94403076171875, -2.842041015625, -2.74005126953125, -2.6380615234375, -2.53607177734375, -2.43408203125, -2.33209228515625, -2.2301025390625, -2.12811279296875, -2.026123046875, -1.92413330078125, -1.8221435546875, -1.72015380859375, -1.6181640625, -1.51617431640625, -1.4141845703125, -1.31219482421875, -1.210205078125, -1.10821533203125, -1.0062255859375, -0.90423583984375, -0.80224609375, -0.70025634765625, -0.5982666015625, -0.49627685546875, -0.394287109375, -0.29229736328125, -0.1903076171875, -0.08831787109375, 0.013671875, 0.11566162109375, 0.2176513671875, 0.31964111328125, 0.421630859375, 0.52362060546875, 0.6256103515625, 0.72760009765625, 0.82958984375, 0.93157958984375, 1.0335693359375, 1.13555908203125, 1.237548828125, 1.33953857421875, 1.4415283203125, 1.54351806640625, 1.6455078125, 1.74749755859375, 1.8494873046875, 1.95147705078125, 2.053466796875, 2.15545654296875, 2.2574462890625, 2.35943603515625, 2.46142578125, 2.56341552734375, 2.6654052734375, 2.76739501953125, 2.869384765625, 2.97137451171875, 3.0733642578125, 3.17535400390625, 3.27734375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 10.0, 4.0, 10.0, 9.0, 14.0, 17.0, 19.0, 25.0, 31.0, 45.0, 57.0, 73.0, 130.0, 190.0, 354.0, 962.0, 4261.0, 31193.0, 522537.0, 3416916.0, 197030.0, 16153.0, 2571.0, 744.0, 290.0, 195.0, 124.0, 68.0, 52.0, 57.0, 33.0, 19.0, 18.0, 14.0, 7.0, 12.0, 10.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-11.59375, -11.24609375, -10.8984375, -10.55078125, -10.203125, -9.85546875, -9.5078125, -9.16015625, -8.8125, -8.46484375, -8.1171875, -7.76953125, -7.421875, -7.07421875, -6.7265625, -6.37890625, -6.03125, -5.68359375, -5.3359375, -4.98828125, -4.640625, -4.29296875, -3.9453125, -3.59765625, -3.25, -2.90234375, -2.5546875, -2.20703125, -1.859375, -1.51171875, -1.1640625, -0.81640625, -0.46875, -0.12109375, 0.2265625, 0.57421875, 0.921875, 1.26953125, 1.6171875, 1.96484375, 2.3125, 2.66015625, 3.0078125, 3.35546875, 3.703125, 4.05078125, 4.3984375, 4.74609375, 5.09375, 5.44140625, 5.7890625, 6.13671875, 6.484375, 6.83203125, 7.1796875, 7.52734375, 7.875, 8.22265625, 8.5703125, 8.91796875, 9.265625, 9.61328125, 9.9609375, 10.30859375, 10.65625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 22.0, 70.0, 160.0, 210.0, 237.0, 159.0, 89.0, 35.0, 17.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.082590103149414, -19.771987915039062, -18.461383819580078, -17.150781631469727, -15.840177536010742, -14.52957534790039, -13.218972206115723, -11.908369064331055, -10.597765922546387, -9.287162780761719, -7.976559638977051, -6.665956974029541, -5.355353832244873, -4.044750690460205, -2.7341480255126953, -1.4235448837280273, -0.11294174194335938, 1.197661280632019, 2.5082643032073975, 3.8188672065734863, 5.129470348358154, 6.440073490142822, 7.750676155090332, 9.061279296875, 10.371882438659668, 11.682485580444336, 12.993088722229004, 14.303691864013672, 15.614294052124023, 16.924898147583008, 18.23550033569336, 19.546104431152344, 20.856704711914062, 22.167306900024414, 23.4779109954834, 24.78851318359375, 26.099117279052734, 27.409719467163086, 28.720321655273438, 30.030925750732422, 31.341529846191406, 32.65213394165039, 33.96273422241211, 35.273338317871094, 36.58394241333008, 37.89454650878906, 39.20514678955078, 40.515750885009766, 41.82635498046875, 43.136959075927734, 44.44755935668945, 45.75816345214844, 47.06876754760742, 48.379371643066406, 49.689971923828125, 51.00057601928711, 52.31117630004883, 53.62178039550781, 54.93238067626953, 56.242984771728516, 57.5535888671875, 58.864192962646484, 60.1747932434082, 61.48539733886719, 62.79600143432617]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 3.0, 10.0, 15.0, 6.0, 12.0, 13.0, 13.0, 22.0, 25.0, 27.0, 28.0, 28.0, 29.0, 42.0, 50.0, 47.0, 31.0, 38.0, 39.0, 42.0, 48.0, 60.0, 42.0, 41.0, 40.0, 27.0, 28.0, 18.0, 23.0, 25.0, 18.0, 22.0, 14.0, 16.0, 12.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.533114433288574, -10.15221881866455, -9.771322250366211, -9.390426635742188, -9.009530067443848, -8.628634452819824, -8.247737884521484, -7.866842269897461, -7.4859466552734375, -7.105050563812256, -6.724154472351074, -6.343258857727051, -5.962362766265869, -5.5814666748046875, -5.200570583343506, -4.819674491882324, -4.438778400421143, -4.057882308959961, -3.6769864559173584, -3.2960903644561768, -2.915194511413574, -2.5342984199523926, -2.153402328491211, -1.7725064754486084, -1.3916103839874268, -1.0107144117355347, -0.6298183798789978, -0.24892234802246094, 0.13197362422943115, 0.5128695964813232, 0.8937656879425049, 1.2746615409851074, 1.655557632446289, 2.0364537239074707, 2.4173495769500732, 2.798245668411255, 3.1791415214538574, 3.560037612915039, 3.9409337043762207, 4.321829795837402, 4.702725410461426, 5.083621501922607, 5.464517593383789, 5.8454132080078125, 6.226309299468994, 6.607205390930176, 6.988101482391357, 7.368997573852539, 7.749893665313721, 8.130789756774902, 8.511685371398926, 8.892581939697266, 9.273477554321289, 9.654373168945312, 10.035269737243652, 10.416165351867676, 10.797061920166016, 11.177957534790039, 11.558854103088379, 11.939749717712402, 12.320646286010742, 12.701541900634766, 13.082437515258789, 13.463334083557129, 13.844229698181152]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 12.0, 7.0, 10.0, 12.0, 16.0, 28.0, 20.0, 25.0, 38.0, 44.0, 43.0, 43.0, 38.0, 42.0, 44.0, 46.0, 47.0, 42.0, 50.0, 53.0, 29.0, 34.0, 44.0, 30.0, 30.0, 20.0, 30.0, 16.0, 18.0, 18.0, 16.0, 13.0, 12.0, 7.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.2131500244140625, -2.148956298828125, -2.0847625732421875, -2.02056884765625, -1.9563751220703125, -1.892181396484375, -1.8279876708984375, -1.7637939453125, -1.6996002197265625, -1.635406494140625, -1.5712127685546875, -1.50701904296875, -1.4428253173828125, -1.378631591796875, -1.3144378662109375, -1.250244140625, -1.1860504150390625, -1.121856689453125, -1.0576629638671875, -0.99346923828125, -0.9292755126953125, -0.865081787109375, -0.8008880615234375, -0.7366943359375, -0.6725006103515625, -0.608306884765625, -0.5441131591796875, -0.47991943359375, -0.4157257080078125, -0.351531982421875, -0.2873382568359375, -0.22314453125, -0.1589508056640625, -0.094757080078125, -0.0305633544921875, 0.03363037109375, 0.0978240966796875, 0.162017822265625, 0.2262115478515625, 0.2904052734375, 0.3545989990234375, 0.418792724609375, 0.4829864501953125, 0.54718017578125, 0.6113739013671875, 0.675567626953125, 0.7397613525390625, 0.803955078125, 0.8681488037109375, 0.932342529296875, 0.9965362548828125, 1.06072998046875, 1.1249237060546875, 1.189117431640625, 1.2533111572265625, 1.3175048828125, 1.3816986083984375, 1.445892333984375, 1.5100860595703125, 1.57427978515625, 1.6384735107421875, 1.702667236328125, 1.7668609619140625, 1.8310546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 4.0, 15.0, 33.0, 31.0, 49.0, 65.0, 97.0, 133.0, 197.0, 311.0, 433.0, 631.0, 870.0, 1320.0, 2188.0, 3030.0, 4766.0, 7382.0, 11116.0, 17106.0, 26217.0, 41326.0, 66606.0, 110477.0, 167244.0, 189628.0, 147165.0, 92679.0, 56584.0, 35222.0, 22692.0, 14800.0, 9672.0, 6143.0, 4074.0, 2779.0, 1841.0, 1150.0, 767.0, 520.0, 397.0, 252.0, 167.0, 108.0, 73.0, 81.0, 36.0, 29.0, 18.0, 13.0, 11.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.168701171875, -0.1629486083984375, -0.157196044921875, -0.1514434814453125, -0.14569091796875, -0.1399383544921875, -0.134185791015625, -0.1284332275390625, -0.1226806640625, -0.1169281005859375, -0.111175537109375, -0.1054229736328125, -0.09967041015625, -0.0939178466796875, -0.088165283203125, -0.0824127197265625, -0.07666015625, -0.0709075927734375, -0.065155029296875, -0.0594024658203125, -0.05364990234375, -0.0478973388671875, -0.042144775390625, -0.0363922119140625, -0.0306396484375, -0.0248870849609375, -0.019134521484375, -0.0133819580078125, -0.00762939453125, -0.0018768310546875, 0.003875732421875, 0.0096282958984375, 0.015380859375, 0.0211334228515625, 0.026885986328125, 0.0326385498046875, 0.03839111328125, 0.0441436767578125, 0.049896240234375, 0.0556488037109375, 0.0614013671875, 0.0671539306640625, 0.072906494140625, 0.0786590576171875, 0.08441162109375, 0.0901641845703125, 0.095916748046875, 0.1016693115234375, 0.107421875, 0.1131744384765625, 0.118927001953125, 0.1246795654296875, 0.13043212890625, 0.1361846923828125, 0.141937255859375, 0.1476898193359375, 0.1534423828125, 0.1591949462890625, 0.164947509765625, 0.1707000732421875, 0.17645263671875, 0.1822052001953125, 0.187957763671875, 0.1937103271484375, 0.199462890625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 6.0, 4.0, 5.0, 6.0, 13.0, 7.0, 9.0, 18.0, 15.0, 16.0, 16.0, 20.0, 20.0, 25.0, 26.0, 30.0, 28.0, 52.0, 40.0, 42.0, 37.0, 40.0, 1080.0, 43.0, 43.0, 45.0, 31.0, 33.0, 31.0, 22.0, 24.0, 25.0, 28.0, 16.0, 21.0, 23.0, 18.0, 10.0, 12.0, 11.0, 10.0, 9.0, 5.0, 2.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3369140625, -1.2968902587890625, -1.256866455078125, -1.2168426513671875, -1.17681884765625, -1.1367950439453125, -1.096771240234375, -1.0567474365234375, -1.0167236328125, -0.9766998291015625, -0.936676025390625, -0.8966522216796875, -0.85662841796875, -0.8166046142578125, -0.776580810546875, -0.7365570068359375, -0.696533203125, -0.6565093994140625, -0.616485595703125, -0.5764617919921875, -0.53643798828125, -0.4964141845703125, -0.456390380859375, -0.4163665771484375, -0.3763427734375, -0.3363189697265625, -0.296295166015625, -0.2562713623046875, -0.21624755859375, -0.1762237548828125, -0.136199951171875, -0.0961761474609375, -0.05615234375, -0.0161285400390625, 0.023895263671875, 0.0639190673828125, 0.10394287109375, 0.1439666748046875, 0.183990478515625, 0.2240142822265625, 0.2640380859375, 0.3040618896484375, 0.344085693359375, 0.3841094970703125, 0.42413330078125, 0.4641571044921875, 0.504180908203125, 0.5442047119140625, 0.584228515625, 0.6242523193359375, 0.664276123046875, 0.7042999267578125, 0.74432373046875, 0.7843475341796875, 0.824371337890625, 0.8643951416015625, 0.9044189453125, 0.9444427490234375, 0.984466552734375, 1.0244903564453125, 1.06451416015625, 1.1045379638671875, 1.144561767578125, 1.1845855712890625, 1.224609375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 6.0, 8.0, 7.0, 15.0, 29.0, 28.0, 33.0, 46.0, 73.0, 90.0, 135.0, 177.0, 301.0, 409.0, 581.0, 973.0, 1418.0, 2433.0, 3862.0, 6597.0, 11371.0, 22835.0, 72513.0, 1716566.0, 187931.0, 32753.0, 14890.0, 8209.0, 4698.0, 2932.0, 1790.0, 1129.0, 706.0, 453.0, 321.0, 247.0, 159.0, 123.0, 60.0, 51.0, 38.0, 39.0, 25.0, 17.0, 14.0, 6.0, 9.0, 6.0, 7.0, 7.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.31787109375, -0.3081512451171875, -0.298431396484375, -0.2887115478515625, -0.27899169921875, -0.2692718505859375, -0.259552001953125, -0.2498321533203125, -0.2401123046875, -0.2303924560546875, -0.220672607421875, -0.2109527587890625, -0.20123291015625, -0.1915130615234375, -0.181793212890625, -0.1720733642578125, -0.162353515625, -0.1526336669921875, -0.142913818359375, -0.1331939697265625, -0.12347412109375, -0.1137542724609375, -0.104034423828125, -0.0943145751953125, -0.0845947265625, -0.0748748779296875, -0.065155029296875, -0.0554351806640625, -0.04571533203125, -0.0359954833984375, -0.026275634765625, -0.0165557861328125, -0.0068359375, 0.0028839111328125, 0.012603759765625, 0.0223236083984375, 0.03204345703125, 0.0417633056640625, 0.051483154296875, 0.0612030029296875, 0.0709228515625, 0.0806427001953125, 0.090362548828125, 0.1000823974609375, 0.10980224609375, 0.1195220947265625, 0.129241943359375, 0.1389617919921875, 0.148681640625, 0.1584014892578125, 0.168121337890625, 0.1778411865234375, 0.18756103515625, 0.1972808837890625, 0.207000732421875, 0.2167205810546875, 0.2264404296875, 0.2361602783203125, 0.245880126953125, 0.2555999755859375, 0.26531982421875, 0.2750396728515625, 0.284759521484375, 0.2944793701171875, 0.30419921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 7.0, 6.0, 8.0, 6.0, 11.0, 18.0, 20.0, 21.0, 29.0, 18.0, 29.0, 34.0, 39.0, 33.0, 44.0, 39.0, 56.0, 53.0, 49.0, 52.0, 45.0, 38.0, 39.0, 43.0, 34.0, 28.0, 31.0, 26.0, 26.0, 21.0, 18.0, 13.0, 14.0, 17.0, 10.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0], "bins": [-0.01299285888671875, -0.012636065483093262, -0.012279272079467773, -0.011922478675842285, -0.011565685272216797, -0.011208891868591309, -0.01085209846496582, -0.010495305061340332, -0.010138511657714844, -0.009781718254089355, -0.009424924850463867, -0.009068131446838379, -0.00871133804321289, -0.008354544639587402, -0.007997751235961914, -0.007640957832336426, -0.0072841644287109375, -0.006927371025085449, -0.006570577621459961, -0.006213784217834473, -0.005856990814208984, -0.005500197410583496, -0.005143404006958008, -0.0047866106033325195, -0.004429817199707031, -0.004073023796081543, -0.0037162303924560547, -0.0033594369888305664, -0.003002643585205078, -0.00264585018157959, -0.0022890567779541016, -0.0019322633743286133, -0.001575469970703125, -0.0012186765670776367, -0.0008618831634521484, -0.0005050897598266602, -0.00014829635620117188, 0.0002084970474243164, 0.0005652904510498047, 0.000922083854675293, 0.0012788772583007812, 0.0016356706619262695, 0.001992464065551758, 0.002349257469177246, 0.0027060508728027344, 0.0030628442764282227, 0.003419637680053711, 0.0037764310836791992, 0.0041332244873046875, 0.004490017890930176, 0.004846811294555664, 0.005203604698181152, 0.005560398101806641, 0.005917191505432129, 0.006273984909057617, 0.0066307783126831055, 0.006987571716308594, 0.007344365119934082, 0.00770115852355957, 0.008057951927185059, 0.008414745330810547, 0.008771538734436035, 0.009128332138061523, 0.009485125541687012, 0.0098419189453125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 4.0, 5.0, 11.0, 19.0, 14.0, 16.0, 22.0, 25.0, 24.0, 27.0, 51.0, 48.0, 68.0, 105.0, 154.0, 322.0, 776.0, 13931.0, 888606.0, 141453.0, 1720.0, 464.0, 195.0, 124.0, 69.0, 59.0, 50.0, 28.0, 22.0, 23.0, 30.0, 10.0, 16.0, 14.0, 7.0, 8.0, 5.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1983642578125, -0.19145774841308594, -0.18455123901367188, -0.1776447296142578, -0.17073822021484375, -0.1638317108154297, -0.15692520141601562, -0.15001869201660156, -0.1431121826171875, -0.13620567321777344, -0.12929916381835938, -0.12239265441894531, -0.11548614501953125, -0.10857963562011719, -0.10167312622070312, -0.09476661682128906, -0.087860107421875, -0.08095359802246094, -0.07404708862304688, -0.06714057922363281, -0.06023406982421875, -0.05332756042480469, -0.046421051025390625, -0.03951454162597656, -0.0326080322265625, -0.025701522827148438, -0.018795013427734375, -0.011888504028320312, -0.00498199462890625, 0.0019245147705078125, 0.008831024169921875, 0.015737533569335938, 0.02264404296875, 0.029550552368164062, 0.036457061767578125, 0.04336357116699219, 0.05027008056640625, 0.05717658996582031, 0.06408309936523438, 0.07098960876464844, 0.0778961181640625, 0.08480262756347656, 0.09170913696289062, 0.09861564636230469, 0.10552215576171875, 0.11242866516113281, 0.11933517456054688, 0.12624168395996094, 0.133148193359375, 0.14005470275878906, 0.14696121215820312, 0.1538677215576172, 0.16077423095703125, 0.1676807403564453, 0.17458724975585938, 0.18149375915527344, 0.1884002685546875, 0.19530677795410156, 0.20221328735351562, 0.2091197967529297, 0.21602630615234375, 0.2229328155517578, 0.22983932495117188, 0.23674583435058594, 0.24365234375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 28.0, 222.0, 588.0, 136.0, 27.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17983974516391754, -0.17559866607189178, -0.17135757207870483, -0.16711649298667908, -0.16287539899349213, -0.15863431990146637, -0.15439322590827942, -0.15015214681625366, -0.1459110677242279, -0.14166998863220215, -0.1374288946390152, -0.13318781554698944, -0.1289467215538025, -0.12470564246177673, -0.12046455591917038, -0.11622346937656403, -0.11198238283395767, -0.10774129629135132, -0.10350020974874496, -0.09925912320613861, -0.09501804411411285, -0.0907769575715065, -0.08653587102890015, -0.08229478448629379, -0.07805369794368744, -0.07381261140108109, -0.06957152485847473, -0.06533044576644897, -0.06108935922384262, -0.05684827268123627, -0.05260718613862991, -0.04836609959602356, -0.0441250205039978, -0.03988393396139145, -0.035642851144075394, -0.03140176460146904, -0.027160679921507835, -0.02291959524154663, -0.018678508698940277, -0.014437424018979073, -0.010196339339017868, -0.005955254193395376, -0.0017141690477728844, 0.0025269165635108948, 0.006768001243472099, 0.011009085923433304, 0.015250172466039658, 0.019491257146000862, 0.023732341825962067, 0.02797342650592327, 0.032214511185884476, 0.03645559772849083, 0.040696680545806885, 0.04493776708841324, 0.04917885363101959, 0.053419940173625946, 0.057661022990942, 0.061902109533548355, 0.06614319235086441, 0.07038427889347076, 0.07462536543607712, 0.07886645197868347, 0.08310753107070923, 0.08734861761331558, 0.09158970415592194]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 8.0, 16.0, 12.0, 15.0, 21.0, 26.0, 21.0, 29.0, 41.0, 35.0, 53.0, 42.0, 47.0, 37.0, 49.0, 50.0, 39.0, 55.0, 46.0, 30.0, 35.0, 39.0, 37.0, 38.0, 30.0, 27.0, 16.0, 18.0, 21.0, 11.0, 8.0, 5.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.021970510482788086, -0.021376032382249832, -0.02078155241906643, -0.020187072455883026, -0.019592594355344772, -0.01899811625480652, -0.018403636291623116, -0.017809156328439713, -0.01721467822790146, -0.016620200127363205, -0.016025720164179802, -0.015431241132318974, -0.014836762100458145, -0.014242283068597317, -0.013647804036736488, -0.01305332500487566, -0.012458845973014832, -0.011864366941154003, -0.011269887909293175, -0.010675408877432346, -0.010080929845571518, -0.00948645081371069, -0.008891971781849861, -0.008297492749989033, -0.007703013718128204, -0.007108534686267376, -0.0065140556544065475, -0.005919576622545719, -0.005325097590684891, -0.004730618558824062, -0.004136139526963234, -0.0035416604951024055, -0.002947181463241577, -0.0023527024313807487, -0.0017582233995199203, -0.001163744367659092, -0.0005692653357982635, 2.521369606256485e-05, 0.0006196927279233932, 0.0012141717597842216, 0.00180865079164505, 0.0024031298235058784, 0.002997608855366707, 0.0035920878872275352, 0.004186566919088364, 0.004781045950949192, 0.0053755249828100204, 0.005970004014670849, 0.006564483046531677, 0.007158962078392506, 0.007753441110253334, 0.008347920142114162, 0.00894239917397499, 0.00953687820583582, 0.010131357237696648, 0.010725836269557476, 0.011320315301418304, 0.011914794333279133, 0.012509273365139961, 0.01310375239700079, 0.013698231428861618, 0.014292710460722446, 0.014887189492583275, 0.015481668524444103, 0.01607614755630493]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 12.0, 7.0, 10.0, 12.0, 16.0, 28.0, 20.0, 25.0, 38.0, 44.0, 43.0, 43.0, 37.0, 42.0, 45.0, 47.0, 46.0, 41.0, 51.0, 53.0, 29.0, 34.0, 44.0, 29.0, 30.0, 21.0, 30.0, 16.0, 18.0, 17.0, 17.0, 13.0, 12.0, 7.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.2131500244140625, -2.148956298828125, -2.0847625732421875, -2.02056884765625, -1.9563751220703125, -1.892181396484375, -1.8279876708984375, -1.7637939453125, -1.6996002197265625, -1.635406494140625, -1.5712127685546875, -1.50701904296875, -1.4428253173828125, -1.378631591796875, -1.3144378662109375, -1.250244140625, -1.1860504150390625, -1.121856689453125, -1.0576629638671875, -0.99346923828125, -0.9292755126953125, -0.865081787109375, -0.8008880615234375, -0.7366943359375, -0.6725006103515625, -0.608306884765625, -0.5441131591796875, -0.47991943359375, -0.4157257080078125, -0.351531982421875, -0.2873382568359375, -0.22314453125, -0.1589508056640625, -0.094757080078125, -0.0305633544921875, 0.03363037109375, 0.0978240966796875, 0.162017822265625, 0.2262115478515625, 0.2904052734375, 0.3545989990234375, 0.418792724609375, 0.4829864501953125, 0.54718017578125, 0.6113739013671875, 0.675567626953125, 0.7397613525390625, 0.803955078125, 0.8681488037109375, 0.932342529296875, 0.9965362548828125, 1.06072998046875, 1.1249237060546875, 1.189117431640625, 1.2533111572265625, 1.3175048828125, 1.3816986083984375, 1.445892333984375, 1.5100860595703125, 1.57427978515625, 1.6384735107421875, 1.702667236328125, 1.7668609619140625, 1.8310546875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 10.0, 17.0, 16.0, 28.0, 46.0, 46.0, 94.0, 128.0, 181.0, 224.0, 375.0, 505.0, 801.0, 1246.0, 1887.0, 2939.0, 4771.0, 7476.0, 12421.0, 20584.0, 37031.0, 73443.0, 161221.0, 286657.0, 218877.0, 101928.0, 48759.0, 26226.0, 15285.0, 9172.0, 5764.0, 3571.0, 2345.0, 1463.0, 1009.0, 642.0, 433.0, 275.0, 198.0, 127.0, 99.0, 72.0, 49.0, 30.0, 22.0, 17.0, 13.0, 8.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0], "bins": [-2.01953125, -1.957794189453125, -1.89605712890625, -1.834320068359375, -1.7725830078125, -1.710845947265625, -1.64910888671875, -1.587371826171875, -1.525634765625, -1.463897705078125, -1.40216064453125, -1.340423583984375, -1.2786865234375, -1.216949462890625, -1.15521240234375, -1.093475341796875, -1.03173828125, -0.970001220703125, -0.90826416015625, -0.846527099609375, -0.7847900390625, -0.723052978515625, -0.66131591796875, -0.599578857421875, -0.537841796875, -0.476104736328125, -0.41436767578125, -0.352630615234375, -0.2908935546875, -0.229156494140625, -0.16741943359375, -0.105682373046875, -0.0439453125, 0.017791748046875, 0.07952880859375, 0.141265869140625, 0.2030029296875, 0.264739990234375, 0.32647705078125, 0.388214111328125, 0.449951171875, 0.511688232421875, 0.57342529296875, 0.635162353515625, 0.6968994140625, 0.758636474609375, 0.82037353515625, 0.882110595703125, 0.94384765625, 1.005584716796875, 1.06732177734375, 1.129058837890625, 1.1907958984375, 1.252532958984375, 1.31427001953125, 1.376007080078125, 1.437744140625, 1.499481201171875, 1.56121826171875, 1.622955322265625, 1.6846923828125, 1.746429443359375, 1.80816650390625, 1.869903564453125, 1.931640625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 3.0, 10.0, 9.0, 8.0, 10.0, 11.0, 18.0, 19.0, 27.0, 20.0, 24.0, 37.0, 43.0, 37.0, 57.0, 56.0, 101.0, 163.0, 321.0, 1366.0, 192.0, 120.0, 53.0, 42.0, 43.0, 33.0, 38.0, 26.0, 23.0, 18.0, 16.0, 22.0, 15.0, 16.0, 5.0, 12.0, 14.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.66876220703125, -4.4898681640625, -4.31097412109375, -4.132080078125, -3.95318603515625, -3.7742919921875, -3.59539794921875, -3.41650390625, -3.23760986328125, -3.0587158203125, -2.87982177734375, -2.700927734375, -2.52203369140625, -2.3431396484375, -2.16424560546875, -1.9853515625, -1.80645751953125, -1.6275634765625, -1.44866943359375, -1.269775390625, -1.09088134765625, -0.9119873046875, -0.73309326171875, -0.55419921875, -0.37530517578125, -0.1964111328125, -0.01751708984375, 0.161376953125, 0.34027099609375, 0.5191650390625, 0.69805908203125, 0.876953125, 1.05584716796875, 1.2347412109375, 1.41363525390625, 1.592529296875, 1.77142333984375, 1.9503173828125, 2.12921142578125, 2.30810546875, 2.48699951171875, 2.6658935546875, 2.84478759765625, 3.023681640625, 3.20257568359375, 3.3814697265625, 3.56036376953125, 3.7392578125, 3.91815185546875, 4.0970458984375, 4.27593994140625, 4.454833984375, 4.63372802734375, 4.8126220703125, 4.99151611328125, 5.17041015625, 5.34930419921875, 5.5281982421875, 5.70709228515625, 5.885986328125, 6.06488037109375, 6.2437744140625, 6.42266845703125, 6.6015625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 0.0, 4.0, 4.0, 3.0, 14.0, 13.0, 14.0, 14.0, 23.0, 24.0, 29.0, 35.0, 57.0, 75.0, 92.0, 137.0, 253.0, 486.0, 1438.0, 6790.0, 50840.0, 974299.0, 2005166.0, 91484.0, 10770.0, 2087.0, 655.0, 281.0, 154.0, 115.0, 87.0, 63.0, 32.0, 32.0, 28.0, 28.0, 12.0, 15.0, 11.0, 7.0, 8.0, 10.0, 6.0, 5.0, 6.0, 0.0, 3.0, 5.0], "bins": [-8.828125, -8.5965576171875, -8.364990234375, -8.1334228515625, -7.90185546875, -7.6702880859375, -7.438720703125, -7.2071533203125, -6.9755859375, -6.7440185546875, -6.512451171875, -6.2808837890625, -6.04931640625, -5.8177490234375, -5.586181640625, -5.3546142578125, -5.123046875, -4.8914794921875, -4.659912109375, -4.4283447265625, -4.19677734375, -3.9652099609375, -3.733642578125, -3.5020751953125, -3.2705078125, -3.0389404296875, -2.807373046875, -2.5758056640625, -2.34423828125, -2.1126708984375, -1.881103515625, -1.6495361328125, -1.41796875, -1.1864013671875, -0.954833984375, -0.7232666015625, -0.49169921875, -0.2601318359375, -0.028564453125, 0.2030029296875, 0.4345703125, 0.6661376953125, 0.897705078125, 1.1292724609375, 1.36083984375, 1.5924072265625, 1.823974609375, 2.0555419921875, 2.287109375, 2.5186767578125, 2.750244140625, 2.9818115234375, 3.21337890625, 3.4449462890625, 3.676513671875, 3.9080810546875, 4.1396484375, 4.3712158203125, 4.602783203125, 4.8343505859375, 5.06591796875, 5.2974853515625, 5.529052734375, 5.7606201171875, 5.9921875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [29.0, 383.0, 517.0, 83.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3833417892456055, -2.3127946853637695, -0.2422475814819336, 1.8282995223999023, 3.8988466262817383, 5.969393730163574, 8.03994083404541, 10.110487937927246, 12.181035041809082, 14.251582145690918, 16.322128295898438, 18.392677307128906, 20.46322250366211, 22.533771514892578, 24.60431671142578, 26.67486572265625, 28.745410919189453, 30.81595802307129, 32.886505126953125, 34.957054138183594, 37.0275993347168, 39.09814453125, 41.16869354248047, 43.23924255371094, 45.30978775024414, 47.380332946777344, 49.45088195800781, 51.52143096923828, 53.591976165771484, 55.66252136230469, 57.733070373535156, 59.803619384765625, 61.87416076660156, 63.94470977783203, 66.0152587890625, 68.08580017089844, 70.1563491821289, 72.22689819335938, 74.29743957519531, 76.36798858642578, 78.43853759765625, 80.50908660888672, 82.57963562011719, 84.65017700195312, 86.7207260131836, 88.79127502441406, 90.86181640625, 92.93236541748047, 95.00291442871094, 97.0734634399414, 99.14401245117188, 101.21455383300781, 103.28510284423828, 105.35565185546875, 107.42619323730469, 109.49674224853516, 111.56729125976562, 113.6378402709961, 115.70838928222656, 117.7789306640625, 119.84947967529297, 121.92002868652344, 123.99057006835938, 126.06111907958984, 128.1316680908203]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 2.0, 2.0, 6.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 18.0, 18.0, 14.0, 25.0, 18.0, 29.0, 24.0, 31.0, 31.0, 37.0, 39.0, 27.0, 37.0, 38.0, 47.0, 42.0, 32.0, 42.0, 40.0, 40.0, 29.0, 28.0, 37.0, 24.0, 21.0, 28.0, 22.0, 19.0, 13.0, 17.0, 15.0, 16.0, 14.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.269007682800293, -12.836888313293457, -12.404769897460938, -11.972650527954102, -11.540532112121582, -11.108412742614746, -10.676294326782227, -10.24417495727539, -9.812055587768555, -9.379936218261719, -8.9478178024292, -8.515698432922363, -8.083580017089844, -7.651460647583008, -7.21934175491333, -6.787222862243652, -6.355103969573975, -5.922985076904297, -5.490866184234619, -5.058747291564941, -4.6266279220581055, -4.194509029388428, -3.76239013671875, -3.330271005630493, -2.8981521129608154, -2.4660332202911377, -2.033914089202881, -1.6017951965332031, -1.1696761846542358, -0.7375571727752686, -0.3054382801055908, 0.12668085098266602, 0.5587997436523438, 0.990918755531311, 1.4230377674102783, 1.855156660079956, 2.287275791168213, 2.7193946838378906, 3.1515135765075684, 3.583632707595825, 4.015751838684082, 4.44787073135376, 4.8799896240234375, 5.312108993530273, 5.744227886199951, 6.176346778869629, 6.608465671539307, 7.040584564208984, 7.472703456878662, 7.90482234954834, 8.336941719055176, 8.769060134887695, 9.201179504394531, 9.633298873901367, 10.065417289733887, 10.497536659240723, 10.929655075073242, 11.361774444580078, 11.793892860412598, 12.226012229919434, 12.658130645751953, 13.090250015258789, 13.522369384765625, 13.954487800598145, 14.38660717010498]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 12.0, 11.0, 15.0, 13.0, 11.0, 12.0, 14.0, 26.0, 35.0, 25.0, 32.0, 33.0, 36.0, 31.0, 40.0, 51.0, 32.0, 44.0, 39.0, 57.0, 38.0, 44.0, 38.0, 29.0, 29.0, 31.0, 23.0, 26.0, 29.0, 17.0, 20.0, 13.0, 19.0, 15.0, 13.0, 10.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0], "bins": [-2.208984375, -2.1495513916015625, -2.090118408203125, -2.0306854248046875, -1.97125244140625, -1.9118194580078125, -1.852386474609375, -1.7929534912109375, -1.7335205078125, -1.6740875244140625, -1.614654541015625, -1.5552215576171875, -1.49578857421875, -1.4363555908203125, -1.376922607421875, -1.3174896240234375, -1.258056640625, -1.1986236572265625, -1.139190673828125, -1.0797576904296875, -1.02032470703125, -0.9608917236328125, -0.901458740234375, -0.8420257568359375, -0.7825927734375, -0.7231597900390625, -0.663726806640625, -0.6042938232421875, -0.54486083984375, -0.4854278564453125, -0.425994873046875, -0.3665618896484375, -0.30712890625, -0.2476959228515625, -0.188262939453125, -0.1288299560546875, -0.06939697265625, -0.0099639892578125, 0.049468994140625, 0.1089019775390625, 0.1683349609375, 0.2277679443359375, 0.287200927734375, 0.3466339111328125, 0.40606689453125, 0.4654998779296875, 0.524932861328125, 0.5843658447265625, 0.643798828125, 0.7032318115234375, 0.762664794921875, 0.8220977783203125, 0.88153076171875, 0.9409637451171875, 1.000396728515625, 1.0598297119140625, 1.1192626953125, 1.1786956787109375, 1.238128662109375, 1.2975616455078125, 1.35699462890625, 1.4164276123046875, 1.475860595703125, 1.5352935791015625, 1.5947265625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 13.0, 12.0, 28.0, 36.0, 43.0, 67.0, 75.0, 114.0, 148.0, 232.0, 369.0, 541.0, 957.0, 1364.0, 2477.0, 4441.0, 8309.0, 16910.0, 38730.0, 109347.0, 479281.0, 2214070.0, 1022484.0, 188716.0, 57056.0, 23510.0, 11090.0, 5665.0, 3247.0, 1746.0, 1068.0, 671.0, 419.0, 275.0, 234.0, 130.0, 111.0, 82.0, 52.0, 53.0, 35.0, 17.0, 16.0, 8.0, 6.0, 6.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.794921875, -3.682342529296875, -3.56976318359375, -3.457183837890625, -3.3446044921875, -3.232025146484375, -3.11944580078125, -3.006866455078125, -2.894287109375, -2.781707763671875, -2.66912841796875, -2.556549072265625, -2.4439697265625, -2.331390380859375, -2.21881103515625, -2.106231689453125, -1.99365234375, -1.881072998046875, -1.76849365234375, -1.655914306640625, -1.5433349609375, -1.430755615234375, -1.31817626953125, -1.205596923828125, -1.093017578125, -0.980438232421875, -0.86785888671875, -0.755279541015625, -0.6427001953125, -0.530120849609375, -0.41754150390625, -0.304962158203125, -0.1923828125, -0.079803466796875, 0.03277587890625, 0.145355224609375, 0.2579345703125, 0.370513916015625, 0.48309326171875, 0.595672607421875, 0.708251953125, 0.820831298828125, 0.93341064453125, 1.045989990234375, 1.1585693359375, 1.271148681640625, 1.38372802734375, 1.496307373046875, 1.60888671875, 1.721466064453125, 1.83404541015625, 1.946624755859375, 2.0592041015625, 2.171783447265625, 2.28436279296875, 2.396942138671875, 2.509521484375, 2.622100830078125, 2.73468017578125, 2.847259521484375, 2.9598388671875, 3.072418212890625, 3.18499755859375, 3.297576904296875, 3.41015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 7.0, 13.0, 17.0, 31.0, 34.0, 53.0, 59.0, 70.0, 129.0, 149.0, 240.0, 307.0, 477.0, 584.0, 503.0, 385.0, 303.0, 173.0, 145.0, 77.0, 88.0, 55.0, 22.0, 39.0, 14.0, 21.0, 14.0, 11.0, 6.0, 8.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.818359375, -3.711669921875, -3.60498046875, -3.498291015625, -3.3916015625, -3.284912109375, -3.17822265625, -3.071533203125, -2.96484375, -2.858154296875, -2.75146484375, -2.644775390625, -2.5380859375, -2.431396484375, -2.32470703125, -2.218017578125, -2.111328125, -2.004638671875, -1.89794921875, -1.791259765625, -1.6845703125, -1.577880859375, -1.47119140625, -1.364501953125, -1.2578125, -1.151123046875, -1.04443359375, -0.937744140625, -0.8310546875, -0.724365234375, -0.61767578125, -0.510986328125, -0.404296875, -0.297607421875, -0.19091796875, -0.084228515625, 0.0224609375, 0.129150390625, 0.23583984375, 0.342529296875, 0.44921875, 0.555908203125, 0.66259765625, 0.769287109375, 0.8759765625, 0.982666015625, 1.08935546875, 1.196044921875, 1.302734375, 1.409423828125, 1.51611328125, 1.622802734375, 1.7294921875, 1.836181640625, 1.94287109375, 2.049560546875, 2.15625, 2.262939453125, 2.36962890625, 2.476318359375, 2.5830078125, 2.689697265625, 2.79638671875, 2.903076171875, 3.009765625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 3.0, 8.0, 16.0, 22.0, 12.0, 38.0, 34.0, 51.0, 67.0, 164.0, 248.0, 622.0, 1913.0, 8970.0, 70268.0, 1621314.0, 2386199.0, 89733.0, 10957.0, 2207.0, 700.0, 283.0, 147.0, 87.0, 59.0, 46.0, 32.0, 21.0, 11.0, 8.0, 4.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.0675048828125, -9.720947265625, -9.3743896484375, -9.02783203125, -8.6812744140625, -8.334716796875, -7.9881591796875, -7.6416015625, -7.2950439453125, -6.948486328125, -6.6019287109375, -6.25537109375, -5.9088134765625, -5.562255859375, -5.2156982421875, -4.869140625, -4.5225830078125, -4.176025390625, -3.8294677734375, -3.48291015625, -3.1363525390625, -2.789794921875, -2.4432373046875, -2.0966796875, -1.7501220703125, -1.403564453125, -1.0570068359375, -0.71044921875, -0.3638916015625, -0.017333984375, 0.3292236328125, 0.67578125, 1.0223388671875, 1.368896484375, 1.7154541015625, 2.06201171875, 2.4085693359375, 2.755126953125, 3.1016845703125, 3.4482421875, 3.7947998046875, 4.141357421875, 4.4879150390625, 4.83447265625, 5.1810302734375, 5.527587890625, 5.8741455078125, 6.220703125, 6.5672607421875, 6.913818359375, 7.2603759765625, 7.60693359375, 7.9534912109375, 8.300048828125, 8.6466064453125, 8.9931640625, 9.3397216796875, 9.686279296875, 10.0328369140625, 10.37939453125, 10.7259521484375, 11.072509765625, 11.4190673828125, 11.765625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 10.0, 42.0, 145.0, 331.0, 303.0, 129.0, 36.0, 13.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.71071434020996, -27.10619354248047, -25.501670837402344, -23.89714813232422, -22.292627334594727, -20.688106536865234, -19.08358383178711, -17.479061126708984, -15.874540328979492, -14.270018577575684, -12.665496826171875, -11.060975074768066, -9.456453323364258, -7.851931571960449, -6.247409820556641, -4.642888069152832, -3.0383663177490234, -1.4338445663452148, 0.17067718505859375, 1.7751989364624023, 3.379720687866211, 4.9842424392700195, 6.588764190673828, 8.193285942077637, 9.797807693481445, 11.402329444885254, 13.006851196289062, 14.611372947692871, 16.21589469909668, 17.820415496826172, 19.424938201904297, 21.029460906982422, 22.63397979736328, 24.238502502441406, 25.8430233001709, 27.44754409790039, 29.052066802978516, 30.65658950805664, 32.2611083984375, 33.865631103515625, 35.47015380859375, 37.074676513671875, 38.67919921875, 40.28371810913086, 41.888240814208984, 43.49276351928711, 45.09728240966797, 46.701805114746094, 48.30632781982422, 49.910850524902344, 51.51537322998047, 53.11989212036133, 54.72441482543945, 56.32893753051758, 57.93345642089844, 59.53797912597656, 61.14250183105469, 62.74702453613281, 64.35154724121094, 65.95606994628906, 67.56059265136719, 69.16510772705078, 70.7696304321289, 72.37415313720703, 73.97867584228516]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 11.0, 8.0, 13.0, 14.0, 25.0, 9.0, 22.0, 18.0, 34.0, 35.0, 36.0, 29.0, 35.0, 53.0, 39.0, 57.0, 55.0, 35.0, 38.0, 48.0, 33.0, 33.0, 42.0, 26.0, 24.0, 30.0, 27.0, 19.0, 27.0, 20.0, 19.0, 11.0, 17.0, 12.0, 11.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.029692649841309, -10.685018539428711, -10.340344429016113, -9.995670318603516, -9.650996208190918, -9.30632209777832, -8.961647987365723, -8.616973876953125, -8.272299766540527, -7.92762565612793, -7.582951545715332, -7.238277435302734, -6.893603324890137, -6.548929214477539, -6.204255104064941, -5.859580993652344, -5.514906883239746, -5.170232772827148, -4.825558662414551, -4.480884552001953, -4.1362104415893555, -3.791536331176758, -3.44686222076416, -3.1021881103515625, -2.757513999938965, -2.412839889526367, -2.0681657791137695, -1.7234916687011719, -1.3788175582885742, -1.0341434478759766, -0.6894693374633789, -0.34479522705078125, -0.00012111663818359375, 0.34455299377441406, 0.6892271041870117, 1.0339012145996094, 1.378575325012207, 1.7232494354248047, 2.0679235458374023, 2.41259765625, 2.7572717666625977, 3.1019458770751953, 3.446619987487793, 3.7912940979003906, 4.135968208312988, 4.480642318725586, 4.825316429138184, 5.169990539550781, 5.514664649963379, 5.859338760375977, 6.204012870788574, 6.548686981201172, 6.8933610916137695, 7.238035202026367, 7.582709312438965, 7.9273834228515625, 8.27205753326416, 8.616731643676758, 8.961405754089355, 9.306079864501953, 9.65075397491455, 9.995428085327148, 10.340102195739746, 10.684776306152344, 11.029450416564941]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 7.0, 18.0, 13.0, 13.0, 16.0, 24.0, 30.0, 20.0, 26.0, 35.0, 38.0, 39.0, 39.0, 41.0, 36.0, 40.0, 41.0, 40.0, 47.0, 38.0, 33.0, 44.0, 33.0, 31.0, 21.0, 30.0, 22.0, 25.0, 29.0, 17.0, 14.0, 14.0, 7.0, 15.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8583984375, -1.80157470703125, -1.7447509765625, -1.68792724609375, -1.631103515625, -1.57427978515625, -1.5174560546875, -1.46063232421875, -1.40380859375, -1.34698486328125, -1.2901611328125, -1.23333740234375, -1.176513671875, -1.11968994140625, -1.0628662109375, -1.00604248046875, -0.94921875, -0.89239501953125, -0.8355712890625, -0.77874755859375, -0.721923828125, -0.66510009765625, -0.6082763671875, -0.55145263671875, -0.49462890625, -0.43780517578125, -0.3809814453125, -0.32415771484375, -0.267333984375, -0.21051025390625, -0.1536865234375, -0.09686279296875, -0.0400390625, 0.01678466796875, 0.0736083984375, 0.13043212890625, 0.187255859375, 0.24407958984375, 0.3009033203125, 0.35772705078125, 0.41455078125, 0.47137451171875, 0.5281982421875, 0.58502197265625, 0.641845703125, 0.69866943359375, 0.7554931640625, 0.81231689453125, 0.869140625, 0.92596435546875, 0.9827880859375, 1.03961181640625, 1.096435546875, 1.15325927734375, 1.2100830078125, 1.26690673828125, 1.32373046875, 1.38055419921875, 1.4373779296875, 1.49420166015625, 1.551025390625, 1.60784912109375, 1.6646728515625, 1.72149658203125, 1.7783203125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 12.0, 11.0, 21.0, 40.0, 42.0, 73.0, 82.0, 112.0, 186.0, 298.0, 463.0, 656.0, 1072.0, 1625.0, 2697.0, 4054.0, 6863.0, 11472.0, 19487.0, 33834.0, 61349.0, 115538.0, 201114.0, 235909.0, 156703.0, 84975.0, 45593.0, 25679.0, 14961.0, 8986.0, 5431.0, 3339.0, 2074.0, 1280.0, 861.0, 545.0, 341.0, 249.0, 170.0, 109.0, 57.0, 62.0, 34.0, 31.0, 23.0, 13.0, 11.0, 9.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.2213134765625, -0.2146587371826172, -0.20800399780273438, -0.20134925842285156, -0.19469451904296875, -0.18803977966308594, -0.18138504028320312, -0.1747303009033203, -0.1680755615234375, -0.1614208221435547, -0.15476608276367188, -0.14811134338378906, -0.14145660400390625, -0.13480186462402344, -0.12814712524414062, -0.12149238586425781, -0.114837646484375, -0.10818290710449219, -0.10152816772460938, -0.09487342834472656, -0.08821868896484375, -0.08156394958496094, -0.07490921020507812, -0.06825447082519531, -0.0615997314453125, -0.05494499206542969, -0.048290252685546875, -0.04163551330566406, -0.03498077392578125, -0.028326034545898438, -0.021671295166015625, -0.015016555786132812, -0.00836181640625, -0.0017070770263671875, 0.004947662353515625, 0.011602401733398438, 0.01825714111328125, 0.024911880493164062, 0.031566619873046875, 0.03822135925292969, 0.0448760986328125, 0.05153083801269531, 0.058185577392578125, 0.06484031677246094, 0.07149505615234375, 0.07814979553222656, 0.08480453491210938, 0.09145927429199219, 0.098114013671875, 0.10476875305175781, 0.11142349243164062, 0.11807823181152344, 0.12473297119140625, 0.13138771057128906, 0.13804244995117188, 0.1446971893310547, 0.1513519287109375, 0.1580066680908203, 0.16466140747070312, 0.17131614685058594, 0.17797088623046875, 0.18462562561035156, 0.19128036499023438, 0.1979351043701172, 0.20458984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 12.0, 12.0, 11.0, 19.0, 17.0, 29.0, 25.0, 25.0, 30.0, 30.0, 46.0, 34.0, 31.0, 39.0, 36.0, 40.0, 1066.0, 44.0, 40.0, 38.0, 26.0, 50.0, 41.0, 26.0, 31.0, 34.0, 29.0, 18.0, 16.0, 24.0, 16.0, 7.0, 9.0, 16.0, 5.0, 7.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.3232421875, -1.2835845947265625, -1.243927001953125, -1.2042694091796875, -1.16461181640625, -1.1249542236328125, -1.085296630859375, -1.0456390380859375, -1.0059814453125, -0.9663238525390625, -0.926666259765625, -0.8870086669921875, -0.84735107421875, -0.8076934814453125, -0.768035888671875, -0.7283782958984375, -0.688720703125, -0.6490631103515625, -0.609405517578125, -0.5697479248046875, -0.53009033203125, -0.4904327392578125, -0.450775146484375, -0.4111175537109375, -0.3714599609375, -0.3318023681640625, -0.292144775390625, -0.2524871826171875, -0.21282958984375, -0.1731719970703125, -0.133514404296875, -0.0938568115234375, -0.05419921875, -0.0145416259765625, 0.025115966796875, 0.0647735595703125, 0.10443115234375, 0.1440887451171875, 0.183746337890625, 0.2234039306640625, 0.2630615234375, 0.3027191162109375, 0.342376708984375, 0.3820343017578125, 0.42169189453125, 0.4613494873046875, 0.501007080078125, 0.5406646728515625, 0.580322265625, 0.6199798583984375, 0.659637451171875, 0.6992950439453125, 0.73895263671875, 0.7786102294921875, 0.818267822265625, 0.8579254150390625, 0.8975830078125, 0.9372406005859375, 0.976898193359375, 1.0165557861328125, 1.05621337890625, 1.0958709716796875, 1.135528564453125, 1.1751861572265625, 1.21484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 8.0, 13.0, 8.0, 31.0, 32.0, 37.0, 57.0, 68.0, 86.0, 174.0, 221.0, 434.0, 679.0, 1069.0, 1964.0, 3565.0, 6410.0, 12529.0, 28426.0, 161378.0, 1773532.0, 64645.0, 20154.0, 9631.0, 5232.0, 2785.0, 1482.0, 914.0, 533.0, 322.0, 221.0, 153.0, 105.0, 64.0, 50.0, 33.0, 17.0, 12.0, 11.0, 10.0, 10.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.3427734375, -0.3321647644042969, -0.32155609130859375, -0.3109474182128906, -0.3003387451171875, -0.2897300720214844, -0.27912139892578125, -0.2685127258300781, -0.257904052734375, -0.24729537963867188, -0.23668670654296875, -0.22607803344726562, -0.2154693603515625, -0.20486068725585938, -0.19425201416015625, -0.18364334106445312, -0.17303466796875, -0.16242599487304688, -0.15181732177734375, -0.14120864868164062, -0.1305999755859375, -0.11999130249023438, -0.10938262939453125, -0.09877395629882812, -0.088165283203125, -0.07755661010742188, -0.06694793701171875, -0.056339263916015625, -0.0457305908203125, -0.035121917724609375, -0.02451324462890625, -0.013904571533203125, -0.0032958984375, 0.007312774658203125, 0.01792144775390625, 0.028530120849609375, 0.0391387939453125, 0.049747467041015625, 0.06035614013671875, 0.07096481323242188, 0.081573486328125, 0.09218215942382812, 0.10279083251953125, 0.11339950561523438, 0.1240081787109375, 0.13461685180664062, 0.14522552490234375, 0.15583419799804688, 0.16644287109375, 0.17705154418945312, 0.18766021728515625, 0.19826889038085938, 0.2088775634765625, 0.21948623657226562, 0.23009490966796875, 0.24070358276367188, 0.251312255859375, 0.2619209289550781, 0.27252960205078125, 0.2831382751464844, 0.2937469482421875, 0.3043556213378906, 0.31496429443359375, 0.3255729675292969, 0.336181640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 3.0, 8.0, 9.0, 8.0, 5.0, 15.0, 21.0, 21.0, 20.0, 33.0, 47.0, 55.0, 50.0, 70.0, 66.0, 71.0, 70.0, 55.0, 62.0, 56.0, 47.0, 30.0, 29.0, 30.0, 22.0, 16.0, 13.0, 10.0, 12.0, 7.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0169219970703125, -0.016411781311035156, -0.015901565551757812, -0.015391349792480469, -0.014881134033203125, -0.014370918273925781, -0.013860702514648438, -0.013350486755371094, -0.01284027099609375, -0.012330055236816406, -0.011819839477539062, -0.011309623718261719, -0.010799407958984375, -0.010289192199707031, -0.009778976440429688, -0.009268760681152344, -0.008758544921875, -0.008248329162597656, -0.0077381134033203125, -0.007227897644042969, -0.006717681884765625, -0.006207466125488281, -0.0056972503662109375, -0.005187034606933594, -0.00467681884765625, -0.004166603088378906, -0.0036563873291015625, -0.0031461715698242188, -0.002635955810546875, -0.0021257400512695312, -0.0016155242919921875, -0.0011053085327148438, -0.0005950927734375, -8.487701416015625e-05, 0.0004253387451171875, 0.0009355545043945312, 0.001445770263671875, 0.0019559860229492188, 0.0024662017822265625, 0.0029764175415039062, 0.00348663330078125, 0.003996849060058594, 0.0045070648193359375, 0.005017280578613281, 0.005527496337890625, 0.006037712097167969, 0.0065479278564453125, 0.007058143615722656, 0.007568359375, 0.008078575134277344, 0.008588790893554688, 0.009099006652832031, 0.009609222412109375, 0.010119438171386719, 0.010629653930664062, 0.011139869689941406, 0.01165008544921875, 0.012160301208496094, 0.012670516967773438, 0.013180732727050781, 0.013690948486328125, 0.014201164245605469, 0.014711380004882812, 0.015221595764160156, 0.0157318115234375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 18.0, 21.0, 31.0, 26.0, 43.0, 50.0, 90.0, 133.0, 259.0, 735.0, 37156.0, 1002606.0, 6139.0, 531.0, 216.0, 125.0, 87.0, 67.0, 43.0, 33.0, 17.0, 19.0, 11.0, 8.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.324951171875, -0.3145866394042969, -0.30422210693359375, -0.2938575744628906, -0.2834930419921875, -0.2731285095214844, -0.26276397705078125, -0.2523994445800781, -0.242034912109375, -0.23167037963867188, -0.22130584716796875, -0.21094131469726562, -0.2005767822265625, -0.19021224975585938, -0.17984771728515625, -0.16948318481445312, -0.15911865234375, -0.14875411987304688, -0.13838958740234375, -0.12802505493164062, -0.1176605224609375, -0.10729598999023438, -0.09693145751953125, -0.08656692504882812, -0.076202392578125, -0.06583786010742188, -0.05547332763671875, -0.045108795166015625, -0.0347442626953125, -0.024379730224609375, -0.01401519775390625, -0.003650665283203125, 0.0067138671875, 0.017078399658203125, 0.02744293212890625, 0.037807464599609375, 0.0481719970703125, 0.058536529541015625, 0.06890106201171875, 0.07926559448242188, 0.089630126953125, 0.09999465942382812, 0.11035919189453125, 0.12072372436523438, 0.1310882568359375, 0.14145278930664062, 0.15181732177734375, 0.16218185424804688, 0.17254638671875, 0.18291091918945312, 0.19327545166015625, 0.20363998413085938, 0.2140045166015625, 0.22436904907226562, 0.23473358154296875, 0.24509811401367188, 0.255462646484375, 0.2658271789550781, 0.27619171142578125, 0.2865562438964844, 0.2969207763671875, 0.3072853088378906, 0.31764984130859375, 0.3280143737792969, 0.33837890625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 59.0, 746.0, 204.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3873315155506134, -0.3799889087677002, -0.372646301984787, -0.3653036952018738, -0.35796108841896057, -0.35061848163604736, -0.34327584505081177, -0.33593323826789856, -0.32859063148498535, -0.32124802470207214, -0.31390541791915894, -0.3065628111362457, -0.2992202043533325, -0.2918775677680969, -0.2845349609851837, -0.2771923542022705, -0.2698497474193573, -0.2625071406364441, -0.2551645338535309, -0.24782191216945648, -0.24047930538654327, -0.23313669860363007, -0.22579409182071686, -0.21845147013664246, -0.21110887825489044, -0.20376627147197723, -0.19642366468906403, -0.18908104300498962, -0.18173843622207642, -0.1743958294391632, -0.16705322265625, -0.1597106158733368, -0.1523679941892624, -0.14502538740634918, -0.13768278062343597, -0.13034015893936157, -0.12299755215644836, -0.11565494537353516, -0.10831233859062195, -0.10096972435712814, -0.09362711012363434, -0.08628450334072113, -0.07894188910722733, -0.07159928232431412, -0.06425666809082031, -0.056914061307907104, -0.0495714507997036, -0.04222884029150009, -0.034886233508586884, -0.027543623000383377, -0.02020101249217987, -0.012858403846621513, -0.005515793338418007, 0.0018268153071403503, 0.009169425815343857, 0.016512036323547363, 0.02385464683175087, 0.031197257339954376, 0.03853986784815788, 0.04588247835636139, 0.0532250851392746, 0.060567695647478104, 0.06791030615568161, 0.07525292038917542, 0.08259552717208862]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 7.0, 1.0, 4.0, 7.0, 8.0, 9.0, 9.0, 8.0, 12.0, 13.0, 12.0, 15.0, 16.0, 19.0, 18.0, 17.0, 22.0, 31.0, 32.0, 21.0, 30.0, 43.0, 31.0, 40.0, 39.0, 49.0, 37.0, 39.0, 47.0, 27.0, 43.0, 28.0, 31.0, 25.0, 30.0, 19.0, 23.0, 24.0, 24.0, 17.0, 16.0, 12.0, 13.0, 9.0, 7.0, 2.0, 3.0, 7.0, 1.0, 1.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.020894289016723633, -0.020195595920085907, -0.01949690468609333, -0.018798213452100754, -0.018099520355463028, -0.017400827258825302, -0.016702136024832726, -0.01600344479084015, -0.015304751694202423, -0.014606059528887272, -0.01390736736357212, -0.01320867519825697, -0.012509983032941818, -0.011811290867626667, -0.011112598702311516, -0.010413906536996365, -0.009715214371681213, -0.009016522206366062, -0.008317830041050911, -0.00761913787573576, -0.0069204457104206085, -0.006221753545105457, -0.005523061379790306, -0.004824369214475155, -0.004125677049160004, -0.0034269848838448524, -0.0027282927185297012, -0.00202960055321455, -0.0013309083878993988, -0.0006322162225842476, 6.647594273090363e-05, 0.0007651681080460548, 0.001463860273361206, 0.0021625524386763573, 0.0028612446039915085, 0.0035599367693066597, 0.004258628934621811, 0.004957321099936962, 0.005656013265252113, 0.0063547054305672646, 0.007053397595882416, 0.007752089761197567, 0.008450781926512718, 0.00914947409182787, 0.00984816625714302, 0.010546858422458172, 0.011245550587773323, 0.011944242753088474, 0.012642934918403625, 0.013341627083718777, 0.014040319249033928, 0.014739011414349079, 0.01543770357966423, 0.016136396676301956, 0.016835087910294533, 0.01753377914428711, 0.018232472240924835, 0.01893116533756256, 0.019629856571555138, 0.020328547805547714, 0.02102724090218544, 0.021725933998823166, 0.022424625232815742, 0.02312331646680832, 0.023822009563446045]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 10.0, 6.0, 18.0, 13.0, 13.0, 17.0, 23.0, 30.0, 21.0, 25.0, 37.0, 37.0, 40.0, 37.0, 42.0, 37.0, 40.0, 42.0, 38.0, 48.0, 39.0, 32.0, 44.0, 33.0, 30.0, 21.0, 30.0, 22.0, 26.0, 27.0, 17.0, 14.0, 14.0, 7.0, 15.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8564453125, -1.79962158203125, -1.7427978515625, -1.68597412109375, -1.629150390625, -1.57232666015625, -1.5155029296875, -1.45867919921875, -1.40185546875, -1.34503173828125, -1.2882080078125, -1.23138427734375, -1.174560546875, -1.11773681640625, -1.0609130859375, -1.00408935546875, -0.947265625, -0.89044189453125, -0.8336181640625, -0.77679443359375, -0.719970703125, -0.66314697265625, -0.6063232421875, -0.54949951171875, -0.49267578125, -0.43585205078125, -0.3790283203125, -0.32220458984375, -0.265380859375, -0.20855712890625, -0.1517333984375, -0.09490966796875, -0.0380859375, 0.01873779296875, 0.0755615234375, 0.13238525390625, 0.189208984375, 0.24603271484375, 0.3028564453125, 0.35968017578125, 0.41650390625, 0.47332763671875, 0.5301513671875, 0.58697509765625, 0.643798828125, 0.70062255859375, 0.7574462890625, 0.81427001953125, 0.87109375, 0.92791748046875, 0.9847412109375, 1.04156494140625, 1.098388671875, 1.15521240234375, 1.2120361328125, 1.26885986328125, 1.32568359375, 1.38250732421875, 1.4393310546875, 1.49615478515625, 1.552978515625, 1.60980224609375, 1.6666259765625, 1.72344970703125, 1.7802734375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 1.0, 2.0, 4.0, 10.0, 12.0, 16.0, 18.0, 34.0, 36.0, 48.0, 91.0, 150.0, 245.0, 336.0, 541.0, 839.0, 1428.0, 2387.0, 4242.0, 8132.0, 16915.0, 40503.0, 113128.0, 374762.0, 319389.0, 97388.0, 35902.0, 15165.0, 7142.0, 3847.0, 2235.0, 1289.0, 836.0, 500.0, 321.0, 194.0, 160.0, 100.0, 60.0, 42.0, 31.0, 17.0, 11.0, 16.0, 10.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0], "bins": [-3.142578125, -3.047149658203125, -2.95172119140625, -2.856292724609375, -2.7608642578125, -2.665435791015625, -2.57000732421875, -2.474578857421875, -2.379150390625, -2.283721923828125, -2.18829345703125, -2.092864990234375, -1.9974365234375, -1.902008056640625, -1.80657958984375, -1.711151123046875, -1.61572265625, -1.520294189453125, -1.42486572265625, -1.329437255859375, -1.2340087890625, -1.138580322265625, -1.04315185546875, -0.947723388671875, -0.852294921875, -0.756866455078125, -0.66143798828125, -0.566009521484375, -0.4705810546875, -0.375152587890625, -0.27972412109375, -0.184295654296875, -0.0888671875, 0.006561279296875, 0.10198974609375, 0.197418212890625, 0.2928466796875, 0.388275146484375, 0.48370361328125, 0.579132080078125, 0.674560546875, 0.769989013671875, 0.86541748046875, 0.960845947265625, 1.0562744140625, 1.151702880859375, 1.24713134765625, 1.342559814453125, 1.43798828125, 1.533416748046875, 1.62884521484375, 1.724273681640625, 1.8197021484375, 1.915130615234375, 2.01055908203125, 2.105987548828125, 2.201416015625, 2.296844482421875, 2.39227294921875, 2.487701416015625, 2.5831298828125, 2.678558349609375, 2.77398681640625, 2.869415283203125, 2.96484375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 6.0, 9.0, 2.0, 11.0, 6.0, 14.0, 8.0, 18.0, 12.0, 20.0, 24.0, 24.0, 25.0, 33.0, 35.0, 46.0, 55.0, 78.0, 191.0, 1421.0, 335.0, 169.0, 107.0, 49.0, 53.0, 44.0, 46.0, 34.0, 32.0, 31.0, 13.0, 16.0, 18.0, 15.0, 6.0, 9.0, 7.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9453125, -5.76495361328125, -5.5845947265625, -5.40423583984375, -5.223876953125, -5.04351806640625, -4.8631591796875, -4.68280029296875, -4.50244140625, -4.32208251953125, -4.1417236328125, -3.96136474609375, -3.781005859375, -3.60064697265625, -3.4202880859375, -3.23992919921875, -3.0595703125, -2.87921142578125, -2.6988525390625, -2.51849365234375, -2.338134765625, -2.15777587890625, -1.9774169921875, -1.79705810546875, -1.61669921875, -1.43634033203125, -1.2559814453125, -1.07562255859375, -0.895263671875, -0.71490478515625, -0.5345458984375, -0.35418701171875, -0.173828125, 0.00653076171875, 0.1868896484375, 0.36724853515625, 0.547607421875, 0.72796630859375, 0.9083251953125, 1.08868408203125, 1.26904296875, 1.44940185546875, 1.6297607421875, 1.81011962890625, 1.990478515625, 2.17083740234375, 2.3511962890625, 2.53155517578125, 2.7119140625, 2.89227294921875, 3.0726318359375, 3.25299072265625, 3.433349609375, 3.61370849609375, 3.7940673828125, 3.97442626953125, 4.15478515625, 4.33514404296875, 4.5155029296875, 4.69586181640625, 4.876220703125, 5.05657958984375, 5.2369384765625, 5.41729736328125, 5.59765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 8.0, 5.0, 7.0, 7.0, 9.0, 9.0, 24.0, 24.0, 16.0, 35.0, 29.0, 38.0, 79.0, 104.0, 160.0, 326.0, 998.0, 4757.0, 43159.0, 2602053.0, 475128.0, 15300.0, 2248.0, 545.0, 203.0, 114.0, 80.0, 45.0, 53.0, 22.0, 23.0, 26.0, 12.0, 16.0, 9.0, 6.0, 7.0, 9.0, 6.0, 7.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8515625, -9.5316162109375, -9.211669921875, -8.8917236328125, -8.57177734375, -8.2518310546875, -7.931884765625, -7.6119384765625, -7.2919921875, -6.9720458984375, -6.652099609375, -6.3321533203125, -6.01220703125, -5.6922607421875, -5.372314453125, -5.0523681640625, -4.732421875, -4.4124755859375, -4.092529296875, -3.7725830078125, -3.45263671875, -3.1326904296875, -2.812744140625, -2.4927978515625, -2.1728515625, -1.8529052734375, -1.532958984375, -1.2130126953125, -0.89306640625, -0.5731201171875, -0.253173828125, 0.0667724609375, 0.38671875, 0.7066650390625, 1.026611328125, 1.3465576171875, 1.66650390625, 1.9864501953125, 2.306396484375, 2.6263427734375, 2.9462890625, 3.2662353515625, 3.586181640625, 3.9061279296875, 4.22607421875, 4.5460205078125, 4.865966796875, 5.1859130859375, 5.505859375, 5.8258056640625, 6.145751953125, 6.4656982421875, 6.78564453125, 7.1055908203125, 7.425537109375, 7.7454833984375, 8.0654296875, 8.3853759765625, 8.705322265625, 9.0252685546875, 9.34521484375, 9.6651611328125, 9.985107421875, 10.3050537109375, 10.625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 96.0, 369.0, 416.0, 113.0, 13.0], "bins": [-75.31529235839844, -74.08158874511719, -72.84788513183594, -71.61418151855469, -70.38047790527344, -69.14677429199219, -67.91307067871094, -66.67936706542969, -65.44567108154297, -64.21196746826172, -62.97826385498047, -61.74456024169922, -60.510860443115234, -59.277156829833984, -58.043453216552734, -56.809749603271484, -55.57604217529297, -54.34233856201172, -53.10863494873047, -51.87493133544922, -50.641231536865234, -49.407527923583984, -48.173824310302734, -46.940120697021484, -45.7064208984375, -44.47271728515625, -43.239013671875, -42.00531005859375, -40.771610260009766, -39.537906646728516, -38.304203033447266, -37.070499420166016, -35.8367919921875, -34.60308837890625, -33.369384765625, -32.13568115234375, -30.901979446411133, -29.668277740478516, -28.434574127197266, -27.200870513916016, -25.9671688079834, -24.73346519470215, -23.49976348876953, -22.26605987548828, -21.03235626220703, -19.79865264892578, -18.564950942993164, -17.331247329711914, -16.097545623779297, -14.863842964172363, -13.630139350891113, -12.39643669128418, -11.16273307800293, -9.929030418395996, -8.695327758789062, -7.4616241455078125, -6.227921485900879, -4.994218349456787, -3.7605154514312744, -2.5268125534057617, -1.29310941696167, -0.059406280517578125, 1.1742963790893555, 2.4079999923706055, 3.641702890396118]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 8.0, 6.0, 12.0, 5.0, 11.0, 12.0, 17.0, 19.0, 12.0, 17.0, 25.0, 33.0, 34.0, 32.0, 35.0, 33.0, 27.0, 29.0, 35.0, 40.0, 45.0, 35.0, 38.0, 43.0, 35.0, 24.0, 32.0, 31.0, 39.0, 31.0, 30.0, 29.0, 17.0, 21.0, 15.0, 6.0, 12.0, 11.0, 6.0, 12.0, 4.0, 9.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.173398971557617, -11.778363227844238, -11.383328437805176, -10.988292694091797, -10.593257904052734, -10.198222160339355, -9.803187370300293, -9.408151626586914, -9.013116836547852, -8.618081092834473, -8.22304630279541, -7.8280110359191895, -7.432975769042969, -7.037940502166748, -6.642905235290527, -6.247869491577148, -5.852834224700928, -5.457798957824707, -5.062763690948486, -4.667728424072266, -4.272693157196045, -3.877657890319824, -3.4826223850250244, -3.0875871181488037, -2.692551851272583, -2.2975165843963623, -1.9024813175201416, -1.5074459314346313, -1.1124106645584106, -0.7173753976821899, -0.3223400115966797, 0.07269525527954102, 0.4677305221557617, 0.8627657890319824, 1.2578010559082031, 1.6528364419937134, 2.0478715896606445, 2.4429068565368652, 2.837942361831665, 3.2329776287078857, 3.6280128955841064, 4.023048400878906, 4.418083667755127, 4.813118934631348, 5.208154201507568, 5.603189468383789, 5.99822473526001, 6.3932600021362305, 6.788295269012451, 7.183330535888672, 7.578365802764893, 7.973401069641113, 8.368436813354492, 8.763471603393555, 9.158507347106934, 9.553542137145996, 9.948577880859375, 10.343613624572754, 10.738648414611816, 11.133684158325195, 11.528718948364258, 11.923754692077637, 12.3187894821167, 12.713825225830078, 13.10886001586914]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 8.0, 7.0, 6.0, 13.0, 10.0, 12.0, 21.0, 21.0, 21.0, 19.0, 15.0, 29.0, 28.0, 34.0, 37.0, 40.0, 44.0, 52.0, 33.0, 44.0, 41.0, 43.0, 40.0, 39.0, 23.0, 32.0, 34.0, 40.0, 29.0, 24.0, 21.0, 19.0, 28.0, 18.0, 12.0, 9.0, 11.0, 8.0, 7.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.958984375, -1.8996429443359375, -1.840301513671875, -1.7809600830078125, -1.72161865234375, -1.6622772216796875, -1.602935791015625, -1.5435943603515625, -1.4842529296875, -1.4249114990234375, -1.365570068359375, -1.3062286376953125, -1.24688720703125, -1.1875457763671875, -1.128204345703125, -1.0688629150390625, -1.009521484375, -0.9501800537109375, -0.890838623046875, -0.8314971923828125, -0.77215576171875, -0.7128143310546875, -0.653472900390625, -0.5941314697265625, -0.5347900390625, -0.4754486083984375, -0.416107177734375, -0.3567657470703125, -0.29742431640625, -0.2380828857421875, -0.178741455078125, -0.1194000244140625, -0.06005859375, -0.0007171630859375, 0.058624267578125, 0.1179656982421875, 0.17730712890625, 0.2366485595703125, 0.295989990234375, 0.3553314208984375, 0.4146728515625, 0.4740142822265625, 0.533355712890625, 0.5926971435546875, 0.65203857421875, 0.7113800048828125, 0.770721435546875, 0.8300628662109375, 0.889404296875, 0.9487457275390625, 1.008087158203125, 1.0674285888671875, 1.12677001953125, 1.1861114501953125, 1.245452880859375, 1.3047943115234375, 1.3641357421875, 1.4234771728515625, 1.482818603515625, 1.5421600341796875, 1.60150146484375, 1.6608428955078125, 1.720184326171875, 1.7795257568359375, 1.8388671875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 11.0, 15.0, 15.0, 39.0, 56.0, 58.0, 94.0, 163.0, 212.0, 351.0, 585.0, 841.0, 1471.0, 2355.0, 4144.0, 7560.0, 15044.0, 33437.0, 90572.0, 361233.0, 1779074.0, 1475718.0, 286904.0, 75741.0, 28789.0, 13301.0, 6711.0, 3677.0, 2216.0, 1351.0, 820.0, 571.0, 369.0, 234.0, 166.0, 107.0, 92.0, 58.0, 36.0, 30.0, 24.0, 9.0, 7.0, 13.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.078125, -2.9678955078125, -2.857666015625, -2.7474365234375, -2.63720703125, -2.5269775390625, -2.416748046875, -2.3065185546875, -2.1962890625, -2.0860595703125, -1.975830078125, -1.8656005859375, -1.75537109375, -1.6451416015625, -1.534912109375, -1.4246826171875, -1.314453125, -1.2042236328125, -1.093994140625, -0.9837646484375, -0.87353515625, -0.7633056640625, -0.653076171875, -0.5428466796875, -0.4326171875, -0.3223876953125, -0.212158203125, -0.1019287109375, 0.00830078125, 0.1185302734375, 0.228759765625, 0.3389892578125, 0.44921875, 0.5594482421875, 0.669677734375, 0.7799072265625, 0.89013671875, 1.0003662109375, 1.110595703125, 1.2208251953125, 1.3310546875, 1.4412841796875, 1.551513671875, 1.6617431640625, 1.77197265625, 1.8822021484375, 1.992431640625, 2.1026611328125, 2.212890625, 2.3231201171875, 2.433349609375, 2.5435791015625, 2.65380859375, 2.7640380859375, 2.874267578125, 2.9844970703125, 3.0947265625, 3.2049560546875, 3.315185546875, 3.4254150390625, 3.53564453125, 3.6458740234375, 3.756103515625, 3.8663330078125, 3.9765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 9.0, 10.0, 10.0, 10.0, 24.0, 27.0, 32.0, 44.0, 47.0, 66.0, 89.0, 93.0, 144.0, 229.0, 290.0, 394.0, 463.0, 471.0, 405.0, 293.0, 228.0, 180.0, 119.0, 104.0, 59.0, 38.0, 36.0, 27.0, 28.0, 22.0, 17.0, 17.0, 7.0, 11.0, 9.0, 1.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.12890625, -3.03466796875, -2.9404296875, -2.84619140625, -2.751953125, -2.65771484375, -2.5634765625, -2.46923828125, -2.375, -2.28076171875, -2.1865234375, -2.09228515625, -1.998046875, -1.90380859375, -1.8095703125, -1.71533203125, -1.62109375, -1.52685546875, -1.4326171875, -1.33837890625, -1.244140625, -1.14990234375, -1.0556640625, -0.96142578125, -0.8671875, -0.77294921875, -0.6787109375, -0.58447265625, -0.490234375, -0.39599609375, -0.3017578125, -0.20751953125, -0.11328125, -0.01904296875, 0.0751953125, 0.16943359375, 0.263671875, 0.35791015625, 0.4521484375, 0.54638671875, 0.640625, 0.73486328125, 0.8291015625, 0.92333984375, 1.017578125, 1.11181640625, 1.2060546875, 1.30029296875, 1.39453125, 1.48876953125, 1.5830078125, 1.67724609375, 1.771484375, 1.86572265625, 1.9599609375, 2.05419921875, 2.1484375, 2.24267578125, 2.3369140625, 2.43115234375, 2.525390625, 2.61962890625, 2.7138671875, 2.80810546875, 2.90234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 14.0, 6.0, 17.0, 23.0, 31.0, 21.0, 42.0, 53.0, 88.0, 186.0, 358.0, 786.0, 1985.0, 5630.0, 19174.0, 84461.0, 685129.0, 3006499.0, 318389.0, 51639.0, 13031.0, 3966.0, 1425.0, 564.0, 278.0, 163.0, 111.0, 70.0, 30.0, 30.0, 20.0, 18.0, 13.0, 5.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.510009765625, -7.27783203125, -7.045654296875, -6.8134765625, -6.581298828125, -6.34912109375, -6.116943359375, -5.884765625, -5.652587890625, -5.42041015625, -5.188232421875, -4.9560546875, -4.723876953125, -4.49169921875, -4.259521484375, -4.02734375, -3.795166015625, -3.56298828125, -3.330810546875, -3.0986328125, -2.866455078125, -2.63427734375, -2.402099609375, -2.169921875, -1.937744140625, -1.70556640625, -1.473388671875, -1.2412109375, -1.009033203125, -0.77685546875, -0.544677734375, -0.3125, -0.080322265625, 0.15185546875, 0.384033203125, 0.6162109375, 0.848388671875, 1.08056640625, 1.312744140625, 1.544921875, 1.777099609375, 2.00927734375, 2.241455078125, 2.4736328125, 2.705810546875, 2.93798828125, 3.170166015625, 3.40234375, 3.634521484375, 3.86669921875, 4.098876953125, 4.3310546875, 4.563232421875, 4.79541015625, 5.027587890625, 5.259765625, 5.491943359375, 5.72412109375, 5.956298828125, 6.1884765625, 6.420654296875, 6.65283203125, 6.885009765625, 7.1171875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 16.0, 127.0, 528.0, 295.0, 48.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.980958938598633, -12.382728576660156, -9.784497261047363, -7.1862664222717285, -4.588035583496094, -1.9898052215576172, 0.6084260940551758, 3.2066574096679688, 5.804887771606445, 8.403118133544922, 11.001349449157715, 13.599580764770508, 16.197811126708984, 18.79604148864746, 21.394271850585938, 23.992504119873047, 26.590734481811523, 29.18896484375, 31.78719711303711, 34.38542556762695, 36.98365783691406, 39.581886291503906, 42.180118560791016, 44.778350830078125, 47.37657928466797, 49.97481155395508, 52.57304000854492, 55.17127227783203, 57.769500732421875, 60.367733001708984, 62.965965270996094, 65.56419372558594, 68.16242980957031, 70.76065826416016, 73.35889434814453, 75.95712280273438, 78.55535125732422, 81.15357971191406, 83.75181579589844, 86.35004425048828, 88.94827270507812, 91.54650115966797, 94.14473724365234, 96.74296569824219, 99.34119415283203, 101.93942260742188, 104.53765869140625, 107.1358871459961, 109.73412322998047, 112.33235168457031, 114.93058776855469, 117.52881622314453, 120.12704467773438, 122.72528076171875, 125.3235092163086, 127.92173767089844, 130.5199737548828, 133.1182098388672, 135.7164306640625, 138.31466674804688, 140.91290283203125, 143.51112365722656, 146.10935974121094, 148.7075958251953, 151.30581665039062]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 8.0, 6.0, 4.0, 10.0, 17.0, 12.0, 11.0, 16.0, 22.0, 21.0, 28.0, 33.0, 23.0, 31.0, 36.0, 26.0, 34.0, 39.0, 32.0, 43.0, 29.0, 37.0, 35.0, 36.0, 40.0, 28.0, 31.0, 26.0, 37.0, 38.0, 28.0, 22.0, 22.0, 26.0, 14.0, 17.0, 13.0, 8.0, 9.0, 4.0, 6.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-9.001373291015625, -8.692272186279297, -8.383171081542969, -8.07406997680664, -7.7649688720703125, -7.455867767333984, -7.146766662597656, -6.837665557861328, -6.528564453125, -6.219463348388672, -5.910362243652344, -5.601261138916016, -5.2921600341796875, -4.983058929443359, -4.673957824707031, -4.364856719970703, -4.055755615234375, -3.746654510498047, -3.4375534057617188, -3.1284523010253906, -2.8193511962890625, -2.5102500915527344, -2.2011489868164062, -1.8920478820800781, -1.58294677734375, -1.2738456726074219, -0.9647445678710938, -0.6556434631347656, -0.3465423583984375, -0.037441253662109375, 0.27165985107421875, 0.5807609558105469, 0.8898630142211914, 1.1989641189575195, 1.5080652236938477, 1.8171663284301758, 2.126267433166504, 2.435368537902832, 2.74446964263916, 3.0535707473754883, 3.3626718521118164, 3.6717729568481445, 3.9808740615844727, 4.289975166320801, 4.599076271057129, 4.908177375793457, 5.217278480529785, 5.526379585266113, 5.835480690002441, 6.1445817947387695, 6.453682899475098, 6.762784004211426, 7.071885108947754, 7.380986213684082, 7.69008731842041, 7.999188423156738, 8.308289527893066, 8.617390632629395, 8.926491737365723, 9.23559284210205, 9.544693946838379, 9.853795051574707, 10.162896156311035, 10.471997261047363, 10.781098365783691]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 7.0, 8.0, 7.0, 10.0, 4.0, 19.0, 15.0, 20.0, 23.0, 37.0, 28.0, 25.0, 25.0, 30.0, 36.0, 41.0, 41.0, 41.0, 44.0, 56.0, 45.0, 34.0, 42.0, 32.0, 38.0, 35.0, 36.0, 26.0, 28.0, 29.0, 22.0, 20.0, 17.0, 12.0, 12.0, 7.0, 12.0, 8.0, 3.0, 5.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9951171875, -1.9335784912109375, -1.872039794921875, -1.8105010986328125, -1.74896240234375, -1.6874237060546875, -1.625885009765625, -1.5643463134765625, -1.5028076171875, -1.4412689208984375, -1.379730224609375, -1.3181915283203125, -1.25665283203125, -1.1951141357421875, -1.133575439453125, -1.0720367431640625, -1.010498046875, -0.9489593505859375, -0.887420654296875, -0.8258819580078125, -0.76434326171875, -0.7028045654296875, -0.641265869140625, -0.5797271728515625, -0.5181884765625, -0.4566497802734375, -0.395111083984375, -0.3335723876953125, -0.27203369140625, -0.2104949951171875, -0.148956298828125, -0.0874176025390625, -0.02587890625, 0.0356597900390625, 0.097198486328125, 0.1587371826171875, 0.22027587890625, 0.2818145751953125, 0.343353271484375, 0.4048919677734375, 0.4664306640625, 0.5279693603515625, 0.589508056640625, 0.6510467529296875, 0.71258544921875, 0.7741241455078125, 0.835662841796875, 0.8972015380859375, 0.958740234375, 1.0202789306640625, 1.081817626953125, 1.1433563232421875, 1.20489501953125, 1.2664337158203125, 1.327972412109375, 1.3895111083984375, 1.4510498046875, 1.5125885009765625, 1.574127197265625, 1.6356658935546875, 1.69720458984375, 1.7587432861328125, 1.820281982421875, 1.8818206787109375, 1.943359375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 16.0, 27.0, 43.0, 58.0, 89.0, 134.0, 182.0, 262.0, 385.0, 577.0, 828.0, 1355.0, 2106.0, 3197.0, 4961.0, 7849.0, 12483.0, 20620.0, 34269.0, 59299.0, 106165.0, 178700.0, 221789.0, 164535.0, 94298.0, 53223.0, 30692.0, 18630.0, 11393.0, 7203.0, 4532.0, 2926.0, 1883.0, 1270.0, 878.0, 577.0, 350.0, 261.0, 161.0, 111.0, 72.0, 47.0, 27.0, 29.0, 17.0, 11.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1649169921875, -0.15949249267578125, -0.1540679931640625, -0.14864349365234375, -0.143218994140625, -0.13779449462890625, -0.1323699951171875, -0.12694549560546875, -0.12152099609375, -0.11609649658203125, -0.1106719970703125, -0.10524749755859375, -0.099822998046875, -0.09439849853515625, -0.0889739990234375, -0.08354949951171875, -0.078125, -0.07270050048828125, -0.0672760009765625, -0.06185150146484375, -0.056427001953125, -0.05100250244140625, -0.0455780029296875, -0.04015350341796875, -0.03472900390625, -0.02930450439453125, -0.0238800048828125, -0.01845550537109375, -0.013031005859375, -0.00760650634765625, -0.0021820068359375, 0.00324249267578125, 0.0086669921875, 0.01409149169921875, 0.0195159912109375, 0.02494049072265625, 0.030364990234375, 0.03578948974609375, 0.0412139892578125, 0.04663848876953125, 0.05206298828125, 0.05748748779296875, 0.0629119873046875, 0.06833648681640625, 0.073760986328125, 0.07918548583984375, 0.0846099853515625, 0.09003448486328125, 0.095458984375, 0.10088348388671875, 0.1063079833984375, 0.11173248291015625, 0.117156982421875, 0.12258148193359375, 0.1280059814453125, 0.13343048095703125, 0.13885498046875, 0.14427947998046875, 0.1497039794921875, 0.15512847900390625, 0.160552978515625, 0.16597747802734375, 0.1714019775390625, 0.17682647705078125, 0.1822509765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 6.0, 2.0, 8.0, 7.0, 14.0, 11.0, 12.0, 14.0, 21.0, 22.0, 21.0, 28.0, 37.0, 27.0, 37.0, 34.0, 38.0, 44.0, 45.0, 1075.0, 34.0, 41.0, 38.0, 46.0, 36.0, 45.0, 31.0, 23.0, 32.0, 32.0, 25.0, 18.0, 18.0, 18.0, 13.0, 14.0, 8.0, 12.0, 6.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.373046875, -1.329925537109375, -1.28680419921875, -1.243682861328125, -1.2005615234375, -1.157440185546875, -1.11431884765625, -1.071197509765625, -1.028076171875, -0.984954833984375, -0.94183349609375, -0.898712158203125, -0.8555908203125, -0.812469482421875, -0.76934814453125, -0.726226806640625, -0.68310546875, -0.639984130859375, -0.59686279296875, -0.553741455078125, -0.5106201171875, -0.467498779296875, -0.42437744140625, -0.381256103515625, -0.338134765625, -0.295013427734375, -0.25189208984375, -0.208770751953125, -0.1656494140625, -0.122528076171875, -0.07940673828125, -0.036285400390625, 0.0068359375, 0.049957275390625, 0.09307861328125, 0.136199951171875, 0.1793212890625, 0.222442626953125, 0.26556396484375, 0.308685302734375, 0.351806640625, 0.394927978515625, 0.43804931640625, 0.481170654296875, 0.5242919921875, 0.567413330078125, 0.61053466796875, 0.653656005859375, 0.69677734375, 0.739898681640625, 0.78302001953125, 0.826141357421875, 0.8692626953125, 0.912384033203125, 0.95550537109375, 0.998626708984375, 1.041748046875, 1.084869384765625, 1.12799072265625, 1.171112060546875, 1.2142333984375, 1.257354736328125, 1.30047607421875, 1.343597412109375, 1.38671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 8.0, 15.0, 15.0, 20.0, 34.0, 48.0, 68.0, 86.0, 156.0, 219.0, 375.0, 683.0, 1116.0, 2126.0, 4158.0, 8322.0, 18711.0, 61841.0, 1818702.0, 133318.0, 25571.0, 10550.0, 5029.0, 2533.0, 1356.0, 768.0, 446.0, 276.0, 177.0, 117.0, 74.0, 50.0, 46.0, 25.0, 18.0, 18.0, 11.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38916015625, -0.37686920166015625, -0.3645782470703125, -0.35228729248046875, -0.339996337890625, -0.32770538330078125, -0.3154144287109375, -0.30312347412109375, -0.29083251953125, -0.27854156494140625, -0.2662506103515625, -0.25395965576171875, -0.241668701171875, -0.22937774658203125, -0.2170867919921875, -0.20479583740234375, -0.1925048828125, -0.18021392822265625, -0.1679229736328125, -0.15563201904296875, -0.143341064453125, -0.13105010986328125, -0.1187591552734375, -0.10646820068359375, -0.09417724609375, -0.08188629150390625, -0.0695953369140625, -0.05730438232421875, -0.045013427734375, -0.03272247314453125, -0.0204315185546875, -0.00814056396484375, 0.004150390625, 0.01644134521484375, 0.0287322998046875, 0.04102325439453125, 0.053314208984375, 0.06560516357421875, 0.0778961181640625, 0.09018707275390625, 0.10247802734375, 0.11476898193359375, 0.1270599365234375, 0.13935089111328125, 0.151641845703125, 0.16393280029296875, 0.1762237548828125, 0.18851470947265625, 0.2008056640625, 0.21309661865234375, 0.2253875732421875, 0.23767852783203125, 0.249969482421875, 0.26226043701171875, 0.2745513916015625, 0.28684234619140625, 0.29913330078125, 0.31142425537109375, 0.3237152099609375, 0.33600616455078125, 0.348297119140625, 0.36058807373046875, 0.3728790283203125, 0.38516998291015625, 0.3974609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 0.0, 5.0, 6.0, 6.0, 9.0, 9.0, 8.0, 14.0, 16.0, 19.0, 16.0, 29.0, 36.0, 41.0, 42.0, 53.0, 67.0, 58.0, 72.0, 46.0, 64.0, 57.0, 51.0, 31.0, 43.0, 43.0, 29.0, 26.0, 17.0, 13.0, 11.0, 13.0, 9.0, 11.0, 3.0, 4.0, 8.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.012969970703125, -0.012548446655273438, -0.012126922607421875, -0.011705398559570312, -0.01128387451171875, -0.010862350463867188, -0.010440826416015625, -0.010019302368164062, -0.0095977783203125, -0.009176254272460938, -0.008754730224609375, -0.008333206176757812, -0.00791168212890625, -0.0074901580810546875, -0.007068634033203125, -0.0066471099853515625, -0.0062255859375, -0.0058040618896484375, -0.005382537841796875, -0.0049610137939453125, -0.00453948974609375, -0.0041179656982421875, -0.003696441650390625, -0.0032749176025390625, -0.0028533935546875, -0.0024318695068359375, -0.002010345458984375, -0.0015888214111328125, -0.00116729736328125, -0.0007457733154296875, -0.000324249267578125, 9.72747802734375e-05, 0.000518798828125, 0.0009403228759765625, 0.001361846923828125, 0.0017833709716796875, 0.00220489501953125, 0.0026264190673828125, 0.003047943115234375, 0.0034694671630859375, 0.0038909912109375, 0.0043125152587890625, 0.004734039306640625, 0.0051555633544921875, 0.00557708740234375, 0.0059986114501953125, 0.006420135498046875, 0.0068416595458984375, 0.00726318359375, 0.0076847076416015625, 0.008106231689453125, 0.008527755737304688, 0.00894927978515625, 0.009370803833007812, 0.009792327880859375, 0.010213851928710938, 0.0106353759765625, 0.011056900024414062, 0.011478424072265625, 0.011899948120117188, 0.01232147216796875, 0.012742996215820312, 0.013164520263671875, 0.013586044311523438, 0.014007568359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 9.0, 7.0, 15.0, 18.0, 24.0, 27.0, 44.0, 74.0, 58.0, 90.0, 156.0, 265.0, 596.0, 6229.0, 903795.0, 134746.0, 1352.0, 398.0, 186.0, 111.0, 64.0, 65.0, 40.0, 27.0, 29.0, 22.0, 20.0, 12.0, 11.0, 6.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265625, -0.2575187683105469, -0.24941253662109375, -0.24130630493164062, -0.2332000732421875, -0.22509384155273438, -0.21698760986328125, -0.20888137817382812, -0.200775146484375, -0.19266891479492188, -0.18456268310546875, -0.17645645141601562, -0.1683502197265625, -0.16024398803710938, -0.15213775634765625, -0.14403152465820312, -0.13592529296875, -0.12781906127929688, -0.11971282958984375, -0.11160659790039062, -0.1035003662109375, -0.09539413452148438, -0.08728790283203125, -0.07918167114257812, -0.071075439453125, -0.06296920776367188, -0.05486297607421875, -0.046756744384765625, -0.0386505126953125, -0.030544281005859375, -0.02243804931640625, -0.014331817626953125, -0.0062255859375, 0.001880645751953125, 0.00998687744140625, 0.018093109130859375, 0.0261993408203125, 0.034305572509765625, 0.04241180419921875, 0.050518035888671875, 0.058624267578125, 0.06673049926757812, 0.07483673095703125, 0.08294296264648438, 0.0910491943359375, 0.09915542602539062, 0.10726165771484375, 0.11536788940429688, 0.12347412109375, 0.13158035278320312, 0.13968658447265625, 0.14779281616210938, 0.1558990478515625, 0.16400527954101562, 0.17211151123046875, 0.18021774291992188, 0.188323974609375, 0.19643020629882812, 0.20453643798828125, 0.21264266967773438, 0.2207489013671875, 0.22885513305664062, 0.23696136474609375, 0.24506759643554688, 0.253173828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 14.0, 87.0, 619.0, 276.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24704067409038544, -0.24244318902492523, -0.23784571886062622, -0.23324823379516602, -0.228650763630867, -0.2240532785654068, -0.2194558084011078, -0.21485832333564758, -0.21026083827018738, -0.20566335320472717, -0.20106588304042816, -0.19646839797496796, -0.19187092781066895, -0.18727344274520874, -0.18267597258090973, -0.17807848751544952, -0.1734810173511505, -0.1688835322856903, -0.1642860621213913, -0.1596885770559311, -0.15509110689163208, -0.15049362182617188, -0.14589615166187286, -0.14129866659641266, -0.13670119643211365, -0.13210371136665344, -0.12750624120235443, -0.12290876358747482, -0.11831128597259521, -0.11371380090713501, -0.1091163232922554, -0.1045188456773758, -0.09992136061191559, -0.09532388299703598, -0.09072640538215637, -0.08612892776727676, -0.08153145015239716, -0.07693396508693695, -0.07233648747205734, -0.06773900985717773, -0.06314152479171753, -0.05854404717683792, -0.05394656956195831, -0.049349088221788406, -0.0447516106069088, -0.04015413299202919, -0.03555665165185928, -0.030959174036979675, -0.026361700147390366, -0.021764222532510757, -0.017166743054986, -0.012569264508783817, -0.007971785962581635, -0.0033743083477020264, 0.001223171129822731, 0.005820650607347488, 0.010418128222227097, 0.01501560676842928, 0.019613085314631462, 0.02421056479215622, 0.028808042407035828, 0.033405520021915436, 0.038002997636795044, 0.04260047897696495, 0.04719795659184456]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 16.0, 13.0, 18.0, 31.0, 27.0, 21.0, 34.0, 35.0, 41.0, 42.0, 46.0, 44.0, 49.0, 52.0, 45.0, 49.0, 34.0, 59.0, 36.0, 36.0, 37.0, 24.0, 32.0, 24.0, 22.0, 19.0, 14.0, 12.0, 14.0, 14.0, 9.0, 5.0, 10.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.022968649864196777, -0.02235008031129837, -0.021731510758399963, -0.021112941205501556, -0.02049437165260315, -0.019875802099704742, -0.019257232546806335, -0.01863866299390793, -0.01802009344100952, -0.017401523888111115, -0.016782954335212708, -0.0161643847823143, -0.015545815229415894, -0.014927245676517487, -0.01430867612361908, -0.013690106570720673, -0.013071537017822266, -0.012452967464923859, -0.011834397912025452, -0.011215828359127045, -0.010597258806228638, -0.00997868925333023, -0.009360119700431824, -0.008741550147533417, -0.00812298059463501, -0.007504411041736603, -0.006885841488838196, -0.006267271935939789, -0.005648702383041382, -0.005030132830142975, -0.004411563277244568, -0.003792993724346161, -0.003174424171447754, -0.002555854618549347, -0.00193728506565094, -0.001318715512752533, -0.000700145959854126, -8.1576406955719e-05, 0.000536993145942688, 0.001155562698841095, 0.001774132251739502, 0.002392701804637909, 0.003011271357536316, 0.003629840910434723, 0.00424841046333313, 0.004866980016231537, 0.005485549569129944, 0.006104119122028351, 0.006722688674926758, 0.007341258227825165, 0.007959827780723572, 0.008578397333621979, 0.009196966886520386, 0.009815536439418793, 0.0104341059923172, 0.011052675545215607, 0.011671245098114014, 0.01228981465101242, 0.012908384203910828, 0.013526953756809235, 0.014145523309707642, 0.014764092862606049, 0.015382662415504456, 0.016001231968402863, 0.01661980152130127]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 6.0, 8.0, 7.0, 10.0, 4.0, 18.0, 16.0, 20.0, 26.0, 34.0, 28.0, 25.0, 25.0, 31.0, 35.0, 43.0, 40.0, 40.0, 44.0, 57.0, 44.0, 36.0, 40.0, 34.0, 37.0, 35.0, 35.0, 26.0, 28.0, 29.0, 23.0, 19.0, 18.0, 12.0, 12.0, 8.0, 10.0, 9.0, 2.0, 5.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9951171875, -1.9335479736328125, -1.871978759765625, -1.8104095458984375, -1.74884033203125, -1.6872711181640625, -1.625701904296875, -1.5641326904296875, -1.5025634765625, -1.4409942626953125, -1.379425048828125, -1.3178558349609375, -1.25628662109375, -1.1947174072265625, -1.133148193359375, -1.0715789794921875, -1.010009765625, -0.9484405517578125, -0.886871337890625, -0.8253021240234375, -0.76373291015625, -0.7021636962890625, -0.640594482421875, -0.5790252685546875, -0.5174560546875, -0.4558868408203125, -0.394317626953125, -0.3327484130859375, -0.27117919921875, -0.2096099853515625, -0.148040771484375, -0.0864715576171875, -0.02490234375, 0.0366668701171875, 0.098236083984375, 0.1598052978515625, 0.22137451171875, 0.2829437255859375, 0.344512939453125, 0.4060821533203125, 0.4676513671875, 0.5292205810546875, 0.590789794921875, 0.6523590087890625, 0.71392822265625, 0.7754974365234375, 0.837066650390625, 0.8986358642578125, 0.960205078125, 1.0217742919921875, 1.083343505859375, 1.1449127197265625, 1.20648193359375, 1.2680511474609375, 1.329620361328125, 1.3911895751953125, 1.4527587890625, 1.5143280029296875, 1.575897216796875, 1.6374664306640625, 1.69903564453125, 1.7606048583984375, 1.822174072265625, 1.8837432861328125, 1.9453125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 6.0, 9.0, 14.0, 19.0, 15.0, 32.0, 36.0, 60.0, 71.0, 87.0, 120.0, 219.0, 372.0, 529.0, 898.0, 1566.0, 2561.0, 4506.0, 8127.0, 14942.0, 29833.0, 74288.0, 392495.0, 381663.0, 72466.0, 29576.0, 14840.0, 8090.0, 4529.0, 2574.0, 1516.0, 901.0, 529.0, 325.0, 217.0, 153.0, 96.0, 73.0, 43.0, 39.0, 30.0, 19.0, 13.0, 18.0, 7.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.869140625, -3.748199462890625, -3.62725830078125, -3.506317138671875, -3.3853759765625, -3.264434814453125, -3.14349365234375, -3.022552490234375, -2.901611328125, -2.780670166015625, -2.65972900390625, -2.538787841796875, -2.4178466796875, -2.296905517578125, -2.17596435546875, -2.055023193359375, -1.93408203125, -1.813140869140625, -1.69219970703125, -1.571258544921875, -1.4503173828125, -1.329376220703125, -1.20843505859375, -1.087493896484375, -0.966552734375, -0.845611572265625, -0.72467041015625, -0.603729248046875, -0.4827880859375, -0.361846923828125, -0.24090576171875, -0.119964599609375, 0.0009765625, 0.121917724609375, 0.24285888671875, 0.363800048828125, 0.4847412109375, 0.605682373046875, 0.72662353515625, 0.847564697265625, 0.968505859375, 1.089447021484375, 1.21038818359375, 1.331329345703125, 1.4522705078125, 1.573211669921875, 1.69415283203125, 1.815093994140625, 1.93603515625, 2.056976318359375, 2.17791748046875, 2.298858642578125, 2.4197998046875, 2.540740966796875, 2.66168212890625, 2.782623291015625, 2.903564453125, 3.024505615234375, 3.14544677734375, 3.266387939453125, 3.3873291015625, 3.508270263671875, 3.62921142578125, 3.750152587890625, 3.87109375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 14.0, 11.0, 14.0, 9.0, 25.0, 16.0, 24.0, 25.0, 42.0, 39.0, 29.0, 53.0, 50.0, 51.0, 80.0, 166.0, 1422.0, 369.0, 150.0, 82.0, 62.0, 44.0, 34.0, 37.0, 32.0, 31.0, 20.0, 22.0, 17.0, 14.0, 8.0, 10.0, 12.0, 2.0, 7.0, 5.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.39453125, -6.21685791015625, -6.0391845703125, -5.86151123046875, -5.683837890625, -5.50616455078125, -5.3284912109375, -5.15081787109375, -4.97314453125, -4.79547119140625, -4.6177978515625, -4.44012451171875, -4.262451171875, -4.08477783203125, -3.9071044921875, -3.72943115234375, -3.5517578125, -3.37408447265625, -3.1964111328125, -3.01873779296875, -2.841064453125, -2.66339111328125, -2.4857177734375, -2.30804443359375, -2.13037109375, -1.95269775390625, -1.7750244140625, -1.59735107421875, -1.419677734375, -1.24200439453125, -1.0643310546875, -0.88665771484375, -0.708984375, -0.53131103515625, -0.3536376953125, -0.17596435546875, 0.001708984375, 0.17938232421875, 0.3570556640625, 0.53472900390625, 0.71240234375, 0.89007568359375, 1.0677490234375, 1.24542236328125, 1.423095703125, 1.60076904296875, 1.7784423828125, 1.95611572265625, 2.1337890625, 2.31146240234375, 2.4891357421875, 2.66680908203125, 2.844482421875, 3.02215576171875, 3.1998291015625, 3.37750244140625, 3.55517578125, 3.73284912109375, 3.9105224609375, 4.08819580078125, 4.265869140625, 4.44354248046875, 4.6212158203125, 4.79888916015625, 4.9765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 5.0, 4.0, 8.0, 13.0, 7.0, 18.0, 19.0, 19.0, 35.0, 43.0, 64.0, 76.0, 88.0, 177.0, 333.0, 1091.0, 6190.0, 44368.0, 2563042.0, 503465.0, 21691.0, 3315.0, 736.0, 276.0, 181.0, 92.0, 78.0, 52.0, 41.0, 34.0, 28.0, 26.0, 21.0, 19.0, 12.0, 14.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.7774658203125, -8.437744140625, -8.0980224609375, -7.75830078125, -7.4185791015625, -7.078857421875, -6.7391357421875, -6.3994140625, -6.0596923828125, -5.719970703125, -5.3802490234375, -5.04052734375, -4.7008056640625, -4.361083984375, -4.0213623046875, -3.681640625, -3.3419189453125, -3.002197265625, -2.6624755859375, -2.32275390625, -1.9830322265625, -1.643310546875, -1.3035888671875, -0.9638671875, -0.6241455078125, -0.284423828125, 0.0552978515625, 0.39501953125, 0.7347412109375, 1.074462890625, 1.4141845703125, 1.75390625, 2.0936279296875, 2.433349609375, 2.7730712890625, 3.11279296875, 3.4525146484375, 3.792236328125, 4.1319580078125, 4.4716796875, 4.8114013671875, 5.151123046875, 5.4908447265625, 5.83056640625, 6.1702880859375, 6.510009765625, 6.8497314453125, 7.189453125, 7.5291748046875, 7.868896484375, 8.2086181640625, 8.54833984375, 8.8880615234375, 9.227783203125, 9.5675048828125, 9.9072265625, 10.2469482421875, 10.586669921875, 10.9263916015625, 11.26611328125, 11.6058349609375, 11.945556640625, 12.2852783203125, 12.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 25.0, 165.0, 420.0, 314.0, 77.0, 6.0, 3.0], "bins": [-65.53144073486328, -64.43355560302734, -63.33566665649414, -62.23777770996094, -61.139892578125, -60.0420036315918, -58.944114685058594, -57.846229553222656, -56.74834060668945, -55.65045166015625, -54.55256652832031, -53.45467758178711, -52.356788635253906, -51.25890350341797, -50.161014556884766, -49.06312942504883, -47.965240478515625, -46.86735153198242, -45.769466400146484, -44.67157745361328, -43.573692321777344, -42.47580337524414, -41.37791442871094, -40.280029296875, -39.1821403503418, -38.084251403808594, -36.986366271972656, -35.88847732543945, -34.79058837890625, -33.69270324707031, -32.59481430053711, -31.49692726135254, -30.39904022216797, -29.3011531829834, -28.203266143798828, -27.105377197265625, -26.007490158081055, -24.909603118896484, -23.81171417236328, -22.71382713317871, -21.61594009399414, -20.51805305480957, -19.420166015625, -18.322277069091797, -17.224390029907227, -16.126502990722656, -15.02861499786377, -13.930727005004883, -12.832840919494629, -11.734952926635742, -10.637065887451172, -9.539178848266602, -8.441290855407715, -7.343403339385986, -6.245515823364258, -5.147628307342529, -4.049740791320801, -2.9518532752990723, -1.8539657592773438, -0.7560782432556152, 0.3418092727661133, 1.4396967887878418, 2.5375843048095703, 3.635471820831299, 4.733359336853027]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 6.0, 11.0, 9.0, 13.0, 11.0, 15.0, 27.0, 28.0, 28.0, 31.0, 36.0, 34.0, 43.0, 52.0, 44.0, 45.0, 53.0, 46.0, 46.0, 29.0, 41.0, 33.0, 33.0, 48.0, 39.0, 30.0, 22.0, 33.0, 15.0, 14.0, 16.0, 11.0, 11.0, 16.0, 9.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.955085754394531, -15.45468521118164, -14.95428466796875, -14.45388412475586, -13.953482627868652, -13.453082084655762, -12.952681541442871, -12.45228099822998, -11.951879501342773, -11.451478958129883, -10.951078414916992, -10.450677871704102, -9.950276374816895, -9.449875831604004, -8.949475288391113, -8.449074745178223, -7.948674201965332, -7.448273658752441, -6.947872638702393, -6.447472095489502, -5.947071075439453, -5.4466705322265625, -4.946269989013672, -4.445869445800781, -3.9454684257507324, -3.4450676441192627, -2.944666862487793, -2.4442663192749023, -1.9438655376434326, -1.443464756011963, -0.9430642127990723, -0.44266343116760254, 0.05773735046386719, 0.5581380724906921, 1.058538794517517, 1.5589394569396973, 2.059340238571167, 2.5597410202026367, 3.0601415634155273, 3.560542345046997, 4.060943126678467, 4.561343669891357, 5.061744689941406, 5.562145233154297, 6.0625457763671875, 6.562946796417236, 7.063347339630127, 7.563748359680176, 8.064148902893066, 8.564549446105957, 9.064949989318848, 9.565351486206055, 10.065752029418945, 10.566152572631836, 11.066553115844727, 11.566953659057617, 12.067354202270508, 12.567754745483398, 13.068155288696289, 13.56855583190918, 14.068957328796387, 14.569357872009277, 15.069758415222168, 15.570158958435059, 16.070560455322266]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 8.0, 7.0, 8.0, 10.0, 13.0, 20.0, 14.0, 19.0, 27.0, 30.0, 26.0, 29.0, 30.0, 26.0, 40.0, 56.0, 52.0, 44.0, 47.0, 50.0, 43.0, 39.0, 40.0, 30.0, 44.0, 41.0, 31.0, 29.0, 25.0, 21.0, 21.0, 17.0, 13.0, 12.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.388671875, -2.319854736328125, -2.25103759765625, -2.182220458984375, -2.1134033203125, -2.044586181640625, -1.97576904296875, -1.906951904296875, -1.838134765625, -1.769317626953125, -1.70050048828125, -1.631683349609375, -1.5628662109375, -1.494049072265625, -1.42523193359375, -1.356414794921875, -1.28759765625, -1.218780517578125, -1.14996337890625, -1.081146240234375, -1.0123291015625, -0.943511962890625, -0.87469482421875, -0.805877685546875, -0.737060546875, -0.668243408203125, -0.59942626953125, -0.530609130859375, -0.4617919921875, -0.392974853515625, -0.32415771484375, -0.255340576171875, -0.1865234375, -0.117706298828125, -0.04888916015625, 0.019927978515625, 0.0887451171875, 0.157562255859375, 0.22637939453125, 0.295196533203125, 0.364013671875, 0.432830810546875, 0.50164794921875, 0.570465087890625, 0.6392822265625, 0.708099365234375, 0.77691650390625, 0.845733642578125, 0.91455078125, 0.983367919921875, 1.05218505859375, 1.121002197265625, 1.1898193359375, 1.258636474609375, 1.32745361328125, 1.396270751953125, 1.465087890625, 1.533905029296875, 1.60272216796875, 1.671539306640625, 1.7403564453125, 1.809173583984375, 1.87799072265625, 1.946807861328125, 2.015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 6.0, 8.0, 6.0, 13.0, 31.0, 34.0, 51.0, 55.0, 102.0, 150.0, 183.0, 300.0, 503.0, 648.0, 1040.0, 1650.0, 2687.0, 4472.0, 7819.0, 15053.0, 31442.0, 79974.0, 272947.0, 1150813.0, 1842810.0, 547918.0, 139431.0, 47937.0, 20836.0, 10377.0, 5752.0, 3321.0, 2053.0, 1308.0, 861.0, 560.0, 369.0, 237.0, 154.0, 119.0, 80.0, 54.0, 38.0, 29.0, 16.0, 11.0, 12.0, 10.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.69305419921875, -2.6009521484375, -2.50885009765625, -2.416748046875, -2.32464599609375, -2.2325439453125, -2.14044189453125, -2.04833984375, -1.95623779296875, -1.8641357421875, -1.77203369140625, -1.679931640625, -1.58782958984375, -1.4957275390625, -1.40362548828125, -1.3115234375, -1.21942138671875, -1.1273193359375, -1.03521728515625, -0.943115234375, -0.85101318359375, -0.7589111328125, -0.66680908203125, -0.57470703125, -0.48260498046875, -0.3905029296875, -0.29840087890625, -0.206298828125, -0.11419677734375, -0.0220947265625, 0.07000732421875, 0.162109375, 0.25421142578125, 0.3463134765625, 0.43841552734375, 0.530517578125, 0.62261962890625, 0.7147216796875, 0.80682373046875, 0.89892578125, 0.99102783203125, 1.0831298828125, 1.17523193359375, 1.267333984375, 1.35943603515625, 1.4515380859375, 1.54364013671875, 1.6357421875, 1.72784423828125, 1.8199462890625, 1.91204833984375, 2.004150390625, 2.09625244140625, 2.1883544921875, 2.28045654296875, 2.37255859375, 2.46466064453125, 2.5567626953125, 2.64886474609375, 2.740966796875, 2.83306884765625, 2.9251708984375, 3.01727294921875, 3.109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 3.0, 0.0, 14.0, 7.0, 17.0, 27.0, 35.0, 39.0, 40.0, 55.0, 90.0, 116.0, 162.0, 213.0, 315.0, 467.0, 620.0, 540.0, 412.0, 280.0, 185.0, 131.0, 64.0, 75.0, 47.0, 23.0, 24.0, 14.0, 17.0, 5.0, 9.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-4.81640625, -4.70391845703125, -4.5914306640625, -4.47894287109375, -4.366455078125, -4.25396728515625, -4.1414794921875, -4.02899169921875, -3.91650390625, -3.80401611328125, -3.6915283203125, -3.57904052734375, -3.466552734375, -3.35406494140625, -3.2415771484375, -3.12908935546875, -3.0166015625, -2.90411376953125, -2.7916259765625, -2.67913818359375, -2.566650390625, -2.45416259765625, -2.3416748046875, -2.22918701171875, -2.11669921875, -2.00421142578125, -1.8917236328125, -1.77923583984375, -1.666748046875, -1.55426025390625, -1.4417724609375, -1.32928466796875, -1.216796875, -1.10430908203125, -0.9918212890625, -0.87933349609375, -0.766845703125, -0.65435791015625, -0.5418701171875, -0.42938232421875, -0.31689453125, -0.20440673828125, -0.0919189453125, 0.02056884765625, 0.133056640625, 0.24554443359375, 0.3580322265625, 0.47052001953125, 0.5830078125, 0.69549560546875, 0.8079833984375, 0.92047119140625, 1.032958984375, 1.14544677734375, 1.2579345703125, 1.37042236328125, 1.48291015625, 1.59539794921875, 1.7078857421875, 1.82037353515625, 1.932861328125, 2.04534912109375, 2.1578369140625, 2.27032470703125, 2.3828125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 5.0, 11.0, 14.0, 22.0, 36.0, 53.0, 95.0, 181.0, 476.0, 1644.0, 7478.0, 55819.0, 1606691.0, 2439348.0, 70509.0, 8895.0, 1912.0, 523.0, 224.0, 110.0, 68.0, 52.0, 38.0, 31.0, 10.0, 7.0, 5.0, 6.0, 6.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.8648681640625, -8.510986328125, -8.1571044921875, -7.80322265625, -7.4493408203125, -7.095458984375, -6.7415771484375, -6.3876953125, -6.0338134765625, -5.679931640625, -5.3260498046875, -4.97216796875, -4.6182861328125, -4.264404296875, -3.9105224609375, -3.556640625, -3.2027587890625, -2.848876953125, -2.4949951171875, -2.14111328125, -1.7872314453125, -1.433349609375, -1.0794677734375, -0.7255859375, -0.3717041015625, -0.017822265625, 0.3360595703125, 0.68994140625, 1.0438232421875, 1.397705078125, 1.7515869140625, 2.10546875, 2.4593505859375, 2.813232421875, 3.1671142578125, 3.52099609375, 3.8748779296875, 4.228759765625, 4.5826416015625, 4.9365234375, 5.2904052734375, 5.644287109375, 5.9981689453125, 6.35205078125, 6.7059326171875, 7.059814453125, 7.4136962890625, 7.767578125, 8.1214599609375, 8.475341796875, 8.8292236328125, 9.18310546875, 9.5369873046875, 9.890869140625, 10.2447509765625, 10.5986328125, 10.9525146484375, 11.306396484375, 11.6602783203125, 12.01416015625, 12.3680419921875, 12.721923828125, 13.0758056640625, 13.4296875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 61.0, 257.0, 465.0, 188.0, 32.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.371055603027344, -54.23624038696289, -52.10142517089844, -49.96661376953125, -47.8317985534668, -45.696983337402344, -43.562171936035156, -41.4273567199707, -39.29254150390625, -37.1577262878418, -35.022911071777344, -32.888099670410156, -30.753284454345703, -28.61846923828125, -26.48365592956543, -24.34884262084961, -22.214027404785156, -20.079212188720703, -17.944398880004883, -15.809584617614746, -13.67477035522461, -11.539956092834473, -9.405141830444336, -7.270327568054199, -5.1355133056640625, -3.000699043273926, -0.8658847808837891, 1.2689294815063477, 3.4037437438964844, 5.538558006286621, 7.673372268676758, 9.808186531066895, 11.943000793457031, 14.077815055847168, 16.212629318237305, 18.347442626953125, 20.482257843017578, 22.61707305908203, 24.75188636779785, 26.886699676513672, 29.021514892578125, 31.156330108642578, 33.29114532470703, 35.42595672607422, 37.56077194213867, 39.695587158203125, 41.83039855957031, 43.965213775634766, 46.10002899169922, 48.23484420776367, 50.369659423828125, 52.50447082519531, 54.639286041259766, 56.77410125732422, 58.908912658691406, 61.04372787475586, 63.17854309082031, 65.3133544921875, 67.44817352294922, 69.5829849243164, 71.71780395507812, 73.85261535644531, 75.9874267578125, 78.12224578857422, 80.2570571899414]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 10.0, 3.0, 15.0, 13.0, 14.0, 25.0, 16.0, 21.0, 24.0, 29.0, 31.0, 24.0, 33.0, 28.0, 32.0, 36.0, 46.0, 36.0, 37.0, 43.0, 27.0, 36.0, 52.0, 38.0, 24.0, 27.0, 32.0, 39.0, 32.0, 27.0, 22.0, 21.0, 20.0, 20.0, 17.0, 14.0, 7.0, 5.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.115355491638184, -9.756152153015137, -9.39694881439209, -9.03774642944336, -8.678543090820312, -8.319339752197266, -7.960136413574219, -7.600933074951172, -7.241730213165283, -6.882526874542236, -6.523324012756348, -6.164120674133301, -5.804917335510254, -5.445714473724365, -5.086511135101318, -4.72730827331543, -4.368104934692383, -4.008901596069336, -3.6496987342834473, -3.2904953956604004, -2.9312922954559326, -2.572089195251465, -2.212885856628418, -1.8536827564239502, -1.4944796562194824, -1.1352765560150146, -0.7760733366012573, -0.4168701171875, -0.05766701698303223, 0.30153608322143555, 0.6607394218444824, 1.0199425220489502, 1.3791465759277344, 1.7383496761322021, 2.09755277633667, 2.456756114959717, 2.8159592151641846, 3.1751623153686523, 3.534365653991699, 3.893568754196167, 4.252771854400635, 4.611975193023682, 4.97117805480957, 5.330381393432617, 5.689584732055664, 6.048787593841553, 6.4079909324646, 6.767193794250488, 7.126397132873535, 7.485600471496582, 7.844803333282471, 8.20400619506836, 8.563209533691406, 8.922412872314453, 9.2816162109375, 9.640819549560547, 10.000022888183594, 10.35922622680664, 10.718429565429688, 11.077632904052734, 11.436835289001465, 11.796038627624512, 12.155241966247559, 12.514445304870605, 12.873647689819336]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 5.0, 8.0, 9.0, 17.0, 16.0, 21.0, 19.0, 28.0, 17.0, 24.0, 31.0, 32.0, 38.0, 38.0, 33.0, 34.0, 54.0, 37.0, 56.0, 37.0, 39.0, 30.0, 36.0, 42.0, 27.0, 29.0, 33.0, 36.0, 34.0, 17.0, 17.0, 16.0, 16.0, 14.0, 12.0, 6.0, 7.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9306640625, -1.8691558837890625, -1.807647705078125, -1.7461395263671875, -1.68463134765625, -1.6231231689453125, -1.561614990234375, -1.5001068115234375, -1.4385986328125, -1.3770904541015625, -1.315582275390625, -1.2540740966796875, -1.19256591796875, -1.1310577392578125, -1.069549560546875, -1.0080413818359375, -0.946533203125, -0.8850250244140625, -0.823516845703125, -0.7620086669921875, -0.70050048828125, -0.6389923095703125, -0.577484130859375, -0.5159759521484375, -0.4544677734375, -0.3929595947265625, -0.331451416015625, -0.2699432373046875, -0.20843505859375, -0.1469268798828125, -0.085418701171875, -0.0239105224609375, 0.03759765625, 0.0991058349609375, 0.160614013671875, 0.2221221923828125, 0.28363037109375, 0.3451385498046875, 0.406646728515625, 0.4681549072265625, 0.5296630859375, 0.5911712646484375, 0.652679443359375, 0.7141876220703125, 0.77569580078125, 0.8372039794921875, 0.898712158203125, 0.9602203369140625, 1.021728515625, 1.0832366943359375, 1.144744873046875, 1.2062530517578125, 1.26776123046875, 1.3292694091796875, 1.390777587890625, 1.4522857666015625, 1.5137939453125, 1.5753021240234375, 1.636810302734375, 1.6983184814453125, 1.75982666015625, 1.8213348388671875, 1.882843017578125, 1.9443511962890625, 2.005859375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 15.0, 15.0, 23.0, 17.0, 33.0, 54.0, 72.0, 115.0, 185.0, 252.0, 332.0, 534.0, 781.0, 1084.0, 1656.0, 2576.0, 3791.0, 5836.0, 8884.0, 13724.0, 21290.0, 33921.0, 55627.0, 94511.0, 156412.0, 206664.0, 169757.0, 104696.0, 61521.0, 37558.0, 23021.0, 14901.0, 9734.0, 6239.0, 4177.0, 2735.0, 1890.0, 1266.0, 887.0, 569.0, 355.0, 251.0, 197.0, 124.0, 84.0, 61.0, 49.0, 29.0, 22.0, 10.0, 7.0, 5.0, 6.0, 1.0, 1.0, 5.0], "bins": [-0.16162109375, -0.15681076049804688, -0.15200042724609375, -0.14719009399414062, -0.1423797607421875, -0.13756942749023438, -0.13275909423828125, -0.12794876098632812, -0.123138427734375, -0.11832809448242188, -0.11351776123046875, -0.10870742797851562, -0.1038970947265625, -0.09908676147460938, -0.09427642822265625, -0.08946609497070312, -0.08465576171875, -0.07984542846679688, -0.07503509521484375, -0.07022476196289062, -0.0654144287109375, -0.060604095458984375, -0.05579376220703125, -0.050983428955078125, -0.046173095703125, -0.041362762451171875, -0.03655242919921875, -0.031742095947265625, -0.0269317626953125, -0.022121429443359375, -0.01731109619140625, -0.012500762939453125, -0.0076904296875, -0.002880096435546875, 0.00193023681640625, 0.006740570068359375, 0.0115509033203125, 0.016361236572265625, 0.02117156982421875, 0.025981903076171875, 0.030792236328125, 0.035602569580078125, 0.04041290283203125, 0.045223236083984375, 0.0500335693359375, 0.054843902587890625, 0.05965423583984375, 0.06446456909179688, 0.06927490234375, 0.07408523559570312, 0.07889556884765625, 0.08370590209960938, 0.0885162353515625, 0.09332656860351562, 0.09813690185546875, 0.10294723510742188, 0.107757568359375, 0.11256790161132812, 0.11737823486328125, 0.12218856811523438, 0.1269989013671875, 0.13180923461914062, 0.13661956787109375, 0.14142990112304688, 0.146240234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 1.0, 3.0, 10.0, 11.0, 4.0, 12.0, 17.0, 13.0, 11.0, 17.0, 24.0, 29.0, 20.0, 26.0, 28.0, 34.0, 33.0, 33.0, 33.0, 38.0, 33.0, 1067.0, 45.0, 37.0, 37.0, 42.0, 32.0, 41.0, 30.0, 33.0, 27.0, 14.0, 22.0, 33.0, 17.0, 24.0, 16.0, 15.0, 9.0, 10.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2283782958984375, -1.188201904296875, -1.1480255126953125, -1.10784912109375, -1.0676727294921875, -1.027496337890625, -0.9873199462890625, -0.9471435546875, -0.9069671630859375, -0.866790771484375, -0.8266143798828125, -0.78643798828125, -0.7462615966796875, -0.706085205078125, -0.6659088134765625, -0.625732421875, -0.5855560302734375, -0.545379638671875, -0.5052032470703125, -0.46502685546875, -0.4248504638671875, -0.384674072265625, -0.3444976806640625, -0.3043212890625, -0.2641448974609375, -0.223968505859375, -0.1837921142578125, -0.14361572265625, -0.1034393310546875, -0.063262939453125, -0.0230865478515625, 0.01708984375, 0.0572662353515625, 0.097442626953125, 0.1376190185546875, 0.17779541015625, 0.2179718017578125, 0.258148193359375, 0.2983245849609375, 0.3385009765625, 0.3786773681640625, 0.418853759765625, 0.4590301513671875, 0.49920654296875, 0.5393829345703125, 0.579559326171875, 0.6197357177734375, 0.659912109375, 0.7000885009765625, 0.740264892578125, 0.7804412841796875, 0.82061767578125, 0.8607940673828125, 0.900970458984375, 0.9411468505859375, 0.9813232421875, 1.0214996337890625, 1.061676025390625, 1.1018524169921875, 1.14202880859375, 1.1822052001953125, 1.222381591796875, 1.2625579833984375, 1.302734375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 11.0, 12.0, 13.0, 17.0, 25.0, 34.0, 39.0, 49.0, 91.0, 153.0, 200.0, 333.0, 546.0, 938.0, 1637.0, 2991.0, 5443.0, 11031.0, 24121.0, 98258.0, 1820495.0, 84999.0, 23081.0, 10592.0, 5318.0, 2864.0, 1543.0, 858.0, 480.0, 301.0, 208.0, 141.0, 86.0, 55.0, 45.0, 44.0, 19.0, 14.0, 15.0, 8.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.37255859375, -0.36142730712890625, -0.3502960205078125, -0.33916473388671875, -0.328033447265625, -0.31690216064453125, -0.3057708740234375, -0.29463958740234375, -0.28350830078125, -0.27237701416015625, -0.2612457275390625, -0.25011444091796875, -0.238983154296875, -0.22785186767578125, -0.2167205810546875, -0.20558929443359375, -0.1944580078125, -0.18332672119140625, -0.1721954345703125, -0.16106414794921875, -0.149932861328125, -0.13880157470703125, -0.1276702880859375, -0.11653900146484375, -0.10540771484375, -0.09427642822265625, -0.0831451416015625, -0.07201385498046875, -0.060882568359375, -0.04975128173828125, -0.0386199951171875, -0.02748870849609375, -0.016357421875, -0.00522613525390625, 0.0059051513671875, 0.01703643798828125, 0.028167724609375, 0.03929901123046875, 0.0504302978515625, 0.06156158447265625, 0.07269287109375, 0.08382415771484375, 0.0949554443359375, 0.10608673095703125, 0.117218017578125, 0.12834930419921875, 0.1394805908203125, 0.15061187744140625, 0.1617431640625, 0.17287445068359375, 0.1840057373046875, 0.19513702392578125, 0.206268310546875, 0.21739959716796875, 0.2285308837890625, 0.23966217041015625, 0.25079345703125, 0.26192474365234375, 0.2730560302734375, 0.28418731689453125, 0.295318603515625, 0.30644989013671875, 0.3175811767578125, 0.32871246337890625, 0.33984375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 8.0, 13.0, 16.0, 13.0, 23.0, 20.0, 34.0, 32.0, 46.0, 37.0, 46.0, 54.0, 75.0, 79.0, 73.0, 68.0, 59.0, 44.0, 42.0, 46.0, 32.0, 21.0, 22.0, 10.0, 11.0, 7.0, 8.0, 10.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0], "bins": [-0.0136260986328125, -0.013263463973999023, -0.012900829315185547, -0.01253819465637207, -0.012175559997558594, -0.011812925338745117, -0.01145029067993164, -0.011087656021118164, -0.010725021362304688, -0.010362386703491211, -0.009999752044677734, -0.009637117385864258, -0.009274482727050781, -0.008911848068237305, -0.008549213409423828, -0.008186578750610352, -0.007823944091796875, -0.0074613094329833984, -0.007098674774169922, -0.006736040115356445, -0.006373405456542969, -0.006010770797729492, -0.005648136138916016, -0.005285501480102539, -0.0049228668212890625, -0.004560232162475586, -0.004197597503662109, -0.003834962844848633, -0.0034723281860351562, -0.0031096935272216797, -0.002747058868408203, -0.0023844242095947266, -0.00202178955078125, -0.0016591548919677734, -0.0012965202331542969, -0.0009338855743408203, -0.0005712509155273438, -0.0002086162567138672, 0.00015401840209960938, 0.0005166530609130859, 0.0008792877197265625, 0.001241922378540039, 0.0016045570373535156, 0.001967191696166992, 0.0023298263549804688, 0.0026924610137939453, 0.003055095672607422, 0.0034177303314208984, 0.003780364990234375, 0.0041429996490478516, 0.004505634307861328, 0.004868268966674805, 0.005230903625488281, 0.005593538284301758, 0.005956172943115234, 0.006318807601928711, 0.0066814422607421875, 0.007044076919555664, 0.007406711578369141, 0.007769346237182617, 0.008131980895996094, 0.00849461555480957, 0.008857250213623047, 0.009219884872436523, 0.00958251953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 3.0, 8.0, 5.0, 13.0, 6.0, 18.0, 20.0, 27.0, 24.0, 57.0, 75.0, 76.0, 158.0, 298.0, 615.0, 9544.0, 985531.0, 50238.0, 922.0, 331.0, 155.0, 123.0, 80.0, 47.0, 39.0, 28.0, 18.0, 16.0, 19.0, 6.0, 8.0, 9.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.1975383758544922, -0.19012069702148438, -0.18270301818847656, -0.17528533935546875, -0.16786766052246094, -0.16044998168945312, -0.1530323028564453, -0.1456146240234375, -0.1381969451904297, -0.13077926635742188, -0.12336158752441406, -0.11594390869140625, -0.10852622985839844, -0.10110855102539062, -0.09369087219238281, -0.086273193359375, -0.07885551452636719, -0.07143783569335938, -0.06402015686035156, -0.05660247802734375, -0.04918479919433594, -0.041767120361328125, -0.03434944152832031, -0.0269317626953125, -0.019514083862304688, -0.012096405029296875, -0.0046787261962890625, 0.00273895263671875, 0.010156631469726562, 0.017574310302734375, 0.024991989135742188, 0.03240966796875, 0.03982734680175781, 0.047245025634765625, 0.05466270446777344, 0.06208038330078125, 0.06949806213378906, 0.07691574096679688, 0.08433341979980469, 0.0917510986328125, 0.09916877746582031, 0.10658645629882812, 0.11400413513183594, 0.12142181396484375, 0.12883949279785156, 0.13625717163085938, 0.1436748504638672, 0.151092529296875, 0.1585102081298828, 0.16592788696289062, 0.17334556579589844, 0.18076324462890625, 0.18818092346191406, 0.19559860229492188, 0.2030162811279297, 0.2104339599609375, 0.2178516387939453, 0.22526931762695312, 0.23268699645996094, 0.24010467529296875, 0.24752235412597656, 0.2549400329589844, 0.2623577117919922, 0.269775390625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 19.0, 106.0, 473.0, 345.0, 58.0, 11.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150141641497612, -0.1471300572156906, -0.14411847293376923, -0.14110688865184784, -0.13809530436992645, -0.13508372008800507, -0.13207213580608368, -0.1290605515241623, -0.1260489672422409, -0.12303738296031952, -0.12002579867839813, -0.11701421439647675, -0.11400263011455536, -0.11099104583263397, -0.10797946155071259, -0.1049678772687912, -0.10195629298686981, -0.09894470870494843, -0.09593312442302704, -0.09292154014110565, -0.08990995585918427, -0.08689837157726288, -0.08388678729534149, -0.0808752030134201, -0.07786361873149872, -0.07485203444957733, -0.07184045016765594, -0.06882886588573456, -0.06581728160381317, -0.06280569732189178, -0.0597941130399704, -0.05678252875804901, -0.05377093702554703, -0.05075935274362564, -0.047747768461704254, -0.04473618417978287, -0.04172459989786148, -0.038713015615940094, -0.03570143133401871, -0.03268984705209732, -0.029678262770175934, -0.026666678488254547, -0.02365509420633316, -0.020643509924411774, -0.017631925642490387, -0.014620341360569, -0.011608757078647614, -0.008597172796726227, -0.00558558851480484, -0.0025740042328834534, 0.00043758004903793335, 0.00344916433095932, 0.006460748612880707, 0.009472332894802094, 0.01248391717672348, 0.015495501458644867, 0.018507085740566254, 0.02151867002248764, 0.024530254304409027, 0.027541838586330414, 0.0305534228682518, 0.03356500715017319, 0.036576591432094574, 0.03958817571401596, 0.04259975999593735]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 5.0, 9.0, 5.0, 9.0, 15.0, 16.0, 19.0, 16.0, 19.0, 22.0, 21.0, 23.0, 25.0, 37.0, 28.0, 39.0, 38.0, 44.0, 47.0, 48.0, 32.0, 45.0, 41.0, 41.0, 43.0, 33.0, 28.0, 26.0, 20.0, 39.0, 14.0, 23.0, 10.0, 28.0, 17.0, 12.0, 12.0, 6.0, 8.0, 11.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.01127314567565918, -0.010935102589428425, -0.01059705950319767, -0.010259016416966915, -0.00992097333073616, -0.009582930244505405, -0.00924488715827465, -0.008906844072043896, -0.008568800985813141, -0.008230757899582386, -0.007892714813351631, -0.007554671727120876, -0.0072166286408901215, -0.006878585554659367, -0.006540542468428612, -0.006202499382197857, -0.005864456295967102, -0.005526413209736347, -0.005188370123505592, -0.0048503270372748375, -0.004512283951044083, -0.004174240864813328, -0.003836197778582573, -0.003498154692351818, -0.0031601116061210632, -0.0028220685198903084, -0.0024840254336595535, -0.0021459823474287987, -0.0018079392611980438, -0.001469896174967289, -0.0011318530887365341, -0.0007938100025057793, -0.0004557669162750244, -0.00011772383004426956, 0.0002203192561864853, 0.0005583623424172401, 0.000896405428647995, 0.0012344485148787498, 0.0015724916011095047, 0.0019105346873402596, 0.0022485777735710144, 0.0025866208598017693, 0.002924663946032524, 0.003262707032263279, 0.003600750118494034, 0.003938793204724789, 0.0042768362909555435, 0.004614879377186298, 0.004952922463417053, 0.005290965549647808, 0.005629008635878563, 0.005967051722109318, 0.006305094808340073, 0.0066431378945708275, 0.006981180980801582, 0.007319224067032337, 0.007657267153263092, 0.007995310239493847, 0.008333353325724602, 0.008671396411955357, 0.009009439498186111, 0.009347482584416866, 0.009685525670647621, 0.010023568756878376, 0.01036161184310913]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 4.0, 8.0, 8.0, 18.0, 17.0, 20.0, 19.0, 28.0, 17.0, 24.0, 31.0, 33.0, 36.0, 39.0, 33.0, 34.0, 53.0, 37.0, 56.0, 38.0, 39.0, 30.0, 36.0, 42.0, 27.0, 29.0, 33.0, 36.0, 33.0, 17.0, 18.0, 16.0, 16.0, 14.0, 12.0, 6.0, 7.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9296875, -1.86822509765625, -1.8067626953125, -1.74530029296875, -1.683837890625, -1.62237548828125, -1.5609130859375, -1.49945068359375, -1.43798828125, -1.37652587890625, -1.3150634765625, -1.25360107421875, -1.192138671875, -1.13067626953125, -1.0692138671875, -1.00775146484375, -0.9462890625, -0.88482666015625, -0.8233642578125, -0.76190185546875, -0.700439453125, -0.63897705078125, -0.5775146484375, -0.51605224609375, -0.45458984375, -0.39312744140625, -0.3316650390625, -0.27020263671875, -0.208740234375, -0.14727783203125, -0.0858154296875, -0.02435302734375, 0.037109375, 0.09857177734375, 0.1600341796875, 0.22149658203125, 0.282958984375, 0.34442138671875, 0.4058837890625, 0.46734619140625, 0.52880859375, 0.59027099609375, 0.6517333984375, 0.71319580078125, 0.774658203125, 0.83612060546875, 0.8975830078125, 0.95904541015625, 1.0205078125, 1.08197021484375, 1.1434326171875, 1.20489501953125, 1.266357421875, 1.32781982421875, 1.3892822265625, 1.45074462890625, 1.51220703125, 1.57366943359375, 1.6351318359375, 1.69659423828125, 1.758056640625, 1.81951904296875, 1.8809814453125, 1.94244384765625, 2.00390625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 13.0, 35.0, 30.0, 49.0, 68.0, 103.0, 152.0, 210.0, 319.0, 528.0, 752.0, 1124.0, 1688.0, 2607.0, 4038.0, 6618.0, 11051.0, 19190.0, 34019.0, 63339.0, 128997.0, 287396.0, 248868.0, 109327.0, 54908.0, 29764.0, 16967.0, 9868.0, 5886.0, 3606.0, 2330.0, 1604.0, 1021.0, 661.0, 476.0, 347.0, 174.0, 122.0, 105.0, 52.0, 43.0, 32.0, 17.0, 11.0, 6.0, 11.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.419921875, -2.346343994140625, -2.27276611328125, -2.199188232421875, -2.1256103515625, -2.052032470703125, -1.97845458984375, -1.904876708984375, -1.831298828125, -1.757720947265625, -1.68414306640625, -1.610565185546875, -1.5369873046875, -1.463409423828125, -1.38983154296875, -1.316253662109375, -1.24267578125, -1.169097900390625, -1.09552001953125, -1.021942138671875, -0.9483642578125, -0.874786376953125, -0.80120849609375, -0.727630615234375, -0.654052734375, -0.580474853515625, -0.50689697265625, -0.433319091796875, -0.3597412109375, -0.286163330078125, -0.21258544921875, -0.139007568359375, -0.0654296875, 0.008148193359375, 0.08172607421875, 0.155303955078125, 0.2288818359375, 0.302459716796875, 0.37603759765625, 0.449615478515625, 0.523193359375, 0.596771240234375, 0.67034912109375, 0.743927001953125, 0.8175048828125, 0.891082763671875, 0.96466064453125, 1.038238525390625, 1.11181640625, 1.185394287109375, 1.25897216796875, 1.332550048828125, 1.4061279296875, 1.479705810546875, 1.55328369140625, 1.626861572265625, 1.700439453125, 1.774017333984375, 1.84759521484375, 1.921173095703125, 1.9947509765625, 2.068328857421875, 2.14190673828125, 2.215484619140625, 2.2890625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 9.0, 15.0, 15.0, 10.0, 12.0, 14.0, 16.0, 17.0, 26.0, 22.0, 28.0, 41.0, 37.0, 33.0, 60.0, 78.0, 120.0, 139.0, 258.0, 1343.0, 162.0, 100.0, 78.0, 63.0, 48.0, 33.0, 27.0, 43.0, 34.0, 26.0, 21.0, 16.0, 19.0, 15.0, 11.0, 7.0, 4.0, 9.0, 12.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.16015625, -5.00457763671875, -4.8489990234375, -4.69342041015625, -4.537841796875, -4.38226318359375, -4.2266845703125, -4.07110595703125, -3.91552734375, -3.75994873046875, -3.6043701171875, -3.44879150390625, -3.293212890625, -3.13763427734375, -2.9820556640625, -2.82647705078125, -2.6708984375, -2.51531982421875, -2.3597412109375, -2.20416259765625, -2.048583984375, -1.89300537109375, -1.7374267578125, -1.58184814453125, -1.42626953125, -1.27069091796875, -1.1151123046875, -0.95953369140625, -0.803955078125, -0.64837646484375, -0.4927978515625, -0.33721923828125, -0.181640625, -0.02606201171875, 0.1295166015625, 0.28509521484375, 0.440673828125, 0.59625244140625, 0.7518310546875, 0.90740966796875, 1.06298828125, 1.21856689453125, 1.3741455078125, 1.52972412109375, 1.685302734375, 1.84088134765625, 1.9964599609375, 2.15203857421875, 2.3076171875, 2.46319580078125, 2.6187744140625, 2.77435302734375, 2.929931640625, 3.08551025390625, 3.2410888671875, 3.39666748046875, 3.55224609375, 3.70782470703125, 3.8634033203125, 4.01898193359375, 4.174560546875, 4.33013916015625, 4.4857177734375, 4.64129638671875, 4.796875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 14.0, 13.0, 20.0, 16.0, 28.0, 36.0, 59.0, 63.0, 94.0, 127.0, 183.0, 280.0, 479.0, 1162.0, 2603.0, 7911.0, 26034.0, 115313.0, 949426.0, 1795635.0, 190268.0, 38364.0, 10692.0, 3712.0, 1474.0, 622.0, 345.0, 184.0, 129.0, 107.0, 78.0, 52.0, 38.0, 31.0, 27.0, 23.0, 15.0, 7.0, 4.0, 8.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.50177001953125, -4.3472900390625, -4.19281005859375, -4.038330078125, -3.88385009765625, -3.7293701171875, -3.57489013671875, -3.42041015625, -3.26593017578125, -3.1114501953125, -2.95697021484375, -2.802490234375, -2.64801025390625, -2.4935302734375, -2.33905029296875, -2.1845703125, -2.03009033203125, -1.8756103515625, -1.72113037109375, -1.566650390625, -1.41217041015625, -1.2576904296875, -1.10321044921875, -0.94873046875, -0.79425048828125, -0.6397705078125, -0.48529052734375, -0.330810546875, -0.17633056640625, -0.0218505859375, 0.13262939453125, 0.287109375, 0.44158935546875, 0.5960693359375, 0.75054931640625, 0.905029296875, 1.05950927734375, 1.2139892578125, 1.36846923828125, 1.52294921875, 1.67742919921875, 1.8319091796875, 1.98638916015625, 2.140869140625, 2.29534912109375, 2.4498291015625, 2.60430908203125, 2.7587890625, 2.91326904296875, 3.0677490234375, 3.22222900390625, 3.376708984375, 3.53118896484375, 3.6856689453125, 3.84014892578125, 3.99462890625, 4.14910888671875, 4.3035888671875, 4.45806884765625, 4.612548828125, 4.76702880859375, 4.9215087890625, 5.07598876953125, 5.23046875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 13.0, 34.0, 54.0, 139.0, 208.0, 216.0, 155.0, 109.0, 40.0, 18.0, 10.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.130715370178223, -8.39884090423584, -7.666966915130615, -6.935092449188232, -6.203218460083008, -5.471343994140625, -4.739469528198242, -4.007595539093018, -3.2757210731506348, -2.543846845626831, -1.8119724988937378, -1.0800981521606445, -0.3482239246368408, 0.3836503028869629, 1.1155247688293457, 1.8473987579345703, 2.579273223876953, 3.311147451400757, 4.0430216789245605, 4.774896144866943, 5.506770133972168, 6.238644599914551, 6.970519065856934, 7.702393054962158, 8.434267044067383, 9.166141510009766, 9.898015975952148, 10.629890441894531, 11.361763954162598, 12.09363842010498, 12.825512886047363, 13.55738639831543, 14.289262771606445, 15.021137237548828, 15.753011703491211, 16.484886169433594, 17.216760635375977, 17.94863510131836, 18.68050765991211, 19.412382125854492, 20.144256591796875, 20.876131057739258, 21.60800552368164, 22.339879989624023, 23.071754455566406, 23.803627014160156, 24.535503387451172, 25.267375946044922, 25.999252319335938, 26.73112678527832, 27.463001251220703, 28.194875717163086, 28.92675018310547, 29.65862274169922, 30.390499114990234, 31.122371673583984, 31.854246139526367, 32.58612060546875, 33.3179931640625, 34.049869537353516, 34.781742095947266, 35.51361846923828, 36.24549102783203, 36.97736740112305, 37.7092399597168]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 11.0, 5.0, 17.0, 12.0, 14.0, 13.0, 14.0, 16.0, 27.0, 27.0, 27.0, 29.0, 25.0, 48.0, 37.0, 41.0, 41.0, 32.0, 38.0, 46.0, 49.0, 36.0, 30.0, 36.0, 42.0, 39.0, 28.0, 21.0, 30.0, 20.0, 22.0, 24.0, 15.0, 9.0, 17.0, 15.0, 11.0, 9.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.430721282958984, -12.01568603515625, -11.600650787353516, -11.185615539550781, -10.770581245422363, -10.355545997619629, -9.940510749816895, -9.52547550201416, -9.110441207885742, -8.695405960083008, -8.280370712280273, -7.865335941314697, -7.450301170349121, -7.035265922546387, -6.620230674743652, -6.205195426940918, -5.790160179138184, -5.375124931335449, -4.960090160369873, -4.545054912567139, -4.1300201416015625, -3.714984893798828, -3.2999496459960938, -2.8849146366119385, -2.469879627227783, -2.054844617843628, -1.639809489250183, -1.2247743606567383, -0.809739351272583, -0.39470434188842773, 0.02033090591430664, 0.4353659152984619, 0.8503999710083008, 1.265434980392456, 1.6804701089859009, 2.0955052375793457, 2.510540246963501, 2.9255752563476562, 3.3406105041503906, 3.755645513534546, 4.170680522918701, 4.5857157707214355, 5.000750541687012, 5.415785789489746, 5.8308210372924805, 6.245855808258057, 6.660891056060791, 7.075925827026367, 7.490961074829102, 7.905996322631836, 8.32103157043457, 8.736066818237305, 9.151101112365723, 9.566136360168457, 9.981171607971191, 10.396206855773926, 10.811241149902344, 11.226276397705078, 11.641311645507812, 12.056346893310547, 12.471381187438965, 12.8864164352417, 13.301451683044434, 13.716486930847168, 14.131522178649902]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 6.0, 13.0, 12.0, 14.0, 6.0, 8.0, 24.0, 22.0, 27.0, 15.0, 35.0, 30.0, 27.0, 39.0, 30.0, 35.0, 52.0, 43.0, 40.0, 53.0, 40.0, 38.0, 43.0, 27.0, 41.0, 28.0, 30.0, 35.0, 23.0, 13.0, 22.0, 18.0, 17.0, 19.0, 10.0, 11.0, 12.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.9755859375, -1.91412353515625, -1.8526611328125, -1.79119873046875, -1.729736328125, -1.66827392578125, -1.6068115234375, -1.54534912109375, -1.48388671875, -1.42242431640625, -1.3609619140625, -1.29949951171875, -1.238037109375, -1.17657470703125, -1.1151123046875, -1.05364990234375, -0.9921875, -0.93072509765625, -0.8692626953125, -0.80780029296875, -0.746337890625, -0.68487548828125, -0.6234130859375, -0.56195068359375, -0.50048828125, -0.43902587890625, -0.3775634765625, -0.31610107421875, -0.254638671875, -0.19317626953125, -0.1317138671875, -0.07025146484375, -0.0087890625, 0.05267333984375, 0.1141357421875, 0.17559814453125, 0.237060546875, 0.29852294921875, 0.3599853515625, 0.42144775390625, 0.48291015625, 0.54437255859375, 0.6058349609375, 0.66729736328125, 0.728759765625, 0.79022216796875, 0.8516845703125, 0.91314697265625, 0.974609375, 1.03607177734375, 1.0975341796875, 1.15899658203125, 1.220458984375, 1.28192138671875, 1.3433837890625, 1.40484619140625, 1.46630859375, 1.52777099609375, 1.5892333984375, 1.65069580078125, 1.712158203125, 1.77362060546875, 1.8350830078125, 1.89654541015625, 1.9580078125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 11.0, 19.0, 26.0, 22.0, 36.0, 77.0, 99.0, 113.0, 183.0, 266.0, 392.0, 626.0, 935.0, 1533.0, 2651.0, 4679.0, 8625.0, 17533.0, 40188.0, 121727.0, 572405.0, 2181786.0, 954285.0, 184512.0, 54991.0, 22126.0, 10736.0, 5505.0, 3165.0, 1788.0, 1147.0, 686.0, 429.0, 295.0, 187.0, 159.0, 90.0, 65.0, 45.0, 35.0, 33.0, 15.0, 13.0, 17.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.169921875, -3.066497802734375, -2.96307373046875, -2.859649658203125, -2.7562255859375, -2.652801513671875, -2.54937744140625, -2.445953369140625, -2.342529296875, -2.239105224609375, -2.13568115234375, -2.032257080078125, -1.9288330078125, -1.825408935546875, -1.72198486328125, -1.618560791015625, -1.51513671875, -1.411712646484375, -1.30828857421875, -1.204864501953125, -1.1014404296875, -0.998016357421875, -0.89459228515625, -0.791168212890625, -0.687744140625, -0.584320068359375, -0.48089599609375, -0.377471923828125, -0.2740478515625, -0.170623779296875, -0.06719970703125, 0.036224365234375, 0.1396484375, 0.243072509765625, 0.34649658203125, 0.449920654296875, 0.5533447265625, 0.656768798828125, 0.76019287109375, 0.863616943359375, 0.967041015625, 1.070465087890625, 1.17388916015625, 1.277313232421875, 1.3807373046875, 1.484161376953125, 1.58758544921875, 1.691009521484375, 1.79443359375, 1.897857666015625, 2.00128173828125, 2.104705810546875, 2.2081298828125, 2.311553955078125, 2.41497802734375, 2.518402099609375, 2.621826171875, 2.725250244140625, 2.82867431640625, 2.932098388671875, 3.0355224609375, 3.138946533203125, 3.24237060546875, 3.345794677734375, 3.44921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 5.0, 8.0, 12.0, 16.0, 15.0, 16.0, 14.0, 25.0, 33.0, 51.0, 59.0, 96.0, 105.0, 162.0, 245.0, 319.0, 521.0, 551.0, 475.0, 355.0, 277.0, 161.0, 137.0, 104.0, 77.0, 55.0, 36.0, 24.0, 31.0, 13.0, 14.0, 13.0, 13.0, 8.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.318359375, -3.222137451171875, -3.12591552734375, -3.029693603515625, -2.9334716796875, -2.837249755859375, -2.74102783203125, -2.644805908203125, -2.548583984375, -2.452362060546875, -2.35614013671875, -2.259918212890625, -2.1636962890625, -2.067474365234375, -1.97125244140625, -1.875030517578125, -1.77880859375, -1.682586669921875, -1.58636474609375, -1.490142822265625, -1.3939208984375, -1.297698974609375, -1.20147705078125, -1.105255126953125, -1.009033203125, -0.912811279296875, -0.81658935546875, -0.720367431640625, -0.6241455078125, -0.527923583984375, -0.43170166015625, -0.335479736328125, -0.2392578125, -0.143035888671875, -0.04681396484375, 0.049407958984375, 0.1456298828125, 0.241851806640625, 0.33807373046875, 0.434295654296875, 0.530517578125, 0.626739501953125, 0.72296142578125, 0.819183349609375, 0.9154052734375, 1.011627197265625, 1.10784912109375, 1.204071044921875, 1.30029296875, 1.396514892578125, 1.49273681640625, 1.588958740234375, 1.6851806640625, 1.781402587890625, 1.87762451171875, 1.973846435546875, 2.070068359375, 2.166290283203125, 2.26251220703125, 2.358734130859375, 2.4549560546875, 2.551177978515625, 2.64739990234375, 2.743621826171875, 2.83984375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 6.0, 17.0, 32.0, 41.0, 59.0, 83.0, 141.0, 217.0, 379.0, 641.0, 1177.0, 2287.0, 4498.0, 9447.0, 21819.0, 55801.0, 184967.0, 1199256.0, 2266896.0, 311735.0, 81028.0, 29318.0, 12384.0, 5705.0, 2863.0, 1525.0, 817.0, 426.0, 244.0, 173.0, 104.0, 63.0, 39.0, 26.0, 21.0, 13.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.3858642578125, -4.240478515625, -4.0950927734375, -3.94970703125, -3.8043212890625, -3.658935546875, -3.5135498046875, -3.3681640625, -3.2227783203125, -3.077392578125, -2.9320068359375, -2.78662109375, -2.6412353515625, -2.495849609375, -2.3504638671875, -2.205078125, -2.0596923828125, -1.914306640625, -1.7689208984375, -1.62353515625, -1.4781494140625, -1.332763671875, -1.1873779296875, -1.0419921875, -0.8966064453125, -0.751220703125, -0.6058349609375, -0.46044921875, -0.3150634765625, -0.169677734375, -0.0242919921875, 0.12109375, 0.2664794921875, 0.411865234375, 0.5572509765625, 0.70263671875, 0.8480224609375, 0.993408203125, 1.1387939453125, 1.2841796875, 1.4295654296875, 1.574951171875, 1.7203369140625, 1.86572265625, 2.0111083984375, 2.156494140625, 2.3018798828125, 2.447265625, 2.5926513671875, 2.738037109375, 2.8834228515625, 3.02880859375, 3.1741943359375, 3.319580078125, 3.4649658203125, 3.6103515625, 3.7557373046875, 3.901123046875, 4.0465087890625, 4.19189453125, 4.3372802734375, 4.482666015625, 4.6280517578125, 4.7734375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 11.0, 25.0, 40.0, 88.0, 154.0, 197.0, 194.0, 160.0, 85.0, 32.0, 14.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.445701599121094, -44.5341682434082, -43.62263488769531, -42.711097717285156, -41.799564361572266, -40.888031005859375, -39.976497650146484, -39.064964294433594, -38.1534309387207, -37.24189758300781, -36.33036422729492, -35.41883087158203, -34.507293701171875, -33.595760345458984, -32.684226989746094, -31.772693634033203, -30.86115837097168, -29.94962501525879, -29.038089752197266, -28.126556396484375, -27.215023040771484, -26.303489685058594, -25.39195442199707, -24.48042106628418, -23.568885803222656, -22.657352447509766, -21.745817184448242, -20.83428382873535, -19.92275047302246, -19.011215209960938, -18.099681854248047, -17.188148498535156, -16.276615142822266, -15.365080833435059, -14.453547477722168, -13.542013168334961, -12.63047981262207, -11.718945503234863, -10.807411193847656, -9.895877838134766, -8.984344482421875, -8.072810173034668, -7.161276817321777, -6.24974250793457, -5.3382086753845215, -4.426674842834473, -3.5151405334472656, -2.603606700897217, -1.692072868347168, -0.7805389165878296, 0.1309950351715088, 1.0425291061401367, 1.9540629386901855, 2.8655967712402344, 3.7771310806274414, 4.68866491317749, 5.600198745727539, 6.511732578277588, 7.423266410827637, 8.334800720214844, 9.246334075927734, 10.157868385314941, 11.069402694702148, 11.980936050415039, 12.892470359802246]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 6.0, 3.0, 10.0, 12.0, 12.0, 21.0, 14.0, 20.0, 26.0, 24.0, 22.0, 40.0, 32.0, 39.0, 45.0, 49.0, 35.0, 43.0, 51.0, 43.0, 52.0, 53.0, 36.0, 45.0, 36.0, 33.0, 27.0, 29.0, 24.0, 20.0, 12.0, 10.0, 16.0, 11.0, 7.0, 7.0, 4.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.34267807006836, -11.980058670043945, -11.617439270019531, -11.254819869995117, -10.89220142364502, -10.529582023620605, -10.166962623596191, -9.804343223571777, -9.441723823547363, -9.07910442352295, -8.716485023498535, -8.353866577148438, -7.991246700286865, -7.628627777099609, -7.266008377075195, -6.903388977050781, -6.540770053863525, -6.178150653839111, -5.8155317306518555, -5.452912330627441, -5.090292930603027, -4.727673530578613, -4.365054607391357, -4.002435207366943, -3.6398160457611084, -3.2771968841552734, -2.9145774841308594, -2.5519583225250244, -2.1893391609191895, -1.8267197608947754, -1.4641005992889404, -1.1014811992645264, -0.7388620376586914, -0.3762427866458893, -0.013623535633087158, 0.3489956855773926, 0.7116149663925171, 1.0742342472076416, 1.4368534088134766, 1.7994728088378906, 2.1620919704437256, 2.5247111320495605, 2.8873305320739746, 3.2499496936798096, 3.6125688552856445, 3.9751882553100586, 4.337807655334473, 4.700427055358887, 5.063045978546143, 5.425665378570557, 5.7882843017578125, 6.150903701782227, 6.513523101806641, 6.876142501831055, 7.2387614250183105, 7.601380825042725, 7.9639997482299805, 8.326619148254395, 8.689238548278809, 9.051856994628906, 9.41447639465332, 9.777095794677734, 10.139715194702148, 10.502334594726562, 10.864953994750977]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 6.0, 7.0, 14.0, 16.0, 15.0, 13.0, 20.0, 24.0, 17.0, 22.0, 20.0, 25.0, 33.0, 30.0, 49.0, 41.0, 41.0, 42.0, 43.0, 37.0, 40.0, 36.0, 45.0, 38.0, 33.0, 33.0, 33.0, 22.0, 26.0, 30.0, 25.0, 19.0, 18.0, 13.0, 10.0, 6.0, 15.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.20703125, -2.144500732421875, -2.08197021484375, -2.019439697265625, -1.9569091796875, -1.894378662109375, -1.83184814453125, -1.769317626953125, -1.706787109375, -1.644256591796875, -1.58172607421875, -1.519195556640625, -1.4566650390625, -1.394134521484375, -1.33160400390625, -1.269073486328125, -1.20654296875, -1.144012451171875, -1.08148193359375, -1.018951416015625, -0.9564208984375, -0.893890380859375, -0.83135986328125, -0.768829345703125, -0.706298828125, -0.643768310546875, -0.58123779296875, -0.518707275390625, -0.4561767578125, -0.393646240234375, -0.33111572265625, -0.268585205078125, -0.2060546875, -0.143524169921875, -0.08099365234375, -0.018463134765625, 0.0440673828125, 0.106597900390625, 0.16912841796875, 0.231658935546875, 0.294189453125, 0.356719970703125, 0.41925048828125, 0.481781005859375, 0.5443115234375, 0.606842041015625, 0.66937255859375, 0.731903076171875, 0.79443359375, 0.856964111328125, 0.91949462890625, 0.982025146484375, 1.0445556640625, 1.107086181640625, 1.16961669921875, 1.232147216796875, 1.294677734375, 1.357208251953125, 1.41973876953125, 1.482269287109375, 1.5447998046875, 1.607330322265625, 1.66986083984375, 1.732391357421875, 1.794921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 5.0, 9.0, 8.0, 15.0, 27.0, 34.0, 39.0, 54.0, 96.0, 145.0, 188.0, 269.0, 399.0, 600.0, 848.0, 1253.0, 1901.0, 2904.0, 4211.0, 6178.0, 9152.0, 14231.0, 21918.0, 35410.0, 57109.0, 95967.0, 157392.0, 202312.0, 165937.0, 103128.0, 61327.0, 37237.0, 23187.0, 15069.0, 9877.0, 6587.0, 4407.0, 2826.0, 2005.0, 1379.0, 906.0, 656.0, 432.0, 276.0, 213.0, 141.0, 101.0, 66.0, 40.0, 33.0, 20.0, 18.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.159423828125, -0.1543731689453125, -0.149322509765625, -0.1442718505859375, -0.13922119140625, -0.1341705322265625, -0.129119873046875, -0.1240692138671875, -0.1190185546875, -0.1139678955078125, -0.108917236328125, -0.1038665771484375, -0.09881591796875, -0.0937652587890625, -0.088714599609375, -0.0836639404296875, -0.07861328125, -0.0735626220703125, -0.068511962890625, -0.0634613037109375, -0.05841064453125, -0.0533599853515625, -0.048309326171875, -0.0432586669921875, -0.0382080078125, -0.0331573486328125, -0.028106689453125, -0.0230560302734375, -0.01800537109375, -0.0129547119140625, -0.007904052734375, -0.0028533935546875, 0.002197265625, 0.0072479248046875, 0.012298583984375, 0.0173492431640625, 0.02239990234375, 0.0274505615234375, 0.032501220703125, 0.0375518798828125, 0.0426025390625, 0.0476531982421875, 0.052703857421875, 0.0577545166015625, 0.06280517578125, 0.0678558349609375, 0.072906494140625, 0.0779571533203125, 0.0830078125, 0.0880584716796875, 0.093109130859375, 0.0981597900390625, 0.10321044921875, 0.1082611083984375, 0.113311767578125, 0.1183624267578125, 0.1234130859375, 0.1284637451171875, 0.133514404296875, 0.1385650634765625, 0.14361572265625, 0.1486663818359375, 0.153717041015625, 0.1587677001953125, 0.163818359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 5.0, 5.0, 5.0, 14.0, 12.0, 8.0, 17.0, 17.0, 22.0, 14.0, 20.0, 27.0, 27.0, 21.0, 33.0, 25.0, 34.0, 35.0, 33.0, 41.0, 44.0, 1074.0, 43.0, 41.0, 37.0, 39.0, 42.0, 32.0, 25.0, 21.0, 20.0, 13.0, 23.0, 24.0, 21.0, 19.0, 12.0, 9.0, 12.0, 7.0, 9.0, 9.0, 9.0, 1.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3662109375, -1.3244781494140625, -1.282745361328125, -1.2410125732421875, -1.19927978515625, -1.1575469970703125, -1.115814208984375, -1.0740814208984375, -1.0323486328125, -0.9906158447265625, -0.948883056640625, -0.9071502685546875, -0.86541748046875, -0.8236846923828125, -0.781951904296875, -0.7402191162109375, -0.698486328125, -0.6567535400390625, -0.615020751953125, -0.5732879638671875, -0.53155517578125, -0.4898223876953125, -0.448089599609375, -0.4063568115234375, -0.3646240234375, -0.3228912353515625, -0.281158447265625, -0.2394256591796875, -0.19769287109375, -0.1559600830078125, -0.114227294921875, -0.0724945068359375, -0.03076171875, 0.0109710693359375, 0.052703857421875, 0.0944366455078125, 0.13616943359375, 0.1779022216796875, 0.219635009765625, 0.2613677978515625, 0.3031005859375, 0.3448333740234375, 0.386566162109375, 0.4282989501953125, 0.47003173828125, 0.5117645263671875, 0.553497314453125, 0.5952301025390625, 0.636962890625, 0.6786956787109375, 0.720428466796875, 0.7621612548828125, 0.80389404296875, 0.8456268310546875, 0.887359619140625, 0.9290924072265625, 0.9708251953125, 1.0125579833984375, 1.054290771484375, 1.0960235595703125, 1.13775634765625, 1.1794891357421875, 1.221221923828125, 1.2629547119140625, 1.3046875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 8.0, 24.0, 21.0, 35.0, 48.0, 77.0, 121.0, 181.0, 233.0, 397.0, 652.0, 1127.0, 1984.0, 3891.0, 7535.0, 16424.0, 48775.0, 1742372.0, 219296.0, 29211.0, 11922.0, 5661.0, 3036.0, 1661.0, 931.0, 497.0, 334.0, 201.0, 135.0, 92.0, 52.0, 49.0, 21.0, 25.0, 18.0, 21.0, 14.0, 8.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3788871765136719, -0.36617279052734375, -0.3534584045410156, -0.3407440185546875, -0.3280296325683594, -0.31531524658203125, -0.3026008605957031, -0.289886474609375, -0.2771720886230469, -0.26445770263671875, -0.2517433166503906, -0.2390289306640625, -0.22631454467773438, -0.21360015869140625, -0.20088577270507812, -0.18817138671875, -0.17545700073242188, -0.16274261474609375, -0.15002822875976562, -0.1373138427734375, -0.12459945678710938, -0.11188507080078125, -0.09917068481445312, -0.086456298828125, -0.07374191284179688, -0.06102752685546875, -0.048313140869140625, -0.0355987548828125, -0.022884368896484375, -0.01016998291015625, 0.002544403076171875, 0.0152587890625, 0.027973175048828125, 0.04068756103515625, 0.053401947021484375, 0.0661163330078125, 0.07883071899414062, 0.09154510498046875, 0.10425949096679688, 0.116973876953125, 0.12968826293945312, 0.14240264892578125, 0.15511703491210938, 0.1678314208984375, 0.18054580688476562, 0.19326019287109375, 0.20597457885742188, 0.21868896484375, 0.23140335083007812, 0.24411773681640625, 0.2568321228027344, 0.2695465087890625, 0.2822608947753906, 0.29497528076171875, 0.3076896667480469, 0.320404052734375, 0.3331184387207031, 0.34583282470703125, 0.3585472106933594, 0.3712615966796875, 0.3839759826660156, 0.39669036865234375, 0.4094047546386719, 0.422119140625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 8.0, 11.0, 17.0, 14.0, 22.0, 24.0, 24.0, 22.0, 16.0, 31.0, 52.0, 25.0, 49.0, 46.0, 53.0, 31.0, 53.0, 50.0, 63.0, 44.0, 62.0, 42.0, 43.0, 33.0, 30.0, 21.0, 26.0, 17.0, 18.0, 10.0, 7.0, 14.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01430511474609375, -0.013888239860534668, -0.013471364974975586, -0.013054490089416504, -0.012637615203857422, -0.01222074031829834, -0.011803865432739258, -0.011386990547180176, -0.010970115661621094, -0.010553240776062012, -0.01013636589050293, -0.009719491004943848, -0.009302616119384766, -0.008885741233825684, -0.008468866348266602, -0.00805199146270752, -0.0076351165771484375, -0.0072182416915893555, -0.0068013668060302734, -0.006384491920471191, -0.005967617034912109, -0.005550742149353027, -0.005133867263793945, -0.004716992378234863, -0.004300117492675781, -0.0038832426071166992, -0.003466367721557617, -0.003049492835998535, -0.002632617950439453, -0.002215743064880371, -0.001798868179321289, -0.001381993293762207, -0.000965118408203125, -0.000548243522644043, -0.00013136863708496094, 0.0002855062484741211, 0.0007023811340332031, 0.0011192560195922852, 0.0015361309051513672, 0.0019530057907104492, 0.0023698806762695312, 0.0027867555618286133, 0.0032036304473876953, 0.0036205053329467773, 0.004037380218505859, 0.004454255104064941, 0.0048711299896240234, 0.0052880048751831055, 0.0057048797607421875, 0.0061217546463012695, 0.0065386295318603516, 0.006955504417419434, 0.007372379302978516, 0.007789254188537598, 0.00820612907409668, 0.008623003959655762, 0.009039878845214844, 0.009456753730773926, 0.009873628616333008, 0.01029050350189209, 0.010707378387451172, 0.011124253273010254, 0.011541128158569336, 0.011958003044128418, 0.0123748779296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 2.0, 10.0, 10.0, 9.0, 19.0, 21.0, 28.0, 34.0, 41.0, 55.0, 78.0, 108.0, 167.0, 286.0, 634.0, 4153.0, 991980.0, 49041.0, 834.0, 366.0, 181.0, 102.0, 98.0, 64.0, 50.0, 36.0, 24.0, 30.0, 17.0, 21.0, 16.0, 11.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.266357421875, -0.25738525390625, -0.2484130859375, -0.23944091796875, -0.23046875, -0.22149658203125, -0.2125244140625, -0.20355224609375, -0.194580078125, -0.18560791015625, -0.1766357421875, -0.16766357421875, -0.15869140625, -0.14971923828125, -0.1407470703125, -0.13177490234375, -0.122802734375, -0.11383056640625, -0.1048583984375, -0.09588623046875, -0.0869140625, -0.07794189453125, -0.0689697265625, -0.05999755859375, -0.051025390625, -0.04205322265625, -0.0330810546875, -0.02410888671875, -0.01513671875, -0.00616455078125, 0.0028076171875, 0.01177978515625, 0.020751953125, 0.02972412109375, 0.0386962890625, 0.04766845703125, 0.056640625, 0.06561279296875, 0.0745849609375, 0.08355712890625, 0.092529296875, 0.10150146484375, 0.1104736328125, 0.11944580078125, 0.12841796875, 0.13739013671875, 0.1463623046875, 0.15533447265625, 0.164306640625, 0.17327880859375, 0.1822509765625, 0.19122314453125, 0.2001953125, 0.20916748046875, 0.2181396484375, 0.22711181640625, 0.236083984375, 0.24505615234375, 0.2540283203125, 0.26300048828125, 0.27197265625, 0.28094482421875, 0.2899169921875, 0.29888916015625, 0.307861328125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 16.0, 48.0, 233.0, 545.0, 143.0, 22.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14738336205482483, -0.14413972198963165, -0.14089608192443848, -0.1376524269580841, -0.13440878689289093, -0.13116514682769775, -0.12792150676250458, -0.1246778666973114, -0.12143422663211823, -0.11819058656692505, -0.11494693905115128, -0.1117032989859581, -0.10845965892076492, -0.10521601140499115, -0.10197237133979797, -0.0987287312746048, -0.09548508375883102, -0.09224144369363785, -0.08899779617786407, -0.0857541561126709, -0.08251051604747772, -0.07926687598228455, -0.07602322846651077, -0.0727795884013176, -0.06953594088554382, -0.06629230082035065, -0.06304865330457687, -0.0598050132393837, -0.05656137317419052, -0.053317729383707047, -0.05007408559322357, -0.046830445528030396, -0.043586812913417816, -0.04034316912293434, -0.037099529057741165, -0.03385588526725769, -0.030612243339419365, -0.02736860141158104, -0.024124957621097565, -0.02088131569325924, -0.017637673765420914, -0.014394031837582588, -0.011150388978421688, -0.007906746119260788, -0.0046631041914224625, -0.001419462263584137, 0.0018241815268993378, 0.005067823454737663, 0.008311465382575989, 0.011555107310414314, 0.014798750169575214, 0.018042393028736115, 0.02128603495657444, 0.024529676884412766, 0.02777332067489624, 0.031016962602734566, 0.03426060453057289, 0.037504248321056366, 0.04074788838624954, 0.04399153217673302, 0.04723517596721649, 0.05047881603240967, 0.05372245982289314, 0.05696610361337662, 0.060209743678569794]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 7.0, 7.0, 6.0, 19.0, 10.0, 22.0, 22.0, 22.0, 34.0, 30.0, 31.0, 22.0, 39.0, 51.0, 36.0, 47.0, 45.0, 49.0, 34.0, 35.0, 36.0, 45.0, 38.0, 37.0, 31.0, 31.0, 42.0, 23.0, 24.0, 13.0, 19.0, 19.0, 9.0, 9.0, 12.0, 5.0, 7.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.019085168838500977, -0.018519429489970207, -0.017953690141439438, -0.01738795079290867, -0.0168222114443779, -0.01625647209584713, -0.01569073274731636, -0.015124993398785591, -0.014559254050254822, -0.013993514701724052, -0.013427775353193283, -0.012862036004662514, -0.012296296656131744, -0.011730557307600975, -0.011164817959070206, -0.010599078610539436, -0.010033339262008667, -0.009467599913477898, -0.008901860564947128, -0.008336121216416359, -0.00777038186788559, -0.00720464251935482, -0.006638903170824051, -0.0060731638222932816, -0.005507424473762512, -0.004941685125231743, -0.0043759457767009735, -0.003810206428170204, -0.003244467079639435, -0.0026787277311086655, -0.002112988382577896, -0.0015472490340471268, -0.0009815096855163574, -0.0004157703369855881, 0.00014996901154518127, 0.0007157083600759506, 0.00128144770860672, 0.0018471870571374893, 0.0024129264056682587, 0.002978665754199028, 0.0035444051027297974, 0.004110144451260567, 0.004675883799791336, 0.005241623148322105, 0.005807362496852875, 0.006373101845383644, 0.0069388411939144135, 0.007504580542445183, 0.008070319890975952, 0.008636059239506721, 0.00920179858803749, 0.00976753793656826, 0.01033327728509903, 0.010899016633629799, 0.011464755982160568, 0.012030495330691338, 0.012596234679222107, 0.013161974027752876, 0.013727713376283646, 0.014293452724814415, 0.014859192073345184, 0.015424931421875954, 0.015990670770406723, 0.016556410118937492, 0.01712214946746826]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 6.0, 7.0, 14.0, 16.0, 14.0, 14.0, 20.0, 24.0, 18.0, 21.0, 20.0, 24.0, 34.0, 29.0, 50.0, 41.0, 41.0, 41.0, 43.0, 37.0, 41.0, 36.0, 45.0, 38.0, 33.0, 33.0, 32.0, 24.0, 25.0, 30.0, 24.0, 20.0, 18.0, 13.0, 10.0, 6.0, 15.0, 4.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.20703125, -2.144500732421875, -2.08197021484375, -2.019439697265625, -1.9569091796875, -1.894378662109375, -1.83184814453125, -1.769317626953125, -1.706787109375, -1.644256591796875, -1.58172607421875, -1.519195556640625, -1.4566650390625, -1.394134521484375, -1.33160400390625, -1.269073486328125, -1.20654296875, -1.144012451171875, -1.08148193359375, -1.018951416015625, -0.9564208984375, -0.893890380859375, -0.83135986328125, -0.768829345703125, -0.706298828125, -0.643768310546875, -0.58123779296875, -0.518707275390625, -0.4561767578125, -0.393646240234375, -0.33111572265625, -0.268585205078125, -0.2060546875, -0.143524169921875, -0.08099365234375, -0.018463134765625, 0.0440673828125, 0.106597900390625, 0.16912841796875, 0.231658935546875, 0.294189453125, 0.356719970703125, 0.41925048828125, 0.481781005859375, 0.5443115234375, 0.606842041015625, 0.66937255859375, 0.731903076171875, 0.79443359375, 0.856964111328125, 0.91949462890625, 0.982025146484375, 1.0445556640625, 1.107086181640625, 1.16961669921875, 1.232147216796875, 1.294677734375, 1.357208251953125, 1.41973876953125, 1.482269287109375, 1.5447998046875, 1.607330322265625, 1.66986083984375, 1.732391357421875, 1.794921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 11.0, 20.0, 32.0, 29.0, 45.0, 88.0, 105.0, 170.0, 227.0, 319.0, 498.0, 719.0, 1106.0, 1617.0, 2314.0, 3699.0, 5803.0, 9132.0, 14538.0, 24036.0, 40680.0, 73160.0, 141531.0, 250443.0, 216234.0, 112804.0, 59877.0, 34031.0, 20398.0, 12397.0, 7765.0, 4998.0, 3290.0, 2120.0, 1425.0, 949.0, 574.0, 428.0, 288.0, 174.0, 131.0, 100.0, 67.0, 42.0, 29.0, 19.0, 24.0, 18.0, 11.0, 9.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.0802001953125, -2.008056640625, -1.9359130859375, -1.86376953125, -1.7916259765625, -1.719482421875, -1.6473388671875, -1.5751953125, -1.5030517578125, -1.430908203125, -1.3587646484375, -1.28662109375, -1.2144775390625, -1.142333984375, -1.0701904296875, -0.998046875, -0.9259033203125, -0.853759765625, -0.7816162109375, -0.70947265625, -0.6373291015625, -0.565185546875, -0.4930419921875, -0.4208984375, -0.3487548828125, -0.276611328125, -0.2044677734375, -0.13232421875, -0.0601806640625, 0.011962890625, 0.0841064453125, 0.15625, 0.2283935546875, 0.300537109375, 0.3726806640625, 0.44482421875, 0.5169677734375, 0.589111328125, 0.6612548828125, 0.7333984375, 0.8055419921875, 0.877685546875, 0.9498291015625, 1.02197265625, 1.0941162109375, 1.166259765625, 1.2384033203125, 1.310546875, 1.3826904296875, 1.454833984375, 1.5269775390625, 1.59912109375, 1.6712646484375, 1.743408203125, 1.8155517578125, 1.8876953125, 1.9598388671875, 2.031982421875, 2.1041259765625, 2.17626953125, 2.2484130859375, 2.320556640625, 2.3927001953125, 2.46484375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 5.0, 6.0, 6.0, 10.0, 12.0, 15.0, 20.0, 20.0, 25.0, 29.0, 36.0, 37.0, 38.0, 60.0, 65.0, 89.0, 125.0, 214.0, 1319.0, 240.0, 136.0, 94.0, 73.0, 55.0, 52.0, 43.0, 32.0, 25.0, 29.0, 27.0, 20.0, 21.0, 19.0, 13.0, 5.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4140625, -5.2530517578125, -5.092041015625, -4.9310302734375, -4.77001953125, -4.6090087890625, -4.447998046875, -4.2869873046875, -4.1259765625, -3.9649658203125, -3.803955078125, -3.6429443359375, -3.48193359375, -3.3209228515625, -3.159912109375, -2.9989013671875, -2.837890625, -2.6768798828125, -2.515869140625, -2.3548583984375, -2.19384765625, -2.0328369140625, -1.871826171875, -1.7108154296875, -1.5498046875, -1.3887939453125, -1.227783203125, -1.0667724609375, -0.90576171875, -0.7447509765625, -0.583740234375, -0.4227294921875, -0.26171875, -0.1007080078125, 0.060302734375, 0.2213134765625, 0.38232421875, 0.5433349609375, 0.704345703125, 0.8653564453125, 1.0263671875, 1.1873779296875, 1.348388671875, 1.5093994140625, 1.67041015625, 1.8314208984375, 1.992431640625, 2.1534423828125, 2.314453125, 2.4754638671875, 2.636474609375, 2.7974853515625, 2.95849609375, 3.1195068359375, 3.280517578125, 3.4415283203125, 3.6025390625, 3.7635498046875, 3.924560546875, 4.0855712890625, 4.24658203125, 4.4075927734375, 4.568603515625, 4.7296142578125, 4.890625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 11.0, 10.0, 16.0, 20.0, 19.0, 33.0, 27.0, 61.0, 80.0, 114.0, 186.0, 238.0, 510.0, 1064.0, 3085.0, 10045.0, 35896.0, 227084.0, 2459779.0, 343645.0, 45705.0, 11803.0, 3583.0, 1235.0, 529.0, 307.0, 176.0, 114.0, 86.0, 54.0, 40.0, 24.0, 27.0, 21.0, 11.0, 13.0, 11.0, 5.0, 6.0, 9.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.37890625, -6.1702880859375, -5.961669921875, -5.7530517578125, -5.54443359375, -5.3358154296875, -5.127197265625, -4.9185791015625, -4.7099609375, -4.5013427734375, -4.292724609375, -4.0841064453125, -3.87548828125, -3.6668701171875, -3.458251953125, -3.2496337890625, -3.041015625, -2.8323974609375, -2.623779296875, -2.4151611328125, -2.20654296875, -1.9979248046875, -1.789306640625, -1.5806884765625, -1.3720703125, -1.1634521484375, -0.954833984375, -0.7462158203125, -0.53759765625, -0.3289794921875, -0.120361328125, 0.0882568359375, 0.296875, 0.5054931640625, 0.714111328125, 0.9227294921875, 1.13134765625, 1.3399658203125, 1.548583984375, 1.7572021484375, 1.9658203125, 2.1744384765625, 2.383056640625, 2.5916748046875, 2.80029296875, 3.0089111328125, 3.217529296875, 3.4261474609375, 3.634765625, 3.8433837890625, 4.052001953125, 4.2606201171875, 4.46923828125, 4.6778564453125, 4.886474609375, 5.0950927734375, 5.3037109375, 5.5123291015625, 5.720947265625, 5.9295654296875, 6.13818359375, 6.3468017578125, 6.555419921875, 6.7640380859375, 6.97265625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 26.0, 71.0, 189.0, 251.0, 260.0, 127.0, 58.0, 16.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.67680740356445, -44.46885681152344, -43.26090621948242, -42.052955627441406, -40.84500503540039, -39.637054443359375, -38.429107666015625, -37.22115707397461, -36.013206481933594, -34.80525588989258, -33.59730529785156, -32.38935470581055, -31.181406021118164, -29.97345542907715, -28.765504837036133, -27.55755615234375, -26.3496036529541, -25.141653060913086, -23.93370246887207, -22.725753784179688, -21.517803192138672, -20.309852600097656, -19.10190200805664, -17.893951416015625, -16.68600082397461, -15.478050231933594, -14.270100593566895, -13.062150001525879, -11.85420036315918, -10.646249771118164, -9.438299179077148, -8.23034954071045, -7.02239990234375, -5.814449787139893, -4.606499671936035, -3.3985490798950195, -2.190598964691162, -0.9826488494873047, 0.22530174255371094, 1.4332513809204102, 2.641201972961426, 3.849152088165283, 5.057102203369141, 6.265052795410156, 7.473002910614014, 8.680953025817871, 9.888903617858887, 11.096853256225586, 12.304803848266602, 13.512754440307617, 14.720704078674316, 15.928654670715332, 17.13660430908203, 18.344554901123047, 19.552505493164062, 20.760456085205078, 21.968406677246094, 23.17635726928711, 24.384307861328125, 25.59225845336914, 26.800207138061523, 28.00815773010254, 29.216108322143555, 30.424057006835938, 31.632007598876953]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 4.0, 15.0, 12.0, 13.0, 10.0, 15.0, 24.0, 23.0, 21.0, 32.0, 37.0, 22.0, 31.0, 38.0, 36.0, 47.0, 39.0, 52.0, 43.0, 48.0, 49.0, 44.0, 41.0, 38.0, 34.0, 33.0, 32.0, 24.0, 22.0, 22.0, 16.0, 20.0, 8.0, 13.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.214388847351074, -12.81005573272705, -12.405723571777344, -12.00139045715332, -11.597057342529297, -11.192724227905273, -10.788392066955566, -10.384058952331543, -9.979726791381836, -9.575393676757812, -9.171061515808105, -8.766728401184082, -8.362395286560059, -7.958062648773193, -7.553730010986328, -7.149396896362305, -6.745063781738281, -6.340731143951416, -5.936398029327393, -5.532065391540527, -5.127732276916504, -4.723399639129639, -4.319067001342773, -3.914734125137329, -3.5104012489318848, -3.1060683727264404, -2.701735496520996, -2.297402858734131, -1.8930699825286865, -1.4887371063232422, -1.084404468536377, -0.6800715923309326, -0.2757396697998047, 0.12859314680099487, 0.5329259634017944, 0.9372587203979492, 1.3415915966033936, 1.745924472808838, 2.150257110595703, 2.5545899868011475, 2.958922863006592, 3.363255739212036, 3.7675886154174805, 4.171921253204346, 4.576253890991211, 4.980587005615234, 5.3849196434021, 5.789252281188965, 6.193585395812988, 6.5979180335998535, 7.002251148223877, 7.406583786010742, 7.810916900634766, 8.215250015258789, 8.619582176208496, 9.02391529083252, 9.428247451782227, 9.83258056640625, 10.236912727355957, 10.64124584197998, 11.045578956604004, 11.449911117553711, 11.854244232177734, 12.258577346801758, 12.662910461425781]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 4.0, 3.0, 6.0, 10.0, 18.0, 10.0, 13.0, 14.0, 13.0, 18.0, 20.0, 22.0, 23.0, 33.0, 43.0, 45.0, 33.0, 44.0, 47.0, 49.0, 43.0, 45.0, 48.0, 36.0, 43.0, 23.0, 38.0, 30.0, 34.0, 19.0, 29.0, 20.0, 18.0, 16.0, 19.0, 12.0, 16.0, 4.0, 8.0, 7.0, 2.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-2.458984375, -2.3902740478515625, -2.321563720703125, -2.2528533935546875, -2.18414306640625, -2.1154327392578125, -2.046722412109375, -1.9780120849609375, -1.9093017578125, -1.8405914306640625, -1.771881103515625, -1.7031707763671875, -1.63446044921875, -1.5657501220703125, -1.497039794921875, -1.4283294677734375, -1.359619140625, -1.2909088134765625, -1.222198486328125, -1.1534881591796875, -1.08477783203125, -1.0160675048828125, -0.947357177734375, -0.8786468505859375, -0.8099365234375, -0.7412261962890625, -0.672515869140625, -0.6038055419921875, -0.53509521484375, -0.4663848876953125, -0.397674560546875, -0.3289642333984375, -0.26025390625, -0.1915435791015625, -0.122833251953125, -0.0541229248046875, 0.01458740234375, 0.0832977294921875, 0.152008056640625, 0.2207183837890625, 0.2894287109375, 0.3581390380859375, 0.426849365234375, 0.4955596923828125, 0.56427001953125, 0.6329803466796875, 0.701690673828125, 0.7704010009765625, 0.839111328125, 0.9078216552734375, 0.976531982421875, 1.0452423095703125, 1.11395263671875, 1.1826629638671875, 1.251373291015625, 1.3200836181640625, 1.3887939453125, 1.4575042724609375, 1.526214599609375, 1.5949249267578125, 1.66363525390625, 1.7323455810546875, 1.801055908203125, 1.8697662353515625, 1.9384765625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 10.0, 6.0, 9.0, 12.0, 10.0, 18.0, 14.0, 29.0, 40.0, 47.0, 52.0, 72.0, 95.0, 148.0, 179.0, 326.0, 944.0, 5075.0, 79127.0, 4012538.0, 87848.0, 5500.0, 1013.0, 357.0, 203.0, 135.0, 116.0, 74.0, 55.0, 42.0, 36.0, 27.0, 23.0, 19.0, 11.0, 17.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.90625, -19.312255859375, -18.71826171875, -18.124267578125, -17.5302734375, -16.936279296875, -16.34228515625, -15.748291015625, -15.154296875, -14.560302734375, -13.96630859375, -13.372314453125, -12.7783203125, -12.184326171875, -11.59033203125, -10.996337890625, -10.40234375, -9.808349609375, -9.21435546875, -8.620361328125, -8.0263671875, -7.432373046875, -6.83837890625, -6.244384765625, -5.650390625, -5.056396484375, -4.46240234375, -3.868408203125, -3.2744140625, -2.680419921875, -2.08642578125, -1.492431640625, -0.8984375, -0.304443359375, 0.28955078125, 0.883544921875, 1.4775390625, 2.071533203125, 2.66552734375, 3.259521484375, 3.853515625, 4.447509765625, 5.04150390625, 5.635498046875, 6.2294921875, 6.823486328125, 7.41748046875, 8.011474609375, 8.60546875, 9.199462890625, 9.79345703125, 10.387451171875, 10.9814453125, 11.575439453125, 12.16943359375, 12.763427734375, 13.357421875, 13.951416015625, 14.54541015625, 15.139404296875, 15.7333984375, 16.327392578125, 16.92138671875, 17.515380859375, 18.109375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 14.0, 5.0, 10.0, 15.0, 21.0, 20.0, 25.0, 43.0, 61.0, 85.0, 108.0, 146.0, 220.0, 292.0, 489.0, 754.0, 585.0, 359.0, 241.0, 144.0, 107.0, 68.0, 65.0, 55.0, 32.0, 23.0, 16.0, 15.0, 9.0, 5.0, 11.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.907684326171875, -3.78802490234375, -3.668365478515625, -3.5487060546875, -3.429046630859375, -3.30938720703125, -3.189727783203125, -3.070068359375, -2.950408935546875, -2.83074951171875, -2.711090087890625, -2.5914306640625, -2.471771240234375, -2.35211181640625, -2.232452392578125, -2.11279296875, -1.993133544921875, -1.87347412109375, -1.753814697265625, -1.6341552734375, -1.514495849609375, -1.39483642578125, -1.275177001953125, -1.155517578125, -1.035858154296875, -0.91619873046875, -0.796539306640625, -0.6768798828125, -0.557220458984375, -0.43756103515625, -0.317901611328125, -0.1982421875, -0.078582763671875, 0.04107666015625, 0.160736083984375, 0.2803955078125, 0.400054931640625, 0.51971435546875, 0.639373779296875, 0.759033203125, 0.878692626953125, 0.99835205078125, 1.118011474609375, 1.2376708984375, 1.357330322265625, 1.47698974609375, 1.596649169921875, 1.71630859375, 1.835968017578125, 1.95562744140625, 2.075286865234375, 2.1949462890625, 2.314605712890625, 2.43426513671875, 2.553924560546875, 2.673583984375, 2.793243408203125, 2.91290283203125, 3.032562255859375, 3.1522216796875, 3.271881103515625, 3.39154052734375, 3.511199951171875, 3.630859375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 14.0, 11.0, 16.0, 12.0, 36.0, 48.0, 65.0, 87.0, 165.0, 273.0, 622.0, 1405.0, 4514.0, 17359.0, 88894.0, 1127901.0, 2774585.0, 143631.0, 25064.0, 6119.0, 1835.0, 703.0, 331.0, 211.0, 112.0, 64.0, 50.0, 35.0, 24.0, 24.0, 18.0, 12.0, 5.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.7554931640625, -7.479736328125, -7.2039794921875, -6.92822265625, -6.6524658203125, -6.376708984375, -6.1009521484375, -5.8251953125, -5.5494384765625, -5.273681640625, -4.9979248046875, -4.72216796875, -4.4464111328125, -4.170654296875, -3.8948974609375, -3.619140625, -3.3433837890625, -3.067626953125, -2.7918701171875, -2.51611328125, -2.2403564453125, -1.964599609375, -1.6888427734375, -1.4130859375, -1.1373291015625, -0.861572265625, -0.5858154296875, -0.31005859375, -0.0343017578125, 0.241455078125, 0.5172119140625, 0.79296875, 1.0687255859375, 1.344482421875, 1.6202392578125, 1.89599609375, 2.1717529296875, 2.447509765625, 2.7232666015625, 2.9990234375, 3.2747802734375, 3.550537109375, 3.8262939453125, 4.10205078125, 4.3778076171875, 4.653564453125, 4.9293212890625, 5.205078125, 5.4808349609375, 5.756591796875, 6.0323486328125, 6.30810546875, 6.5838623046875, 6.859619140625, 7.1353759765625, 7.4111328125, 7.6868896484375, 7.962646484375, 8.2384033203125, 8.51416015625, 8.7899169921875, 9.065673828125, 9.3414306640625, 9.6171875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 10.0, 49.0, 110.0, 246.0, 304.0, 182.0, 78.0, 26.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.19058227539062, -74.70643615722656, -73.22228240966797, -71.7381362915039, -70.25398254394531, -68.76983642578125, -67.28569030761719, -65.8015365600586, -64.31739044189453, -62.8332405090332, -61.349090576171875, -59.86494445800781, -58.380794525146484, -56.896644592285156, -55.412498474121094, -53.928348541259766, -52.44419860839844, -50.96004867553711, -49.47589874267578, -47.99175262451172, -46.50760269165039, -45.02345275878906, -43.539306640625, -42.05515670776367, -40.571006774902344, -39.086856842041016, -37.60270690917969, -36.118560791015625, -34.6344108581543, -33.15026092529297, -31.666112899780273, -30.181964874267578, -28.69781494140625, -27.213665008544922, -25.729516983032227, -24.24536895751953, -22.761219024658203, -21.277069091796875, -19.79292106628418, -18.308773040771484, -16.824623107910156, -15.340474128723145, -13.856325149536133, -12.372176170349121, -10.88802719116211, -9.403878211975098, -7.919729232788086, -6.435580253601074, -4.9514312744140625, -3.467282295227051, -1.983133316040039, -0.49898433685302734, 0.9851646423339844, 2.469313621520996, 3.953462600708008, 5.4376115798950195, 6.921760559082031, 8.405909538269043, 9.890058517456055, 11.374207496643066, 12.858356475830078, 14.34250545501709, 15.826654434204102, 17.310802459716797, 18.794952392578125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 9.0, 7.0, 6.0, 12.0, 16.0, 11.0, 17.0, 13.0, 21.0, 21.0, 26.0, 33.0, 18.0, 29.0, 28.0, 34.0, 30.0, 27.0, 33.0, 31.0, 31.0, 34.0, 42.0, 39.0, 36.0, 40.0, 35.0, 38.0, 36.0, 29.0, 14.0, 31.0, 26.0, 21.0, 15.0, 20.0, 15.0, 15.0, 15.0, 11.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.849674224853516, -10.510754585266113, -10.171834945678711, -9.832914352416992, -9.49399471282959, -9.155075073242188, -8.816155433654785, -8.477235794067383, -8.138315200805664, -7.799395561218262, -7.460475444793701, -7.121555805206299, -6.782635688781738, -6.443716049194336, -6.104796409606934, -5.765876770019531, -5.426957130432129, -5.088037490844727, -4.749117374420166, -4.410197734832764, -4.071277618408203, -3.732357978820801, -3.3934383392333984, -3.054518461227417, -2.7155985832214355, -2.376678705215454, -2.0377588272094727, -1.6988391876220703, -1.3599193096160889, -1.0209994316101074, -0.6820797920227051, -0.34315991401672363, -0.0042400360107421875, 0.3346797823905945, 0.6735996007919312, 1.012519359588623, 1.3514392375946045, 1.690359115600586, 2.0292787551879883, 2.3681986331939697, 2.707118511199951, 3.0460383892059326, 3.384958267211914, 3.7238779067993164, 4.062797546386719, 4.401717662811279, 4.740637302398682, 5.079557418823242, 5.4184770584106445, 5.757396697998047, 6.096316814422607, 6.43523645401001, 6.77415657043457, 7.113076210021973, 7.451995849609375, 7.790915489196777, 8.12983512878418, 8.468754768371582, 8.807674407958984, 9.146595001220703, 9.485514640808105, 9.824434280395508, 10.16335391998291, 10.502273559570312, 10.841194152832031]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 9.0, 8.0, 17.0, 11.0, 18.0, 33.0, 24.0, 26.0, 38.0, 34.0, 48.0, 39.0, 45.0, 39.0, 44.0, 43.0, 46.0, 54.0, 40.0, 38.0, 40.0, 48.0, 39.0, 30.0, 17.0, 24.0, 24.0, 16.0, 18.0, 16.0, 10.0, 13.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.473663330078125, -2.39849853515625, -2.323333740234375, -2.2481689453125, -2.173004150390625, -2.09783935546875, -2.022674560546875, -1.947509765625, -1.872344970703125, -1.79718017578125, -1.722015380859375, -1.6468505859375, -1.571685791015625, -1.49652099609375, -1.421356201171875, -1.34619140625, -1.271026611328125, -1.19586181640625, -1.120697021484375, -1.0455322265625, -0.970367431640625, -0.89520263671875, -0.820037841796875, -0.744873046875, -0.669708251953125, -0.59454345703125, -0.519378662109375, -0.4442138671875, -0.369049072265625, -0.29388427734375, -0.218719482421875, -0.1435546875, -0.068389892578125, 0.00677490234375, 0.081939697265625, 0.1571044921875, 0.232269287109375, 0.30743408203125, 0.382598876953125, 0.457763671875, 0.532928466796875, 0.60809326171875, 0.683258056640625, 0.7584228515625, 0.833587646484375, 0.90875244140625, 0.983917236328125, 1.05908203125, 1.134246826171875, 1.20941162109375, 1.284576416015625, 1.3597412109375, 1.434906005859375, 1.51007080078125, 1.585235595703125, 1.660400390625, 1.735565185546875, 1.81072998046875, 1.885894775390625, 1.9610595703125, 2.036224365234375, 2.11138916015625, 2.186553955078125, 2.26171875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 5.0, 5.0, 6.0, 12.0, 16.0, 20.0, 25.0, 36.0, 39.0, 65.0, 94.0, 133.0, 203.0, 301.0, 465.0, 692.0, 1111.0, 1694.0, 2814.0, 4451.0, 7275.0, 12016.0, 20999.0, 37172.0, 70331.0, 137804.0, 235456.0, 230189.0, 131399.0, 67513.0, 35739.0, 20133.0, 11614.0, 6965.0, 4234.0, 2604.0, 1636.0, 1135.0, 683.0, 457.0, 334.0, 209.0, 173.0, 102.0, 64.0, 48.0, 26.0, 20.0, 14.0, 16.0, 10.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.232177734375, -0.22467994689941406, -0.21718215942382812, -0.2096843719482422, -0.20218658447265625, -0.1946887969970703, -0.18719100952148438, -0.17969322204589844, -0.1721954345703125, -0.16469764709472656, -0.15719985961914062, -0.1497020721435547, -0.14220428466796875, -0.1347064971923828, -0.12720870971679688, -0.11971092224121094, -0.112213134765625, -0.10471534729003906, -0.09721755981445312, -0.08971977233886719, -0.08222198486328125, -0.07472419738769531, -0.06722640991210938, -0.05972862243652344, -0.0522308349609375, -0.04473304748535156, -0.037235260009765625, -0.029737472534179688, -0.02223968505859375, -0.014741897583007812, -0.007244110107421875, 0.0002536773681640625, 0.00775146484375, 0.015249252319335938, 0.022747039794921875, 0.030244827270507812, 0.03774261474609375, 0.04524040222167969, 0.052738189697265625, 0.06023597717285156, 0.0677337646484375, 0.07523155212402344, 0.08272933959960938, 0.09022712707519531, 0.09772491455078125, 0.10522270202636719, 0.11272048950195312, 0.12021827697753906, 0.127716064453125, 0.13521385192871094, 0.14271163940429688, 0.1502094268798828, 0.15770721435546875, 0.1652050018310547, 0.17270278930664062, 0.18020057678222656, 0.1876983642578125, 0.19519615173339844, 0.20269393920898438, 0.2101917266845703, 0.21768951416015625, 0.2251873016357422, 0.23268508911132812, 0.24018287658691406, 0.2476806640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 9.0, 13.0, 13.0, 5.0, 8.0, 13.0, 19.0, 17.0, 16.0, 15.0, 24.0, 33.0, 30.0, 44.0, 30.0, 40.0, 34.0, 44.0, 45.0, 1064.0, 47.0, 39.0, 35.0, 29.0, 41.0, 41.0, 36.0, 26.0, 27.0, 30.0, 25.0, 20.0, 29.0, 12.0, 21.0, 7.0, 10.0, 11.0, 3.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.488037109375, -1.43798828125, -1.387939453125, -1.337890625, -1.287841796875, -1.23779296875, -1.187744140625, -1.1376953125, -1.087646484375, -1.03759765625, -0.987548828125, -0.9375, -0.887451171875, -0.83740234375, -0.787353515625, -0.7373046875, -0.687255859375, -0.63720703125, -0.587158203125, -0.537109375, -0.487060546875, -0.43701171875, -0.386962890625, -0.3369140625, -0.286865234375, -0.23681640625, -0.186767578125, -0.13671875, -0.086669921875, -0.03662109375, 0.013427734375, 0.0634765625, 0.113525390625, 0.16357421875, 0.213623046875, 0.263671875, 0.313720703125, 0.36376953125, 0.413818359375, 0.4638671875, 0.513916015625, 0.56396484375, 0.614013671875, 0.6640625, 0.714111328125, 0.76416015625, 0.814208984375, 0.8642578125, 0.914306640625, 0.96435546875, 1.014404296875, 1.064453125, 1.114501953125, 1.16455078125, 1.214599609375, 1.2646484375, 1.314697265625, 1.36474609375, 1.414794921875, 1.46484375, 1.514892578125, 1.56494140625, 1.614990234375, 1.6650390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 9.0, 10.0, 14.0, 22.0, 26.0, 48.0, 47.0, 65.0, 114.0, 161.0, 217.0, 272.0, 521.0, 763.0, 1243.0, 2196.0, 4071.0, 7315.0, 14414.0, 34758.0, 290847.0, 1650791.0, 50893.0, 18200.0, 8708.0, 4645.0, 2598.0, 1516.0, 869.0, 555.0, 356.0, 225.0, 167.0, 119.0, 93.0, 46.0, 45.0, 41.0, 31.0, 24.0, 13.0, 10.0, 6.0, 7.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.407470703125, -0.39517974853515625, -0.3828887939453125, -0.37059783935546875, -0.358306884765625, -0.34601593017578125, -0.3337249755859375, -0.32143402099609375, -0.30914306640625, -0.29685211181640625, -0.2845611572265625, -0.27227020263671875, -0.259979248046875, -0.24768829345703125, -0.2353973388671875, -0.22310638427734375, -0.2108154296875, -0.19852447509765625, -0.1862335205078125, -0.17394256591796875, -0.161651611328125, -0.14936065673828125, -0.1370697021484375, -0.12477874755859375, -0.11248779296875, -0.10019683837890625, -0.0879058837890625, -0.07561492919921875, -0.063323974609375, -0.05103302001953125, -0.0387420654296875, -0.02645111083984375, -0.01416015625, -0.00186920166015625, 0.0104217529296875, 0.02271270751953125, 0.035003662109375, 0.04729461669921875, 0.0595855712890625, 0.07187652587890625, 0.08416748046875, 0.09645843505859375, 0.1087493896484375, 0.12104034423828125, 0.133331298828125, 0.14562225341796875, 0.1579132080078125, 0.17020416259765625, 0.1824951171875, 0.19478607177734375, 0.2070770263671875, 0.21936798095703125, 0.231658935546875, 0.24394989013671875, 0.2562408447265625, 0.26853179931640625, 0.28082275390625, 0.29311370849609375, 0.3054046630859375, 0.31769561767578125, 0.329986572265625, 0.34227752685546875, 0.3545684814453125, 0.36685943603515625, 0.379150390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 4.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 14.0, 24.0, 23.0, 28.0, 22.0, 31.0, 44.0, 61.0, 57.0, 62.0, 72.0, 65.0, 59.0, 56.0, 58.0, 46.0, 46.0, 38.0, 24.0, 25.0, 18.0, 11.0, 13.0, 13.0, 9.0, 12.0, 6.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0156402587890625, -0.015194177627563477, -0.014748096466064453, -0.01430201530456543, -0.013855934143066406, -0.013409852981567383, -0.01296377182006836, -0.012517690658569336, -0.012071609497070312, -0.011625528335571289, -0.011179447174072266, -0.010733366012573242, -0.010287284851074219, -0.009841203689575195, -0.009395122528076172, -0.008949041366577148, -0.008502960205078125, -0.008056879043579102, -0.007610797882080078, -0.007164716720581055, -0.006718635559082031, -0.006272554397583008, -0.005826473236083984, -0.005380392074584961, -0.0049343109130859375, -0.004488229751586914, -0.004042148590087891, -0.003596067428588867, -0.0031499862670898438, -0.0027039051055908203, -0.002257823944091797, -0.0018117427825927734, -0.00136566162109375, -0.0009195804595947266, -0.0004734992980957031, -2.7418136596679688e-05, 0.00041866302490234375, 0.0008647441864013672, 0.0013108253479003906, 0.001756906509399414, 0.0022029876708984375, 0.002649068832397461, 0.0030951499938964844, 0.003541231155395508, 0.003987312316894531, 0.004433393478393555, 0.004879474639892578, 0.0053255558013916016, 0.005771636962890625, 0.0062177181243896484, 0.006663799285888672, 0.007109880447387695, 0.007555961608886719, 0.008002042770385742, 0.008448123931884766, 0.008894205093383789, 0.009340286254882812, 0.009786367416381836, 0.01023244857788086, 0.010678529739379883, 0.011124610900878906, 0.01157069206237793, 0.012016773223876953, 0.012462854385375977, 0.012908935546875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 6.0, 10.0, 8.0, 18.0, 21.0, 19.0, 32.0, 49.0, 58.0, 84.0, 106.0, 212.0, 341.0, 825.0, 23137.0, 1012712.0, 9304.0, 718.0, 294.0, 173.0, 128.0, 70.0, 42.0, 47.0, 31.0, 24.0, 16.0, 14.0, 12.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2686271667480469, -0.25917816162109375, -0.24972915649414062, -0.2402801513671875, -0.23083114624023438, -0.22138214111328125, -0.21193313598632812, -0.202484130859375, -0.19303512573242188, -0.18358612060546875, -0.17413711547851562, -0.1646881103515625, -0.15523910522460938, -0.14579010009765625, -0.13634109497070312, -0.12689208984375, -0.11744308471679688, -0.10799407958984375, -0.09854507446289062, -0.0890960693359375, -0.07964706420898438, -0.07019805908203125, -0.060749053955078125, -0.051300048828125, -0.041851043701171875, -0.03240203857421875, -0.022953033447265625, -0.0135040283203125, -0.004055023193359375, 0.00539398193359375, 0.014842987060546875, 0.0242919921875, 0.033740997314453125, 0.04319000244140625, 0.052639007568359375, 0.0620880126953125, 0.07153701782226562, 0.08098602294921875, 0.09043502807617188, 0.099884033203125, 0.10933303833007812, 0.11878204345703125, 0.12823104858398438, 0.1376800537109375, 0.14712905883789062, 0.15657806396484375, 0.16602706909179688, 0.17547607421875, 0.18492507934570312, 0.19437408447265625, 0.20382308959960938, 0.2132720947265625, 0.22272109985351562, 0.23217010498046875, 0.24161911010742188, 0.251068115234375, 0.2605171203613281, 0.26996612548828125, 0.2794151306152344, 0.2888641357421875, 0.2983131408691406, 0.30776214599609375, 0.3172111511230469, 0.32666015625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 90.0, 451.0, 392.0, 59.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1871306598186493, -0.18359684944152832, -0.18006303906440735, -0.17652922868728638, -0.1729954183101654, -0.16946160793304443, -0.16592779755592346, -0.1623939722776413, -0.15886016190052032, -0.15532635152339935, -0.15179254114627838, -0.1482587307691574, -0.14472492039203644, -0.14119109511375427, -0.1376572847366333, -0.13412347435951233, -0.13058966398239136, -0.12705585360527039, -0.12352204322814941, -0.11998823285102844, -0.11645441502332687, -0.1129206046462059, -0.10938679426908493, -0.10585298389196396, -0.10231918096542358, -0.09878537058830261, -0.09525156021118164, -0.09171774983406067, -0.0881839320063591, -0.08465012162923813, -0.08111631125211716, -0.07758250087499619, -0.07404869049787521, -0.07051488012075424, -0.06698106974363327, -0.0634472519159317, -0.05991344153881073, -0.05637963116168976, -0.05284582078456879, -0.049312010407447815, -0.045778196305036545, -0.04224438592791557, -0.0387105718255043, -0.03517676144838333, -0.03164295107126236, -0.02810913696885109, -0.024575326591730118, -0.021041514351963997, -0.017507702112197876, -0.013973889872431755, -0.010440078563988209, -0.0069062672555446625, -0.0033724550157785416, 0.00016135722398757935, 0.003695167601108551, 0.007228979840874672, 0.010762792080640793, 0.014296604320406914, 0.017830416560173035, 0.021364226937294006, 0.024898039177060127, 0.028431851416826248, 0.03196566179394722, 0.03549947589635849, 0.03903328627347946]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 1.0, 14.0, 15.0, 17.0, 17.0, 25.0, 19.0, 31.0, 26.0, 33.0, 35.0, 39.0, 33.0, 45.0, 39.0, 37.0, 34.0, 35.0, 35.0, 49.0, 33.0, 38.0, 31.0, 49.0, 30.0, 28.0, 26.0, 26.0, 19.0, 21.0, 17.0, 17.0, 10.0, 9.0, 11.0, 10.0, 7.0, 7.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.019025146961212158, -0.018441013991832733, -0.017856881022453308, -0.017272748053073883, -0.016688615083694458, -0.016104482114315033, -0.015520349144935608, -0.014936216175556183, -0.014352083206176758, -0.013767950236797333, -0.013183817267417908, -0.012599684298038483, -0.012015551328659058, -0.011431418359279633, -0.010847285389900208, -0.010263152420520782, -0.009679019451141357, -0.009094886481761932, -0.008510753512382507, -0.007926620543003082, -0.007342487573623657, -0.006758354604244232, -0.006174221634864807, -0.005590088665485382, -0.005005955696105957, -0.004421822726726532, -0.003837689757347107, -0.003253556787967682, -0.002669423818588257, -0.002085290849208832, -0.0015011578798294067, -0.0009170249104499817, -0.00033289194107055664, 0.0002512410283088684, 0.0008353739976882935, 0.0014195069670677185, 0.0020036399364471436, 0.0025877729058265686, 0.0031719058752059937, 0.0037560388445854187, 0.004340171813964844, 0.004924304783344269, 0.005508437752723694, 0.006092570722103119, 0.006676703691482544, 0.007260836660861969, 0.007844969630241394, 0.008429102599620819, 0.009013235569000244, 0.00959736853837967, 0.010181501507759094, 0.01076563447713852, 0.011349767446517944, 0.01193390041589737, 0.012518033385276794, 0.01310216635465622, 0.013686299324035645, 0.01427043229341507, 0.014854565262794495, 0.01543869823217392, 0.016022831201553345, 0.01660696417093277, 0.017191097140312195, 0.01777523010969162, 0.018359363079071045]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 8.0, 7.0, 19.0, 11.0, 16.0, 35.0, 23.0, 26.0, 38.0, 33.0, 50.0, 38.0, 46.0, 39.0, 43.0, 44.0, 45.0, 54.0, 41.0, 36.0, 40.0, 49.0, 40.0, 29.0, 18.0, 24.0, 23.0, 16.0, 19.0, 16.0, 10.0, 13.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.4755859375, -2.400390625, -2.3251953125, -2.25, -2.1748046875, -2.099609375, -2.0244140625, -1.94921875, -1.8740234375, -1.798828125, -1.7236328125, -1.6484375, -1.5732421875, -1.498046875, -1.4228515625, -1.34765625, -1.2724609375, -1.197265625, -1.1220703125, -1.046875, -0.9716796875, -0.896484375, -0.8212890625, -0.74609375, -0.6708984375, -0.595703125, -0.5205078125, -0.4453125, -0.3701171875, -0.294921875, -0.2197265625, -0.14453125, -0.0693359375, 0.005859375, 0.0810546875, 0.15625, 0.2314453125, 0.306640625, 0.3818359375, 0.45703125, 0.5322265625, 0.607421875, 0.6826171875, 0.7578125, 0.8330078125, 0.908203125, 0.9833984375, 1.05859375, 1.1337890625, 1.208984375, 1.2841796875, 1.359375, 1.4345703125, 1.509765625, 1.5849609375, 1.66015625, 1.7353515625, 1.810546875, 1.8857421875, 1.9609375, 2.0361328125, 2.111328125, 2.1865234375, 2.26171875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 6.0, 7.0, 8.0, 15.0, 22.0, 29.0, 53.0, 88.0, 129.0, 196.0, 374.0, 684.0, 1298.0, 2516.0, 5359.0, 12824.0, 35885.0, 129306.0, 500474.0, 261351.0, 62701.0, 19997.0, 8034.0, 3476.0, 1685.0, 873.0, 459.0, 259.0, 167.0, 88.0, 65.0, 47.0, 25.0, 16.0, 16.0, 9.0, 5.0, 0.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.67974853515625, -4.5274658203125, -4.37518310546875, -4.222900390625, -4.07061767578125, -3.9183349609375, -3.76605224609375, -3.61376953125, -3.46148681640625, -3.3092041015625, -3.15692138671875, -3.004638671875, -2.85235595703125, -2.7000732421875, -2.54779052734375, -2.3955078125, -2.24322509765625, -2.0909423828125, -1.93865966796875, -1.786376953125, -1.63409423828125, -1.4818115234375, -1.32952880859375, -1.17724609375, -1.02496337890625, -0.8726806640625, -0.72039794921875, -0.568115234375, -0.41583251953125, -0.2635498046875, -0.11126708984375, 0.041015625, 0.19329833984375, 0.3455810546875, 0.49786376953125, 0.650146484375, 0.80242919921875, 0.9547119140625, 1.10699462890625, 1.25927734375, 1.41156005859375, 1.5638427734375, 1.71612548828125, 1.868408203125, 2.02069091796875, 2.1729736328125, 2.32525634765625, 2.4775390625, 2.62982177734375, 2.7821044921875, 2.93438720703125, 3.086669921875, 3.23895263671875, 3.3912353515625, 3.54351806640625, 3.69580078125, 3.84808349609375, 4.0003662109375, 4.15264892578125, 4.304931640625, 4.45721435546875, 4.6094970703125, 4.76177978515625, 4.9140625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 8.0, 5.0, 3.0, 7.0, 7.0, 10.0, 13.0, 16.0, 16.0, 25.0, 27.0, 21.0, 33.0, 35.0, 45.0, 48.0, 70.0, 90.0, 152.0, 345.0, 1406.0, 185.0, 89.0, 72.0, 53.0, 30.0, 43.0, 39.0, 26.0, 27.0, 31.0, 20.0, 14.0, 14.0, 6.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30859375, -5.12615966796875, -4.9437255859375, -4.76129150390625, -4.578857421875, -4.39642333984375, -4.2139892578125, -4.03155517578125, -3.84912109375, -3.66668701171875, -3.4842529296875, -3.30181884765625, -3.119384765625, -2.93695068359375, -2.7545166015625, -2.57208251953125, -2.3896484375, -2.20721435546875, -2.0247802734375, -1.84234619140625, -1.659912109375, -1.47747802734375, -1.2950439453125, -1.11260986328125, -0.93017578125, -0.74774169921875, -0.5653076171875, -0.38287353515625, -0.200439453125, -0.01800537109375, 0.1644287109375, 0.34686279296875, 0.529296875, 0.71173095703125, 0.8941650390625, 1.07659912109375, 1.259033203125, 1.44146728515625, 1.6239013671875, 1.80633544921875, 1.98876953125, 2.17120361328125, 2.3536376953125, 2.53607177734375, 2.718505859375, 2.90093994140625, 3.0833740234375, 3.26580810546875, 3.4482421875, 3.63067626953125, 3.8131103515625, 3.99554443359375, 4.177978515625, 4.36041259765625, 4.5428466796875, 4.72528076171875, 4.90771484375, 5.09014892578125, 5.2725830078125, 5.45501708984375, 5.637451171875, 5.81988525390625, 6.0023193359375, 6.18475341796875, 6.3671875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 11.0, 12.0, 13.0, 21.0, 35.0, 58.0, 78.0, 160.0, 238.0, 500.0, 1099.0, 6879.0, 3022241.0, 110629.0, 2108.0, 709.0, 379.0, 183.0, 106.0, 81.0, 50.0, 25.0, 30.0, 13.0, 17.0, 8.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.296875, -24.589599609375, -23.88232421875, -23.175048828125, -22.4677734375, -21.760498046875, -21.05322265625, -20.345947265625, -19.638671875, -18.931396484375, -18.22412109375, -17.516845703125, -16.8095703125, -16.102294921875, -15.39501953125, -14.687744140625, -13.98046875, -13.273193359375, -12.56591796875, -11.858642578125, -11.1513671875, -10.444091796875, -9.73681640625, -9.029541015625, -8.322265625, -7.614990234375, -6.90771484375, -6.200439453125, -5.4931640625, -4.785888671875, -4.07861328125, -3.371337890625, -2.6640625, -1.956787109375, -1.24951171875, -0.542236328125, 0.1650390625, 0.872314453125, 1.57958984375, 2.286865234375, 2.994140625, 3.701416015625, 4.40869140625, 5.115966796875, 5.8232421875, 6.530517578125, 7.23779296875, 7.945068359375, 8.65234375, 9.359619140625, 10.06689453125, 10.774169921875, 11.4814453125, 12.188720703125, 12.89599609375, 13.603271484375, 14.310546875, 15.017822265625, 15.72509765625, 16.432373046875, 17.1396484375, 17.846923828125, 18.55419921875, 19.261474609375, 19.96875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 16.0, 90.0, 304.0, 313.0, 218.0, 53.0, 10.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.57160568237305, -45.0859489440918, -43.60029602050781, -42.11463928222656, -40.62898635864258, -39.14332962036133, -37.657676696777344, -36.172019958496094, -34.68636703491211, -33.20071029663086, -31.715057373046875, -30.229402542114258, -28.74374771118164, -27.258092880249023, -25.772438049316406, -24.286781311035156, -22.80112648010254, -21.315471649169922, -19.829816818237305, -18.344161987304688, -16.85850715637207, -15.372852325439453, -13.88719654083252, -12.401541709899902, -10.915886878967285, -9.430232048034668, -7.944577217102051, -6.458921909332275, -4.973267078399658, -3.487612247467041, -2.0019569396972656, -0.5163021087646484, 0.9693527221679688, 2.455007553100586, 3.9406626224517822, 5.4263176918029785, 6.911972522735596, 8.397626876831055, 9.883282661437988, 11.368937492370605, 12.854592323303223, 14.34024715423584, 15.825901985168457, 17.31155776977539, 18.797212600708008, 20.282867431640625, 21.768522262573242, 23.25417709350586, 24.739831924438477, 26.225486755371094, 27.71114158630371, 29.196796417236328, 30.682451248168945, 32.16810607910156, 33.65376281738281, 35.1394157409668, 36.62507247924805, 38.1107292175293, 39.59638214111328, 41.08203887939453, 42.567691802978516, 44.053348541259766, 45.53900146484375, 47.024658203125, 48.510311126708984]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 5.0, 8.0, 11.0, 13.0, 10.0, 14.0, 14.0, 21.0, 28.0, 18.0, 19.0, 23.0, 28.0, 35.0, 40.0, 46.0, 30.0, 44.0, 43.0, 47.0, 37.0, 34.0, 35.0, 40.0, 29.0, 36.0, 30.0, 20.0, 26.0, 35.0, 24.0, 23.0, 26.0, 11.0, 16.0, 12.0, 10.0, 14.0, 3.0, 6.0, 3.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-14.960890769958496, -14.529606819152832, -14.098321914672852, -13.667037963867188, -13.235754013061523, -12.80447006225586, -12.373186111450195, -11.941901206970215, -11.51061725616455, -11.079333305358887, -10.648048400878906, -10.216764450073242, -9.785480499267578, -9.354196548461914, -8.92291259765625, -8.49162769317627, -8.060343742370605, -7.629059791564941, -7.197775363922119, -6.766490936279297, -6.335206985473633, -5.903923034667969, -5.4726386070251465, -5.041354179382324, -4.61007022857666, -4.178786277770996, -3.747501850128174, -3.3162176609039307, -2.8849334716796875, -2.4536492824554443, -2.022365093231201, -1.591080904006958, -1.1597967147827148, -0.7285125255584717, -0.2972283363342285, 0.13405585289001465, 0.5653400421142578, 0.996624231338501, 1.4279084205627441, 1.8591926097869873, 2.2904767990112305, 2.7217609882354736, 3.153045177459717, 3.58432936668396, 4.015613555908203, 4.446897506713867, 4.8781819343566895, 5.309466361999512, 5.740750312805176, 6.17203426361084, 6.603318691253662, 7.034603118896484, 7.465887069702148, 7.8971710205078125, 8.328454971313477, 8.759739875793457, 9.191023826599121, 9.622307777404785, 10.053592681884766, 10.48487663269043, 10.916160583496094, 11.347444534301758, 11.778728485107422, 12.210013389587402, 12.641297340393066]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 21.0, 17.0, 19.0, 16.0, 17.0, 22.0, 22.0, 40.0, 28.0, 41.0, 41.0, 43.0, 37.0, 51.0, 42.0, 36.0, 56.0, 39.0, 34.0, 30.0, 51.0, 31.0, 36.0, 31.0, 20.0, 24.0, 21.0, 16.0, 27.0, 12.0, 10.0, 10.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.451171875, -2.380279541015625, -2.30938720703125, -2.238494873046875, -2.1676025390625, -2.096710205078125, -2.02581787109375, -1.954925537109375, -1.884033203125, -1.813140869140625, -1.74224853515625, -1.671356201171875, -1.6004638671875, -1.529571533203125, -1.45867919921875, -1.387786865234375, -1.31689453125, -1.246002197265625, -1.17510986328125, -1.104217529296875, -1.0333251953125, -0.962432861328125, -0.89154052734375, -0.820648193359375, -0.749755859375, -0.678863525390625, -0.60797119140625, -0.537078857421875, -0.4661865234375, -0.395294189453125, -0.32440185546875, -0.253509521484375, -0.1826171875, -0.111724853515625, -0.04083251953125, 0.030059814453125, 0.1009521484375, 0.171844482421875, 0.24273681640625, 0.313629150390625, 0.384521484375, 0.455413818359375, 0.52630615234375, 0.597198486328125, 0.6680908203125, 0.738983154296875, 0.80987548828125, 0.880767822265625, 0.95166015625, 1.022552490234375, 1.09344482421875, 1.164337158203125, 1.2352294921875, 1.306121826171875, 1.37701416015625, 1.447906494140625, 1.518798828125, 1.589691162109375, 1.66058349609375, 1.731475830078125, 1.8023681640625, 1.873260498046875, 1.94415283203125, 2.015045166015625, 2.0859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 11.0, 12.0, 14.0, 45.0, 53.0, 123.0, 203.0, 467.0, 1144.0, 2720.0, 8499.0, 46522.0, 1835734.0, 2231474.0, 53309.0, 9020.0, 2816.0, 1148.0, 472.0, 214.0, 114.0, 78.0, 45.0, 21.0, 10.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.7109375, -9.40771484375, -9.1044921875, -8.80126953125, -8.498046875, -8.19482421875, -7.8916015625, -7.58837890625, -7.28515625, -6.98193359375, -6.6787109375, -6.37548828125, -6.072265625, -5.76904296875, -5.4658203125, -5.16259765625, -4.859375, -4.55615234375, -4.2529296875, -3.94970703125, -3.646484375, -3.34326171875, -3.0400390625, -2.73681640625, -2.43359375, -2.13037109375, -1.8271484375, -1.52392578125, -1.220703125, -0.91748046875, -0.6142578125, -0.31103515625, -0.0078125, 0.29541015625, 0.5986328125, 0.90185546875, 1.205078125, 1.50830078125, 1.8115234375, 2.11474609375, 2.41796875, 2.72119140625, 3.0244140625, 3.32763671875, 3.630859375, 3.93408203125, 4.2373046875, 4.54052734375, 4.84375, 5.14697265625, 5.4501953125, 5.75341796875, 6.056640625, 6.35986328125, 6.6630859375, 6.96630859375, 7.26953125, 7.57275390625, 7.8759765625, 8.17919921875, 8.482421875, 8.78564453125, 9.0888671875, 9.39208984375, 9.6953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 15.0, 15.0, 20.0, 31.0, 35.0, 33.0, 61.0, 67.0, 114.0, 119.0, 173.0, 283.0, 370.0, 586.0, 577.0, 394.0, 327.0, 234.0, 128.0, 121.0, 74.0, 69.0, 52.0, 42.0, 28.0, 29.0, 21.0, 15.0, 5.0, 12.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.55078125, -4.4349365234375, -4.319091796875, -4.2032470703125, -4.08740234375, -3.9715576171875, -3.855712890625, -3.7398681640625, -3.6240234375, -3.5081787109375, -3.392333984375, -3.2764892578125, -3.16064453125, -3.0447998046875, -2.928955078125, -2.8131103515625, -2.697265625, -2.5814208984375, -2.465576171875, -2.3497314453125, -2.23388671875, -2.1180419921875, -2.002197265625, -1.8863525390625, -1.7705078125, -1.6546630859375, -1.538818359375, -1.4229736328125, -1.30712890625, -1.1912841796875, -1.075439453125, -0.9595947265625, -0.84375, -0.7279052734375, -0.612060546875, -0.4962158203125, -0.38037109375, -0.2645263671875, -0.148681640625, -0.0328369140625, 0.0830078125, 0.1988525390625, 0.314697265625, 0.4305419921875, 0.54638671875, 0.6622314453125, 0.778076171875, 0.8939208984375, 1.009765625, 1.1256103515625, 1.241455078125, 1.3572998046875, 1.47314453125, 1.5889892578125, 1.704833984375, 1.8206787109375, 1.9365234375, 2.0523681640625, 2.168212890625, 2.2840576171875, 2.39990234375, 2.5157470703125, 2.631591796875, 2.7474365234375, 2.86328125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 3.0, 12.0, 15.0, 29.0, 40.0, 71.0, 99.0, 178.0, 396.0, 987.0, 2585.0, 8289.0, 37358.0, 248100.0, 2930251.0, 852390.0, 88823.0, 17416.0, 4459.0, 1554.0, 574.0, 253.0, 167.0, 97.0, 42.0, 25.0, 21.0, 13.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.72265625, -7.51806640625, -7.3134765625, -7.10888671875, -6.904296875, -6.69970703125, -6.4951171875, -6.29052734375, -6.0859375, -5.88134765625, -5.6767578125, -5.47216796875, -5.267578125, -5.06298828125, -4.8583984375, -4.65380859375, -4.44921875, -4.24462890625, -4.0400390625, -3.83544921875, -3.630859375, -3.42626953125, -3.2216796875, -3.01708984375, -2.8125, -2.60791015625, -2.4033203125, -2.19873046875, -1.994140625, -1.78955078125, -1.5849609375, -1.38037109375, -1.17578125, -0.97119140625, -0.7666015625, -0.56201171875, -0.357421875, -0.15283203125, 0.0517578125, 0.25634765625, 0.4609375, 0.66552734375, 0.8701171875, 1.07470703125, 1.279296875, 1.48388671875, 1.6884765625, 1.89306640625, 2.09765625, 2.30224609375, 2.5068359375, 2.71142578125, 2.916015625, 3.12060546875, 3.3251953125, 3.52978515625, 3.734375, 3.93896484375, 4.1435546875, 4.34814453125, 4.552734375, 4.75732421875, 4.9619140625, 5.16650390625, 5.37109375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 11.0, 202.0, 634.0, 157.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.56571960449219, -122.3822250366211, -119.19873809814453, -116.01524353027344, -112.83175659179688, -109.64826202392578, -106.46476745605469, -103.28128051757812, -100.09779357910156, -96.91429901123047, -93.7308120727539, -90.54731750488281, -87.36383056640625, -84.18033599853516, -80.99684143066406, -77.8133544921875, -74.6298599243164, -71.44636535644531, -68.26287841796875, -65.07938385009766, -61.895896911621094, -58.71240234375, -55.52891159057617, -52.345420837402344, -49.161930084228516, -45.97843933105469, -42.79494857788086, -39.61145782470703, -36.42796325683594, -33.244476318359375, -30.06098175048828, -26.877490997314453, -23.694007873535156, -20.510517120361328, -17.3270263671875, -14.143533706665039, -10.960042953491211, -7.776552200317383, -4.593059539794922, -1.4095687866210938, 1.7739219665527344, 4.957413196563721, 8.140904426574707, 11.324396133422852, 14.50788688659668, 17.691377639770508, 20.87487030029297, 24.058361053466797, 27.241851806640625, 30.425342559814453, 33.60883331298828, 36.792327880859375, 39.97581481933594, 43.15930938720703, 46.34280014038086, 49.52629089355469, 52.709781646728516, 55.893272399902344, 59.07676315307617, 62.26025390625, 65.4437484741211, 68.62723541259766, 71.81072998046875, 74.99421691894531, 78.1777114868164]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 9.0, 6.0, 6.0, 6.0, 21.0, 13.0, 14.0, 22.0, 24.0, 27.0, 29.0, 32.0, 35.0, 27.0, 42.0, 47.0, 39.0, 33.0, 43.0, 48.0, 44.0, 45.0, 47.0, 41.0, 29.0, 26.0, 35.0, 25.0, 28.0, 23.0, 27.0, 21.0, 14.0, 15.0, 13.0, 6.0, 10.0, 8.0, 6.0, 8.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.026976585388184, -13.616568565368652, -13.206160545349121, -12.79575252532959, -12.385344505310059, -11.974936485290527, -11.564528465270996, -11.154120445251465, -10.743712425231934, -10.333304405212402, -9.922896385192871, -9.51248836517334, -9.102080345153809, -8.691672325134277, -8.281264305114746, -7.870856285095215, -7.460447788238525, -7.050039768218994, -6.639631748199463, -6.229223728179932, -5.8188157081604, -5.408407211303711, -4.99799919128418, -4.587591171264648, -4.177183151245117, -3.766775131225586, -3.3563671112060547, -2.9459590911865234, -2.535551071166992, -2.125142812728882, -1.7147347927093506, -1.3043267726898193, -0.8939189910888672, -0.48351094126701355, -0.07310289144515991, 0.3373051881790161, 0.7477132081985474, 1.1581213474273682, 1.5685293674468994, 1.9789373874664307, 2.389345407485962, 2.799753427505493, 3.2101614475250244, 3.6205697059631348, 4.030977725982666, 4.441385746002197, 4.8517937660217285, 5.26220178604126, 5.672609806060791, 6.083017826080322, 6.4934258460998535, 6.903833866119385, 7.314241886138916, 7.7246503829956055, 8.135058403015137, 8.545466423034668, 8.9558744430542, 9.36628246307373, 9.776690483093262, 10.187098503112793, 10.597506523132324, 11.007914543151855, 11.418322563171387, 11.828730583190918, 12.23913860321045]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 11.0, 5.0, 8.0, 13.0, 8.0, 13.0, 21.0, 32.0, 34.0, 27.0, 39.0, 55.0, 48.0, 46.0, 44.0, 49.0, 44.0, 48.0, 67.0, 49.0, 44.0, 50.0, 34.0, 34.0, 32.0, 26.0, 34.0, 22.0, 14.0, 13.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.458465576171875, -2.38568115234375, -2.312896728515625, -2.2401123046875, -2.167327880859375, -2.09454345703125, -2.021759033203125, -1.948974609375, -1.876190185546875, -1.80340576171875, -1.730621337890625, -1.6578369140625, -1.585052490234375, -1.51226806640625, -1.439483642578125, -1.36669921875, -1.293914794921875, -1.22113037109375, -1.148345947265625, -1.0755615234375, -1.002777099609375, -0.92999267578125, -0.857208251953125, -0.784423828125, -0.711639404296875, -0.63885498046875, -0.566070556640625, -0.4932861328125, -0.420501708984375, -0.34771728515625, -0.274932861328125, -0.2021484375, -0.129364013671875, -0.05657958984375, 0.016204833984375, 0.0889892578125, 0.161773681640625, 0.23455810546875, 0.307342529296875, 0.380126953125, 0.452911376953125, 0.52569580078125, 0.598480224609375, 0.6712646484375, 0.744049072265625, 0.81683349609375, 0.889617919921875, 0.96240234375, 1.035186767578125, 1.10797119140625, 1.180755615234375, 1.2535400390625, 1.326324462890625, 1.39910888671875, 1.471893310546875, 1.544677734375, 1.617462158203125, 1.69024658203125, 1.763031005859375, 1.8358154296875, 1.908599853515625, 1.98138427734375, 2.054168701171875, 2.126953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 7.0, 22.0, 13.0, 21.0, 33.0, 69.0, 85.0, 132.0, 233.0, 380.0, 556.0, 855.0, 1448.0, 2442.0, 4013.0, 6784.0, 11583.0, 19503.0, 34180.0, 62054.0, 116540.0, 210739.0, 241878.0, 152291.0, 79251.0, 43319.0, 24719.0, 14295.0, 8368.0, 5016.0, 2944.0, 1779.0, 1134.0, 662.0, 426.0, 286.0, 163.0, 100.0, 69.0, 48.0, 34.0, 23.0, 15.0, 11.0, 6.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1826171875, -0.17694664001464844, -0.17127609252929688, -0.1656055450439453, -0.15993499755859375, -0.1542644500732422, -0.14859390258789062, -0.14292335510253906, -0.1372528076171875, -0.13158226013183594, -0.12591171264648438, -0.12024116516113281, -0.11457061767578125, -0.10890007019042969, -0.10322952270507812, -0.09755897521972656, -0.091888427734375, -0.08621788024902344, -0.08054733276367188, -0.07487678527832031, -0.06920623779296875, -0.06353569030761719, -0.057865142822265625, -0.05219459533691406, -0.0465240478515625, -0.04085350036621094, -0.035182952880859375, -0.029512405395507812, -0.02384185791015625, -0.018171310424804688, -0.012500762939453125, -0.0068302154541015625, -0.00115966796875, 0.0045108795166015625, 0.010181427001953125, 0.015851974487304688, 0.02152252197265625, 0.027193069458007812, 0.032863616943359375, 0.03853416442871094, 0.0442047119140625, 0.04987525939941406, 0.055545806884765625, 0.06121635437011719, 0.06688690185546875, 0.07255744934082031, 0.07822799682617188, 0.08389854431152344, 0.089569091796875, 0.09523963928222656, 0.10091018676757812, 0.10658073425292969, 0.11225128173828125, 0.11792182922363281, 0.12359237670898438, 0.12926292419433594, 0.1349334716796875, 0.14060401916503906, 0.14627456665039062, 0.1519451141357422, 0.15761566162109375, 0.1632862091064453, 0.16895675659179688, 0.17462730407714844, 0.1802978515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 9.0, 7.0, 10.0, 7.0, 14.0, 11.0, 13.0, 24.0, 18.0, 33.0, 17.0, 15.0, 22.0, 29.0, 35.0, 45.0, 42.0, 46.0, 44.0, 33.0, 1074.0, 31.0, 49.0, 30.0, 34.0, 39.0, 47.0, 24.0, 27.0, 23.0, 25.0, 21.0, 25.0, 19.0, 18.0, 12.0, 10.0, 7.0, 3.0, 6.0, 7.0, 4.0, 6.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.225677490234375, -1.18670654296875, -1.147735595703125, -1.1087646484375, -1.069793701171875, -1.03082275390625, -0.991851806640625, -0.952880859375, -0.913909912109375, -0.87493896484375, -0.835968017578125, -0.7969970703125, -0.758026123046875, -0.71905517578125, -0.680084228515625, -0.64111328125, -0.602142333984375, -0.56317138671875, -0.524200439453125, -0.4852294921875, -0.446258544921875, -0.40728759765625, -0.368316650390625, -0.329345703125, -0.290374755859375, -0.25140380859375, -0.212432861328125, -0.1734619140625, -0.134490966796875, -0.09552001953125, -0.056549072265625, -0.017578125, 0.021392822265625, 0.06036376953125, 0.099334716796875, 0.1383056640625, 0.177276611328125, 0.21624755859375, 0.255218505859375, 0.294189453125, 0.333160400390625, 0.37213134765625, 0.411102294921875, 0.4500732421875, 0.489044189453125, 0.52801513671875, 0.566986083984375, 0.60595703125, 0.644927978515625, 0.68389892578125, 0.722869873046875, 0.7618408203125, 0.800811767578125, 0.83978271484375, 0.878753662109375, 0.917724609375, 0.956695556640625, 0.99566650390625, 1.034637451171875, 1.0736083984375, 1.112579345703125, 1.15155029296875, 1.190521240234375, 1.2294921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 10.0, 3.0, 16.0, 9.0, 11.0, 21.0, 24.0, 33.0, 52.0, 80.0, 96.0, 181.0, 220.0, 378.0, 635.0, 1167.0, 2111.0, 3895.0, 7439.0, 15410.0, 38264.0, 406576.0, 1536818.0, 47614.0, 17605.0, 8423.0, 4408.0, 2349.0, 1272.0, 795.0, 416.0, 233.0, 170.0, 120.0, 85.0, 50.0, 39.0, 27.0, 18.0, 6.0, 14.0, 10.0, 12.0, 9.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.292236328125, -0.28218841552734375, -0.2721405029296875, -0.26209259033203125, -0.252044677734375, -0.24199676513671875, -0.2319488525390625, -0.22190093994140625, -0.21185302734375, -0.20180511474609375, -0.1917572021484375, -0.18170928955078125, -0.171661376953125, -0.16161346435546875, -0.1515655517578125, -0.14151763916015625, -0.1314697265625, -0.12142181396484375, -0.1113739013671875, -0.10132598876953125, -0.091278076171875, -0.08123016357421875, -0.0711822509765625, -0.06113433837890625, -0.05108642578125, -0.04103851318359375, -0.0309906005859375, -0.02094268798828125, -0.010894775390625, -0.00084686279296875, 0.0092010498046875, 0.01924896240234375, 0.029296875, 0.03934478759765625, 0.0493927001953125, 0.05944061279296875, 0.069488525390625, 0.07953643798828125, 0.0895843505859375, 0.09963226318359375, 0.10968017578125, 0.11972808837890625, 0.1297760009765625, 0.13982391357421875, 0.149871826171875, 0.15991973876953125, 0.1699676513671875, 0.18001556396484375, 0.1900634765625, 0.20011138916015625, 0.2101593017578125, 0.22020721435546875, 0.230255126953125, 0.24030303955078125, 0.2503509521484375, 0.26039886474609375, 0.27044677734375, 0.28049468994140625, 0.2905426025390625, 0.30059051513671875, 0.310638427734375, 0.32068634033203125, 0.3307342529296875, 0.34078216552734375, 0.350830078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 6.0, 6.0, 9.0, 11.0, 13.0, 17.0, 24.0, 20.0, 36.0, 47.0, 61.0, 52.0, 77.0, 73.0, 106.0, 76.0, 54.0, 52.0, 44.0, 36.0, 37.0, 30.0, 20.0, 20.0, 11.0, 10.0, 4.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01409912109375, -0.013662457466125488, -0.013225793838500977, -0.012789130210876465, -0.012352466583251953, -0.011915802955627441, -0.01147913932800293, -0.011042475700378418, -0.010605812072753906, -0.010169148445129395, -0.009732484817504883, -0.009295821189880371, -0.00885915756225586, -0.008422493934631348, -0.007985830307006836, -0.007549166679382324, -0.0071125030517578125, -0.006675839424133301, -0.006239175796508789, -0.005802512168884277, -0.005365848541259766, -0.004929184913635254, -0.004492521286010742, -0.0040558576583862305, -0.0036191940307617188, -0.003182530403137207, -0.0027458667755126953, -0.0023092031478881836, -0.0018725395202636719, -0.0014358758926391602, -0.0009992122650146484, -0.0005625486373901367, -0.000125885009765625, 0.0003107786178588867, 0.0007474422454833984, 0.0011841058731079102, 0.0016207695007324219, 0.0020574331283569336, 0.0024940967559814453, 0.002930760383605957, 0.0033674240112304688, 0.0038040876388549805, 0.004240751266479492, 0.004677414894104004, 0.005114078521728516, 0.005550742149353027, 0.005987405776977539, 0.006424069404602051, 0.0068607330322265625, 0.007297396659851074, 0.007734060287475586, 0.008170723915100098, 0.00860738754272461, 0.009044051170349121, 0.009480714797973633, 0.009917378425598145, 0.010354042053222656, 0.010790705680847168, 0.01122736930847168, 0.011664032936096191, 0.012100696563720703, 0.012537360191345215, 0.012974023818969727, 0.013410687446594238, 0.01384735107421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 2.0, 11.0, 5.0, 4.0, 11.0, 14.0, 25.0, 19.0, 31.0, 38.0, 68.0, 81.0, 128.0, 212.0, 392.0, 892.0, 25471.0, 1014091.0, 5375.0, 724.0, 353.0, 168.0, 137.0, 76.0, 48.0, 43.0, 26.0, 16.0, 20.0, 11.0, 11.0, 12.0, 2.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.282470703125, -0.273468017578125, -0.26446533203125, -0.255462646484375, -0.2464599609375, -0.237457275390625, -0.22845458984375, -0.219451904296875, -0.21044921875, -0.201446533203125, -0.19244384765625, -0.183441162109375, -0.1744384765625, -0.165435791015625, -0.15643310546875, -0.147430419921875, -0.138427734375, -0.129425048828125, -0.12042236328125, -0.111419677734375, -0.1024169921875, -0.093414306640625, -0.08441162109375, -0.075408935546875, -0.06640625, -0.057403564453125, -0.04840087890625, -0.039398193359375, -0.0303955078125, -0.021392822265625, -0.01239013671875, -0.003387451171875, 0.005615234375, 0.014617919921875, 0.02362060546875, 0.032623291015625, 0.0416259765625, 0.050628662109375, 0.05963134765625, 0.068634033203125, 0.07763671875, 0.086639404296875, 0.09564208984375, 0.104644775390625, 0.1136474609375, 0.122650146484375, 0.13165283203125, 0.140655517578125, 0.149658203125, 0.158660888671875, 0.16766357421875, 0.176666259765625, 0.1856689453125, 0.194671630859375, 0.20367431640625, 0.212677001953125, 0.2216796875, 0.230682373046875, 0.23968505859375, 0.248687744140625, 0.2576904296875, 0.266693115234375, 0.27569580078125, 0.284698486328125, 0.293701171875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 23.0, 217.0, 525.0, 196.0, 40.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008215038105845451, -0.005786461755633354, -0.0033578849397599697, -0.0009293081238865852, 0.001499268226325512, 0.003927844576537609, 0.006356421858072281, 0.008784998208284378, 0.011213574558496475, 0.013642150908708572, 0.01607072725892067, 0.018499303609132767, 0.020927879959344864, 0.02335645630955696, 0.025785034522414207, 0.028213610872626305, 0.030642187222838402, 0.03307076543569565, 0.035499341785907745, 0.03792791813611984, 0.04035649448633194, 0.04278507083654404, 0.045213647186756134, 0.04764222353696823, 0.05007079988718033, 0.052499376237392426, 0.05492795258760452, 0.05735652893781662, 0.05978510528802872, 0.062213681638240814, 0.06464225798845291, 0.06707083433866501, 0.0694994106888771, 0.0719279870390892, 0.0743565633893013, 0.0767851397395134, 0.0792137160897255, 0.08164229243993759, 0.08407086879014969, 0.08649944514036179, 0.08892802149057388, 0.09135659784078598, 0.09378517419099808, 0.09621375054121017, 0.09864232689142227, 0.10107090324163437, 0.10349947959184647, 0.10592805594205856, 0.10835663974285126, 0.11078521609306335, 0.11321379244327545, 0.11564236879348755, 0.11807094514369965, 0.12049952149391174, 0.12292809784412384, 0.12535667419433594, 0.12778525054454803, 0.13021382689476013, 0.13264240324497223, 0.13507097959518433, 0.13749955594539642, 0.13992813229560852, 0.14235670864582062, 0.14478528499603271, 0.1472138613462448]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 10.0, 15.0, 15.0, 14.0, 17.0, 21.0, 17.0, 33.0, 29.0, 33.0, 40.0, 32.0, 47.0, 36.0, 43.0, 44.0, 45.0, 58.0, 43.0, 38.0, 42.0, 44.0, 35.0, 43.0, 42.0, 18.0, 28.0, 17.0, 17.0, 18.0, 14.0, 7.0, 9.0, 4.0, 12.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012679636478424072, -0.012279914692044258, -0.011880192905664444, -0.01148047111928463, -0.011080749332904816, -0.010681027546525002, -0.010281305760145187, -0.009881583973765373, -0.009481862187385559, -0.009082140401005745, -0.00868241861462593, -0.008282696828246117, -0.007882975041866302, -0.007483253255486488, -0.007083531469106674, -0.00668380968272686, -0.006284087896347046, -0.005884366109967232, -0.005484644323587418, -0.0050849225372076035, -0.004685200750827789, -0.004285478964447975, -0.003885757178068161, -0.003486035391688347, -0.0030863136053085327, -0.0026865918189287186, -0.0022868700325489044, -0.0018871482461690903, -0.0014874264597892761, -0.001087704673409462, -0.0006879828870296478, -0.0002882611006498337, 0.00011146068572998047, 0.0005111824721097946, 0.0009109042584896088, 0.001310626044869423, 0.001710347831249237, 0.002110069617629051, 0.0025097914040088654, 0.0029095131903886795, 0.0033092349767684937, 0.003708956763148308, 0.004108678549528122, 0.004508400335907936, 0.00490812212228775, 0.005307843908667564, 0.0057075656950473785, 0.006107287481427193, 0.006507009267807007, 0.006906731054186821, 0.007306452840566635, 0.007706174626946449, 0.008105896413326263, 0.008505618199706078, 0.008905339986085892, 0.009305061772465706, 0.00970478355884552, 0.010104505345225334, 0.010504227131605148, 0.010903948917984962, 0.011303670704364777, 0.01170339249074459, 0.012103114277124405, 0.012502836063504219, 0.012902557849884033]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 12.0, 4.0, 8.0, 13.0, 8.0, 13.0, 21.0, 31.0, 35.0, 27.0, 39.0, 56.0, 47.0, 45.0, 45.0, 50.0, 43.0, 48.0, 67.0, 49.0, 44.0, 49.0, 35.0, 34.0, 34.0, 24.0, 34.0, 22.0, 14.0, 13.0, 6.0, 5.0, 7.0, 5.0, 4.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.458465576171875, -2.38568115234375, -2.312896728515625, -2.2401123046875, -2.167327880859375, -2.09454345703125, -2.021759033203125, -1.948974609375, -1.876190185546875, -1.80340576171875, -1.730621337890625, -1.6578369140625, -1.585052490234375, -1.51226806640625, -1.439483642578125, -1.36669921875, -1.293914794921875, -1.22113037109375, -1.148345947265625, -1.0755615234375, -1.002777099609375, -0.92999267578125, -0.857208251953125, -0.784423828125, -0.711639404296875, -0.63885498046875, -0.566070556640625, -0.4932861328125, -0.420501708984375, -0.34771728515625, -0.274932861328125, -0.2021484375, -0.129364013671875, -0.05657958984375, 0.016204833984375, 0.0889892578125, 0.161773681640625, 0.23455810546875, 0.307342529296875, 0.380126953125, 0.452911376953125, 0.52569580078125, 0.598480224609375, 0.6712646484375, 0.744049072265625, 0.81683349609375, 0.889617919921875, 0.96240234375, 1.035186767578125, 1.10797119140625, 1.180755615234375, 1.2535400390625, 1.326324462890625, 1.39910888671875, 1.471893310546875, 1.544677734375, 1.617462158203125, 1.69024658203125, 1.763031005859375, 1.8358154296875, 1.908599853515625, 1.98138427734375, 2.054168701171875, 2.126953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 9.0, 4.0, 15.0, 10.0, 21.0, 40.0, 50.0, 81.0, 80.0, 140.0, 234.0, 363.0, 601.0, 978.0, 1802.0, 3575.0, 7928.0, 22520.0, 103998.0, 668581.0, 185096.0, 32458.0, 10340.0, 4492.0, 2124.0, 1170.0, 643.0, 393.0, 285.0, 176.0, 122.0, 74.0, 45.0, 36.0, 29.0, 18.0, 13.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.6717529296875, -4.519287109375, -4.3668212890625, -4.21435546875, -4.0618896484375, -3.909423828125, -3.7569580078125, -3.6044921875, -3.4520263671875, -3.299560546875, -3.1470947265625, -2.99462890625, -2.8421630859375, -2.689697265625, -2.5372314453125, -2.384765625, -2.2322998046875, -2.079833984375, -1.9273681640625, -1.77490234375, -1.6224365234375, -1.469970703125, -1.3175048828125, -1.1650390625, -1.0125732421875, -0.860107421875, -0.7076416015625, -0.55517578125, -0.4027099609375, -0.250244140625, -0.0977783203125, 0.0546875, 0.2071533203125, 0.359619140625, 0.5120849609375, 0.66455078125, 0.8170166015625, 0.969482421875, 1.1219482421875, 1.2744140625, 1.4268798828125, 1.579345703125, 1.7318115234375, 1.88427734375, 2.0367431640625, 2.189208984375, 2.3416748046875, 2.494140625, 2.6466064453125, 2.799072265625, 2.9515380859375, 3.10400390625, 3.2564697265625, 3.408935546875, 3.5614013671875, 3.7138671875, 3.8663330078125, 4.018798828125, 4.1712646484375, 4.32373046875, 4.4761962890625, 4.628662109375, 4.7811279296875, 4.93359375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 13.0, 14.0, 17.0, 22.0, 13.0, 33.0, 28.0, 34.0, 53.0, 57.0, 82.0, 115.0, 162.0, 306.0, 1373.0, 197.0, 125.0, 75.0, 53.0, 50.0, 35.0, 31.0, 19.0, 16.0, 20.0, 19.0, 11.0, 8.0, 8.0, 5.0, 8.0, 5.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8359375, -4.66937255859375, -4.5028076171875, -4.33624267578125, -4.169677734375, -4.00311279296875, -3.8365478515625, -3.66998291015625, -3.50341796875, -3.33685302734375, -3.1702880859375, -3.00372314453125, -2.837158203125, -2.67059326171875, -2.5040283203125, -2.33746337890625, -2.1708984375, -2.00433349609375, -1.8377685546875, -1.67120361328125, -1.504638671875, -1.33807373046875, -1.1715087890625, -1.00494384765625, -0.83837890625, -0.67181396484375, -0.5052490234375, -0.33868408203125, -0.172119140625, -0.00555419921875, 0.1610107421875, 0.32757568359375, 0.494140625, 0.66070556640625, 0.8272705078125, 0.99383544921875, 1.160400390625, 1.32696533203125, 1.4935302734375, 1.66009521484375, 1.82666015625, 1.99322509765625, 2.1597900390625, 2.32635498046875, 2.492919921875, 2.65948486328125, 2.8260498046875, 2.99261474609375, 3.1591796875, 3.32574462890625, 3.4923095703125, 3.65887451171875, 3.825439453125, 3.99200439453125, 4.1585693359375, 4.32513427734375, 4.49169921875, 4.65826416015625, 4.8248291015625, 4.99139404296875, 5.157958984375, 5.32452392578125, 5.4910888671875, 5.65765380859375, 5.82421875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 9.0, 7.0, 8.0, 8.0, 14.0, 18.0, 20.0, 31.0, 35.0, 43.0, 88.0, 155.0, 215.0, 440.0, 838.0, 2141.0, 21576.0, 3095304.0, 20723.0, 2136.0, 808.0, 408.0, 234.0, 139.0, 80.0, 63.0, 50.0, 26.0, 22.0, 16.0, 10.0, 11.0, 11.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.00634765625, -15.4814453125, -14.95654296875, -14.431640625, -13.90673828125, -13.3818359375, -12.85693359375, -12.33203125, -11.80712890625, -11.2822265625, -10.75732421875, -10.232421875, -9.70751953125, -9.1826171875, -8.65771484375, -8.1328125, -7.60791015625, -7.0830078125, -6.55810546875, -6.033203125, -5.50830078125, -4.9833984375, -4.45849609375, -3.93359375, -3.40869140625, -2.8837890625, -2.35888671875, -1.833984375, -1.30908203125, -0.7841796875, -0.25927734375, 0.265625, 0.79052734375, 1.3154296875, 1.84033203125, 2.365234375, 2.89013671875, 3.4150390625, 3.93994140625, 4.46484375, 4.98974609375, 5.5146484375, 6.03955078125, 6.564453125, 7.08935546875, 7.6142578125, 8.13916015625, 8.6640625, 9.18896484375, 9.7138671875, 10.23876953125, 10.763671875, 11.28857421875, 11.8134765625, 12.33837890625, 12.86328125, 13.38818359375, 13.9130859375, 14.43798828125, 14.962890625, 15.48779296875, 16.0126953125, 16.53759765625, 17.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 12.0, 25.0, 69.0, 170.0, 290.0, 245.0, 140.0, 43.0, 11.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.30647659301758, -50.08176040649414, -48.85704803466797, -47.63233184814453, -46.407615661621094, -45.182899475097656, -43.958187103271484, -42.73347091674805, -41.508758544921875, -40.28404235839844, -39.059329986572266, -37.83461380004883, -36.60989761352539, -35.38518524169922, -34.16046905517578, -32.935752868652344, -31.711036682128906, -30.4863224029541, -29.261606216430664, -28.03689193725586, -26.812175750732422, -25.587461471557617, -24.362747192382812, -23.138031005859375, -21.91331672668457, -20.688602447509766, -19.463886260986328, -18.239171981811523, -17.01445770263672, -15.789741516113281, -14.565027236938477, -13.340312004089355, -12.115594863891602, -10.89087963104248, -9.66616439819336, -8.441450119018555, -7.216734886169434, -5.9920196533203125, -4.76730489730835, -3.5425901412963867, -2.3178749084472656, -1.0931599140167236, 0.13155508041381836, 1.3562700748443604, 2.5809850692749023, 3.8057003021240234, 5.030415058135986, 6.255129814147949, 7.47984504699707, 8.704560279846191, 9.929275512695312, 11.153989791870117, 12.378705024719238, 13.60342025756836, 14.828134536743164, 16.05284881591797, 17.277565002441406, 18.50227928161621, 19.72699546813965, 20.951709747314453, 22.17642593383789, 23.401140213012695, 24.6258544921875, 25.850570678710938, 27.075284957885742]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 11.0, 15.0, 9.0, 12.0, 18.0, 13.0, 12.0, 23.0, 15.0, 20.0, 30.0, 32.0, 35.0, 27.0, 44.0, 37.0, 46.0, 52.0, 36.0, 37.0, 48.0, 49.0, 42.0, 33.0, 34.0, 40.0, 31.0, 24.0, 23.0, 27.0, 16.0, 12.0, 19.0, 11.0, 9.0, 9.0, 9.0, 11.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.330209732055664, -14.839971542358398, -14.34973430633545, -13.859496116638184, -13.369258880615234, -12.879020690917969, -12.388782501220703, -11.898545265197754, -11.408308029174805, -10.918069839477539, -10.42783260345459, -9.937594413757324, -9.447357177734375, -8.95711898803711, -8.466880798339844, -7.9766435623168945, -7.486405372619629, -6.9961676597595215, -6.505929946899414, -6.015691757202148, -5.525454521179199, -5.035216331481934, -4.544978618621826, -4.054740905761719, -3.5645031929016113, -3.074265480041504, -2.5840277671813965, -2.09378981590271, -1.6035521030426025, -1.1133143901824951, -0.6230764389038086, -0.13283872604370117, 0.35739898681640625, 0.8476367592811584, 1.3378745317459106, 1.8281123638153076, 2.318350076675415, 2.8085877895355225, 3.298825740814209, 3.7890634536743164, 4.279301166534424, 4.769538879394531, 5.259776592254639, 5.750014305114746, 6.240252494812012, 6.730489730834961, 7.220727920532227, 7.710965633392334, 8.201203346252441, 8.691441535949707, 9.181678771972656, 9.671916961669922, 10.162154197692871, 10.652392387390137, 11.142629623413086, 11.632867813110352, 12.123106002807617, 12.613344192504883, 13.103581428527832, 13.593819618225098, 14.084056854248047, 14.574295043945312, 15.064533233642578, 15.554770469665527, 16.045007705688477]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 11.0, 7.0, 6.0, 7.0, 13.0, 15.0, 16.0, 33.0, 24.0, 38.0, 30.0, 42.0, 37.0, 40.0, 42.0, 48.0, 57.0, 42.0, 37.0, 34.0, 42.0, 49.0, 44.0, 42.0, 43.0, 30.0, 26.0, 21.0, 18.0, 10.0, 19.0, 25.0, 11.0, 9.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.166015625, -2.09814453125, -2.0302734375, -1.96240234375, -1.89453125, -1.82666015625, -1.7587890625, -1.69091796875, -1.623046875, -1.55517578125, -1.4873046875, -1.41943359375, -1.3515625, -1.28369140625, -1.2158203125, -1.14794921875, -1.080078125, -1.01220703125, -0.9443359375, -0.87646484375, -0.80859375, -0.74072265625, -0.6728515625, -0.60498046875, -0.537109375, -0.46923828125, -0.4013671875, -0.33349609375, -0.265625, -0.19775390625, -0.1298828125, -0.06201171875, 0.005859375, 0.07373046875, 0.1416015625, 0.20947265625, 0.27734375, 0.34521484375, 0.4130859375, 0.48095703125, 0.548828125, 0.61669921875, 0.6845703125, 0.75244140625, 0.8203125, 0.88818359375, 0.9560546875, 1.02392578125, 1.091796875, 1.15966796875, 1.2275390625, 1.29541015625, 1.36328125, 1.43115234375, 1.4990234375, 1.56689453125, 1.634765625, 1.70263671875, 1.7705078125, 1.83837890625, 1.90625, 1.97412109375, 2.0419921875, 2.10986328125, 2.177734375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 10.0, 12.0, 20.0, 22.0, 32.0, 51.0, 54.0, 82.0, 127.0, 198.0, 308.0, 445.0, 603.0, 1031.0, 1607.0, 2724.0, 4796.0, 10045.0, 31126.0, 236745.0, 2306104.0, 1432629.0, 124536.0, 22008.0, 8134.0, 4242.0, 2342.0, 1433.0, 897.0, 577.0, 405.0, 281.0, 170.0, 136.0, 108.0, 67.0, 51.0, 36.0, 23.0, 15.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-5.28515625, -5.1378173828125, -4.990478515625, -4.8431396484375, -4.69580078125, -4.5484619140625, -4.401123046875, -4.2537841796875, -4.1064453125, -3.9591064453125, -3.811767578125, -3.6644287109375, -3.51708984375, -3.3697509765625, -3.222412109375, -3.0750732421875, -2.927734375, -2.7803955078125, -2.633056640625, -2.4857177734375, -2.33837890625, -2.1910400390625, -2.043701171875, -1.8963623046875, -1.7490234375, -1.6016845703125, -1.454345703125, -1.3070068359375, -1.15966796875, -1.0123291015625, -0.864990234375, -0.7176513671875, -0.5703125, -0.4229736328125, -0.275634765625, -0.1282958984375, 0.01904296875, 0.1663818359375, 0.313720703125, 0.4610595703125, 0.6083984375, 0.7557373046875, 0.903076171875, 1.0504150390625, 1.19775390625, 1.3450927734375, 1.492431640625, 1.6397705078125, 1.787109375, 1.9344482421875, 2.081787109375, 2.2291259765625, 2.37646484375, 2.5238037109375, 2.671142578125, 2.8184814453125, 2.9658203125, 3.1131591796875, 3.260498046875, 3.4078369140625, 3.55517578125, 3.7025146484375, 3.849853515625, 3.9971923828125, 4.14453125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 6.0, 5.0, 12.0, 21.0, 26.0, 52.0, 49.0, 89.0, 140.0, 202.0, 301.0, 482.0, 698.0, 693.0, 441.0, 330.0, 196.0, 120.0, 72.0, 51.0, 30.0, 23.0, 14.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.29296875, -5.149627685546875, -5.00628662109375, -4.862945556640625, -4.7196044921875, -4.576263427734375, -4.43292236328125, -4.289581298828125, -4.146240234375, -4.002899169921875, -3.85955810546875, -3.716217041015625, -3.5728759765625, -3.429534912109375, -3.28619384765625, -3.142852783203125, -2.99951171875, -2.856170654296875, -2.71282958984375, -2.569488525390625, -2.4261474609375, -2.282806396484375, -2.13946533203125, -1.996124267578125, -1.852783203125, -1.709442138671875, -1.56610107421875, -1.422760009765625, -1.2794189453125, -1.136077880859375, -0.99273681640625, -0.849395751953125, -0.7060546875, -0.562713623046875, -0.41937255859375, -0.276031494140625, -0.1326904296875, 0.010650634765625, 0.15399169921875, 0.297332763671875, 0.440673828125, 0.584014892578125, 0.72735595703125, 0.870697021484375, 1.0140380859375, 1.157379150390625, 1.30072021484375, 1.444061279296875, 1.58740234375, 1.730743408203125, 1.87408447265625, 2.017425537109375, 2.1607666015625, 2.304107666015625, 2.44744873046875, 2.590789794921875, 2.734130859375, 2.877471923828125, 3.02081298828125, 3.164154052734375, 3.3074951171875, 3.450836181640625, 3.59417724609375, 3.737518310546875, 3.880859375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 5.0, 13.0, 12.0, 35.0, 59.0, 77.0, 165.0, 360.0, 857.0, 2398.0, 8944.0, 62770.0, 1881017.0, 2155719.0, 68064.0, 9506.0, 2542.0, 898.0, 387.0, 191.0, 101.0, 58.0, 35.0, 20.0, 18.0, 8.0, 12.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.0562744140625, -5.823486328125, -5.5906982421875, -5.35791015625, -5.1251220703125, -4.892333984375, -4.6595458984375, -4.4267578125, -4.1939697265625, -3.961181640625, -3.7283935546875, -3.49560546875, -3.2628173828125, -3.030029296875, -2.7972412109375, -2.564453125, -2.3316650390625, -2.098876953125, -1.8660888671875, -1.63330078125, -1.4005126953125, -1.167724609375, -0.9349365234375, -0.7021484375, -0.4693603515625, -0.236572265625, -0.0037841796875, 0.22900390625, 0.4617919921875, 0.694580078125, 0.9273681640625, 1.16015625, 1.3929443359375, 1.625732421875, 1.8585205078125, 2.09130859375, 2.3240966796875, 2.556884765625, 2.7896728515625, 3.0224609375, 3.2552490234375, 3.488037109375, 3.7208251953125, 3.95361328125, 4.1864013671875, 4.419189453125, 4.6519775390625, 4.884765625, 5.1175537109375, 5.350341796875, 5.5831298828125, 5.81591796875, 6.0487060546875, 6.281494140625, 6.5142822265625, 6.7470703125, 6.9798583984375, 7.212646484375, 7.4454345703125, 7.67822265625, 7.9110107421875, 8.143798828125, 8.3765869140625, 8.609375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 140.0, 699.0, 164.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.62832641601562, -200.87313842773438, -197.11795043945312, -193.3627471923828, -189.60755920410156, -185.8523712158203, -182.09718322753906, -178.3419952392578, -174.5867919921875, -170.83160400390625, -167.076416015625, -163.3212127685547, -159.56602478027344, -155.8108367919922, -152.05564880371094, -148.3004608154297, -144.54527282714844, -140.7900848388672, -137.03489685058594, -133.27969360351562, -129.52450561523438, -125.76931762695312, -122.01412963867188, -118.25894165039062, -114.50374603271484, -110.7485580444336, -106.99336242675781, -103.23817443847656, -99.48298645019531, -95.72779083251953, -91.97260284423828, -88.2174072265625, -84.46222686767578, -80.70703887939453, -76.95184326171875, -73.1966552734375, -69.44146728515625, -65.68627166748047, -61.93108367919922, -58.1758918762207, -54.42070007324219, -50.66550827026367, -46.910316467285156, -43.155128479003906, -39.39993667602539, -35.644744873046875, -31.889554977416992, -28.13436508178711, -24.379173278808594, -20.623981475830078, -16.868791580200195, -13.113600730895996, -9.358409881591797, -5.603218078613281, -1.8480281829833984, 1.9071617126464844, 5.662353515625, 9.4175443649292, 13.172735214233398, 16.92792510986328, 20.683116912841797, 24.438308715820312, 28.193498611450195, 31.948688507080078, 35.703880310058594]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 6.0, 13.0, 12.0, 13.0, 17.0, 20.0, 17.0, 26.0, 29.0, 28.0, 29.0, 42.0, 37.0, 34.0, 57.0, 42.0, 50.0, 37.0, 43.0, 43.0, 47.0, 41.0, 37.0, 34.0, 40.0, 27.0, 23.0, 29.0, 18.0, 15.0, 21.0, 21.0, 8.0, 2.0, 2.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.683809280395508, -13.257638931274414, -12.831469535827637, -12.405299186706543, -11.97912883758545, -11.552959442138672, -11.126789093017578, -10.700618743896484, -10.27444839477539, -9.848278045654297, -9.42210865020752, -8.995938301086426, -8.569767951965332, -8.143598556518555, -7.717428207397461, -7.291257858276367, -6.865087985992432, -6.438918113708496, -6.012747764587402, -5.586577892303467, -5.160407543182373, -4.7342376708984375, -4.308067321777344, -3.881897449493408, -3.4557273387908936, -3.029557228088379, -2.6033871173858643, -2.1772170066833496, -1.7510470151901245, -1.3248770236968994, -0.8987069129943848, -0.4725368022918701, -0.04636669158935547, 0.3798033893108368, 0.805973470211029, 1.232143521308899, 1.6583136320114136, 2.0844836235046387, 2.5106537342071533, 2.936823844909668, 3.3629939556121826, 3.7891640663146973, 4.215333938598633, 4.641504287719727, 5.067674160003662, 5.493844032287598, 5.920014381408691, 6.346184730529785, 6.772354602813721, 7.198524475097656, 7.62469482421875, 8.050865173339844, 8.477034568786621, 8.903204917907715, 9.329375267028809, 9.755544662475586, 10.18171501159668, 10.607885360717773, 11.03405475616455, 11.460225105285645, 11.886395454406738, 12.312564849853516, 12.73873519897461, 13.164905548095703, 13.591075897216797]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 11.0, 8.0, 6.0, 17.0, 25.0, 16.0, 22.0, 19.0, 29.0, 35.0, 18.0, 46.0, 29.0, 36.0, 41.0, 41.0, 51.0, 42.0, 49.0, 28.0, 31.0, 38.0, 36.0, 39.0, 33.0, 24.0, 24.0, 37.0, 23.0, 13.0, 23.0, 10.0, 12.0, 15.0, 7.0, 5.0, 15.0, 5.0, 3.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.62109375, -1.569976806640625, -1.51885986328125, -1.467742919921875, -1.4166259765625, -1.365509033203125, -1.31439208984375, -1.263275146484375, -1.212158203125, -1.161041259765625, -1.10992431640625, -1.058807373046875, -1.0076904296875, -0.956573486328125, -0.90545654296875, -0.854339599609375, -0.80322265625, -0.752105712890625, -0.70098876953125, -0.649871826171875, -0.5987548828125, -0.547637939453125, -0.49652099609375, -0.445404052734375, -0.394287109375, -0.343170166015625, -0.29205322265625, -0.240936279296875, -0.1898193359375, -0.138702392578125, -0.08758544921875, -0.036468505859375, 0.0146484375, 0.065765380859375, 0.11688232421875, 0.167999267578125, 0.2191162109375, 0.270233154296875, 0.32135009765625, 0.372467041015625, 0.423583984375, 0.474700927734375, 0.52581787109375, 0.576934814453125, 0.6280517578125, 0.679168701171875, 0.73028564453125, 0.781402587890625, 0.83251953125, 0.883636474609375, 0.93475341796875, 0.985870361328125, 1.0369873046875, 1.088104248046875, 1.13922119140625, 1.190338134765625, 1.241455078125, 1.292572021484375, 1.34368896484375, 1.394805908203125, 1.4459228515625, 1.497039794921875, 1.54815673828125, 1.599273681640625, 1.650390625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 7.0, 8.0, 10.0, 13.0, 14.0, 17.0, 33.0, 47.0, 76.0, 91.0, 157.0, 250.0, 273.0, 403.0, 560.0, 749.0, 1135.0, 1552.0, 2094.0, 2941.0, 3989.0, 5613.0, 8060.0, 11603.0, 16735.0, 24186.0, 36751.0, 56756.0, 90594.0, 146161.0, 193722.0, 157631.0, 99176.0, 61311.0, 39766.0, 25831.0, 17795.0, 12309.0, 8620.0, 6194.0, 4337.0, 3091.0, 2213.0, 1629.0, 1153.0, 809.0, 601.0, 419.0, 322.0, 219.0, 169.0, 106.0, 80.0, 62.0, 40.0, 30.0, 19.0, 15.0, 11.0, 4.0, 3.0, 3.0], "bins": [-0.11810302734375, -0.11447906494140625, -0.1108551025390625, -0.10723114013671875, -0.103607177734375, -0.09998321533203125, -0.0963592529296875, -0.09273529052734375, -0.089111328125, -0.08548736572265625, -0.0818634033203125, -0.07823944091796875, -0.074615478515625, -0.07099151611328125, -0.0673675537109375, -0.06374359130859375, -0.06011962890625, -0.05649566650390625, -0.0528717041015625, -0.04924774169921875, -0.045623779296875, -0.04199981689453125, -0.0383758544921875, -0.03475189208984375, -0.0311279296875, -0.02750396728515625, -0.0238800048828125, -0.02025604248046875, -0.016632080078125, -0.01300811767578125, -0.0093841552734375, -0.00576019287109375, -0.00213623046875, 0.00148773193359375, 0.0051116943359375, 0.00873565673828125, 0.012359619140625, 0.01598358154296875, 0.0196075439453125, 0.02323150634765625, 0.02685546875, 0.03047943115234375, 0.0341033935546875, 0.03772735595703125, 0.041351318359375, 0.04497528076171875, 0.0485992431640625, 0.05222320556640625, 0.05584716796875, 0.05947113037109375, 0.0630950927734375, 0.06671905517578125, 0.070343017578125, 0.07396697998046875, 0.0775909423828125, 0.08121490478515625, 0.0848388671875, 0.08846282958984375, 0.0920867919921875, 0.09571075439453125, 0.099334716796875, 0.10295867919921875, 0.1065826416015625, 0.11020660400390625, 0.11383056640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 10.0, 7.0, 7.0, 14.0, 12.0, 24.0, 18.0, 19.0, 27.0, 27.0, 35.0, 36.0, 43.0, 36.0, 52.0, 52.0, 44.0, 1078.0, 50.0, 35.0, 50.0, 36.0, 48.0, 33.0, 46.0, 28.0, 23.0, 23.0, 25.0, 16.0, 16.0, 10.0, 6.0, 11.0, 6.0, 5.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23046875, -1.1895904541015625, -1.148712158203125, -1.1078338623046875, -1.06695556640625, -1.0260772705078125, -0.985198974609375, -0.9443206787109375, -0.9034423828125, -0.8625640869140625, -0.821685791015625, -0.7808074951171875, -0.73992919921875, -0.6990509033203125, -0.658172607421875, -0.6172943115234375, -0.576416015625, -0.5355377197265625, -0.494659423828125, -0.4537811279296875, -0.41290283203125, -0.3720245361328125, -0.331146240234375, -0.2902679443359375, -0.2493896484375, -0.2085113525390625, -0.167633056640625, -0.1267547607421875, -0.08587646484375, -0.0449981689453125, -0.004119873046875, 0.0367584228515625, 0.07763671875, 0.1185150146484375, 0.159393310546875, 0.2002716064453125, 0.24114990234375, 0.2820281982421875, 0.322906494140625, 0.3637847900390625, 0.4046630859375, 0.4455413818359375, 0.486419677734375, 0.5272979736328125, 0.56817626953125, 0.6090545654296875, 0.649932861328125, 0.6908111572265625, 0.731689453125, 0.7725677490234375, 0.813446044921875, 0.8543243408203125, 0.89520263671875, 0.9360809326171875, 0.976959228515625, 1.0178375244140625, 1.0587158203125, 1.0995941162109375, 1.140472412109375, 1.1813507080078125, 1.22222900390625, 1.2631072998046875, 1.303985595703125, 1.3448638916015625, 1.3857421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 9.0, 8.0, 15.0, 26.0, 50.0, 41.0, 75.0, 109.0, 125.0, 231.0, 348.0, 562.0, 908.0, 1641.0, 3053.0, 6083.0, 13208.0, 34078.0, 416916.0, 1550544.0, 40162.0, 14543.0, 6595.0, 3345.0, 1757.0, 1015.0, 590.0, 318.0, 236.0, 152.0, 109.0, 68.0, 56.0, 41.0, 19.0, 22.0, 11.0, 12.0, 11.0, 3.0, 2.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.305419921875, -0.2952613830566406, -0.28510284423828125, -0.2749443054199219, -0.2647857666015625, -0.2546272277832031, -0.24446868896484375, -0.23431015014648438, -0.224151611328125, -0.21399307250976562, -0.20383453369140625, -0.19367599487304688, -0.1835174560546875, -0.17335891723632812, -0.16320037841796875, -0.15304183959960938, -0.14288330078125, -0.13272476196289062, -0.12256622314453125, -0.11240768432617188, -0.1022491455078125, -0.09209060668945312, -0.08193206787109375, -0.07177352905273438, -0.061614990234375, -0.051456451416015625, -0.04129791259765625, -0.031139373779296875, -0.0209808349609375, -0.010822296142578125, -0.00066375732421875, 0.009494781494140625, 0.0196533203125, 0.029811859130859375, 0.03997039794921875, 0.050128936767578125, 0.0602874755859375, 0.07044601440429688, 0.08060455322265625, 0.09076309204101562, 0.100921630859375, 0.11108016967773438, 0.12123870849609375, 0.13139724731445312, 0.1415557861328125, 0.15171432495117188, 0.16187286376953125, 0.17203140258789062, 0.18218994140625, 0.19234848022460938, 0.20250701904296875, 0.21266555786132812, 0.2228240966796875, 0.23298263549804688, 0.24314117431640625, 0.2532997131347656, 0.263458251953125, 0.2736167907714844, 0.28377532958984375, 0.2939338684082031, 0.3040924072265625, 0.3142509460449219, 0.32440948486328125, 0.3345680236816406, 0.3447265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 4.0, 6.0, 1.0, 5.0, 9.0, 7.0, 10.0, 12.0, 17.0, 15.0, 23.0, 21.0, 36.0, 31.0, 35.0, 40.0, 49.0, 43.0, 47.0, 59.0, 74.0, 71.0, 52.0, 41.0, 45.0, 27.0, 37.0, 19.0, 25.0, 26.0, 13.0, 10.0, 14.0, 17.0, 15.0, 10.0, 8.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0078125, -0.0075681209564208984, -0.007323741912841797, -0.007079362869262695, -0.006834983825683594, -0.006590604782104492, -0.006346225738525391, -0.006101846694946289, -0.0058574676513671875, -0.005613088607788086, -0.005368709564208984, -0.005124330520629883, -0.004879951477050781, -0.00463557243347168, -0.004391193389892578, -0.0041468143463134766, -0.003902435302734375, -0.0036580562591552734, -0.003413677215576172, -0.0031692981719970703, -0.0029249191284179688, -0.002680540084838867, -0.0024361610412597656, -0.002191781997680664, -0.0019474029541015625, -0.001703023910522461, -0.0014586448669433594, -0.0012142658233642578, -0.0009698867797851562, -0.0007255077362060547, -0.0004811286926269531, -0.00023674964904785156, 7.62939453125e-06, 0.00025200843811035156, 0.0004963874816894531, 0.0007407665252685547, 0.0009851455688476562, 0.0012295246124267578, 0.0014739036560058594, 0.001718282699584961, 0.0019626617431640625, 0.002207040786743164, 0.0024514198303222656, 0.002695798873901367, 0.0029401779174804688, 0.0031845569610595703, 0.003428936004638672, 0.0036733150482177734, 0.003917694091796875, 0.0041620731353759766, 0.004406452178955078, 0.00465083122253418, 0.004895210266113281, 0.005139589309692383, 0.005383968353271484, 0.005628347396850586, 0.0058727264404296875, 0.006117105484008789, 0.006361484527587891, 0.006605863571166992, 0.006850242614746094, 0.007094621658325195, 0.007339000701904297, 0.0075833797454833984, 0.0078277587890625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 10.0, 6.0, 8.0, 13.0, 19.0, 20.0, 18.0, 21.0, 25.0, 48.0, 50.0, 47.0, 106.0, 112.0, 221.0, 350.0, 604.0, 1325.0, 72856.0, 965220.0, 5335.0, 848.0, 445.0, 267.0, 153.0, 100.0, 82.0, 58.0, 48.0, 27.0, 28.0, 22.0, 13.0, 10.0, 10.0, 6.0, 6.0, 5.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1627197265625, -0.15768051147460938, -0.15264129638671875, -0.14760208129882812, -0.1425628662109375, -0.13752365112304688, -0.13248443603515625, -0.12744522094726562, -0.122406005859375, -0.11736679077148438, -0.11232757568359375, -0.10728836059570312, -0.1022491455078125, -0.09720993041992188, -0.09217071533203125, -0.08713150024414062, -0.08209228515625, -0.07705307006835938, -0.07201385498046875, -0.06697463989257812, -0.0619354248046875, -0.056896209716796875, -0.05185699462890625, -0.046817779541015625, -0.041778564453125, -0.036739349365234375, -0.03170013427734375, -0.026660919189453125, -0.0216217041015625, -0.016582489013671875, -0.01154327392578125, -0.006504058837890625, -0.00146484375, 0.003574371337890625, 0.00861358642578125, 0.013652801513671875, 0.0186920166015625, 0.023731231689453125, 0.02877044677734375, 0.033809661865234375, 0.038848876953125, 0.043888092041015625, 0.04892730712890625, 0.053966522216796875, 0.0590057373046875, 0.06404495239257812, 0.06908416748046875, 0.07412338256835938, 0.07916259765625, 0.08420181274414062, 0.08924102783203125, 0.09428024291992188, 0.0993194580078125, 0.10435867309570312, 0.10939788818359375, 0.11443710327148438, 0.119476318359375, 0.12451553344726562, 0.12955474853515625, 0.13459396362304688, 0.1396331787109375, 0.14467239379882812, 0.14971160888671875, 0.15475082397460938, 0.1597900390625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 13.0, 51.0, 249.0, 490.0, 164.0, 36.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08371630311012268, -0.08194980025291443, -0.08018328994512558, -0.07841678708791733, -0.07665027678012848, -0.07488377392292023, -0.07311726361513138, -0.07135076075792313, -0.06958425045013428, -0.06781774759292603, -0.06605123728513718, -0.06428473442792892, -0.06251822412014008, -0.060751721262931824, -0.058985210955142975, -0.05721870809793472, -0.05545220524072647, -0.05368569865822792, -0.05191919207572937, -0.05015268549323082, -0.04838617891073227, -0.04661967605352402, -0.04485316574573517, -0.043086662888526917, -0.04132015258073807, -0.03955364599823952, -0.03778713941574097, -0.036020632833242416, -0.034254126250743866, -0.032487623393535614, -0.030721114948391914, -0.028954610228538513, -0.027188103646039963, -0.025421597063541412, -0.023655090481042862, -0.02188858389854431, -0.02012207917869091, -0.01835557259619236, -0.01658906601369381, -0.014822560362517834, -0.013056053780019283, -0.011289547197520733, -0.009523041546344757, -0.007756534963846207, -0.0059900288470089436, -0.0042235227301716805, -0.00245701614767313, -0.0006905104964971542, 0.0010759960860013962, 0.0028425022028386593, 0.004609008319675922, 0.006375514902174473, 0.008142020553350449, 0.009908527135848999, 0.01167503371834755, 0.013441539369523525, 0.015208045952022076, 0.01697455160319805, 0.018741058185696602, 0.020507564768195152, 0.022274071350693703, 0.024040576070547104, 0.025807082653045654, 0.027573589235544205, 0.029340095818042755]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 11.0, 6.0, 16.0, 17.0, 14.0, 17.0, 25.0, 22.0, 25.0, 33.0, 25.0, 37.0, 41.0, 46.0, 28.0, 39.0, 53.0, 45.0, 38.0, 46.0, 48.0, 43.0, 35.0, 33.0, 43.0, 37.0, 24.0, 23.0, 15.0, 15.0, 17.0, 7.0, 15.0, 3.0, 7.0, 8.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.009371161460876465, -0.00905415415763855, -0.008737146854400635, -0.00842013955116272, -0.008103132247924805, -0.00778612494468689, -0.007469117641448975, -0.00715211033821106, -0.0068351030349731445, -0.0065180957317352295, -0.0062010884284973145, -0.005884081125259399, -0.005567073822021484, -0.005250066518783569, -0.004933059215545654, -0.004616051912307739, -0.004299044609069824, -0.003982037305831909, -0.003665030002593994, -0.003348022699356079, -0.003031015396118164, -0.002714008092880249, -0.002397000789642334, -0.002079993486404419, -0.001762986183166504, -0.0014459788799285889, -0.0011289715766906738, -0.0008119642734527588, -0.0004949569702148438, -0.0001779496669769287, 0.00013905763626098633, 0.00045606493949890137, 0.0007730722427368164, 0.0010900795459747314, 0.0014070868492126465, 0.0017240941524505615, 0.0020411014556884766, 0.0023581087589263916, 0.0026751160621643066, 0.0029921233654022217, 0.0033091306686401367, 0.0036261379718780518, 0.003943145275115967, 0.004260152578353882, 0.004577159881591797, 0.004894167184829712, 0.005211174488067627, 0.005528181791305542, 0.005845189094543457, 0.006162196397781372, 0.006479203701019287, 0.006796211004257202, 0.007113218307495117, 0.007430225610733032, 0.007747232913970947, 0.008064240217208862, 0.008381247520446777, 0.008698254823684692, 0.009015262126922607, 0.009332269430160522, 0.009649276733398438, 0.009966284036636353, 0.010283291339874268, 0.010600298643112183, 0.010917305946350098]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 11.0, 8.0, 6.0, 18.0, 24.0, 17.0, 22.0, 19.0, 28.0, 37.0, 17.0, 46.0, 28.0, 36.0, 41.0, 42.0, 49.0, 42.0, 49.0, 29.0, 31.0, 39.0, 36.0, 39.0, 32.0, 24.0, 24.0, 37.0, 23.0, 13.0, 23.0, 10.0, 12.0, 15.0, 8.0, 5.0, 14.0, 5.0, 3.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6201171875, -1.5690155029296875, -1.517913818359375, -1.4668121337890625, -1.41571044921875, -1.3646087646484375, -1.313507080078125, -1.2624053955078125, -1.2113037109375, -1.1602020263671875, -1.109100341796875, -1.0579986572265625, -1.00689697265625, -0.9557952880859375, -0.904693603515625, -0.8535919189453125, -0.802490234375, -0.7513885498046875, -0.700286865234375, -0.6491851806640625, -0.59808349609375, -0.5469818115234375, -0.495880126953125, -0.4447784423828125, -0.3936767578125, -0.3425750732421875, -0.291473388671875, -0.2403717041015625, -0.18927001953125, -0.1381683349609375, -0.087066650390625, -0.0359649658203125, 0.01513671875, 0.0662384033203125, 0.117340087890625, 0.1684417724609375, 0.21954345703125, 0.2706451416015625, 0.321746826171875, 0.3728485107421875, 0.4239501953125, 0.4750518798828125, 0.526153564453125, 0.5772552490234375, 0.62835693359375, 0.6794586181640625, 0.730560302734375, 0.7816619873046875, 0.832763671875, 0.8838653564453125, 0.934967041015625, 0.9860687255859375, 1.03717041015625, 1.0882720947265625, 1.139373779296875, 1.1904754638671875, 1.2415771484375, 1.2926788330078125, 1.343780517578125, 1.3948822021484375, 1.44598388671875, 1.4970855712890625, 1.548187255859375, 1.5992889404296875, 1.650390625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 9.0, 4.0, 6.0, 5.0, 8.0, 18.0, 9.0, 18.0, 28.0, 35.0, 47.0, 56.0, 65.0, 119.0, 112.0, 172.0, 204.0, 286.0, 386.0, 546.0, 820.0, 1354.0, 2348.0, 4777.0, 11169.0, 33100.0, 135623.0, 557908.0, 222336.0, 48272.0, 14920.0, 6038.0, 2847.0, 1620.0, 947.0, 573.0, 475.0, 333.0, 226.0, 183.0, 125.0, 84.0, 82.0, 63.0, 54.0, 37.0, 22.0, 24.0, 15.0, 22.0, 13.0, 10.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.275390625, -2.2034912109375, -2.131591796875, -2.0596923828125, -1.98779296875, -1.9158935546875, -1.843994140625, -1.7720947265625, -1.7001953125, -1.6282958984375, -1.556396484375, -1.4844970703125, -1.41259765625, -1.3406982421875, -1.268798828125, -1.1968994140625, -1.125, -1.0531005859375, -0.981201171875, -0.9093017578125, -0.83740234375, -0.7655029296875, -0.693603515625, -0.6217041015625, -0.5498046875, -0.4779052734375, -0.406005859375, -0.3341064453125, -0.26220703125, -0.1903076171875, -0.118408203125, -0.0465087890625, 0.025390625, 0.0972900390625, 0.169189453125, 0.2410888671875, 0.31298828125, 0.3848876953125, 0.456787109375, 0.5286865234375, 0.6005859375, 0.6724853515625, 0.744384765625, 0.8162841796875, 0.88818359375, 0.9600830078125, 1.031982421875, 1.1038818359375, 1.17578125, 1.2476806640625, 1.319580078125, 1.3914794921875, 1.46337890625, 1.5352783203125, 1.607177734375, 1.6790771484375, 1.7509765625, 1.8228759765625, 1.894775390625, 1.9666748046875, 2.03857421875, 2.1104736328125, 2.182373046875, 2.2542724609375, 2.326171875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 3.0, 11.0, 12.0, 10.0, 9.0, 20.0, 30.0, 25.0, 32.0, 41.0, 64.0, 57.0, 86.0, 154.0, 400.0, 1471.0, 152.0, 93.0, 59.0, 42.0, 48.0, 47.0, 29.0, 32.0, 31.0, 18.0, 19.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.7109375, -5.54345703125, -5.3759765625, -5.20849609375, -5.041015625, -4.87353515625, -4.7060546875, -4.53857421875, -4.37109375, -4.20361328125, -4.0361328125, -3.86865234375, -3.701171875, -3.53369140625, -3.3662109375, -3.19873046875, -3.03125, -2.86376953125, -2.6962890625, -2.52880859375, -2.361328125, -2.19384765625, -2.0263671875, -1.85888671875, -1.69140625, -1.52392578125, -1.3564453125, -1.18896484375, -1.021484375, -0.85400390625, -0.6865234375, -0.51904296875, -0.3515625, -0.18408203125, -0.0166015625, 0.15087890625, 0.318359375, 0.48583984375, 0.6533203125, 0.82080078125, 0.98828125, 1.15576171875, 1.3232421875, 1.49072265625, 1.658203125, 1.82568359375, 1.9931640625, 2.16064453125, 2.328125, 2.49560546875, 2.6630859375, 2.83056640625, 2.998046875, 3.16552734375, 3.3330078125, 3.50048828125, 3.66796875, 3.83544921875, 4.0029296875, 4.17041015625, 4.337890625, 4.50537109375, 4.6728515625, 4.84033203125, 5.0078125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 15.0, 17.0, 25.0, 46.0, 69.0, 60.0, 132.0, 186.0, 382.0, 805.0, 6176.0, 3100472.0, 35028.0, 1234.0, 431.0, 216.0, 123.0, 91.0, 57.0, 43.0, 24.0, 23.0, 11.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9337158203125, -11.531494140625, -11.1292724609375, -10.72705078125, -10.3248291015625, -9.922607421875, -9.5203857421875, -9.1181640625, -8.7159423828125, -8.313720703125, -7.9114990234375, -7.50927734375, -7.1070556640625, -6.704833984375, -6.3026123046875, -5.900390625, -5.4981689453125, -5.095947265625, -4.6937255859375, -4.29150390625, -3.8892822265625, -3.487060546875, -3.0848388671875, -2.6826171875, -2.2803955078125, -1.878173828125, -1.4759521484375, -1.07373046875, -0.6715087890625, -0.269287109375, 0.1329345703125, 0.53515625, 0.9373779296875, 1.339599609375, 1.7418212890625, 2.14404296875, 2.5462646484375, 2.948486328125, 3.3507080078125, 3.7529296875, 4.1551513671875, 4.557373046875, 4.9595947265625, 5.36181640625, 5.7640380859375, 6.166259765625, 6.5684814453125, 6.970703125, 7.3729248046875, 7.775146484375, 8.1773681640625, 8.57958984375, 8.9818115234375, 9.384033203125, 9.7862548828125, 10.1884765625, 10.5906982421875, 10.992919921875, 11.3951416015625, 11.79736328125, 12.1995849609375, 12.601806640625, 13.0040283203125, 13.40625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 422.0, 575.0, 11.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.99500274658203, -30.011463165283203, -27.027923583984375, -24.04438591003418, -21.06084632873535, -18.077306747436523, -15.093769073486328, -12.1102294921875, -9.126689910888672, -6.143150806427002, -3.159611701965332, -0.1760730743408203, 2.807466506958008, 5.791006088256836, 8.774543762207031, 11.75808334350586, 14.741622924804688, 17.725162506103516, 20.708702087402344, 23.69223976135254, 26.675779342651367, 29.659318923950195, 32.64285659790039, 35.62639617919922, 38.60993576049805, 41.593475341796875, 44.5770149230957, 47.56055450439453, 50.544090270996094, 53.52763366699219, 56.51116943359375, 59.49470901489258, 62.47825622558594, 65.4617919921875, 68.4453353881836, 71.42887115478516, 74.41241455078125, 77.39595031738281, 80.37948608398438, 83.36302947998047, 86.34657287597656, 89.33010864257812, 92.31365203857422, 95.29718780517578, 98.28073120117188, 101.26426696777344, 104.247802734375, 107.2313461303711, 110.21488189697266, 113.19841766357422, 116.18196105957031, 119.16549682617188, 122.14904022216797, 125.13257598876953, 128.11611938476562, 131.0996551513672, 134.08319091796875, 137.0667266845703, 140.05026245117188, 143.0338134765625, 146.01734924316406, 149.00088500976562, 151.9844207763672, 154.96795654296875, 157.95150756835938]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 10.0, 16.0, 13.0, 11.0, 20.0, 22.0, 24.0, 15.0, 35.0, 39.0, 27.0, 34.0, 33.0, 36.0, 29.0, 45.0, 34.0, 37.0, 36.0, 38.0, 44.0, 35.0, 34.0, 23.0, 30.0, 27.0, 28.0, 29.0, 19.0, 19.0, 22.0, 14.0, 9.0, 16.0, 10.0, 8.0, 7.0, 11.0, 3.0, 8.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-10.323773384094238, -10.025274276733398, -9.726776123046875, -9.428277969360352, -9.129778861999512, -8.831279754638672, -8.532781600952148, -8.234283447265625, -7.935784339904785, -7.6372857093811035, -7.338787078857422, -7.04028844833374, -6.741789817810059, -6.443291187286377, -6.144792556762695, -5.846293926239014, -5.547795295715332, -5.24929666519165, -4.950798034667969, -4.652299404144287, -4.3538007736206055, -4.055302143096924, -3.756803512573242, -3.4583048820495605, -3.159806251525879, -2.8613076210021973, -2.5628089904785156, -2.264310359954834, -1.9658117294311523, -1.6673130989074707, -1.368814468383789, -1.0703158378601074, -0.7718172073364258, -0.47331857681274414, -0.1748199462890625, 0.12367868423461914, 0.4221773147583008, 0.7206759452819824, 1.019174575805664, 1.3176732063293457, 1.6161718368530273, 1.914670467376709, 2.2131690979003906, 2.5116677284240723, 2.810166358947754, 3.1086649894714355, 3.407163619995117, 3.705662250518799, 4.0041608810424805, 4.302659511566162, 4.601158142089844, 4.899656772613525, 5.198155403137207, 5.496654033660889, 5.79515266418457, 6.093651294708252, 6.392149925231934, 6.690648555755615, 6.989147186279297, 7.2876458168029785, 7.58614444732666, 7.884643077850342, 8.183141708374023, 8.481639862060547, 8.780138969421387]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 7.0, 12.0, 6.0, 7.0, 10.0, 8.0, 13.0, 25.0, 28.0, 23.0, 35.0, 18.0, 36.0, 32.0, 38.0, 25.0, 53.0, 40.0, 40.0, 40.0, 53.0, 54.0, 39.0, 44.0, 35.0, 28.0, 28.0, 25.0, 27.0, 25.0, 25.0, 20.0, 16.0, 14.0, 11.0, 14.0, 11.0, 8.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.044921875, -1.9842681884765625, -1.923614501953125, -1.8629608154296875, -1.80230712890625, -1.7416534423828125, -1.680999755859375, -1.6203460693359375, -1.5596923828125, -1.4990386962890625, -1.438385009765625, -1.3777313232421875, -1.31707763671875, -1.2564239501953125, -1.195770263671875, -1.1351165771484375, -1.074462890625, -1.0138092041015625, -0.953155517578125, -0.8925018310546875, -0.83184814453125, -0.7711944580078125, -0.710540771484375, -0.6498870849609375, -0.5892333984375, -0.5285797119140625, -0.467926025390625, -0.4072723388671875, -0.34661865234375, -0.2859649658203125, -0.225311279296875, -0.1646575927734375, -0.10400390625, -0.0433502197265625, 0.017303466796875, 0.0779571533203125, 0.13861083984375, 0.1992645263671875, 0.259918212890625, 0.3205718994140625, 0.3812255859375, 0.4418792724609375, 0.502532958984375, 0.5631866455078125, 0.62384033203125, 0.6844940185546875, 0.745147705078125, 0.8058013916015625, 0.866455078125, 0.9271087646484375, 0.987762451171875, 1.0484161376953125, 1.10906982421875, 1.1697235107421875, 1.230377197265625, 1.2910308837890625, 1.3516845703125, 1.4123382568359375, 1.472991943359375, 1.5336456298828125, 1.59429931640625, 1.6549530029296875, 1.715606689453125, 1.7762603759765625, 1.8369140625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 7.0, 9.0, 13.0, 16.0, 18.0, 21.0, 38.0, 62.0, 76.0, 112.0, 139.0, 218.0, 323.0, 489.0, 839.0, 1638.0, 3985.0, 12130.0, 51766.0, 684353.0, 3186915.0, 206812.0, 30134.0, 7959.0, 2908.0, 1284.0, 688.0, 384.0, 316.0, 183.0, 125.0, 85.0, 72.0, 40.0, 36.0, 26.0, 13.0, 10.0, 14.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.03125, -8.76025390625, -8.4892578125, -8.21826171875, -7.947265625, -7.67626953125, -7.4052734375, -7.13427734375, -6.86328125, -6.59228515625, -6.3212890625, -6.05029296875, -5.779296875, -5.50830078125, -5.2373046875, -4.96630859375, -4.6953125, -4.42431640625, -4.1533203125, -3.88232421875, -3.611328125, -3.34033203125, -3.0693359375, -2.79833984375, -2.52734375, -2.25634765625, -1.9853515625, -1.71435546875, -1.443359375, -1.17236328125, -0.9013671875, -0.63037109375, -0.359375, -0.08837890625, 0.1826171875, 0.45361328125, 0.724609375, 0.99560546875, 1.2666015625, 1.53759765625, 1.80859375, 2.07958984375, 2.3505859375, 2.62158203125, 2.892578125, 3.16357421875, 3.4345703125, 3.70556640625, 3.9765625, 4.24755859375, 4.5185546875, 4.78955078125, 5.060546875, 5.33154296875, 5.6025390625, 5.87353515625, 6.14453125, 6.41552734375, 6.6865234375, 6.95751953125, 7.228515625, 7.49951171875, 7.7705078125, 8.04150390625, 8.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 4.0, 3.0, 2.0, 9.0, 12.0, 6.0, 18.0, 22.0, 27.0, 24.0, 44.0, 71.0, 82.0, 120.0, 201.0, 202.0, 323.0, 426.0, 536.0, 521.0, 410.0, 277.0, 197.0, 138.0, 109.0, 70.0, 49.0, 41.0, 31.0, 21.0, 15.0, 18.0, 14.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30859375, -4.184906005859375, -4.06121826171875, -3.937530517578125, -3.8138427734375, -3.690155029296875, -3.56646728515625, -3.442779541015625, -3.319091796875, -3.195404052734375, -3.07171630859375, -2.948028564453125, -2.8243408203125, -2.700653076171875, -2.57696533203125, -2.453277587890625, -2.32958984375, -2.205902099609375, -2.08221435546875, -1.958526611328125, -1.8348388671875, -1.711151123046875, -1.58746337890625, -1.463775634765625, -1.340087890625, -1.216400146484375, -1.09271240234375, -0.969024658203125, -0.8453369140625, -0.721649169921875, -0.59796142578125, -0.474273681640625, -0.3505859375, -0.226898193359375, -0.10321044921875, 0.020477294921875, 0.1441650390625, 0.267852783203125, 0.39154052734375, 0.515228271484375, 0.638916015625, 0.762603759765625, 0.88629150390625, 1.009979248046875, 1.1336669921875, 1.257354736328125, 1.38104248046875, 1.504730224609375, 1.62841796875, 1.752105712890625, 1.87579345703125, 1.999481201171875, 2.1231689453125, 2.246856689453125, 2.37054443359375, 2.494232177734375, 2.617919921875, 2.741607666015625, 2.86529541015625, 2.988983154296875, 3.1126708984375, 3.236358642578125, 3.36004638671875, 3.483734130859375, 3.607421875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 15.0, 20.0, 40.0, 64.0, 118.0, 269.0, 548.0, 948.0, 2062.0, 4446.0, 10239.0, 26136.0, 78866.0, 303968.0, 1747121.0, 1620540.0, 281756.0, 74048.0, 25081.0, 9850.0, 4264.0, 1985.0, 911.0, 475.0, 235.0, 131.0, 54.0, 34.0, 14.0, 9.0, 10.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.29827880859375, -3.1844482421875, -3.07061767578125, -2.956787109375, -2.84295654296875, -2.7291259765625, -2.61529541015625, -2.50146484375, -2.38763427734375, -2.2738037109375, -2.15997314453125, -2.046142578125, -1.93231201171875, -1.8184814453125, -1.70465087890625, -1.5908203125, -1.47698974609375, -1.3631591796875, -1.24932861328125, -1.135498046875, -1.02166748046875, -0.9078369140625, -0.79400634765625, -0.68017578125, -0.56634521484375, -0.4525146484375, -0.33868408203125, -0.224853515625, -0.11102294921875, 0.0028076171875, 0.11663818359375, 0.23046875, 0.34429931640625, 0.4581298828125, 0.57196044921875, 0.685791015625, 0.79962158203125, 0.9134521484375, 1.02728271484375, 1.14111328125, 1.25494384765625, 1.3687744140625, 1.48260498046875, 1.596435546875, 1.71026611328125, 1.8240966796875, 1.93792724609375, 2.0517578125, 2.16558837890625, 2.2794189453125, 2.39324951171875, 2.507080078125, 2.62091064453125, 2.7347412109375, 2.84857177734375, 2.96240234375, 3.07623291015625, 3.1900634765625, 3.30389404296875, 3.417724609375, 3.53155517578125, 3.6453857421875, 3.75921630859375, 3.873046875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 13.0, 13.0, 17.0, 19.0, 34.0, 34.0, 35.0, 37.0, 56.0, 66.0, 64.0, 68.0, 79.0, 71.0, 64.0, 54.0, 53.0, 39.0, 36.0, 27.0, 18.0, 17.0, 18.0, 10.0, 5.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.133560180664062, -22.4728946685791, -21.81222915649414, -21.151561737060547, -20.490896224975586, -19.830230712890625, -19.16956329345703, -18.50889778137207, -17.84823226928711, -17.18756675720215, -16.526901245117188, -15.866233825683594, -15.205568313598633, -14.544902801513672, -13.884236335754395, -13.223569869995117, -12.562904357910156, -11.902238845825195, -11.241572380065918, -10.58090591430664, -9.92024040222168, -9.259574890136719, -8.598908424377441, -7.938242435455322, -7.277576446533203, -6.616910457611084, -5.956244468688965, -5.295578479766846, -4.634912490844727, -3.9742465019226074, -3.3135805130004883, -2.652914524078369, -1.99224853515625, -1.3315825462341309, -0.6709165573120117, -0.010250568389892578, 0.6504154205322266, 1.3110814094543457, 1.9717473983764648, 2.632413387298584, 3.293079376220703, 3.9537453651428223, 4.614411354064941, 5.2750773429870605, 5.93574333190918, 6.596409320831299, 7.257075309753418, 7.917741298675537, 8.578407287597656, 9.239072799682617, 9.899739265441895, 10.560405731201172, 11.221071243286133, 11.881736755371094, 12.542403221130371, 13.203069686889648, 13.86373519897461, 14.52440071105957, 15.185067176818848, 15.845733642578125, 16.506399154663086, 17.167064666748047, 17.82773208618164, 18.4883975982666, 19.149063110351562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 11.0, 13.0, 11.0, 28.0, 15.0, 21.0, 28.0, 30.0, 26.0, 37.0, 32.0, 48.0, 33.0, 47.0, 48.0, 51.0, 40.0, 37.0, 29.0, 41.0, 42.0, 34.0, 27.0, 35.0, 29.0, 22.0, 34.0, 24.0, 12.0, 14.0, 13.0, 14.0, 5.0, 11.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.55138397216797, -16.04643440246582, -15.541484832763672, -15.036535263061523, -14.531585693359375, -14.026636123657227, -13.521687507629395, -13.016737937927246, -12.511788368225098, -12.00683879852295, -11.5018892288208, -10.996939659118652, -10.49199104309082, -9.987041473388672, -9.482091903686523, -8.977142333984375, -8.472192764282227, -7.967243194580078, -7.46229362487793, -6.9573445320129395, -6.452394962310791, -5.947445392608643, -5.442496299743652, -4.937546730041504, -4.4325971603393555, -3.927647590637207, -3.4226982593536377, -2.9177489280700684, -2.41279935836792, -1.9078497886657715, -1.4029004573822021, -0.8979511260986328, -0.39300060272216797, 0.11194884777069092, 0.6168982982635498, 1.1218477487564087, 1.6267971992492676, 2.131746768951416, 2.6366961002349854, 3.1416454315185547, 3.646595001220703, 4.151544570922852, 4.656494140625, 5.16144323348999, 5.666392803192139, 6.171342372894287, 6.676291465759277, 7.181241035461426, 7.686190605163574, 8.191140174865723, 8.696089744567871, 9.20103931427002, 9.705987930297852, 10.2109375, 10.715887069702148, 11.220836639404297, 11.725786209106445, 12.230735778808594, 12.735685348510742, 13.24063491821289, 13.745584487915039, 14.250534057617188, 14.75548267364502, 15.260432243347168, 15.765381813049316]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 4.0, 4.0, 4.0, 6.0, 7.0, 7.0, 16.0, 13.0, 13.0, 17.0, 22.0, 26.0, 28.0, 20.0, 34.0, 41.0, 36.0, 34.0, 45.0, 45.0, 47.0, 44.0, 50.0, 39.0, 31.0, 35.0, 53.0, 38.0, 26.0, 32.0, 24.0, 37.0, 21.0, 21.0, 17.0, 10.0, 17.0, 6.0, 11.0, 4.0, 4.0, 5.0, 4.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.5, -33.4091796875, -32.318359375, -31.2275390625, -30.13671875, -29.0458984375, -27.955078125, -26.8642578125, -25.7734375, -24.6826171875, -23.591796875, -22.5009765625, -21.41015625, -20.3193359375, -19.228515625, -18.1376953125, -17.046875, -15.9560546875, -14.865234375, -13.7744140625, -12.68359375, -11.5927734375, -10.501953125, -9.4111328125, -8.3203125, -7.2294921875, -6.138671875, -5.0478515625, -3.95703125, -2.8662109375, -1.775390625, -0.6845703125, 0.40625, 1.4970703125, 2.587890625, 3.6787109375, 4.76953125, 5.8603515625, 6.951171875, 8.0419921875, 9.1328125, 10.2236328125, 11.314453125, 12.4052734375, 13.49609375, 14.5869140625, 15.677734375, 16.7685546875, 17.859375, 18.9501953125, 20.041015625, 21.1318359375, 22.22265625, 23.3134765625, 24.404296875, 25.4951171875, 26.5859375, 27.6767578125, 28.767578125, 29.8583984375, 30.94921875, 32.0400390625, 33.130859375, 34.2216796875, 35.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 10.0, 9.0, 18.0, 23.0, 33.0, 49.0, 71.0, 131.0, 211.0, 333.0, 446.0, 719.0, 1171.0, 1844.0, 2904.0, 4732.0, 7428.0, 12456.0, 20899.0, 36781.0, 67273.0, 128665.0, 232751.0, 236607.0, 132151.0, 68689.0, 37423.0, 21371.0, 12863.0, 7572.0, 4726.0, 3015.0, 1871.0, 1220.0, 739.0, 485.0, 325.0, 195.0, 136.0, 73.0, 43.0, 42.0, 19.0, 16.0, 7.0, 12.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7607421875, -1.708984375, -1.6572265625, -1.60546875, -1.5537109375, -1.501953125, -1.4501953125, -1.3984375, -1.3466796875, -1.294921875, -1.2431640625, -1.19140625, -1.1396484375, -1.087890625, -1.0361328125, -0.984375, -0.9326171875, -0.880859375, -0.8291015625, -0.77734375, -0.7255859375, -0.673828125, -0.6220703125, -0.5703125, -0.5185546875, -0.466796875, -0.4150390625, -0.36328125, -0.3115234375, -0.259765625, -0.2080078125, -0.15625, -0.1044921875, -0.052734375, -0.0009765625, 0.05078125, 0.1025390625, 0.154296875, 0.2060546875, 0.2578125, 0.3095703125, 0.361328125, 0.4130859375, 0.46484375, 0.5166015625, 0.568359375, 0.6201171875, 0.671875, 0.7236328125, 0.775390625, 0.8271484375, 0.87890625, 0.9306640625, 0.982421875, 1.0341796875, 1.0859375, 1.1376953125, 1.189453125, 1.2412109375, 1.29296875, 1.3447265625, 1.396484375, 1.4482421875, 1.5, 1.5517578125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 9.0, 7.0, 10.0, 6.0, 9.0, 16.0, 12.0, 18.0, 21.0, 20.0, 32.0, 38.0, 24.0, 30.0, 43.0, 42.0, 42.0, 39.0, 43.0, 1080.0, 33.0, 35.0, 51.0, 48.0, 37.0, 30.0, 30.0, 36.0, 34.0, 26.0, 26.0, 17.0, 14.0, 12.0, 12.0, 10.0, 10.0, 6.0, 9.0, 2.0, 1.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.8125, -20.1337890625, -19.455078125, -18.7763671875, -18.09765625, -17.4189453125, -16.740234375, -16.0615234375, -15.3828125, -14.7041015625, -14.025390625, -13.3466796875, -12.66796875, -11.9892578125, -11.310546875, -10.6318359375, -9.953125, -9.2744140625, -8.595703125, -7.9169921875, -7.23828125, -6.5595703125, -5.880859375, -5.2021484375, -4.5234375, -3.8447265625, -3.166015625, -2.4873046875, -1.80859375, -1.1298828125, -0.451171875, 0.2275390625, 0.90625, 1.5849609375, 2.263671875, 2.9423828125, 3.62109375, 4.2998046875, 4.978515625, 5.6572265625, 6.3359375, 7.0146484375, 7.693359375, 8.3720703125, 9.05078125, 9.7294921875, 10.408203125, 11.0869140625, 11.765625, 12.4443359375, 13.123046875, 13.8017578125, 14.48046875, 15.1591796875, 15.837890625, 16.5166015625, 17.1953125, 17.8740234375, 18.552734375, 19.2314453125, 19.91015625, 20.5888671875, 21.267578125, 21.9462890625, 22.625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 4.0, 8.0, 12.0, 10.0, 13.0, 15.0, 19.0, 26.0, 33.0, 36.0, 74.0, 112.0, 212.0, 391.0, 887.0, 1837.0, 4442.0, 11350.0, 38294.0, 1674848.0, 320521.0, 28060.0, 9128.0, 3649.0, 1571.0, 697.0, 339.0, 165.0, 116.0, 66.0, 38.0, 22.0, 26.0, 21.0, 17.0, 17.0, 6.0, 9.0, 5.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.6328125, -5.4378662109375, -5.242919921875, -5.0479736328125, -4.85302734375, -4.6580810546875, -4.463134765625, -4.2681884765625, -4.0732421875, -3.8782958984375, -3.683349609375, -3.4884033203125, -3.29345703125, -3.0985107421875, -2.903564453125, -2.7086181640625, -2.513671875, -2.3187255859375, -2.123779296875, -1.9288330078125, -1.73388671875, -1.5389404296875, -1.343994140625, -1.1490478515625, -0.9541015625, -0.7591552734375, -0.564208984375, -0.3692626953125, -0.17431640625, 0.0206298828125, 0.215576171875, 0.4105224609375, 0.60546875, 0.8004150390625, 0.995361328125, 1.1903076171875, 1.38525390625, 1.5802001953125, 1.775146484375, 1.9700927734375, 2.1650390625, 2.3599853515625, 2.554931640625, 2.7498779296875, 2.94482421875, 3.1397705078125, 3.334716796875, 3.5296630859375, 3.724609375, 3.9195556640625, 4.114501953125, 4.3094482421875, 4.50439453125, 4.6993408203125, 4.894287109375, 5.0892333984375, 5.2841796875, 5.4791259765625, 5.674072265625, 5.8690185546875, 6.06396484375, 6.2589111328125, 6.453857421875, 6.6488037109375, 6.84375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 7.0, 3.0, 2.0, 8.0, 8.0, 6.0, 10.0, 13.0, 16.0, 16.0, 21.0, 30.0, 23.0, 28.0, 35.0, 40.0, 35.0, 43.0, 59.0, 54.0, 44.0, 45.0, 51.0, 50.0, 41.0, 38.0, 42.0, 31.0, 30.0, 38.0, 27.0, 17.0, 18.0, 16.0, 13.0, 10.0, 9.0, 6.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0623779296875, -0.060550689697265625, -0.05872344970703125, -0.056896209716796875, -0.0550689697265625, -0.053241729736328125, -0.05141448974609375, -0.049587249755859375, -0.047760009765625, -0.045932769775390625, -0.04410552978515625, -0.042278289794921875, -0.0404510498046875, -0.038623809814453125, -0.03679656982421875, -0.034969329833984375, -0.03314208984375, -0.031314849853515625, -0.02948760986328125, -0.027660369873046875, -0.0258331298828125, -0.024005889892578125, -0.02217864990234375, -0.020351409912109375, -0.018524169921875, -0.016696929931640625, -0.01486968994140625, -0.013042449951171875, -0.0112152099609375, -0.009387969970703125, -0.00756072998046875, -0.005733489990234375, -0.00390625, -0.002079010009765625, -0.00025177001953125, 0.001575469970703125, 0.0034027099609375, 0.005229949951171875, 0.00705718994140625, 0.008884429931640625, 0.010711669921875, 0.012538909912109375, 0.01436614990234375, 0.016193389892578125, 0.0180206298828125, 0.019847869873046875, 0.02167510986328125, 0.023502349853515625, 0.02532958984375, 0.027156829833984375, 0.02898406982421875, 0.030811309814453125, 0.0326385498046875, 0.034465789794921875, 0.03629302978515625, 0.038120269775390625, 0.039947509765625, 0.041774749755859375, 0.04360198974609375, 0.045429229736328125, 0.0472564697265625, 0.049083709716796875, 0.05091094970703125, 0.052738189697265625, 0.0545654296875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 12.0, 11.0, 18.0, 30.0, 60.0, 52.0, 94.0, 167.0, 232.0, 397.0, 621.0, 945.0, 1708.0, 2953.0, 5736.0, 11328.0, 23759.0, 51736.0, 111335.0, 209871.0, 267898.0, 183987.0, 92406.0, 42540.0, 19839.0, 9495.0, 4844.0, 2651.0, 1499.0, 851.0, 525.0, 337.0, 203.0, 135.0, 98.0, 56.0, 34.0, 30.0, 9.0, 14.0, 10.0, 9.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.2352771759033203, -0.22726821899414062, -0.21925926208496094, -0.21125030517578125, -0.20324134826660156, -0.19523239135742188, -0.1872234344482422, -0.1792144775390625, -0.1712055206298828, -0.16319656372070312, -0.15518760681152344, -0.14717864990234375, -0.13916969299316406, -0.13116073608398438, -0.12315177917480469, -0.115142822265625, -0.10713386535644531, -0.09912490844726562, -0.09111595153808594, -0.08310699462890625, -0.07509803771972656, -0.06708908081054688, -0.05908012390136719, -0.0510711669921875, -0.04306221008300781, -0.035053253173828125, -0.027044296264648438, -0.01903533935546875, -0.011026382446289062, -0.003017425537109375, 0.0049915313720703125, 0.01300048828125, 0.021009445190429688, 0.029018402099609375, 0.03702735900878906, 0.04503631591796875, 0.05304527282714844, 0.061054229736328125, 0.06906318664550781, 0.0770721435546875, 0.08508110046386719, 0.09309005737304688, 0.10109901428222656, 0.10910797119140625, 0.11711692810058594, 0.12512588500976562, 0.1331348419189453, 0.141143798828125, 0.1491527557373047, 0.15716171264648438, 0.16517066955566406, 0.17317962646484375, 0.18118858337402344, 0.18919754028320312, 0.1972064971923828, 0.2052154541015625, 0.2132244110107422, 0.22123336791992188, 0.22924232482910156, 0.23725128173828125, 0.24526023864746094, 0.2532691955566406, 0.2612781524658203, 0.269287109375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 11.0, 13.0, 19.0, 29.0, 37.0, 58.0, 68.0, 67.0, 125.0, 99.0, 104.0, 87.0, 79.0, 55.0, 42.0, 33.0, 20.0, 20.0, 7.0, 13.0, 10.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058886390179395676, -0.054578181356191635, -0.050269972532987595, -0.04596176743507385, -0.04165355861186981, -0.03734534978866577, -0.03303714096546173, -0.02872893214225769, -0.02442072331905365, -0.02011251449584961, -0.01580430567264557, -0.011496098712086678, -0.007187889888882637, -0.0028796810656785965, 0.0014285258948802948, 0.005736734718084335, 0.010044943541288376, 0.014353152364492416, 0.018661361187696457, 0.022969568148255348, 0.02727777697145939, 0.03158598393201828, 0.03589419275522232, 0.04020240157842636, 0.0445106104016304, 0.04881881922483444, 0.05312702804803848, 0.05743523687124252, 0.061743445694446564, 0.0660516545176506, 0.07035985589027405, 0.07466806471347809, 0.07897628843784332, 0.08328449726104736, 0.0875927060842514, 0.09190091490745544, 0.09620912373065948, 0.10051733255386353, 0.10482554137706757, 0.1091337502002716, 0.11344195902347565, 0.11775016784667969, 0.12205837666988373, 0.12636658549308777, 0.1306747943162918, 0.13498300313949585, 0.1392912119626999, 0.14359942078590393, 0.14790761470794678, 0.15221582353115082, 0.15652403235435486, 0.1608322411775589, 0.16514045000076294, 0.16944865882396698, 0.17375686764717102, 0.17806507647037506, 0.1823732852935791, 0.18668149411678314, 0.19098970293998718, 0.19529791176319122, 0.19960612058639526, 0.2039143294095993, 0.20822253823280334, 0.21253074705600739, 0.21683895587921143]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 11.0, 11.0, 15.0, 17.0, 23.0, 21.0, 27.0, 22.0, 21.0, 40.0, 30.0, 42.0, 52.0, 44.0, 40.0, 44.0, 55.0, 33.0, 36.0, 37.0, 42.0, 42.0, 37.0, 33.0, 31.0, 20.0, 18.0, 23.0, 22.0, 9.0, 18.0, 12.0, 8.0, 12.0, 10.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06269901990890503, -0.060835160315036774, -0.05897130072116852, -0.057107437402009964, -0.05524357780814171, -0.05337971821427345, -0.0515158548951149, -0.04965199530124664, -0.04778813570737839, -0.04592427611351013, -0.044060416519641876, -0.04219655320048332, -0.040332693606615067, -0.03846883401274681, -0.03660497069358826, -0.03474111109972, -0.032877251505851746, -0.03101339191198349, -0.029149530455470085, -0.02728566899895668, -0.025421809405088425, -0.02355794981122017, -0.021694088354706764, -0.01983022689819336, -0.017966367304325104, -0.016102507710456848, -0.014238646253943443, -0.012374785728752613, -0.010510925203561783, -0.008647064678370953, -0.006783204153180122, -0.004919343627989292, -0.003055483102798462, -0.0011916225776076317, 0.0006722379475831985, 0.0025360984727740288, 0.004399958997964859, 0.006263819523155689, 0.00812768004834652, 0.00999154057353735, 0.01185540109872818, 0.01371926162391901, 0.01558312214910984, 0.017446983605623245, 0.0193108431994915, 0.021174702793359756, 0.02303856424987316, 0.024902425706386566, 0.026766285300254822, 0.028630144894123077, 0.030494006350636482, 0.03235786780714989, 0.03422172740101814, 0.0360855869948864, 0.03794945031404495, 0.03981330990791321, 0.041677169501781464, 0.04354102909564972, 0.045404888689517975, 0.04726875200867653, 0.049132611602544785, 0.05099647119641304, 0.052860334515571594, 0.05472419410943985, 0.056588053703308105]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 7.0, 6.0, 17.0, 13.0, 14.0, 19.0, 18.0, 29.0, 28.0, 19.0, 37.0, 40.0, 36.0, 38.0, 39.0, 50.0, 42.0, 51.0, 42.0, 44.0, 30.0, 36.0, 51.0, 36.0, 24.0, 35.0, 28.0, 36.0, 21.0, 20.0, 11.0, 10.0, 20.0, 5.0, 10.0, 5.0, 4.0, 6.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.46875, -33.37451171875, -32.2802734375, -31.18603515625, -30.091796875, -28.99755859375, -27.9033203125, -26.80908203125, -25.71484375, -24.62060546875, -23.5263671875, -22.43212890625, -21.337890625, -20.24365234375, -19.1494140625, -18.05517578125, -16.9609375, -15.86669921875, -14.7724609375, -13.67822265625, -12.583984375, -11.48974609375, -10.3955078125, -9.30126953125, -8.20703125, -7.11279296875, -6.0185546875, -4.92431640625, -3.830078125, -2.73583984375, -1.6416015625, -0.54736328125, 0.546875, 1.64111328125, 2.7353515625, 3.82958984375, 4.923828125, 6.01806640625, 7.1123046875, 8.20654296875, 9.30078125, 10.39501953125, 11.4892578125, 12.58349609375, 13.677734375, 14.77197265625, 15.8662109375, 16.96044921875, 18.0546875, 19.14892578125, 20.2431640625, 21.33740234375, 22.431640625, 23.52587890625, 24.6201171875, 25.71435546875, 26.80859375, 27.90283203125, 28.9970703125, 30.09130859375, 31.185546875, 32.27978515625, 33.3740234375, 34.46826171875, 35.5625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0, 5.0, 6.0, 5.0, 8.0, 10.0, 17.0, 15.0, 21.0, 26.0, 41.0, 44.0, 70.0, 103.0, 138.0, 252.0, 405.0, 946.0, 3475.0, 17540.0, 152906.0, 732397.0, 120605.0, 14505.0, 2952.0, 882.0, 430.0, 225.0, 125.0, 113.0, 69.0, 46.0, 49.0, 34.0, 16.0, 15.0, 15.0, 11.0, 6.0, 5.0, 7.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.9400634765625, -6.712158203125, -6.4842529296875, -6.25634765625, -6.0284423828125, -5.800537109375, -5.5726318359375, -5.3447265625, -5.1168212890625, -4.888916015625, -4.6610107421875, -4.43310546875, -4.2052001953125, -3.977294921875, -3.7493896484375, -3.521484375, -3.2935791015625, -3.065673828125, -2.8377685546875, -2.60986328125, -2.3819580078125, -2.154052734375, -1.9261474609375, -1.6982421875, -1.4703369140625, -1.242431640625, -1.0145263671875, -0.78662109375, -0.5587158203125, -0.330810546875, -0.1029052734375, 0.125, 0.3529052734375, 0.580810546875, 0.8087158203125, 1.03662109375, 1.2645263671875, 1.492431640625, 1.7203369140625, 1.9482421875, 2.1761474609375, 2.404052734375, 2.6319580078125, 2.85986328125, 3.0877685546875, 3.315673828125, 3.5435791015625, 3.771484375, 3.9993896484375, 4.227294921875, 4.4552001953125, 4.68310546875, 4.9110107421875, 5.138916015625, 5.3668212890625, 5.5947265625, 5.8226318359375, 6.050537109375, 6.2784423828125, 6.50634765625, 6.7342529296875, 6.962158203125, 7.1900634765625, 7.41796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 18.0, 28.0, 30.0, 23.0, 22.0, 28.0, 31.0, 37.0, 40.0, 53.0, 58.0, 55.0, 2049.0, 100.0, 51.0, 51.0, 53.0, 39.0, 39.0, 36.0, 37.0, 28.0, 22.0, 23.0, 19.0, 16.0, 6.0, 14.0, 4.0, 4.0, 5.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.5439453125, -39.994140625, -38.4443359375, -36.89453125, -35.3447265625, -33.794921875, -32.2451171875, -30.6953125, -29.1455078125, -27.595703125, -26.0458984375, -24.49609375, -22.9462890625, -21.396484375, -19.8466796875, -18.296875, -16.7470703125, -15.197265625, -13.6474609375, -12.09765625, -10.5478515625, -8.998046875, -7.4482421875, -5.8984375, -4.3486328125, -2.798828125, -1.2490234375, 0.30078125, 1.8505859375, 3.400390625, 4.9501953125, 6.5, 8.0498046875, 9.599609375, 11.1494140625, 12.69921875, 14.2490234375, 15.798828125, 17.3486328125, 18.8984375, 20.4482421875, 21.998046875, 23.5478515625, 25.09765625, 26.6474609375, 28.197265625, 29.7470703125, 31.296875, 32.8466796875, 34.396484375, 35.9462890625, 37.49609375, 39.0458984375, 40.595703125, 42.1455078125, 43.6953125, 45.2451171875, 46.794921875, 48.3447265625, 49.89453125, 51.4443359375, 52.994140625, 54.5439453125, 56.09375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 7.0, 9.0, 20.0, 26.0, 38.0, 58.0, 81.0, 147.0, 216.0, 303.0, 551.0, 1069.0, 2158.0, 5576.0, 17695.0, 74911.0, 553973.0, 2364737.0, 91842.0, 20794.0, 6267.0, 2461.0, 1094.0, 609.0, 372.0, 222.0, 133.0, 115.0, 67.0, 35.0, 33.0, 16.0, 18.0, 12.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.33984375, -3.2208251953125, -3.101806640625, -2.9827880859375, -2.86376953125, -2.7447509765625, -2.625732421875, -2.5067138671875, -2.3876953125, -2.2686767578125, -2.149658203125, -2.0306396484375, -1.91162109375, -1.7926025390625, -1.673583984375, -1.5545654296875, -1.435546875, -1.3165283203125, -1.197509765625, -1.0784912109375, -0.95947265625, -0.8404541015625, -0.721435546875, -0.6024169921875, -0.4833984375, -0.3643798828125, -0.245361328125, -0.1263427734375, -0.00732421875, 0.1116943359375, 0.230712890625, 0.3497314453125, 0.46875, 0.5877685546875, 0.706787109375, 0.8258056640625, 0.94482421875, 1.0638427734375, 1.182861328125, 1.3018798828125, 1.4208984375, 1.5399169921875, 1.658935546875, 1.7779541015625, 1.89697265625, 2.0159912109375, 2.135009765625, 2.2540283203125, 2.373046875, 2.4920654296875, 2.611083984375, 2.7301025390625, 2.84912109375, 2.9681396484375, 3.087158203125, 3.2061767578125, 3.3251953125, 3.4442138671875, 3.563232421875, 3.6822509765625, 3.80126953125, 3.9202880859375, 4.039306640625, 4.1583251953125, 4.27734375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 13.0, 30.0, 40.0, 75.0, 157.0, 219.0, 199.0, 119.0, 59.0, 30.0, 21.0, 9.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.55130004882812, -118.57617950439453, -115.60105895996094, -112.62593841552734, -109.65081787109375, -106.67569732666016, -103.70057678222656, -100.7254638671875, -97.75033569335938, -94.77521514892578, -91.80009460449219, -88.8249740600586, -85.849853515625, -82.8747329711914, -79.89961242675781, -76.92449951171875, -73.94937896728516, -70.97425842285156, -67.99913787841797, -65.02401733398438, -62.04889678955078, -59.07377624511719, -56.09865951538086, -53.123538970947266, -50.14841842651367, -47.17329788208008, -44.198177337646484, -41.223060607910156, -38.24794006347656, -35.27281951904297, -32.297698974609375, -29.32257843017578, -26.347457885742188, -23.372337341308594, -20.397216796875, -17.42209815979004, -14.446977615356445, -11.471857070922852, -8.49673843383789, -5.521617889404297, -2.546497344970703, 0.4286227226257324, 3.403742790222168, 6.378862380981445, 9.353982925415039, 12.329103469848633, 15.304222106933594, 18.279342651367188, 21.25446319580078, 24.229583740234375, 27.20470428466797, 30.17982292175293, 33.154945373535156, 36.13006591796875, 39.10518264770508, 42.08030319213867, 45.055423736572266, 48.03054428100586, 51.00566482543945, 53.98078155517578, 56.955902099609375, 59.93102264404297, 62.90614318847656, 65.88126373291016, 68.85638427734375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 6.0, 10.0, 21.0, 15.0, 17.0, 21.0, 30.0, 37.0, 37.0, 39.0, 49.0, 47.0, 56.0, 61.0, 51.0, 59.0, 54.0, 45.0, 48.0, 49.0, 35.0, 29.0, 37.0, 26.0, 27.0, 22.0, 17.0, 14.0, 8.0, 9.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.20960998535156, -87.64225006103516, -85.07489776611328, -82.50753784179688, -79.940185546875, -77.3728256225586, -74.80546569824219, -72.23811340332031, -69.6707534790039, -67.1033935546875, -64.53604125976562, -61.96868133544922, -59.40132522583008, -56.83396911621094, -54.2666130065918, -51.699256896972656, -49.131900787353516, -46.564544677734375, -43.997188568115234, -41.429832458496094, -38.86247253417969, -36.29511642456055, -33.727760314941406, -31.160402297973633, -28.593046188354492, -26.02569007873535, -23.458332061767578, -20.890975952148438, -18.323619842529297, -15.756261825561523, -13.188905715942383, -10.62154769897461, -8.054191589355469, -5.486834526062012, -2.919477939605713, -0.35212135314941406, 2.215235710144043, 4.7825927734375, 7.349948883056641, 9.917306900024414, 12.484663009643555, 15.052020072937012, 17.61937713623047, 20.18673324584961, 22.75408935546875, 25.321447372436523, 27.888803482055664, 30.456161499023438, 33.02351760864258, 35.59087371826172, 38.15822982788086, 40.7255859375, 43.292945861816406, 45.86030197143555, 48.42765808105469, 50.995018005371094, 53.56237030029297, 56.12972640991211, 58.69708251953125, 61.264442443847656, 63.8317985534668, 66.39915466308594, 68.96650695800781, 71.53386688232422, 74.10122680664062]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 5.0, 9.0, 10.0, 20.0, 22.0, 21.0, 32.0, 36.0, 41.0, 61.0, 98.0, 137.0, 200.0, 308.0, 554.0, 1366.0, 4315.0, 1019026.0, 15786.0, 3764.0, 1185.0, 535.0, 284.0, 200.0, 129.0, 107.0, 73.0, 56.0, 41.0, 27.0, 21.0, 17.0, 8.0, 11.0, 7.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.108352661132812, -22.361698150634766, -21.61504364013672, -20.86838722229004, -20.121732711791992, -19.375078201293945, -18.628421783447266, -17.88176727294922, -17.135112762451172, -16.388458251953125, -15.641802787780762, -14.895147323608398, -14.148492813110352, -13.401838302612305, -12.655182838439941, -11.908527374267578, -11.161872863769531, -10.415218353271484, -9.668562889099121, -8.921907424926758, -8.175252914428711, -7.428597927093506, -6.681942939758301, -5.935287952423096, -5.188632965087891, -4.4419779777526855, -3.6953229904174805, -2.9486680030822754, -2.2020130157470703, -1.4553580284118652, -0.7087030410766602, 0.03795194625854492, 0.78460693359375, 1.531261920928955, 2.27791690826416, 3.0245718955993652, 3.7712268829345703, 4.517881870269775, 5.2645368576049805, 6.0111918449401855, 6.757846832275391, 7.504501819610596, 8.2511568069458, 8.997812271118164, 9.744466781616211, 10.491121292114258, 11.237776756286621, 11.984432220458984, 12.731086730957031, 13.477741241455078, 14.224396705627441, 14.971052169799805, 15.717706680297852, 16.4643611907959, 17.211017608642578, 17.957672119140625, 18.704326629638672, 19.45098114013672, 20.197635650634766, 20.944292068481445, 21.690946578979492, 22.43760108947754, 23.18425750732422, 23.930912017822266, 24.677566528320312]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 12.0, 39.0, 815.0, 51461460.0, 759.0, 43.0, 10.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1185.8385009765625, -1158.567626953125, -1131.296630859375, -1104.0257568359375, -1076.7548828125, -1049.48388671875, -1022.2130126953125, -994.942138671875, -967.6712036132812, -940.4002685546875, -913.12939453125, -885.8584594726562, -858.5875244140625, -831.316650390625, -804.0457153320312, -776.7747802734375, -749.50390625, -722.2329711914062, -694.9620971679688, -667.691162109375, -640.4202270507812, -613.1493530273438, -585.87841796875, -558.6075439453125, -531.3365478515625, -504.0656433105469, -476.7947082519531, -449.5238037109375, -422.2528991699219, -394.98199462890625, -367.7110595703125, -340.4401550292969, -313.16925048828125, -285.8983459472656, -258.6274108886719, -231.35650634765625, -204.08560180664062, -176.81468200683594, -149.54376220703125, -122.27285766601562, -95.00193786621094, -67.73102569580078, -40.46010971069336, -13.189193725585938, 14.081718444824219, 41.352630615234375, 68.62355041503906, 95.89445495605469, 123.16537475585938, 150.43629455566406, 177.7071990966797, 204.97811889648438, 232.2490234375, 259.51995849609375, 286.7908630371094, 314.061767578125, 341.33270263671875, 368.6036071777344, 395.8745422363281, 423.14544677734375, 450.4163513183594, 477.687255859375, 504.95819091796875, 532.2291259765625, 559.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 6.0, 4.0, 13.0, 10.0, 18.0, 25.0, 27.0, 40.0, 57.0, 62.0, 102.0, 95.0, 105.0, 75.0, 70.0, 47.0, 50.0, 36.0, 26.0, 24.0, 12.0, 12.0, 13.0, 7.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.205787658691406, -40.80736541748047, -39.40894317626953, -38.010520935058594, -36.61209487915039, -35.21367263793945, -33.815250396728516, -32.41682815551758, -31.018404006958008, -29.61998176574707, -28.2215576171875, -26.823135375976562, -25.424713134765625, -24.026288986206055, -22.627866744995117, -21.229442596435547, -19.83102035522461, -18.432598114013672, -17.0341739654541, -15.635751724243164, -14.23732852935791, -12.838905334472656, -11.440483093261719, -10.042059898376465, -8.643636703491211, -7.245213508605957, -5.846790790557861, -4.448368072509766, -3.0499448776245117, -1.6515216827392578, -0.2530994415283203, 1.1453237533569336, 2.543750762939453, 3.942173719406128, 5.340596675872803, 6.739019393920898, 8.137442588806152, 9.535865783691406, 10.934288024902344, 12.332711219787598, 13.731134414672852, 15.129557609558105, 16.52798080444336, 17.926403045654297, 19.324825286865234, 20.723249435424805, 22.121671676635742, 23.520095825195312, 24.91851806640625, 26.316940307617188, 27.715364456176758, 29.113786697387695, 30.512210845947266, 31.910633087158203, 33.30905532836914, 34.70747756958008, 36.10590362548828, 37.50432586669922, 38.902748107910156, 40.301170349121094, 41.6995964050293, 43.098018646240234, 44.49644088745117, 45.89486312866211, 47.29328536987305]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 7.0, 10.0, 6.0, 8.0, 18.0, 26.0, 19.0, 15.0, 27.0, 24.0, 26.0, 20.0, 41.0, 32.0, 46.0, 38.0, 51.0, 48.0, 47.0, 49.0, 36.0, 42.0, 40.0, 32.0, 35.0, 23.0, 24.0, 31.0, 28.0, 18.0, 31.0, 25.0, 16.0, 9.0, 8.0, 13.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.257793426513672, -30.28750228881836, -29.317211151123047, -28.346920013427734, -27.376628875732422, -26.40633773803711, -25.436046600341797, -24.465755462646484, -23.495464324951172, -22.52517318725586, -21.554882049560547, -20.584590911865234, -19.614299774169922, -18.64400863647461, -17.673717498779297, -16.703426361083984, -15.733135223388672, -14.76284408569336, -13.792552947998047, -12.822261810302734, -11.851970672607422, -10.88167953491211, -9.911388397216797, -8.941097259521484, -7.970806121826172, -7.000514984130859, -6.030223846435547, -5.059932708740234, -4.089641571044922, -3.1193504333496094, -2.149059295654297, -1.1787681579589844, -0.20847702026367188, 0.7618141174316406, 1.7321052551269531, 2.7023963928222656, 3.672687530517578, 4.642978668212891, 5.613269805908203, 6.583560943603516, 7.553852081298828, 8.52414321899414, 9.494434356689453, 10.464725494384766, 11.435016632080078, 12.40530776977539, 13.375598907470703, 14.345890045166016, 15.316181182861328, 16.28647232055664, 17.256763458251953, 18.227054595947266, 19.197345733642578, 20.16763687133789, 21.137928009033203, 22.108219146728516, 23.078510284423828, 24.04880142211914, 25.019092559814453, 25.989383697509766, 26.959674835205078, 27.92996597290039, 28.900257110595703, 29.870548248291016, 30.840839385986328]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 2.0, 7.0, 3.0, 6.0, 10.0, 16.0, 22.0, 20.0, 30.0, 48.0, 69.0, 98.0, 122.0, 212.0, 322.0, 385.0, 543.0, 809.0, 1267.0, 1853.0, 2994.0, 4792.0, 7865.0, 14412.0, 30166.0, 84028.0, 421860.0, 3237872.0, 255817.0, 63965.0, 27105.0, 14180.0, 8289.0, 5122.0, 3325.0, 2088.0, 1402.0, 1012.0, 713.0, 431.0, 278.0, 207.0, 155.0, 98.0, 69.0, 51.0, 50.0, 30.0, 20.0, 16.0, 12.0, 10.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8623046875, -1.8010406494140625, -1.739776611328125, -1.6785125732421875, -1.61724853515625, -1.5559844970703125, -1.494720458984375, -1.4334564208984375, -1.3721923828125, -1.3109283447265625, -1.249664306640625, -1.1884002685546875, -1.12713623046875, -1.0658721923828125, -1.004608154296875, -0.9433441162109375, -0.882080078125, -0.8208160400390625, -0.759552001953125, -0.6982879638671875, -0.63702392578125, -0.5757598876953125, -0.514495849609375, -0.4532318115234375, -0.3919677734375, -0.3307037353515625, -0.269439697265625, -0.2081756591796875, -0.14691162109375, -0.0856475830078125, -0.024383544921875, 0.0368804931640625, 0.09814453125, 0.1594085693359375, 0.220672607421875, 0.2819366455078125, 0.34320068359375, 0.4044647216796875, 0.465728759765625, 0.5269927978515625, 0.5882568359375, 0.6495208740234375, 0.710784912109375, 0.7720489501953125, 0.83331298828125, 0.8945770263671875, 0.955841064453125, 1.0171051025390625, 1.078369140625, 1.1396331787109375, 1.200897216796875, 1.2621612548828125, 1.32342529296875, 1.3846893310546875, 1.445953369140625, 1.5072174072265625, 1.5684814453125, 1.6297454833984375, 1.691009521484375, 1.7522735595703125, 1.81353759765625, 1.8748016357421875, 1.936065673828125, 1.9973297119140625, 2.05859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 1.0, 7.0, 6.0, 7.0, 14.0, 18.0, 31.0, 46.0, 67.0, 102.0, 122.0, 129.0, 136.0, 97.0, 69.0, 41.0, 24.0, 15.0, 12.0, 14.0, 5.0, 6.0, 8.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1561279296875, -0.15026283264160156, -0.14439773559570312, -0.1385326385498047, -0.13266754150390625, -0.1268024444580078, -0.12093734741210938, -0.11507225036621094, -0.1092071533203125, -0.10334205627441406, -0.09747695922851562, -0.09161186218261719, -0.08574676513671875, -0.07988166809082031, -0.07401657104492188, -0.06815147399902344, -0.062286376953125, -0.05642127990722656, -0.050556182861328125, -0.04469108581542969, -0.03882598876953125, -0.03296089172363281, -0.027095794677734375, -0.021230697631835938, -0.0153656005859375, -0.009500503540039062, -0.003635406494140625, 0.0022296905517578125, 0.00809478759765625, 0.013959884643554688, 0.019824981689453125, 0.025690078735351562, 0.03155517578125, 0.03742027282714844, 0.043285369873046875, 0.04915046691894531, 0.05501556396484375, 0.06088066101074219, 0.06674575805664062, 0.07261085510253906, 0.0784759521484375, 0.08434104919433594, 0.09020614624023438, 0.09607124328613281, 0.10193634033203125, 0.10780143737792969, 0.11366653442382812, 0.11953163146972656, 0.125396728515625, 0.13126182556152344, 0.13712692260742188, 0.1429920196533203, 0.14885711669921875, 0.1547222137451172, 0.16058731079101562, 0.16645240783691406, 0.1723175048828125, 0.17818260192871094, 0.18404769897460938, 0.1899127960205078, 0.19577789306640625, 0.2016429901123047, 0.20750808715820312, 0.21337318420410156, 0.21923828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 10.0, 19.0, 27.0, 26.0, 47.0, 83.0, 96.0, 141.0, 256.0, 350.0, 597.0, 904.0, 1399.0, 2494.0, 4217.0, 7273.0, 13480.0, 26534.0, 54008.0, 123275.0, 318295.0, 1823630.0, 1299407.0, 296787.0, 115022.0, 51039.0, 24777.0, 12754.0, 7012.0, 4104.0, 2406.0, 1395.0, 856.0, 546.0, 329.0, 220.0, 159.0, 97.0, 79.0, 37.0, 26.0, 25.0, 11.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.337890625, -1.2960357666015625, -1.254180908203125, -1.2123260498046875, -1.17047119140625, -1.1286163330078125, -1.086761474609375, -1.0449066162109375, -1.0030517578125, -0.9611968994140625, -0.919342041015625, -0.8774871826171875, -0.83563232421875, -0.7937774658203125, -0.751922607421875, -0.7100677490234375, -0.668212890625, -0.6263580322265625, -0.584503173828125, -0.5426483154296875, -0.50079345703125, -0.4589385986328125, -0.417083740234375, -0.3752288818359375, -0.3333740234375, -0.2915191650390625, -0.249664306640625, -0.2078094482421875, -0.16595458984375, -0.1240997314453125, -0.082244873046875, -0.0403900146484375, 0.00146484375, 0.0433197021484375, 0.085174560546875, 0.1270294189453125, 0.16888427734375, 0.2107391357421875, 0.252593994140625, 0.2944488525390625, 0.3363037109375, 0.3781585693359375, 0.420013427734375, 0.4618682861328125, 0.50372314453125, 0.5455780029296875, 0.587432861328125, 0.6292877197265625, 0.671142578125, 0.7129974365234375, 0.754852294921875, 0.7967071533203125, 0.83856201171875, 0.8804168701171875, 0.922271728515625, 0.9641265869140625, 1.0059814453125, 1.0478363037109375, 1.089691162109375, 1.1315460205078125, 1.17340087890625, 1.2152557373046875, 1.257110595703125, 1.2989654541015625, 1.3408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 10.0, 15.0, 21.0, 15.0, 18.0, 25.0, 46.0, 56.0, 49.0, 89.0, 115.0, 124.0, 153.0, 214.0, 324.0, 608.0, 800.0, 351.0, 252.0, 160.0, 148.0, 126.0, 93.0, 63.0, 52.0, 29.0, 23.0, 18.0, 23.0, 9.0, 8.0, 10.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32275390625, -0.30989837646484375, -0.2970428466796875, -0.28418731689453125, -0.271331787109375, -0.25847625732421875, -0.2456207275390625, -0.23276519775390625, -0.21990966796875, -0.20705413818359375, -0.1941986083984375, -0.18134307861328125, -0.168487548828125, -0.15563201904296875, -0.1427764892578125, -0.12992095947265625, -0.1170654296875, -0.10420989990234375, -0.0913543701171875, -0.07849884033203125, -0.065643310546875, -0.05278778076171875, -0.0399322509765625, -0.02707672119140625, -0.01422119140625, -0.00136566162109375, 0.0114898681640625, 0.02434539794921875, 0.037200927734375, 0.05005645751953125, 0.0629119873046875, 0.07576751708984375, 0.088623046875, 0.10147857666015625, 0.1143341064453125, 0.12718963623046875, 0.140045166015625, 0.15290069580078125, 0.1657562255859375, 0.17861175537109375, 0.19146728515625, 0.20432281494140625, 0.2171783447265625, 0.23003387451171875, 0.242889404296875, 0.25574493408203125, 0.2686004638671875, 0.28145599365234375, 0.2943115234375, 0.30716705322265625, 0.3200225830078125, 0.33287811279296875, 0.345733642578125, 0.35858917236328125, 0.3714447021484375, 0.38430023193359375, 0.39715576171875, 0.41001129150390625, 0.4228668212890625, 0.43572235107421875, 0.448577880859375, 0.46143341064453125, 0.4742889404296875, 0.48714447021484375, 0.5]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 2.0, 2.0, 4.0, 5.0, 13.0, 9.0, 27.0, 24.0, 49.0, 65.0, 95.0, 132.0, 125.0, 141.0, 99.0, 63.0, 41.0, 34.0, 27.0, 6.0, 15.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.102021217346191, -5.895606517791748, -5.689192295074463, -5.4827775955200195, -5.276363372802734, -5.069948673248291, -4.863533973693848, -4.6571197509765625, -4.450705051422119, -4.244290351867676, -4.037876129150391, -3.8314614295959473, -3.625046968460083, -3.4186325073242188, -3.2122178077697754, -3.005803346633911, -2.799388885498047, -2.5929744243621826, -2.3865599632263184, -2.180145263671875, -1.9737308025360107, -1.7673163414001465, -1.5609017610549927, -1.3544871807098389, -1.1480727195739746, -0.9416581988334656, -0.7352436780929565, -0.5288291573524475, -0.3224146366119385, -0.11600017547607422, 0.09041440486907959, 0.2968289852142334, 0.5032439231872559, 0.7096584439277649, 0.9160729646682739, 1.1224875450134277, 1.328902006149292, 1.5353164672851562, 1.74173104763031, 1.9481456279754639, 2.154560089111328, 2.3609745502471924, 2.5673890113830566, 2.7738037109375, 2.9802181720733643, 3.1866326332092285, 3.393047332763672, 3.599461793899536, 3.8058762550354004, 4.012290954589844, 4.218705177307129, 4.425119876861572, 4.631534576416016, 4.837948799133301, 5.044363498687744, 5.2507781982421875, 5.457192420959473, 5.663607120513916, 5.870021343231201, 6.0764360427856445, 6.28285026550293, 6.489264965057373, 6.695679664611816, 6.902093887329102, 7.108508586883545]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 9.0, 9.0, 9.0, 13.0, 10.0, 14.0, 12.0, 17.0, 26.0, 29.0, 21.0, 33.0, 35.0, 34.0, 34.0, 38.0, 41.0, 41.0, 35.0, 42.0, 44.0, 35.0, 39.0, 35.0, 30.0, 41.0, 35.0, 29.0, 28.0, 24.0, 27.0, 17.0, 22.0, 18.0, 15.0, 15.0, 8.0, 6.0, 14.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.78509521484375, -1.728391408920288, -1.6716874837875366, -1.6149836778640747, -1.5582798719406128, -1.5015759468078613, -1.4448721408843994, -1.3881683349609375, -1.331464409828186, -1.2747606039047241, -1.2180566787719727, -1.1613528728485107, -1.1046490669250488, -1.0479451417922974, -0.9912413358688354, -0.9345374703407288, -0.8778336644172668, -0.8211297988891602, -0.7644259929656982, -0.7077221274375916, -0.6510182619094849, -0.594314455986023, -0.5376105904579163, -0.48090672492980957, -0.42420288920402527, -0.36749905347824097, -0.3107951879501343, -0.25409135222435, -0.19738750159740448, -0.14068365097045898, -0.08397981524467468, -0.027275949716567993, 0.02942788600921631, 0.0861317366361618, 0.1428355872631073, 0.1995394229888916, 0.2562432885169983, 0.3129471242427826, 0.3696509599685669, 0.4263548254966736, 0.4830586612224579, 0.5397624969482422, 0.5964663624763489, 0.6531702280044556, 0.7098740339279175, 0.7665778994560242, 0.8232817649841309, 0.8799855709075928, 0.9366894364356995, 0.9933933019638062, 1.050097107887268, 1.1068010330200195, 1.1635048389434814, 1.2202086448669434, 1.2769124507904053, 1.3336163759231567, 1.3903201818466187, 1.4470239877700806, 1.503727912902832, 1.560431718826294, 1.6171355247497559, 1.6738394498825073, 1.7305432558059692, 1.7872471809387207, 1.8439509868621826]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 10.0, 13.0, 21.0, 28.0, 52.0, 52.0, 69.0, 96.0, 153.0, 199.0, 314.0, 482.0, 786.0, 1205.0, 1998.0, 3359.0, 6246.0, 12596.0, 29412.0, 94037.0, 397812.0, 360344.0, 85596.0, 27386.0, 11828.0, 5886.0, 3204.0, 1962.0, 1198.0, 735.0, 445.0, 277.0, 208.0, 151.0, 90.0, 73.0, 56.0, 38.0, 31.0, 31.0, 13.0, 10.0, 9.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.3388671875, -1.298248291015625, -1.25762939453125, -1.217010498046875, -1.1763916015625, -1.135772705078125, -1.09515380859375, -1.054534912109375, -1.013916015625, -0.973297119140625, -0.93267822265625, -0.892059326171875, -0.8514404296875, -0.810821533203125, -0.77020263671875, -0.729583740234375, -0.68896484375, -0.648345947265625, -0.60772705078125, -0.567108154296875, -0.5264892578125, -0.485870361328125, -0.44525146484375, -0.404632568359375, -0.364013671875, -0.323394775390625, -0.28277587890625, -0.242156982421875, -0.2015380859375, -0.160919189453125, -0.12030029296875, -0.079681396484375, -0.0390625, 0.001556396484375, 0.04217529296875, 0.082794189453125, 0.1234130859375, 0.164031982421875, 0.20465087890625, 0.245269775390625, 0.285888671875, 0.326507568359375, 0.36712646484375, 0.407745361328125, 0.4483642578125, 0.488983154296875, 0.52960205078125, 0.570220947265625, 0.61083984375, 0.651458740234375, 0.69207763671875, 0.732696533203125, 0.7733154296875, 0.813934326171875, 0.85455322265625, 0.895172119140625, 0.935791015625, 0.976409912109375, 1.01702880859375, 1.057647705078125, 1.0982666015625, 1.138885498046875, 1.17950439453125, 1.220123291015625, 1.2607421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 10.0, 10.0, 16.0, 11.0, 33.0, 34.0, 55.0, 47.0, 86.0, 91.0, 94.0, 107.0, 95.0, 91.0, 54.0, 38.0, 32.0, 18.0, 9.0, 15.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.14820289611816406, -0.14271926879882812, -0.1372356414794922, -0.13175201416015625, -0.1262683868408203, -0.12078475952148438, -0.11530113220214844, -0.1098175048828125, -0.10433387756347656, -0.09885025024414062, -0.09336662292480469, -0.08788299560546875, -0.08239936828613281, -0.07691574096679688, -0.07143211364746094, -0.065948486328125, -0.06046485900878906, -0.054981231689453125, -0.04949760437011719, -0.04401397705078125, -0.03853034973144531, -0.033046722412109375, -0.027563095092773438, -0.0220794677734375, -0.016595840454101562, -0.011112213134765625, -0.0056285858154296875, -0.00014495849609375, 0.0053386688232421875, 0.010822296142578125, 0.016305923461914062, 0.02178955078125, 0.027273178100585938, 0.032756805419921875, 0.03824043273925781, 0.04372406005859375, 0.04920768737792969, 0.054691314697265625, 0.06017494201660156, 0.0656585693359375, 0.07114219665527344, 0.07662582397460938, 0.08210945129394531, 0.08759307861328125, 0.09307670593261719, 0.09856033325195312, 0.10404396057128906, 0.109527587890625, 0.11501121520996094, 0.12049484252929688, 0.1259784698486328, 0.13146209716796875, 0.1369457244873047, 0.14242935180664062, 0.14791297912597656, 0.1533966064453125, 0.15888023376464844, 0.16436386108398438, 0.1698474884033203, 0.17533111572265625, 0.1808147430419922, 0.18629837036132812, 0.19178199768066406, 0.197265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 7.0, 11.0, 14.0, 21.0, 35.0, 39.0, 44.0, 78.0, 123.0, 194.0, 279.0, 379.0, 612.0, 920.0, 1372.0, 2262.0, 3673.0, 6282.0, 11588.0, 24315.0, 61825.0, 200610.0, 447426.0, 180753.0, 56566.0, 22656.0, 10736.0, 6036.0, 3476.0, 2180.0, 1387.0, 854.0, 587.0, 378.0, 255.0, 162.0, 133.0, 80.0, 63.0, 39.0, 28.0, 20.0, 13.0, 17.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8902053833007812, -0.8609771728515625, -0.8317489624023438, -0.802520751953125, -0.7732925415039062, -0.7440643310546875, -0.7148361206054688, -0.68560791015625, -0.6563796997070312, -0.6271514892578125, -0.5979232788085938, -0.568695068359375, -0.5394668579101562, -0.5102386474609375, -0.48101043701171875, -0.4517822265625, -0.42255401611328125, -0.3933258056640625, -0.36409759521484375, -0.334869384765625, -0.30564117431640625, -0.2764129638671875, -0.24718475341796875, -0.21795654296875, -0.18872833251953125, -0.1595001220703125, -0.13027191162109375, -0.101043701171875, -0.07181549072265625, -0.0425872802734375, -0.01335906982421875, 0.015869140625, 0.04509735107421875, 0.0743255615234375, 0.10355377197265625, 0.132781982421875, 0.16201019287109375, 0.1912384033203125, 0.22046661376953125, 0.24969482421875, 0.27892303466796875, 0.3081512451171875, 0.33737945556640625, 0.366607666015625, 0.39583587646484375, 0.4250640869140625, 0.45429229736328125, 0.4835205078125, 0.5127487182617188, 0.5419769287109375, 0.5712051391601562, 0.600433349609375, 0.6296615600585938, 0.6588897705078125, 0.6881179809570312, 0.71734619140625, 0.7465744018554688, 0.7758026123046875, 0.8050308227539062, 0.834259033203125, 0.8634872436523438, 0.8927154541015625, 0.9219436645507812, 0.951171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 11.0, 12.0, 10.0, 16.0, 16.0, 17.0, 23.0, 24.0, 27.0, 33.0, 33.0, 44.0, 28.0, 37.0, 49.0, 37.0, 48.0, 42.0, 40.0, 43.0, 50.0, 42.0, 34.0, 32.0, 36.0, 29.0, 25.0, 23.0, 10.0, 17.0, 14.0, 18.0, 9.0, 10.0, 10.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.666015625, -0.6439437866210938, -0.6218719482421875, -0.5998001098632812, -0.577728271484375, -0.5556564331054688, -0.5335845947265625, -0.5115127563476562, -0.48944091796875, -0.46736907958984375, -0.4452972412109375, -0.42322540283203125, -0.401153564453125, -0.37908172607421875, -0.3570098876953125, -0.33493804931640625, -0.3128662109375, -0.29079437255859375, -0.2687225341796875, -0.24665069580078125, -0.224578857421875, -0.20250701904296875, -0.1804351806640625, -0.15836334228515625, -0.13629150390625, -0.11421966552734375, -0.0921478271484375, -0.07007598876953125, -0.048004150390625, -0.02593231201171875, -0.0038604736328125, 0.01821136474609375, 0.040283203125, 0.06235504150390625, 0.0844268798828125, 0.10649871826171875, 0.128570556640625, 0.15064239501953125, 0.1727142333984375, 0.19478607177734375, 0.21685791015625, 0.23892974853515625, 0.2610015869140625, 0.28307342529296875, 0.305145263671875, 0.32721710205078125, 0.3492889404296875, 0.37136077880859375, 0.3934326171875, 0.41550445556640625, 0.4375762939453125, 0.45964813232421875, 0.481719970703125, 0.5037918090820312, 0.5258636474609375, 0.5479354858398438, 0.57000732421875, 0.5920791625976562, 0.6141510009765625, 0.6362228393554688, 0.658294677734375, 0.6803665161132812, 0.7024383544921875, 0.7245101928710938, 0.74658203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 10.0, 12.0, 27.0, 41.0, 60.0, 102.0, 162.0, 284.0, 515.0, 1075.0, 2299.0, 5660.0, 17381.0, 85830.0, 713634.0, 180833.0, 26803.0, 7935.0, 2945.0, 1355.0, 679.0, 375.0, 223.0, 122.0, 73.0, 30.0, 33.0, 19.0, 11.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.041015625, -2.94183349609375, -2.8426513671875, -2.74346923828125, -2.644287109375, -2.54510498046875, -2.4459228515625, -2.34674072265625, -2.24755859375, -2.14837646484375, -2.0491943359375, -1.95001220703125, -1.850830078125, -1.75164794921875, -1.6524658203125, -1.55328369140625, -1.4541015625, -1.35491943359375, -1.2557373046875, -1.15655517578125, -1.057373046875, -0.95819091796875, -0.8590087890625, -0.75982666015625, -0.66064453125, -0.56146240234375, -0.4622802734375, -0.36309814453125, -0.263916015625, -0.16473388671875, -0.0655517578125, 0.03363037109375, 0.1328125, 0.23199462890625, 0.3311767578125, 0.43035888671875, 0.529541015625, 0.62872314453125, 0.7279052734375, 0.82708740234375, 0.92626953125, 1.02545166015625, 1.1246337890625, 1.22381591796875, 1.322998046875, 1.42218017578125, 1.5213623046875, 1.62054443359375, 1.7197265625, 1.81890869140625, 1.9180908203125, 2.01727294921875, 2.116455078125, 2.21563720703125, 2.3148193359375, 2.41400146484375, 2.51318359375, 2.61236572265625, 2.7115478515625, 2.81072998046875, 2.909912109375, 3.00909423828125, 3.1082763671875, 3.20745849609375, 3.306640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 2.0, 6.0, 9.0, 13.0, 21.0, 21.0, 29.0, 38.0, 53.0, 54.0, 62.0, 96.0, 104.0, 83.0, 79.0, 69.0, 61.0, 45.0, 29.0, 25.0, 16.0, 15.0, 15.0, 4.0, 8.0, 7.0, 10.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004897117614746094, -0.00047555938363075256, -0.00046140700578689575, -0.00044725462794303894, -0.00043310225009918213, -0.0004189498722553253, -0.0004047974944114685, -0.0003906451165676117, -0.0003764927387237549, -0.00036234036087989807, -0.00034818798303604126, -0.00033403560519218445, -0.00031988322734832764, -0.0003057308495044708, -0.000291578471660614, -0.0002774260938167572, -0.0002632737159729004, -0.0002491213381290436, -0.00023496896028518677, -0.00022081658244132996, -0.00020666420459747314, -0.00019251182675361633, -0.00017835944890975952, -0.0001642070710659027, -0.0001500546932220459, -0.0001359023153781891, -0.00012174993753433228, -0.00010759755969047546, -9.344518184661865e-05, -7.929280400276184e-05, -6.514042615890503e-05, -5.098804831504822e-05, -3.6835670471191406e-05, -2.2683292627334595e-05, -8.530914783477783e-06, 5.621463060379028e-06, 1.977384090423584e-05, 3.392621874809265e-05, 4.807859659194946e-05, 6.223097443580627e-05, 7.638335227966309e-05, 9.05357301235199e-05, 0.00010468810796737671, 0.00011884048581123352, 0.00013299286365509033, 0.00014714524149894714, 0.00016129761934280396, 0.00017544999718666077, 0.00018960237503051758, 0.0002037547528743744, 0.0002179071307182312, 0.000232059508562088, 0.0002462118864059448, 0.00026036426424980164, 0.00027451664209365845, 0.00028866901993751526, 0.00030282139778137207, 0.0003169737756252289, 0.0003311261534690857, 0.0003452785313129425, 0.0003594309091567993, 0.00037358328700065613, 0.00038773566484451294, 0.00040188804268836975, 0.00041604042053222656]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 10.0, 24.0, 34.0, 57.0, 53.0, 106.0, 139.0, 182.0, 339.0, 532.0, 899.0, 1411.0, 2421.0, 4382.0, 8224.0, 17956.0, 46188.0, 173311.0, 525174.0, 181551.0, 48079.0, 18095.0, 8555.0, 4433.0, 2477.0, 1464.0, 868.0, 543.0, 355.0, 228.0, 138.0, 106.0, 62.0, 43.0, 40.0, 19.0, 12.0, 9.0, 6.0, 8.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8408203125, -1.78240966796875, -1.7239990234375, -1.66558837890625, -1.607177734375, -1.54876708984375, -1.4903564453125, -1.43194580078125, -1.37353515625, -1.31512451171875, -1.2567138671875, -1.19830322265625, -1.139892578125, -1.08148193359375, -1.0230712890625, -0.96466064453125, -0.90625, -0.84783935546875, -0.7894287109375, -0.73101806640625, -0.672607421875, -0.61419677734375, -0.5557861328125, -0.49737548828125, -0.43896484375, -0.38055419921875, -0.3221435546875, -0.26373291015625, -0.205322265625, -0.14691162109375, -0.0885009765625, -0.03009033203125, 0.0283203125, 0.08673095703125, 0.1451416015625, 0.20355224609375, 0.261962890625, 0.32037353515625, 0.3787841796875, 0.43719482421875, 0.49560546875, 0.55401611328125, 0.6124267578125, 0.67083740234375, 0.729248046875, 0.78765869140625, 0.8460693359375, 0.90447998046875, 0.962890625, 1.02130126953125, 1.0797119140625, 1.13812255859375, 1.196533203125, 1.25494384765625, 1.3133544921875, 1.37176513671875, 1.43017578125, 1.48858642578125, 1.5469970703125, 1.60540771484375, 1.663818359375, 1.72222900390625, 1.7806396484375, 1.83905029296875, 1.8974609375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 6.0, 11.0, 9.0, 14.0, 24.0, 25.0, 33.0, 32.0, 46.0, 43.0, 54.0, 71.0, 65.0, 76.0, 61.0, 75.0, 63.0, 54.0, 46.0, 32.0, 40.0, 16.0, 23.0, 14.0, 8.0, 6.0, 10.0, 13.0, 4.0, 2.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8929061889648438, -0.8605194091796875, -0.8281326293945312, -0.795745849609375, -0.7633590698242188, -0.7309722900390625, -0.6985855102539062, -0.66619873046875, -0.6338119506835938, -0.6014251708984375, -0.5690383911132812, -0.536651611328125, -0.5042648315429688, -0.4718780517578125, -0.43949127197265625, -0.4071044921875, -0.37471771240234375, -0.3423309326171875, -0.30994415283203125, -0.277557373046875, -0.24517059326171875, -0.2127838134765625, -0.18039703369140625, -0.14801025390625, -0.11562347412109375, -0.0832366943359375, -0.05084991455078125, -0.018463134765625, 0.01392364501953125, 0.0463104248046875, 0.07869720458984375, 0.111083984375, 0.14347076416015625, 0.1758575439453125, 0.20824432373046875, 0.240631103515625, 0.27301788330078125, 0.3054046630859375, 0.33779144287109375, 0.37017822265625, 0.40256500244140625, 0.4349517822265625, 0.46733856201171875, 0.499725341796875, 0.5321121215820312, 0.5644989013671875, 0.5968856811523438, 0.6292724609375, 0.6616592407226562, 0.6940460205078125, 0.7264328002929688, 0.758819580078125, 0.7912063598632812, 0.8235931396484375, 0.8559799194335938, 0.88836669921875, 0.9207534790039062, 0.9531402587890625, 0.9855270385742188, 1.017913818359375, 1.0503005981445312, 1.0826873779296875, 1.1150741577148438, 1.1474609375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 12.0, 16.0, 42.0, 109.0, 326.0, 327.0, 97.0, 36.0, 20.0, 11.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.814300537109375, -48.53561019897461, -47.25691604614258, -45.97822570800781, -44.69953155517578, -43.420841217041016, -42.142147064208984, -40.86345672607422, -39.58476257324219, -38.30607223510742, -37.02737808227539, -35.748687744140625, -34.469993591308594, -33.19130325317383, -31.91261100769043, -30.63391876220703, -29.355228424072266, -28.076536178588867, -26.79784393310547, -25.51915168762207, -24.240459442138672, -22.961769104003906, -21.683076858520508, -20.40438461303711, -19.12569236755371, -17.847000122070312, -16.568307876586914, -15.289616584777832, -14.010924339294434, -12.732232093811035, -11.453540802001953, -10.174848556518555, -8.89615249633789, -7.617460250854492, -6.338768482208252, -5.060076713562012, -3.7813844680786133, -2.502692222595215, -1.2240004539489746, 0.054691314697265625, 1.333383560180664, 2.6120755672454834, 3.8907675743103027, 5.169459342956543, 6.448151588439941, 7.72684383392334, 9.005535125732422, 10.28422737121582, 11.562919616699219, 12.841611862182617, 14.120304107666016, 15.398995399475098, 16.677688598632812, 17.956378936767578, 19.235071182250977, 20.513763427734375, 21.792455673217773, 23.071147918701172, 24.34984016418457, 25.62853240966797, 26.907222747802734, 28.185916900634766, 29.46460723876953, 30.74329948425293, 32.02199172973633]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 4.0, 9.0, 14.0, 15.0, 21.0, 43.0, 83.0, 91.0, 117.0, 121.0, 140.0, 78.0, 84.0, 38.0, 24.0, 14.0, 18.0, 14.0, 6.0, 7.0, 6.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.420930862426758, -10.975160598754883, -10.529391288757324, -10.08362102508545, -9.63785171508789, -9.192081451416016, -8.74631118774414, -8.300541877746582, -7.854772090911865, -7.409002304077148, -6.963232517242432, -6.517462730407715, -6.07169246673584, -5.625923156738281, -5.180152893066406, -4.7343831062316895, -4.288613319396973, -3.842843532562256, -3.397073745727539, -2.951303720474243, -2.5055339336395264, -2.0597641468048096, -1.6139941215515137, -1.1682243347167969, -0.7224545478820801, -0.2766847014427185, 0.16908514499664307, 0.6148550510406494, 1.0606248378753662, 1.506394624710083, 1.952164649963379, 2.3979344367980957, 2.8437042236328125, 3.2894740104675293, 3.735243797302246, 4.181014060974121, 4.62678337097168, 5.072553634643555, 5.5183234214782715, 5.964093208312988, 6.409862995147705, 6.855632781982422, 7.301402568817139, 7.7471723556518555, 8.19294261932373, 8.638711929321289, 9.084482192993164, 9.530252456665039, 9.976021766662598, 10.421792030334473, 10.867561340332031, 11.313331604003906, 11.759100914001465, 12.20487117767334, 12.650640487670898, 13.096410751342773, 13.542181015014648, 13.987951278686523, 14.433720588684082, 14.879490852355957, 15.325260162353516, 15.77103042602539, 16.216800689697266, 16.66257095336914, 17.108339309692383]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 3.0, 8.0, 23.0, 21.0, 43.0, 52.0, 99.0, 203.0, 319.0, 611.0, 1203.0, 2729.0, 7168.0, 24956.0, 168418.0, 3849193.0, 107952.0, 19884.0, 6348.0, 2585.0, 1150.0, 578.0, 291.0, 171.0, 108.0, 44.0, 39.0, 20.0, 11.0, 14.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.30438232421875, -4.1673583984375, -4.03033447265625, -3.893310546875, -3.75628662109375, -3.6192626953125, -3.48223876953125, -3.34521484375, -3.20819091796875, -3.0711669921875, -2.93414306640625, -2.797119140625, -2.66009521484375, -2.5230712890625, -2.38604736328125, -2.2490234375, -2.11199951171875, -1.9749755859375, -1.83795166015625, -1.700927734375, -1.56390380859375, -1.4268798828125, -1.28985595703125, -1.15283203125, -1.01580810546875, -0.8787841796875, -0.74176025390625, -0.604736328125, -0.46771240234375, -0.3306884765625, -0.19366455078125, -0.056640625, 0.08038330078125, 0.2174072265625, 0.35443115234375, 0.491455078125, 0.62847900390625, 0.7655029296875, 0.90252685546875, 1.03955078125, 1.17657470703125, 1.3135986328125, 1.45062255859375, 1.587646484375, 1.72467041015625, 1.8616943359375, 1.99871826171875, 2.1357421875, 2.27276611328125, 2.4097900390625, 2.54681396484375, 2.683837890625, 2.82086181640625, 2.9578857421875, 3.09490966796875, 3.23193359375, 3.36895751953125, 3.5059814453125, 3.64300537109375, 3.780029296875, 3.91705322265625, 4.0540771484375, 4.19110107421875, 4.328125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 6.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 11.0, 25.0, 25.0, 28.0, 34.0, 47.0, 58.0, 69.0, 79.0, 87.0, 84.0, 101.0, 68.0, 50.0, 43.0, 28.0, 25.0, 13.0, 18.0, 14.0, 7.0, 8.0, 8.0, 5.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.145263671875, -0.1405658721923828, -0.13586807250976562, -0.13117027282714844, -0.12647247314453125, -0.12177467346191406, -0.11707687377929688, -0.11237907409667969, -0.1076812744140625, -0.10298347473144531, -0.09828567504882812, -0.09358787536621094, -0.08889007568359375, -0.08419227600097656, -0.07949447631835938, -0.07479667663574219, -0.070098876953125, -0.06540107727050781, -0.060703277587890625, -0.05600547790527344, -0.05130767822265625, -0.04660987854003906, -0.041912078857421875, -0.03721427917480469, -0.0325164794921875, -0.027818679809570312, -0.023120880126953125, -0.018423080444335938, -0.01372528076171875, -0.009027481079101562, -0.004329681396484375, 0.0003681182861328125, 0.00506591796875, 0.009763717651367188, 0.014461517333984375, 0.019159317016601562, 0.02385711669921875, 0.028554916381835938, 0.033252716064453125, 0.03795051574707031, 0.0426483154296875, 0.04734611511230469, 0.052043914794921875, 0.05674171447753906, 0.06143951416015625, 0.06613731384277344, 0.07083511352539062, 0.07553291320800781, 0.080230712890625, 0.08492851257324219, 0.08962631225585938, 0.09432411193847656, 0.09902191162109375, 0.10371971130371094, 0.10841751098632812, 0.11311531066894531, 0.1178131103515625, 0.12251091003417969, 0.12720870971679688, 0.13190650939941406, 0.13660430908203125, 0.14130210876464844, 0.14599990844726562, 0.1506977081298828, 0.1553955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 12.0, 18.0, 22.0, 48.0, 50.0, 81.0, 141.0, 245.0, 428.0, 873.0, 1798.0, 3786.0, 9328.0, 27781.0, 101831.0, 2420781.0, 1483860.0, 99125.0, 27285.0, 9360.0, 3807.0, 1673.0, 833.0, 460.0, 253.0, 146.0, 85.0, 52.0, 31.0, 27.0, 15.0, 15.0, 8.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.925872802734375, -2.82830810546875, -2.730743408203125, -2.6331787109375, -2.535614013671875, -2.43804931640625, -2.340484619140625, -2.242919921875, -2.145355224609375, -2.04779052734375, -1.950225830078125, -1.8526611328125, -1.755096435546875, -1.65753173828125, -1.559967041015625, -1.46240234375, -1.364837646484375, -1.26727294921875, -1.169708251953125, -1.0721435546875, -0.974578857421875, -0.87701416015625, -0.779449462890625, -0.681884765625, -0.584320068359375, -0.48675537109375, -0.389190673828125, -0.2916259765625, -0.194061279296875, -0.09649658203125, 0.001068115234375, 0.0986328125, 0.196197509765625, 0.29376220703125, 0.391326904296875, 0.4888916015625, 0.586456298828125, 0.68402099609375, 0.781585693359375, 0.879150390625, 0.976715087890625, 1.07427978515625, 1.171844482421875, 1.2694091796875, 1.366973876953125, 1.46453857421875, 1.562103271484375, 1.65966796875, 1.757232666015625, 1.85479736328125, 1.952362060546875, 2.0499267578125, 2.147491455078125, 2.24505615234375, 2.342620849609375, 2.440185546875, 2.537750244140625, 2.63531494140625, 2.732879638671875, 2.8304443359375, 2.928009033203125, 3.02557373046875, 3.123138427734375, 3.220703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 4.0, 18.0, 18.0, 29.0, 26.0, 31.0, 49.0, 59.0, 92.0, 144.0, 335.0, 1898.0, 671.0, 217.0, 125.0, 94.0, 61.0, 51.0, 37.0, 26.0, 24.0, 16.0, 6.0, 5.0, 12.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.446533203125, -0.43404388427734375, -0.4215545654296875, -0.40906524658203125, -0.396575927734375, -0.38408660888671875, -0.3715972900390625, -0.35910797119140625, -0.34661865234375, -0.33412933349609375, -0.3216400146484375, -0.30915069580078125, -0.296661376953125, -0.28417205810546875, -0.2716827392578125, -0.25919342041015625, -0.2467041015625, -0.23421478271484375, -0.2217254638671875, -0.20923614501953125, -0.196746826171875, -0.18425750732421875, -0.1717681884765625, -0.15927886962890625, -0.14678955078125, -0.13430023193359375, -0.1218109130859375, -0.10932159423828125, -0.096832275390625, -0.08434295654296875, -0.0718536376953125, -0.05936431884765625, -0.046875, -0.03438568115234375, -0.0218963623046875, -0.00940704345703125, 0.003082275390625, 0.01557159423828125, 0.0280609130859375, 0.04055023193359375, 0.05303955078125, 0.06552886962890625, 0.0780181884765625, 0.09050750732421875, 0.102996826171875, 0.11548614501953125, 0.1279754638671875, 0.14046478271484375, 0.1529541015625, 0.16544342041015625, 0.1779327392578125, 0.19042205810546875, 0.202911376953125, 0.21540069580078125, 0.2278900146484375, 0.24037933349609375, 0.25286865234375, 0.26535797119140625, 0.2778472900390625, 0.29033660888671875, 0.302825927734375, 0.31531524658203125, 0.3278045654296875, 0.34029388427734375, 0.352783203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 8.0, 4.0, 12.0, 12.0, 38.0, 95.0, 174.0, 263.0, 206.0, 93.0, 56.0, 21.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.254312992095947, -6.095088005065918, -5.9358625411987305, -5.776637077331543, -5.617412090301514, -5.458187103271484, -5.298961639404297, -5.139736175537109, -4.98051118850708, -4.821286201477051, -4.662060737609863, -4.502835273742676, -4.3436102867126465, -4.184385299682617, -4.02515983581543, -3.8659346103668213, -3.706709384918213, -3.5474841594696045, -3.388258934020996, -3.2290337085723877, -3.0698084831237793, -2.910583257675171, -2.7513580322265625, -2.592132806777954, -2.4329075813293457, -2.2736823558807373, -2.114457130432129, -1.9552319049835205, -1.796006679534912, -1.6367814540863037, -1.4775562286376953, -1.318331003189087, -1.1591060161590576, -0.9998807907104492, -0.8406555652618408, -0.6814303398132324, -0.522205114364624, -0.3629798889160156, -0.20375466346740723, -0.04452943801879883, 0.11469578742980957, 0.27392101287841797, 0.43314623832702637, 0.5923714637756348, 0.7515966892242432, 0.9108219146728516, 1.07004714012146, 1.2292723655700684, 1.3884975910186768, 1.5477228164672852, 1.7069480419158936, 1.866173267364502, 2.0253984928131104, 2.1846237182617188, 2.343848943710327, 2.5030741691589355, 2.662299394607544, 2.8215246200561523, 2.9807498455047607, 3.139975070953369, 3.2992002964019775, 3.458425521850586, 3.6176507472991943, 3.7768759727478027, 3.936101198196411]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 6.0, 5.0, 15.0, 7.0, 21.0, 17.0, 28.0, 23.0, 38.0, 30.0, 44.0, 47.0, 46.0, 42.0, 45.0, 67.0, 63.0, 62.0, 48.0, 51.0, 37.0, 34.0, 35.0, 31.0, 21.0, 19.0, 24.0, 17.0, 16.0, 11.0, 7.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.480839729309082, -1.4274035692214966, -1.3739674091339111, -1.3205312490463257, -1.2670950889587402, -1.2136590480804443, -1.1602227687835693, -1.1067867279052734, -1.053350567817688, -0.9999144077301025, -0.9464782476425171, -0.8930420875549316, -0.839605987071991, -0.7861698269844055, -0.7327336668968201, -0.6792975664138794, -0.6258613467216492, -0.5724251866340637, -0.5189890265464783, -0.4655528962612152, -0.41211676597595215, -0.3586806058883667, -0.30524444580078125, -0.2518083155155182, -0.19837215542793274, -0.14493601024150848, -0.09149985760450363, -0.03806370496749878, 0.015372440218925476, 0.06880858540534973, 0.12224474549293518, 0.17568087577819824, 0.2291170358657837, 0.28255319595336914, 0.3359893262386322, 0.38942548632621765, 0.4428616166114807, 0.49629777669906616, 0.5497339367866516, 0.6031700372695923, 0.6566061973571777, 0.7100423574447632, 0.7634785175323486, 0.8169146776199341, 0.8703507781028748, 0.9237869381904602, 0.9772230982780457, 1.0306591987609863, 1.0840954780578613, 1.1375316381454468, 1.1909677982330322, 1.2444039583206177, 1.2978401184082031, 1.351276159286499, 1.404712438583374, 1.45814847946167, 1.5115846395492554, 1.5650207996368408, 1.6184569597244263, 1.6718931198120117, 1.7253292798995972, 1.7787654399871826, 1.8322014808654785, 1.885637640953064, 1.9390738010406494]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 12.0, 26.0, 21.0, 42.0, 66.0, 92.0, 118.0, 183.0, 256.0, 430.0, 666.0, 1110.0, 1791.0, 2879.0, 5138.0, 9725.0, 19532.0, 42280.0, 102596.0, 256268.0, 338420.0, 151631.0, 59807.0, 26251.0, 12777.0, 6805.0, 3688.0, 2206.0, 1347.0, 853.0, 459.0, 334.0, 219.0, 173.0, 115.0, 71.0, 46.0, 42.0, 15.0, 13.0, 7.0, 6.0, 2.0, 5.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1730804443359375, -1.134246826171875, -1.0954132080078125, -1.05657958984375, -1.0177459716796875, -0.978912353515625, -0.9400787353515625, -0.9012451171875, -0.8624114990234375, -0.823577880859375, -0.7847442626953125, -0.74591064453125, -0.7070770263671875, -0.668243408203125, -0.6294097900390625, -0.590576171875, -0.5517425537109375, -0.512908935546875, -0.4740753173828125, -0.43524169921875, -0.3964080810546875, -0.357574462890625, -0.3187408447265625, -0.2799072265625, -0.2410736083984375, -0.202239990234375, -0.1634063720703125, -0.12457275390625, -0.0857391357421875, -0.046905517578125, -0.0080718994140625, 0.03076171875, 0.0695953369140625, 0.108428955078125, 0.1472625732421875, 0.18609619140625, 0.2249298095703125, 0.263763427734375, 0.3025970458984375, 0.3414306640625, 0.3802642822265625, 0.419097900390625, 0.4579315185546875, 0.49676513671875, 0.5355987548828125, 0.574432373046875, 0.6132659912109375, 0.652099609375, 0.6909332275390625, 0.729766845703125, 0.7686004638671875, 0.80743408203125, 0.8462677001953125, 0.885101318359375, 0.9239349365234375, 0.9627685546875, 1.0016021728515625, 1.040435791015625, 1.0792694091796875, 1.11810302734375, 1.1569366455078125, 1.195770263671875, 1.2346038818359375, 1.2734375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 15.0, 13.0, 12.0, 22.0, 32.0, 30.0, 30.0, 49.0, 57.0, 68.0, 74.0, 88.0, 75.0, 84.0, 57.0, 66.0, 32.0, 30.0, 29.0, 26.0, 19.0, 13.0, 10.0, 6.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 4.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1339111328125, -0.1291351318359375, -0.124359130859375, -0.1195831298828125, -0.11480712890625, -0.1100311279296875, -0.105255126953125, -0.1004791259765625, -0.095703125, -0.0909271240234375, -0.086151123046875, -0.0813751220703125, -0.07659912109375, -0.0718231201171875, -0.067047119140625, -0.0622711181640625, -0.0574951171875, -0.0527191162109375, -0.047943115234375, -0.0431671142578125, -0.03839111328125, -0.0336151123046875, -0.028839111328125, -0.0240631103515625, -0.019287109375, -0.0145111083984375, -0.009735107421875, -0.0049591064453125, -0.00018310546875, 0.0045928955078125, 0.009368896484375, 0.0141448974609375, 0.0189208984375, 0.0236968994140625, 0.028472900390625, 0.0332489013671875, 0.03802490234375, 0.0428009033203125, 0.047576904296875, 0.0523529052734375, 0.05712890625, 0.0619049072265625, 0.066680908203125, 0.0714569091796875, 0.07623291015625, 0.0810089111328125, 0.085784912109375, 0.0905609130859375, 0.0953369140625, 0.1001129150390625, 0.104888916015625, 0.1096649169921875, 0.11444091796875, 0.1192169189453125, 0.123992919921875, 0.1287689208984375, 0.133544921875, 0.1383209228515625, 0.143096923828125, 0.1478729248046875, 0.15264892578125, 0.1574249267578125, 0.162200927734375, 0.1669769287109375, 0.1717529296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 11.0, 20.0, 25.0, 46.0, 87.0, 160.0, 306.0, 583.0, 1214.0, 2938.0, 7654.0, 25113.0, 111304.0, 492071.0, 319113.0, 62642.0, 15826.0, 5253.0, 2152.0, 992.0, 464.0, 244.0, 134.0, 70.0, 48.0, 27.0, 16.0, 12.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6904296875, -1.6404571533203125, -1.590484619140625, -1.5405120849609375, -1.49053955078125, -1.4405670166015625, -1.390594482421875, -1.3406219482421875, -1.2906494140625, -1.2406768798828125, -1.190704345703125, -1.1407318115234375, -1.09075927734375, -1.0407867431640625, -0.990814208984375, -0.9408416748046875, -0.890869140625, -0.8408966064453125, -0.790924072265625, -0.7409515380859375, -0.69097900390625, -0.6410064697265625, -0.591033935546875, -0.5410614013671875, -0.4910888671875, -0.4411163330078125, -0.391143798828125, -0.3411712646484375, -0.29119873046875, -0.2412261962890625, -0.191253662109375, -0.1412811279296875, -0.09130859375, -0.0413360595703125, 0.008636474609375, 0.0586090087890625, 0.10858154296875, 0.1585540771484375, 0.208526611328125, 0.2584991455078125, 0.3084716796875, 0.3584442138671875, 0.408416748046875, 0.4583892822265625, 0.50836181640625, 0.5583343505859375, 0.608306884765625, 0.6582794189453125, 0.708251953125, 0.7582244873046875, 0.808197021484375, 0.8581695556640625, 0.90814208984375, 0.9581146240234375, 1.008087158203125, 1.0580596923828125, 1.1080322265625, 1.1580047607421875, 1.207977294921875, 1.2579498291015625, 1.30792236328125, 1.3578948974609375, 1.407867431640625, 1.4578399658203125, 1.5078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 7.0, 13.0, 6.0, 19.0, 20.0, 17.0, 23.0, 21.0, 17.0, 27.0, 38.0, 31.0, 49.0, 40.0, 45.0, 43.0, 47.0, 42.0, 44.0, 46.0, 47.0, 40.0, 33.0, 40.0, 32.0, 27.0, 24.0, 30.0, 20.0, 27.0, 16.0, 13.0, 7.0, 10.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.67822265625, -0.6584091186523438, -0.6385955810546875, -0.6187820434570312, -0.598968505859375, -0.5791549682617188, -0.5593414306640625, -0.5395278930664062, -0.51971435546875, -0.49990081787109375, -0.4800872802734375, -0.46027374267578125, -0.440460205078125, -0.42064666748046875, -0.4008331298828125, -0.38101959228515625, -0.3612060546875, -0.34139251708984375, -0.3215789794921875, -0.30176544189453125, -0.281951904296875, -0.26213836669921875, -0.2423248291015625, -0.22251129150390625, -0.20269775390625, -0.18288421630859375, -0.1630706787109375, -0.14325714111328125, -0.123443603515625, -0.10363006591796875, -0.0838165283203125, -0.06400299072265625, -0.044189453125, -0.02437591552734375, -0.0045623779296875, 0.01525115966796875, 0.035064697265625, 0.05487823486328125, 0.0746917724609375, 0.09450531005859375, 0.11431884765625, 0.13413238525390625, 0.1539459228515625, 0.17375946044921875, 0.193572998046875, 0.21338653564453125, 0.2332000732421875, 0.25301361083984375, 0.2728271484375, 0.29264068603515625, 0.3124542236328125, 0.33226776123046875, 0.352081298828125, 0.37189483642578125, 0.3917083740234375, 0.41152191162109375, 0.43133544921875, 0.45114898681640625, 0.4709625244140625, 0.49077606201171875, 0.510589599609375, 0.5304031372070312, 0.5502166748046875, 0.5700302124023438, 0.58984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 14.0, 22.0, 26.0, 49.0, 54.0, 97.0, 139.0, 290.0, 495.0, 1099.0, 2560.0, 7304.0, 27333.0, 169598.0, 661766.0, 142658.0, 23882.0, 6555.0, 2425.0, 1044.0, 474.0, 252.0, 129.0, 84.0, 54.0, 31.0, 34.0, 24.0, 13.0, 10.0, 9.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5739898681640625, -1.523956298828125, -1.4739227294921875, -1.42388916015625, -1.3738555908203125, -1.323822021484375, -1.2737884521484375, -1.2237548828125, -1.1737213134765625, -1.123687744140625, -1.0736541748046875, -1.02362060546875, -0.9735870361328125, -0.923553466796875, -0.8735198974609375, -0.823486328125, -0.7734527587890625, -0.723419189453125, -0.6733856201171875, -0.62335205078125, -0.5733184814453125, -0.523284912109375, -0.4732513427734375, -0.4232177734375, -0.3731842041015625, -0.323150634765625, -0.2731170654296875, -0.22308349609375, -0.1730499267578125, -0.123016357421875, -0.0729827880859375, -0.02294921875, 0.0270843505859375, 0.077117919921875, 0.1271514892578125, 0.17718505859375, 0.2272186279296875, 0.277252197265625, 0.3272857666015625, 0.3773193359375, 0.4273529052734375, 0.477386474609375, 0.5274200439453125, 0.57745361328125, 0.6274871826171875, 0.677520751953125, 0.7275543212890625, 0.777587890625, 0.8276214599609375, 0.877655029296875, 0.9276885986328125, 0.97772216796875, 1.0277557373046875, 1.077789306640625, 1.1278228759765625, 1.1778564453125, 1.2278900146484375, 1.277923583984375, 1.3279571533203125, 1.37799072265625, 1.4280242919921875, 1.478057861328125, 1.5280914306640625, 1.578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 7.0, 5.0, 3.0, 7.0, 4.0, 7.0, 15.0, 7.0, 18.0, 13.0, 30.0, 40.0, 37.0, 51.0, 64.0, 61.0, 87.0, 64.0, 88.0, 64.0, 60.0, 53.0, 39.0, 30.0, 30.0, 26.0, 17.0, 14.0, 15.0, 10.0, 9.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022494792938232422, -0.00021739117801189423, -0.00020983442664146423, -0.00020227767527103424, -0.00019472092390060425, -0.00018716417253017426, -0.00017960742115974426, -0.00017205066978931427, -0.00016449391841888428, -0.00015693716704845428, -0.0001493804156780243, -0.0001418236643075943, -0.0001342669129371643, -0.00012671016156673431, -0.00011915341019630432, -0.00011159665882587433, -0.00010403990745544434, -9.648315608501434e-05, -8.892640471458435e-05, -8.136965334415436e-05, -7.381290197372437e-05, -6.625615060329437e-05, -5.869939923286438e-05, -5.114264786243439e-05, -4.3585896492004395e-05, -3.60291451215744e-05, -2.847239375114441e-05, -2.0915642380714417e-05, -1.3358891010284424e-05, -5.802139639854431e-06, 1.7546117305755615e-06, 9.311363101005554e-06, 1.6868114471435547e-05, 2.442486584186554e-05, 3.198161721229553e-05, 3.9538368582725525e-05, 4.709511995315552e-05, 5.465187132358551e-05, 6.22086226940155e-05, 6.97653740644455e-05, 7.732212543487549e-05, 8.487887680530548e-05, 9.243562817573547e-05, 9.999237954616547e-05, 0.00010754913091659546, 0.00011510588228702545, 0.00012266263365745544, 0.00013021938502788544, 0.00013777613639831543, 0.00014533288776874542, 0.00015288963913917542, 0.0001604463905096054, 0.0001680031418800354, 0.0001755598932504654, 0.00018311664462089539, 0.00019067339599132538, 0.00019823014736175537, 0.00020578689873218536, 0.00021334365010261536, 0.00022090040147304535, 0.00022845715284347534, 0.00023601390421390533, 0.00024357065558433533, 0.0002511274069547653, 0.0002586841583251953]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 8.0, 9.0, 6.0, 8.0, 16.0, 19.0, 33.0, 34.0, 54.0, 65.0, 127.0, 159.0, 250.0, 392.0, 674.0, 1233.0, 2677.0, 6024.0, 18996.0, 96578.0, 605204.0, 259616.0, 38159.0, 10263.0, 3802.0, 1728.0, 975.0, 491.0, 303.0, 206.0, 127.0, 89.0, 60.0, 43.0, 36.0, 24.0, 20.0, 9.0, 11.0, 8.0, 4.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6083984375, -1.55926513671875, -1.5101318359375, -1.46099853515625, -1.411865234375, -1.36273193359375, -1.3135986328125, -1.26446533203125, -1.21533203125, -1.16619873046875, -1.1170654296875, -1.06793212890625, -1.018798828125, -0.96966552734375, -0.9205322265625, -0.87139892578125, -0.822265625, -0.77313232421875, -0.7239990234375, -0.67486572265625, -0.625732421875, -0.57659912109375, -0.5274658203125, -0.47833251953125, -0.42919921875, -0.38006591796875, -0.3309326171875, -0.28179931640625, -0.232666015625, -0.18353271484375, -0.1343994140625, -0.08526611328125, -0.0361328125, 0.01300048828125, 0.0621337890625, 0.11126708984375, 0.160400390625, 0.20953369140625, 0.2586669921875, 0.30780029296875, 0.35693359375, 0.40606689453125, 0.4552001953125, 0.50433349609375, 0.553466796875, 0.60260009765625, 0.6517333984375, 0.70086669921875, 0.75, 0.79913330078125, 0.8482666015625, 0.89739990234375, 0.946533203125, 0.99566650390625, 1.0447998046875, 1.09393310546875, 1.14306640625, 1.19219970703125, 1.2413330078125, 1.29046630859375, 1.339599609375, 1.38873291015625, 1.4378662109375, 1.48699951171875, 1.5361328125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 15.0, 30.0, 51.0, 87.0, 170.0, 179.0, 167.0, 127.0, 58.0, 46.0, 28.0, 13.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.501953125, -1.4586639404296875, -1.415374755859375, -1.3720855712890625, -1.32879638671875, -1.2855072021484375, -1.242218017578125, -1.1989288330078125, -1.1556396484375, -1.1123504638671875, -1.069061279296875, -1.0257720947265625, -0.98248291015625, -0.9391937255859375, -0.895904541015625, -0.8526153564453125, -0.809326171875, -0.7660369873046875, -0.722747802734375, -0.6794586181640625, -0.63616943359375, -0.5928802490234375, -0.549591064453125, -0.5063018798828125, -0.4630126953125, -0.4197235107421875, -0.376434326171875, -0.3331451416015625, -0.28985595703125, -0.2465667724609375, -0.203277587890625, -0.1599884033203125, -0.11669921875, -0.0734100341796875, -0.030120849609375, 0.0131683349609375, 0.05645751953125, 0.0997467041015625, 0.143035888671875, 0.1863250732421875, 0.2296142578125, 0.2729034423828125, 0.316192626953125, 0.3594818115234375, 0.40277099609375, 0.4460601806640625, 0.489349365234375, 0.5326385498046875, 0.575927734375, 0.6192169189453125, 0.662506103515625, 0.7057952880859375, 0.74908447265625, 0.7923736572265625, 0.835662841796875, 0.8789520263671875, 0.9222412109375, 0.9655303955078125, 1.008819580078125, 1.0521087646484375, 1.09539794921875, 1.1386871337890625, 1.181976318359375, 1.2252655029296875, 1.2685546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 12.0, 17.0, 65.0, 166.0, 279.0, 248.0, 110.0, 53.0, 15.0, 9.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.427313804626465, -14.942720413208008, -14.458127975463867, -13.97353458404541, -13.488941192626953, -13.004348754882812, -12.519755363464355, -12.035161972045898, -11.550569534301758, -11.0659761428833, -10.58138370513916, -10.096790313720703, -9.612196922302246, -9.127603530883789, -8.643011093139648, -8.158417701721191, -7.673824310302734, -7.1892313957214355, -6.7046380043029785, -6.22004508972168, -5.735451698303223, -5.250858783721924, -4.766265869140625, -4.281672477722168, -3.797079563140869, -3.312486410140991, -2.8278932571411133, -2.3433003425598145, -1.8587071895599365, -1.3741140365600586, -0.8895211219787598, -0.40492796897888184, 0.07966423034667969, 0.5642573237419128, 1.048850417137146, 1.5334434509277344, 2.0180366039276123, 2.5026297569274902, 2.987222671508789, 3.471815824508667, 3.956408977508545, 4.441001892089844, 4.925595283508301, 5.4101881980896, 5.894781112670898, 6.3793745040893555, 6.863967418670654, 7.348560333251953, 7.83315372467041, 8.317747116088867, 8.802339553833008, 9.286932945251465, 9.771526336669922, 10.256118774414062, 10.74071216583252, 11.225305557250977, 11.709897994995117, 12.194491386413574, 12.679083824157715, 13.163677215576172, 13.648270606994629, 14.132863998413086, 14.617456436157227, 15.102049827575684, 15.58664321899414]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 20.0, 10.0, 17.0, 39.0, 51.0, 71.0, 90.0, 98.0, 118.0, 110.0, 115.0, 69.0, 68.0, 36.0, 19.0, 18.0, 9.0, 3.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0905122756958, -9.769287109375, -9.4480619430542, -9.126836776733398, -8.805612564086914, -8.484387397766113, -8.163162231445312, -7.841937065124512, -7.520711898803711, -7.19948673248291, -6.878261566162109, -6.557036876678467, -6.235811710357666, -5.914586544036865, -5.593361854553223, -5.272136688232422, -4.950911521911621, -4.62968635559082, -4.3084611892700195, -3.987236499786377, -3.666011333465576, -3.3447861671447754, -3.0235612392425537, -2.702336311340332, -2.3811111450195312, -2.0598859786987305, -1.7386610507965088, -1.4174360036849976, -1.0962109565734863, -0.7749859094619751, -0.45376086235046387, -0.1325359344482422, 0.188690185546875, 0.5099152326583862, 0.8311402797698975, 1.1523653268814087, 1.47359037399292, 1.7948154211044312, 2.1160404682159424, 2.437265396118164, 2.758490562438965, 3.0797157287597656, 3.4009406566619873, 3.722165584564209, 4.04339075088501, 4.3646159172058105, 4.685840606689453, 5.007065773010254, 5.328290939331055, 5.6495161056518555, 5.970741271972656, 6.291965961456299, 6.6131911277771, 6.9344162940979, 7.255640983581543, 7.576866149902344, 7.8980913162231445, 8.219316482543945, 8.540541648864746, 8.861766815185547, 9.182991027832031, 9.504216194152832, 9.825441360473633, 10.146666526794434, 10.467891693115234]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 10.0, 12.0, 15.0, 25.0, 41.0, 48.0, 74.0, 110.0, 164.0, 226.0, 367.0, 652.0, 1051.0, 1734.0, 3105.0, 5838.0, 12379.0, 31416.0, 116763.0, 3578688.0, 348068.0, 55288.0, 19018.0, 8375.0, 4295.0, 2441.0, 1403.0, 890.0, 548.0, 359.0, 249.0, 148.0, 112.0, 89.0, 59.0, 37.0, 39.0, 31.0, 29.0, 19.0, 13.0, 10.0, 17.0, 8.0, 4.0, 1.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.2578125, -2.179290771484375, -2.10076904296875, -2.022247314453125, -1.9437255859375, -1.865203857421875, -1.78668212890625, -1.708160400390625, -1.629638671875, -1.551116943359375, -1.47259521484375, -1.394073486328125, -1.3155517578125, -1.237030029296875, -1.15850830078125, -1.079986572265625, -1.00146484375, -0.922943115234375, -0.84442138671875, -0.765899658203125, -0.6873779296875, -0.608856201171875, -0.53033447265625, -0.451812744140625, -0.373291015625, -0.294769287109375, -0.21624755859375, -0.137725830078125, -0.0592041015625, 0.019317626953125, 0.09783935546875, 0.176361083984375, 0.2548828125, 0.333404541015625, 0.41192626953125, 0.490447998046875, 0.5689697265625, 0.647491455078125, 0.72601318359375, 0.804534912109375, 0.883056640625, 0.961578369140625, 1.04010009765625, 1.118621826171875, 1.1971435546875, 1.275665283203125, 1.35418701171875, 1.432708740234375, 1.51123046875, 1.589752197265625, 1.66827392578125, 1.746795654296875, 1.8253173828125, 1.903839111328125, 1.98236083984375, 2.060882568359375, 2.139404296875, 2.217926025390625, 2.29644775390625, 2.374969482421875, 2.4534912109375, 2.532012939453125, 2.61053466796875, 2.689056396484375, 2.767578125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 8.0, 13.0, 15.0, 17.0, 23.0, 35.0, 27.0, 50.0, 62.0, 59.0, 72.0, 95.0, 79.0, 92.0, 78.0, 63.0, 52.0, 33.0, 22.0, 25.0, 19.0, 11.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.12720870971679688, -0.12172698974609375, -0.11624526977539062, -0.1107635498046875, -0.10528182983398438, -0.09980010986328125, -0.09431838989257812, -0.088836669921875, -0.08335494995117188, -0.07787322998046875, -0.07239151000976562, -0.0669097900390625, -0.061428070068359375, -0.05594635009765625, -0.050464630126953125, -0.04498291015625, -0.039501190185546875, -0.03401947021484375, -0.028537750244140625, -0.0230560302734375, -0.017574310302734375, -0.01209259033203125, -0.006610870361328125, -0.001129150390625, 0.004352569580078125, 0.00983428955078125, 0.015316009521484375, 0.0207977294921875, 0.026279449462890625, 0.03176116943359375, 0.037242889404296875, 0.042724609375, 0.048206329345703125, 0.05368804931640625, 0.059169769287109375, 0.0646514892578125, 0.07013320922851562, 0.07561492919921875, 0.08109664916992188, 0.086578369140625, 0.09206008911132812, 0.09754180908203125, 0.10302352905273438, 0.1085052490234375, 0.11398696899414062, 0.11946868896484375, 0.12495040893554688, 0.13043212890625, 0.13591384887695312, 0.14139556884765625, 0.14687728881835938, 0.1523590087890625, 0.15784072875976562, 0.16332244873046875, 0.16880416870117188, 0.174285888671875, 0.17976760864257812, 0.18524932861328125, 0.19073104858398438, 0.1962127685546875, 0.20169448852539062, 0.20717620849609375, 0.21265792846679688, 0.2181396484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 13.0, 6.0, 27.0, 44.0, 81.0, 133.0, 247.0, 496.0, 1190.0, 3730.0, 15355.0, 90241.0, 3772691.0, 270692.0, 29661.0, 6488.0, 1843.0, 681.0, 284.0, 143.0, 79.0, 40.0, 32.0, 20.0, 19.0, 12.0, 8.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.8795166015625, -3.739501953125, -3.5994873046875, -3.45947265625, -3.3194580078125, -3.179443359375, -3.0394287109375, -2.8994140625, -2.7593994140625, -2.619384765625, -2.4793701171875, -2.33935546875, -2.1993408203125, -2.059326171875, -1.9193115234375, -1.779296875, -1.6392822265625, -1.499267578125, -1.3592529296875, -1.21923828125, -1.0792236328125, -0.939208984375, -0.7991943359375, -0.6591796875, -0.5191650390625, -0.379150390625, -0.2391357421875, -0.09912109375, 0.0408935546875, 0.180908203125, 0.3209228515625, 0.4609375, 0.6009521484375, 0.740966796875, 0.8809814453125, 1.02099609375, 1.1610107421875, 1.301025390625, 1.4410400390625, 1.5810546875, 1.7210693359375, 1.861083984375, 2.0010986328125, 2.14111328125, 2.2811279296875, 2.421142578125, 2.5611572265625, 2.701171875, 2.8411865234375, 2.981201171875, 3.1212158203125, 3.26123046875, 3.4012451171875, 3.541259765625, 3.6812744140625, 3.8212890625, 3.9613037109375, 4.101318359375, 4.2413330078125, 4.38134765625, 4.5213623046875, 4.661376953125, 4.8013916015625, 4.94140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 6.0, 9.0, 5.0, 12.0, 16.0, 22.0, 21.0, 35.0, 59.0, 102.0, 140.0, 409.0, 2163.0, 555.0, 171.0, 114.0, 82.0, 42.0, 27.0, 25.0, 17.0, 9.0, 10.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60888671875, -0.5935249328613281, -0.5781631469726562, -0.5628013610839844, -0.5474395751953125, -0.5320777893066406, -0.5167160034179688, -0.5013542175292969, -0.485992431640625, -0.4706306457519531, -0.45526885986328125, -0.4399070739746094, -0.4245452880859375, -0.4091835021972656, -0.39382171630859375, -0.3784599304199219, -0.36309814453125, -0.3477363586425781, -0.33237457275390625, -0.3170127868652344, -0.3016510009765625, -0.2862892150878906, -0.27092742919921875, -0.2555656433105469, -0.240203857421875, -0.22484207153320312, -0.20948028564453125, -0.19411849975585938, -0.1787567138671875, -0.16339492797851562, -0.14803314208984375, -0.13267135620117188, -0.1173095703125, -0.10194778442382812, -0.08658599853515625, -0.07122421264648438, -0.0558624267578125, -0.040500640869140625, -0.02513885498046875, -0.009777069091796875, 0.005584716796875, 0.020946502685546875, 0.03630828857421875, 0.051670074462890625, 0.0670318603515625, 0.08239364624023438, 0.09775543212890625, 0.11311721801757812, 0.12847900390625, 0.14384078979492188, 0.15920257568359375, 0.17456436157226562, 0.1899261474609375, 0.20528793334960938, 0.22064971923828125, 0.23601150512695312, 0.251373291015625, 0.2667350769042969, 0.28209686279296875, 0.2974586486816406, 0.3128204345703125, 0.3281822204589844, 0.34354400634765625, 0.3589057922363281, 0.374267578125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 3.0, 6.0, 7.0, 21.0, 15.0, 27.0, 49.0, 58.0, 84.0, 116.0, 132.0, 126.0, 103.0, 93.0, 50.0, 31.0, 21.0, 17.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9242444038391113, -2.84871506690979, -2.7731854915618896, -2.6976561546325684, -2.622126579284668, -2.5465972423553467, -2.4710676670074463, -2.395538330078125, -2.3200087547302246, -2.2444794178009033, -2.168949842453003, -2.0934205055236816, -2.0178909301757812, -1.94236159324646, -1.8668321371078491, -1.7913026809692383, -1.715773344039917, -1.6402438879013062, -1.5647144317626953, -1.4891849756240845, -1.4136555194854736, -1.3381261825561523, -1.2625967264175415, -1.1870672702789307, -1.1115378141403198, -1.036008358001709, -0.9604789018630981, -0.8849495053291321, -0.8094200491905212, -0.7338905930519104, -0.6583611965179443, -0.5828317403793335, -0.5073025226593018, -0.4317730665206909, -0.35624364018440247, -0.280714213848114, -0.20518475770950317, -0.12965530157089233, -0.05412587523460388, 0.02140355110168457, 0.09693300724029541, 0.17246244847774506, 0.2479918897151947, 0.32352131605148315, 0.399050772190094, 0.47458022832870483, 0.5501096248626709, 0.6256390810012817, 0.7011685371398926, 0.7766979932785034, 0.8522274494171143, 0.9277568459510803, 1.003286361694336, 1.0788156986236572, 1.154345154762268, 1.229874610900879, 1.3054040670394897, 1.3809335231781006, 1.4564629793167114, 1.5319924354553223, 1.6075217723846436, 1.683051347732544, 1.7585806846618652, 1.834110140800476, 1.909639596939087]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 11.0, 11.0, 14.0, 24.0, 26.0, 27.0, 40.0, 38.0, 39.0, 62.0, 68.0, 59.0, 61.0, 83.0, 72.0, 52.0, 35.0, 52.0, 49.0, 32.0, 30.0, 20.0, 18.0, 19.0, 11.0, 17.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.746351957321167, -1.6872366666793823, -1.6281213760375977, -1.5690059661865234, -1.5098906755447388, -1.450775384902954, -1.3916600942611694, -1.3325448036193848, -1.2734295129776, -1.2143142223358154, -1.1551989316940308, -1.096083641052246, -1.0369682312011719, -0.9778529405593872, -0.9187376499176025, -0.8596223592758179, -0.8005070090293884, -0.7413917183876038, -0.6822763681411743, -0.6231610774993896, -0.564045786857605, -0.5049304962158203, -0.44581514596939087, -0.3866998553276062, -0.32758453488349915, -0.2684692144393921, -0.20935392379760742, -0.15023860335350037, -0.0911232978105545, -0.03200799226760864, 0.027107328176498413, 0.08622261881828308, 0.14533793926239014, 0.204453244805336, 0.26356855034828186, 0.3226838707923889, 0.3817991614341736, 0.44091448187828064, 0.5000298023223877, 0.5591450929641724, 0.618260383605957, 0.6773756742477417, 0.7364910244941711, 0.7956063151359558, 0.8547216057777405, 0.9138369560241699, 0.9729522466659546, 1.0320675373077393, 1.0911829471588135, 1.1502982378005981, 1.2094135284423828, 1.268528938293457, 1.3276442289352417, 1.3867595195770264, 1.445874810218811, 1.5049901008605957, 1.5641053915023804, 1.623220682144165, 1.6823359727859497, 1.7414512634277344, 1.8005666732788086, 1.8596819639205933, 1.918797254562378, 1.9779125452041626, 2.0370278358459473]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 11.0, 9.0, 17.0, 33.0, 58.0, 70.0, 131.0, 218.0, 374.0, 641.0, 1221.0, 2717.0, 6347.0, 16719.0, 51979.0, 189920.0, 465504.0, 220696.0, 59994.0, 18998.0, 7000.0, 2891.0, 1427.0, 642.0, 375.0, 225.0, 119.0, 66.0, 53.0, 33.0, 29.0, 15.0, 7.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90234375, -1.837982177734375, -1.77362060546875, -1.709259033203125, -1.6448974609375, -1.580535888671875, -1.51617431640625, -1.451812744140625, -1.387451171875, -1.323089599609375, -1.25872802734375, -1.194366455078125, -1.1300048828125, -1.065643310546875, -1.00128173828125, -0.936920166015625, -0.87255859375, -0.808197021484375, -0.74383544921875, -0.679473876953125, -0.6151123046875, -0.550750732421875, -0.48638916015625, -0.422027587890625, -0.357666015625, -0.293304443359375, -0.22894287109375, -0.164581298828125, -0.1002197265625, -0.035858154296875, 0.02850341796875, 0.092864990234375, 0.1572265625, 0.221588134765625, 0.28594970703125, 0.350311279296875, 0.4146728515625, 0.479034423828125, 0.54339599609375, 0.607757568359375, 0.672119140625, 0.736480712890625, 0.80084228515625, 0.865203857421875, 0.9295654296875, 0.993927001953125, 1.05828857421875, 1.122650146484375, 1.18701171875, 1.251373291015625, 1.31573486328125, 1.380096435546875, 1.4444580078125, 1.508819580078125, 1.57318115234375, 1.637542724609375, 1.701904296875, 1.766265869140625, 1.83062744140625, 1.894989013671875, 1.9593505859375, 2.023712158203125, 2.08807373046875, 2.152435302734375, 2.216796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 9.0, 11.0, 14.0, 24.0, 29.0, 33.0, 57.0, 61.0, 98.0, 82.0, 91.0, 80.0, 96.0, 64.0, 65.0, 51.0, 40.0, 30.0, 13.0, 16.0, 9.0, 6.0, 7.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.12932968139648438, -0.12316131591796875, -0.11699295043945312, -0.1108245849609375, -0.10465621948242188, -0.09848785400390625, -0.09231948852539062, -0.086151123046875, -0.07998275756835938, -0.07381439208984375, -0.06764602661132812, -0.0614776611328125, -0.055309295654296875, -0.04914093017578125, -0.042972564697265625, -0.03680419921875, -0.030635833740234375, -0.02446746826171875, -0.018299102783203125, -0.0121307373046875, -0.005962371826171875, 0.00020599365234375, 0.006374359130859375, 0.012542724609375, 0.018711090087890625, 0.02487945556640625, 0.031047821044921875, 0.0372161865234375, 0.043384552001953125, 0.04955291748046875, 0.055721282958984375, 0.0618896484375, 0.06805801391601562, 0.07422637939453125, 0.08039474487304688, 0.0865631103515625, 0.09273147583007812, 0.09889984130859375, 0.10506820678710938, 0.111236572265625, 0.11740493774414062, 0.12357330322265625, 0.12974166870117188, 0.1359100341796875, 0.14207839965820312, 0.14824676513671875, 0.15441513061523438, 0.16058349609375, 0.16675186157226562, 0.17292022705078125, 0.17908859252929688, 0.1852569580078125, 0.19142532348632812, 0.19759368896484375, 0.20376205444335938, 0.209930419921875, 0.21609878540039062, 0.22226715087890625, 0.22843551635742188, 0.2346038818359375, 0.24077224731445312, 0.24694061279296875, 0.2531089782714844, 0.25927734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 3.0, 16.0, 13.0, 18.0, 27.0, 33.0, 48.0, 63.0, 90.0, 127.0, 218.0, 302.0, 426.0, 776.0, 1400.0, 3133.0, 7786.0, 24086.0, 87828.0, 321521.0, 415945.0, 130941.0, 34803.0, 10748.0, 3875.0, 1780.0, 957.0, 549.0, 336.0, 227.0, 128.0, 93.0, 73.0, 56.0, 37.0, 25.0, 19.0, 16.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0], "bins": [-2.27734375, -2.216033935546875, -2.15472412109375, -2.093414306640625, -2.0321044921875, -1.970794677734375, -1.90948486328125, -1.848175048828125, -1.786865234375, -1.725555419921875, -1.66424560546875, -1.602935791015625, -1.5416259765625, -1.480316162109375, -1.41900634765625, -1.357696533203125, -1.29638671875, -1.235076904296875, -1.17376708984375, -1.112457275390625, -1.0511474609375, -0.989837646484375, -0.92852783203125, -0.867218017578125, -0.805908203125, -0.744598388671875, -0.68328857421875, -0.621978759765625, -0.5606689453125, -0.499359130859375, -0.43804931640625, -0.376739501953125, -0.3154296875, -0.254119873046875, -0.19281005859375, -0.131500244140625, -0.0701904296875, -0.008880615234375, 0.05242919921875, 0.113739013671875, 0.175048828125, 0.236358642578125, 0.29766845703125, 0.358978271484375, 0.4202880859375, 0.481597900390625, 0.54290771484375, 0.604217529296875, 0.66552734375, 0.726837158203125, 0.78814697265625, 0.849456787109375, 0.9107666015625, 0.972076416015625, 1.03338623046875, 1.094696044921875, 1.156005859375, 1.217315673828125, 1.27862548828125, 1.339935302734375, 1.4012451171875, 1.462554931640625, 1.52386474609375, 1.585174560546875, 1.646484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 5.0, 5.0, 4.0, 10.0, 3.0, 9.0, 9.0, 16.0, 11.0, 12.0, 23.0, 21.0, 29.0, 37.0, 30.0, 39.0, 39.0, 36.0, 45.0, 62.0, 51.0, 51.0, 42.0, 46.0, 33.0, 42.0, 41.0, 32.0, 25.0, 24.0, 25.0, 29.0, 21.0, 15.0, 13.0, 11.0, 9.0, 10.0, 7.0, 10.0, 7.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.92041015625, -0.8949203491210938, -0.8694305419921875, -0.8439407348632812, -0.818450927734375, -0.7929611206054688, -0.7674713134765625, -0.7419815063476562, -0.71649169921875, -0.6910018920898438, -0.6655120849609375, -0.6400222778320312, -0.614532470703125, -0.5890426635742188, -0.5635528564453125, -0.5380630493164062, -0.5125732421875, -0.48708343505859375, -0.4615936279296875, -0.43610382080078125, -0.410614013671875, -0.38512420654296875, -0.3596343994140625, -0.33414459228515625, -0.30865478515625, -0.28316497802734375, -0.2576751708984375, -0.23218536376953125, -0.206695556640625, -0.18120574951171875, -0.1557159423828125, -0.13022613525390625, -0.104736328125, -0.07924652099609375, -0.0537567138671875, -0.02826690673828125, -0.002777099609375, 0.02271270751953125, 0.0482025146484375, 0.07369232177734375, 0.09918212890625, 0.12467193603515625, 0.1501617431640625, 0.17565155029296875, 0.201141357421875, 0.22663116455078125, 0.2521209716796875, 0.27761077880859375, 0.3031005859375, 0.32859039306640625, 0.3540802001953125, 0.37957000732421875, 0.405059814453125, 0.43054962158203125, 0.4560394287109375, 0.48152923583984375, 0.50701904296875, 0.5325088500976562, 0.5579986572265625, 0.5834884643554688, 0.608978271484375, 0.6344680786132812, 0.6599578857421875, 0.6854476928710938, 0.7109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 18.0, 13.0, 18.0, 36.0, 48.0, 73.0, 105.0, 175.0, 326.0, 566.0, 1185.0, 2894.0, 8328.0, 30635.0, 158317.0, 575597.0, 214268.0, 39699.0, 10047.0, 3242.0, 1359.0, 686.0, 344.0, 193.0, 134.0, 73.0, 46.0, 37.0, 19.0, 18.0, 14.0, 7.0, 9.0, 5.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -0.9962158203125, -0.957275390625, -0.9183349609375, -0.87939453125, -0.8404541015625, -0.801513671875, -0.7625732421875, -0.7236328125, -0.6846923828125, -0.645751953125, -0.6068115234375, -0.56787109375, -0.5289306640625, -0.489990234375, -0.4510498046875, -0.412109375, -0.3731689453125, -0.334228515625, -0.2952880859375, -0.25634765625, -0.2174072265625, -0.178466796875, -0.1395263671875, -0.1005859375, -0.0616455078125, -0.022705078125, 0.0162353515625, 0.05517578125, 0.0941162109375, 0.133056640625, 0.1719970703125, 0.2109375, 0.2498779296875, 0.288818359375, 0.3277587890625, 0.36669921875, 0.4056396484375, 0.444580078125, 0.4835205078125, 0.5224609375, 0.5614013671875, 0.600341796875, 0.6392822265625, 0.67822265625, 0.7171630859375, 0.756103515625, 0.7950439453125, 0.833984375, 0.8729248046875, 0.911865234375, 0.9508056640625, 0.98974609375, 1.0286865234375, 1.067626953125, 1.1065673828125, 1.1455078125, 1.1844482421875, 1.223388671875, 1.2623291015625, 1.30126953125, 1.3402099609375, 1.379150390625, 1.4180908203125, 1.45703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 8.0, 3.0, 10.0, 9.0, 18.0, 21.0, 26.0, 42.0, 45.0, 58.0, 84.0, 97.0, 104.0, 108.0, 80.0, 70.0, 43.0, 52.0, 21.0, 25.0, 18.0, 17.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002281665802001953, -0.00022071972489356995, -0.00021327286958694458, -0.00020582601428031921, -0.00019837915897369385, -0.00019093230366706848, -0.00018348544836044312, -0.00017603859305381775, -0.00016859173774719238, -0.00016114488244056702, -0.00015369802713394165, -0.00014625117182731628, -0.00013880431652069092, -0.00013135746121406555, -0.00012391060590744019, -0.00011646375060081482, -0.00010901689529418945, -0.00010157003998756409, -9.412318468093872e-05, -8.667632937431335e-05, -7.922947406768799e-05, -7.178261876106262e-05, -6.433576345443726e-05, -5.688890814781189e-05, -4.9442052841186523e-05, -4.199519753456116e-05, -3.454834222793579e-05, -2.7101486921310425e-05, -1.965463161468506e-05, -1.2207776308059692e-05, -4.760921001434326e-06, 2.68593430519104e-06, 1.0132789611816406e-05, 1.7579644918441772e-05, 2.502650022506714e-05, 3.2473355531692505e-05, 3.992021083831787e-05, 4.736706614494324e-05, 5.4813921451568604e-05, 6.226077675819397e-05, 6.970763206481934e-05, 7.71544873714447e-05, 8.460134267807007e-05, 9.204819798469543e-05, 9.94950532913208e-05, 0.00010694190859794617, 0.00011438876390457153, 0.0001218356192111969, 0.00012928247451782227, 0.00013672932982444763, 0.000144176185131073, 0.00015162304043769836, 0.00015906989574432373, 0.0001665167510509491, 0.00017396360635757446, 0.00018141046166419983, 0.0001888573169708252, 0.00019630417227745056, 0.00020375102758407593, 0.0002111978828907013, 0.00021864473819732666, 0.00022609159350395203, 0.0002335384488105774, 0.00024098530411720276, 0.0002484321594238281]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 10.0, 18.0, 25.0, 55.0, 69.0, 153.0, 289.0, 824.0, 2405.0, 10096.0, 96972.0, 846905.0, 78030.0, 8974.0, 2253.0, 754.0, 331.0, 156.0, 93.0, 49.0, 28.0, 22.0, 9.0, 8.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.771484375, -2.68865966796875, -2.6058349609375, -2.52301025390625, -2.440185546875, -2.35736083984375, -2.2745361328125, -2.19171142578125, -2.10888671875, -2.02606201171875, -1.9432373046875, -1.86041259765625, -1.777587890625, -1.69476318359375, -1.6119384765625, -1.52911376953125, -1.4462890625, -1.36346435546875, -1.2806396484375, -1.19781494140625, -1.114990234375, -1.03216552734375, -0.9493408203125, -0.86651611328125, -0.78369140625, -0.70086669921875, -0.6180419921875, -0.53521728515625, -0.452392578125, -0.36956787109375, -0.2867431640625, -0.20391845703125, -0.12109375, -0.03826904296875, 0.0445556640625, 0.12738037109375, 0.210205078125, 0.29302978515625, 0.3758544921875, 0.45867919921875, 0.54150390625, 0.62432861328125, 0.7071533203125, 0.78997802734375, 0.872802734375, 0.95562744140625, 1.0384521484375, 1.12127685546875, 1.2041015625, 1.28692626953125, 1.3697509765625, 1.45257568359375, 1.535400390625, 1.61822509765625, 1.7010498046875, 1.78387451171875, 1.86669921875, 1.94952392578125, 2.0323486328125, 2.11517333984375, 2.197998046875, 2.28082275390625, 2.3636474609375, 2.44647216796875, 2.529296875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 19.0, 28.0, 26.0, 44.0, 64.0, 87.0, 93.0, 109.0, 123.0, 104.0, 78.0, 48.0, 37.0, 33.0, 17.0, 16.0, 12.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65087890625, -0.6281814575195312, -0.6054840087890625, -0.5827865600585938, -0.560089111328125, -0.5373916625976562, -0.5146942138671875, -0.49199676513671875, -0.46929931640625, -0.44660186767578125, -0.4239044189453125, -0.40120697021484375, -0.378509521484375, -0.35581207275390625, -0.3331146240234375, -0.31041717529296875, -0.2877197265625, -0.26502227783203125, -0.2423248291015625, -0.21962738037109375, -0.196929931640625, -0.17423248291015625, -0.1515350341796875, -0.12883758544921875, -0.10614013671875, -0.08344268798828125, -0.0607452392578125, -0.03804779052734375, -0.015350341796875, 0.00734710693359375, 0.0300445556640625, 0.05274200439453125, 0.075439453125, 0.09813690185546875, 0.1208343505859375, 0.14353179931640625, 0.166229248046875, 0.18892669677734375, 0.2116241455078125, 0.23432159423828125, 0.25701904296875, 0.27971649169921875, 0.3024139404296875, 0.32511138916015625, 0.347808837890625, 0.37050628662109375, 0.3932037353515625, 0.41590118408203125, 0.4385986328125, 0.46129608154296875, 0.4839935302734375, 0.5066909790039062, 0.529388427734375, 0.5520858764648438, 0.5747833251953125, 0.5974807739257812, 0.62017822265625, 0.6428756713867188, 0.6655731201171875, 0.6882705688476562, 0.710968017578125, 0.7336654663085938, 0.7563629150390625, 0.7790603637695312, 0.8017578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 15.0, 38.0, 53.0, 130.0, 220.0, 241.0, 158.0, 78.0, 38.0, 10.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.42030906677246, -21.815692901611328, -21.211078643798828, -20.606462478637695, -20.001846313476562, -19.39723014831543, -18.792613983154297, -18.187999725341797, -17.583383560180664, -16.97876739501953, -16.37415313720703, -15.769536972045898, -15.164920806884766, -14.560304641723633, -13.955689430236816, -13.35107421875, -12.746458053588867, -12.141841888427734, -11.537226676940918, -10.932611465454102, -10.327995300292969, -9.723379135131836, -9.11876392364502, -8.514148712158203, -7.90953254699707, -7.304916858673096, -6.700301170349121, -6.0956854820251465, -5.491069793701172, -4.886454105377197, -4.281838417053223, -3.677222728729248, -3.0726089477539062, -2.4679932594299316, -1.863377571105957, -1.2587618827819824, -0.6541461944580078, -0.0495305061340332, 0.5550851821899414, 1.159700870513916, 1.7643165588378906, 2.3689322471618652, 2.97354793548584, 3.5781636238098145, 4.182779312133789, 4.787395000457764, 5.392010688781738, 5.996626377105713, 6.6012420654296875, 7.205857753753662, 7.810473442077637, 8.415088653564453, 9.019704818725586, 9.624320983886719, 10.228936195373535, 10.833551406860352, 11.438167572021484, 12.042783737182617, 12.647398948669434, 13.25201416015625, 13.856630325317383, 14.461246490478516, 15.065861701965332, 15.670476913452148, 16.27509307861328]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 10.0, 10.0, 18.0, 18.0, 26.0, 25.0, 36.0, 33.0, 47.0, 44.0, 37.0, 46.0, 49.0, 63.0, 48.0, 48.0, 48.0, 46.0, 46.0, 52.0, 42.0, 39.0, 28.0, 21.0, 20.0, 18.0, 17.0, 14.0, 12.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.888740539550781, -5.6534423828125, -5.418144226074219, -5.182845592498779, -4.947547435760498, -4.712249279022217, -4.476950645446777, -4.241652488708496, -4.006354331970215, -3.7710561752319336, -3.5357577800750732, -3.300459384918213, -3.0651612281799316, -2.8298630714416504, -2.59456467628479, -2.3592662811279297, -2.1239681243896484, -1.8886698484420776, -1.6533715724945068, -1.418073296546936, -1.1827750205993652, -0.9474767446517944, -0.7121784687042236, -0.47688019275665283, -0.24158191680908203, -0.0062836408615112305, 0.22901463508605957, 0.46431291103363037, 0.6996111869812012, 0.934909462928772, 1.1702077388763428, 1.4055060148239136, 1.6408042907714844, 1.8761025667190552, 2.111400842666626, 2.3466992378234863, 2.5819973945617676, 2.817295551300049, 3.052593946456909, 3.2878923416137695, 3.523190498352051, 3.758488655090332, 3.9937870502471924, 4.229085445404053, 4.464383602142334, 4.699681758880615, 4.934980392456055, 5.170278549194336, 5.405576705932617, 5.640874862670898, 5.87617301940918, 6.111471652984619, 6.3467698097229, 6.582067966461182, 6.817366600036621, 7.052664756774902, 7.287962913513184, 7.523261070251465, 7.758559226989746, 7.9938578605651855, 8.229156494140625, 8.464454650878906, 8.699752807617188, 8.935050964355469, 9.17034912109375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 12.0, 18.0, 17.0, 29.0, 34.0, 45.0, 81.0, 180.0, 850.0, 24356.0, 4155833.0, 11610.0, 750.0, 199.0, 98.0, 51.0, 36.0, 30.0, 15.0, 14.0, 5.0, 8.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.098388671875, -7.68115234375, -7.263916015625, -6.8466796875, -6.429443359375, -6.01220703125, -5.594970703125, -5.177734375, -4.760498046875, -4.34326171875, -3.926025390625, -3.5087890625, -3.091552734375, -2.67431640625, -2.257080078125, -1.83984375, -1.422607421875, -1.00537109375, -0.588134765625, -0.1708984375, 0.246337890625, 0.66357421875, 1.080810546875, 1.498046875, 1.915283203125, 2.33251953125, 2.749755859375, 3.1669921875, 3.584228515625, 4.00146484375, 4.418701171875, 4.8359375, 5.253173828125, 5.67041015625, 6.087646484375, 6.5048828125, 6.922119140625, 7.33935546875, 7.756591796875, 8.173828125, 8.591064453125, 9.00830078125, 9.425537109375, 9.8427734375, 10.260009765625, 10.67724609375, 11.094482421875, 11.51171875, 11.928955078125, 12.34619140625, 12.763427734375, 13.1806640625, 13.597900390625, 14.01513671875, 14.432373046875, 14.849609375, 15.266845703125, 15.68408203125, 16.101318359375, 16.5185546875, 16.935791015625, 17.35302734375, 17.770263671875, 18.1875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 11.0, 11.0, 20.0, 21.0, 35.0, 37.0, 58.0, 86.0, 82.0, 82.0, 86.0, 96.0, 78.0, 86.0, 68.0, 43.0, 25.0, 25.0, 23.0, 11.0, 9.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.1621074676513672, -0.15343856811523438, -0.14476966857910156, -0.13610076904296875, -0.12743186950683594, -0.11876296997070312, -0.11009407043457031, -0.1014251708984375, -0.09275627136230469, -0.08408737182617188, -0.07541847229003906, -0.06674957275390625, -0.05808067321777344, -0.049411773681640625, -0.04074287414550781, -0.032073974609375, -0.023405075073242188, -0.014736175537109375, -0.0060672760009765625, 0.00260162353515625, 0.011270523071289062, 0.019939422607421875, 0.028608322143554688, 0.0372772216796875, 0.04594612121582031, 0.054615020751953125, 0.06328392028808594, 0.07195281982421875, 0.08062171936035156, 0.08929061889648438, 0.09795951843261719, 0.10662841796875, 0.11529731750488281, 0.12396621704101562, 0.13263511657714844, 0.14130401611328125, 0.14997291564941406, 0.15864181518554688, 0.1673107147216797, 0.1759796142578125, 0.1846485137939453, 0.19331741333007812, 0.20198631286621094, 0.21065521240234375, 0.21932411193847656, 0.22799301147460938, 0.2366619110107422, 0.245330810546875, 0.2539997100830078, 0.2626686096191406, 0.27133750915527344, 0.28000640869140625, 0.28867530822753906, 0.2973442077636719, 0.3060131072998047, 0.3146820068359375, 0.3233509063720703, 0.3320198059082031, 0.34068870544433594, 0.34935760498046875, 0.35802650451660156, 0.3666954040527344, 0.3753643035888672, 0.384033203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 14.0, 15.0, 18.0, 19.0, 23.0, 35.0, 51.0, 73.0, 106.0, 205.0, 401.0, 902.0, 2938.0, 11753.0, 64731.0, 3592995.0, 472138.0, 36813.0, 7501.0, 2026.0, 740.0, 303.0, 186.0, 78.0, 55.0, 47.0, 30.0, 20.0, 23.0, 9.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.23541259765625, -3.1192626953125, -3.00311279296875, -2.886962890625, -2.77081298828125, -2.6546630859375, -2.53851318359375, -2.42236328125, -2.30621337890625, -2.1900634765625, -2.07391357421875, -1.957763671875, -1.84161376953125, -1.7254638671875, -1.60931396484375, -1.4931640625, -1.37701416015625, -1.2608642578125, -1.14471435546875, -1.028564453125, -0.91241455078125, -0.7962646484375, -0.68011474609375, -0.56396484375, -0.44781494140625, -0.3316650390625, -0.21551513671875, -0.099365234375, 0.01678466796875, 0.1329345703125, 0.24908447265625, 0.365234375, 0.48138427734375, 0.5975341796875, 0.71368408203125, 0.829833984375, 0.94598388671875, 1.0621337890625, 1.17828369140625, 1.29443359375, 1.41058349609375, 1.5267333984375, 1.64288330078125, 1.759033203125, 1.87518310546875, 1.9913330078125, 2.10748291015625, 2.2236328125, 2.33978271484375, 2.4559326171875, 2.57208251953125, 2.688232421875, 2.80438232421875, 2.9205322265625, 3.03668212890625, 3.15283203125, 3.26898193359375, 3.3851318359375, 3.50128173828125, 3.617431640625, 3.73358154296875, 3.8497314453125, 3.96588134765625, 4.08203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 2.0, 14.0, 22.0, 38.0, 48.0, 79.0, 159.0, 569.0, 2540.0, 327.0, 116.0, 51.0, 38.0, 21.0, 19.0, 8.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.857391357421875, -0.83441162109375, -0.811431884765625, -0.7884521484375, -0.765472412109375, -0.74249267578125, -0.719512939453125, -0.696533203125, -0.673553466796875, -0.65057373046875, -0.627593994140625, -0.6046142578125, -0.581634521484375, -0.55865478515625, -0.535675048828125, -0.5126953125, -0.489715576171875, -0.46673583984375, -0.443756103515625, -0.4207763671875, -0.397796630859375, -0.37481689453125, -0.351837158203125, -0.328857421875, -0.305877685546875, -0.28289794921875, -0.259918212890625, -0.2369384765625, -0.213958740234375, -0.19097900390625, -0.167999267578125, -0.14501953125, -0.122039794921875, -0.09906005859375, -0.076080322265625, -0.0531005859375, -0.030120849609375, -0.00714111328125, 0.015838623046875, 0.038818359375, 0.061798095703125, 0.08477783203125, 0.107757568359375, 0.1307373046875, 0.153717041015625, 0.17669677734375, 0.199676513671875, 0.22265625, 0.245635986328125, 0.26861572265625, 0.291595458984375, 0.3145751953125, 0.337554931640625, 0.36053466796875, 0.383514404296875, 0.406494140625, 0.429473876953125, 0.45245361328125, 0.475433349609375, 0.4984130859375, 0.521392822265625, 0.54437255859375, 0.567352294921875, 0.59033203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 16.0, 23.0, 29.0, 41.0, 55.0, 72.0, 97.0, 127.0, 139.0, 103.0, 93.0, 59.0, 45.0, 25.0, 15.0, 10.0, 15.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.180996894836426, -2.100832939147949, -2.0206689834594727, -1.9405051469802856, -1.860341191291809, -1.7801772356033325, -1.7000133991241455, -1.619849443435669, -1.5396854877471924, -1.4595215320587158, -1.3793575763702393, -1.2991937398910522, -1.2190297842025757, -1.1388658285140991, -1.058701992034912, -0.9785380363464355, -0.898374080657959, -0.8182101249694824, -0.7380462288856506, -0.6578823328018188, -0.5777183771133423, -0.4975544512271881, -0.41739052534103394, -0.33722662925720215, -0.2570626735687256, -0.1768987476825714, -0.09673482179641724, -0.01657089591026306, 0.06359302997589111, 0.1437569558620453, 0.22392088174819946, 0.30408477783203125, 0.3842487335205078, 0.464412659406662, 0.5445765852928162, 0.624740481376648, 0.7049044370651245, 0.7850683927536011, 0.8652322888374329, 0.9453961849212646, 1.0255601406097412, 1.1057240962982178, 1.1858880519866943, 1.2660518884658813, 1.346215844154358, 1.4263797998428345, 1.5065436363220215, 1.586707592010498, 1.6668715476989746, 1.7470355033874512, 1.8271994590759277, 1.9073632955551147, 1.9875272512435913, 2.0676910877227783, 2.147855043411255, 2.2280189990997314, 2.308182954788208, 2.3883469104766846, 2.468510866165161, 2.5486748218536377, 2.628838539123535, 2.7090024948120117, 2.7891664505004883, 2.869330406188965, 2.9494943618774414]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 10.0, 5.0, 7.0, 14.0, 10.0, 8.0, 8.0, 26.0, 24.0, 32.0, 29.0, 30.0, 33.0, 42.0, 34.0, 41.0, 42.0, 51.0, 43.0, 51.0, 37.0, 39.0, 34.0, 30.0, 31.0, 35.0, 33.0, 39.0, 24.0, 25.0, 21.0, 18.0, 17.0, 8.0, 8.0, 11.0, 7.0, 8.0, 11.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2984263896942139, -1.255571722984314, -1.212717056274414, -1.1698623895645142, -1.1270077228546143, -1.084153175354004, -1.041298508644104, -0.9984438419342041, -0.9555891752243042, -0.9127345085144043, -0.8698798418045044, -0.8270252346992493, -0.7841705679893494, -0.7413159012794495, -0.6984612941741943, -0.6556066274642944, -0.6127519607543945, -0.5698972940444946, -0.5270426273345947, -0.4841880202293396, -0.4413333535194397, -0.3984786868095398, -0.3556240499019623, -0.31276941299438477, -0.26991474628448486, -0.22706009447574615, -0.18420544266700745, -0.14135079085826874, -0.09849613904953003, -0.05564148724079132, -0.012786835432052612, 0.030067801475524902, 0.07292258739471436, 0.11577723920345306, 0.15863189101219177, 0.20148654282093048, 0.2443411946296692, 0.2871958613395691, 0.3300504982471466, 0.3729051351547241, 0.415759801864624, 0.4586144685745239, 0.5014691352844238, 0.544323742389679, 0.5871784090995789, 0.6300330758094788, 0.6728876829147339, 0.7157423496246338, 0.7585970163345337, 0.8014516830444336, 0.8443063497543335, 0.8871609568595886, 0.9300156235694885, 0.9728702902793884, 1.0157248973846436, 1.0585795640945435, 1.1014342308044434, 1.1442888975143433, 1.1871435642242432, 1.229998230934143, 1.272852897644043, 1.3157074451446533, 1.3585621118545532, 1.4014167785644531, 1.444271445274353]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 12.0, 13.0, 29.0, 38.0, 59.0, 129.0, 243.0, 377.0, 739.0, 1610.0, 4104.0, 12809.0, 50856.0, 228725.0, 505047.0, 184652.0, 41605.0, 10893.0, 3520.0, 1412.0, 694.0, 396.0, 242.0, 120.0, 86.0, 50.0, 25.0, 21.0, 11.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.287109375, -2.216583251953125, -2.14605712890625, -2.075531005859375, -2.0050048828125, -1.934478759765625, -1.86395263671875, -1.793426513671875, -1.722900390625, -1.652374267578125, -1.58184814453125, -1.511322021484375, -1.4407958984375, -1.370269775390625, -1.29974365234375, -1.229217529296875, -1.15869140625, -1.088165283203125, -1.01763916015625, -0.947113037109375, -0.8765869140625, -0.806060791015625, -0.73553466796875, -0.665008544921875, -0.594482421875, -0.523956298828125, -0.45343017578125, -0.382904052734375, -0.3123779296875, -0.241851806640625, -0.17132568359375, -0.100799560546875, -0.0302734375, 0.040252685546875, 0.11077880859375, 0.181304931640625, 0.2518310546875, 0.322357177734375, 0.39288330078125, 0.463409423828125, 0.533935546875, 0.604461669921875, 0.67498779296875, 0.745513916015625, 0.8160400390625, 0.886566162109375, 0.95709228515625, 1.027618408203125, 1.09814453125, 1.168670654296875, 1.23919677734375, 1.309722900390625, 1.3802490234375, 1.450775146484375, 1.52130126953125, 1.591827392578125, 1.662353515625, 1.732879638671875, 1.80340576171875, 1.873931884765625, 1.9444580078125, 2.014984130859375, 2.08551025390625, 2.156036376953125, 2.2265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 11.0, 10.0, 20.0, 17.0, 29.0, 59.0, 61.0, 70.0, 72.0, 79.0, 80.0, 82.0, 79.0, 83.0, 80.0, 43.0, 44.0, 24.0, 18.0, 18.0, 6.0, 8.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1680908203125, -0.1597003936767578, -0.15130996704101562, -0.14291954040527344, -0.13452911376953125, -0.12613868713378906, -0.11774826049804688, -0.10935783386230469, -0.1009674072265625, -0.09257698059082031, -0.08418655395507812, -0.07579612731933594, -0.06740570068359375, -0.05901527404785156, -0.050624847412109375, -0.04223442077636719, -0.033843994140625, -0.025453567504882812, -0.017063140869140625, -0.008672714233398438, -0.00028228759765625, 0.008108139038085938, 0.016498565673828125, 0.024888992309570312, 0.0332794189453125, 0.04166984558105469, 0.050060272216796875, 0.05845069885253906, 0.06684112548828125, 0.07523155212402344, 0.08362197875976562, 0.09201240539550781, 0.10040283203125, 0.10879325866699219, 0.11718368530273438, 0.12557411193847656, 0.13396453857421875, 0.14235496520996094, 0.15074539184570312, 0.1591358184814453, 0.1675262451171875, 0.1759166717529297, 0.18430709838867188, 0.19269752502441406, 0.20108795166015625, 0.20947837829589844, 0.21786880493164062, 0.2262592315673828, 0.234649658203125, 0.2430400848388672, 0.2514305114746094, 0.25982093811035156, 0.26821136474609375, 0.27660179138183594, 0.2849922180175781, 0.2933826446533203, 0.3017730712890625, 0.3101634979248047, 0.3185539245605469, 0.32694435119628906, 0.33533477783203125, 0.34372520446777344, 0.3521156311035156, 0.3605060577392578, 0.368896484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 10.0, 17.0, 10.0, 15.0, 36.0, 34.0, 48.0, 49.0, 74.0, 95.0, 147.0, 193.0, 276.0, 416.0, 602.0, 1087.0, 2107.0, 4744.0, 12520.0, 39061.0, 127330.0, 361405.0, 333447.0, 111105.0, 33683.0, 11060.0, 4161.0, 1913.0, 947.0, 584.0, 387.0, 277.0, 194.0, 148.0, 87.0, 65.0, 34.0, 45.0, 26.0, 24.0, 17.0, 14.0, 13.0, 10.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.6884765625, -1.6339111328125, -1.579345703125, -1.5247802734375, -1.47021484375, -1.4156494140625, -1.361083984375, -1.3065185546875, -1.251953125, -1.1973876953125, -1.142822265625, -1.0882568359375, -1.03369140625, -0.9791259765625, -0.924560546875, -0.8699951171875, -0.8154296875, -0.7608642578125, -0.706298828125, -0.6517333984375, -0.59716796875, -0.5426025390625, -0.488037109375, -0.4334716796875, -0.37890625, -0.3243408203125, -0.269775390625, -0.2152099609375, -0.16064453125, -0.1060791015625, -0.051513671875, 0.0030517578125, 0.0576171875, 0.1121826171875, 0.166748046875, 0.2213134765625, 0.27587890625, 0.3304443359375, 0.385009765625, 0.4395751953125, 0.494140625, 0.5487060546875, 0.603271484375, 0.6578369140625, 0.71240234375, 0.7669677734375, 0.821533203125, 0.8760986328125, 0.9306640625, 0.9852294921875, 1.039794921875, 1.0943603515625, 1.14892578125, 1.2034912109375, 1.258056640625, 1.3126220703125, 1.3671875, 1.4217529296875, 1.476318359375, 1.5308837890625, 1.58544921875, 1.6400146484375, 1.694580078125, 1.7491455078125, 1.8037109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 6.0, 9.0, 7.0, 7.0, 7.0, 13.0, 17.0, 18.0, 21.0, 12.0, 25.0, 22.0, 29.0, 31.0, 22.0, 39.0, 31.0, 41.0, 38.0, 39.0, 33.0, 47.0, 48.0, 39.0, 42.0, 39.0, 33.0, 36.0, 39.0, 33.0, 28.0, 26.0, 18.0, 14.0, 17.0, 12.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.92578125, -0.8971405029296875, -0.868499755859375, -0.8398590087890625, -0.81121826171875, -0.7825775146484375, -0.753936767578125, -0.7252960205078125, -0.6966552734375, -0.6680145263671875, -0.639373779296875, -0.6107330322265625, -0.58209228515625, -0.5534515380859375, -0.524810791015625, -0.4961700439453125, -0.467529296875, -0.4388885498046875, -0.410247802734375, -0.3816070556640625, -0.35296630859375, -0.3243255615234375, -0.295684814453125, -0.2670440673828125, -0.2384033203125, -0.2097625732421875, -0.181121826171875, -0.1524810791015625, -0.12384033203125, -0.0951995849609375, -0.066558837890625, -0.0379180908203125, -0.00927734375, 0.0193634033203125, 0.048004150390625, 0.0766448974609375, 0.10528564453125, 0.1339263916015625, 0.162567138671875, 0.1912078857421875, 0.2198486328125, 0.2484893798828125, 0.277130126953125, 0.3057708740234375, 0.33441162109375, 0.3630523681640625, 0.391693115234375, 0.4203338623046875, 0.448974609375, 0.4776153564453125, 0.506256103515625, 0.5348968505859375, 0.56353759765625, 0.5921783447265625, 0.620819091796875, 0.6494598388671875, 0.6781005859375, 0.7067413330078125, 0.735382080078125, 0.7640228271484375, 0.79266357421875, 0.8213043212890625, 0.849945068359375, 0.8785858154296875, 0.9072265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 0.0, 6.0, 7.0, 8.0, 10.0, 16.0, 34.0, 38.0, 64.0, 104.0, 172.0, 258.0, 405.0, 702.0, 1103.0, 2112.0, 4704.0, 12472.0, 49156.0, 401648.0, 493118.0, 57971.0, 13809.0, 5164.0, 2341.0, 1231.0, 701.0, 429.0, 274.0, 170.0, 117.0, 78.0, 41.0, 28.0, 16.0, 11.0, 10.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.4763946533203125, -1.430328369140625, -1.3842620849609375, -1.33819580078125, -1.2921295166015625, -1.246063232421875, -1.1999969482421875, -1.1539306640625, -1.1078643798828125, -1.061798095703125, -1.0157318115234375, -0.96966552734375, -0.9235992431640625, -0.877532958984375, -0.8314666748046875, -0.785400390625, -0.7393341064453125, -0.693267822265625, -0.6472015380859375, -0.60113525390625, -0.5550689697265625, -0.509002685546875, -0.4629364013671875, -0.4168701171875, -0.3708038330078125, -0.324737548828125, -0.2786712646484375, -0.23260498046875, -0.1865386962890625, -0.140472412109375, -0.0944061279296875, -0.04833984375, -0.0022735595703125, 0.043792724609375, 0.0898590087890625, 0.13592529296875, 0.1819915771484375, 0.228057861328125, 0.2741241455078125, 0.3201904296875, 0.3662567138671875, 0.412322998046875, 0.4583892822265625, 0.50445556640625, 0.5505218505859375, 0.596588134765625, 0.6426544189453125, 0.688720703125, 0.7347869873046875, 0.780853271484375, 0.8269195556640625, 0.87298583984375, 0.9190521240234375, 0.965118408203125, 1.0111846923828125, 1.0572509765625, 1.1033172607421875, 1.149383544921875, 1.1954498291015625, 1.24151611328125, 1.2875823974609375, 1.333648681640625, 1.3797149658203125, 1.42578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 8.0, 11.0, 7.0, 24.0, 21.0, 45.0, 72.0, 70.0, 120.0, 100.0, 106.0, 105.0, 92.0, 72.0, 56.0, 30.0, 16.0, 10.0, 5.0, 8.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.000335693359375, -0.000327378511428833, -0.000319063663482666, -0.000310748815536499, -0.00030243396759033203, -0.00029411911964416504, -0.00028580427169799805, -0.00027748942375183105, -0.00026917457580566406, -0.00026085972785949707, -0.0002525448799133301, -0.0002442300319671631, -0.0002359151840209961, -0.0002276003360748291, -0.0002192854881286621, -0.00021097064018249512, -0.00020265579223632812, -0.00019434094429016113, -0.00018602609634399414, -0.00017771124839782715, -0.00016939640045166016, -0.00016108155250549316, -0.00015276670455932617, -0.00014445185661315918, -0.0001361370086669922, -0.0001278221607208252, -0.0001195073127746582, -0.00011119246482849121, -0.00010287761688232422, -9.456276893615723e-05, -8.624792098999023e-05, -7.793307304382324e-05, -6.961822509765625e-05, -6.130337715148926e-05, -5.2988529205322266e-05, -4.4673681259155273e-05, -3.635883331298828e-05, -2.804398536682129e-05, -1.9729137420654297e-05, -1.1414289474487305e-05, -3.0994415283203125e-06, 5.21540641784668e-06, 1.3530254364013672e-05, 2.1845102310180664e-05, 3.0159950256347656e-05, 3.847479820251465e-05, 4.678964614868164e-05, 5.510449409484863e-05, 6.341934204101562e-05, 7.173418998718262e-05, 8.004903793334961e-05, 8.83638858795166e-05, 9.66787338256836e-05, 0.00010499358177185059, 0.00011330842971801758, 0.00012162327766418457, 0.00012993812561035156, 0.00013825297355651855, 0.00014656782150268555, 0.00015488266944885254, 0.00016319751739501953, 0.00017151236534118652, 0.00017982721328735352, 0.0001881420612335205, 0.0001964569091796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 9.0, 9.0, 22.0, 21.0, 21.0, 36.0, 54.0, 100.0, 109.0, 198.0, 348.0, 566.0, 994.0, 2343.0, 5935.0, 18309.0, 83409.0, 687815.0, 201980.0, 30548.0, 9105.0, 3343.0, 1447.0, 694.0, 415.0, 237.0, 140.0, 101.0, 65.0, 34.0, 39.0, 13.0, 19.0, 12.0, 12.0, 13.0, 6.0, 4.0, 7.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.884765625, -1.83197021484375, -1.7791748046875, -1.72637939453125, -1.673583984375, -1.62078857421875, -1.5679931640625, -1.51519775390625, -1.46240234375, -1.40960693359375, -1.3568115234375, -1.30401611328125, -1.251220703125, -1.19842529296875, -1.1456298828125, -1.09283447265625, -1.0400390625, -0.98724365234375, -0.9344482421875, -0.88165283203125, -0.828857421875, -0.77606201171875, -0.7232666015625, -0.67047119140625, -0.61767578125, -0.56488037109375, -0.5120849609375, -0.45928955078125, -0.406494140625, -0.35369873046875, -0.3009033203125, -0.24810791015625, -0.1953125, -0.14251708984375, -0.0897216796875, -0.03692626953125, 0.015869140625, 0.06866455078125, 0.1214599609375, 0.17425537109375, 0.22705078125, 0.27984619140625, 0.3326416015625, 0.38543701171875, 0.438232421875, 0.49102783203125, 0.5438232421875, 0.59661865234375, 0.6494140625, 0.70220947265625, 0.7550048828125, 0.80780029296875, 0.860595703125, 0.91339111328125, 0.9661865234375, 1.01898193359375, 1.07177734375, 1.12457275390625, 1.1773681640625, 1.23016357421875, 1.282958984375, 1.33575439453125, 1.3885498046875, 1.44134521484375, 1.494140625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 8.0, 9.0, 14.0, 14.0, 25.0, 31.0, 38.0, 49.0, 82.0, 103.0, 142.0, 128.0, 96.0, 72.0, 45.0, 35.0, 26.0, 17.0, 16.0, 9.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94775390625, -0.9227676391601562, -0.8977813720703125, -0.8727951049804688, -0.847808837890625, -0.8228225708007812, -0.7978363037109375, -0.7728500366210938, -0.74786376953125, -0.7228775024414062, -0.6978912353515625, -0.6729049682617188, -0.647918701171875, -0.6229324340820312, -0.5979461669921875, -0.5729598999023438, -0.5479736328125, -0.5229873657226562, -0.4980010986328125, -0.47301483154296875, -0.448028564453125, -0.42304229736328125, -0.3980560302734375, -0.37306976318359375, -0.34808349609375, -0.32309722900390625, -0.2981109619140625, -0.27312469482421875, -0.248138427734375, -0.22315216064453125, -0.1981658935546875, -0.17317962646484375, -0.148193359375, -0.12320709228515625, -0.0982208251953125, -0.07323455810546875, -0.048248291015625, -0.02326202392578125, 0.0017242431640625, 0.02671051025390625, 0.05169677734375, 0.07668304443359375, 0.1016693115234375, 0.12665557861328125, 0.151641845703125, 0.17662811279296875, 0.2016143798828125, 0.22660064697265625, 0.2515869140625, 0.27657318115234375, 0.3015594482421875, 0.32654571533203125, 0.351531982421875, 0.37651824951171875, 0.4015045166015625, 0.42649078369140625, 0.45147705078125, 0.47646331787109375, 0.5014495849609375, 0.5264358520507812, 0.551422119140625, 0.5764083862304688, 0.6013946533203125, 0.6263809204101562, 0.6513671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 14.0, 4.0, 16.0, 27.0, 54.0, 74.0, 143.0, 175.0, 186.0, 134.0, 88.0, 41.0, 17.0, 20.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.798914909362793, -9.282971382141113, -8.767027854919434, -8.251083374023438, -7.735139846801758, -7.219196319580078, -6.703252792358398, -6.187309265136719, -5.671365261077881, -5.155421733856201, -4.639477729797363, -4.123534202575684, -3.607590436935425, -3.091646671295166, -2.5757031440734863, -2.0597593784332275, -1.5438156127929688, -1.02787184715271, -0.5119282007217407, 0.004015445709228516, 0.5199592113494873, 1.035902976989746, 1.5518465042114258, 2.0677902698516846, 2.5837340354919434, 3.099677801132202, 3.615621566772461, 4.131565093994141, 4.64750862121582, 5.163452625274658, 5.679396152496338, 6.195340156555176, 6.711284637451172, 7.227228164672852, 7.7431721687316895, 8.259115219116211, 8.775059700012207, 9.291003227233887, 9.806946754455566, 10.322890281677246, 10.838834762573242, 11.354778289794922, 11.870721817016602, 12.386665344238281, 12.902609825134277, 13.418553352355957, 13.934496879577637, 14.450440406799316, 14.966383934020996, 15.482327461242676, 15.998270988464355, 16.51421546936035, 17.03015899658203, 17.54610252380371, 18.06204605102539, 18.57798957824707, 19.09393310546875, 19.60987663269043, 20.12582015991211, 20.64176368713379, 21.15770721435547, 21.67365264892578, 22.189594268798828, 22.70553970336914, 23.22148323059082]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 8.0, 6.0, 12.0, 17.0, 17.0, 16.0, 9.0, 24.0, 28.0, 30.0, 34.0, 32.0, 40.0, 59.0, 35.0, 48.0, 37.0, 52.0, 52.0, 33.0, 46.0, 48.0, 48.0, 44.0, 39.0, 25.0, 24.0, 37.0, 12.0, 16.0, 14.0, 18.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2116546630859375, -6.970138072967529, -6.728621482849121, -6.487104892730713, -6.245588302612305, -6.0040717124938965, -5.762555122375488, -5.521039009094238, -5.279521942138672, -5.038005352020264, -4.7964887619018555, -4.554972171783447, -4.313455581665039, -4.071938991546631, -3.8304226398468018, -3.5889060497283936, -3.3473896980285645, -3.1058731079101562, -2.864356517791748, -2.62283992767334, -2.3813233375549316, -2.1398067474365234, -1.8982903957366943, -1.6567738056182861, -1.415257215499878, -1.1737406253814697, -0.9322240948677063, -0.6907075643539429, -0.44919097423553467, -0.20767438411712646, 0.03384208679199219, 0.2753586769104004, 0.5168752670288086, 0.7583918571472168, 0.9999083876609802, 1.2414249181747437, 1.4829415082931519, 1.72445809841156, 1.9659745693206787, 2.207491159439087, 2.449007749557495, 2.6905243396759033, 2.9320409297943115, 3.1735572814941406, 3.415073871612549, 3.656590461730957, 3.8981070518493652, 4.139623641967773, 4.381140232086182, 4.62265682220459, 4.864173412322998, 5.105690002441406, 5.3472065925598145, 5.588723182678223, 5.830239295959473, 6.071756362915039, 6.313272476196289, 6.554789066314697, 6.7963056564331055, 7.037822246551514, 7.279338836669922, 7.52085542678833, 7.762372016906738, 8.003888130187988, 8.245405197143555]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 12.0, 22.0, 23.0, 54.0, 85.0, 146.0, 310.0, 683.0, 1531.0, 4333.0, 15109.0, 91364.0, 3895316.0, 155285.0, 20537.0, 5584.0, 2024.0, 818.0, 431.0, 236.0, 127.0, 77.0, 62.0, 22.0, 22.0, 16.0, 15.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80078125, -1.70892333984375, -1.6170654296875, -1.52520751953125, -1.433349609375, -1.34149169921875, -1.2496337890625, -1.15777587890625, -1.06591796875, -0.97406005859375, -0.8822021484375, -0.79034423828125, -0.698486328125, -0.60662841796875, -0.5147705078125, -0.42291259765625, -0.3310546875, -0.23919677734375, -0.1473388671875, -0.05548095703125, 0.036376953125, 0.12823486328125, 0.2200927734375, 0.31195068359375, 0.40380859375, 0.49566650390625, 0.5875244140625, 0.67938232421875, 0.771240234375, 0.86309814453125, 0.9549560546875, 1.04681396484375, 1.138671875, 1.23052978515625, 1.3223876953125, 1.41424560546875, 1.506103515625, 1.59796142578125, 1.6898193359375, 1.78167724609375, 1.87353515625, 1.96539306640625, 2.0572509765625, 2.14910888671875, 2.240966796875, 2.33282470703125, 2.4246826171875, 2.51654052734375, 2.6083984375, 2.70025634765625, 2.7921142578125, 2.88397216796875, 2.975830078125, 3.06768798828125, 3.1595458984375, 3.25140380859375, 3.34326171875, 3.43511962890625, 3.5269775390625, 3.61883544921875, 3.710693359375, 3.80255126953125, 3.8944091796875, 3.98626708984375, 4.078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 19.0, 18.0, 27.0, 43.0, 50.0, 66.0, 59.0, 63.0, 70.0, 69.0, 81.0, 65.0, 74.0, 52.0, 60.0, 45.0, 35.0, 29.0, 24.0, 14.0, 9.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.17827415466308594, -0.16892623901367188, -0.1595783233642578, -0.15023040771484375, -0.1408824920654297, -0.13153457641601562, -0.12218666076660156, -0.1128387451171875, -0.10349082946777344, -0.09414291381835938, -0.08479499816894531, -0.07544708251953125, -0.06609916687011719, -0.056751251220703125, -0.04740333557128906, -0.038055419921875, -0.028707504272460938, -0.019359588623046875, -0.010011672973632812, -0.00066375732421875, 0.008684158325195312, 0.018032073974609375, 0.027379989624023438, 0.0367279052734375, 0.04607582092285156, 0.055423736572265625, 0.06477165222167969, 0.07411956787109375, 0.08346748352050781, 0.09281539916992188, 0.10216331481933594, 0.11151123046875, 0.12085914611816406, 0.13020706176757812, 0.1395549774169922, 0.14890289306640625, 0.1582508087158203, 0.16759872436523438, 0.17694664001464844, 0.1862945556640625, 0.19564247131347656, 0.20499038696289062, 0.2143383026123047, 0.22368621826171875, 0.2330341339111328, 0.24238204956054688, 0.25172996520996094, 0.261077880859375, 0.27042579650878906, 0.2797737121582031, 0.2891216278076172, 0.29846954345703125, 0.3078174591064453, 0.3171653747558594, 0.32651329040527344, 0.3358612060546875, 0.34520912170410156, 0.3545570373535156, 0.3639049530029297, 0.37325286865234375, 0.3826007843017578, 0.3919486999511719, 0.40129661560058594, 0.41064453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 13.0, 8.0, 16.0, 33.0, 35.0, 61.0, 73.0, 133.0, 170.0, 258.0, 491.0, 857.0, 1471.0, 2921.0, 5962.0, 13937.0, 36696.0, 130729.0, 3108127.0, 754869.0, 89494.0, 27615.0, 10639.0, 4716.0, 2243.0, 1182.0, 637.0, 333.0, 204.0, 133.0, 79.0, 49.0, 26.0, 21.0, 18.0, 11.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.4970703125, -1.443359375, -1.3896484375, -1.3359375, -1.2822265625, -1.228515625, -1.1748046875, -1.12109375, -1.0673828125, -1.013671875, -0.9599609375, -0.90625, -0.8525390625, -0.798828125, -0.7451171875, -0.69140625, -0.6376953125, -0.583984375, -0.5302734375, -0.4765625, -0.4228515625, -0.369140625, -0.3154296875, -0.26171875, -0.2080078125, -0.154296875, -0.1005859375, -0.046875, 0.0068359375, 0.060546875, 0.1142578125, 0.16796875, 0.2216796875, 0.275390625, 0.3291015625, 0.3828125, 0.4365234375, 0.490234375, 0.5439453125, 0.59765625, 0.6513671875, 0.705078125, 0.7587890625, 0.8125, 0.8662109375, 0.919921875, 0.9736328125, 1.02734375, 1.0810546875, 1.134765625, 1.1884765625, 1.2421875, 1.2958984375, 1.349609375, 1.4033203125, 1.45703125, 1.5107421875, 1.564453125, 1.6181640625, 1.671875, 1.7255859375, 1.779296875, 1.8330078125, 1.88671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 3.0, 7.0, 10.0, 11.0, 7.0, 30.0, 31.0, 44.0, 50.0, 78.0, 133.0, 329.0, 1690.0, 1021.0, 266.0, 122.0, 75.0, 43.0, 33.0, 22.0, 17.0, 15.0, 10.0, 3.0, 5.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70947265625, -0.6929473876953125, -0.676422119140625, -0.6598968505859375, -0.64337158203125, -0.6268463134765625, -0.610321044921875, -0.5937957763671875, -0.5772705078125, -0.5607452392578125, -0.544219970703125, -0.5276947021484375, -0.51116943359375, -0.4946441650390625, -0.478118896484375, -0.4615936279296875, -0.445068359375, -0.4285430908203125, -0.412017822265625, -0.3954925537109375, -0.37896728515625, -0.3624420166015625, -0.345916748046875, -0.3293914794921875, -0.3128662109375, -0.2963409423828125, -0.279815673828125, -0.2632904052734375, -0.24676513671875, -0.2302398681640625, -0.213714599609375, -0.1971893310546875, -0.1806640625, -0.1641387939453125, -0.147613525390625, -0.1310882568359375, -0.11456298828125, -0.0980377197265625, -0.081512451171875, -0.0649871826171875, -0.0484619140625, -0.0319366455078125, -0.015411376953125, 0.0011138916015625, 0.01763916015625, 0.0341644287109375, 0.050689697265625, 0.0672149658203125, 0.083740234375, 0.1002655029296875, 0.116790771484375, 0.1333160400390625, 0.14984130859375, 0.1663665771484375, 0.182891845703125, 0.1994171142578125, 0.2159423828125, 0.2324676513671875, 0.248992919921875, 0.2655181884765625, 0.28204345703125, 0.2985687255859375, 0.315093994140625, 0.3316192626953125, 0.34814453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 11.0, 26.0, 38.0, 74.0, 112.0, 174.0, 191.0, 153.0, 101.0, 48.0, 27.0, 13.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412475347518921, -3.2878854274749756, -3.1632957458496094, -3.038705825805664, -2.9141159057617188, -2.7895259857177734, -2.6649363040924072, -2.540346384048462, -2.4157567024230957, -2.2911667823791504, -2.166577100753784, -2.041987180709839, -1.9173972606658936, -1.7928074598312378, -1.668217658996582, -1.5436277389526367, -1.4190378189086914, -1.2944480180740356, -1.1698580980300903, -1.0452682971954346, -0.920678436756134, -0.7960885763168335, -0.6714987754821777, -0.5469089150428772, -0.42231905460357666, -0.2977291941642761, -0.17313936352729797, -0.048549532890319824, 0.07604032754898071, 0.20063018798828125, 0.325219988822937, 0.44980984926223755, 0.574399471282959, 0.6989893317222595, 0.8235791921615601, 0.9481689929962158, 1.0727589130401611, 1.197348713874817, 1.3219385147094727, 1.446528434753418, 1.5711182355880737, 1.6957080364227295, 1.8202979564666748, 1.9448877573013306, 2.0694775581359863, 2.1940674781799316, 2.318657398223877, 2.443247079849243, 2.5678369998931885, 2.692426919937134, 2.8170166015625, 2.9416065216064453, 3.0661964416503906, 3.190786361694336, 3.315376043319702, 3.4399659633636475, 3.5645556449890137, 3.689145565032959, 3.813735246658325, 3.9383251667022705, 4.062914848327637, 4.187504768371582, 4.312094688415527, 4.436684608459473, 4.561274528503418]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 9.0, 5.0, 14.0, 10.0, 12.0, 23.0, 17.0, 20.0, 26.0, 31.0, 46.0, 37.0, 45.0, 39.0, 50.0, 59.0, 52.0, 45.0, 53.0, 43.0, 48.0, 36.0, 44.0, 49.0, 31.0, 26.0, 16.0, 21.0, 17.0, 12.0, 9.0, 10.0, 9.0, 8.0, 9.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6343889236450195, -1.5829471349716187, -1.5315053462982178, -1.4800636768341064, -1.4286218881607056, -1.3771800994873047, -1.3257383108139038, -1.274296522140503, -1.2228548526763916, -1.1714130640029907, -1.1199712753295898, -1.0685296058654785, -1.0170878171920776, -0.9656460285186768, -0.9142042398452759, -0.862762451171875, -0.8113206624984741, -0.7598788738250732, -0.7084371447563171, -0.6569953560829163, -0.6055536270141602, -0.5541118383407593, -0.5026700496673584, -0.4512282907962799, -0.3997865319252014, -0.3483447730541229, -0.29690301418304443, -0.24546122550964355, -0.19401946663856506, -0.14257770776748657, -0.0911359190940857, -0.0396941602230072, 0.01174771785736084, 0.06318948417901993, 0.11463125050067902, 0.1660730242729187, 0.2175147831439972, 0.2689565420150757, 0.32039833068847656, 0.37184008955955505, 0.42328184843063354, 0.47472360730171204, 0.5261653661727905, 0.5776071548461914, 0.6290489435195923, 0.6804906725883484, 0.7319324612617493, 0.7833741903305054, 0.8348159790039062, 0.8862577676773071, 0.9376994967460632, 0.9891412854194641, 1.0405830144882202, 1.092024803161621, 1.143466591835022, 1.1949083805084229, 1.2463500499725342, 1.297791838645935, 1.349233627319336, 1.4006752967834473, 1.4521170854568481, 1.503558874130249, 1.55500066280365, 1.6064424514770508, 1.6578842401504517]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 3.0, 11.0, 11.0, 14.0, 24.0, 32.0, 36.0, 44.0, 79.0, 99.0, 145.0, 210.0, 354.0, 480.0, 800.0, 1403.0, 2416.0, 4661.0, 8898.0, 18269.0, 37962.0, 78779.0, 160823.0, 283053.0, 224700.0, 115025.0, 55779.0, 26844.0, 12895.0, 6407.0, 3437.0, 1896.0, 1085.0, 670.0, 339.0, 271.0, 216.0, 117.0, 76.0, 54.0, 30.0, 27.0, 22.0, 12.0, 15.0, 4.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.908203125, -0.877685546875, -0.84716796875, -0.816650390625, -0.7861328125, -0.755615234375, -0.72509765625, -0.694580078125, -0.6640625, -0.633544921875, -0.60302734375, -0.572509765625, -0.5419921875, -0.511474609375, -0.48095703125, -0.450439453125, -0.419921875, -0.389404296875, -0.35888671875, -0.328369140625, -0.2978515625, -0.267333984375, -0.23681640625, -0.206298828125, -0.17578125, -0.145263671875, -0.11474609375, -0.084228515625, -0.0537109375, -0.023193359375, 0.00732421875, 0.037841796875, 0.068359375, 0.098876953125, 0.12939453125, 0.159912109375, 0.1904296875, 0.220947265625, 0.25146484375, 0.281982421875, 0.3125, 0.343017578125, 0.37353515625, 0.404052734375, 0.4345703125, 0.465087890625, 0.49560546875, 0.526123046875, 0.556640625, 0.587158203125, 0.61767578125, 0.648193359375, 0.6787109375, 0.709228515625, 0.73974609375, 0.770263671875, 0.80078125, 0.831298828125, 0.86181640625, 0.892333984375, 0.9228515625, 0.953369140625, 0.98388671875, 1.014404296875, 1.044921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 13.0, 15.0, 16.0, 31.0, 50.0, 44.0, 61.0, 60.0, 58.0, 64.0, 66.0, 63.0, 69.0, 66.0, 78.0, 55.0, 47.0, 36.0, 20.0, 31.0, 10.0, 14.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188232421875, -0.17934417724609375, -0.1704559326171875, -0.16156768798828125, -0.152679443359375, -0.14379119873046875, -0.1349029541015625, -0.12601470947265625, -0.11712646484375, -0.10823822021484375, -0.0993499755859375, -0.09046173095703125, -0.081573486328125, -0.07268524169921875, -0.0637969970703125, -0.05490875244140625, -0.0460205078125, -0.03713226318359375, -0.0282440185546875, -0.01935577392578125, -0.010467529296875, -0.00157928466796875, 0.0073089599609375, 0.01619720458984375, 0.02508544921875, 0.03397369384765625, 0.0428619384765625, 0.05175018310546875, 0.060638427734375, 0.06952667236328125, 0.0784149169921875, 0.08730316162109375, 0.09619140625, 0.10507965087890625, 0.1139678955078125, 0.12285614013671875, 0.131744384765625, 0.14063262939453125, 0.1495208740234375, 0.15840911865234375, 0.16729736328125, 0.17618560791015625, 0.1850738525390625, 0.19396209716796875, 0.202850341796875, 0.21173858642578125, 0.2206268310546875, 0.22951507568359375, 0.2384033203125, 0.24729156494140625, 0.2561798095703125, 0.26506805419921875, 0.273956298828125, 0.28284454345703125, 0.2917327880859375, 0.30062103271484375, 0.30950927734375, 0.31839752197265625, 0.3272857666015625, 0.33617401123046875, 0.345062255859375, 0.35395050048828125, 0.3628387451171875, 0.37172698974609375, 0.380615234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 11.0, 13.0, 17.0, 19.0, 43.0, 35.0, 58.0, 91.0, 144.0, 206.0, 375.0, 720.0, 1514.0, 4095.0, 14267.0, 63623.0, 293499.0, 490684.0, 137934.0, 28970.0, 7313.0, 2460.0, 1015.0, 568.0, 259.0, 191.0, 117.0, 107.0, 54.0, 35.0, 29.0, 18.0, 14.0, 13.0, 7.0, 3.0, 7.0, 9.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.115234375, -2.0552215576171875, -1.995208740234375, -1.9351959228515625, -1.87518310546875, -1.8151702880859375, -1.755157470703125, -1.6951446533203125, -1.6351318359375, -1.5751190185546875, -1.515106201171875, -1.4550933837890625, -1.39508056640625, -1.3350677490234375, -1.275054931640625, -1.2150421142578125, -1.155029296875, -1.0950164794921875, -1.035003662109375, -0.9749908447265625, -0.91497802734375, -0.8549652099609375, -0.794952392578125, -0.7349395751953125, -0.6749267578125, -0.6149139404296875, -0.554901123046875, -0.4948883056640625, -0.43487548828125, -0.3748626708984375, -0.314849853515625, -0.2548370361328125, -0.19482421875, -0.1348114013671875, -0.074798583984375, -0.0147857666015625, 0.04522705078125, 0.1052398681640625, 0.165252685546875, 0.2252655029296875, 0.2852783203125, 0.3452911376953125, 0.405303955078125, 0.4653167724609375, 0.52532958984375, 0.5853424072265625, 0.645355224609375, 0.7053680419921875, 0.765380859375, 0.8253936767578125, 0.885406494140625, 0.9454193115234375, 1.00543212890625, 1.0654449462890625, 1.125457763671875, 1.1854705810546875, 1.2454833984375, 1.3054962158203125, 1.365509033203125, 1.4255218505859375, 1.48553466796875, 1.5455474853515625, 1.605560302734375, 1.6655731201171875, 1.7255859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 9.0, 7.0, 12.0, 17.0, 6.0, 18.0, 22.0, 25.0, 25.0, 28.0, 38.0, 25.0, 42.0, 41.0, 44.0, 42.0, 46.0, 49.0, 53.0, 45.0, 46.0, 37.0, 39.0, 37.0, 40.0, 34.0, 23.0, 22.0, 19.0, 24.0, 15.0, 13.0, 9.0, 10.0, 7.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.1923828125, -1.1587066650390625, -1.125030517578125, -1.0913543701171875, -1.05767822265625, -1.0240020751953125, -0.990325927734375, -0.9566497802734375, -0.9229736328125, -0.8892974853515625, -0.855621337890625, -0.8219451904296875, -0.78826904296875, -0.7545928955078125, -0.720916748046875, -0.6872406005859375, -0.653564453125, -0.6198883056640625, -0.586212158203125, -0.5525360107421875, -0.51885986328125, -0.4851837158203125, -0.451507568359375, -0.4178314208984375, -0.3841552734375, -0.3504791259765625, -0.316802978515625, -0.2831268310546875, -0.24945068359375, -0.2157745361328125, -0.182098388671875, -0.1484222412109375, -0.11474609375, -0.0810699462890625, -0.047393798828125, -0.0137176513671875, 0.01995849609375, 0.0536346435546875, 0.087310791015625, 0.1209869384765625, 0.1546630859375, 0.1883392333984375, 0.222015380859375, 0.2556915283203125, 0.28936767578125, 0.3230438232421875, 0.356719970703125, 0.3903961181640625, 0.424072265625, 0.4577484130859375, 0.491424560546875, 0.5251007080078125, 0.55877685546875, 0.5924530029296875, 0.626129150390625, 0.6598052978515625, 0.6934814453125, 0.7271575927734375, 0.760833740234375, 0.7945098876953125, 0.82818603515625, 0.8618621826171875, 0.895538330078125, 0.9292144775390625, 0.962890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 11.0, 9.0, 12.0, 21.0, 30.0, 54.0, 91.0, 212.0, 447.0, 1322.0, 4289.0, 17858.0, 239891.0, 740853.0, 33693.0, 6528.0, 1926.0, 709.0, 300.0, 135.0, 60.0, 37.0, 18.0, 13.0, 9.0, 6.0, 4.0, 4.0, 7.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6552734375, -1.5943450927734375, -1.533416748046875, -1.4724884033203125, -1.41156005859375, -1.3506317138671875, -1.289703369140625, -1.2287750244140625, -1.1678466796875, -1.1069183349609375, -1.045989990234375, -0.9850616455078125, -0.92413330078125, -0.8632049560546875, -0.802276611328125, -0.7413482666015625, -0.680419921875, -0.6194915771484375, -0.558563232421875, -0.4976348876953125, -0.43670654296875, -0.3757781982421875, -0.314849853515625, -0.2539215087890625, -0.1929931640625, -0.1320648193359375, -0.071136474609375, -0.0102081298828125, 0.05072021484375, 0.1116485595703125, 0.172576904296875, 0.2335052490234375, 0.29443359375, 0.3553619384765625, 0.416290283203125, 0.4772186279296875, 0.53814697265625, 0.5990753173828125, 0.660003662109375, 0.7209320068359375, 0.7818603515625, 0.8427886962890625, 0.903717041015625, 0.9646453857421875, 1.02557373046875, 1.0865020751953125, 1.147430419921875, 1.2083587646484375, 1.269287109375, 1.3302154541015625, 1.391143798828125, 1.4520721435546875, 1.51300048828125, 1.5739288330078125, 1.634857177734375, 1.6957855224609375, 1.7567138671875, 1.8176422119140625, 1.878570556640625, 1.9394989013671875, 2.00042724609375, 2.0613555908203125, 2.122283935546875, 2.1832122802734375, 2.244140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 10.0, 13.0, 13.0, 14.0, 15.0, 23.0, 20.0, 40.0, 40.0, 49.0, 78.0, 80.0, 87.0, 87.0, 73.0, 79.0, 58.0, 43.0, 38.0, 28.0, 21.0, 22.0, 18.0, 14.0, 8.0, 10.0, 4.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00018405914306640625, -0.00017879903316497803, -0.0001735389232635498, -0.00016827881336212158, -0.00016301870346069336, -0.00015775859355926514, -0.00015249848365783691, -0.0001472383737564087, -0.00014197826385498047, -0.00013671815395355225, -0.00013145804405212402, -0.0001261979341506958, -0.00012093782424926758, -0.00011567771434783936, -0.00011041760444641113, -0.00010515749454498291, -9.989738464355469e-05, -9.463727474212646e-05, -8.937716484069824e-05, -8.411705493927002e-05, -7.88569450378418e-05, -7.359683513641357e-05, -6.833672523498535e-05, -6.307661533355713e-05, -5.7816505432128906e-05, -5.2556395530700684e-05, -4.729628562927246e-05, -4.203617572784424e-05, -3.6776065826416016e-05, -3.151595592498779e-05, -2.625584602355957e-05, -2.0995736122131348e-05, -1.5735626220703125e-05, -1.0475516319274902e-05, -5.21540641784668e-06, 4.470348358154297e-08, 5.304813385009766e-06, 1.0564923286437988e-05, 1.582503318786621e-05, 2.1085143089294434e-05, 2.6345252990722656e-05, 3.160536289215088e-05, 3.68654727935791e-05, 4.2125582695007324e-05, 4.738569259643555e-05, 5.264580249786377e-05, 5.790591239929199e-05, 6.316602230072021e-05, 6.842613220214844e-05, 7.368624210357666e-05, 7.894635200500488e-05, 8.42064619064331e-05, 8.946657180786133e-05, 9.472668170928955e-05, 9.998679161071777e-05, 0.000105246901512146, 0.00011050701141357422, 0.00011576712131500244, 0.00012102723121643066, 0.0001262873411178589, 0.0001315474510192871, 0.00013680756092071533, 0.00014206767082214355, 0.00014732778072357178, 0.000152587890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 19.0, 18.0, 25.0, 33.0, 48.0, 75.0, 145.0, 280.0, 486.0, 1167.0, 2857.0, 8955.0, 43588.0, 741734.0, 219415.0, 20557.0, 5407.0, 1946.0, 827.0, 388.0, 207.0, 116.0, 83.0, 48.0, 27.0, 20.0, 17.0, 10.0, 7.0, 12.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6572265625, -1.6016082763671875, -1.545989990234375, -1.4903717041015625, -1.43475341796875, -1.3791351318359375, -1.323516845703125, -1.2678985595703125, -1.2122802734375, -1.1566619873046875, -1.101043701171875, -1.0454254150390625, -0.98980712890625, -0.9341888427734375, -0.878570556640625, -0.8229522705078125, -0.767333984375, -0.7117156982421875, -0.656097412109375, -0.6004791259765625, -0.54486083984375, -0.4892425537109375, -0.433624267578125, -0.3780059814453125, -0.3223876953125, -0.2667694091796875, -0.211151123046875, -0.1555328369140625, -0.09991455078125, -0.0442962646484375, 0.011322021484375, 0.0669403076171875, 0.12255859375, 0.1781768798828125, 0.233795166015625, 0.2894134521484375, 0.34503173828125, 0.4006500244140625, 0.456268310546875, 0.5118865966796875, 0.5675048828125, 0.6231231689453125, 0.678741455078125, 0.7343597412109375, 0.78997802734375, 0.8455963134765625, 0.901214599609375, 0.9568328857421875, 1.012451171875, 1.0680694580078125, 1.123687744140625, 1.1793060302734375, 1.23492431640625, 1.2905426025390625, 1.346160888671875, 1.4017791748046875, 1.4573974609375, 1.5130157470703125, 1.568634033203125, 1.6242523193359375, 1.67987060546875, 1.7354888916015625, 1.791107177734375, 1.8467254638671875, 1.90234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 9.0, 4.0, 7.0, 9.0, 14.0, 14.0, 21.0, 26.0, 69.0, 69.0, 126.0, 133.0, 161.0, 98.0, 64.0, 40.0, 24.0, 26.0, 15.0, 8.0, 11.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74072265625, -0.7165374755859375, -0.692352294921875, -0.6681671142578125, -0.64398193359375, -0.6197967529296875, -0.595611572265625, -0.5714263916015625, -0.5472412109375, -0.5230560302734375, -0.498870849609375, -0.4746856689453125, -0.45050048828125, -0.4263153076171875, -0.402130126953125, -0.3779449462890625, -0.353759765625, -0.3295745849609375, -0.305389404296875, -0.2812042236328125, -0.25701904296875, -0.2328338623046875, -0.208648681640625, -0.1844635009765625, -0.1602783203125, -0.1360931396484375, -0.111907958984375, -0.0877227783203125, -0.06353759765625, -0.0393524169921875, -0.015167236328125, 0.0090179443359375, 0.033203125, 0.0573883056640625, 0.081573486328125, 0.1057586669921875, 0.12994384765625, 0.1541290283203125, 0.178314208984375, 0.2024993896484375, 0.2266845703125, 0.2508697509765625, 0.275054931640625, 0.2992401123046875, 0.32342529296875, 0.3476104736328125, 0.371795654296875, 0.3959808349609375, 0.420166015625, 0.4443511962890625, 0.468536376953125, 0.4927215576171875, 0.51690673828125, 0.5410919189453125, 0.565277099609375, 0.5894622802734375, 0.6136474609375, 0.6378326416015625, 0.662017822265625, 0.6862030029296875, 0.71038818359375, 0.7345733642578125, 0.758758544921875, 0.7829437255859375, 0.80712890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 0.0, 6.0, 8.0, 9.0, 5.0, 26.0, 22.0, 29.0, 41.0, 49.0, 69.0, 70.0, 81.0, 83.0, 113.0, 85.0, 66.0, 47.0, 43.0, 32.0, 26.0, 16.0, 23.0, 8.0, 5.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.729748725891113, -5.523377895355225, -5.317007541656494, -5.1106367111206055, -4.904265880584717, -4.697895526885986, -4.491524696350098, -4.285154342651367, -4.0787835121154785, -3.872412919998169, -3.6660420894622803, -3.4596714973449707, -3.253300905227661, -3.0469303131103516, -2.840559482574463, -2.6341888904571533, -2.4278180599212646, -2.221447467803955, -2.0150766372680664, -1.8087060451507568, -1.6023354530334473, -1.3959647417068481, -1.189594030380249, -0.9832234382629395, -0.7768527269363403, -0.570482075214386, -0.36411139369010925, -0.15774071216583252, 0.048629939556121826, 0.25500059127807617, 0.4613713026046753, 0.6677418947219849, 0.874112606048584, 1.080483317375183, 1.2868539094924927, 1.4932246208190918, 1.6995952129364014, 1.9059659242630005, 2.1123366355895996, 2.318707227706909, 2.5250778198242188, 2.7314484119415283, 2.937819242477417, 3.1441898345947266, 3.350560426712036, 3.5569310188293457, 3.7633018493652344, 3.969672441482544, 4.176043510437012, 4.3824143409729, 4.588784694671631, 4.7951555252075195, 5.001526355743408, 5.207896709442139, 5.414267539978027, 5.620637893676758, 5.8270087242126465, 6.033379554748535, 6.239749908447266, 6.446120738983154, 6.652491569519043, 6.858861923217773, 7.065232753753662, 7.271603584289551, 7.477973937988281]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 8.0, 12.0, 6.0, 11.0, 12.0, 24.0, 16.0, 16.0, 27.0, 28.0, 31.0, 30.0, 29.0, 34.0, 44.0, 48.0, 28.0, 43.0, 58.0, 46.0, 44.0, 38.0, 32.0, 35.0, 26.0, 35.0, 24.0, 30.0, 23.0, 21.0, 23.0, 20.0, 17.0, 16.0, 7.0, 9.0, 9.0, 3.0, 3.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.264535427093506, -6.077020645141602, -5.889505386352539, -5.701990604400635, -5.5144758224487305, -5.326960563659668, -5.139445781707764, -4.951930999755859, -4.764415740966797, -4.576900959014893, -4.38938570022583, -4.201870918273926, -4.014355659484863, -3.826840877532959, -3.6393260955810547, -3.4518110752105713, -3.264296054840088, -3.0767810344696045, -2.889266014099121, -2.701751232147217, -2.5142362117767334, -2.32672119140625, -2.1392064094543457, -1.9516913890838623, -1.764176368713379, -1.5766613483428955, -1.3891464471817017, -1.2016315460205078, -1.0141165256500244, -0.8266015648841858, -0.6390866041183472, -0.4515717029571533, -0.2640562057495117, -0.0765412449836731, 0.11097371578216553, 0.29848867654800415, 0.4860036373138428, 0.6735185980796814, 0.86103355884552, 1.0485484600067139, 1.2360634803771973, 1.4235785007476807, 1.6110934019088745, 1.7986083030700684, 1.9861233234405518, 2.173638343811035, 2.3611531257629395, 2.548668146133423, 2.7361831665039062, 2.9236981868743896, 3.111213207244873, 3.2987279891967773, 3.4862430095672607, 3.673758029937744, 3.8612728118896484, 4.048788070678711, 4.236302852630615, 4.4238176345825195, 4.611332893371582, 4.798847675323486, 4.986362457275391, 5.173877716064453, 5.361392498016357, 5.548907279968262, 5.736422538757324]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 11.0, 13.0, 18.0, 29.0, 32.0, 37.0, 82.0, 142.0, 259.0, 440.0, 891.0, 2290.0, 6017.0, 18770.0, 96219.0, 3865006.0, 165933.0, 25262.0, 7388.0, 2828.0, 1192.0, 608.0, 312.0, 183.0, 105.0, 67.0, 42.0, 39.0, 22.0, 13.0, 5.0, 2.0, 10.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.49609375, -1.429931640625, -1.36376953125, -1.297607421875, -1.2314453125, -1.165283203125, -1.09912109375, -1.032958984375, -0.966796875, -0.900634765625, -0.83447265625, -0.768310546875, -0.7021484375, -0.635986328125, -0.56982421875, -0.503662109375, -0.4375, -0.371337890625, -0.30517578125, -0.239013671875, -0.1728515625, -0.106689453125, -0.04052734375, 0.025634765625, 0.091796875, 0.157958984375, 0.22412109375, 0.290283203125, 0.3564453125, 0.422607421875, 0.48876953125, 0.554931640625, 0.62109375, 0.687255859375, 0.75341796875, 0.819580078125, 0.8857421875, 0.951904296875, 1.01806640625, 1.084228515625, 1.150390625, 1.216552734375, 1.28271484375, 1.348876953125, 1.4150390625, 1.481201171875, 1.54736328125, 1.613525390625, 1.6796875, 1.745849609375, 1.81201171875, 1.878173828125, 1.9443359375, 2.010498046875, 2.07666015625, 2.142822265625, 2.208984375, 2.275146484375, 2.34130859375, 2.407470703125, 2.4736328125, 2.539794921875, 2.60595703125, 2.672119140625, 2.73828125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 13.0, 15.0, 25.0, 26.0, 33.0, 35.0, 51.0, 42.0, 59.0, 54.0, 53.0, 68.0, 60.0, 67.0, 69.0, 62.0, 39.0, 41.0, 35.0, 32.0, 30.0, 14.0, 15.0, 16.0, 5.0, 6.0, 9.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1708984375, -0.1627655029296875, -0.154632568359375, -0.1464996337890625, -0.13836669921875, -0.1302337646484375, -0.122100830078125, -0.1139678955078125, -0.1058349609375, -0.0977020263671875, -0.089569091796875, -0.0814361572265625, -0.07330322265625, -0.0651702880859375, -0.057037353515625, -0.0489044189453125, -0.040771484375, -0.0326385498046875, -0.024505615234375, -0.0163726806640625, -0.00823974609375, -0.0001068115234375, 0.008026123046875, 0.0161590576171875, 0.0242919921875, 0.0324249267578125, 0.040557861328125, 0.0486907958984375, 0.05682373046875, 0.0649566650390625, 0.073089599609375, 0.0812225341796875, 0.08935546875, 0.0974884033203125, 0.105621337890625, 0.1137542724609375, 0.12188720703125, 0.1300201416015625, 0.138153076171875, 0.1462860107421875, 0.1544189453125, 0.1625518798828125, 0.170684814453125, 0.1788177490234375, 0.18695068359375, 0.1950836181640625, 0.203216552734375, 0.2113494873046875, 0.219482421875, 0.2276153564453125, 0.235748291015625, 0.2438812255859375, 0.25201416015625, 0.2601470947265625, 0.268280029296875, 0.2764129638671875, 0.2845458984375, 0.2926788330078125, 0.300811767578125, 0.3089447021484375, 0.31707763671875, 0.3252105712890625, 0.333343505859375, 0.3414764404296875, 0.349609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 5.0, 4.0, 12.0, 13.0, 14.0, 14.0, 16.0, 34.0, 47.0, 78.0, 121.0, 229.0, 400.0, 721.0, 1498.0, 3409.0, 8780.0, 26308.0, 111197.0, 3294824.0, 646068.0, 69411.0, 18921.0, 6673.0, 2635.0, 1320.0, 598.0, 325.0, 199.0, 120.0, 75.0, 49.0, 47.0, 20.0, 17.0, 18.0, 16.0, 12.0, 10.0, 5.0, 2.0, 2.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.384002685546875, -1.33245849609375, -1.280914306640625, -1.2293701171875, -1.177825927734375, -1.12628173828125, -1.074737548828125, -1.023193359375, -0.971649169921875, -0.92010498046875, -0.868560791015625, -0.8170166015625, -0.765472412109375, -0.71392822265625, -0.662384033203125, -0.61083984375, -0.559295654296875, -0.50775146484375, -0.456207275390625, -0.4046630859375, -0.353118896484375, -0.30157470703125, -0.250030517578125, -0.198486328125, -0.146942138671875, -0.09539794921875, -0.043853759765625, 0.0076904296875, 0.059234619140625, 0.11077880859375, 0.162322998046875, 0.2138671875, 0.265411376953125, 0.31695556640625, 0.368499755859375, 0.4200439453125, 0.471588134765625, 0.52313232421875, 0.574676513671875, 0.626220703125, 0.677764892578125, 0.72930908203125, 0.780853271484375, 0.8323974609375, 0.883941650390625, 0.93548583984375, 0.987030029296875, 1.03857421875, 1.090118408203125, 1.14166259765625, 1.193206787109375, 1.2447509765625, 1.296295166015625, 1.34783935546875, 1.399383544921875, 1.450927734375, 1.502471923828125, 1.55401611328125, 1.605560302734375, 1.6571044921875, 1.708648681640625, 1.76019287109375, 1.811737060546875, 1.86328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 6.0, 8.0, 10.0, 15.0, 28.0, 55.0, 67.0, 131.0, 246.0, 857.0, 1872.0, 360.0, 145.0, 90.0, 43.0, 36.0, 26.0, 12.0, 21.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.2707061767578125, -0.255767822265625, -0.2408294677734375, -0.22589111328125, -0.2109527587890625, -0.196014404296875, -0.1810760498046875, -0.1661376953125, -0.1511993408203125, -0.136260986328125, -0.1213226318359375, -0.10638427734375, -0.0914459228515625, -0.076507568359375, -0.0615692138671875, -0.046630859375, -0.0316925048828125, -0.016754150390625, -0.0018157958984375, 0.01312255859375, 0.0280609130859375, 0.042999267578125, 0.0579376220703125, 0.0728759765625, 0.0878143310546875, 0.102752685546875, 0.1176910400390625, 0.13262939453125, 0.1475677490234375, 0.162506103515625, 0.1774444580078125, 0.1923828125, 0.2073211669921875, 0.222259521484375, 0.2371978759765625, 0.25213623046875, 0.2670745849609375, 0.282012939453125, 0.2969512939453125, 0.3118896484375, 0.3268280029296875, 0.341766357421875, 0.3567047119140625, 0.37164306640625, 0.3865814208984375, 0.401519775390625, 0.4164581298828125, 0.431396484375, 0.4463348388671875, 0.461273193359375, 0.4762115478515625, 0.49114990234375, 0.5060882568359375, 0.521026611328125, 0.5359649658203125, 0.5509033203125, 0.5658416748046875, 0.580780029296875, 0.5957183837890625, 0.61065673828125, 0.6255950927734375, 0.640533447265625, 0.6554718017578125, 0.67041015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 7.0, 12.0, 33.0, 79.0, 140.0, 178.0, 195.0, 140.0, 101.0, 60.0, 25.0, 19.0, 4.0, 4.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115701913833618, -2.996549129486084, -2.8773961067199707, -2.7582433223724365, -2.6390905380249023, -2.519937753677368, -2.400784969329834, -2.2816319465637207, -2.1624791622161865, -2.0433263778686523, -1.9241734743118286, -1.8050205707550049, -1.6858677864074707, -1.5667150020599365, -1.4475620985031128, -1.328409194946289, -1.2092564105987549, -1.0901036262512207, -0.970950722694397, -0.851797878742218, -0.7326450347900391, -0.6134921908378601, -0.49433934688568115, -0.3751865029335022, -0.25603365898132324, -0.1368808150291443, -0.017727971076965332, 0.10142487287521362, 0.22057771682739258, 0.33973056077957153, 0.4588834047317505, 0.5780362486839294, 0.6971893310546875, 0.8163421750068665, 0.9354950189590454, 1.0546479225158691, 1.1738007068634033, 1.2929534912109375, 1.4121063947677612, 1.531259298324585, 1.6504120826721191, 1.7695648670196533, 1.888717770576477, 2.007870674133301, 2.127023458480835, 2.246176242828369, 2.3653292655944824, 2.4844820499420166, 2.603634834289551, 2.722787618637085, 2.841940402984619, 2.9610934257507324, 3.0802462100982666, 3.199398994445801, 3.318552017211914, 3.4377048015594482, 3.5568575859069824, 3.6760103702545166, 3.795163154602051, 3.914316177368164, 4.033469200134277, 4.152621746063232, 4.271774768829346, 4.390927314758301, 4.510080337524414]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 6.0, 10.0, 6.0, 13.0, 9.0, 17.0, 16.0, 19.0, 20.0, 30.0, 29.0, 29.0, 34.0, 22.0, 30.0, 28.0, 34.0, 36.0, 30.0, 39.0, 44.0, 39.0, 33.0, 39.0, 35.0, 33.0, 19.0, 30.0, 30.0, 26.0, 27.0, 32.0, 19.0, 21.0, 17.0, 21.0, 11.0, 9.0, 10.0, 5.0, 10.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.083393931388855, -1.050696611404419, -1.0179994106292725, -0.9853021502494812, -0.9526048898696899, -0.9199076294898987, -0.8872103691101074, -0.8545131087303162, -0.8218158483505249, -0.7891185879707336, -0.7564213275909424, -0.7237240672111511, -0.6910268068313599, -0.6583295464515686, -0.6256322860717773, -0.5929350256919861, -0.5602377653121948, -0.5275405049324036, -0.4948432445526123, -0.46214598417282104, -0.4294487237930298, -0.3967514634132385, -0.36405420303344727, -0.331356942653656, -0.29865968227386475, -0.2659624218940735, -0.23326516151428223, -0.20056790113449097, -0.1678706407546997, -0.13517338037490845, -0.10247611999511719, -0.06977885961532593, -0.03708148002624512, -0.004384219646453857, 0.028313040733337402, 0.06101030111312866, 0.09370756149291992, 0.12640482187271118, 0.15910208225250244, 0.1917993426322937, 0.22449660301208496, 0.2571938633918762, 0.2898911237716675, 0.32258838415145874, 0.35528564453125, 0.38798290491104126, 0.4206801652908325, 0.4533774256706238, 0.48607468605041504, 0.5187719464302063, 0.5514692068099976, 0.5841664671897888, 0.6168637275695801, 0.6495609879493713, 0.6822582483291626, 0.7149555087089539, 0.7476527690887451, 0.7803500294685364, 0.8130472898483276, 0.8457445502281189, 0.8784418106079102, 0.9111390709877014, 0.9438363313674927, 0.9765335917472839, 1.0092308521270752]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 6.0, 12.0, 9.0, 15.0, 26.0, 52.0, 59.0, 89.0, 142.0, 250.0, 347.0, 605.0, 1035.0, 1900.0, 3432.0, 6766.0, 14643.0, 35030.0, 87131.0, 205139.0, 332897.0, 206827.0, 87135.0, 35184.0, 14982.0, 6865.0, 3402.0, 1921.0, 1020.0, 602.0, 333.0, 222.0, 172.0, 97.0, 74.0, 43.0, 25.0, 19.0, 12.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.247100830078125, -1.21197509765625, -1.176849365234375, -1.1417236328125, -1.106597900390625, -1.07147216796875, -1.036346435546875, -1.001220703125, -0.966094970703125, -0.93096923828125, -0.895843505859375, -0.8607177734375, -0.825592041015625, -0.79046630859375, -0.755340576171875, -0.72021484375, -0.685089111328125, -0.64996337890625, -0.614837646484375, -0.5797119140625, -0.544586181640625, -0.50946044921875, -0.474334716796875, -0.439208984375, -0.404083251953125, -0.36895751953125, -0.333831787109375, -0.2987060546875, -0.263580322265625, -0.22845458984375, -0.193328857421875, -0.158203125, -0.123077392578125, -0.08795166015625, -0.052825927734375, -0.0177001953125, 0.017425537109375, 0.05255126953125, 0.087677001953125, 0.122802734375, 0.157928466796875, 0.19305419921875, 0.228179931640625, 0.2633056640625, 0.298431396484375, 0.33355712890625, 0.368682861328125, 0.40380859375, 0.438934326171875, 0.47406005859375, 0.509185791015625, 0.5443115234375, 0.579437255859375, 0.61456298828125, 0.649688720703125, 0.684814453125, 0.719940185546875, 0.75506591796875, 0.790191650390625, 0.8253173828125, 0.860443115234375, 0.89556884765625, 0.930694580078125, 0.9658203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 11.0, 13.0, 23.0, 25.0, 24.0, 42.0, 41.0, 56.0, 51.0, 68.0, 64.0, 74.0, 62.0, 67.0, 65.0, 61.0, 43.0, 49.0, 37.0, 26.0, 23.0, 24.0, 14.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2135009765625, -0.2046222686767578, -0.19574356079101562, -0.18686485290527344, -0.17798614501953125, -0.16910743713378906, -0.16022872924804688, -0.1513500213623047, -0.1424713134765625, -0.1335926055908203, -0.12471389770507812, -0.11583518981933594, -0.10695648193359375, -0.09807777404785156, -0.08919906616210938, -0.08032035827636719, -0.071441650390625, -0.06256294250488281, -0.053684234619140625, -0.04480552673339844, -0.03592681884765625, -0.027048110961914062, -0.018169403076171875, -0.009290695190429688, -0.0004119873046875, 0.008466720581054688, 0.017345428466796875, 0.026224136352539062, 0.03510284423828125, 0.04398155212402344, 0.052860260009765625, 0.06173896789550781, 0.07061767578125, 0.07949638366699219, 0.08837509155273438, 0.09725379943847656, 0.10613250732421875, 0.11501121520996094, 0.12388992309570312, 0.1327686309814453, 0.1416473388671875, 0.1505260467529297, 0.15940475463867188, 0.16828346252441406, 0.17716217041015625, 0.18604087829589844, 0.19491958618164062, 0.2037982940673828, 0.212677001953125, 0.2215557098388672, 0.23043441772460938, 0.23931312561035156, 0.24819183349609375, 0.25707054138183594, 0.2659492492675781, 0.2748279571533203, 0.2837066650390625, 0.2925853729248047, 0.3014640808105469, 0.31034278869628906, 0.31922149658203125, 0.32810020446777344, 0.3369789123535156, 0.3458576202392578, 0.354736328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 8.0, 4.0, 3.0, 6.0, 18.0, 19.0, 21.0, 22.0, 52.0, 72.0, 110.0, 154.0, 293.0, 504.0, 960.0, 2283.0, 6698.0, 28499.0, 172752.0, 595698.0, 196550.0, 31812.0, 7367.0, 2372.0, 1050.0, 502.0, 248.0, 156.0, 105.0, 67.0, 38.0, 30.0, 22.0, 16.0, 13.0, 7.0, 13.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0], "bins": [-2.50390625, -2.43719482421875, -2.3704833984375, -2.30377197265625, -2.237060546875, -2.17034912109375, -2.1036376953125, -2.03692626953125, -1.97021484375, -1.90350341796875, -1.8367919921875, -1.77008056640625, -1.703369140625, -1.63665771484375, -1.5699462890625, -1.50323486328125, -1.4365234375, -1.36981201171875, -1.3031005859375, -1.23638916015625, -1.169677734375, -1.10296630859375, -1.0362548828125, -0.96954345703125, -0.90283203125, -0.83612060546875, -0.7694091796875, -0.70269775390625, -0.635986328125, -0.56927490234375, -0.5025634765625, -0.43585205078125, -0.369140625, -0.30242919921875, -0.2357177734375, -0.16900634765625, -0.102294921875, -0.03558349609375, 0.0311279296875, 0.09783935546875, 0.16455078125, 0.23126220703125, 0.2979736328125, 0.36468505859375, 0.431396484375, 0.49810791015625, 0.5648193359375, 0.63153076171875, 0.6982421875, 0.76495361328125, 0.8316650390625, 0.89837646484375, 0.965087890625, 1.03179931640625, 1.0985107421875, 1.16522216796875, 1.23193359375, 1.29864501953125, 1.3653564453125, 1.43206787109375, 1.498779296875, 1.56549072265625, 1.6322021484375, 1.69891357421875, 1.765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 12.0, 17.0, 17.0, 19.0, 13.0, 25.0, 17.0, 27.0, 32.0, 28.0, 35.0, 49.0, 37.0, 42.0, 48.0, 41.0, 38.0, 54.0, 45.0, 49.0, 36.0, 36.0, 21.0, 36.0, 29.0, 20.0, 26.0, 27.0, 16.0, 18.0, 21.0, 17.0, 16.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0078125, -0.9767532348632812, -0.9456939697265625, -0.9146347045898438, -0.883575439453125, -0.8525161743164062, -0.8214569091796875, -0.7903976440429688, -0.75933837890625, -0.7282791137695312, -0.6972198486328125, -0.6661605834960938, -0.635101318359375, -0.6040420532226562, -0.5729827880859375, -0.5419235229492188, -0.5108642578125, -0.47980499267578125, -0.4487457275390625, -0.41768646240234375, -0.386627197265625, -0.35556793212890625, -0.3245086669921875, -0.29344940185546875, -0.26239013671875, -0.23133087158203125, -0.2002716064453125, -0.16921234130859375, -0.138153076171875, -0.10709381103515625, -0.0760345458984375, -0.04497528076171875, -0.013916015625, 0.01714324951171875, 0.0482025146484375, 0.07926177978515625, 0.110321044921875, 0.14138031005859375, 0.1724395751953125, 0.20349884033203125, 0.23455810546875, 0.26561737060546875, 0.2966766357421875, 0.32773590087890625, 0.358795166015625, 0.38985443115234375, 0.4209136962890625, 0.45197296142578125, 0.4830322265625, 0.5140914916992188, 0.5451507568359375, 0.5762100219726562, 0.607269287109375, 0.6383285522460938, 0.6693878173828125, 0.7004470825195312, 0.73150634765625, 0.7625656127929688, 0.7936248779296875, 0.8246841430664062, 0.855743408203125, 0.8868026733398438, 0.9178619384765625, 0.9489212036132812, 0.97998046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 21.0, 28.0, 44.0, 87.0, 99.0, 187.0, 379.0, 678.0, 1459.0, 3540.0, 11998.0, 101536.0, 844076.0, 68782.0, 9725.0, 3104.0, 1332.0, 645.0, 357.0, 189.0, 90.0, 64.0, 49.0, 22.0, 14.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.1029205322265625, -2.049591064453125, -1.9962615966796875, -1.94293212890625, -1.8896026611328125, -1.836273193359375, -1.7829437255859375, -1.7296142578125, -1.6762847900390625, -1.622955322265625, -1.5696258544921875, -1.51629638671875, -1.4629669189453125, -1.409637451171875, -1.3563079833984375, -1.302978515625, -1.2496490478515625, -1.196319580078125, -1.1429901123046875, -1.08966064453125, -1.0363311767578125, -0.983001708984375, -0.9296722412109375, -0.8763427734375, -0.8230133056640625, -0.769683837890625, -0.7163543701171875, -0.66302490234375, -0.6096954345703125, -0.556365966796875, -0.5030364990234375, -0.44970703125, -0.3963775634765625, -0.343048095703125, -0.2897186279296875, -0.23638916015625, -0.1830596923828125, -0.129730224609375, -0.0764007568359375, -0.0230712890625, 0.0302581787109375, 0.083587646484375, 0.1369171142578125, 0.19024658203125, 0.2435760498046875, 0.296905517578125, 0.3502349853515625, 0.403564453125, 0.4568939208984375, 0.510223388671875, 0.5635528564453125, 0.61688232421875, 0.6702117919921875, 0.723541259765625, 0.7768707275390625, 0.8302001953125, 0.8835296630859375, 0.936859130859375, 0.9901885986328125, 1.04351806640625, 1.0968475341796875, 1.150177001953125, 1.2035064697265625, 1.2568359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 20.0, 33.0, 75.0, 137.0, 197.0, 194.0, 169.0, 77.0, 51.0, 22.0, 11.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036454200744628906, -0.00035058334469795227, -0.0003366246819496155, -0.0003226660192012787, -0.0003087073564529419, -0.0002947486937046051, -0.0002807900309562683, -0.0002668313682079315, -0.0002528727054595947, -0.00023891404271125793, -0.00022495537996292114, -0.00021099671721458435, -0.00019703805446624756, -0.00018307939171791077, -0.00016912072896957397, -0.00015516206622123718, -0.0001412034034729004, -0.0001272447407245636, -0.0001132860779762268, -9.932741522789001e-05, -8.536875247955322e-05, -7.141008973121643e-05, -5.745142698287964e-05, -4.349276423454285e-05, -2.9534101486206055e-05, -1.5575438737869263e-05, -1.6167759895324707e-06, 1.2341886758804321e-05, 2.6300549507141113e-05, 4.0259212255477905e-05, 5.42178750038147e-05, 6.817653775215149e-05, 8.213520050048828e-05, 9.609386324882507e-05, 0.00011005252599716187, 0.00012401118874549866, 0.00013796985149383545, 0.00015192851424217224, 0.00016588717699050903, 0.00017984583973884583, 0.00019380450248718262, 0.0002077631652355194, 0.0002217218279838562, 0.000235680490732193, 0.0002496391534805298, 0.0002635978162288666, 0.00027755647897720337, 0.00029151514172554016, 0.00030547380447387695, 0.00031943246722221375, 0.00033339112997055054, 0.00034734979271888733, 0.0003613084554672241, 0.0003752671182155609, 0.0003892257809638977, 0.0004031844437122345, 0.0004171431064605713, 0.0004311017692089081, 0.0004450604319572449, 0.00045901909470558167, 0.00047297775745391846, 0.00048693642020225525, 0.000500895082950592, 0.0005148537456989288, 0.0005288124084472656]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 10.0, 9.0, 22.0, 19.0, 29.0, 40.0, 70.0, 102.0, 182.0, 390.0, 830.0, 1950.0, 6137.0, 32429.0, 859219.0, 129778.0, 11809.0, 3165.0, 1223.0, 531.0, 240.0, 123.0, 81.0, 56.0, 35.0, 21.0, 7.0, 10.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.120086669921875, -2.04876708984375, -1.977447509765625, -1.9061279296875, -1.834808349609375, -1.76348876953125, -1.692169189453125, -1.620849609375, -1.549530029296875, -1.47821044921875, -1.406890869140625, -1.3355712890625, -1.264251708984375, -1.19293212890625, -1.121612548828125, -1.05029296875, -0.978973388671875, -0.90765380859375, -0.836334228515625, -0.7650146484375, -0.693695068359375, -0.62237548828125, -0.551055908203125, -0.479736328125, -0.408416748046875, -0.33709716796875, -0.265777587890625, -0.1944580078125, -0.123138427734375, -0.05181884765625, 0.019500732421875, 0.0908203125, 0.162139892578125, 0.23345947265625, 0.304779052734375, 0.3760986328125, 0.447418212890625, 0.51873779296875, 0.590057373046875, 0.661376953125, 0.732696533203125, 0.80401611328125, 0.875335693359375, 0.9466552734375, 1.017974853515625, 1.08929443359375, 1.160614013671875, 1.23193359375, 1.303253173828125, 1.37457275390625, 1.445892333984375, 1.5172119140625, 1.588531494140625, 1.65985107421875, 1.731170654296875, 1.802490234375, 1.873809814453125, 1.94512939453125, 2.016448974609375, 2.0877685546875, 2.159088134765625, 2.23040771484375, 2.301727294921875, 2.373046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 5.0, 20.0, 21.0, 36.0, 72.0, 119.0, 184.0, 194.0, 113.0, 70.0, 47.0, 36.0, 14.0, 12.0, 6.0, 6.0, 2.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.169921875, -1.1374969482421875, -1.105072021484375, -1.0726470947265625, -1.04022216796875, -1.0077972412109375, -0.975372314453125, -0.9429473876953125, -0.9105224609375, -0.8780975341796875, -0.845672607421875, -0.8132476806640625, -0.78082275390625, -0.7483978271484375, -0.715972900390625, -0.6835479736328125, -0.651123046875, -0.6186981201171875, -0.586273193359375, -0.5538482666015625, -0.52142333984375, -0.4889984130859375, -0.456573486328125, -0.4241485595703125, -0.3917236328125, -0.3592987060546875, -0.326873779296875, -0.2944488525390625, -0.26202392578125, -0.2295989990234375, -0.197174072265625, -0.1647491455078125, -0.13232421875, -0.0998992919921875, -0.067474365234375, -0.0350494384765625, -0.00262451171875, 0.0298004150390625, 0.062225341796875, 0.0946502685546875, 0.1270751953125, 0.1595001220703125, 0.191925048828125, 0.2243499755859375, 0.25677490234375, 0.2891998291015625, 0.321624755859375, 0.3540496826171875, 0.386474609375, 0.4188995361328125, 0.451324462890625, 0.4837493896484375, 0.51617431640625, 0.5485992431640625, 0.581024169921875, 0.6134490966796875, 0.6458740234375, 0.6782989501953125, 0.710723876953125, 0.7431488037109375, 0.77557373046875, 0.8079986572265625, 0.840423583984375, 0.8728485107421875, 0.9052734375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 8.0, 7.0, 21.0, 33.0, 79.0, 153.0, 195.0, 185.0, 163.0, 93.0, 36.0, 21.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.156837463378906, -21.589847564697266, -21.022857666015625, -20.45586585998535, -19.88887596130371, -19.32188606262207, -18.75489616394043, -18.18790626525879, -17.620914459228516, -17.053924560546875, -16.486934661865234, -15.919943809509277, -15.35295295715332, -14.78596305847168, -14.218973159790039, -13.651983261108398, -13.084993362426758, -12.518003463745117, -11.95101261138916, -11.38402271270752, -10.817031860351562, -10.250041961669922, -9.683052062988281, -9.11606216430664, -8.549071311950684, -7.982080936431885, -7.415090560913086, -6.848100662231445, -6.2811102867126465, -5.714119911193848, -5.147130012512207, -4.580139636993408, -4.013149261474609, -3.4461588859558105, -2.879168748855591, -2.312178611755371, -1.7451882362365723, -1.1781978607177734, -0.6112077236175537, -0.044217586517333984, 0.5227727890014648, 1.0897630453109741, 1.6567533016204834, 2.223743438720703, 2.790733814239502, 3.357724189758301, 3.9247143268585205, 4.49170446395874, 5.058694839477539, 5.625685214996338, 6.192675590515137, 6.759665489196777, 7.326655864715576, 7.893646240234375, 8.460636138916016, 9.027626037597656, 9.594616889953613, 10.161606788635254, 10.728597640991211, 11.295587539672852, 11.862577438354492, 12.42956829071045, 12.99655818939209, 13.563549041748047, 14.130538940429688]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 6.0, 6.0, 8.0, 11.0, 5.0, 16.0, 23.0, 19.0, 25.0, 20.0, 20.0, 24.0, 33.0, 28.0, 38.0, 47.0, 46.0, 45.0, 40.0, 37.0, 43.0, 58.0, 29.0, 46.0, 44.0, 28.0, 23.0, 34.0, 31.0, 29.0, 26.0, 21.0, 13.0, 14.0, 10.0, 7.0, 9.0, 8.0, 7.0, 3.0, 6.0, 1.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.213404178619385, -6.026819705963135, -5.840235710144043, -5.653651237487793, -5.467067241668701, -5.280482769012451, -5.093898773193359, -4.907314300537109, -4.720730304718018, -4.534145832061768, -4.347561836242676, -4.160977363586426, -3.974393367767334, -3.787809133529663, -3.601224899291992, -3.414640426635742, -3.2280561923980713, -3.0414719581604004, -2.8548877239227295, -2.6683034896850586, -2.4817192554473877, -2.295135021209717, -2.108550548553467, -1.9219664335250854, -1.7353821992874146, -1.5487979650497437, -1.3622137308120728, -1.1756293773651123, -0.9890452027320862, -0.8024609684944153, -0.6158766746520996, -0.4292924404144287, -0.2427082061767578, -0.05612395703792572, 0.13046029210090637, 0.31704455614089966, 0.5036287903785706, 0.6902130246162415, 0.8767973184585571, 1.063381552696228, 1.249965786933899, 1.4365500211715698, 1.6231342554092407, 1.8097186088562012, 1.996302843093872, 2.182887077331543, 2.369471311569214, 2.5560555458068848, 2.7426397800445557, 2.9292240142822266, 3.1158082485198975, 3.3023924827575684, 3.4889767169952393, 3.67556095123291, 3.86214542388916, 4.048729419708252, 4.235313892364502, 4.421898365020752, 4.608482360839844, 4.795066833496094, 4.9816508293151855, 5.1682353019714355, 5.354819297790527, 5.541403770446777, 5.727987766265869]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 11.0, 16.0, 16.0, 24.0, 30.0, 65.0, 82.0, 173.0, 317.0, 552.0, 1183.0, 2918.0, 8358.0, 28617.0, 148900.0, 3689412.0, 255290.0, 39810.0, 11337.0, 3949.0, 1599.0, 722.0, 391.0, 192.0, 103.0, 81.0, 42.0, 30.0, 17.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.7532958984375, -1.694091796875, -1.6348876953125, -1.57568359375, -1.5164794921875, -1.457275390625, -1.3980712890625, -1.3388671875, -1.2796630859375, -1.220458984375, -1.1612548828125, -1.10205078125, -1.0428466796875, -0.983642578125, -0.9244384765625, -0.865234375, -0.8060302734375, -0.746826171875, -0.6876220703125, -0.62841796875, -0.5692138671875, -0.510009765625, -0.4508056640625, -0.3916015625, -0.3323974609375, -0.273193359375, -0.2139892578125, -0.15478515625, -0.0955810546875, -0.036376953125, 0.0228271484375, 0.08203125, 0.1412353515625, 0.200439453125, 0.2596435546875, 0.31884765625, 0.3780517578125, 0.437255859375, 0.4964599609375, 0.5556640625, 0.6148681640625, 0.674072265625, 0.7332763671875, 0.79248046875, 0.8516845703125, 0.910888671875, 0.9700927734375, 1.029296875, 1.0885009765625, 1.147705078125, 1.2069091796875, 1.26611328125, 1.3253173828125, 1.384521484375, 1.4437255859375, 1.5029296875, 1.5621337890625, 1.621337890625, 1.6805419921875, 1.73974609375, 1.7989501953125, 1.858154296875, 1.9173583984375, 1.9765625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 16.0, 18.0, 20.0, 26.0, 27.0, 37.0, 32.0, 53.0, 54.0, 67.0, 49.0, 58.0, 65.0, 46.0, 60.0, 60.0, 44.0, 38.0, 43.0, 28.0, 34.0, 30.0, 9.0, 18.0, 13.0, 7.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1671924591064453, -0.15896987915039062, -0.15074729919433594, -0.14252471923828125, -0.13430213928222656, -0.12607955932617188, -0.11785697937011719, -0.1096343994140625, -0.10141181945800781, -0.09318923950195312, -0.08496665954589844, -0.07674407958984375, -0.06852149963378906, -0.060298919677734375, -0.05207633972167969, -0.043853759765625, -0.03563117980957031, -0.027408599853515625, -0.019186019897460938, -0.01096343994140625, -0.0027408599853515625, 0.005481719970703125, 0.013704299926757812, 0.0219268798828125, 0.030149459838867188, 0.038372039794921875, 0.04659461975097656, 0.05481719970703125, 0.06303977966308594, 0.07126235961914062, 0.07948493957519531, 0.08770751953125, 0.09593009948730469, 0.10415267944335938, 0.11237525939941406, 0.12059783935546875, 0.12882041931152344, 0.13704299926757812, 0.1452655792236328, 0.1534881591796875, 0.1617107391357422, 0.16993331909179688, 0.17815589904785156, 0.18637847900390625, 0.19460105895996094, 0.20282363891601562, 0.2110462188720703, 0.219268798828125, 0.2274913787841797, 0.23571395874023438, 0.24393653869628906, 0.25215911865234375, 0.26038169860839844, 0.2686042785644531, 0.2768268585205078, 0.2850494384765625, 0.2932720184326172, 0.3014945983886719, 0.30971717834472656, 0.31793975830078125, 0.32616233825683594, 0.3343849182128906, 0.3426074981689453, 0.350830078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 17.0, 24.0, 38.0, 46.0, 72.0, 143.0, 257.0, 446.0, 812.0, 1694.0, 3376.0, 7861.0, 19455.0, 59954.0, 291534.0, 3360996.0, 344608.0, 65370.0, 21119.0, 8562.0, 3861.0, 1866.0, 903.0, 515.0, 279.0, 173.0, 92.0, 60.0, 45.0, 28.0, 15.0, 11.0, 11.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3291015625, -1.2841033935546875, -1.239105224609375, -1.1941070556640625, -1.14910888671875, -1.1041107177734375, -1.059112548828125, -1.0141143798828125, -0.9691162109375, -0.9241180419921875, -0.879119873046875, -0.8341217041015625, -0.78912353515625, -0.7441253662109375, -0.699127197265625, -0.6541290283203125, -0.609130859375, -0.5641326904296875, -0.519134521484375, -0.4741363525390625, -0.42913818359375, -0.3841400146484375, -0.339141845703125, -0.2941436767578125, -0.2491455078125, -0.2041473388671875, -0.159149169921875, -0.1141510009765625, -0.06915283203125, -0.0241546630859375, 0.020843505859375, 0.0658416748046875, 0.11083984375, 0.1558380126953125, 0.200836181640625, 0.2458343505859375, 0.29083251953125, 0.3358306884765625, 0.380828857421875, 0.4258270263671875, 0.4708251953125, 0.5158233642578125, 0.560821533203125, 0.6058197021484375, 0.65081787109375, 0.6958160400390625, 0.740814208984375, 0.7858123779296875, 0.830810546875, 0.8758087158203125, 0.920806884765625, 0.9658050537109375, 1.01080322265625, 1.0558013916015625, 1.100799560546875, 1.1457977294921875, 1.1907958984375, 1.2357940673828125, 1.280792236328125, 1.3257904052734375, 1.37078857421875, 1.4157867431640625, 1.460784912109375, 1.5057830810546875, 1.55078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 6.0, 8.0, 6.0, 14.0, 23.0, 25.0, 41.0, 51.0, 58.0, 112.0, 157.0, 308.0, 823.0, 1359.0, 450.0, 215.0, 131.0, 73.0, 63.0, 38.0, 33.0, 18.0, 12.0, 10.0, 5.0, 8.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49609375, -0.47785186767578125, -0.4596099853515625, -0.44136810302734375, -0.423126220703125, -0.40488433837890625, -0.3866424560546875, -0.36840057373046875, -0.35015869140625, -0.33191680908203125, -0.3136749267578125, -0.29543304443359375, -0.277191162109375, -0.25894927978515625, -0.2407073974609375, -0.22246551513671875, -0.2042236328125, -0.18598175048828125, -0.1677398681640625, -0.14949798583984375, -0.131256103515625, -0.11301422119140625, -0.0947723388671875, -0.07653045654296875, -0.05828857421875, -0.04004669189453125, -0.0218048095703125, -0.00356292724609375, 0.014678955078125, 0.03292083740234375, 0.0511627197265625, 0.06940460205078125, 0.087646484375, 0.10588836669921875, 0.1241302490234375, 0.14237213134765625, 0.160614013671875, 0.17885589599609375, 0.1970977783203125, 0.21533966064453125, 0.23358154296875, 0.25182342529296875, 0.2700653076171875, 0.28830718994140625, 0.306549072265625, 0.32479095458984375, 0.3430328369140625, 0.36127471923828125, 0.3795166015625, 0.39775848388671875, 0.4160003662109375, 0.43424224853515625, 0.452484130859375, 0.47072601318359375, 0.4889678955078125, 0.5072097778320312, 0.52545166015625, 0.5436935424804688, 0.5619354248046875, 0.5801773071289062, 0.598419189453125, 0.6166610717773438, 0.6349029541015625, 0.6531448364257812, 0.67138671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 13.0, 23.0, 72.0, 101.0, 149.0, 169.0, 179.0, 123.0, 77.0, 37.0, 24.0, 16.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.350882530212402, -4.16703987121582, -3.983196973800659, -3.799354076385498, -3.615511417388916, -3.431668519973755, -3.2478256225585938, -3.0639829635620117, -2.8801400661468506, -2.6962971687316895, -2.5124545097351074, -2.3286116123199463, -2.144768714904785, -1.9609260559082031, -1.777083158493042, -1.5932403802871704, -1.4093976020812988, -1.2255548238754272, -1.0417120456695557, -0.8578691482543945, -0.674026370048523, -0.49018359184265137, -0.30634069442749023, -0.12249791622161865, 0.06134486198425293, 0.2451876699924469, 0.42903047800064087, 0.6128733158111572, 0.7967160940170288, 0.9805588722229004, 1.1644017696380615, 1.348244547843933, 1.5320868492126465, 1.715929627418518, 1.8997724056243896, 2.083615303039551, 2.267457962036133, 2.451300859451294, 2.635143756866455, 2.818986415863037, 3.0028293132781982, 3.1866722106933594, 3.3705148696899414, 3.5543577671051025, 3.7382006645202637, 3.9220433235168457, 4.105886459350586, 4.289729118347168, 4.47357177734375, 4.657414436340332, 4.841257572174072, 5.025100231170654, 5.208942890167236, 5.392786026000977, 5.576628684997559, 5.760471343994141, 5.944314002990723, 6.128156661987305, 6.311999797821045, 6.495842456817627, 6.679685115814209, 6.863528251647949, 7.047370910644531, 7.231213569641113, 7.4150567054748535]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 11.0, 14.0, 9.0, 10.0, 18.0, 20.0, 20.0, 36.0, 27.0, 35.0, 38.0, 38.0, 42.0, 48.0, 48.0, 54.0, 45.0, 48.0, 48.0, 46.0, 42.0, 43.0, 32.0, 37.0, 33.0, 30.0, 21.0, 14.0, 13.0, 25.0, 11.0, 10.0, 5.0, 8.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.268730640411377, -2.1993966102600098, -2.1300623416900635, -2.0607283115386963, -1.991394281387329, -1.9220601320266724, -1.8527259826660156, -1.7833919525146484, -1.7140578031539917, -1.644723653793335, -1.5753896236419678, -1.506055474281311, -1.4367213249206543, -1.367387294769287, -1.2980531454086304, -1.2287189960479736, -1.1593849658966064, -1.0900508165359497, -1.0207167863845825, -0.9513826370239258, -0.8820485472679138, -0.8127144575119019, -0.7433803081512451, -0.6740462183952332, -0.6047121286392212, -0.5353780388832092, -0.4660439193248749, -0.3967097997665405, -0.32737571001052856, -0.2580416202545166, -0.18870750069618225, -0.1193733811378479, -0.050039052963256836, 0.01929505169391632, 0.08862915635108948, 0.15796326100826263, 0.2272973656654358, 0.29663145542144775, 0.3659655749797821, 0.43529969453811646, 0.5046337842941284, 0.5739678740501404, 0.6433019638061523, 0.7126361131668091, 0.781970202922821, 0.851304292678833, 0.9206384420394897, 0.9899725317955017, 1.0593066215515137, 1.1286407709121704, 1.1979748010635376, 1.2673089504241943, 1.3366429805755615, 1.4059771299362183, 1.475311279296875, 1.5446453094482422, 1.613979458808899, 1.6833136081695557, 1.7526476383209229, 1.8219817876815796, 1.8913159370422363, 1.9606499671936035, 2.0299839973449707, 2.099318265914917, 2.168652296066284]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 9.0, 12.0, 13.0, 31.0, 52.0, 73.0, 119.0, 164.0, 316.0, 607.0, 1123.0, 2519.0, 5828.0, 14770.0, 40531.0, 119354.0, 397315.0, 314661.0, 96530.0, 32827.0, 12392.0, 4798.0, 2205.0, 1035.0, 558.0, 272.0, 161.0, 98.0, 60.0, 47.0, 22.0, 25.0, 3.0, 10.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.9150390625, -1.8631439208984375, -1.811248779296875, -1.7593536376953125, -1.70745849609375, -1.6555633544921875, -1.603668212890625, -1.5517730712890625, -1.4998779296875, -1.4479827880859375, -1.396087646484375, -1.3441925048828125, -1.29229736328125, -1.2404022216796875, -1.188507080078125, -1.1366119384765625, -1.084716796875, -1.0328216552734375, -0.980926513671875, -0.9290313720703125, -0.87713623046875, -0.8252410888671875, -0.773345947265625, -0.7214508056640625, -0.6695556640625, -0.6176605224609375, -0.565765380859375, -0.5138702392578125, -0.46197509765625, -0.4100799560546875, -0.358184814453125, -0.3062896728515625, -0.25439453125, -0.2024993896484375, -0.150604248046875, -0.0987091064453125, -0.04681396484375, 0.0050811767578125, 0.056976318359375, 0.1088714599609375, 0.1607666015625, 0.2126617431640625, 0.264556884765625, 0.3164520263671875, 0.36834716796875, 0.4202423095703125, 0.472137451171875, 0.5240325927734375, 0.575927734375, 0.6278228759765625, 0.679718017578125, 0.7316131591796875, 0.78350830078125, 0.8354034423828125, 0.887298583984375, 0.9391937255859375, 0.9910888671875, 1.0429840087890625, 1.094879150390625, 1.1467742919921875, 1.19866943359375, 1.2505645751953125, 1.302459716796875, 1.3543548583984375, 1.40625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 11.0, 13.0, 25.0, 23.0, 33.0, 30.0, 38.0, 41.0, 54.0, 53.0, 64.0, 58.0, 69.0, 50.0, 62.0, 56.0, 69.0, 47.0, 33.0, 40.0, 27.0, 24.0, 21.0, 18.0, 4.0, 7.0, 8.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.2012348175048828, -0.19238662719726562, -0.18353843688964844, -0.17469024658203125, -0.16584205627441406, -0.15699386596679688, -0.1481456756591797, -0.1392974853515625, -0.1304492950439453, -0.12160110473632812, -0.11275291442871094, -0.10390472412109375, -0.09505653381347656, -0.08620834350585938, -0.07736015319824219, -0.068511962890625, -0.05966377258300781, -0.050815582275390625, -0.04196739196777344, -0.03311920166015625, -0.024271011352539062, -0.015422821044921875, -0.0065746307373046875, 0.0022735595703125, 0.011121749877929688, 0.019969940185546875, 0.028818130493164062, 0.03766632080078125, 0.04651451110839844, 0.055362701416015625, 0.06421089172363281, 0.07305908203125, 0.08190727233886719, 0.09075546264648438, 0.09960365295410156, 0.10845184326171875, 0.11730003356933594, 0.12614822387695312, 0.1349964141845703, 0.1438446044921875, 0.1526927947998047, 0.16154098510742188, 0.17038917541503906, 0.17923736572265625, 0.18808555603027344, 0.19693374633789062, 0.2057819366455078, 0.214630126953125, 0.2234783172607422, 0.23232650756835938, 0.24117469787597656, 0.25002288818359375, 0.25887107849121094, 0.2677192687988281, 0.2765674591064453, 0.2854156494140625, 0.2942638397216797, 0.3031120300292969, 0.31196022033691406, 0.32080841064453125, 0.32965660095214844, 0.3385047912597656, 0.3473529815673828, 0.356201171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 2.0, 7.0, 6.0, 7.0, 13.0, 13.0, 20.0, 17.0, 29.0, 39.0, 69.0, 108.0, 180.0, 326.0, 620.0, 1166.0, 2785.0, 7263.0, 23464.0, 87100.0, 377979.0, 415063.0, 93883.0, 25040.0, 7669.0, 2928.0, 1246.0, 594.0, 320.0, 199.0, 129.0, 84.0, 48.0, 38.0, 29.0, 18.0, 9.0, 11.0, 11.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.091796875, -2.035308837890625, -1.97882080078125, -1.922332763671875, -1.8658447265625, -1.809356689453125, -1.75286865234375, -1.696380615234375, -1.639892578125, -1.583404541015625, -1.52691650390625, -1.470428466796875, -1.4139404296875, -1.357452392578125, -1.30096435546875, -1.244476318359375, -1.18798828125, -1.131500244140625, -1.07501220703125, -1.018524169921875, -0.9620361328125, -0.905548095703125, -0.84906005859375, -0.792572021484375, -0.736083984375, -0.679595947265625, -0.62310791015625, -0.566619873046875, -0.5101318359375, -0.453643798828125, -0.39715576171875, -0.340667724609375, -0.2841796875, -0.227691650390625, -0.17120361328125, -0.114715576171875, -0.0582275390625, -0.001739501953125, 0.05474853515625, 0.111236572265625, 0.167724609375, 0.224212646484375, 0.28070068359375, 0.337188720703125, 0.3936767578125, 0.450164794921875, 0.50665283203125, 0.563140869140625, 0.61962890625, 0.676116943359375, 0.73260498046875, 0.789093017578125, 0.8455810546875, 0.902069091796875, 0.95855712890625, 1.015045166015625, 1.071533203125, 1.128021240234375, 1.18450927734375, 1.240997314453125, 1.2974853515625, 1.353973388671875, 1.41046142578125, 1.466949462890625, 1.5234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 4.0, 10.0, 15.0, 7.0, 17.0, 15.0, 13.0, 21.0, 15.0, 26.0, 36.0, 37.0, 38.0, 39.0, 43.0, 40.0, 53.0, 52.0, 59.0, 53.0, 37.0, 46.0, 49.0, 29.0, 40.0, 27.0, 24.0, 26.0, 22.0, 20.0, 9.0, 10.0, 15.0, 18.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2041015625, -1.169189453125, -1.13427734375, -1.099365234375, -1.064453125, -1.029541015625, -0.99462890625, -0.959716796875, -0.9248046875, -0.889892578125, -0.85498046875, -0.820068359375, -0.78515625, -0.750244140625, -0.71533203125, -0.680419921875, -0.6455078125, -0.610595703125, -0.57568359375, -0.540771484375, -0.505859375, -0.470947265625, -0.43603515625, -0.401123046875, -0.3662109375, -0.331298828125, -0.29638671875, -0.261474609375, -0.2265625, -0.191650390625, -0.15673828125, -0.121826171875, -0.0869140625, -0.052001953125, -0.01708984375, 0.017822265625, 0.052734375, 0.087646484375, 0.12255859375, 0.157470703125, 0.1923828125, 0.227294921875, 0.26220703125, 0.297119140625, 0.33203125, 0.366943359375, 0.40185546875, 0.436767578125, 0.4716796875, 0.506591796875, 0.54150390625, 0.576416015625, 0.611328125, 0.646240234375, 0.68115234375, 0.716064453125, 0.7509765625, 0.785888671875, 0.82080078125, 0.855712890625, 0.890625, 0.925537109375, 0.96044921875, 0.995361328125, 1.0302734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 17.0, 32.0, 32.0, 41.0, 62.0, 87.0, 128.0, 197.0, 339.0, 521.0, 856.0, 1554.0, 3093.0, 7148.0, 26549.0, 669165.0, 308986.0, 17927.0, 5747.0, 2522.0, 1348.0, 789.0, 464.0, 306.0, 196.0, 134.0, 88.0, 76.0, 24.0, 33.0, 15.0, 10.0, 10.0, 6.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.826171875, -1.762939453125, -1.69970703125, -1.636474609375, -1.5732421875, -1.510009765625, -1.44677734375, -1.383544921875, -1.3203125, -1.257080078125, -1.19384765625, -1.130615234375, -1.0673828125, -1.004150390625, -0.94091796875, -0.877685546875, -0.814453125, -0.751220703125, -0.68798828125, -0.624755859375, -0.5615234375, -0.498291015625, -0.43505859375, -0.371826171875, -0.30859375, -0.245361328125, -0.18212890625, -0.118896484375, -0.0556640625, 0.007568359375, 0.07080078125, 0.134033203125, 0.197265625, 0.260498046875, 0.32373046875, 0.386962890625, 0.4501953125, 0.513427734375, 0.57666015625, 0.639892578125, 0.703125, 0.766357421875, 0.82958984375, 0.892822265625, 0.9560546875, 1.019287109375, 1.08251953125, 1.145751953125, 1.208984375, 1.272216796875, 1.33544921875, 1.398681640625, 1.4619140625, 1.525146484375, 1.58837890625, 1.651611328125, 1.71484375, 1.778076171875, 1.84130859375, 1.904541015625, 1.9677734375, 2.031005859375, 2.09423828125, 2.157470703125, 2.220703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 7.0, 9.0, 18.0, 27.0, 65.0, 129.0, 168.0, 187.0, 159.0, 87.0, 70.0, 37.0, 20.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004177093505859375, -0.0004030168056488037, -0.0003883242607116699, -0.00037363171577453613, -0.00035893917083740234, -0.00034424662590026855, -0.00032955408096313477, -0.000314861536026001, -0.0003001689910888672, -0.0002854764461517334, -0.0002707839012145996, -0.0002560913562774658, -0.00024139881134033203, -0.00022670626640319824, -0.00021201372146606445, -0.00019732117652893066, -0.00018262863159179688, -0.00016793608665466309, -0.0001532435417175293, -0.0001385509967803955, -0.00012385845184326172, -0.00010916590690612793, -9.447336196899414e-05, -7.978081703186035e-05, -6.508827209472656e-05, -5.0395727157592773e-05, -3.5703182220458984e-05, -2.1010637283325195e-05, -6.318092346191406e-06, 8.374452590942383e-06, 2.3066997528076172e-05, 3.775954246520996e-05, 5.245208740234375e-05, 6.714463233947754e-05, 8.183717727661133e-05, 9.652972221374512e-05, 0.0001112222671508789, 0.0001259148120880127, 0.00014060735702514648, 0.00015529990196228027, 0.00016999244689941406, 0.00018468499183654785, 0.00019937753677368164, 0.00021407008171081543, 0.00022876262664794922, 0.000243455171585083, 0.0002581477165222168, 0.0002728402614593506, 0.0002875328063964844, 0.00030222535133361816, 0.00031691789627075195, 0.00033161044120788574, 0.00034630298614501953, 0.0003609955310821533, 0.0003756880760192871, 0.0003903806209564209, 0.0004050731658935547, 0.0004197657108306885, 0.00043445825576782227, 0.00044915080070495605, 0.00046384334564208984, 0.00047853589057922363, 0.0004932284355163574, 0.0005079209804534912, 0.000522613525390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 10.0, 7.0, 11.0, 19.0, 27.0, 33.0, 46.0, 83.0, 143.0, 217.0, 446.0, 795.0, 1483.0, 3090.0, 8185.0, 51927.0, 925648.0, 42415.0, 7763.0, 2941.0, 1459.0, 745.0, 427.0, 229.0, 133.0, 75.0, 58.0, 30.0, 24.0, 15.0, 8.0, 16.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.21893310546875, -2.1409912109375, -2.06304931640625, -1.985107421875, -1.90716552734375, -1.8292236328125, -1.75128173828125, -1.67333984375, -1.59539794921875, -1.5174560546875, -1.43951416015625, -1.361572265625, -1.28363037109375, -1.2056884765625, -1.12774658203125, -1.0498046875, -0.97186279296875, -0.8939208984375, -0.81597900390625, -0.738037109375, -0.66009521484375, -0.5821533203125, -0.50421142578125, -0.42626953125, -0.34832763671875, -0.2703857421875, -0.19244384765625, -0.114501953125, -0.03656005859375, 0.0413818359375, 0.11932373046875, 0.197265625, 0.27520751953125, 0.3531494140625, 0.43109130859375, 0.509033203125, 0.58697509765625, 0.6649169921875, 0.74285888671875, 0.82080078125, 0.89874267578125, 0.9766845703125, 1.05462646484375, 1.132568359375, 1.21051025390625, 1.2884521484375, 1.36639404296875, 1.4443359375, 1.52227783203125, 1.6002197265625, 1.67816162109375, 1.756103515625, 1.83404541015625, 1.9119873046875, 1.98992919921875, 2.06787109375, 2.14581298828125, 2.2237548828125, 2.30169677734375, 2.379638671875, 2.45758056640625, 2.5355224609375, 2.61346435546875, 2.69140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 14.0, 36.0, 77.0, 167.0, 263.0, 214.0, 106.0, 41.0, 12.0, 11.0, 9.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.346588134765625, -1.29962158203125, -1.252655029296875, -1.2056884765625, -1.158721923828125, -1.11175537109375, -1.064788818359375, -1.017822265625, -0.970855712890625, -0.92388916015625, -0.876922607421875, -0.8299560546875, -0.782989501953125, -0.73602294921875, -0.689056396484375, -0.64208984375, -0.595123291015625, -0.54815673828125, -0.501190185546875, -0.4542236328125, -0.407257080078125, -0.36029052734375, -0.313323974609375, -0.266357421875, -0.219390869140625, -0.17242431640625, -0.125457763671875, -0.0784912109375, -0.031524658203125, 0.01544189453125, 0.062408447265625, 0.109375, 0.156341552734375, 0.20330810546875, 0.250274658203125, 0.2972412109375, 0.344207763671875, 0.39117431640625, 0.438140869140625, 0.485107421875, 0.532073974609375, 0.57904052734375, 0.626007080078125, 0.6729736328125, 0.719940185546875, 0.76690673828125, 0.813873291015625, 0.86083984375, 0.907806396484375, 0.95477294921875, 1.001739501953125, 1.0487060546875, 1.095672607421875, 1.14263916015625, 1.189605712890625, 1.236572265625, 1.283538818359375, 1.33050537109375, 1.377471923828125, 1.4244384765625, 1.471405029296875, 1.51837158203125, 1.565338134765625, 1.6123046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 8.0, 13.0, 11.0, 19.0, 30.0, 35.0, 38.0, 43.0, 74.0, 76.0, 77.0, 90.0, 72.0, 70.0, 66.0, 53.0, 52.0, 39.0, 32.0, 25.0, 16.0, 15.0, 11.0, 10.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.127408981323242, -8.8901948928833, -8.65298080444336, -8.415766716003418, -8.178552627563477, -7.941338539123535, -7.7041239738464355, -7.466909885406494, -7.229695796966553, -6.992481708526611, -6.75526762008667, -6.5180535316467285, -6.280838966369629, -6.0436248779296875, -5.806410789489746, -5.569196701049805, -5.331982612609863, -5.094768524169922, -4.8575544357299805, -4.620340347290039, -4.383126258850098, -4.145912170410156, -3.9086976051330566, -3.6714835166931152, -3.434269428253174, -3.1970553398132324, -2.959841251373291, -2.7226269245147705, -2.485412836074829, -2.2481987476348877, -2.010984420776367, -1.7737703323364258, -1.5365557670593262, -1.2993416786193848, -1.0621274709701538, -0.8249133229255676, -0.5876991748809814, -0.35048508644104004, -0.11327087879180908, 0.12394332885742188, 0.3611574172973633, 0.5983715653419495, 0.8355857133865356, 1.0727999210357666, 1.310014009475708, 1.5472280979156494, 1.7844423055648804, 2.0216565132141113, 2.2588706016540527, 2.496084690093994, 2.7332987785339355, 2.970513105392456, 3.2077271938323975, 3.444941282272339, 3.6821556091308594, 3.919369697570801, 4.156583786010742, 4.393797874450684, 4.631011962890625, 4.868226051330566, 5.105440139770508, 5.342654228210449, 5.579868793487549, 5.81708288192749, 6.054296970367432]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 7.0, 2.0, 2.0, 5.0, 7.0, 14.0, 17.0, 13.0, 13.0, 22.0, 27.0, 27.0, 30.0, 28.0, 29.0, 38.0, 37.0, 33.0, 41.0, 41.0, 45.0, 38.0, 43.0, 46.0, 42.0, 44.0, 48.0, 34.0, 37.0, 33.0, 22.0, 21.0, 17.0, 20.0, 15.0, 13.0, 13.0, 9.0, 7.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.447185516357422, -5.248849868774414, -5.0505146980285645, -4.852179527282715, -4.653843879699707, -4.455508232116699, -4.25717306137085, -4.058837890625, -3.860502243041992, -3.6621668338775635, -3.4638314247131348, -3.265496015548706, -3.0671606063842773, -2.8688251972198486, -2.67048978805542, -2.472154378890991, -2.2738189697265625, -2.075483560562134, -1.877148151397705, -1.6788127422332764, -1.4804773330688477, -1.282141923904419, -1.0838065147399902, -0.8854711055755615, -0.6871356964111328, -0.4888002872467041, -0.2904648780822754, -0.09212946891784668, 0.10620594024658203, 0.30454134941101074, 0.5028767585754395, 0.7012121677398682, 0.8995475769042969, 1.0978829860687256, 1.2962183952331543, 1.494553804397583, 1.6928892135620117, 1.8912246227264404, 2.089560031890869, 2.287895441055298, 2.4862308502197266, 2.6845662593841553, 2.882901668548584, 3.0812370777130127, 3.2795724868774414, 3.47790789604187, 3.676243305206299, 3.8745787143707275, 4.072914123535156, 4.271249771118164, 4.469584941864014, 4.667920112609863, 4.866255760192871, 5.064591407775879, 5.2629265785217285, 5.461261749267578, 5.659597396850586, 5.857933044433594, 6.056268215179443, 6.254603385925293, 6.452939033508301, 6.651274681091309, 6.849609851837158, 7.047945022583008, 7.246280670166016]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 23.0, 23.0, 38.0, 76.0, 153.0, 346.0, 697.0, 1929.0, 6512.0, 29788.0, 647368.0, 3457695.0, 38319.0, 7503.0, 2231.0, 835.0, 354.0, 148.0, 111.0, 49.0, 36.0, 11.0, 15.0, 9.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150390625, -3.060546875, -2.970703125, -2.880859375, -2.791015625, -2.701171875, -2.611328125, -2.521484375, -2.431640625, -2.341796875, -2.251953125, -2.162109375, -2.072265625, -1.982421875, -1.892578125, -1.802734375, -1.712890625, -1.623046875, -1.533203125, -1.443359375, -1.353515625, -1.263671875, -1.173828125, -1.083984375, -0.994140625, -0.904296875, -0.814453125, -0.724609375, -0.634765625, -0.544921875, -0.455078125, -0.365234375, -0.275390625, -0.185546875, -0.095703125, -0.005859375, 0.083984375, 0.173828125, 0.263671875, 0.353515625, 0.443359375, 0.533203125, 0.623046875, 0.712890625, 0.802734375, 0.892578125, 0.982421875, 1.072265625, 1.162109375, 1.251953125, 1.341796875, 1.431640625, 1.521484375, 1.611328125, 1.701171875, 1.791015625, 1.880859375, 1.970703125, 2.060546875, 2.150390625, 2.240234375, 2.330078125, 2.419921875, 2.509765625, 2.599609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 4.0, 12.0, 12.0, 23.0, 21.0, 24.0, 34.0, 46.0, 33.0, 47.0, 64.0, 57.0, 71.0, 57.0, 57.0, 67.0, 58.0, 61.0, 56.0, 41.0, 22.0, 38.0, 23.0, 22.0, 13.0, 14.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.2568321228027344, -0.24681854248046875, -0.23680496215820312, -0.2267913818359375, -0.21677780151367188, -0.20676422119140625, -0.19675064086914062, -0.186737060546875, -0.17672348022460938, -0.16670989990234375, -0.15669631958007812, -0.1466827392578125, -0.13666915893554688, -0.12665557861328125, -0.11664199829101562, -0.10662841796875, -0.09661483764648438, -0.08660125732421875, -0.07658767700195312, -0.0665740966796875, -0.056560516357421875, -0.04654693603515625, -0.036533355712890625, -0.026519775390625, -0.016506195068359375, -0.00649261474609375, 0.003520965576171875, 0.0135345458984375, 0.023548126220703125, 0.03356170654296875, 0.043575286865234375, 0.0535888671875, 0.06360244750976562, 0.07361602783203125, 0.08362960815429688, 0.0936431884765625, 0.10365676879882812, 0.11367034912109375, 0.12368392944335938, 0.133697509765625, 0.14371109008789062, 0.15372467041015625, 0.16373825073242188, 0.1737518310546875, 0.18376541137695312, 0.19377899169921875, 0.20379257202148438, 0.21380615234375, 0.22381973266601562, 0.23383331298828125, 0.24384689331054688, 0.2538604736328125, 0.2638740539550781, 0.27388763427734375, 0.2839012145996094, 0.293914794921875, 0.3039283752441406, 0.31394195556640625, 0.3239555358886719, 0.3339691162109375, 0.3439826965332031, 0.35399627685546875, 0.3640098571777344, 0.3740234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 10.0, 17.0, 25.0, 43.0, 77.0, 87.0, 162.0, 260.0, 432.0, 726.0, 1221.0, 2230.0, 4193.0, 8453.0, 18756.0, 49170.0, 197448.0, 3469495.0, 333875.0, 63912.0, 22779.0, 10188.0, 4827.0, 2535.0, 1341.0, 801.0, 455.0, 306.0, 169.0, 105.0, 70.0, 36.0, 23.0, 20.0, 12.0, 10.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7294921875, -1.6822662353515625, -1.635040283203125, -1.5878143310546875, -1.54058837890625, -1.4933624267578125, -1.446136474609375, -1.3989105224609375, -1.3516845703125, -1.3044586181640625, -1.257232666015625, -1.2100067138671875, -1.16278076171875, -1.1155548095703125, -1.068328857421875, -1.0211029052734375, -0.973876953125, -0.9266510009765625, -0.879425048828125, -0.8321990966796875, -0.78497314453125, -0.7377471923828125, -0.690521240234375, -0.6432952880859375, -0.5960693359375, -0.5488433837890625, -0.501617431640625, -0.4543914794921875, -0.40716552734375, -0.3599395751953125, -0.312713623046875, -0.2654876708984375, -0.21826171875, -0.1710357666015625, -0.123809814453125, -0.0765838623046875, -0.02935791015625, 0.0178680419921875, 0.065093994140625, 0.1123199462890625, 0.1595458984375, 0.2067718505859375, 0.253997802734375, 0.3012237548828125, 0.34844970703125, 0.3956756591796875, 0.442901611328125, 0.4901275634765625, 0.537353515625, 0.5845794677734375, 0.631805419921875, 0.6790313720703125, 0.72625732421875, 0.7734832763671875, 0.820709228515625, 0.8679351806640625, 0.9151611328125, 0.9623870849609375, 1.009613037109375, 1.0568389892578125, 1.10406494140625, 1.1512908935546875, 1.198516845703125, 1.2457427978515625, 1.29296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 8.0, 14.0, 11.0, 16.0, 16.0, 18.0, 37.0, 37.0, 70.0, 99.0, 192.0, 484.0, 2075.0, 471.0, 192.0, 112.0, 66.0, 41.0, 26.0, 13.0, 16.0, 15.0, 13.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.85791015625, -0.8377227783203125, -0.817535400390625, -0.7973480224609375, -0.77716064453125, -0.7569732666015625, -0.736785888671875, -0.7165985107421875, -0.6964111328125, -0.6762237548828125, -0.656036376953125, -0.6358489990234375, -0.61566162109375, -0.5954742431640625, -0.575286865234375, -0.5550994873046875, -0.534912109375, -0.5147247314453125, -0.494537353515625, -0.4743499755859375, -0.45416259765625, -0.4339752197265625, -0.413787841796875, -0.3936004638671875, -0.3734130859375, -0.3532257080078125, -0.333038330078125, -0.3128509521484375, -0.29266357421875, -0.2724761962890625, -0.252288818359375, -0.2321014404296875, -0.2119140625, -0.1917266845703125, -0.171539306640625, -0.1513519287109375, -0.13116455078125, -0.1109771728515625, -0.090789794921875, -0.0706024169921875, -0.0504150390625, -0.0302276611328125, -0.010040283203125, 0.0101470947265625, 0.03033447265625, 0.0505218505859375, 0.070709228515625, 0.0908966064453125, 0.111083984375, 0.1312713623046875, 0.151458740234375, 0.1716461181640625, 0.19183349609375, 0.2120208740234375, 0.232208251953125, 0.2523956298828125, 0.2725830078125, 0.2927703857421875, 0.312957763671875, 0.3331451416015625, 0.35333251953125, 0.3735198974609375, 0.393707275390625, 0.4138946533203125, 0.43408203125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 12.0, 13.0, 15.0, 35.0, 72.0, 106.0, 155.0, 172.0, 169.0, 95.0, 64.0, 38.0, 22.0, 18.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1535115242004395, -4.990081787109375, -4.826652526855469, -4.663222789764404, -4.499793529510498, -4.336363792419434, -4.172934532165527, -4.009504795074463, -3.8460752964019775, -3.682645797729492, -3.519216299057007, -3.3557868003845215, -3.192357063293457, -3.028927803039551, -2.8654980659484863, -2.702068567276001, -2.5386390686035156, -2.3752095699310303, -2.211780071258545, -2.0483505725860596, -1.8849209547042847, -1.7214914560317993, -1.5580618381500244, -1.394632339477539, -1.2312028408050537, -1.0677733421325684, -0.9043437838554382, -0.7409142255783081, -0.5774847269058228, -0.4140552282333374, -0.2506256699562073, -0.08719611167907715, 0.07623291015625, 0.23966243863105774, 0.4030919671058655, 0.5665215253829956, 0.729951024055481, 0.8933805227279663, 1.0568101406097412, 1.2202396392822266, 1.383669137954712, 1.5470986366271973, 1.7105281352996826, 1.8739577531814575, 2.0373873710632324, 2.2008166313171387, 2.364246368408203, 2.5276758670806885, 2.691105365753174, 2.854534864425659, 3.0179643630981445, 3.18139386177063, 3.3448233604431152, 3.5082530975341797, 3.671682596206665, 3.8351120948791504, 3.9985415935516357, 4.161971092224121, 4.3254008293151855, 4.488830089569092, 4.652259826660156, 4.8156890869140625, 4.979118824005127, 5.142548561096191, 5.305977821350098]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 10.0, 8.0, 14.0, 10.0, 13.0, 19.0, 17.0, 18.0, 19.0, 19.0, 37.0, 28.0, 43.0, 45.0, 36.0, 42.0, 38.0, 43.0, 33.0, 42.0, 38.0, 37.0, 45.0, 39.0, 34.0, 36.0, 35.0, 22.0, 27.0, 24.0, 26.0, 20.0, 15.0, 13.0, 10.0, 4.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8968169689178467, -1.8399814367294312, -1.7831459045410156, -1.7263103723526, -1.6694748401641846, -1.612639307975769, -1.5558037757873535, -1.498968243598938, -1.4421327114105225, -1.385297179222107, -1.3284616470336914, -1.2716261148452759, -1.2147905826568604, -1.1579550504684448, -1.1011195182800293, -1.0442839860916138, -0.9874483942985535, -0.9306128621101379, -0.8737773299217224, -0.8169417977333069, -0.7601062655448914, -0.703270673751831, -0.6464351415634155, -0.589599609375, -0.5327640771865845, -0.47592854499816895, -0.4190930128097534, -0.3622574806213379, -0.30542194843292236, -0.24858638644218445, -0.19175085425376892, -0.1349153220653534, -0.07807981967926025, -0.021244283765554428, 0.0355912521481514, 0.09242679178714752, 0.14926232397556305, 0.20609787106513977, 0.2629334032535553, 0.3197689354419708, 0.37660446763038635, 0.4334399998188019, 0.4902755320072174, 0.5471110939979553, 0.6039466261863708, 0.6607821583747864, 0.7176176905632019, 0.7744532227516174, 0.831288754940033, 0.8881242871284485, 0.944959819316864, 1.0017954111099243, 1.0586309432983398, 1.1154664754867554, 1.172302007675171, 1.2291375398635864, 1.285973072052002, 1.3428086042404175, 1.399644136428833, 1.4564796686172485, 1.513315200805664, 1.5701507329940796, 1.6269862651824951, 1.6838217973709106, 1.7406573295593262]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 21.0, 22.0, 30.0, 66.0, 97.0, 174.0, 329.0, 608.0, 1178.0, 2534.0, 6231.0, 16302.0, 44157.0, 129989.0, 400843.0, 296019.0, 95384.0, 33214.0, 12316.0, 4897.0, 2082.0, 979.0, 446.0, 254.0, 146.0, 80.0, 61.0, 25.0, 17.0, 15.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.65625, -1.6042633056640625, -1.552276611328125, -1.5002899169921875, -1.44830322265625, -1.3963165283203125, -1.344329833984375, -1.2923431396484375, -1.2403564453125, -1.1883697509765625, -1.136383056640625, -1.0843963623046875, -1.03240966796875, -0.9804229736328125, -0.928436279296875, -0.8764495849609375, -0.824462890625, -0.7724761962890625, -0.720489501953125, -0.6685028076171875, -0.61651611328125, -0.5645294189453125, -0.512542724609375, -0.4605560302734375, -0.4085693359375, -0.3565826416015625, -0.304595947265625, -0.2526092529296875, -0.20062255859375, -0.1486358642578125, -0.096649169921875, -0.0446624755859375, 0.00732421875, 0.0593109130859375, 0.111297607421875, 0.1632843017578125, 0.21527099609375, 0.2672576904296875, 0.319244384765625, 0.3712310791015625, 0.4232177734375, 0.4752044677734375, 0.527191162109375, 0.5791778564453125, 0.63116455078125, 0.6831512451171875, 0.735137939453125, 0.7871246337890625, 0.839111328125, 0.8910980224609375, 0.943084716796875, 0.9950714111328125, 1.04705810546875, 1.0990447998046875, 1.151031494140625, 1.2030181884765625, 1.2550048828125, 1.3069915771484375, 1.358978271484375, 1.4109649658203125, 1.46295166015625, 1.5149383544921875, 1.566925048828125, 1.6189117431640625, 1.6708984375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 10.0, 13.0, 13.0, 22.0, 22.0, 27.0, 30.0, 35.0, 54.0, 48.0, 57.0, 61.0, 61.0, 62.0, 43.0, 62.0, 48.0, 65.0, 51.0, 49.0, 28.0, 32.0, 31.0, 16.0, 18.0, 14.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.22687721252441406, -0.21730422973632812, -0.2077312469482422, -0.19815826416015625, -0.1885852813720703, -0.17901229858398438, -0.16943931579589844, -0.1598663330078125, -0.15029335021972656, -0.14072036743164062, -0.1311473846435547, -0.12157440185546875, -0.11200141906738281, -0.10242843627929688, -0.09285545349121094, -0.083282470703125, -0.07370948791503906, -0.06413650512695312, -0.05456352233886719, -0.04499053955078125, -0.03541755676269531, -0.025844573974609375, -0.016271591186523438, -0.0066986083984375, 0.0028743743896484375, 0.012447357177734375, 0.022020339965820312, 0.03159332275390625, 0.04116630554199219, 0.050739288330078125, 0.06031227111816406, 0.06988525390625, 0.07945823669433594, 0.08903121948242188, 0.09860420227050781, 0.10817718505859375, 0.11775016784667969, 0.12732315063476562, 0.13689613342285156, 0.1464691162109375, 0.15604209899902344, 0.16561508178710938, 0.1751880645751953, 0.18476104736328125, 0.1943340301513672, 0.20390701293945312, 0.21347999572753906, 0.223052978515625, 0.23262596130371094, 0.24219894409179688, 0.2517719268798828, 0.26134490966796875, 0.2709178924560547, 0.2804908752441406, 0.29006385803222656, 0.2996368408203125, 0.30920982360839844, 0.3187828063964844, 0.3283557891845703, 0.33792877197265625, 0.3475017547607422, 0.3570747375488281, 0.36664772033691406, 0.376220703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 10.0, 15.0, 25.0, 16.0, 23.0, 39.0, 58.0, 94.0, 148.0, 243.0, 436.0, 925.0, 2336.0, 9592.0, 58120.0, 479323.0, 431562.0, 52610.0, 8598.0, 2298.0, 913.0, 452.0, 226.0, 150.0, 99.0, 62.0, 45.0, 24.0, 29.0, 26.0, 13.0, 11.0, 3.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.426849365234375, -2.34588623046875, -2.264923095703125, -2.1839599609375, -2.102996826171875, -2.02203369140625, -1.941070556640625, -1.860107421875, -1.779144287109375, -1.69818115234375, -1.617218017578125, -1.5362548828125, -1.455291748046875, -1.37432861328125, -1.293365478515625, -1.21240234375, -1.131439208984375, -1.05047607421875, -0.969512939453125, -0.8885498046875, -0.807586669921875, -0.72662353515625, -0.645660400390625, -0.564697265625, -0.483734130859375, -0.40277099609375, -0.321807861328125, -0.2408447265625, -0.159881591796875, -0.07891845703125, 0.002044677734375, 0.0830078125, 0.163970947265625, 0.24493408203125, 0.325897216796875, 0.4068603515625, 0.487823486328125, 0.56878662109375, 0.649749755859375, 0.730712890625, 0.811676025390625, 0.89263916015625, 0.973602294921875, 1.0545654296875, 1.135528564453125, 1.21649169921875, 1.297454833984375, 1.37841796875, 1.459381103515625, 1.54034423828125, 1.621307373046875, 1.7022705078125, 1.783233642578125, 1.86419677734375, 1.945159912109375, 2.026123046875, 2.107086181640625, 2.18804931640625, 2.269012451171875, 2.3499755859375, 2.430938720703125, 2.51190185546875, 2.592864990234375, 2.673828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 5.0, 4.0, 6.0, 10.0, 13.0, 9.0, 10.0, 16.0, 15.0, 24.0, 18.0, 30.0, 25.0, 37.0, 45.0, 43.0, 37.0, 40.0, 38.0, 47.0, 44.0, 50.0, 46.0, 30.0, 50.0, 36.0, 35.0, 35.0, 27.0, 22.0, 26.0, 22.0, 16.0, 19.0, 18.0, 13.0, 9.0, 6.0, 7.0, 2.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0439453125, -1.0097808837890625, -0.975616455078125, -0.9414520263671875, -0.90728759765625, -0.8731231689453125, -0.838958740234375, -0.8047943115234375, -0.7706298828125, -0.7364654541015625, -0.702301025390625, -0.6681365966796875, -0.63397216796875, -0.5998077392578125, -0.565643310546875, -0.5314788818359375, -0.497314453125, -0.4631500244140625, -0.428985595703125, -0.3948211669921875, -0.36065673828125, -0.3264923095703125, -0.292327880859375, -0.2581634521484375, -0.2239990234375, -0.1898345947265625, -0.155670166015625, -0.1215057373046875, -0.08734130859375, -0.0531768798828125, -0.019012451171875, 0.0151519775390625, 0.04931640625, 0.0834808349609375, 0.117645263671875, 0.1518096923828125, 0.18597412109375, 0.2201385498046875, 0.254302978515625, 0.2884674072265625, 0.3226318359375, 0.3567962646484375, 0.390960693359375, 0.4251251220703125, 0.45928955078125, 0.4934539794921875, 0.527618408203125, 0.5617828369140625, 0.595947265625, 0.6301116943359375, 0.664276123046875, 0.6984405517578125, 0.73260498046875, 0.7667694091796875, 0.800933837890625, 0.8350982666015625, 0.8692626953125, 0.9034271240234375, 0.937591552734375, 0.9717559814453125, 1.00592041015625, 1.0400848388671875, 1.074249267578125, 1.1084136962890625, 1.142578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 9.0, 4.0, 16.0, 13.0, 25.0, 41.0, 58.0, 108.0, 172.0, 315.0, 501.0, 1080.0, 2314.0, 6419.0, 29900.0, 768698.0, 213903.0, 16852.0, 4507.0, 1709.0, 840.0, 396.0, 248.0, 147.0, 107.0, 62.0, 31.0, 17.0, 15.0, 11.0, 8.0, 8.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9296875, -3.825836181640625, -3.72198486328125, -3.618133544921875, -3.5142822265625, -3.410430908203125, -3.30657958984375, -3.202728271484375, -3.098876953125, -2.995025634765625, -2.89117431640625, -2.787322998046875, -2.6834716796875, -2.579620361328125, -2.47576904296875, -2.371917724609375, -2.26806640625, -2.164215087890625, -2.06036376953125, -1.956512451171875, -1.8526611328125, -1.748809814453125, -1.64495849609375, -1.541107177734375, -1.437255859375, -1.333404541015625, -1.22955322265625, -1.125701904296875, -1.0218505859375, -0.917999267578125, -0.81414794921875, -0.710296630859375, -0.6064453125, -0.502593994140625, -0.39874267578125, -0.294891357421875, -0.1910400390625, -0.087188720703125, 0.01666259765625, 0.120513916015625, 0.224365234375, 0.328216552734375, 0.43206787109375, 0.535919189453125, 0.6397705078125, 0.743621826171875, 0.84747314453125, 0.951324462890625, 1.05517578125, 1.159027099609375, 1.26287841796875, 1.366729736328125, 1.4705810546875, 1.574432373046875, 1.67828369140625, 1.782135009765625, 1.885986328125, 1.989837646484375, 2.09368896484375, 2.197540283203125, 2.3013916015625, 2.405242919921875, 2.50909423828125, 2.612945556640625, 2.716796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 9.0, 8.0, 24.0, 47.0, 85.0, 163.0, 303.0, 164.0, 92.0, 44.0, 21.0, 8.0, 11.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006422996520996094, -0.0006218776106834412, -0.000601455569267273, -0.0005810335278511047, -0.0005606114864349365, -0.0005401894450187683, -0.0005197674036026001, -0.0004993453621864319, -0.00047892332077026367, -0.00045850127935409546, -0.00043807923793792725, -0.00041765719652175903, -0.0003972351551055908, -0.0003768131136894226, -0.0003563910722732544, -0.0003359690308570862, -0.00031554698944091797, -0.00029512494802474976, -0.00027470290660858154, -0.00025428086519241333, -0.00023385882377624512, -0.0002134367823600769, -0.0001930147409439087, -0.00017259269952774048, -0.00015217065811157227, -0.00013174861669540405, -0.00011132657527923584, -9.090453386306763e-05, -7.048249244689941e-05, -5.00604510307312e-05, -2.9638409614562988e-05, -9.216368198394775e-06, 1.1205673217773438e-05, 3.162771463394165e-05, 5.204975605010986e-05, 7.247179746627808e-05, 9.289383888244629e-05, 0.0001133158802986145, 0.00013373792171478271, 0.00015415996313095093, 0.00017458200454711914, 0.00019500404596328735, 0.00021542608737945557, 0.00023584812879562378, 0.000256270170211792, 0.0002766922116279602, 0.0002971142530441284, 0.00031753629446029663, 0.00033795833587646484, 0.00035838037729263306, 0.00037880241870880127, 0.0003992244601249695, 0.0004196465015411377, 0.0004400685429573059, 0.0004604905843734741, 0.00048091262578964233, 0.0005013346672058105, 0.0005217567086219788, 0.000542178750038147, 0.0005626007914543152, 0.0005830228328704834, 0.0006034448742866516, 0.0006238669157028198, 0.000644288957118988, 0.0006647109985351562]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 12.0, 21.0, 23.0, 38.0, 65.0, 87.0, 183.0, 328.0, 822.0, 2302.0, 8322.0, 60808.0, 929645.0, 36242.0, 6358.0, 1859.0, 700.0, 328.0, 173.0, 86.0, 45.0, 40.0, 22.0, 13.0, 11.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.51171875, -5.368194580078125, -5.22467041015625, -5.081146240234375, -4.9376220703125, -4.794097900390625, -4.65057373046875, -4.507049560546875, -4.363525390625, -4.220001220703125, -4.07647705078125, -3.932952880859375, -3.7894287109375, -3.645904541015625, -3.50238037109375, -3.358856201171875, -3.21533203125, -3.071807861328125, -2.92828369140625, -2.784759521484375, -2.6412353515625, -2.497711181640625, -2.35418701171875, -2.210662841796875, -2.067138671875, -1.923614501953125, -1.78009033203125, -1.636566162109375, -1.4930419921875, -1.349517822265625, -1.20599365234375, -1.062469482421875, -0.9189453125, -0.775421142578125, -0.63189697265625, -0.488372802734375, -0.3448486328125, -0.201324462890625, -0.05780029296875, 0.085723876953125, 0.229248046875, 0.372772216796875, 0.51629638671875, 0.659820556640625, 0.8033447265625, 0.946868896484375, 1.09039306640625, 1.233917236328125, 1.37744140625, 1.520965576171875, 1.66448974609375, 1.808013916015625, 1.9515380859375, 2.095062255859375, 2.23858642578125, 2.382110595703125, 2.525634765625, 2.669158935546875, 2.81268310546875, 2.956207275390625, 3.0997314453125, 3.243255615234375, 3.38677978515625, 3.530303955078125, 3.673828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 6.0, 6.0, 8.0, 8.0, 4.0, 24.0, 25.0, 59.0, 122.0, 275.0, 207.0, 108.0, 38.0, 27.0, 13.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.447265625, -2.38421630859375, -2.3211669921875, -2.25811767578125, -2.195068359375, -2.13201904296875, -2.0689697265625, -2.00592041015625, -1.94287109375, -1.87982177734375, -1.8167724609375, -1.75372314453125, -1.690673828125, -1.62762451171875, -1.5645751953125, -1.50152587890625, -1.4384765625, -1.37542724609375, -1.3123779296875, -1.24932861328125, -1.186279296875, -1.12322998046875, -1.0601806640625, -0.99713134765625, -0.93408203125, -0.87103271484375, -0.8079833984375, -0.74493408203125, -0.681884765625, -0.61883544921875, -0.5557861328125, -0.49273681640625, -0.4296875, -0.36663818359375, -0.3035888671875, -0.24053955078125, -0.177490234375, -0.11444091796875, -0.0513916015625, 0.01165771484375, 0.07470703125, 0.13775634765625, 0.2008056640625, 0.26385498046875, 0.326904296875, 0.38995361328125, 0.4530029296875, 0.51605224609375, 0.5791015625, 0.64215087890625, 0.7052001953125, 0.76824951171875, 0.831298828125, 0.89434814453125, 0.9573974609375, 1.02044677734375, 1.08349609375, 1.14654541015625, 1.2095947265625, 1.27264404296875, 1.335693359375, 1.39874267578125, 1.4617919921875, 1.52484130859375, 1.587890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 7.0, 7.0, 17.0, 29.0, 59.0, 78.0, 136.0, 167.0, 165.0, 124.0, 94.0, 47.0, 30.0, 24.0, 8.0, 2.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.164249420166016, -17.601972579956055, -17.039695739746094, -16.477418899536133, -15.915142059326172, -15.352865219116211, -14.79058837890625, -14.228311538696289, -13.666034698486328, -13.103757858276367, -12.541481018066406, -11.979204177856445, -11.416927337646484, -10.854650497436523, -10.292373657226562, -9.730096817016602, -9.167820930480957, -8.605544090270996, -8.043267250061035, -7.480990409851074, -6.918713569641113, -6.356436729431152, -5.79416036605835, -5.231883525848389, -4.669606685638428, -4.107329845428467, -3.545053005218506, -2.982776403427124, -2.420499563217163, -1.8582227230072021, -1.2959461212158203, -0.7336692810058594, -0.17139244079589844, 0.3908843398094177, 0.9531611204147339, 1.5154378414154053, 2.077714681625366, 2.639991521835327, 3.202268123626709, 3.76454496383667, 4.326821804046631, 4.889098644256592, 5.451375484466553, 6.0136518478393555, 6.575928688049316, 7.138205528259277, 7.700482368469238, 8.2627592086792, 8.82503604888916, 9.387312889099121, 9.949589729309082, 10.511866569519043, 11.074143409729004, 11.636420249938965, 12.19869613647461, 12.76097297668457, 13.323249816894531, 13.885526657104492, 14.447803497314453, 15.010080337524414, 15.572357177734375, 16.134634017944336, 16.696910858154297, 17.259187698364258, 17.82146453857422]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 14.0, 10.0, 10.0, 14.0, 18.0, 13.0, 15.0, 31.0, 25.0, 43.0, 29.0, 27.0, 48.0, 36.0, 52.0, 55.0, 37.0, 37.0, 45.0, 35.0, 39.0, 43.0, 44.0, 32.0, 30.0, 28.0, 21.0, 33.0, 21.0, 13.0, 19.0, 18.0, 11.0, 9.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.985133171081543, -6.7535247802734375, -6.521915912628174, -6.290307521820068, -6.058699131011963, -5.827090263366699, -5.595481872558594, -5.363873481750488, -5.132265090942383, -4.900656700134277, -4.669047832489014, -4.437439441680908, -4.205831050872803, -3.974222421646118, -3.7426137924194336, -3.511005401611328, -3.2793965339660645, -3.04778790473938, -2.8161795139312744, -2.58457088470459, -2.3529624938964844, -2.1213538646698, -1.8897452354431152, -1.6581367254257202, -1.4265282154083252, -1.1949197053909302, -0.9633111357688904, -0.7317025661468506, -0.5000940561294556, -0.26848554611206055, -0.03687691688537598, 0.19473159313201904, 0.42634010314941406, 0.6579486131668091, 0.8895571827888489, 1.1211657524108887, 1.3527742624282837, 1.5843827724456787, 1.8159914016723633, 2.0475997924804688, 2.2792084217071533, 2.510817050933838, 2.7424254417419434, 2.974034070968628, 3.2056427001953125, 3.437251091003418, 3.6688597202301025, 3.900468349456787, 4.132076740264893, 4.363685131072998, 4.595293998718262, 4.826902389526367, 5.058510780334473, 5.290119171142578, 5.521728038787842, 5.753336429595947, 5.984945297241211, 6.216553688049316, 6.44816255569458, 6.6797709465026855, 6.911379337310791, 7.142988204956055, 7.37459659576416, 7.606204986572266, 7.837813377380371]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 14.0, 22.0, 30.0, 42.0, 68.0, 108.0, 172.0, 274.0, 591.0, 1126.0, 2199.0, 4999.0, 12616.0, 37998.0, 174204.0, 3671303.0, 220448.0, 43165.0, 14171.0, 5609.0, 2437.0, 1199.0, 591.0, 343.0, 179.0, 111.0, 83.0, 49.0, 35.0, 29.0, 18.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.005859375, -1.942291259765625, -1.87872314453125, -1.815155029296875, -1.7515869140625, -1.688018798828125, -1.62445068359375, -1.560882568359375, -1.497314453125, -1.433746337890625, -1.37017822265625, -1.306610107421875, -1.2430419921875, -1.179473876953125, -1.11590576171875, -1.052337646484375, -0.98876953125, -0.925201416015625, -0.86163330078125, -0.798065185546875, -0.7344970703125, -0.670928955078125, -0.60736083984375, -0.543792724609375, -0.480224609375, -0.416656494140625, -0.35308837890625, -0.289520263671875, -0.2259521484375, -0.162384033203125, -0.09881591796875, -0.035247802734375, 0.0283203125, 0.091888427734375, 0.15545654296875, 0.219024658203125, 0.2825927734375, 0.346160888671875, 0.40972900390625, 0.473297119140625, 0.536865234375, 0.600433349609375, 0.66400146484375, 0.727569580078125, 0.7911376953125, 0.854705810546875, 0.91827392578125, 0.981842041015625, 1.04541015625, 1.108978271484375, 1.17254638671875, 1.236114501953125, 1.2996826171875, 1.363250732421875, 1.42681884765625, 1.490386962890625, 1.553955078125, 1.617523193359375, 1.68109130859375, 1.744659423828125, 1.8082275390625, 1.871795654296875, 1.93536376953125, 1.998931884765625, 2.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 16.0, 14.0, 15.0, 22.0, 25.0, 38.0, 42.0, 49.0, 52.0, 57.0, 54.0, 60.0, 62.0, 53.0, 53.0, 58.0, 56.0, 48.0, 36.0, 32.0, 41.0, 23.0, 23.0, 14.0, 9.0, 11.0, 6.0, 6.0, 3.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.2612953186035156, -0.25110626220703125, -0.24091720581054688, -0.2307281494140625, -0.22053909301757812, -0.21035003662109375, -0.20016098022460938, -0.189971923828125, -0.17978286743164062, -0.16959381103515625, -0.15940475463867188, -0.1492156982421875, -0.13902664184570312, -0.12883758544921875, -0.11864852905273438, -0.10845947265625, -0.09827041625976562, -0.08808135986328125, -0.07789230346679688, -0.0677032470703125, -0.057514190673828125, -0.04732513427734375, -0.037136077880859375, -0.026947021484375, -0.016757965087890625, -0.00656890869140625, 0.003620147705078125, 0.0138092041015625, 0.023998260498046875, 0.03418731689453125, 0.044376373291015625, 0.0545654296875, 0.06475448608398438, 0.07494354248046875, 0.08513259887695312, 0.0953216552734375, 0.10551071166992188, 0.11569976806640625, 0.12588882446289062, 0.136077880859375, 0.14626693725585938, 0.15645599365234375, 0.16664505004882812, 0.1768341064453125, 0.18702316284179688, 0.19721221923828125, 0.20740127563476562, 0.21759033203125, 0.22777938842773438, 0.23796844482421875, 0.24815750122070312, 0.2583465576171875, 0.2685356140136719, 0.27872467041015625, 0.2889137268066406, 0.299102783203125, 0.3092918395996094, 0.31948089599609375, 0.3296699523925781, 0.3398590087890625, 0.3500480651855469, 0.36023712158203125, 0.3704261779785156, 0.380615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 10.0, 14.0, 9.0, 11.0, 18.0, 19.0, 37.0, 45.0, 90.0, 154.0, 199.0, 410.0, 810.0, 1763.0, 3964.0, 10234.0, 32000.0, 146338.0, 3511741.0, 402104.0, 57293.0, 16298.0, 5889.0, 2428.0, 1125.0, 558.0, 261.0, 160.0, 98.0, 62.0, 37.0, 33.0, 17.0, 11.0, 8.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.1219482421875, -2.050537109375, -1.9791259765625, -1.90771484375, -1.8363037109375, -1.764892578125, -1.6934814453125, -1.6220703125, -1.5506591796875, -1.479248046875, -1.4078369140625, -1.33642578125, -1.2650146484375, -1.193603515625, -1.1221923828125, -1.05078125, -0.9793701171875, -0.907958984375, -0.8365478515625, -0.76513671875, -0.6937255859375, -0.622314453125, -0.5509033203125, -0.4794921875, -0.4080810546875, -0.336669921875, -0.2652587890625, -0.19384765625, -0.1224365234375, -0.051025390625, 0.0203857421875, 0.091796875, 0.1632080078125, 0.234619140625, 0.3060302734375, 0.37744140625, 0.4488525390625, 0.520263671875, 0.5916748046875, 0.6630859375, 0.7344970703125, 0.805908203125, 0.8773193359375, 0.94873046875, 1.0201416015625, 1.091552734375, 1.1629638671875, 1.234375, 1.3057861328125, 1.377197265625, 1.4486083984375, 1.52001953125, 1.5914306640625, 1.662841796875, 1.7342529296875, 1.8056640625, 1.8770751953125, 1.948486328125, 2.0198974609375, 2.09130859375, 2.1627197265625, 2.234130859375, 2.3055419921875, 2.376953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 9.0, 11.0, 26.0, 30.0, 31.0, 58.0, 74.0, 123.0, 235.0, 606.0, 1851.0, 437.0, 171.0, 109.0, 69.0, 53.0, 43.0, 27.0, 20.0, 13.0, 8.0, 9.0, 4.0, 8.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.98095703125, -0.956024169921875, -0.93109130859375, -0.906158447265625, -0.8812255859375, -0.856292724609375, -0.83135986328125, -0.806427001953125, -0.781494140625, -0.756561279296875, -0.73162841796875, -0.706695556640625, -0.6817626953125, -0.656829833984375, -0.63189697265625, -0.606964111328125, -0.58203125, -0.557098388671875, -0.53216552734375, -0.507232666015625, -0.4822998046875, -0.457366943359375, -0.43243408203125, -0.407501220703125, -0.382568359375, -0.357635498046875, -0.33270263671875, -0.307769775390625, -0.2828369140625, -0.257904052734375, -0.23297119140625, -0.208038330078125, -0.18310546875, -0.158172607421875, -0.13323974609375, -0.108306884765625, -0.0833740234375, -0.058441162109375, -0.03350830078125, -0.008575439453125, 0.016357421875, 0.041290283203125, 0.06622314453125, 0.091156005859375, 0.1160888671875, 0.141021728515625, 0.16595458984375, 0.190887451171875, 0.2158203125, 0.240753173828125, 0.26568603515625, 0.290618896484375, 0.3155517578125, 0.340484619140625, 0.36541748046875, 0.390350341796875, 0.415283203125, 0.440216064453125, 0.46514892578125, 0.490081787109375, 0.5150146484375, 0.539947509765625, 0.56488037109375, 0.589813232421875, 0.61474609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 15.0, 19.0, 31.0, 63.0, 107.0, 156.0, 168.0, 157.0, 100.0, 69.0, 44.0, 32.0, 17.0, 15.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90494966506958, -4.677546501159668, -4.450143337249756, -4.222740173339844, -3.9953370094299316, -3.7679338455200195, -3.5405306816101074, -3.3131275177001953, -3.085724353790283, -2.858321189880371, -2.630918025970459, -2.403514862060547, -2.1761116981506348, -1.9487085342407227, -1.7213053703308105, -1.4939022064208984, -1.2664990425109863, -1.0390958786010742, -0.8116927146911621, -0.58428955078125, -0.3568863868713379, -0.12948322296142578, 0.09791994094848633, 0.32532310485839844, 0.5527262687683105, 0.7801294326782227, 1.0075325965881348, 1.2349357604980469, 1.462338924407959, 1.689742088317871, 1.9171452522277832, 2.1445484161376953, 2.3719520568847656, 2.5993552207946777, 2.82675838470459, 3.054161548614502, 3.281564712524414, 3.508967876434326, 3.7363710403442383, 3.9637742042541504, 4.1911773681640625, 4.418580532073975, 4.645983695983887, 4.873386859893799, 5.100790023803711, 5.328193187713623, 5.555596351623535, 5.782999515533447, 6.010402679443359, 6.2378058433532715, 6.465209007263184, 6.692612171173096, 6.920015335083008, 7.14741849899292, 7.374821662902832, 7.602224826812744, 7.829627990722656, 8.057031631469727, 8.28443431854248, 8.511837005615234, 8.739240646362305, 8.966644287109375, 9.194046974182129, 9.421449661254883, 9.648853302001953]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 9.0, 7.0, 14.0, 12.0, 15.0, 15.0, 14.0, 21.0, 22.0, 22.0, 35.0, 28.0, 44.0, 40.0, 38.0, 30.0, 47.0, 38.0, 45.0, 52.0, 39.0, 26.0, 40.0, 43.0, 32.0, 39.0, 33.0, 32.0, 30.0, 29.0, 27.0, 9.0, 11.0, 15.0, 14.0, 3.0, 7.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3729846477508545, -2.2955424785614014, -2.2181003093719482, -2.140658378601074, -2.063216209411621, -1.985774040222168, -1.9083318710327148, -1.8308898210525513, -1.7534477710723877, -1.6760056018829346, -1.598563551902771, -1.5211213827133179, -1.4436793327331543, -1.3662371635437012, -1.288794994354248, -1.2113529443740845, -1.1339107751846313, -1.0564686059951782, -0.9790265560150146, -0.9015843868255615, -0.824142336845398, -0.7467001676559448, -0.6692580580711365, -0.5918159484863281, -0.5143738389015198, -0.4369317293167114, -0.3594896197319031, -0.28204748034477234, -0.204605370759964, -0.12716326117515564, -0.0497211217880249, 0.027720987796783447, 0.1051630973815918, 0.18260520696640015, 0.2600473165512085, 0.33748945593833923, 0.4149315655231476, 0.49237367510795593, 0.5698158144950867, 0.647257924079895, 0.7247000336647034, 0.8021421432495117, 0.8795842528343201, 0.9570263624191284, 1.0344685316085815, 1.1119105815887451, 1.1893527507781982, 1.2667949199676514, 1.344236969947815, 1.421679139137268, 1.4991211891174316, 1.5765633583068848, 1.6540054082870483, 1.7314475774765015, 1.808889627456665, 1.8863317966461182, 1.9637739658355713, 2.0412161350250244, 2.1186583042144775, 2.1961002349853516, 2.2735424041748047, 2.350984573364258, 2.428426742553711, 2.505868911743164, 2.583310842514038]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 11.0, 7.0, 17.0, 30.0, 28.0, 38.0, 86.0, 133.0, 244.0, 403.0, 667.0, 1261.0, 2433.0, 4846.0, 10626.0, 24793.0, 63194.0, 257116.0, 536342.0, 87107.0, 32909.0, 13535.0, 6223.0, 2988.0, 1608.0, 835.0, 447.0, 235.0, 136.0, 92.0, 61.0, 27.0, 22.0, 18.0, 13.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9052734375, -1.847808837890625, -1.79034423828125, -1.732879638671875, -1.6754150390625, -1.617950439453125, -1.56048583984375, -1.503021240234375, -1.445556640625, -1.388092041015625, -1.33062744140625, -1.273162841796875, -1.2156982421875, -1.158233642578125, -1.10076904296875, -1.043304443359375, -0.98583984375, -0.928375244140625, -0.87091064453125, -0.813446044921875, -0.7559814453125, -0.698516845703125, -0.64105224609375, -0.583587646484375, -0.526123046875, -0.468658447265625, -0.41119384765625, -0.353729248046875, -0.2962646484375, -0.238800048828125, -0.18133544921875, -0.123870849609375, -0.06640625, -0.008941650390625, 0.04852294921875, 0.105987548828125, 0.1634521484375, 0.220916748046875, 0.27838134765625, 0.335845947265625, 0.393310546875, 0.450775146484375, 0.50823974609375, 0.565704345703125, 0.6231689453125, 0.680633544921875, 0.73809814453125, 0.795562744140625, 0.85302734375, 0.910491943359375, 0.96795654296875, 1.025421142578125, 1.0828857421875, 1.140350341796875, 1.19781494140625, 1.255279541015625, 1.312744140625, 1.370208740234375, 1.42767333984375, 1.485137939453125, 1.5426025390625, 1.600067138671875, 1.65753173828125, 1.714996337890625, 1.7724609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 5.0, 6.0, 15.0, 16.0, 17.0, 23.0, 28.0, 33.0, 40.0, 45.0, 43.0, 55.0, 51.0, 56.0, 62.0, 69.0, 53.0, 58.0, 35.0, 45.0, 54.0, 23.0, 39.0, 26.0, 27.0, 21.0, 11.0, 12.0, 5.0, 8.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.24875259399414062, -0.23871612548828125, -0.22867965698242188, -0.2186431884765625, -0.20860671997070312, -0.19857025146484375, -0.18853378295898438, -0.178497314453125, -0.16846084594726562, -0.15842437744140625, -0.14838790893554688, -0.1383514404296875, -0.12831497192382812, -0.11827850341796875, -0.10824203491210938, -0.09820556640625, -0.08816909790039062, -0.07813262939453125, -0.06809616088867188, -0.0580596923828125, -0.048023223876953125, -0.03798675537109375, -0.027950286865234375, -0.017913818359375, -0.007877349853515625, 0.00215911865234375, 0.012195587158203125, 0.0222320556640625, 0.032268524169921875, 0.04230499267578125, 0.052341461181640625, 0.0623779296875, 0.07241439819335938, 0.08245086669921875, 0.09248733520507812, 0.1025238037109375, 0.11256027221679688, 0.12259674072265625, 0.13263320922851562, 0.142669677734375, 0.15270614624023438, 0.16274261474609375, 0.17277908325195312, 0.1828155517578125, 0.19285202026367188, 0.20288848876953125, 0.21292495727539062, 0.22296142578125, 0.23299789428710938, 0.24303436279296875, 0.2530708312988281, 0.2631072998046875, 0.2731437683105469, 0.28318023681640625, 0.2932167053222656, 0.303253173828125, 0.3132896423339844, 0.32332611083984375, 0.3333625793457031, 0.3433990478515625, 0.3534355163574219, 0.36347198486328125, 0.3735084533691406, 0.383544921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 8.0, 7.0, 11.0, 12.0, 12.0, 36.0, 31.0, 50.0, 90.0, 129.0, 196.0, 319.0, 575.0, 1487.0, 4837.0, 20704.0, 130626.0, 802317.0, 68981.0, 12591.0, 3181.0, 1100.0, 483.0, 258.0, 170.0, 108.0, 67.0, 52.0, 31.0, 22.0, 18.0, 12.0, 8.0, 4.0, 7.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -2.997528076171875, -2.88372802734375, -2.769927978515625, -2.6561279296875, -2.542327880859375, -2.42852783203125, -2.314727783203125, -2.200927734375, -2.087127685546875, -1.97332763671875, -1.859527587890625, -1.7457275390625, -1.631927490234375, -1.51812744140625, -1.404327392578125, -1.29052734375, -1.176727294921875, -1.06292724609375, -0.949127197265625, -0.8353271484375, -0.721527099609375, -0.60772705078125, -0.493927001953125, -0.380126953125, -0.266326904296875, -0.15252685546875, -0.038726806640625, 0.0750732421875, 0.188873291015625, 0.30267333984375, 0.416473388671875, 0.5302734375, 0.644073486328125, 0.75787353515625, 0.871673583984375, 0.9854736328125, 1.099273681640625, 1.21307373046875, 1.326873779296875, 1.440673828125, 1.554473876953125, 1.66827392578125, 1.782073974609375, 1.8958740234375, 2.009674072265625, 2.12347412109375, 2.237274169921875, 2.35107421875, 2.464874267578125, 2.57867431640625, 2.692474365234375, 2.8062744140625, 2.920074462890625, 3.03387451171875, 3.147674560546875, 3.261474609375, 3.375274658203125, 3.48907470703125, 3.602874755859375, 3.7166748046875, 3.830474853515625, 3.94427490234375, 4.058074951171875, 4.171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 9.0, 5.0, 10.0, 16.0, 20.0, 19.0, 21.0, 30.0, 29.0, 36.0, 44.0, 44.0, 49.0, 46.0, 49.0, 51.0, 60.0, 52.0, 35.0, 38.0, 38.0, 34.0, 31.0, 41.0, 29.0, 32.0, 23.0, 16.0, 18.0, 15.0, 12.0, 5.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1820526123046875, -1.141448974609375, -1.1008453369140625, -1.06024169921875, -1.0196380615234375, -0.979034423828125, -0.9384307861328125, -0.8978271484375, -0.8572235107421875, -0.816619873046875, -0.7760162353515625, -0.73541259765625, -0.6948089599609375, -0.654205322265625, -0.6136016845703125, -0.572998046875, -0.5323944091796875, -0.491790771484375, -0.4511871337890625, -0.41058349609375, -0.3699798583984375, -0.329376220703125, -0.2887725830078125, -0.2481689453125, -0.2075653076171875, -0.166961669921875, -0.1263580322265625, -0.08575439453125, -0.0451507568359375, -0.004547119140625, 0.0360565185546875, 0.07666015625, 0.1172637939453125, 0.157867431640625, 0.1984710693359375, 0.23907470703125, 0.2796783447265625, 0.320281982421875, 0.3608856201171875, 0.4014892578125, 0.4420928955078125, 0.482696533203125, 0.5233001708984375, 0.56390380859375, 0.6045074462890625, 0.645111083984375, 0.6857147216796875, 0.726318359375, 0.7669219970703125, 0.807525634765625, 0.8481292724609375, 0.88873291015625, 0.9293365478515625, 0.969940185546875, 1.0105438232421875, 1.0511474609375, 1.0917510986328125, 1.132354736328125, 1.1729583740234375, 1.21356201171875, 1.2541656494140625, 1.294769287109375, 1.3353729248046875, 1.3759765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 11.0, 14.0, 17.0, 28.0, 38.0, 81.0, 144.0, 239.0, 384.0, 626.0, 1106.0, 2204.0, 4789.0, 16719.0, 960297.0, 48651.0, 6912.0, 2937.0, 1404.0, 760.0, 457.0, 274.0, 165.0, 102.0, 57.0, 35.0, 32.0, 17.0, 14.0, 9.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.21875, -5.072509765625, -4.92626953125, -4.780029296875, -4.6337890625, -4.487548828125, -4.34130859375, -4.195068359375, -4.048828125, -3.902587890625, -3.75634765625, -3.610107421875, -3.4638671875, -3.317626953125, -3.17138671875, -3.025146484375, -2.87890625, -2.732666015625, -2.58642578125, -2.440185546875, -2.2939453125, -2.147705078125, -2.00146484375, -1.855224609375, -1.708984375, -1.562744140625, -1.41650390625, -1.270263671875, -1.1240234375, -0.977783203125, -0.83154296875, -0.685302734375, -0.5390625, -0.392822265625, -0.24658203125, -0.100341796875, 0.0458984375, 0.192138671875, 0.33837890625, 0.484619140625, 0.630859375, 0.777099609375, 0.92333984375, 1.069580078125, 1.2158203125, 1.362060546875, 1.50830078125, 1.654541015625, 1.80078125, 1.947021484375, 2.09326171875, 2.239501953125, 2.3857421875, 2.531982421875, 2.67822265625, 2.824462890625, 2.970703125, 3.116943359375, 3.26318359375, 3.409423828125, 3.5556640625, 3.701904296875, 3.84814453125, 3.994384765625, 4.140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 2.0, 1.0, 6.0, 18.0, 36.0, 143.0, 466.0, 217.0, 67.0, 17.0, 12.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006232261657714844, -0.0005943998694419861, -0.0005655735731124878, -0.0005367472767829895, -0.0005079209804534912, -0.0004790946841239929, -0.00045026838779449463, -0.00042144209146499634, -0.00039261579513549805, -0.00036378949880599976, -0.00033496320247650146, -0.0003061369061470032, -0.0002773106098175049, -0.0002484843134880066, -0.0002196580171585083, -0.00019083172082901, -0.00016200542449951172, -0.00013317912817001343, -0.00010435283184051514, -7.552653551101685e-05, -4.6700239181518555e-05, -1.7873942852020264e-05, 1.0952353477478027e-05, 3.977864980697632e-05, 6.860494613647461e-05, 9.74312424659729e-05, 0.0001262575387954712, 0.00015508383512496948, 0.00018391013145446777, 0.00021273642778396606, 0.00024156272411346436, 0.00027038902044296265, 0.00029921531677246094, 0.00032804161310195923, 0.0003568679094314575, 0.0003856942057609558, 0.0004145205020904541, 0.0004433467984199524, 0.0004721730947494507, 0.000500999391078949, 0.0005298256874084473, 0.0005586519837379456, 0.0005874782800674438, 0.0006163045763969421, 0.0006451308727264404, 0.0006739571690559387, 0.000702783465385437, 0.0007316097617149353, 0.0007604360580444336, 0.0007892623543739319, 0.0008180886507034302, 0.0008469149470329285, 0.0008757412433624268, 0.000904567539691925, 0.0009333938360214233, 0.0009622201323509216, 0.00099104642868042, 0.0010198727250099182, 0.0010486990213394165, 0.0010775253176689148, 0.001106351613998413, 0.0011351779103279114, 0.0011640042066574097, 0.001192830502986908, 0.0012216567993164062]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 7.0, 19.0, 23.0, 38.0, 66.0, 142.0, 291.0, 663.0, 1898.0, 7063.0, 950962.0, 79680.0, 5023.0, 1563.0, 565.0, 270.0, 108.0, 51.0, 31.0, 26.0, 9.0, 8.0, 6.0, 1.0, 6.0, 4.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.15625, -7.8922119140625, -7.628173828125, -7.3641357421875, -7.10009765625, -6.8360595703125, -6.572021484375, -6.3079833984375, -6.0439453125, -5.7799072265625, -5.515869140625, -5.2518310546875, -4.98779296875, -4.7237548828125, -4.459716796875, -4.1956787109375, -3.931640625, -3.6676025390625, -3.403564453125, -3.1395263671875, -2.87548828125, -2.6114501953125, -2.347412109375, -2.0833740234375, -1.8193359375, -1.5552978515625, -1.291259765625, -1.0272216796875, -0.76318359375, -0.4991455078125, -0.235107421875, 0.0289306640625, 0.29296875, 0.5570068359375, 0.821044921875, 1.0850830078125, 1.34912109375, 1.6131591796875, 1.877197265625, 2.1412353515625, 2.4052734375, 2.6693115234375, 2.933349609375, 3.1973876953125, 3.46142578125, 3.7254638671875, 3.989501953125, 4.2535400390625, 4.517578125, 4.7816162109375, 5.045654296875, 5.3096923828125, 5.57373046875, 5.8377685546875, 6.101806640625, 6.3658447265625, 6.6298828125, 6.8939208984375, 7.157958984375, 7.4219970703125, 7.68603515625, 7.9500732421875, 8.214111328125, 8.4781494140625, 8.7421875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 7.0, 12.0, 32.0, 200.0, 579.0, 95.0, 18.0, 10.0, 9.0, 6.0, 5.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.26171875, -3.150299072265625, -3.03887939453125, -2.927459716796875, -2.8160400390625, -2.704620361328125, -2.59320068359375, -2.481781005859375, -2.370361328125, -2.258941650390625, -2.14752197265625, -2.036102294921875, -1.9246826171875, -1.813262939453125, -1.70184326171875, -1.590423583984375, -1.47900390625, -1.367584228515625, -1.25616455078125, -1.144744873046875, -1.0333251953125, -0.921905517578125, -0.81048583984375, -0.699066162109375, -0.587646484375, -0.476226806640625, -0.36480712890625, -0.253387451171875, -0.1419677734375, -0.030548095703125, 0.08087158203125, 0.192291259765625, 0.3037109375, 0.415130615234375, 0.52655029296875, 0.637969970703125, 0.7493896484375, 0.860809326171875, 0.97222900390625, 1.083648681640625, 1.195068359375, 1.306488037109375, 1.41790771484375, 1.529327392578125, 1.6407470703125, 1.752166748046875, 1.86358642578125, 1.975006103515625, 2.08642578125, 2.197845458984375, 2.30926513671875, 2.420684814453125, 2.5321044921875, 2.643524169921875, 2.75494384765625, 2.866363525390625, 2.977783203125, 3.089202880859375, 3.20062255859375, 3.312042236328125, 3.4234619140625, 3.534881591796875, 3.64630126953125, 3.757720947265625, 3.869140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 16.0, 28.0, 47.0, 67.0, 99.0, 160.0, 174.0, 155.0, 111.0, 63.0, 31.0, 18.0, 8.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.933391571044922, -22.100812911987305, -21.268232345581055, -20.435653686523438, -19.603073120117188, -18.77049446105957, -17.937915802001953, -17.105335235595703, -16.272756576538086, -15.440176963806152, -14.607597351074219, -13.775018692016602, -12.942439079284668, -12.109859466552734, -11.277280807495117, -10.444701194763184, -9.61212158203125, -8.779541969299316, -7.946962833404541, -7.114383697509766, -6.281804084777832, -5.449224472045898, -4.616645336151123, -3.7840662002563477, -2.951486587524414, -2.1189072132110596, -1.286327838897705, -0.4537484645843506, 0.3788309097290039, 1.2114105224609375, 2.043989658355713, 2.8765687942504883, 3.7091503143310547, 4.541729927062988, 5.374309062957764, 6.206888198852539, 7.039467811584473, 7.872047424316406, 8.704626083374023, 9.537205696105957, 10.36978530883789, 11.202364921569824, 12.034944534301758, 12.867523193359375, 13.700102806091309, 14.532682418823242, 15.36526107788086, 16.19784164428711, 17.030420303344727, 17.862998962402344, 18.695579528808594, 19.52815818786621, 20.360736846923828, 21.193317413330078, 22.025896072387695, 22.858474731445312, 23.691055297851562, 24.52363395690918, 25.35621452331543, 26.188793182373047, 27.021373748779297, 27.853952407836914, 28.68653106689453, 29.51911163330078, 30.3516902923584]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 9.0, 6.0, 10.0, 9.0, 8.0, 18.0, 14.0, 15.0, 22.0, 30.0, 22.0, 30.0, 42.0, 42.0, 49.0, 47.0, 39.0, 47.0, 38.0, 44.0, 53.0, 54.0, 46.0, 29.0, 39.0, 53.0, 25.0, 34.0, 23.0, 18.0, 19.0, 15.0, 17.0, 5.0, 6.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.406794548034668, -9.117746353149414, -8.828697204589844, -8.53964900970459, -8.25059986114502, -7.961551666259766, -7.6725029945373535, -7.383454322814941, -7.094405651092529, -6.805356979370117, -6.516308307647705, -6.227259635925293, -5.938211441040039, -5.649162292480469, -5.360114097595215, -5.071065425872803, -4.782016754150391, -4.4929680824279785, -4.203919410705566, -3.9148709774017334, -3.6258223056793213, -3.336773633956909, -3.047725200653076, -2.758676528930664, -2.469627857208252, -2.18057918548584, -1.8915306329727173, -1.6024820804595947, -1.3134334087371826, -1.0243847370147705, -0.735336184501648, -0.4462876319885254, -0.15723800659179688, 0.13181060552597046, 0.4208592176437378, 0.7099078297615051, 0.9989564418792725, 1.2880051136016846, 1.5770536661148071, 1.8661022186279297, 2.155150890350342, 2.444199562072754, 2.733248233795166, 3.022296667098999, 3.311345338821411, 3.6003940105438232, 3.8894424438476562, 4.178491115570068, 4.4675397872924805, 4.756588459014893, 5.045637130737305, 5.334685802459717, 5.623734474182129, 5.912782669067383, 6.201831340789795, 6.490880012512207, 6.779928684234619, 7.068977355957031, 7.358026027679443, 7.6470746994018555, 7.936122894287109, 8.22517204284668, 8.514220237731934, 8.803268432617188, 9.092317581176758]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 11.0, 11.0, 11.0, 30.0, 38.0, 76.0, 134.0, 280.0, 544.0, 1243.0, 3133.0, 9944.0, 46588.0, 3738433.0, 354190.0, 28135.0, 7098.0, 2358.0, 993.0, 472.0, 222.0, 135.0, 59.0, 36.0, 34.0, 20.0, 15.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.078125, -4.923583984375, -4.76904296875, -4.614501953125, -4.4599609375, -4.305419921875, -4.15087890625, -3.996337890625, -3.841796875, -3.687255859375, -3.53271484375, -3.378173828125, -3.2236328125, -3.069091796875, -2.91455078125, -2.760009765625, -2.60546875, -2.450927734375, -2.29638671875, -2.141845703125, -1.9873046875, -1.832763671875, -1.67822265625, -1.523681640625, -1.369140625, -1.214599609375, -1.06005859375, -0.905517578125, -0.7509765625, -0.596435546875, -0.44189453125, -0.287353515625, -0.1328125, 0.021728515625, 0.17626953125, 0.330810546875, 0.4853515625, 0.639892578125, 0.79443359375, 0.948974609375, 1.103515625, 1.258056640625, 1.41259765625, 1.567138671875, 1.7216796875, 1.876220703125, 2.03076171875, 2.185302734375, 2.33984375, 2.494384765625, 2.64892578125, 2.803466796875, 2.9580078125, 3.112548828125, 3.26708984375, 3.421630859375, 3.576171875, 3.730712890625, 3.88525390625, 4.039794921875, 4.1943359375, 4.348876953125, 4.50341796875, 4.657958984375, 4.8125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 3.0, 9.0, 8.0, 11.0, 18.0, 24.0, 35.0, 26.0, 32.0, 42.0, 37.0, 53.0, 47.0, 60.0, 72.0, 49.0, 69.0, 58.0, 53.0, 50.0, 49.0, 40.0, 26.0, 22.0, 24.0, 20.0, 18.0, 10.0, 13.0, 11.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36767578125, -0.3555450439453125, -0.343414306640625, -0.3312835693359375, -0.31915283203125, -0.3070220947265625, -0.294891357421875, -0.2827606201171875, -0.2706298828125, -0.2584991455078125, -0.246368408203125, -0.2342376708984375, -0.22210693359375, -0.2099761962890625, -0.197845458984375, -0.1857147216796875, -0.173583984375, -0.1614532470703125, -0.149322509765625, -0.1371917724609375, -0.12506103515625, -0.1129302978515625, -0.100799560546875, -0.0886688232421875, -0.0765380859375, -0.0644073486328125, -0.052276611328125, -0.0401458740234375, -0.02801513671875, -0.0158843994140625, -0.003753662109375, 0.0083770751953125, 0.0205078125, 0.0326385498046875, 0.044769287109375, 0.0569000244140625, 0.06903076171875, 0.0811614990234375, 0.093292236328125, 0.1054229736328125, 0.1175537109375, 0.1296844482421875, 0.141815185546875, 0.1539459228515625, 0.16607666015625, 0.1782073974609375, 0.190338134765625, 0.2024688720703125, 0.214599609375, 0.2267303466796875, 0.238861083984375, 0.2509918212890625, 0.26312255859375, 0.2752532958984375, 0.287384033203125, 0.2995147705078125, 0.3116455078125, 0.3237762451171875, 0.335906982421875, 0.3480377197265625, 0.36016845703125, 0.3722991943359375, 0.384429931640625, 0.3965606689453125, 0.40869140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 11.0, 10.0, 12.0, 18.0, 20.0, 36.0, 54.0, 86.0, 133.0, 180.0, 311.0, 566.0, 975.0, 1925.0, 4427.0, 10709.0, 33575.0, 196849.0, 3760668.0, 138746.0, 28009.0, 9316.0, 3771.0, 1682.0, 901.0, 465.0, 311.0, 180.0, 103.0, 62.0, 35.0, 23.0, 30.0, 21.0, 20.0, 9.0, 7.0, 5.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0], "bins": [-3.67578125, -3.572021484375, -3.46826171875, -3.364501953125, -3.2607421875, -3.156982421875, -3.05322265625, -2.949462890625, -2.845703125, -2.741943359375, -2.63818359375, -2.534423828125, -2.4306640625, -2.326904296875, -2.22314453125, -2.119384765625, -2.015625, -1.911865234375, -1.80810546875, -1.704345703125, -1.6005859375, -1.496826171875, -1.39306640625, -1.289306640625, -1.185546875, -1.081787109375, -0.97802734375, -0.874267578125, -0.7705078125, -0.666748046875, -0.56298828125, -0.459228515625, -0.35546875, -0.251708984375, -0.14794921875, -0.044189453125, 0.0595703125, 0.163330078125, 0.26708984375, 0.370849609375, 0.474609375, 0.578369140625, 0.68212890625, 0.785888671875, 0.8896484375, 0.993408203125, 1.09716796875, 1.200927734375, 1.3046875, 1.408447265625, 1.51220703125, 1.615966796875, 1.7197265625, 1.823486328125, 1.92724609375, 2.031005859375, 2.134765625, 2.238525390625, 2.34228515625, 2.446044921875, 2.5498046875, 2.653564453125, 2.75732421875, 2.861083984375, 2.96484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 4.0, 7.0, 10.0, 10.0, 10.0, 18.0, 44.0, 44.0, 66.0, 184.0, 515.0, 2403.0, 380.0, 125.0, 87.0, 49.0, 34.0, 21.0, 14.0, 9.0, 9.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2971343994140625, -1.258331298828125, -1.2195281982421875, -1.18072509765625, -1.1419219970703125, -1.103118896484375, -1.0643157958984375, -1.0255126953125, -0.9867095947265625, -0.947906494140625, -0.9091033935546875, -0.87030029296875, -0.8314971923828125, -0.792694091796875, -0.7538909912109375, -0.715087890625, -0.6762847900390625, -0.637481689453125, -0.5986785888671875, -0.55987548828125, -0.5210723876953125, -0.482269287109375, -0.4434661865234375, -0.4046630859375, -0.3658599853515625, -0.327056884765625, -0.2882537841796875, -0.24945068359375, -0.2106475830078125, -0.171844482421875, -0.1330413818359375, -0.09423828125, -0.0554351806640625, -0.016632080078125, 0.0221710205078125, 0.06097412109375, 0.0997772216796875, 0.138580322265625, 0.1773834228515625, 0.2161865234375, 0.2549896240234375, 0.293792724609375, 0.3325958251953125, 0.37139892578125, 0.4102020263671875, 0.449005126953125, 0.4878082275390625, 0.526611328125, 0.5654144287109375, 0.604217529296875, 0.6430206298828125, 0.68182373046875, 0.7206268310546875, 0.759429931640625, 0.7982330322265625, 0.8370361328125, 0.8758392333984375, 0.914642333984375, 0.9534454345703125, 0.99224853515625, 1.0310516357421875, 1.069854736328125, 1.1086578369140625, 1.1474609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 17.0, 25.0, 33.0, 55.0, 83.0, 126.0, 127.0, 168.0, 134.0, 91.0, 56.0, 41.0, 22.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.134398460388184, -9.889609336853027, -9.644819259643555, -9.400030136108398, -9.155240058898926, -8.91045093536377, -8.665660858154297, -8.42087173461914, -8.176082611083984, -7.93129301071167, -7.6865034103393555, -7.441714286804199, -7.196924686431885, -6.95213508605957, -6.707345485687256, -6.462555885314941, -6.217765808105469, -5.972976207733154, -5.72818660736084, -5.483397483825684, -5.238607883453369, -4.993818283081055, -4.74902868270874, -4.504239082336426, -4.2594499588012695, -4.014660358428955, -3.7698709964752197, -3.5250813961029053, -3.280291795730591, -3.0355024337768555, -2.790712833404541, -2.5459232330322266, -2.301133632659912, -2.0563440322875977, -1.8115545511245728, -1.5667650699615479, -1.3219754695892334, -1.0771859884262085, -0.8323965072631836, -0.5876069068908691, -0.34281742572784424, -0.09802789986133575, 0.14676162600517273, 0.39155113697052, 0.6363406777381897, 0.8811302185058594, 1.1259196996688843, 1.3707093000411987, 1.6154987812042236, 1.8602882623672485, 2.1050777435302734, 2.349867343902588, 2.5946569442749023, 2.839446544647217, 3.084235906600952, 3.3290255069732666, 3.573814868927002, 3.8186044692993164, 4.063394069671631, 4.308183670043945, 4.552972793579102, 4.797762393951416, 5.0425519943237305, 5.287341594696045, 5.532131195068359]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 6.0, 11.0, 10.0, 9.0, 15.0, 20.0, 27.0, 22.0, 24.0, 21.0, 18.0, 37.0, 38.0, 38.0, 28.0, 38.0, 48.0, 33.0, 31.0, 39.0, 50.0, 38.0, 35.0, 40.0, 45.0, 30.0, 38.0, 28.0, 28.0, 22.0, 18.0, 11.0, 23.0, 12.0, 12.0, 10.0, 15.0, 6.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7943644523620605, -2.6975338459014893, -2.600703477859497, -2.503872871398926, -2.4070422649383545, -2.310211658477783, -2.213381290435791, -2.1165506839752197, -2.0197200775146484, -1.9228895902633667, -1.8260589838027954, -1.7292284965515137, -1.6323978900909424, -1.5355674028396606, -1.438736915588379, -1.3419063091278076, -1.2450758218765259, -1.1482453346252441, -1.0514147281646729, -0.9545842409133911, -0.8577536344528198, -0.7609231472015381, -0.6640926003456116, -0.5672620534896851, -0.47043150663375854, -0.37360095977783203, -0.2767704129219055, -0.1799398958683014, -0.08310934901237488, 0.013721197843551636, 0.11055171489715576, 0.20738226175308228, 0.3042128086090088, 0.4010433554649353, 0.4978739023208618, 0.5947043895721436, 0.6915349960327148, 0.7883654832839966, 0.8851960301399231, 0.9820265769958496, 1.078857183456421, 1.1756876707077026, 1.272518277168274, 1.3693487644195557, 1.466179370880127, 1.5630098581314087, 1.6598403453826904, 1.7566709518432617, 1.8535014390945435, 1.9503319263458252, 2.0471625328063965, 2.1439931392669678, 2.24082350730896, 2.3376541137695312, 2.4344847202301025, 2.531315326690674, 2.628145694732666, 2.7249763011932373, 2.8218066692352295, 2.918637275695801, 3.015467882156372, 3.1122984886169434, 3.2091288566589355, 3.305959463119507, 3.402790069580078]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 1.0, 4.0, 7.0, 13.0, 6.0, 20.0, 25.0, 48.0, 44.0, 59.0, 91.0, 161.0, 193.0, 315.0, 460.0, 727.0, 1209.0, 2048.0, 3586.0, 6678.0, 12455.0, 24766.0, 51727.0, 152659.0, 553481.0, 137751.0, 49529.0, 23451.0, 11992.0, 6341.0, 3386.0, 2049.0, 1143.0, 720.0, 472.0, 312.0, 201.0, 134.0, 94.0, 62.0, 45.0, 26.0, 21.0, 18.0, 10.0, 11.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2900390625, -1.243072509765625, -1.19610595703125, -1.149139404296875, -1.1021728515625, -1.055206298828125, -1.00823974609375, -0.961273193359375, -0.914306640625, -0.867340087890625, -0.82037353515625, -0.773406982421875, -0.7264404296875, -0.679473876953125, -0.63250732421875, -0.585540771484375, -0.53857421875, -0.491607666015625, -0.44464111328125, -0.397674560546875, -0.3507080078125, -0.303741455078125, -0.25677490234375, -0.209808349609375, -0.162841796875, -0.115875244140625, -0.06890869140625, -0.021942138671875, 0.0250244140625, 0.071990966796875, 0.11895751953125, 0.165924072265625, 0.212890625, 0.259857177734375, 0.30682373046875, 0.353790283203125, 0.4007568359375, 0.447723388671875, 0.49468994140625, 0.541656494140625, 0.588623046875, 0.635589599609375, 0.68255615234375, 0.729522705078125, 0.7764892578125, 0.823455810546875, 0.87042236328125, 0.917388916015625, 0.96435546875, 1.011322021484375, 1.05828857421875, 1.105255126953125, 1.1522216796875, 1.199188232421875, 1.24615478515625, 1.293121337890625, 1.340087890625, 1.387054443359375, 1.43402099609375, 1.480987548828125, 1.5279541015625, 1.574920654296875, 1.62188720703125, 1.668853759765625, 1.7158203125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 9.0, 14.0, 15.0, 14.0, 17.0, 28.0, 37.0, 37.0, 45.0, 51.0, 58.0, 57.0, 63.0, 66.0, 52.0, 70.0, 57.0, 45.0, 43.0, 46.0, 42.0, 34.0, 17.0, 20.0, 16.0, 15.0, 12.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4267578125, -0.4132118225097656, -0.39966583251953125, -0.3861198425292969, -0.3725738525390625, -0.3590278625488281, -0.34548187255859375, -0.3319358825683594, -0.318389892578125, -0.3048439025878906, -0.29129791259765625, -0.2777519226074219, -0.2642059326171875, -0.2506599426269531, -0.23711395263671875, -0.22356796264648438, -0.21002197265625, -0.19647598266601562, -0.18292999267578125, -0.16938400268554688, -0.1558380126953125, -0.14229202270507812, -0.12874603271484375, -0.11520004272460938, -0.101654052734375, -0.08810806274414062, -0.07456207275390625, -0.061016082763671875, -0.0474700927734375, -0.033924102783203125, -0.02037811279296875, -0.006832122802734375, 0.0067138671875, 0.020259857177734375, 0.03380584716796875, 0.047351837158203125, 0.0608978271484375, 0.07444381713867188, 0.08798980712890625, 0.10153579711914062, 0.115081787109375, 0.12862777709960938, 0.14217376708984375, 0.15571975708007812, 0.1692657470703125, 0.18281173706054688, 0.19635772705078125, 0.20990371704101562, 0.22344970703125, 0.23699569702148438, 0.25054168701171875, 0.2640876770019531, 0.2776336669921875, 0.2911796569824219, 0.30472564697265625, 0.3182716369628906, 0.331817626953125, 0.3453636169433594, 0.35890960693359375, 0.3724555969238281, 0.3860015869140625, 0.3995475769042969, 0.41309356689453125, 0.4266395568847656, 0.440185546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 3.0, 11.0, 10.0, 25.0, 18.0, 29.0, 38.0, 42.0, 66.0, 94.0, 168.0, 284.0, 553.0, 1131.0, 2491.0, 6077.0, 15299.0, 41678.0, 162084.0, 684338.0, 86443.0, 28582.0, 10980.0, 4251.0, 1882.0, 834.0, 436.0, 245.0, 160.0, 84.0, 57.0, 41.0, 19.0, 21.0, 16.0, 8.0, 16.0, 11.0, 6.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9677734375, -1.9006500244140625, -1.833526611328125, -1.7664031982421875, -1.69927978515625, -1.6321563720703125, -1.565032958984375, -1.4979095458984375, -1.4307861328125, -1.3636627197265625, -1.296539306640625, -1.2294158935546875, -1.16229248046875, -1.0951690673828125, -1.028045654296875, -0.9609222412109375, -0.893798828125, -0.8266754150390625, -0.759552001953125, -0.6924285888671875, -0.62530517578125, -0.5581817626953125, -0.491058349609375, -0.4239349365234375, -0.3568115234375, -0.2896881103515625, -0.222564697265625, -0.1554412841796875, -0.08831787109375, -0.0211944580078125, 0.045928955078125, 0.1130523681640625, 0.18017578125, 0.2472991943359375, 0.314422607421875, 0.3815460205078125, 0.44866943359375, 0.5157928466796875, 0.582916259765625, 0.6500396728515625, 0.7171630859375, 0.7842864990234375, 0.851409912109375, 0.9185333251953125, 0.98565673828125, 1.0527801513671875, 1.119903564453125, 1.1870269775390625, 1.254150390625, 1.3212738037109375, 1.388397216796875, 1.4555206298828125, 1.52264404296875, 1.5897674560546875, 1.656890869140625, 1.7240142822265625, 1.7911376953125, 1.8582611083984375, 1.925384521484375, 1.9925079345703125, 2.05963134765625, 2.1267547607421875, 2.193878173828125, 2.2610015869140625, 2.328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 15.0, 16.0, 14.0, 17.0, 14.0, 22.0, 22.0, 33.0, 30.0, 44.0, 41.0, 50.0, 42.0, 48.0, 46.0, 50.0, 58.0, 39.0, 45.0, 51.0, 35.0, 38.0, 31.0, 38.0, 32.0, 25.0, 18.0, 8.0, 13.0, 12.0, 12.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.343780517578125, -1.29400634765625, -1.244232177734375, -1.1944580078125, -1.144683837890625, -1.09490966796875, -1.045135498046875, -0.995361328125, -0.945587158203125, -0.89581298828125, -0.846038818359375, -0.7962646484375, -0.746490478515625, -0.69671630859375, -0.646942138671875, -0.59716796875, -0.547393798828125, -0.49761962890625, -0.447845458984375, -0.3980712890625, -0.348297119140625, -0.29852294921875, -0.248748779296875, -0.198974609375, -0.149200439453125, -0.09942626953125, -0.049652099609375, 0.0001220703125, 0.049896240234375, 0.09967041015625, 0.149444580078125, 0.19921875, 0.248992919921875, 0.29876708984375, 0.348541259765625, 0.3983154296875, 0.448089599609375, 0.49786376953125, 0.547637939453125, 0.597412109375, 0.647186279296875, 0.69696044921875, 0.746734619140625, 0.7965087890625, 0.846282958984375, 0.89605712890625, 0.945831298828125, 0.99560546875, 1.045379638671875, 1.09515380859375, 1.144927978515625, 1.1947021484375, 1.244476318359375, 1.29425048828125, 1.344024658203125, 1.393798828125, 1.443572998046875, 1.49334716796875, 1.543121337890625, 1.5928955078125, 1.642669677734375, 1.69244384765625, 1.742218017578125, 1.7919921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 5.0, 4.0, 9.0, 13.0, 26.0, 35.0, 55.0, 68.0, 121.0, 170.0, 306.0, 578.0, 1158.0, 2326.0, 6389.0, 24002.0, 194194.0, 736316.0, 62911.0, 12412.0, 3950.0, 1584.0, 839.0, 414.0, 257.0, 136.0, 100.0, 44.0, 29.0, 25.0, 13.0, 20.0, 8.0, 10.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3134765625, -1.2670135498046875, -1.220550537109375, -1.1740875244140625, -1.12762451171875, -1.0811614990234375, -1.034698486328125, -0.9882354736328125, -0.9417724609375, -0.8953094482421875, -0.848846435546875, -0.8023834228515625, -0.75592041015625, -0.7094573974609375, -0.662994384765625, -0.6165313720703125, -0.570068359375, -0.5236053466796875, -0.477142333984375, -0.4306793212890625, -0.38421630859375, -0.3377532958984375, -0.291290283203125, -0.2448272705078125, -0.1983642578125, -0.1519012451171875, -0.105438232421875, -0.0589752197265625, -0.01251220703125, 0.0339508056640625, 0.080413818359375, 0.1268768310546875, 0.17333984375, 0.2198028564453125, 0.266265869140625, 0.3127288818359375, 0.35919189453125, 0.4056549072265625, 0.452117919921875, 0.4985809326171875, 0.5450439453125, 0.5915069580078125, 0.637969970703125, 0.6844329833984375, 0.73089599609375, 0.7773590087890625, 0.823822021484375, 0.8702850341796875, 0.916748046875, 0.9632110595703125, 1.009674072265625, 1.0561370849609375, 1.10260009765625, 1.1490631103515625, 1.195526123046875, 1.2419891357421875, 1.2884521484375, 1.3349151611328125, 1.381378173828125, 1.4278411865234375, 1.47430419921875, 1.5207672119140625, 1.567230224609375, 1.6136932373046875, 1.66015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 10.0, 21.0, 35.0, 56.0, 96.0, 243.0, 285.0, 117.0, 59.0, 24.0, 19.0, 12.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047969818115234375, -0.0004647485911846161, -0.00044979900121688843, -0.00043484941124916077, -0.0004198998212814331, -0.00040495023131370544, -0.0003900006413459778, -0.0003750510513782501, -0.00036010146141052246, -0.0003451518714427948, -0.00033020228147506714, -0.0003152526915073395, -0.0003003031015396118, -0.00028535351157188416, -0.0002704039216041565, -0.00025545433163642883, -0.00024050474166870117, -0.0002255551517009735, -0.00021060556173324585, -0.0001956559717655182, -0.00018070638179779053, -0.00016575679183006287, -0.0001508072018623352, -0.00013585761189460754, -0.00012090802192687988, -0.00010595843195915222, -9.100884199142456e-05, -7.60592520236969e-05, -6.110966205596924e-05, -4.616007208824158e-05, -3.1210482120513916e-05, -1.6260892152786255e-05, -1.3113021850585938e-06, 1.3638287782669067e-05, 2.858787775039673e-05, 4.353746771812439e-05, 5.848705768585205e-05, 7.343664765357971e-05, 8.838623762130737e-05, 0.00010333582758903503, 0.0001182854175567627, 0.00013323500752449036, 0.00014818459749221802, 0.00016313418745994568, 0.00017808377742767334, 0.000193033367395401, 0.00020798295736312866, 0.00022293254733085632, 0.00023788213729858398, 0.00025283172726631165, 0.0002677813172340393, 0.00028273090720176697, 0.00029768049716949463, 0.0003126300871372223, 0.00032757967710494995, 0.0003425292670726776, 0.0003574788570404053, 0.00037242844700813293, 0.0003873780369758606, 0.00040232762694358826, 0.0004172772169113159, 0.0004322268068790436, 0.00044717639684677124, 0.0004621259868144989, 0.00047707557678222656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 4.0, 9.0, 7.0, 7.0, 11.0, 13.0, 27.0, 32.0, 49.0, 73.0, 119.0, 214.0, 406.0, 731.0, 1662.0, 3966.0, 12017.0, 52009.0, 625049.0, 304418.0, 33249.0, 8664.0, 3077.0, 1281.0, 631.0, 329.0, 167.0, 84.0, 86.0, 40.0, 35.0, 25.0, 13.0, 9.0, 10.0, 6.0, 3.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.35546875, -1.311553955078125, -1.26763916015625, -1.223724365234375, -1.1798095703125, -1.135894775390625, -1.09197998046875, -1.048065185546875, -1.004150390625, -0.960235595703125, -0.91632080078125, -0.872406005859375, -0.8284912109375, -0.784576416015625, -0.74066162109375, -0.696746826171875, -0.65283203125, -0.608917236328125, -0.56500244140625, -0.521087646484375, -0.4771728515625, -0.433258056640625, -0.38934326171875, -0.345428466796875, -0.301513671875, -0.257598876953125, -0.21368408203125, -0.169769287109375, -0.1258544921875, -0.081939697265625, -0.03802490234375, 0.005889892578125, 0.0498046875, 0.093719482421875, 0.13763427734375, 0.181549072265625, 0.2254638671875, 0.269378662109375, 0.31329345703125, 0.357208251953125, 0.401123046875, 0.445037841796875, 0.48895263671875, 0.532867431640625, 0.5767822265625, 0.620697021484375, 0.66461181640625, 0.708526611328125, 0.75244140625, 0.796356201171875, 0.84027099609375, 0.884185791015625, 0.9281005859375, 0.972015380859375, 1.01593017578125, 1.059844970703125, 1.103759765625, 1.147674560546875, 1.19158935546875, 1.235504150390625, 1.2794189453125, 1.323333740234375, 1.36724853515625, 1.411163330078125, 1.455078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 3.0, 9.0, 2.0, 13.0, 10.0, 15.0, 14.0, 18.0, 21.0, 47.0, 66.0, 91.0, 157.0, 155.0, 119.0, 82.0, 44.0, 32.0, 29.0, 13.0, 11.0, 5.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.9631423950195312, -0.9331207275390625, -0.9030990600585938, -0.873077392578125, -0.8430557250976562, -0.8130340576171875, -0.7830123901367188, -0.75299072265625, -0.7229690551757812, -0.6929473876953125, -0.6629257202148438, -0.632904052734375, -0.6028823852539062, -0.5728607177734375, -0.5428390502929688, -0.5128173828125, -0.48279571533203125, -0.4527740478515625, -0.42275238037109375, -0.392730712890625, -0.36270904541015625, -0.3326873779296875, -0.30266571044921875, -0.27264404296875, -0.24262237548828125, -0.2126007080078125, -0.18257904052734375, -0.152557373046875, -0.12253570556640625, -0.0925140380859375, -0.06249237060546875, -0.032470703125, -0.00244903564453125, 0.0275726318359375, 0.05759429931640625, 0.087615966796875, 0.11763763427734375, 0.1476593017578125, 0.17768096923828125, 0.20770263671875, 0.23772430419921875, 0.2677459716796875, 0.29776763916015625, 0.327789306640625, 0.35781097412109375, 0.3878326416015625, 0.41785430908203125, 0.4478759765625, 0.47789764404296875, 0.5079193115234375, 0.5379409790039062, 0.567962646484375, 0.5979843139648438, 0.6280059814453125, 0.6580276489257812, 0.68804931640625, 0.7180709838867188, 0.7480926513671875, 0.7781143188476562, 0.808135986328125, 0.8381576538085938, 0.8681793212890625, 0.8982009887695312, 0.92822265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 21.0, 55.0, 103.0, 176.0, 239.0, 207.0, 112.0, 51.0, 20.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28742790222168, -12.53518009185791, -11.78293228149414, -11.030685424804688, -10.278436660766602, -9.526189804077148, -8.773941993713379, -8.02169418334961, -7.26944637298584, -6.51719856262207, -5.764950752258301, -5.0127034187316895, -4.26045560836792, -3.5082077980041504, -2.755960464477539, -2.0037126541137695, -1.25146484375, -0.49921715259552, 0.25303053855895996, 1.0052781105041504, 1.75752592086792, 2.5097737312316895, 3.262021064758301, 4.01426887512207, 4.76651668548584, 5.518764495849609, 6.271012306213379, 7.02325963973999, 7.77550745010376, 8.527755737304688, 9.28000259399414, 10.03225040435791, 10.784496307373047, 11.536744117736816, 12.288991928100586, 13.041238784790039, 13.793487548828125, 14.545734405517578, 15.297982215881348, 16.050230026245117, 16.802478790283203, 17.554725646972656, 18.306974411010742, 19.059221267700195, 19.81147003173828, 20.563716888427734, 21.315963745117188, 22.068212509155273, 22.820459365844727, 23.57270622253418, 24.324954986572266, 25.07720184326172, 25.829450607299805, 26.581697463989258, 27.333946228027344, 28.086193084716797, 28.83843994140625, 29.590686798095703, 30.34293556213379, 31.095182418823242, 31.847431182861328, 32.59967803955078, 33.351924896240234, 34.10417175292969, 34.856422424316406]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 13.0, 10.0, 18.0, 11.0, 24.0, 19.0, 24.0, 35.0, 30.0, 24.0, 35.0, 30.0, 47.0, 38.0, 55.0, 50.0, 46.0, 49.0, 55.0, 46.0, 38.0, 43.0, 29.0, 33.0, 40.0, 22.0, 22.0, 17.0, 23.0, 18.0, 13.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.435820579528809, -8.197875022888184, -7.9599289894104, -7.721983432769775, -7.484037399291992, -7.246091842651367, -7.008146286010742, -6.770200252532959, -6.532254695892334, -6.294309139251709, -6.056363105773926, -5.818417549133301, -5.580471515655518, -5.342525959014893, -5.104579925537109, -4.866634368896484, -4.628688812255859, -4.390743255615234, -4.152797222137451, -3.914851665496826, -3.676905870437622, -3.438960075378418, -3.201014280319214, -2.9630684852600098, -2.7251224517822266, -2.4871766567230225, -2.2492308616638184, -2.0112853050231934, -1.7733395099639893, -1.5353937149047852, -1.297447919845581, -1.0595022439956665, -0.821556568145752, -0.5836108326911926, -0.3456650674343109, -0.1077193021774292, 0.13022643327713013, 0.36817216873168945, 0.6061179637908936, 0.8440636396408081, 1.0820094347000122, 1.3199552297592163, 1.5579009056091309, 1.795846700668335, 2.033792495727539, 2.271738052368164, 2.5096840858459473, 2.7476296424865723, 2.9855754375457764, 3.2235212326049805, 3.4614670276641846, 3.6994128227233887, 3.9373583793640137, 4.175304412841797, 4.413249969482422, 4.651195526123047, 4.88914155960083, 5.127087116241455, 5.365033149719238, 5.602978706359863, 5.8409247398376465, 6.0788702964782715, 6.316816329956055, 6.55476188659668, 6.792707443237305]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 12.0, 11.0, 16.0, 22.0, 24.0, 41.0, 56.0, 90.0, 137.0, 238.0, 378.0, 666.0, 1251.0, 2532.0, 5763.0, 15160.0, 51913.0, 906881.0, 3123392.0, 57786.0, 16187.0, 6060.0, 2600.0, 1304.0, 699.0, 359.0, 234.0, 132.0, 99.0, 60.0, 34.0, 37.0, 17.0, 18.0, 12.0, 12.0, 11.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.75, -3.636474609375, -3.52294921875, -3.409423828125, -3.2958984375, -3.182373046875, -3.06884765625, -2.955322265625, -2.841796875, -2.728271484375, -2.61474609375, -2.501220703125, -2.3876953125, -2.274169921875, -2.16064453125, -2.047119140625, -1.93359375, -1.820068359375, -1.70654296875, -1.593017578125, -1.4794921875, -1.365966796875, -1.25244140625, -1.138916015625, -1.025390625, -0.911865234375, -0.79833984375, -0.684814453125, -0.5712890625, -0.457763671875, -0.34423828125, -0.230712890625, -0.1171875, -0.003662109375, 0.10986328125, 0.223388671875, 0.3369140625, 0.450439453125, 0.56396484375, 0.677490234375, 0.791015625, 0.904541015625, 1.01806640625, 1.131591796875, 1.2451171875, 1.358642578125, 1.47216796875, 1.585693359375, 1.69921875, 1.812744140625, 1.92626953125, 2.039794921875, 2.1533203125, 2.266845703125, 2.38037109375, 2.493896484375, 2.607421875, 2.720947265625, 2.83447265625, 2.947998046875, 3.0615234375, 3.175048828125, 3.28857421875, 3.402099609375, 3.515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 11.0, 7.0, 24.0, 20.0, 25.0, 28.0, 32.0, 26.0, 33.0, 46.0, 48.0, 56.0, 47.0, 63.0, 66.0, 67.0, 50.0, 52.0, 51.0, 48.0, 43.0, 25.0, 29.0, 19.0, 24.0, 14.0, 13.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39306640625, -0.37996673583984375, -0.3668670654296875, -0.35376739501953125, -0.340667724609375, -0.32756805419921875, -0.3144683837890625, -0.30136871337890625, -0.28826904296875, -0.27516937255859375, -0.2620697021484375, -0.24897003173828125, -0.235870361328125, -0.22277069091796875, -0.2096710205078125, -0.19657135009765625, -0.1834716796875, -0.17037200927734375, -0.1572723388671875, -0.14417266845703125, -0.131072998046875, -0.11797332763671875, -0.1048736572265625, -0.09177398681640625, -0.07867431640625, -0.06557464599609375, -0.0524749755859375, -0.03937530517578125, -0.026275634765625, -0.01317596435546875, -7.62939453125e-05, 0.01302337646484375, 0.026123046875, 0.03922271728515625, 0.0523223876953125, 0.06542205810546875, 0.078521728515625, 0.09162139892578125, 0.1047210693359375, 0.11782073974609375, 0.13092041015625, 0.14402008056640625, 0.1571197509765625, 0.17021942138671875, 0.183319091796875, 0.19641876220703125, 0.2095184326171875, 0.22261810302734375, 0.2357177734375, 0.24881744384765625, 0.2619171142578125, 0.27501678466796875, 0.288116455078125, 0.30121612548828125, 0.3143157958984375, 0.32741546630859375, 0.34051513671875, 0.35361480712890625, 0.3667144775390625, 0.37981414794921875, 0.392913818359375, 0.40601348876953125, 0.4191131591796875, 0.43221282958984375, 0.4453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 2.0, 7.0, 4.0, 10.0, 17.0, 21.0, 28.0, 23.0, 44.0, 59.0, 99.0, 204.0, 601.0, 1687.0, 5840.0, 28384.0, 923175.0, 3193214.0, 31516.0, 6359.0, 1814.0, 626.0, 244.0, 103.0, 66.0, 42.0, 20.0, 19.0, 19.0, 9.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.5721435546875, -6.366943359375, -6.1617431640625, -5.95654296875, -5.7513427734375, -5.546142578125, -5.3409423828125, -5.1357421875, -4.9305419921875, -4.725341796875, -4.5201416015625, -4.31494140625, -4.1097412109375, -3.904541015625, -3.6993408203125, -3.494140625, -3.2889404296875, -3.083740234375, -2.8785400390625, -2.67333984375, -2.4681396484375, -2.262939453125, -2.0577392578125, -1.8525390625, -1.6473388671875, -1.442138671875, -1.2369384765625, -1.03173828125, -0.8265380859375, -0.621337890625, -0.4161376953125, -0.2109375, -0.0057373046875, 0.199462890625, 0.4046630859375, 0.60986328125, 0.8150634765625, 1.020263671875, 1.2254638671875, 1.4306640625, 1.6358642578125, 1.841064453125, 2.0462646484375, 2.25146484375, 2.4566650390625, 2.661865234375, 2.8670654296875, 3.072265625, 3.2774658203125, 3.482666015625, 3.6878662109375, 3.89306640625, 4.0982666015625, 4.303466796875, 4.5086669921875, 4.7138671875, 4.9190673828125, 5.124267578125, 5.3294677734375, 5.53466796875, 5.7398681640625, 5.945068359375, 6.1502685546875, 6.35546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 6.0, 14.0, 19.0, 23.0, 38.0, 75.0, 175.0, 1042.0, 2315.0, 186.0, 74.0, 35.0, 25.0, 14.0, 13.0, 8.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.728515625, -2.6665802001953125, -2.604644775390625, -2.5427093505859375, -2.48077392578125, -2.4188385009765625, -2.356903076171875, -2.2949676513671875, -2.2330322265625, -2.1710968017578125, -2.109161376953125, -2.0472259521484375, -1.98529052734375, -1.9233551025390625, -1.861419677734375, -1.7994842529296875, -1.737548828125, -1.6756134033203125, -1.613677978515625, -1.5517425537109375, -1.48980712890625, -1.4278717041015625, -1.365936279296875, -1.3040008544921875, -1.2420654296875, -1.1801300048828125, -1.118194580078125, -1.0562591552734375, -0.99432373046875, -0.9323883056640625, -0.870452880859375, -0.8085174560546875, -0.74658203125, -0.6846466064453125, -0.622711181640625, -0.5607757568359375, -0.49884033203125, -0.4369049072265625, -0.374969482421875, -0.3130340576171875, -0.2510986328125, -0.1891632080078125, -0.127227783203125, -0.0652923583984375, -0.00335693359375, 0.0585784912109375, 0.120513916015625, 0.1824493408203125, 0.244384765625, 0.3063201904296875, 0.368255615234375, 0.4301910400390625, 0.49212646484375, 0.5540618896484375, 0.615997314453125, 0.6779327392578125, 0.7398681640625, 0.8018035888671875, 0.863739013671875, 0.9256744384765625, 0.98760986328125, 1.0495452880859375, 1.111480712890625, 1.1734161376953125, 1.2353515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 9.0, 13.0, 35.0, 70.0, 132.0, 189.0, 216.0, 167.0, 84.0, 44.0, 23.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.13837718963623, -14.762004852294922, -14.385631561279297, -14.009259223937988, -13.63288688659668, -13.256513595581055, -12.880141258239746, -12.503768920898438, -12.127395629882812, -11.751023292541504, -11.374650001525879, -10.99827766418457, -10.621905326843262, -10.245532989501953, -9.869159698486328, -9.49278736114502, -9.116415023803711, -8.740042686462402, -8.363669395446777, -7.987297058105469, -7.61092472076416, -7.234551906585693, -6.858179092407227, -6.481806755065918, -6.105433940887451, -5.729061126708984, -5.352688789367676, -4.976315975189209, -4.599943161010742, -4.223570823669434, -3.847198009490967, -3.470825433731079, -3.094453811645508, -2.71808123588562, -2.3417086601257324, -1.9653358459472656, -1.588963270187378, -1.2125906944274902, -0.8362178802490234, -0.45984530448913574, -0.08347272872924805, 0.2928999066352844, 0.6692725419998169, 1.0456452369689941, 1.4220178127288818, 1.7983903884887695, 2.1747632026672363, 2.551135778427124, 2.9275083541870117, 3.3038809299468994, 3.680253505706787, 4.056626319885254, 4.4329986572265625, 4.809371471405029, 5.185744285583496, 5.562116622924805, 5.9384894371032715, 6.314862251281738, 6.691234588623047, 7.067607402801514, 7.4439802169799805, 7.820352554321289, 8.196725845336914, 8.573098182678223, 8.949470520019531]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 2.0, 5.0, 6.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 15.0, 19.0, 19.0, 27.0, 30.0, 28.0, 41.0, 50.0, 36.0, 41.0, 46.0, 40.0, 38.0, 44.0, 43.0, 39.0, 40.0, 42.0, 35.0, 29.0, 24.0, 27.0, 21.0, 22.0, 17.0, 12.0, 18.0, 8.0, 11.0, 6.0, 13.0, 3.0, 3.0, 4.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.24822998046875, -3.1394431591033936, -3.030656337738037, -2.9218692779541016, -2.813082456588745, -2.7042956352233887, -2.5955088138580322, -2.486721992492676, -2.3779351711273193, -2.269148349761963, -2.1603615283966064, -2.05157470703125, -1.942787766456604, -1.834000825881958, -1.7252140045166016, -1.6164271831512451, -1.5076402425765991, -1.3988534212112427, -1.2900664806365967, -1.1812796592712402, -1.0724928379058838, -0.9637059569358826, -0.8549190759658813, -0.7461322546005249, -0.6373453736305237, -0.5285584926605225, -0.419771671295166, -0.3109847903251648, -0.20219793915748596, -0.09341108798980713, 0.015375792980194092, 0.12416261434555054, 0.23294949531555176, 0.3417363464832306, 0.4505231976509094, 0.5593100786209106, 0.6680968999862671, 0.7768837809562683, 0.8856706619262695, 0.994457483291626, 1.1032443046569824, 1.2120311260223389, 1.3208180665969849, 1.4296048879623413, 1.5383917093276978, 1.6471786499023438, 1.7559654712677002, 1.8647522926330566, 1.9735392332077026, 2.0823261737823486, 2.191112995147705, 2.2998998165130615, 2.408686637878418, 2.5174734592437744, 2.626260280609131, 2.7350473403930664, 2.843834161758423, 2.9526209831237793, 3.0614078044891357, 3.170194625854492, 3.2789816856384277, 3.387768507003784, 3.4965553283691406, 3.605342149734497, 3.7141289710998535]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 16.0, 29.0, 34.0, 59.0, 78.0, 115.0, 144.0, 262.0, 415.0, 716.0, 1110.0, 2038.0, 3528.0, 6564.0, 12229.0, 23733.0, 47132.0, 91297.0, 195143.0, 345767.0, 157420.0, 77633.0, 39418.0, 20259.0, 10356.0, 5695.0, 2997.0, 1693.0, 1029.0, 587.0, 356.0, 230.0, 143.0, 103.0, 63.0, 36.0, 35.0, 20.0, 19.0, 9.0, 7.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.84765625, -1.7954254150390625, -1.743194580078125, -1.6909637451171875, -1.63873291015625, -1.5865020751953125, -1.534271240234375, -1.4820404052734375, -1.4298095703125, -1.3775787353515625, -1.325347900390625, -1.2731170654296875, -1.22088623046875, -1.1686553955078125, -1.116424560546875, -1.0641937255859375, -1.011962890625, -0.9597320556640625, -0.907501220703125, -0.8552703857421875, -0.80303955078125, -0.7508087158203125, -0.698577880859375, -0.6463470458984375, -0.5941162109375, -0.5418853759765625, -0.489654541015625, -0.4374237060546875, -0.38519287109375, -0.3329620361328125, -0.280731201171875, -0.2285003662109375, -0.17626953125, -0.1240386962890625, -0.071807861328125, -0.0195770263671875, 0.03265380859375, 0.0848846435546875, 0.137115478515625, 0.1893463134765625, 0.2415771484375, 0.2938079833984375, 0.346038818359375, 0.3982696533203125, 0.45050048828125, 0.5027313232421875, 0.554962158203125, 0.6071929931640625, 0.659423828125, 0.7116546630859375, 0.763885498046875, 0.8161163330078125, 0.86834716796875, 0.9205780029296875, 0.972808837890625, 1.0250396728515625, 1.0772705078125, 1.1295013427734375, 1.181732177734375, 1.2339630126953125, 1.28619384765625, 1.3384246826171875, 1.390655517578125, 1.4428863525390625, 1.4951171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 13.0, 11.0, 16.0, 11.0, 25.0, 12.0, 28.0, 25.0, 20.0, 33.0, 33.0, 48.0, 51.0, 43.0, 46.0, 40.0, 47.0, 35.0, 51.0, 56.0, 43.0, 49.0, 33.0, 32.0, 34.0, 21.0, 28.0, 17.0, 24.0, 17.0, 14.0, 11.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3498687744140625, -0.337677001953125, -0.3254852294921875, -0.31329345703125, -0.3011016845703125, -0.288909912109375, -0.2767181396484375, -0.2645263671875, -0.2523345947265625, -0.240142822265625, -0.2279510498046875, -0.21575927734375, -0.2035675048828125, -0.191375732421875, -0.1791839599609375, -0.1669921875, -0.1548004150390625, -0.142608642578125, -0.1304168701171875, -0.11822509765625, -0.1060333251953125, -0.093841552734375, -0.0816497802734375, -0.0694580078125, -0.0572662353515625, -0.045074462890625, -0.0328826904296875, -0.02069091796875, -0.0084991455078125, 0.003692626953125, 0.0158843994140625, 0.028076171875, 0.0402679443359375, 0.052459716796875, 0.0646514892578125, 0.07684326171875, 0.0890350341796875, 0.101226806640625, 0.1134185791015625, 0.1256103515625, 0.1378021240234375, 0.149993896484375, 0.1621856689453125, 0.17437744140625, 0.1865692138671875, 0.198760986328125, 0.2109527587890625, 0.22314453125, 0.2353363037109375, 0.247528076171875, 0.2597198486328125, 0.27191162109375, 0.2841033935546875, 0.296295166015625, 0.3084869384765625, 0.3206787109375, 0.3328704833984375, 0.345062255859375, 0.3572540283203125, 0.36944580078125, 0.3816375732421875, 0.393829345703125, 0.4060211181640625, 0.418212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 11.0, 14.0, 21.0, 29.0, 52.0, 60.0, 86.0, 133.0, 223.0, 382.0, 694.0, 1394.0, 3558.0, 12332.0, 62909.0, 609315.0, 301951.0, 41048.0, 8904.0, 2706.0, 1167.0, 609.0, 314.0, 206.0, 137.0, 85.0, 53.0, 26.0, 29.0, 29.0, 12.0, 9.0, 13.0, 4.0, 5.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.90673828125, -3.7666015625, -3.62646484375, -3.486328125, -3.34619140625, -3.2060546875, -3.06591796875, -2.92578125, -2.78564453125, -2.6455078125, -2.50537109375, -2.365234375, -2.22509765625, -2.0849609375, -1.94482421875, -1.8046875, -1.66455078125, -1.5244140625, -1.38427734375, -1.244140625, -1.10400390625, -0.9638671875, -0.82373046875, -0.68359375, -0.54345703125, -0.4033203125, -0.26318359375, -0.123046875, 0.01708984375, 0.1572265625, 0.29736328125, 0.4375, 0.57763671875, 0.7177734375, 0.85791015625, 0.998046875, 1.13818359375, 1.2783203125, 1.41845703125, 1.55859375, 1.69873046875, 1.8388671875, 1.97900390625, 2.119140625, 2.25927734375, 2.3994140625, 2.53955078125, 2.6796875, 2.81982421875, 2.9599609375, 3.10009765625, 3.240234375, 3.38037109375, 3.5205078125, 3.66064453125, 3.80078125, 3.94091796875, 4.0810546875, 4.22119140625, 4.361328125, 4.50146484375, 4.6416015625, 4.78173828125, 4.921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 10.0, 17.0, 10.0, 23.0, 17.0, 31.0, 33.0, 42.0, 55.0, 30.0, 52.0, 75.0, 69.0, 72.0, 68.0, 58.0, 59.0, 56.0, 38.0, 38.0, 31.0, 19.0, 25.0, 14.0, 9.0, 12.0, 12.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.859375, -2.773345947265625, -2.68731689453125, -2.601287841796875, -2.5152587890625, -2.429229736328125, -2.34320068359375, -2.257171630859375, -2.171142578125, -2.085113525390625, -1.99908447265625, -1.913055419921875, -1.8270263671875, -1.740997314453125, -1.65496826171875, -1.568939208984375, -1.48291015625, -1.396881103515625, -1.31085205078125, -1.224822998046875, -1.1387939453125, -1.052764892578125, -0.96673583984375, -0.880706787109375, -0.794677734375, -0.708648681640625, -0.62261962890625, -0.536590576171875, -0.4505615234375, -0.364532470703125, -0.27850341796875, -0.192474365234375, -0.1064453125, -0.020416259765625, 0.06561279296875, 0.151641845703125, 0.2376708984375, 0.323699951171875, 0.40972900390625, 0.495758056640625, 0.581787109375, 0.667816162109375, 0.75384521484375, 0.839874267578125, 0.9259033203125, 1.011932373046875, 1.09796142578125, 1.183990478515625, 1.27001953125, 1.356048583984375, 1.44207763671875, 1.528106689453125, 1.6141357421875, 1.700164794921875, 1.78619384765625, 1.872222900390625, 1.958251953125, 2.044281005859375, 2.13031005859375, 2.216339111328125, 2.3023681640625, 2.388397216796875, 2.47442626953125, 2.560455322265625, 2.646484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 10.0, 4.0, 7.0, 9.0, 11.0, 21.0, 31.0, 25.0, 54.0, 73.0, 101.0, 141.0, 197.0, 331.0, 562.0, 905.0, 1421.0, 2546.0, 4456.0, 8422.0, 19036.0, 58319.0, 404425.0, 446758.0, 61281.0, 19512.0, 8733.0, 4570.0, 2505.0, 1502.0, 866.0, 564.0, 384.0, 227.0, 162.0, 121.0, 65.0, 48.0, 46.0, 27.0, 19.0, 16.0, 13.0, 9.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.52374267578125, -1.4693603515625, -1.41497802734375, -1.360595703125, -1.30621337890625, -1.2518310546875, -1.19744873046875, -1.14306640625, -1.08868408203125, -1.0343017578125, -0.97991943359375, -0.925537109375, -0.87115478515625, -0.8167724609375, -0.76239013671875, -0.7080078125, -0.65362548828125, -0.5992431640625, -0.54486083984375, -0.490478515625, -0.43609619140625, -0.3817138671875, -0.32733154296875, -0.27294921875, -0.21856689453125, -0.1641845703125, -0.10980224609375, -0.055419921875, -0.00103759765625, 0.0533447265625, 0.10772705078125, 0.162109375, 0.21649169921875, 0.2708740234375, 0.32525634765625, 0.379638671875, 0.43402099609375, 0.4884033203125, 0.54278564453125, 0.59716796875, 0.65155029296875, 0.7059326171875, 0.76031494140625, 0.814697265625, 0.86907958984375, 0.9234619140625, 0.97784423828125, 1.0322265625, 1.08660888671875, 1.1409912109375, 1.19537353515625, 1.249755859375, 1.30413818359375, 1.3585205078125, 1.41290283203125, 1.46728515625, 1.52166748046875, 1.5760498046875, 1.63043212890625, 1.684814453125, 1.73919677734375, 1.7935791015625, 1.84796142578125, 1.90234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 13.0, 24.0, 33.0, 73.0, 174.0, 341.0, 169.0, 62.0, 41.0, 25.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005192756652832031, -0.0004951581358909607, -0.00047104060649871826, -0.00044692307710647583, -0.0004228055477142334, -0.00039868801832199097, -0.00037457048892974854, -0.0003504529595375061, -0.00032633543014526367, -0.00030221790075302124, -0.0002781003713607788, -0.0002539828419685364, -0.00022986531257629395, -0.00020574778318405151, -0.00018163025379180908, -0.00015751272439956665, -0.00013339519500732422, -0.00010927766561508179, -8.516013622283936e-05, -6.104260683059692e-05, -3.692507743835449e-05, -1.280754804611206e-05, 1.1309981346130371e-05, 3.54275107383728e-05, 5.9545040130615234e-05, 8.366256952285767e-05, 0.0001077800989151001, 0.00013189762830734253, 0.00015601515769958496, 0.0001801326870918274, 0.00020425021648406982, 0.00022836774587631226, 0.0002524852752685547, 0.0002766028046607971, 0.00030072033405303955, 0.000324837863445282, 0.0003489553928375244, 0.00037307292222976685, 0.0003971904516220093, 0.0004213079810142517, 0.00044542551040649414, 0.00046954303979873657, 0.000493660569190979, 0.0005177780985832214, 0.0005418956279754639, 0.0005660131573677063, 0.0005901306867599487, 0.0006142482161521912, 0.0006383657455444336, 0.000662483274936676, 0.0006866008043289185, 0.0007107183337211609, 0.0007348358631134033, 0.0007589533925056458, 0.0007830709218978882, 0.0008071884512901306, 0.000831305980682373, 0.0008554235100746155, 0.0008795410394668579, 0.0009036585688591003, 0.0009277760982513428, 0.0009518936276435852, 0.0009760111570358276, 0.00100012868642807, 0.0010242462158203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 2.0, 15.0, 13.0, 16.0, 38.0, 67.0, 86.0, 174.0, 357.0, 947.0, 2823.0, 13529.0, 220869.0, 773661.0, 28919.0, 4641.0, 1393.0, 487.0, 209.0, 114.0, 61.0, 35.0, 21.0, 17.0, 15.0, 11.0, 5.0, 3.0, 5.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.36328125, -4.24267578125, -4.1220703125, -4.00146484375, -3.880859375, -3.76025390625, -3.6396484375, -3.51904296875, -3.3984375, -3.27783203125, -3.1572265625, -3.03662109375, -2.916015625, -2.79541015625, -2.6748046875, -2.55419921875, -2.43359375, -2.31298828125, -2.1923828125, -2.07177734375, -1.951171875, -1.83056640625, -1.7099609375, -1.58935546875, -1.46875, -1.34814453125, -1.2275390625, -1.10693359375, -0.986328125, -0.86572265625, -0.7451171875, -0.62451171875, -0.50390625, -0.38330078125, -0.2626953125, -0.14208984375, -0.021484375, 0.09912109375, 0.2197265625, 0.34033203125, 0.4609375, 0.58154296875, 0.7021484375, 0.82275390625, 0.943359375, 1.06396484375, 1.1845703125, 1.30517578125, 1.42578125, 1.54638671875, 1.6669921875, 1.78759765625, 1.908203125, 2.02880859375, 2.1494140625, 2.27001953125, 2.390625, 2.51123046875, 2.6318359375, 2.75244140625, 2.873046875, 2.99365234375, 3.1142578125, 3.23486328125, 3.35546875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 7.0, 1.0, 7.0, 7.0, 11.0, 19.0, 24.0, 28.0, 33.0, 55.0, 78.0, 130.0, 132.0, 143.0, 99.0, 69.0, 40.0, 29.0, 17.0, 16.0, 10.0, 5.0, 4.0, 7.0, 9.0, 7.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8740234375, -1.8215789794921875, -1.769134521484375, -1.7166900634765625, -1.66424560546875, -1.6118011474609375, -1.559356689453125, -1.5069122314453125, -1.4544677734375, -1.4020233154296875, -1.349578857421875, -1.2971343994140625, -1.24468994140625, -1.1922454833984375, -1.139801025390625, -1.0873565673828125, -1.034912109375, -0.9824676513671875, -0.930023193359375, -0.8775787353515625, -0.82513427734375, -0.7726898193359375, -0.720245361328125, -0.6678009033203125, -0.6153564453125, -0.5629119873046875, -0.510467529296875, -0.4580230712890625, -0.40557861328125, -0.3531341552734375, -0.300689697265625, -0.2482452392578125, -0.19580078125, -0.1433563232421875, -0.090911865234375, -0.0384674072265625, 0.01397705078125, 0.0664215087890625, 0.118865966796875, 0.1713104248046875, 0.2237548828125, 0.2761993408203125, 0.328643798828125, 0.3810882568359375, 0.43353271484375, 0.4859771728515625, 0.538421630859375, 0.5908660888671875, 0.643310546875, 0.6957550048828125, 0.748199462890625, 0.8006439208984375, 0.85308837890625, 0.9055328369140625, 0.957977294921875, 1.0104217529296875, 1.0628662109375, 1.1153106689453125, 1.167755126953125, 1.2201995849609375, 1.27264404296875, 1.3250885009765625, 1.377532958984375, 1.4299774169921875, 1.482421875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 8.0, 5.0, 12.0, 24.0, 42.0, 55.0, 77.0, 107.0, 101.0, 134.0, 131.0, 99.0, 73.0, 49.0, 33.0, 21.0, 15.0, 10.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.590675354003906, -34.841182708740234, -34.09169387817383, -33.342201232910156, -32.59271240234375, -31.843219757080078, -31.09372901916504, -30.34423828125, -29.59474754333496, -28.845256805419922, -28.095766067504883, -27.346275329589844, -26.596782684326172, -25.847291946411133, -25.097801208496094, -24.348310470581055, -23.598819732666016, -22.849328994750977, -22.099838256835938, -21.3503475189209, -20.60085678100586, -19.851364135742188, -19.10187339782715, -18.35238265991211, -17.60289192199707, -16.85340118408203, -16.103910446166992, -15.354418754577637, -14.604928016662598, -13.855437278747559, -13.105945587158203, -12.356454849243164, -11.606964111328125, -10.857473373413086, -10.107982635498047, -9.358490943908691, -8.609000205993652, -7.859509468078613, -7.110018253326416, -6.360527038574219, -5.61103630065918, -4.861545562744141, -4.112054347991943, -3.362563371658325, -2.613072395324707, -1.8635814189910889, -1.1140904426574707, -0.36459922790527344, 0.3848915100097656, 1.1343824863433838, 1.883873462677002, 2.63336443901062, 3.3828554153442383, 4.132346153259277, 4.881837368011475, 5.631328582763672, 6.380819320678711, 7.13031005859375, 7.879801273345947, 8.629292488098145, 9.378783226013184, 10.128273963928223, 10.877765655517578, 11.627256393432617, 12.376747131347656]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 3.0, 8.0, 9.0, 14.0, 19.0, 8.0, 13.0, 15.0, 26.0, 22.0, 27.0, 23.0, 27.0, 39.0, 43.0, 45.0, 54.0, 56.0, 49.0, 37.0, 50.0, 46.0, 31.0, 50.0, 46.0, 38.0, 26.0, 34.0, 18.0, 19.0, 17.0, 18.0, 15.0, 8.0, 11.0, 8.0, 11.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0], "bins": [-14.467655181884766, -14.096028327941895, -13.724401473999023, -13.352773666381836, -12.981146812438965, -12.609519958496094, -12.237893104553223, -11.866266250610352, -11.49463939666748, -11.12301254272461, -10.751385688781738, -10.379758834838867, -10.00813102722168, -9.636504173278809, -9.264877319335938, -8.893250465393066, -8.521623611450195, -8.149996757507324, -7.778369426727295, -7.406742572784424, -7.035115718841553, -6.663488388061523, -6.291861534118652, -5.920234680175781, -5.548606872558594, -5.176980018615723, -4.805352687835693, -4.433725833892822, -4.062098979949951, -3.690471887588501, -3.318844795227051, -2.9472179412841797, -2.5755910873413086, -2.2039639949798584, -1.8323371410369873, -1.460710048675537, -1.0890830755233765, -0.7174561023712158, -0.3458290100097656, 0.02579784393310547, 0.39742493629455566, 0.7690519094467163, 1.140678882598877, 1.5123059749603271, 1.8839329481124878, 2.2555599212646484, 2.6271870136260986, 2.9988138675689697, 3.37044095993042, 3.74206805229187, 4.11369514465332, 4.485321998596191, 4.8569488525390625, 5.228575706481934, 5.600203037261963, 5.971829891204834, 6.343457221984863, 6.715084075927734, 7.086711406707764, 7.458338260650635, 7.829965114593506, 8.201592445373535, 8.573219299316406, 8.944846153259277, 9.316473007202148]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 2.0, 8.0, 8.0, 14.0, 19.0, 31.0, 51.0, 89.0, 122.0, 227.0, 377.0, 671.0, 1411.0, 2978.0, 6704.0, 17565.0, 56876.0, 517135.0, 3461980.0, 88265.0, 23739.0, 8716.0, 3659.0, 1624.0, 829.0, 441.0, 260.0, 143.0, 102.0, 73.0, 47.0, 32.0, 19.0, 17.0, 12.0, 11.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.340301513671875, -3.22161865234375, -3.102935791015625, -2.9842529296875, -2.865570068359375, -2.74688720703125, -2.628204345703125, -2.509521484375, -2.390838623046875, -2.27215576171875, -2.153472900390625, -2.0347900390625, -1.916107177734375, -1.79742431640625, -1.678741455078125, -1.56005859375, -1.441375732421875, -1.32269287109375, -1.204010009765625, -1.0853271484375, -0.966644287109375, -0.84796142578125, -0.729278564453125, -0.610595703125, -0.491912841796875, -0.37322998046875, -0.254547119140625, -0.1358642578125, -0.017181396484375, 0.10150146484375, 0.220184326171875, 0.3388671875, 0.457550048828125, 0.57623291015625, 0.694915771484375, 0.8135986328125, 0.932281494140625, 1.05096435546875, 1.169647216796875, 1.288330078125, 1.407012939453125, 1.52569580078125, 1.644378662109375, 1.7630615234375, 1.881744384765625, 2.00042724609375, 2.119110107421875, 2.23779296875, 2.356475830078125, 2.47515869140625, 2.593841552734375, 2.7125244140625, 2.831207275390625, 2.94989013671875, 3.068572998046875, 3.187255859375, 3.305938720703125, 3.42462158203125, 3.543304443359375, 3.6619873046875, 3.780670166015625, 3.89935302734375, 4.018035888671875, 4.13671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 10.0, 12.0, 16.0, 15.0, 18.0, 19.0, 27.0, 25.0, 25.0, 41.0, 41.0, 48.0, 50.0, 51.0, 49.0, 52.0, 46.0, 44.0, 54.0, 40.0, 49.0, 42.0, 42.0, 35.0, 22.0, 25.0, 21.0, 22.0, 13.0, 4.0, 7.0, 3.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.44775390625, -0.4341011047363281, -0.42044830322265625, -0.4067955017089844, -0.3931427001953125, -0.3794898986816406, -0.36583709716796875, -0.3521842956542969, -0.338531494140625, -0.3248786926269531, -0.31122589111328125, -0.2975730895996094, -0.2839202880859375, -0.2702674865722656, -0.25661468505859375, -0.24296188354492188, -0.22930908203125, -0.21565628051757812, -0.20200347900390625, -0.18835067749023438, -0.1746978759765625, -0.16104507446289062, -0.14739227294921875, -0.13373947143554688, -0.120086669921875, -0.10643386840820312, -0.09278106689453125, -0.07912826538085938, -0.0654754638671875, -0.051822662353515625, -0.03816986083984375, -0.024517059326171875, -0.0108642578125, 0.002788543701171875, 0.01644134521484375, 0.030094146728515625, 0.0437469482421875, 0.057399749755859375, 0.07105255126953125, 0.08470535278320312, 0.098358154296875, 0.11201095581054688, 0.12566375732421875, 0.13931655883789062, 0.1529693603515625, 0.16662216186523438, 0.18027496337890625, 0.19392776489257812, 0.20758056640625, 0.22123336791992188, 0.23488616943359375, 0.24853897094726562, 0.2621917724609375, 0.2758445739746094, 0.28949737548828125, 0.3031501770019531, 0.316802978515625, 0.3304557800292969, 0.34410858154296875, 0.3577613830566406, 0.3714141845703125, 0.3850669860839844, 0.39871978759765625, 0.4123725891113281, 0.426025390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 12.0, 12.0, 24.0, 28.0, 47.0, 57.0, 82.0, 114.0, 183.0, 288.0, 422.0, 687.0, 1131.0, 1863.0, 3308.0, 6243.0, 13447.0, 31883.0, 109635.0, 3109194.0, 784760.0, 80526.0, 26140.0, 11156.0, 5536.0, 2977.0, 1754.0, 1008.0, 570.0, 375.0, 247.0, 185.0, 124.0, 86.0, 48.0, 36.0, 28.0, 19.0, 14.0, 6.0, 9.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.552734375, -3.44134521484375, -3.3299560546875, -3.21856689453125, -3.107177734375, -2.99578857421875, -2.8843994140625, -2.77301025390625, -2.66162109375, -2.55023193359375, -2.4388427734375, -2.32745361328125, -2.216064453125, -2.10467529296875, -1.9932861328125, -1.88189697265625, -1.7705078125, -1.65911865234375, -1.5477294921875, -1.43634033203125, -1.324951171875, -1.21356201171875, -1.1021728515625, -0.99078369140625, -0.87939453125, -0.76800537109375, -0.6566162109375, -0.54522705078125, -0.433837890625, -0.32244873046875, -0.2110595703125, -0.09967041015625, 0.01171875, 0.12310791015625, 0.2344970703125, 0.34588623046875, 0.457275390625, 0.56866455078125, 0.6800537109375, 0.79144287109375, 0.90283203125, 1.01422119140625, 1.1256103515625, 1.23699951171875, 1.348388671875, 1.45977783203125, 1.5711669921875, 1.68255615234375, 1.7939453125, 1.90533447265625, 2.0167236328125, 2.12811279296875, 2.239501953125, 2.35089111328125, 2.4622802734375, 2.57366943359375, 2.68505859375, 2.79644775390625, 2.9078369140625, 3.01922607421875, 3.130615234375, 3.24200439453125, 3.3533935546875, 3.46478271484375, 3.576171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 12.0, 7.0, 20.0, 23.0, 30.0, 38.0, 46.0, 111.0, 179.0, 464.0, 2083.0, 492.0, 204.0, 109.0, 59.0, 46.0, 28.0, 20.0, 16.0, 15.0, 11.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5791015625, -1.527435302734375, -1.47576904296875, -1.424102783203125, -1.3724365234375, -1.320770263671875, -1.26910400390625, -1.217437744140625, -1.165771484375, -1.114105224609375, -1.06243896484375, -1.010772705078125, -0.9591064453125, -0.907440185546875, -0.85577392578125, -0.804107666015625, -0.75244140625, -0.700775146484375, -0.64910888671875, -0.597442626953125, -0.5457763671875, -0.494110107421875, -0.44244384765625, -0.390777587890625, -0.339111328125, -0.287445068359375, -0.23577880859375, -0.184112548828125, -0.1324462890625, -0.080780029296875, -0.02911376953125, 0.022552490234375, 0.07421875, 0.125885009765625, 0.17755126953125, 0.229217529296875, 0.2808837890625, 0.332550048828125, 0.38421630859375, 0.435882568359375, 0.487548828125, 0.539215087890625, 0.59088134765625, 0.642547607421875, 0.6942138671875, 0.745880126953125, 0.79754638671875, 0.849212646484375, 0.90087890625, 0.952545166015625, 1.00421142578125, 1.055877685546875, 1.1075439453125, 1.159210205078125, 1.21087646484375, 1.262542724609375, 1.314208984375, 1.365875244140625, 1.41754150390625, 1.469207763671875, 1.5208740234375, 1.572540283203125, 1.62420654296875, 1.675872802734375, 1.7275390625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 13.0, 16.0, 37.0, 55.0, 64.0, 130.0, 155.0, 145.0, 110.0, 97.0, 67.0, 44.0, 26.0, 13.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.918634414672852, -15.486771583557129, -15.054908752441406, -14.623046875, -14.191184043884277, -13.759321212768555, -13.327458381652832, -12.89559555053711, -12.463732719421387, -12.031869888305664, -11.600007057189941, -11.168144226074219, -10.736282348632812, -10.30441951751709, -9.872556686401367, -9.440693855285645, -9.008831024169922, -8.5769681930542, -8.145105361938477, -7.713243007659912, -7.2813801765441895, -6.849517822265625, -6.417654991149902, -5.98579216003418, -5.553930282592773, -5.122067451477051, -4.690205097198486, -4.258342266082764, -3.826479434967041, -3.3946168422698975, -2.962754249572754, -2.5308914184570312, -2.0990285873413086, -1.6671658754348755, -1.2353031635284424, -0.8034405708312988, -0.3715778589248657, 0.06028485298156738, 0.49214744567871094, 0.9240102767944336, 1.3558728694915771, 1.7877355813980103, 2.2195982933044434, 2.651460886001587, 3.0833234786987305, 3.515186309814453, 3.9470489025115967, 4.378911972045898, 4.810774326324463, 5.2426371574401855, 5.67449951171875, 6.106362342834473, 6.538225173950195, 6.970088005065918, 7.401950359344482, 7.833813190460205, 8.26567554473877, 8.697538375854492, 9.129401206970215, 9.561264038085938, 9.993125915527344, 10.424988746643066, 10.856851577758789, 11.288714408874512, 11.720577239990234]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 4.0, 9.0, 5.0, 20.0, 20.0, 18.0, 22.0, 27.0, 22.0, 41.0, 41.0, 36.0, 47.0, 47.0, 45.0, 46.0, 55.0, 40.0, 48.0, 40.0, 38.0, 41.0, 43.0, 37.0, 42.0, 36.0, 28.0, 20.0, 12.0, 16.0, 11.0, 12.0, 5.0, 2.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.979898929595947, -6.781107425689697, -6.582315921783447, -6.383524417877197, -6.1847333908081055, -5.9859418869018555, -5.7871503829956055, -5.5883588790893555, -5.3895673751831055, -5.1907758712768555, -4.9919843673706055, -4.7931928634643555, -4.5944013595581055, -4.395610332489014, -4.196818828582764, -3.9980273246765137, -3.7992358207702637, -3.6004443168640137, -3.4016528129577637, -3.2028615474700928, -3.0040700435638428, -2.8052785396575928, -2.606487274169922, -2.407695770263672, -2.208904266357422, -2.010112762451172, -1.8113213777542114, -1.612529993057251, -1.413738489151001, -1.214946985244751, -1.0161556005477905, -0.8173642158508301, -0.6185731887817383, -0.41978174448013306, -0.22099030017852783, -0.022198855876922607, 0.17659258842468262, 0.37538403272628784, 0.5741754770278931, 0.7729668617248535, 0.9717583656311035, 1.1705498695373535, 1.369341254234314, 1.5681326389312744, 1.7669241428375244, 1.9657156467437744, 2.1645069122314453, 2.3632984161376953, 2.5620899200439453, 2.7608814239501953, 2.9596729278564453, 3.158464193344116, 3.357255697250366, 3.556047201156616, 3.754838466644287, 3.953629970550537, 4.152421474456787, 4.351212978363037, 4.550004482269287, 4.748795986175537, 4.947587013244629, 5.146378517150879, 5.345170021057129, 5.543961524963379, 5.742753028869629]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 6.0, 4.0, 13.0, 19.0, 19.0, 34.0, 52.0, 66.0, 96.0, 162.0, 208.0, 325.0, 508.0, 863.0, 1254.0, 2087.0, 3781.0, 6376.0, 11464.0, 22199.0, 45649.0, 98938.0, 218392.0, 307536.0, 173150.0, 77842.0, 36044.0, 18275.0, 9736.0, 5297.0, 3087.0, 1812.0, 1168.0, 707.0, 466.0, 314.0, 195.0, 118.0, 83.0, 59.0, 46.0, 33.0, 21.0, 18.0, 14.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-1.9228515625, -1.8684539794921875, -1.814056396484375, -1.7596588134765625, -1.70526123046875, -1.6508636474609375, -1.596466064453125, -1.5420684814453125, -1.4876708984375, -1.4332733154296875, -1.378875732421875, -1.3244781494140625, -1.27008056640625, -1.2156829833984375, -1.161285400390625, -1.1068878173828125, -1.052490234375, -0.9980926513671875, -0.943695068359375, -0.8892974853515625, -0.83489990234375, -0.7805023193359375, -0.726104736328125, -0.6717071533203125, -0.6173095703125, -0.5629119873046875, -0.508514404296875, -0.4541168212890625, -0.39971923828125, -0.3453216552734375, -0.290924072265625, -0.2365264892578125, -0.18212890625, -0.1277313232421875, -0.073333740234375, -0.0189361572265625, 0.03546142578125, 0.0898590087890625, 0.144256591796875, 0.1986541748046875, 0.2530517578125, 0.3074493408203125, 0.361846923828125, 0.4162445068359375, 0.47064208984375, 0.5250396728515625, 0.579437255859375, 0.6338348388671875, 0.688232421875, 0.7426300048828125, 0.797027587890625, 0.8514251708984375, 0.90582275390625, 0.9602203369140625, 1.014617919921875, 1.0690155029296875, 1.1234130859375, 1.1778106689453125, 1.232208251953125, 1.2866058349609375, 1.34100341796875, 1.3954010009765625, 1.449798583984375, 1.5041961669921875, 1.55859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 10.0, 9.0, 9.0, 15.0, 12.0, 12.0, 33.0, 34.0, 37.0, 43.0, 41.0, 45.0, 58.0, 40.0, 51.0, 53.0, 52.0, 42.0, 50.0, 36.0, 43.0, 42.0, 32.0, 24.0, 35.0, 15.0, 22.0, 14.0, 23.0, 13.0, 11.0, 7.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.515625, -0.5003204345703125, -0.485015869140625, -0.4697113037109375, -0.45440673828125, -0.4391021728515625, -0.423797607421875, -0.4084930419921875, -0.3931884765625, -0.3778839111328125, -0.362579345703125, -0.3472747802734375, -0.33197021484375, -0.3166656494140625, -0.301361083984375, -0.2860565185546875, -0.270751953125, -0.2554473876953125, -0.240142822265625, -0.2248382568359375, -0.20953369140625, -0.1942291259765625, -0.178924560546875, -0.1636199951171875, -0.1483154296875, -0.1330108642578125, -0.117706298828125, -0.1024017333984375, -0.08709716796875, -0.0717926025390625, -0.056488037109375, -0.0411834716796875, -0.02587890625, -0.0105743408203125, 0.004730224609375, 0.0200347900390625, 0.03533935546875, 0.0506439208984375, 0.065948486328125, 0.0812530517578125, 0.0965576171875, 0.1118621826171875, 0.127166748046875, 0.1424713134765625, 0.15777587890625, 0.1730804443359375, 0.188385009765625, 0.2036895751953125, 0.218994140625, 0.2342987060546875, 0.249603271484375, 0.2649078369140625, 0.28021240234375, 0.2955169677734375, 0.310821533203125, 0.3261260986328125, 0.3414306640625, 0.3567352294921875, 0.372039794921875, 0.3873443603515625, 0.40264892578125, 0.4179534912109375, 0.433258056640625, 0.4485626220703125, 0.4638671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 11.0, 12.0, 21.0, 19.0, 47.0, 61.0, 74.0, 107.0, 174.0, 300.0, 532.0, 1211.0, 3304.0, 12625.0, 71363.0, 649459.0, 266289.0, 32188.0, 6806.0, 1972.0, 809.0, 426.0, 244.0, 156.0, 94.0, 67.0, 40.0, 24.0, 29.0, 13.0, 16.0, 13.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.54351806640625, -4.3800048828125, -4.21649169921875, -4.052978515625, -3.88946533203125, -3.7259521484375, -3.56243896484375, -3.39892578125, -3.23541259765625, -3.0718994140625, -2.90838623046875, -2.744873046875, -2.58135986328125, -2.4178466796875, -2.25433349609375, -2.0908203125, -1.92730712890625, -1.7637939453125, -1.60028076171875, -1.436767578125, -1.27325439453125, -1.1097412109375, -0.94622802734375, -0.78271484375, -0.61920166015625, -0.4556884765625, -0.29217529296875, -0.128662109375, 0.03485107421875, 0.1983642578125, 0.36187744140625, 0.525390625, 0.68890380859375, 0.8524169921875, 1.01593017578125, 1.179443359375, 1.34295654296875, 1.5064697265625, 1.66998291015625, 1.83349609375, 1.99700927734375, 2.1605224609375, 2.32403564453125, 2.487548828125, 2.65106201171875, 2.8145751953125, 2.97808837890625, 3.1416015625, 3.30511474609375, 3.4686279296875, 3.63214111328125, 3.795654296875, 3.95916748046875, 4.1226806640625, 4.28619384765625, 4.44970703125, 4.61322021484375, 4.7767333984375, 4.94024658203125, 5.103759765625, 5.26727294921875, 5.4307861328125, 5.59429931640625, 5.7578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 10.0, 8.0, 11.0, 20.0, 21.0, 31.0, 21.0, 30.0, 25.0, 57.0, 48.0, 51.0, 61.0, 61.0, 47.0, 47.0, 67.0, 48.0, 48.0, 52.0, 29.0, 25.0, 36.0, 27.0, 22.0, 21.0, 12.0, 16.0, 10.0, 8.0, 4.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.55078125, -3.44659423828125, -3.3424072265625, -3.23822021484375, -3.134033203125, -3.02984619140625, -2.9256591796875, -2.82147216796875, -2.71728515625, -2.61309814453125, -2.5089111328125, -2.40472412109375, -2.300537109375, -2.19635009765625, -2.0921630859375, -1.98797607421875, -1.8837890625, -1.77960205078125, -1.6754150390625, -1.57122802734375, -1.467041015625, -1.36285400390625, -1.2586669921875, -1.15447998046875, -1.05029296875, -0.94610595703125, -0.8419189453125, -0.73773193359375, -0.633544921875, -0.52935791015625, -0.4251708984375, -0.32098388671875, -0.216796875, -0.11260986328125, -0.0084228515625, 0.09576416015625, 0.199951171875, 0.30413818359375, 0.4083251953125, 0.51251220703125, 0.61669921875, 0.72088623046875, 0.8250732421875, 0.92926025390625, 1.033447265625, 1.13763427734375, 1.2418212890625, 1.34600830078125, 1.4501953125, 1.55438232421875, 1.6585693359375, 1.76275634765625, 1.866943359375, 1.97113037109375, 2.0753173828125, 2.17950439453125, 2.28369140625, 2.38787841796875, 2.4920654296875, 2.59625244140625, 2.700439453125, 2.80462646484375, 2.9088134765625, 3.01300048828125, 3.1171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 13.0, 27.0, 41.0, 70.0, 111.0, 214.0, 382.0, 732.0, 1631.0, 4133.0, 11656.0, 41333.0, 245252.0, 619826.0, 91180.0, 20560.0, 6550.0, 2502.0, 1081.0, 569.0, 299.0, 152.0, 81.0, 53.0, 40.0, 19.0, 14.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.982421875, -2.89532470703125, -2.8082275390625, -2.72113037109375, -2.634033203125, -2.54693603515625, -2.4598388671875, -2.37274169921875, -2.28564453125, -2.19854736328125, -2.1114501953125, -2.02435302734375, -1.937255859375, -1.85015869140625, -1.7630615234375, -1.67596435546875, -1.5888671875, -1.50177001953125, -1.4146728515625, -1.32757568359375, -1.240478515625, -1.15338134765625, -1.0662841796875, -0.97918701171875, -0.89208984375, -0.80499267578125, -0.7178955078125, -0.63079833984375, -0.543701171875, -0.45660400390625, -0.3695068359375, -0.28240966796875, -0.1953125, -0.10821533203125, -0.0211181640625, 0.06597900390625, 0.153076171875, 0.24017333984375, 0.3272705078125, 0.41436767578125, 0.50146484375, 0.58856201171875, 0.6756591796875, 0.76275634765625, 0.849853515625, 0.93695068359375, 1.0240478515625, 1.11114501953125, 1.1982421875, 1.28533935546875, 1.3724365234375, 1.45953369140625, 1.546630859375, 1.63372802734375, 1.7208251953125, 1.80792236328125, 1.89501953125, 1.98211669921875, 2.0692138671875, 2.15631103515625, 2.243408203125, 2.33050537109375, 2.4176025390625, 2.50469970703125, 2.591796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 7.0, 5.0, 6.0, 16.0, 27.0, 50.0, 110.0, 203.0, 254.0, 146.0, 82.0, 32.0, 23.0, 15.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005054473876953125, -0.0004791766405105591, -0.00045290589332580566, -0.00042663514614105225, -0.00040036439895629883, -0.0003740936517715454, -0.000347822904586792, -0.0003215521574020386, -0.00029528141021728516, -0.00026901066303253174, -0.00024273991584777832, -0.0002164691686630249, -0.00019019842147827148, -0.00016392767429351807, -0.00013765692710876465, -0.00011138617992401123, -8.511543273925781e-05, -5.8844685554504395e-05, -3.2573938369750977e-05, -6.303191184997559e-06, 1.996755599975586e-05, 4.623830318450928e-05, 7.25090503692627e-05, 9.877979755401611e-05, 0.00012505054473876953, 0.00015132129192352295, 0.00017759203910827637, 0.00020386278629302979, 0.0002301335334777832, 0.0002564042806625366, 0.00028267502784729004, 0.00030894577503204346, 0.0003352165222167969, 0.0003614872694015503, 0.0003877580165863037, 0.00041402876377105713, 0.00044029951095581055, 0.00046657025814056396, 0.0004928410053253174, 0.0005191117525100708, 0.0005453824996948242, 0.0005716532468795776, 0.0005979239940643311, 0.0006241947412490845, 0.0006504654884338379, 0.0006767362356185913, 0.0007030069828033447, 0.0007292777299880981, 0.0007555484771728516, 0.000781819224357605, 0.0008080899715423584, 0.0008343607187271118, 0.0008606314659118652, 0.0008869022130966187, 0.0009131729602813721, 0.0009394437074661255, 0.0009657144546508789, 0.0009919852018356323, 0.0010182559490203857, 0.0010445266962051392, 0.0010707974433898926, 0.001097068190574646, 0.0011233389377593994, 0.0011496096849441528, 0.0011758804321289062]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 8.0, 4.0, 8.0, 10.0, 13.0, 26.0, 28.0, 54.0, 103.0, 162.0, 299.0, 749.0, 2159.0, 8135.0, 48848.0, 673448.0, 281373.0, 25465.0, 5018.0, 1435.0, 596.0, 266.0, 119.0, 71.0, 43.0, 40.0, 32.0, 11.0, 6.0, 9.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.399688720703125, -3.28179931640625, -3.163909912109375, -3.0460205078125, -2.928131103515625, -2.81024169921875, -2.692352294921875, -2.574462890625, -2.456573486328125, -2.33868408203125, -2.220794677734375, -2.1029052734375, -1.985015869140625, -1.86712646484375, -1.749237060546875, -1.63134765625, -1.513458251953125, -1.39556884765625, -1.277679443359375, -1.1597900390625, -1.041900634765625, -0.92401123046875, -0.806121826171875, -0.688232421875, -0.570343017578125, -0.45245361328125, -0.334564208984375, -0.2166748046875, -0.098785400390625, 0.01910400390625, 0.136993408203125, 0.2548828125, 0.372772216796875, 0.49066162109375, 0.608551025390625, 0.7264404296875, 0.844329833984375, 0.96221923828125, 1.080108642578125, 1.197998046875, 1.315887451171875, 1.43377685546875, 1.551666259765625, 1.6695556640625, 1.787445068359375, 1.90533447265625, 2.023223876953125, 2.14111328125, 2.259002685546875, 2.37689208984375, 2.494781494140625, 2.6126708984375, 2.730560302734375, 2.84844970703125, 2.966339111328125, 3.084228515625, 3.202117919921875, 3.32000732421875, 3.437896728515625, 3.5557861328125, 3.673675537109375, 3.79156494140625, 3.909454345703125, 4.02734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 12.0, 15.0, 22.0, 23.0, 19.0, 23.0, 36.0, 45.0, 70.0, 61.0, 97.0, 129.0, 78.0, 73.0, 45.0, 41.0, 30.0, 27.0, 28.0, 22.0, 19.0, 19.0, 12.0, 12.0, 9.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.015625, -1.958709716796875, -1.90179443359375, -1.844879150390625, -1.7879638671875, -1.731048583984375, -1.67413330078125, -1.617218017578125, -1.560302734375, -1.503387451171875, -1.44647216796875, -1.389556884765625, -1.3326416015625, -1.275726318359375, -1.21881103515625, -1.161895751953125, -1.10498046875, -1.048065185546875, -0.99114990234375, -0.934234619140625, -0.8773193359375, -0.820404052734375, -0.76348876953125, -0.706573486328125, -0.649658203125, -0.592742919921875, -0.53582763671875, -0.478912353515625, -0.4219970703125, -0.365081787109375, -0.30816650390625, -0.251251220703125, -0.1943359375, -0.137420654296875, -0.08050537109375, -0.023590087890625, 0.0333251953125, 0.090240478515625, 0.14715576171875, 0.204071044921875, 0.260986328125, 0.317901611328125, 0.37481689453125, 0.431732177734375, 0.4886474609375, 0.545562744140625, 0.60247802734375, 0.659393310546875, 0.71630859375, 0.773223876953125, 0.83013916015625, 0.887054443359375, 0.9439697265625, 1.000885009765625, 1.05780029296875, 1.114715576171875, 1.171630859375, 1.228546142578125, 1.28546142578125, 1.342376708984375, 1.3992919921875, 1.456207275390625, 1.51312255859375, 1.570037841796875, 1.626953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 3.0, 5.0, 15.0, 30.0, 48.0, 70.0, 99.0, 139.0, 155.0, 135.0, 103.0, 68.0, 54.0, 35.0, 23.0, 12.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.883092880249023, -26.001834869384766, -25.120576858520508, -24.23931884765625, -23.358062744140625, -22.476802825927734, -21.59554672241211, -20.71428871154785, -19.833030700683594, -18.951772689819336, -18.070514678955078, -17.18925666809082, -16.307998657226562, -15.426741600036621, -14.54548454284668, -13.664226531982422, -12.782968521118164, -11.901710510253906, -11.020452499389648, -10.139195442199707, -9.25793743133545, -8.376679420471191, -7.495421886444092, -6.614164352416992, -5.732906341552734, -4.851648330688477, -3.970390796661377, -3.0891330242156982, -2.2078752517700195, -1.3266172409057617, -0.4453597068786621, 0.4358978271484375, 1.3171539306640625, 2.198411703109741, 3.07966947555542, 3.9609272480010986, 4.842185020446777, 5.723443031311035, 6.604700565338135, 7.485958099365234, 8.367216110229492, 9.24847412109375, 10.129732131958008, 11.01098918914795, 11.892247200012207, 12.773505210876465, 13.654762268066406, 14.536020278930664, 15.417278289794922, 16.29853630065918, 17.179794311523438, 18.061052322387695, 18.942310333251953, 19.823566436767578, 20.704824447631836, 21.586082458496094, 22.46734046936035, 23.34859848022461, 24.229856491088867, 25.111114501953125, 25.99237060546875, 26.87363052368164, 27.754886627197266, 28.636144638061523, 29.51740264892578]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 14.0, 14.0, 12.0, 20.0, 13.0, 12.0, 18.0, 23.0, 18.0, 31.0, 40.0, 34.0, 45.0, 37.0, 41.0, 50.0, 59.0, 36.0, 50.0, 41.0, 50.0, 46.0, 36.0, 34.0, 34.0, 22.0, 24.0, 26.0, 13.0, 15.0, 12.0, 11.0, 9.0, 16.0, 7.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.448860168457031, -14.010856628417969, -13.572854042053223, -13.13485050201416, -12.696846961975098, -12.258844375610352, -11.820840835571289, -11.382837295532227, -10.944833755493164, -10.506830215454102, -10.068827629089355, -9.630824089050293, -9.19282054901123, -8.754817962646484, -8.316814422607422, -7.878810882568359, -7.440808296203613, -7.002805233001709, -6.5648016929626465, -6.126798629760742, -5.68879508972168, -5.250792026519775, -4.812788963317871, -4.374785423278809, -3.9367823600769043, -3.498779058456421, -3.0607757568359375, -2.622772693634033, -2.18476939201355, -1.7467660903930664, -1.308763027191162, -0.8707597255706787, -0.4327564239501953, 0.0052468180656433105, 0.44325006008148193, 0.8812532424926758, 1.3192565441131592, 1.7572598457336426, 2.195262908935547, 2.6332662105560303, 3.0712695121765137, 3.509272813796997, 3.9472761154174805, 4.385279178619385, 4.823282241821289, 5.261285781860352, 5.699288845062256, 6.13729190826416, 6.575295448303223, 7.013298511505127, 7.4513020515441895, 7.889305114746094, 8.327308654785156, 8.765312194824219, 9.203314781188965, 9.641318321228027, 10.079320907592773, 10.517324447631836, 10.955327033996582, 11.393330574035645, 11.831334114074707, 12.269336700439453, 12.707340240478516, 13.145343780517578, 13.58334732055664]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 4.0, 18.0, 14.0, 26.0, 34.0, 57.0, 83.0, 117.0, 171.0, 312.0, 521.0, 1043.0, 2530.0, 10723.0, 4021367.0, 145120.0, 7801.0, 2214.0, 903.0, 465.0, 279.0, 138.0, 91.0, 74.0, 65.0, 23.0, 23.0, 19.0, 19.0, 11.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.765625, -9.4595947265625, -9.153564453125, -8.8475341796875, -8.54150390625, -8.2354736328125, -7.929443359375, -7.6234130859375, -7.3173828125, -7.0113525390625, -6.705322265625, -6.3992919921875, -6.09326171875, -5.7872314453125, -5.481201171875, -5.1751708984375, -4.869140625, -4.5631103515625, -4.257080078125, -3.9510498046875, -3.64501953125, -3.3389892578125, -3.032958984375, -2.7269287109375, -2.4208984375, -2.1148681640625, -1.808837890625, -1.5028076171875, -1.19677734375, -0.8907470703125, -0.584716796875, -0.2786865234375, 0.02734375, 0.3333740234375, 0.639404296875, 0.9454345703125, 1.25146484375, 1.5574951171875, 1.863525390625, 2.1695556640625, 2.4755859375, 2.7816162109375, 3.087646484375, 3.3936767578125, 3.69970703125, 4.0057373046875, 4.311767578125, 4.6177978515625, 4.923828125, 5.2298583984375, 5.535888671875, 5.8419189453125, 6.14794921875, 6.4539794921875, 6.760009765625, 7.0660400390625, 7.3720703125, 7.6781005859375, 7.984130859375, 8.2901611328125, 8.59619140625, 8.9022216796875, 9.208251953125, 9.5142822265625, 9.8203125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 9.0, 6.0, 13.0, 13.0, 14.0, 21.0, 22.0, 24.0, 36.0, 41.0, 41.0, 57.0, 48.0, 43.0, 60.0, 55.0, 53.0, 56.0, 45.0, 46.0, 41.0, 43.0, 39.0, 31.0, 27.0, 21.0, 20.0, 12.0, 14.0, 10.0, 8.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.66845703125, -0.6507759094238281, -0.6330947875976562, -0.6154136657714844, -0.5977325439453125, -0.5800514221191406, -0.5623703002929688, -0.5446891784667969, -0.527008056640625, -0.5093269348144531, -0.49164581298828125, -0.4739646911621094, -0.4562835693359375, -0.4386024475097656, -0.42092132568359375, -0.4032402038574219, -0.38555908203125, -0.3678779602050781, -0.35019683837890625, -0.3325157165527344, -0.3148345947265625, -0.2971534729003906, -0.27947235107421875, -0.2617912292480469, -0.244110107421875, -0.22642898559570312, -0.20874786376953125, -0.19106674194335938, -0.1733856201171875, -0.15570449829101562, -0.13802337646484375, -0.12034225463867188, -0.1026611328125, -0.08498001098632812, -0.06729888916015625, -0.049617767333984375, -0.0319366455078125, -0.014255523681640625, 0.00342559814453125, 0.021106719970703125, 0.038787841796875, 0.056468963623046875, 0.07415008544921875, 0.09183120727539062, 0.1095123291015625, 0.12719345092773438, 0.14487457275390625, 0.16255569458007812, 0.18023681640625, 0.19791793823242188, 0.21559906005859375, 0.23328018188476562, 0.2509613037109375, 0.2686424255371094, 0.28632354736328125, 0.3040046691894531, 0.321685791015625, 0.3393669128417969, 0.35704803466796875, 0.3747291564941406, 0.3924102783203125, 0.4100914001464844, 0.42777252197265625, 0.4454536437988281, 0.463134765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 20.0, 19.0, 36.0, 50.0, 81.0, 120.0, 214.0, 344.0, 639.0, 1128.0, 2807.0, 16525.0, 4133298.0, 32222.0, 3677.0, 1348.0, 649.0, 404.0, 251.0, 127.0, 96.0, 79.0, 44.0, 20.0, 23.0, 9.0, 12.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8671875, -9.4820556640625, -9.096923828125, -8.7117919921875, -8.32666015625, -7.9415283203125, -7.556396484375, -7.1712646484375, -6.7861328125, -6.4010009765625, -6.015869140625, -5.6307373046875, -5.24560546875, -4.8604736328125, -4.475341796875, -4.0902099609375, -3.705078125, -3.3199462890625, -2.934814453125, -2.5496826171875, -2.16455078125, -1.7794189453125, -1.394287109375, -1.0091552734375, -0.6240234375, -0.2388916015625, 0.146240234375, 0.5313720703125, 0.91650390625, 1.3016357421875, 1.686767578125, 2.0718994140625, 2.45703125, 2.8421630859375, 3.227294921875, 3.6124267578125, 3.99755859375, 4.3826904296875, 4.767822265625, 5.1529541015625, 5.5380859375, 5.9232177734375, 6.308349609375, 6.6934814453125, 7.07861328125, 7.4637451171875, 7.848876953125, 8.2340087890625, 8.619140625, 9.0042724609375, 9.389404296875, 9.7745361328125, 10.15966796875, 10.5447998046875, 10.929931640625, 11.3150634765625, 11.7001953125, 12.0853271484375, 12.470458984375, 12.8555908203125, 13.24072265625, 13.6258544921875, 14.010986328125, 14.3961181640625, 14.78125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 14.0, 20.0, 20.0, 79.0, 3673.0, 204.0, 29.0, 18.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.139495849609375, -1.08172607421875, -1.023956298828125, -0.9661865234375, -0.908416748046875, -0.85064697265625, -0.792877197265625, -0.735107421875, -0.677337646484375, -0.61956787109375, -0.561798095703125, -0.5040283203125, -0.446258544921875, -0.38848876953125, -0.330718994140625, -0.27294921875, -0.215179443359375, -0.15740966796875, -0.099639892578125, -0.0418701171875, 0.015899658203125, 0.07366943359375, 0.131439208984375, 0.189208984375, 0.246978759765625, 0.30474853515625, 0.362518310546875, 0.4202880859375, 0.478057861328125, 0.53582763671875, 0.593597412109375, 0.6513671875, 0.709136962890625, 0.76690673828125, 0.824676513671875, 0.8824462890625, 0.940216064453125, 0.99798583984375, 1.055755615234375, 1.113525390625, 1.171295166015625, 1.22906494140625, 1.286834716796875, 1.3446044921875, 1.402374267578125, 1.46014404296875, 1.517913818359375, 1.57568359375, 1.633453369140625, 1.69122314453125, 1.748992919921875, 1.8067626953125, 1.864532470703125, 1.92230224609375, 1.980072021484375, 2.037841796875, 2.095611572265625, 2.15338134765625, 2.211151123046875, 2.2689208984375, 2.326690673828125, 2.38446044921875, 2.442230224609375, 2.5]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 11.0, 15.0, 28.0, 44.0, 52.0, 103.0, 118.0, 161.0, 133.0, 118.0, 74.0, 40.0, 45.0, 30.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.795115947723389, -5.637499809265137, -5.479883670806885, -5.322267532348633, -5.164651393890381, -5.007035255432129, -4.849419116973877, -4.691802978515625, -4.534186840057373, -4.376570701599121, -4.218954563140869, -4.061338424682617, -3.9037222862243652, -3.7461061477661133, -3.5884900093078613, -3.4308738708496094, -3.2732574939727783, -3.1156413555145264, -2.9580252170562744, -2.8004090785980225, -2.6427929401397705, -2.4851768016815186, -2.3275604248046875, -2.1699442863464355, -2.0123281478881836, -1.8547120094299316, -1.6970958709716797, -1.5394797325134277, -1.3818635940551758, -1.2242474555969238, -1.0666311979293823, -0.9090150594711304, -0.751399040222168, -0.593782901763916, -0.4361667335033417, -0.27855056524276733, -0.12093442678451538, 0.03668171167373657, 0.1942979097366333, 0.35191404819488525, 0.5095301866531372, 0.6671463251113892, 0.8247624635696411, 0.9823786616325378, 1.1399948596954346, 1.2976109981536865, 1.4552271366119385, 1.6128432750701904, 1.7704594135284424, 1.9280755519866943, 2.0856916904449463, 2.2433078289031982, 2.40092396736145, 2.558540105819702, 2.716156482696533, 2.873772621154785, 3.031388759613037, 3.189004898071289, 3.346621036529541, 3.504237174987793, 3.661853313446045, 3.819469451904297, 3.977085590362549, 4.134701728820801, 4.292317867279053]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 15.0, 10.0, 15.0, 15.0, 22.0, 28.0, 22.0, 35.0, 38.0, 39.0, 54.0, 52.0, 40.0, 59.0, 62.0, 51.0, 52.0, 44.0, 42.0, 44.0, 43.0, 40.0, 32.0, 20.0, 28.0, 16.0, 21.0, 12.0, 13.0, 3.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.0149853229522705, -2.9304065704345703, -2.845827579498291, -2.761248826980591, -2.6766700744628906, -2.5920910835266113, -2.507512331008911, -2.422933578491211, -2.3383545875549316, -2.2537758350372314, -2.169196844100952, -2.084618091583252, -2.0000391006469727, -1.9154603481292725, -1.8308815956115723, -1.7463027238845825, -1.6617238521575928, -1.577144980430603, -1.4925661087036133, -1.407987356185913, -1.3234084844589233, -1.2388296127319336, -1.1542508602142334, -1.0696719884872437, -0.9850931167602539, -0.9005142450332642, -0.8159354329109192, -0.7313566207885742, -0.6467777490615845, -0.5621988773345947, -0.47762006521224976, -0.3930412530899048, -0.30846214294433594, -0.22388330101966858, -0.13930445909500122, -0.05472561717033386, 0.029853224754333496, 0.11443206667900085, 0.1990109086036682, 0.2835897207260132, 0.36816859245300293, 0.4527474343776703, 0.5373262763023376, 0.6219050884246826, 0.7064839601516724, 0.7910628318786621, 0.8756416440010071, 0.960220456123352, 1.0447993278503418, 1.1293781995773315, 1.2139570713043213, 1.2985358238220215, 1.3831146955490112, 1.467693567276001, 1.5522723197937012, 1.636851191520691, 1.7214300632476807, 1.8060089349746704, 1.8905878067016602, 1.9751665592193604, 2.0597453117370605, 2.14432430267334, 2.22890305519104, 2.3134818077087402, 2.3980607986450195]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 9.0, 18.0, 14.0, 37.0, 27.0, 56.0, 76.0, 107.0, 156.0, 224.0, 384.0, 580.0, 941.0, 1490.0, 2352.0, 4153.0, 7384.0, 13641.0, 26413.0, 54319.0, 117049.0, 236068.0, 277073.0, 157511.0, 73233.0, 35115.0, 17608.0, 9382.0, 5213.0, 2922.0, 1836.0, 1131.0, 664.0, 465.0, 278.0, 195.0, 137.0, 100.0, 59.0, 40.0, 23.0, 15.0, 17.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.97265625, -1.909423828125, -1.84619140625, -1.782958984375, -1.7197265625, -1.656494140625, -1.59326171875, -1.530029296875, -1.466796875, -1.403564453125, -1.34033203125, -1.277099609375, -1.2138671875, -1.150634765625, -1.08740234375, -1.024169921875, -0.9609375, -0.897705078125, -0.83447265625, -0.771240234375, -0.7080078125, -0.644775390625, -0.58154296875, -0.518310546875, -0.455078125, -0.391845703125, -0.32861328125, -0.265380859375, -0.2021484375, -0.138916015625, -0.07568359375, -0.012451171875, 0.05078125, 0.114013671875, 0.17724609375, 0.240478515625, 0.3037109375, 0.366943359375, 0.43017578125, 0.493408203125, 0.556640625, 0.619873046875, 0.68310546875, 0.746337890625, 0.8095703125, 0.872802734375, 0.93603515625, 0.999267578125, 1.0625, 1.125732421875, 1.18896484375, 1.252197265625, 1.3154296875, 1.378662109375, 1.44189453125, 1.505126953125, 1.568359375, 1.631591796875, 1.69482421875, 1.758056640625, 1.8212890625, 1.884521484375, 1.94775390625, 2.010986328125, 2.07421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 6.0, 3.0, 2.0, 2.0, 4.0, 11.0, 6.0, 8.0, 14.0, 16.0, 13.0, 28.0, 28.0, 41.0, 34.0, 40.0, 39.0, 56.0, 48.0, 46.0, 59.0, 45.0, 45.0, 52.0, 53.0, 49.0, 42.0, 37.0, 34.0, 28.0, 29.0, 17.0, 14.0, 11.0, 7.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.76220703125, -0.7416000366210938, -0.7209930419921875, -0.7003860473632812, -0.679779052734375, -0.6591720581054688, -0.6385650634765625, -0.6179580688476562, -0.59735107421875, -0.5767440795898438, -0.5561370849609375, -0.5355300903320312, -0.514923095703125, -0.49431610107421875, -0.4737091064453125, -0.45310211181640625, -0.4324951171875, -0.41188812255859375, -0.3912811279296875, -0.37067413330078125, -0.350067138671875, -0.32946014404296875, -0.3088531494140625, -0.28824615478515625, -0.26763916015625, -0.24703216552734375, -0.2264251708984375, -0.20581817626953125, -0.185211181640625, -0.16460418701171875, -0.1439971923828125, -0.12339019775390625, -0.102783203125, -0.08217620849609375, -0.0615692138671875, -0.04096221923828125, -0.020355224609375, 0.00025177001953125, 0.0208587646484375, 0.04146575927734375, 0.06207275390625, 0.08267974853515625, 0.1032867431640625, 0.12389373779296875, 0.144500732421875, 0.16510772705078125, 0.1857147216796875, 0.20632171630859375, 0.2269287109375, 0.24753570556640625, 0.2681427001953125, 0.28874969482421875, 0.309356689453125, 0.32996368408203125, 0.3505706787109375, 0.37117767333984375, 0.39178466796875, 0.41239166259765625, 0.4329986572265625, 0.45360565185546875, 0.474212646484375, 0.49481964111328125, 0.5154266357421875, 0.5360336303710938, 0.556640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 11.0, 10.0, 14.0, 20.0, 17.0, 31.0, 35.0, 51.0, 89.0, 122.0, 132.0, 223.0, 324.0, 583.0, 1085.0, 2379.0, 6457.0, 21803.0, 103123.0, 573294.0, 272968.0, 46495.0, 11488.0, 3877.0, 1574.0, 849.0, 455.0, 325.0, 191.0, 135.0, 94.0, 63.0, 43.0, 33.0, 27.0, 24.0, 20.0, 21.0, 15.0, 8.0, 6.0, 4.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.9453125, -4.798828125, -4.65234375, -4.505859375, -4.359375, -4.212890625, -4.06640625, -3.919921875, -3.7734375, -3.626953125, -3.48046875, -3.333984375, -3.1875, -3.041015625, -2.89453125, -2.748046875, -2.6015625, -2.455078125, -2.30859375, -2.162109375, -2.015625, -1.869140625, -1.72265625, -1.576171875, -1.4296875, -1.283203125, -1.13671875, -0.990234375, -0.84375, -0.697265625, -0.55078125, -0.404296875, -0.2578125, -0.111328125, 0.03515625, 0.181640625, 0.328125, 0.474609375, 0.62109375, 0.767578125, 0.9140625, 1.060546875, 1.20703125, 1.353515625, 1.5, 1.646484375, 1.79296875, 1.939453125, 2.0859375, 2.232421875, 2.37890625, 2.525390625, 2.671875, 2.818359375, 2.96484375, 3.111328125, 3.2578125, 3.404296875, 3.55078125, 3.697265625, 3.84375, 3.990234375, 4.13671875, 4.283203125, 4.4296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 10.0, 6.0, 4.0, 3.0, 14.0, 18.0, 22.0, 16.0, 19.0, 23.0, 22.0, 24.0, 36.0, 38.0, 41.0, 45.0, 42.0, 40.0, 49.0, 33.0, 35.0, 29.0, 39.0, 38.0, 38.0, 30.0, 36.0, 35.0, 30.0, 34.0, 22.0, 19.0, 18.0, 10.0, 13.0, 16.0, 13.0, 5.0, 7.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.42578125, -3.32196044921875, -3.2181396484375, -3.11431884765625, -3.010498046875, -2.90667724609375, -2.8028564453125, -2.69903564453125, -2.59521484375, -2.49139404296875, -2.3875732421875, -2.28375244140625, -2.179931640625, -2.07611083984375, -1.9722900390625, -1.86846923828125, -1.7646484375, -1.66082763671875, -1.5570068359375, -1.45318603515625, -1.349365234375, -1.24554443359375, -1.1417236328125, -1.03790283203125, -0.93408203125, -0.83026123046875, -0.7264404296875, -0.62261962890625, -0.518798828125, -0.41497802734375, -0.3111572265625, -0.20733642578125, -0.103515625, 0.00030517578125, 0.1041259765625, 0.20794677734375, 0.311767578125, 0.41558837890625, 0.5194091796875, 0.62322998046875, 0.72705078125, 0.83087158203125, 0.9346923828125, 1.03851318359375, 1.142333984375, 1.24615478515625, 1.3499755859375, 1.45379638671875, 1.5576171875, 1.66143798828125, 1.7652587890625, 1.86907958984375, 1.972900390625, 2.07672119140625, 2.1805419921875, 2.28436279296875, 2.38818359375, 2.49200439453125, 2.5958251953125, 2.69964599609375, 2.803466796875, 2.90728759765625, 3.0111083984375, 3.11492919921875, 3.21875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 17.0, 25.0, 43.0, 70.0, 91.0, 195.0, 336.0, 659.0, 1178.0, 2582.0, 6232.0, 17504.0, 64087.0, 334549.0, 490308.0, 92994.0, 23341.0, 8047.0, 3182.0, 1427.0, 778.0, 387.0, 184.0, 100.0, 66.0, 55.0, 30.0, 26.0, 12.0, 8.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4375, -2.36810302734375, -2.2987060546875, -2.22930908203125, -2.159912109375, -2.09051513671875, -2.0211181640625, -1.95172119140625, -1.88232421875, -1.81292724609375, -1.7435302734375, -1.67413330078125, -1.604736328125, -1.53533935546875, -1.4659423828125, -1.39654541015625, -1.3271484375, -1.25775146484375, -1.1883544921875, -1.11895751953125, -1.049560546875, -0.98016357421875, -0.9107666015625, -0.84136962890625, -0.77197265625, -0.70257568359375, -0.6331787109375, -0.56378173828125, -0.494384765625, -0.42498779296875, -0.3555908203125, -0.28619384765625, -0.216796875, -0.14739990234375, -0.0780029296875, -0.00860595703125, 0.060791015625, 0.13018798828125, 0.1995849609375, 0.26898193359375, 0.33837890625, 0.40777587890625, 0.4771728515625, 0.54656982421875, 0.615966796875, 0.68536376953125, 0.7547607421875, 0.82415771484375, 0.8935546875, 0.96295166015625, 1.0323486328125, 1.10174560546875, 1.171142578125, 1.24053955078125, 1.3099365234375, 1.37933349609375, 1.44873046875, 1.51812744140625, 1.5875244140625, 1.65692138671875, 1.726318359375, 1.79571533203125, 1.8651123046875, 1.93450927734375, 2.00390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 14.0, 23.0, 34.0, 43.0, 56.0, 79.0, 146.0, 116.0, 116.0, 95.0, 74.0, 56.0, 37.0, 31.0, 15.0, 11.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005960464477539062, -0.0005787909030914307, -0.0005615353584289551, -0.0005442798137664795, -0.0005270242691040039, -0.0005097687244415283, -0.0004925131797790527, -0.00047525763511657715, -0.00045800209045410156, -0.000440746545791626, -0.0004234910011291504, -0.0004062354564666748, -0.0003889799118041992, -0.00037172436714172363, -0.00035446882247924805, -0.00033721327781677246, -0.0003199577331542969, -0.0003027021884918213, -0.0002854466438293457, -0.0002681910991668701, -0.00025093555450439453, -0.00023368000984191895, -0.00021642446517944336, -0.00019916892051696777, -0.0001819133758544922, -0.0001646578311920166, -0.00014740228652954102, -0.00013014674186706543, -0.00011289119720458984, -9.563565254211426e-05, -7.838010787963867e-05, -6.112456321716309e-05, -4.38690185546875e-05, -2.6613473892211914e-05, -9.357929229736328e-06, 7.897615432739258e-06, 2.5153160095214844e-05, 4.240870475769043e-05, 5.9664249420166016e-05, 7.69197940826416e-05, 9.417533874511719e-05, 0.00011143088340759277, 0.00012868642807006836, 0.00014594197273254395, 0.00016319751739501953, 0.00018045306205749512, 0.0001977086067199707, 0.0002149641513824463, 0.00023221969604492188, 0.00024947524070739746, 0.00026673078536987305, 0.00028398633003234863, 0.0003012418746948242, 0.0003184974193572998, 0.0003357529640197754, 0.000353008508682251, 0.00037026405334472656, 0.00038751959800720215, 0.00040477514266967773, 0.0004220306873321533, 0.0004392862319946289, 0.0004565417766571045, 0.0004737973213195801, 0.0004910528659820557, 0.0005083084106445312]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 3.0, 2.0, 13.0, 14.0, 33.0, 30.0, 36.0, 71.0, 123.0, 236.0, 395.0, 878.0, 1984.0, 6933.0, 40426.0, 581068.0, 378751.0, 28579.0, 5566.0, 1782.0, 760.0, 357.0, 174.0, 116.0, 65.0, 40.0, 33.0, 22.0, 16.0, 8.0, 4.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.427734375, -3.320343017578125, -3.21295166015625, -3.105560302734375, -2.9981689453125, -2.890777587890625, -2.78338623046875, -2.675994873046875, -2.568603515625, -2.461212158203125, -2.35382080078125, -2.246429443359375, -2.1390380859375, -2.031646728515625, -1.92425537109375, -1.816864013671875, -1.70947265625, -1.602081298828125, -1.49468994140625, -1.387298583984375, -1.2799072265625, -1.172515869140625, -1.06512451171875, -0.957733154296875, -0.850341796875, -0.742950439453125, -0.63555908203125, -0.528167724609375, -0.4207763671875, -0.313385009765625, -0.20599365234375, -0.098602294921875, 0.0087890625, 0.116180419921875, 0.22357177734375, 0.330963134765625, 0.4383544921875, 0.545745849609375, 0.65313720703125, 0.760528564453125, 0.867919921875, 0.975311279296875, 1.08270263671875, 1.190093994140625, 1.2974853515625, 1.404876708984375, 1.51226806640625, 1.619659423828125, 1.72705078125, 1.834442138671875, 1.94183349609375, 2.049224853515625, 2.1566162109375, 2.264007568359375, 2.37139892578125, 2.478790283203125, 2.586181640625, 2.693572998046875, 2.80096435546875, 2.908355712890625, 3.0157470703125, 3.123138427734375, 3.23052978515625, 3.337921142578125, 3.4453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 16.0, 14.0, 25.0, 36.0, 42.0, 50.0, 67.0, 90.0, 104.0, 107.0, 100.0, 83.0, 67.0, 44.0, 31.0, 32.0, 21.0, 17.0, 10.0, 12.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.12109375, -3.0490570068359375, -2.977020263671875, -2.9049835205078125, -2.83294677734375, -2.7609100341796875, -2.688873291015625, -2.6168365478515625, -2.5447998046875, -2.4727630615234375, -2.400726318359375, -2.3286895751953125, -2.25665283203125, -2.1846160888671875, -2.112579345703125, -2.0405426025390625, -1.968505859375, -1.8964691162109375, -1.824432373046875, -1.7523956298828125, -1.68035888671875, -1.6083221435546875, -1.536285400390625, -1.4642486572265625, -1.3922119140625, -1.3201751708984375, -1.248138427734375, -1.1761016845703125, -1.10406494140625, -1.0320281982421875, -0.959991455078125, -0.8879547119140625, -0.81591796875, -0.7438812255859375, -0.671844482421875, -0.5998077392578125, -0.52777099609375, -0.4557342529296875, -0.383697509765625, -0.3116607666015625, -0.2396240234375, -0.1675872802734375, -0.095550537109375, -0.0235137939453125, 0.04852294921875, 0.1205596923828125, 0.192596435546875, 0.2646331787109375, 0.336669921875, 0.4087066650390625, 0.480743408203125, 0.5527801513671875, 0.62481689453125, 0.6968536376953125, 0.768890380859375, 0.8409271240234375, 0.9129638671875, 0.9850006103515625, 1.057037353515625, 1.1290740966796875, 1.20111083984375, 1.2731475830078125, 1.345184326171875, 1.4172210693359375, 1.4892578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 10.0, 10.0, 18.0, 44.0, 85.0, 144.0, 205.0, 193.0, 141.0, 87.0, 42.0, 18.0, 8.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0272216796875, -63.392906188964844, -61.75859451293945, -60.1242790222168, -58.489967346191406, -56.85565185546875, -55.221336364746094, -53.58702087402344, -51.95270919799805, -50.31839370727539, -48.68408203125, -47.049766540527344, -45.41545104980469, -43.7811393737793, -42.14682388305664, -40.51251220703125, -38.878196716308594, -37.24388122558594, -35.60956954956055, -33.97525405883789, -32.3409423828125, -30.706626892089844, -29.072311401367188, -27.437997817993164, -25.80368423461914, -24.169370651245117, -22.535057067871094, -20.900741577148438, -19.266427993774414, -17.63211441040039, -15.99779987335205, -14.363485336303711, -12.729175567626953, -11.09486198425293, -9.46054744720459, -7.826233386993408, -6.191919326782227, -4.557605743408203, -2.9232912063598633, -1.2889766693115234, 0.3453369140625, 1.9796509742736816, 3.6139650344848633, 5.248279094696045, 6.882593154907227, 8.51690673828125, 10.15122127532959, 11.78553581237793, 13.419849395751953, 15.054162979125977, 16.6884765625, 18.322792053222656, 19.95710563659668, 21.591419219970703, 23.22573471069336, 24.860048294067383, 26.494361877441406, 28.12867546081543, 29.762989044189453, 31.39730453491211, 33.0316162109375, 34.665931701660156, 36.30024719238281, 37.93456268310547, 39.56887435913086]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 6.0, 2.0, 10.0, 9.0, 17.0, 8.0, 11.0, 7.0, 19.0, 15.0, 26.0, 28.0, 26.0, 29.0, 36.0, 42.0, 30.0, 48.0, 53.0, 55.0, 48.0, 45.0, 48.0, 35.0, 43.0, 33.0, 39.0, 40.0, 21.0, 25.0, 21.0, 22.0, 22.0, 13.0, 11.0, 7.0, 14.0, 6.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.641098022460938, -17.076351165771484, -16.51160430908203, -15.946857452392578, -15.382111549377441, -14.817364692687988, -14.252617835998535, -13.687870979309082, -13.123125076293945, -12.558378219604492, -11.993631362915039, -11.428884506225586, -10.86413860321045, -10.299391746520996, -9.734644889831543, -9.16989803314209, -8.605151176452637, -8.040404319763184, -7.475657939910889, -6.9109110832214355, -6.346164703369141, -5.7814178466796875, -5.216670989990234, -4.651924133300781, -4.087177753448486, -3.5224311351776123, -2.9576845169067383, -2.392937660217285, -1.8281910419464111, -1.263444423675537, -0.698697566986084, -0.13395094871520996, 0.43079566955566406, 0.9955423474311829, 1.5602890253067017, 2.1250357627868652, 2.6897823810577393, 3.2545289993286133, 3.8192758560180664, 4.3840227127075195, 4.9487690925598145, 5.513515949249268, 6.0782623291015625, 6.643009185791016, 7.207756042480469, 7.772502422332764, 8.337249755859375, 8.901995658874512, 9.466742515563965, 10.031489372253418, 10.596236228942871, 11.160982131958008, 11.725728988647461, 12.290475845336914, 12.855222702026367, 13.41996955871582, 13.984716415405273, 14.549463272094727, 15.11421012878418, 15.678956985473633, 16.243703842163086, 16.808448791503906, 17.37319564819336, 17.937942504882812, 18.502689361572266]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 2.0, 9.0, 6.0, 9.0, 16.0, 19.0, 29.0, 46.0, 49.0, 66.0, 106.0, 157.0, 246.0, 293.0, 516.0, 765.0, 1267.0, 2184.0, 4181.0, 9544.0, 44636.0, 4064502.0, 45643.0, 10023.0, 4229.0, 2246.0, 1310.0, 714.0, 490.0, 327.0, 223.0, 134.0, 91.0, 69.0, 46.0, 32.0, 12.0, 11.0, 7.0, 4.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.962646484375, -5.78466796875, -5.606689453125, -5.4287109375, -5.250732421875, -5.07275390625, -4.894775390625, -4.716796875, -4.538818359375, -4.36083984375, -4.182861328125, -4.0048828125, -3.826904296875, -3.64892578125, -3.470947265625, -3.29296875, -3.114990234375, -2.93701171875, -2.759033203125, -2.5810546875, -2.403076171875, -2.22509765625, -2.047119140625, -1.869140625, -1.691162109375, -1.51318359375, -1.335205078125, -1.1572265625, -0.979248046875, -0.80126953125, -0.623291015625, -0.4453125, -0.267333984375, -0.08935546875, 0.088623046875, 0.2666015625, 0.444580078125, 0.62255859375, 0.800537109375, 0.978515625, 1.156494140625, 1.33447265625, 1.512451171875, 1.6904296875, 1.868408203125, 2.04638671875, 2.224365234375, 2.40234375, 2.580322265625, 2.75830078125, 2.936279296875, 3.1142578125, 3.292236328125, 3.47021484375, 3.648193359375, 3.826171875, 4.004150390625, 4.18212890625, 4.360107421875, 4.5380859375, 4.716064453125, 4.89404296875, 5.072021484375, 5.25]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 2.0, 8.0, 7.0, 12.0, 12.0, 24.0, 14.0, 30.0, 35.0, 41.0, 58.0, 52.0, 72.0, 58.0, 74.0, 74.0, 59.0, 53.0, 66.0, 51.0, 40.0, 40.0, 32.0, 19.0, 15.0, 5.0, 13.0, 9.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99609375, -0.9682388305664062, -0.9403839111328125, -0.9125289916992188, -0.884674072265625, -0.8568191528320312, -0.8289642333984375, -0.8011093139648438, -0.77325439453125, -0.7453994750976562, -0.7175445556640625, -0.6896896362304688, -0.661834716796875, -0.6339797973632812, -0.6061248779296875, -0.5782699584960938, -0.5504150390625, -0.5225601196289062, -0.4947052001953125, -0.46685028076171875, -0.438995361328125, -0.41114044189453125, -0.3832855224609375, -0.35543060302734375, -0.32757568359375, -0.29972076416015625, -0.2718658447265625, -0.24401092529296875, -0.216156005859375, -0.18830108642578125, -0.1604461669921875, -0.13259124755859375, -0.104736328125, -0.07688140869140625, -0.0490264892578125, -0.02117156982421875, 0.006683349609375, 0.03453826904296875, 0.0623931884765625, 0.09024810791015625, 0.11810302734375, 0.14595794677734375, 0.1738128662109375, 0.20166778564453125, 0.229522705078125, 0.25737762451171875, 0.2852325439453125, 0.31308746337890625, 0.3409423828125, 0.36879730224609375, 0.3966522216796875, 0.42450714111328125, 0.452362060546875, 0.48021697998046875, 0.5080718994140625, 0.5359268188476562, 0.56378173828125, 0.5916366577148438, 0.6194915771484375, 0.6473464965820312, 0.675201416015625, 0.7030563354492188, 0.7309112548828125, 0.7587661743164062, 0.78662109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 12.0, 12.0, 12.0, 22.0, 30.0, 36.0, 32.0, 47.0, 86.0, 89.0, 120.0, 172.0, 286.0, 429.0, 734.0, 1205.0, 2380.0, 5659.0, 18576.0, 333027.0, 3798228.0, 20828.0, 6133.0, 2584.0, 1337.0, 714.0, 461.0, 299.0, 171.0, 130.0, 85.0, 70.0, 56.0, 32.0, 39.0, 27.0, 21.0, 19.0, 11.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0], "bins": [-7.83984375, -7.60260009765625, -7.3653564453125, -7.12811279296875, -6.890869140625, -6.65362548828125, -6.4163818359375, -6.17913818359375, -5.94189453125, -5.70465087890625, -5.4674072265625, -5.23016357421875, -4.992919921875, -4.75567626953125, -4.5184326171875, -4.28118896484375, -4.0439453125, -3.80670166015625, -3.5694580078125, -3.33221435546875, -3.094970703125, -2.85772705078125, -2.6204833984375, -2.38323974609375, -2.14599609375, -1.90875244140625, -1.6715087890625, -1.43426513671875, -1.197021484375, -0.95977783203125, -0.7225341796875, -0.48529052734375, -0.248046875, -0.01080322265625, 0.2264404296875, 0.46368408203125, 0.700927734375, 0.93817138671875, 1.1754150390625, 1.41265869140625, 1.64990234375, 1.88714599609375, 2.1243896484375, 2.36163330078125, 2.598876953125, 2.83612060546875, 3.0733642578125, 3.31060791015625, 3.5478515625, 3.78509521484375, 4.0223388671875, 4.25958251953125, 4.496826171875, 4.73406982421875, 4.9713134765625, 5.20855712890625, 5.44580078125, 5.68304443359375, 5.9202880859375, 6.15753173828125, 6.394775390625, 6.63201904296875, 6.8692626953125, 7.10650634765625, 7.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 7.0, 12.0, 16.0, 16.0, 55.0, 241.0, 3558.0, 87.0, 27.0, 15.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.162109375, -2.0970458984375, -2.031982421875, -1.9669189453125, -1.90185546875, -1.8367919921875, -1.771728515625, -1.7066650390625, -1.6416015625, -1.5765380859375, -1.511474609375, -1.4464111328125, -1.38134765625, -1.3162841796875, -1.251220703125, -1.1861572265625, -1.12109375, -1.0560302734375, -0.990966796875, -0.9259033203125, -0.86083984375, -0.7957763671875, -0.730712890625, -0.6656494140625, -0.6005859375, -0.5355224609375, -0.470458984375, -0.4053955078125, -0.34033203125, -0.2752685546875, -0.210205078125, -0.1451416015625, -0.080078125, -0.0150146484375, 0.050048828125, 0.1151123046875, 0.18017578125, 0.2452392578125, 0.310302734375, 0.3753662109375, 0.4404296875, 0.5054931640625, 0.570556640625, 0.6356201171875, 0.70068359375, 0.7657470703125, 0.830810546875, 0.8958740234375, 0.9609375, 1.0260009765625, 1.091064453125, 1.1561279296875, 1.22119140625, 1.2862548828125, 1.351318359375, 1.4163818359375, 1.4814453125, 1.5465087890625, 1.611572265625, 1.6766357421875, 1.74169921875, 1.8067626953125, 1.871826171875, 1.9368896484375, 2.001953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 6.0, 3.0, 7.0, 13.0, 12.0, 18.0, 23.0, 26.0, 35.0, 44.0, 53.0, 38.0, 60.0, 66.0, 77.0, 96.0, 73.0, 65.0, 55.0, 50.0, 43.0, 26.0, 16.0, 18.0, 19.0, 10.0, 12.0, 4.0, 10.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.223165273666382, -3.1176178455352783, -3.012070417404175, -2.9065229892730713, -2.8009753227233887, -2.695427894592285, -2.5898804664611816, -2.484333038330078, -2.3787856101989746, -2.273238182067871, -2.1676907539367676, -2.062143325805664, -1.956595778465271, -1.8510483503341675, -1.7455008029937744, -1.639953374862671, -1.5344059467315674, -1.4288585186004639, -1.3233110904693604, -1.2177635431289673, -1.1122161149978638, -1.0066686868667603, -0.901121199131012, -0.7955737113952637, -0.6900262832641602, -0.5844788551330566, -0.47893136739730835, -0.37338390946388245, -0.26783645153045654, -0.16228902339935303, -0.056741535663604736, 0.048805952072143555, 0.15435314178466797, 0.25990059971809387, 0.3654480576515198, 0.4709955155849457, 0.5765429735183716, 0.6820904016494751, 0.7876378893852234, 0.8931853771209717, 0.9987328052520752, 1.1042802333831787, 1.2098276615142822, 1.3153752088546753, 1.4209226369857788, 1.5264700651168823, 1.6320176124572754, 1.737565040588379, 1.8431124687194824, 1.948659896850586, 2.0542073249816895, 2.159754753112793, 2.2653021812438965, 2.370849609375, 2.4763972759246826, 2.581944704055786, 2.6874921321868896, 2.793039560317993, 2.8985869884490967, 3.0041344165802, 3.109682083129883, 3.2152295112609863, 3.32077693939209, 3.4263243675231934, 3.531871795654297]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 11.0, 4.0, 14.0, 19.0, 8.0, 15.0, 17.0, 28.0, 20.0, 28.0, 26.0, 43.0, 44.0, 47.0, 36.0, 43.0, 47.0, 45.0, 49.0, 53.0, 49.0, 47.0, 30.0, 34.0, 29.0, 22.0, 28.0, 24.0, 23.0, 24.0, 14.0, 13.0, 13.0, 13.0, 5.0, 7.0, 8.0, 2.0, 2.0, 0.0, 6.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.157294273376465, -3.057957887649536, -2.9586212635040283, -2.8592848777770996, -2.759948253631592, -2.660611867904663, -2.5612754821777344, -2.4619388580322266, -2.362602472305298, -2.263266086578369, -2.1639294624328613, -2.0645930767059326, -1.9652565717697144, -1.865920066833496, -1.7665836811065674, -1.6672471761703491, -1.5679106712341309, -1.4685741662979126, -1.3692376613616943, -1.2699012756347656, -1.1705647706985474, -1.071228265762329, -0.9718918204307556, -0.8725553750991821, -0.7732188701629639, -0.6738823652267456, -0.5745459198951721, -0.47520944476127625, -0.37587296962738037, -0.2765364944934845, -0.17720001935958862, -0.07786357402801514, 0.021472692489624023, 0.1208091676235199, 0.22014564275741577, 0.31948211789131165, 0.4188185930252075, 0.5181550979614258, 0.6174915432929993, 0.7168279886245728, 0.816164493560791, 0.9155009984970093, 1.0148375034332275, 1.1141738891601562, 1.2135103940963745, 1.3128468990325928, 1.4121832847595215, 1.5115197896957397, 1.610856294631958, 1.7101927995681763, 1.8095293045043945, 1.9088656902313232, 2.008202075958252, 2.1075387001037598, 2.2068750858306885, 2.306211471557617, 2.405548095703125, 2.5048844814300537, 2.6042211055755615, 2.7035574913024902, 2.802894115447998, 2.9022305011749268, 3.0015668869018555, 3.1009035110473633, 3.200239896774292]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 12.0, 18.0, 29.0, 31.0, 58.0, 82.0, 113.0, 179.0, 296.0, 452.0, 782.0, 1274.0, 2141.0, 3413.0, 5938.0, 10197.0, 18704.0, 34920.0, 70253.0, 148038.0, 282314.0, 236641.0, 113702.0, 54887.0, 28023.0, 15121.0, 8473.0, 5026.0, 2849.0, 1714.0, 1050.0, 655.0, 380.0, 263.0, 184.0, 113.0, 75.0, 44.0, 36.0, 19.0, 23.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.7080078125, -1.658966064453125, -1.60992431640625, -1.560882568359375, -1.5118408203125, -1.462799072265625, -1.41375732421875, -1.364715576171875, -1.315673828125, -1.266632080078125, -1.21759033203125, -1.168548583984375, -1.1195068359375, -1.070465087890625, -1.02142333984375, -0.972381591796875, -0.92333984375, -0.874298095703125, -0.82525634765625, -0.776214599609375, -0.7271728515625, -0.678131103515625, -0.62908935546875, -0.580047607421875, -0.531005859375, -0.481964111328125, -0.43292236328125, -0.383880615234375, -0.3348388671875, -0.285797119140625, -0.23675537109375, -0.187713623046875, -0.138671875, -0.089630126953125, -0.04058837890625, 0.008453369140625, 0.0574951171875, 0.106536865234375, 0.15557861328125, 0.204620361328125, 0.253662109375, 0.302703857421875, 0.35174560546875, 0.400787353515625, 0.4498291015625, 0.498870849609375, 0.54791259765625, 0.596954345703125, 0.64599609375, 0.695037841796875, 0.74407958984375, 0.793121337890625, 0.8421630859375, 0.891204833984375, 0.94024658203125, 0.989288330078125, 1.038330078125, 1.087371826171875, 1.13641357421875, 1.185455322265625, 1.2344970703125, 1.283538818359375, 1.33258056640625, 1.381622314453125, 1.4306640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 9.0, 11.0, 15.0, 18.0, 18.0, 15.0, 41.0, 39.0, 44.0, 48.0, 53.0, 50.0, 53.0, 66.0, 66.0, 57.0, 51.0, 41.0, 43.0, 34.0, 42.0, 31.0, 33.0, 24.0, 20.0, 6.0, 12.0, 8.0, 8.0, 8.0, 5.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9775390625, -0.9496307373046875, -0.921722412109375, -0.8938140869140625, -0.86590576171875, -0.8379974365234375, -0.810089111328125, -0.7821807861328125, -0.7542724609375, -0.7263641357421875, -0.698455810546875, -0.6705474853515625, -0.64263916015625, -0.6147308349609375, -0.586822509765625, -0.5589141845703125, -0.531005859375, -0.5030975341796875, -0.475189208984375, -0.4472808837890625, -0.41937255859375, -0.3914642333984375, -0.363555908203125, -0.3356475830078125, -0.3077392578125, -0.2798309326171875, -0.251922607421875, -0.2240142822265625, -0.19610595703125, -0.1681976318359375, -0.140289306640625, -0.1123809814453125, -0.08447265625, -0.0565643310546875, -0.028656005859375, -0.0007476806640625, 0.02716064453125, 0.0550689697265625, 0.082977294921875, 0.1108856201171875, 0.1387939453125, 0.1667022705078125, 0.194610595703125, 0.2225189208984375, 0.25042724609375, 0.2783355712890625, 0.306243896484375, 0.3341522216796875, 0.362060546875, 0.3899688720703125, 0.417877197265625, 0.4457855224609375, 0.47369384765625, 0.5016021728515625, 0.529510498046875, 0.5574188232421875, 0.5853271484375, 0.6132354736328125, 0.641143798828125, 0.6690521240234375, 0.69696044921875, 0.7248687744140625, 0.752777099609375, 0.7806854248046875, 0.80859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 5.0, 2.0, 11.0, 10.0, 16.0, 26.0, 20.0, 31.0, 51.0, 84.0, 109.0, 183.0, 250.0, 415.0, 785.0, 1844.0, 6343.0, 44713.0, 653082.0, 310268.0, 23059.0, 4076.0, 1407.0, 649.0, 379.0, 228.0, 166.0, 99.0, 63.0, 41.0, 40.0, 28.0, 16.0, 13.0, 13.0, 10.0, 12.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.921875, -5.74163818359375, -5.5614013671875, -5.38116455078125, -5.200927734375, -5.02069091796875, -4.8404541015625, -4.66021728515625, -4.47998046875, -4.29974365234375, -4.1195068359375, -3.93927001953125, -3.759033203125, -3.57879638671875, -3.3985595703125, -3.21832275390625, -3.0380859375, -2.85784912109375, -2.6776123046875, -2.49737548828125, -2.317138671875, -2.13690185546875, -1.9566650390625, -1.77642822265625, -1.59619140625, -1.41595458984375, -1.2357177734375, -1.05548095703125, -0.875244140625, -0.69500732421875, -0.5147705078125, -0.33453369140625, -0.154296875, 0.02593994140625, 0.2061767578125, 0.38641357421875, 0.566650390625, 0.74688720703125, 0.9271240234375, 1.10736083984375, 1.28759765625, 1.46783447265625, 1.6480712890625, 1.82830810546875, 2.008544921875, 2.18878173828125, 2.3690185546875, 2.54925537109375, 2.7294921875, 2.90972900390625, 3.0899658203125, 3.27020263671875, 3.450439453125, 3.63067626953125, 3.8109130859375, 3.99114990234375, 4.17138671875, 4.35162353515625, 4.5318603515625, 4.71209716796875, 4.892333984375, 5.07257080078125, 5.2528076171875, 5.43304443359375, 5.61328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 9.0, 7.0, 14.0, 17.0, 10.0, 17.0, 19.0, 24.0, 24.0, 28.0, 31.0, 34.0, 27.0, 27.0, 28.0, 27.0, 28.0, 54.0, 48.0, 38.0, 56.0, 36.0, 67.0, 31.0, 37.0, 42.0, 28.0, 30.0, 22.0, 24.0, 18.0, 16.0, 15.0, 13.0, 5.0, 9.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.8515625, -3.7242431640625, -3.596923828125, -3.4696044921875, -3.34228515625, -3.2149658203125, -3.087646484375, -2.9603271484375, -2.8330078125, -2.7056884765625, -2.578369140625, -2.4510498046875, -2.32373046875, -2.1964111328125, -2.069091796875, -1.9417724609375, -1.814453125, -1.6871337890625, -1.559814453125, -1.4324951171875, -1.30517578125, -1.1778564453125, -1.050537109375, -0.9232177734375, -0.7958984375, -0.6685791015625, -0.541259765625, -0.4139404296875, -0.28662109375, -0.1593017578125, -0.031982421875, 0.0953369140625, 0.22265625, 0.3499755859375, 0.477294921875, 0.6046142578125, 0.73193359375, 0.8592529296875, 0.986572265625, 1.1138916015625, 1.2412109375, 1.3685302734375, 1.495849609375, 1.6231689453125, 1.75048828125, 1.8778076171875, 2.005126953125, 2.1324462890625, 2.259765625, 2.3870849609375, 2.514404296875, 2.6417236328125, 2.76904296875, 2.8963623046875, 3.023681640625, 3.1510009765625, 3.2783203125, 3.4056396484375, 3.532958984375, 3.6602783203125, 3.78759765625, 3.9149169921875, 4.042236328125, 4.1695556640625, 4.296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 8.0, 12.0, 16.0, 29.0, 31.0, 50.0, 93.0, 129.0, 253.0, 517.0, 1328.0, 4218.0, 19709.0, 186595.0, 752848.0, 68026.0, 10343.0, 2560.0, 867.0, 375.0, 205.0, 134.0, 70.0, 42.0, 27.0, 25.0, 12.0, 2.0, 5.0, 2.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.57421875, -2.4832763671875, -2.392333984375, -2.3013916015625, -2.21044921875, -2.1195068359375, -2.028564453125, -1.9376220703125, -1.8466796875, -1.7557373046875, -1.664794921875, -1.5738525390625, -1.48291015625, -1.3919677734375, -1.301025390625, -1.2100830078125, -1.119140625, -1.0281982421875, -0.937255859375, -0.8463134765625, -0.75537109375, -0.6644287109375, -0.573486328125, -0.4825439453125, -0.3916015625, -0.3006591796875, -0.209716796875, -0.1187744140625, -0.02783203125, 0.0631103515625, 0.154052734375, 0.2449951171875, 0.3359375, 0.4268798828125, 0.517822265625, 0.6087646484375, 0.69970703125, 0.7906494140625, 0.881591796875, 0.9725341796875, 1.0634765625, 1.1544189453125, 1.245361328125, 1.3363037109375, 1.42724609375, 1.5181884765625, 1.609130859375, 1.7000732421875, 1.791015625, 1.8819580078125, 1.972900390625, 2.0638427734375, 2.15478515625, 2.2457275390625, 2.336669921875, 2.4276123046875, 2.5185546875, 2.6094970703125, 2.700439453125, 2.7913818359375, 2.88232421875, 2.9732666015625, 3.064208984375, 3.1551513671875, 3.24609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 10.0, 9.0, 5.0, 5.0, 11.0, 10.0, 9.0, 15.0, 31.0, 54.0, 50.0, 62.0, 90.0, 110.0, 104.0, 96.0, 82.0, 57.0, 51.0, 29.0, 23.0, 22.0, 19.0, 6.0, 10.0, 5.0, 7.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003294944763183594, -0.0003188997507095337, -0.000308305025100708, -0.0002977102994918823, -0.00028711557388305664, -0.00027652084827423096, -0.0002659261226654053, -0.0002553313970565796, -0.0002447366714477539, -0.00023414194583892822, -0.00022354722023010254, -0.00021295249462127686, -0.00020235776901245117, -0.0001917630434036255, -0.0001811683177947998, -0.00017057359218597412, -0.00015997886657714844, -0.00014938414096832275, -0.00013878941535949707, -0.0001281946897506714, -0.0001175999641418457, -0.00010700523853302002, -9.641051292419434e-05, -8.581578731536865e-05, -7.522106170654297e-05, -6.462633609771729e-05, -5.40316104888916e-05, -4.343688488006592e-05, -3.2842159271240234e-05, -2.224743366241455e-05, -1.1652708053588867e-05, -1.0579824447631836e-06, 9.5367431640625e-06, 2.0131468772888184e-05, 3.072619438171387e-05, 4.132091999053955e-05, 5.1915645599365234e-05, 6.251037120819092e-05, 7.31050968170166e-05, 8.369982242584229e-05, 9.429454803466797e-05, 0.00010488927364349365, 0.00011548399925231934, 0.00012607872486114502, 0.0001366734504699707, 0.0001472681760787964, 0.00015786290168762207, 0.00016845762729644775, 0.00017905235290527344, 0.00018964707851409912, 0.0002002418041229248, 0.0002108365297317505, 0.00022143125534057617, 0.00023202598094940186, 0.00024262070655822754, 0.0002532154321670532, 0.0002638101577758789, 0.0002744048833847046, 0.0002849996089935303, 0.00029559433460235596, 0.00030618906021118164, 0.0003167837858200073, 0.000327378511428833, 0.0003379732370376587, 0.0003485679626464844]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 16.0, 15.0, 28.0, 50.0, 105.0, 144.0, 365.0, 736.0, 2047.0, 10140.0, 121744.0, 843220.0, 60217.0, 6815.0, 1599.0, 613.0, 280.0, 181.0, 87.0, 43.0, 30.0, 30.0, 11.0, 9.0, 6.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.49224853515625, -3.3809814453125, -3.26971435546875, -3.158447265625, -3.04718017578125, -2.9359130859375, -2.82464599609375, -2.71337890625, -2.60211181640625, -2.4908447265625, -2.37957763671875, -2.268310546875, -2.15704345703125, -2.0457763671875, -1.93450927734375, -1.8232421875, -1.71197509765625, -1.6007080078125, -1.48944091796875, -1.378173828125, -1.26690673828125, -1.1556396484375, -1.04437255859375, -0.93310546875, -0.82183837890625, -0.7105712890625, -0.59930419921875, -0.488037109375, -0.37677001953125, -0.2655029296875, -0.15423583984375, -0.04296875, 0.06829833984375, 0.1795654296875, 0.29083251953125, 0.402099609375, 0.51336669921875, 0.6246337890625, 0.73590087890625, 0.84716796875, 0.95843505859375, 1.0697021484375, 1.18096923828125, 1.292236328125, 1.40350341796875, 1.5147705078125, 1.62603759765625, 1.7373046875, 1.84857177734375, 1.9598388671875, 2.07110595703125, 2.182373046875, 2.29364013671875, 2.4049072265625, 2.51617431640625, 2.62744140625, 2.73870849609375, 2.8499755859375, 2.96124267578125, 3.072509765625, 3.18377685546875, 3.2950439453125, 3.40631103515625, 3.517578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 9.0, 12.0, 14.0, 17.0, 20.0, 37.0, 52.0, 68.0, 76.0, 105.0, 94.0, 99.0, 100.0, 72.0, 64.0, 48.0, 35.0, 23.0, 11.0, 12.0, 15.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7562103271484375, -1.691131591796875, -1.6260528564453125, -1.56097412109375, -1.4958953857421875, -1.430816650390625, -1.3657379150390625, -1.3006591796875, -1.2355804443359375, -1.170501708984375, -1.1054229736328125, -1.04034423828125, -0.9752655029296875, -0.910186767578125, -0.8451080322265625, -0.780029296875, -0.7149505615234375, -0.649871826171875, -0.5847930908203125, -0.51971435546875, -0.4546356201171875, -0.389556884765625, -0.3244781494140625, -0.2593994140625, -0.1943206787109375, -0.129241943359375, -0.0641632080078125, 0.00091552734375, 0.0659942626953125, 0.131072998046875, 0.1961517333984375, 0.26123046875, 0.3263092041015625, 0.391387939453125, 0.4564666748046875, 0.52154541015625, 0.5866241455078125, 0.651702880859375, 0.7167816162109375, 0.7818603515625, 0.8469390869140625, 0.912017822265625, 0.9770965576171875, 1.04217529296875, 1.1072540283203125, 1.172332763671875, 1.2374114990234375, 1.302490234375, 1.3675689697265625, 1.432647705078125, 1.4977264404296875, 1.56280517578125, 1.6278839111328125, 1.692962646484375, 1.7580413818359375, 1.8231201171875, 1.8881988525390625, 1.953277587890625, 2.0183563232421875, 2.08343505859375, 2.1485137939453125, 2.213592529296875, 2.2786712646484375, 2.34375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 10.0, 42.0, 142.0, 303.0, 317.0, 146.0, 34.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.16486358642578, -83.83296966552734, -81.50108337402344, -79.169189453125, -76.83729553222656, -74.50540161132812, -72.17351531982422, -69.84162139892578, -67.50973510742188, -65.17784118652344, -62.845951080322266, -60.514060974121094, -58.182167053222656, -55.850276947021484, -53.51838684082031, -51.186492919921875, -48.85459899902344, -46.522708892822266, -44.19081497192383, -41.858924865722656, -39.52703094482422, -37.19514083862305, -34.863250732421875, -32.53135681152344, -30.199466705322266, -27.86757469177246, -25.535682678222656, -23.203792572021484, -20.87190055847168, -18.540008544921875, -16.208118438720703, -13.876226425170898, -11.544342041015625, -9.21245002746582, -6.880558967590332, -4.5486674308776855, -2.216775894165039, 0.11511611938476562, 2.447007179260254, 4.778898239135742, 7.110790252685547, 9.442682266235352, 11.77457332611084, 14.106464385986328, 16.438356399536133, 18.770248413085938, 21.10213851928711, 23.434030532836914, 25.76592254638672, 28.097814559936523, 30.429706573486328, 32.7615966796875, 35.09349060058594, 37.42538070678711, 39.75727081298828, 42.08916473388672, 44.42105484008789, 46.75294494628906, 49.0848388671875, 51.41672897338867, 53.748619079589844, 56.08051300048828, 58.41240310668945, 60.744293212890625, 63.07618713378906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 14.0, 8.0, 9.0, 13.0, 18.0, 20.0, 37.0, 27.0, 22.0, 29.0, 34.0, 37.0, 44.0, 42.0, 43.0, 53.0, 48.0, 48.0, 48.0, 48.0, 41.0, 33.0, 34.0, 29.0, 28.0, 28.0, 32.0, 16.0, 14.0, 22.0, 11.0, 7.0, 9.0, 12.0, 6.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-19.65219497680664, -19.099414825439453, -18.5466365814209, -17.99385643005371, -17.441078186035156, -16.88829803466797, -16.335519790649414, -15.782739639282227, -15.229960441589355, -14.677181243896484, -14.124402046203613, -13.571622848510742, -13.018842697143555, -12.466064453125, -11.913284301757812, -11.360505104064941, -10.80772590637207, -10.2549467086792, -9.702167510986328, -9.149388313293457, -8.596609115600586, -8.043828964233398, -7.491049766540527, -6.938270568847656, -6.385491371154785, -5.832712173461914, -5.279932975769043, -4.727153301239014, -4.174374103546143, -3.6215949058532715, -3.0688154697418213, -2.516036033630371, -1.9632558822631836, -1.410476565361023, -0.8576972484588623, -0.30491793155670166, 0.24786138534545898, 0.8006405830383301, 1.3534200191497803, 1.9061994552612305, 2.4589786529541016, 3.0117578506469727, 3.564537286758423, 4.117316722869873, 4.670095920562744, 5.222875118255615, 5.7756547927856445, 6.328433990478516, 6.881213188171387, 7.433992385864258, 7.986771583557129, 8.53955078125, 9.092330932617188, 9.645109176635742, 10.19788932800293, 10.7506685256958, 11.303447723388672, 11.856226921081543, 12.409006118774414, 12.961785316467285, 13.514564514160156, 14.067344665527344, 14.620123863220215, 15.172903060913086, 15.725682258605957]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 2.0, 6.0, 2.0, 5.0, 1.0, 9.0, 14.0, 12.0, 15.0, 19.0, 27.0, 31.0, 41.0, 56.0, 84.0, 133.0, 228.0, 433.0, 801.0, 1695.0, 4509.0, 22871.0, 4143671.0, 13188.0, 3370.0, 1377.0, 652.0, 357.0, 247.0, 115.0, 94.0, 61.0, 49.0, 25.0, 22.0, 11.0, 8.0, 11.0, 7.0, 4.0, 2.0, 5.0, 4.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.02490234375, -8.7373046875, -8.44970703125, -8.162109375, -7.87451171875, -7.5869140625, -7.29931640625, -7.01171875, -6.72412109375, -6.4365234375, -6.14892578125, -5.861328125, -5.57373046875, -5.2861328125, -4.99853515625, -4.7109375, -4.42333984375, -4.1357421875, -3.84814453125, -3.560546875, -3.27294921875, -2.9853515625, -2.69775390625, -2.41015625, -2.12255859375, -1.8349609375, -1.54736328125, -1.259765625, -0.97216796875, -0.6845703125, -0.39697265625, -0.109375, 0.17822265625, 0.4658203125, 0.75341796875, 1.041015625, 1.32861328125, 1.6162109375, 1.90380859375, 2.19140625, 2.47900390625, 2.7666015625, 3.05419921875, 3.341796875, 3.62939453125, 3.9169921875, 4.20458984375, 4.4921875, 4.77978515625, 5.0673828125, 5.35498046875, 5.642578125, 5.93017578125, 6.2177734375, 6.50537109375, 6.79296875, 7.08056640625, 7.3681640625, 7.65576171875, 7.943359375, 8.23095703125, 8.5185546875, 8.80615234375, 9.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 9.0, 7.0, 4.0, 10.0, 21.0, 19.0, 22.0, 36.0, 45.0, 61.0, 52.0, 48.0, 61.0, 73.0, 76.0, 68.0, 54.0, 54.0, 42.0, 54.0, 38.0, 30.0, 31.0, 19.0, 9.0, 12.0, 8.0, 11.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.1875, -1.1547012329101562, -1.1219024658203125, -1.0891036987304688, -1.056304931640625, -1.0235061645507812, -0.9907073974609375, -0.9579086303710938, -0.92510986328125, -0.8923110961914062, -0.8595123291015625, -0.8267135620117188, -0.793914794921875, -0.7611160278320312, -0.7283172607421875, -0.6955184936523438, -0.6627197265625, -0.6299209594726562, -0.5971221923828125, -0.5643234252929688, -0.531524658203125, -0.49872589111328125, -0.4659271240234375, -0.43312835693359375, -0.40032958984375, -0.36753082275390625, -0.3347320556640625, -0.30193328857421875, -0.269134521484375, -0.23633575439453125, -0.2035369873046875, -0.17073822021484375, -0.137939453125, -0.10514068603515625, -0.0723419189453125, -0.03954315185546875, -0.006744384765625, 0.02605438232421875, 0.0588531494140625, 0.09165191650390625, 0.12445068359375, 0.15724945068359375, 0.1900482177734375, 0.22284698486328125, 0.255645751953125, 0.28844451904296875, 0.3212432861328125, 0.35404205322265625, 0.3868408203125, 0.41963958740234375, 0.4524383544921875, 0.48523712158203125, 0.518035888671875, 0.5508346557617188, 0.5836334228515625, 0.6164321899414062, 0.64923095703125, 0.6820297241210938, 0.7148284912109375, 0.7476272583007812, 0.780426025390625, 0.8132247924804688, 0.8460235595703125, 0.8788223266601562, 0.91162109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 3.0, 5.0, 17.0, 19.0, 34.0, 43.0, 72.0, 111.0, 157.0, 298.0, 450.0, 794.0, 1426.0, 2714.0, 5725.0, 17220.0, 4083967.0, 63063.0, 9486.0, 3984.0, 2020.0, 1099.0, 604.0, 384.0, 195.0, 142.0, 87.0, 59.0, 33.0, 21.0, 19.0, 5.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.00872802734375, -4.8065185546875, -4.60430908203125, -4.402099609375, -4.19989013671875, -3.9976806640625, -3.79547119140625, -3.59326171875, -3.39105224609375, -3.1888427734375, -2.98663330078125, -2.784423828125, -2.58221435546875, -2.3800048828125, -2.17779541015625, -1.9755859375, -1.77337646484375, -1.5711669921875, -1.36895751953125, -1.166748046875, -0.96453857421875, -0.7623291015625, -0.56011962890625, -0.35791015625, -0.15570068359375, 0.0465087890625, 0.24871826171875, 0.450927734375, 0.65313720703125, 0.8553466796875, 1.05755615234375, 1.259765625, 1.46197509765625, 1.6641845703125, 1.86639404296875, 2.068603515625, 2.27081298828125, 2.4730224609375, 2.67523193359375, 2.87744140625, 3.07965087890625, 3.2818603515625, 3.48406982421875, 3.686279296875, 3.88848876953125, 4.0906982421875, 4.29290771484375, 4.4951171875, 4.69732666015625, 4.8995361328125, 5.10174560546875, 5.303955078125, 5.50616455078125, 5.7083740234375, 5.91058349609375, 6.11279296875, 6.31500244140625, 6.5172119140625, 6.71942138671875, 6.921630859375, 7.12384033203125, 7.3260498046875, 7.52825927734375, 7.73046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 8.0, 14.0, 20.0, 57.0, 3651.0, 233.0, 32.0, 17.0, 10.0, 3.0, 6.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.098388671875, -1.05419921875, -1.010009765625, -0.9658203125, -0.921630859375, -0.87744140625, -0.833251953125, -0.7890625, -0.744873046875, -0.70068359375, -0.656494140625, -0.6123046875, -0.568115234375, -0.52392578125, -0.479736328125, -0.435546875, -0.391357421875, -0.34716796875, -0.302978515625, -0.2587890625, -0.214599609375, -0.17041015625, -0.126220703125, -0.08203125, -0.037841796875, 0.00634765625, 0.050537109375, 0.0947265625, 0.138916015625, 0.18310546875, 0.227294921875, 0.271484375, 0.315673828125, 0.35986328125, 0.404052734375, 0.4482421875, 0.492431640625, 0.53662109375, 0.580810546875, 0.625, 0.669189453125, 0.71337890625, 0.757568359375, 0.8017578125, 0.845947265625, 0.89013671875, 0.934326171875, 0.978515625, 1.022705078125, 1.06689453125, 1.111083984375, 1.1552734375, 1.199462890625, 1.24365234375, 1.287841796875, 1.33203125, 1.376220703125, 1.42041015625, 1.464599609375, 1.5087890625, 1.552978515625, 1.59716796875, 1.641357421875, 1.685546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 20.0, 24.0, 33.0, 100.0, 161.0, 223.0, 183.0, 117.0, 68.0, 41.0, 14.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.823406219482422, -6.585963726043701, -6.3485212326049805, -6.11107873916626, -5.873636245727539, -5.636194229125977, -5.398751735687256, -5.161309242248535, -4.9238667488098145, -4.686424255371094, -4.448981761932373, -4.211539268493652, -3.9740970134735107, -3.73665452003479, -3.4992122650146484, -3.2617697715759277, -3.024327278137207, -2.7868847846984863, -2.5494422912597656, -2.312000036239624, -2.0745575428009033, -1.8371150493621826, -1.5996726751327515, -1.3622303009033203, -1.1247878074645996, -0.8873453736305237, -0.6499029397964478, -0.4124605059623718, -0.1750180721282959, 0.062424421310424805, 0.29986679553985596, 0.5373091697692871, 0.7747516632080078, 1.0121941566467285, 1.2496365308761597, 1.4870789051055908, 1.7245213985443115, 1.9619638919830322, 2.199406147003174, 2.4368486404418945, 2.6742911338806152, 2.911733627319336, 3.1491761207580566, 3.3866183757781982, 3.624060869216919, 3.8615033626556396, 4.098945617675781, 4.336388111114502, 4.573830604553223, 4.811273097991943, 5.048715591430664, 5.286158084869385, 5.5236005783081055, 5.761042594909668, 5.998485088348389, 6.235927581787109, 6.47337007522583, 6.710812568664551, 6.9482550621032715, 7.185697555541992, 7.423139572143555, 7.660582542419434, 7.898024559020996, 8.135467529296875, 8.372909545898438]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 5.0, 10.0, 6.0, 2.0, 12.0, 8.0, 15.0, 15.0, 18.0, 23.0, 29.0, 32.0, 35.0, 26.0, 34.0, 37.0, 38.0, 36.0, 35.0, 47.0, 38.0, 37.0, 51.0, 45.0, 49.0, 43.0, 35.0, 30.0, 29.0, 30.0, 26.0, 21.0, 21.0, 15.0, 18.0, 8.0, 10.0, 8.0, 7.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2664427757263184, -2.194556474685669, -2.1226701736450195, -2.05078387260437, -1.9788975715637207, -1.9070112705230713, -1.8351248502731323, -1.763238549232483, -1.6913522481918335, -1.619465947151184, -1.5475796461105347, -1.4756933450698853, -1.4038069248199463, -1.3319206237792969, -1.2600343227386475, -1.188148021697998, -1.1162617206573486, -1.0443754196166992, -0.9724891185760498, -0.9006027579307556, -0.8287164568901062, -0.7568301558494568, -0.6849437952041626, -0.6130574941635132, -0.5411711931228638, -0.46928489208221436, -0.39739856123924255, -0.32551223039627075, -0.25362592935562134, -0.18173962831497192, -0.10985329747200012, -0.03796696662902832, 0.03391909599304199, 0.1058054119348526, 0.1776917278766632, 0.24957804381847382, 0.3214643597602844, 0.39335066080093384, 0.46523699164390564, 0.5371233224868774, 0.6090096235275269, 0.6808959245681763, 0.7527822256088257, 0.8246685862541199, 0.8965548872947693, 0.9684411883354187, 1.040327548980713, 1.1122138500213623, 1.1841001510620117, 1.2559864521026611, 1.3278727531433105, 1.39975905418396, 1.4716453552246094, 1.5435316562652588, 1.6154180765151978, 1.6873043775558472, 1.7591906785964966, 1.831076979637146, 1.9029632806777954, 1.9748495817184448, 2.046736001968384, 2.118622303009033, 2.1905086040496826, 2.262394905090332, 2.3342812061309814]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 16.0, 19.0, 20.0, 33.0, 47.0, 62.0, 113.0, 185.0, 327.0, 546.0, 939.0, 1653.0, 3120.0, 5899.0, 12354.0, 26730.0, 64542.0, 174662.0, 402337.0, 216527.0, 77657.0, 31900.0, 14276.0, 6733.0, 3377.0, 1887.0, 1074.0, 577.0, 365.0, 204.0, 129.0, 77.0, 55.0, 34.0, 30.0, 12.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.654296875, -1.6019439697265625, -1.549591064453125, -1.4972381591796875, -1.44488525390625, -1.3925323486328125, -1.340179443359375, -1.2878265380859375, -1.2354736328125, -1.1831207275390625, -1.130767822265625, -1.0784149169921875, -1.02606201171875, -0.9737091064453125, -0.921356201171875, -0.8690032958984375, -0.816650390625, -0.7642974853515625, -0.711944580078125, -0.6595916748046875, -0.60723876953125, -0.5548858642578125, -0.502532958984375, -0.4501800537109375, -0.3978271484375, -0.3454742431640625, -0.293121337890625, -0.2407684326171875, -0.18841552734375, -0.1360626220703125, -0.083709716796875, -0.0313568115234375, 0.02099609375, 0.0733489990234375, 0.125701904296875, 0.1780548095703125, 0.23040771484375, 0.2827606201171875, 0.335113525390625, 0.3874664306640625, 0.4398193359375, 0.4921722412109375, 0.544525146484375, 0.5968780517578125, 0.64923095703125, 0.7015838623046875, 0.753936767578125, 0.8062896728515625, 0.858642578125, 0.9109954833984375, 0.963348388671875, 1.0157012939453125, 1.06805419921875, 1.1204071044921875, 1.172760009765625, 1.2251129150390625, 1.2774658203125, 1.3298187255859375, 1.382171630859375, 1.4345245361328125, 1.48687744140625, 1.5392303466796875, 1.591583251953125, 1.6439361572265625, 1.6962890625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 16.0, 14.0, 28.0, 33.0, 33.0, 31.0, 63.0, 57.0, 54.0, 71.0, 62.0, 73.0, 64.0, 49.0, 51.0, 47.0, 52.0, 33.0, 31.0, 20.0, 21.0, 17.0, 16.0, 9.0, 8.0, 5.0, 9.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.23828125, -1.2020721435546875, -1.165863037109375, -1.1296539306640625, -1.09344482421875, -1.0572357177734375, -1.021026611328125, -0.9848175048828125, -0.9486083984375, -0.9123992919921875, -0.876190185546875, -0.8399810791015625, -0.80377197265625, -0.7675628662109375, -0.731353759765625, -0.6951446533203125, -0.658935546875, -0.6227264404296875, -0.586517333984375, -0.5503082275390625, -0.51409912109375, -0.4778900146484375, -0.441680908203125, -0.4054718017578125, -0.3692626953125, -0.3330535888671875, -0.296844482421875, -0.2606353759765625, -0.22442626953125, -0.1882171630859375, -0.152008056640625, -0.1157989501953125, -0.07958984375, -0.0433807373046875, -0.007171630859375, 0.0290374755859375, 0.06524658203125, 0.1014556884765625, 0.137664794921875, 0.1738739013671875, 0.2100830078125, 0.2462921142578125, 0.282501220703125, 0.3187103271484375, 0.35491943359375, 0.3911285400390625, 0.427337646484375, 0.4635467529296875, 0.499755859375, 0.5359649658203125, 0.572174072265625, 0.6083831787109375, 0.64459228515625, 0.6808013916015625, 0.717010498046875, 0.7532196044921875, 0.7894287109375, 0.8256378173828125, 0.861846923828125, 0.8980560302734375, 0.93426513671875, 0.9704742431640625, 1.006683349609375, 1.0428924560546875, 1.0791015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 9.0, 8.0, 9.0, 20.0, 25.0, 34.0, 55.0, 80.0, 120.0, 215.0, 472.0, 1008.0, 3433.0, 38161.0, 937500.0, 60927.0, 4170.0, 1170.0, 495.0, 245.0, 142.0, 90.0, 56.0, 34.0, 26.0, 19.0, 16.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6640625, -8.445068359375, -8.22607421875, -8.007080078125, -7.7880859375, -7.569091796875, -7.35009765625, -7.131103515625, -6.912109375, -6.693115234375, -6.47412109375, -6.255126953125, -6.0361328125, -5.817138671875, -5.59814453125, -5.379150390625, -5.16015625, -4.941162109375, -4.72216796875, -4.503173828125, -4.2841796875, -4.065185546875, -3.84619140625, -3.627197265625, -3.408203125, -3.189208984375, -2.97021484375, -2.751220703125, -2.5322265625, -2.313232421875, -2.09423828125, -1.875244140625, -1.65625, -1.437255859375, -1.21826171875, -0.999267578125, -0.7802734375, -0.561279296875, -0.34228515625, -0.123291015625, 0.095703125, 0.314697265625, 0.53369140625, 0.752685546875, 0.9716796875, 1.190673828125, 1.40966796875, 1.628662109375, 1.84765625, 2.066650390625, 2.28564453125, 2.504638671875, 2.7236328125, 2.942626953125, 3.16162109375, 3.380615234375, 3.599609375, 3.818603515625, 4.03759765625, 4.256591796875, 4.4755859375, 4.694580078125, 4.91357421875, 5.132568359375, 5.3515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 6.0, 16.0, 13.0, 9.0, 16.0, 15.0, 24.0, 23.0, 34.0, 34.0, 51.0, 45.0, 47.0, 42.0, 56.0, 46.0, 49.0, 60.0, 61.0, 51.0, 44.0, 33.0, 37.0, 27.0, 21.0, 24.0, 22.0, 16.0, 16.0, 13.0, 9.0, 5.0, 7.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.16851806640625, -5.0167236328125, -4.86492919921875, -4.713134765625, -4.56134033203125, -4.4095458984375, -4.25775146484375, -4.10595703125, -3.95416259765625, -3.8023681640625, -3.65057373046875, -3.498779296875, -3.34698486328125, -3.1951904296875, -3.04339599609375, -2.8916015625, -2.73980712890625, -2.5880126953125, -2.43621826171875, -2.284423828125, -2.13262939453125, -1.9808349609375, -1.82904052734375, -1.67724609375, -1.52545166015625, -1.3736572265625, -1.22186279296875, -1.070068359375, -0.91827392578125, -0.7664794921875, -0.61468505859375, -0.462890625, -0.31109619140625, -0.1593017578125, -0.00750732421875, 0.144287109375, 0.29608154296875, 0.4478759765625, 0.59967041015625, 0.75146484375, 0.90325927734375, 1.0550537109375, 1.20684814453125, 1.358642578125, 1.51043701171875, 1.6622314453125, 1.81402587890625, 1.9658203125, 2.11761474609375, 2.2694091796875, 2.42120361328125, 2.572998046875, 2.72479248046875, 2.8765869140625, 3.02838134765625, 3.18017578125, 3.33197021484375, 3.4837646484375, 3.63555908203125, 3.787353515625, 3.93914794921875, 4.0909423828125, 4.24273681640625, 4.39453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 8.0, 9.0, 14.0, 19.0, 18.0, 43.0, 68.0, 110.0, 169.0, 275.0, 559.0, 957.0, 2342.0, 7937.0, 50829.0, 719802.0, 238022.0, 19697.0, 4296.0, 1603.0, 748.0, 366.0, 215.0, 138.0, 84.0, 52.0, 43.0, 22.0, 28.0, 22.0, 13.0, 4.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.314453125, -2.2479095458984375, -2.181365966796875, -2.1148223876953125, -2.04827880859375, -1.9817352294921875, -1.915191650390625, -1.8486480712890625, -1.7821044921875, -1.7155609130859375, -1.649017333984375, -1.5824737548828125, -1.51593017578125, -1.4493865966796875, -1.382843017578125, -1.3162994384765625, -1.249755859375, -1.1832122802734375, -1.116668701171875, -1.0501251220703125, -0.98358154296875, -0.9170379638671875, -0.850494384765625, -0.7839508056640625, -0.7174072265625, -0.6508636474609375, -0.584320068359375, -0.5177764892578125, -0.45123291015625, -0.3846893310546875, -0.318145751953125, -0.2516021728515625, -0.18505859375, -0.1185150146484375, -0.051971435546875, 0.0145721435546875, 0.08111572265625, 0.1476593017578125, 0.214202880859375, 0.2807464599609375, 0.3472900390625, 0.4138336181640625, 0.480377197265625, 0.5469207763671875, 0.61346435546875, 0.6800079345703125, 0.746551513671875, 0.8130950927734375, 0.879638671875, 0.9461822509765625, 1.012725830078125, 1.0792694091796875, 1.14581298828125, 1.2123565673828125, 1.278900146484375, 1.3454437255859375, 1.4119873046875, 1.4785308837890625, 1.545074462890625, 1.6116180419921875, 1.67816162109375, 1.7447052001953125, 1.811248779296875, 1.8777923583984375, 1.9443359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 12.0, 8.0, 21.0, 22.0, 23.0, 47.0, 68.0, 98.0, 135.0, 165.0, 126.0, 84.0, 49.0, 36.0, 26.0, 18.0, 14.0, 13.0, 8.0, 9.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003724098205566406, -0.00036339089274406433, -0.00035437196493148804, -0.00034535303711891174, -0.00033633410930633545, -0.00032731518149375916, -0.00031829625368118286, -0.00030927732586860657, -0.0003002583980560303, -0.000291239470243454, -0.0002822205424308777, -0.0002732016146183014, -0.0002641826868057251, -0.0002551637589931488, -0.0002461448311805725, -0.00023712590336799622, -0.00022810697555541992, -0.00021908804774284363, -0.00021006911993026733, -0.00020105019211769104, -0.00019203126430511475, -0.00018301233649253845, -0.00017399340867996216, -0.00016497448086738586, -0.00015595555305480957, -0.00014693662524223328, -0.00013791769742965698, -0.0001288987696170807, -0.0001198798418045044, -0.0001108609139919281, -0.0001018419861793518, -9.282305836677551e-05, -8.380413055419922e-05, -7.478520274162292e-05, -6.576627492904663e-05, -5.674734711647034e-05, -4.772841930389404e-05, -3.870949149131775e-05, -2.9690563678741455e-05, -2.067163586616516e-05, -1.1652708053588867e-05, -2.6337802410125732e-06, 6.385147571563721e-06, 1.5404075384140015e-05, 2.442300319671631e-05, 3.34419310092926e-05, 4.2460858821868896e-05, 5.147978663444519e-05, 6.0498714447021484e-05, 6.951764225959778e-05, 7.853657007217407e-05, 8.755549788475037e-05, 9.657442569732666e-05, 0.00010559335350990295, 0.00011461228132247925, 0.00012363120913505554, 0.00013265013694763184, 0.00014166906476020813, 0.00015068799257278442, 0.00015970692038536072, 0.000168725848197937, 0.0001777447760105133, 0.0001867637038230896, 0.0001957826316356659, 0.0002048015594482422]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 20.0, 31.0, 42.0, 90.0, 145.0, 299.0, 686.0, 2114.0, 11612.0, 273268.0, 731363.0, 23990.0, 3139.0, 931.0, 370.0, 177.0, 86.0, 68.0, 33.0, 20.0, 19.0, 9.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.932586669921875, -2.83197021484375, -2.731353759765625, -2.6307373046875, -2.530120849609375, -2.42950439453125, -2.328887939453125, -2.228271484375, -2.127655029296875, -2.02703857421875, -1.926422119140625, -1.8258056640625, -1.725189208984375, -1.62457275390625, -1.523956298828125, -1.42333984375, -1.322723388671875, -1.22210693359375, -1.121490478515625, -1.0208740234375, -0.920257568359375, -0.81964111328125, -0.719024658203125, -0.618408203125, -0.517791748046875, -0.41717529296875, -0.316558837890625, -0.2159423828125, -0.115325927734375, -0.01470947265625, 0.085906982421875, 0.1865234375, 0.287139892578125, 0.38775634765625, 0.488372802734375, 0.5889892578125, 0.689605712890625, 0.79022216796875, 0.890838623046875, 0.991455078125, 1.092071533203125, 1.19268798828125, 1.293304443359375, 1.3939208984375, 1.494537353515625, 1.59515380859375, 1.695770263671875, 1.79638671875, 1.897003173828125, 1.99761962890625, 2.098236083984375, 2.1988525390625, 2.299468994140625, 2.40008544921875, 2.500701904296875, 2.601318359375, 2.701934814453125, 2.80255126953125, 2.903167724609375, 3.0037841796875, 3.104400634765625, 3.20501708984375, 3.305633544921875, 3.40625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 7.0, 20.0, 24.0, 31.0, 34.0, 48.0, 62.0, 87.0, 110.0, 128.0, 108.0, 91.0, 63.0, 52.0, 44.0, 28.0, 12.0, 14.0, 8.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.923828125, -1.85394287109375, -1.7840576171875, -1.71417236328125, -1.644287109375, -1.57440185546875, -1.5045166015625, -1.43463134765625, -1.36474609375, -1.29486083984375, -1.2249755859375, -1.15509033203125, -1.085205078125, -1.01531982421875, -0.9454345703125, -0.87554931640625, -0.8056640625, -0.73577880859375, -0.6658935546875, -0.59600830078125, -0.526123046875, -0.45623779296875, -0.3863525390625, -0.31646728515625, -0.24658203125, -0.17669677734375, -0.1068115234375, -0.03692626953125, 0.032958984375, 0.10284423828125, 0.1727294921875, 0.24261474609375, 0.3125, 0.38238525390625, 0.4522705078125, 0.52215576171875, 0.592041015625, 0.66192626953125, 0.7318115234375, 0.80169677734375, 0.87158203125, 0.94146728515625, 1.0113525390625, 1.08123779296875, 1.151123046875, 1.22100830078125, 1.2908935546875, 1.36077880859375, 1.4306640625, 1.50054931640625, 1.5704345703125, 1.64031982421875, 1.710205078125, 1.78009033203125, 1.8499755859375, 1.91986083984375, 1.98974609375, 2.05963134765625, 2.1295166015625, 2.19940185546875, 2.269287109375, 2.33917236328125, 2.4090576171875, 2.47894287109375, 2.548828125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 50.0, 136.0, 254.0, 277.0, 156.0, 63.0, 34.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.02540588378906, -48.46538543701172, -46.905364990234375, -45.34534454345703, -43.78532409667969, -42.225303649902344, -40.665283203125, -39.105262756347656, -37.54524230957031, -35.98522186279297, -34.425201416015625, -32.86518096923828, -31.305160522460938, -29.745140075683594, -28.18511962890625, -26.625099182128906, -25.065080642700195, -23.50506019592285, -21.945039749145508, -20.385019302368164, -18.82499885559082, -17.264978408813477, -15.70495891571045, -14.144938468933105, -12.584918022155762, -11.024897575378418, -9.464877128601074, -7.904857158660889, -6.344836711883545, -4.784816265106201, -3.2247962951660156, -1.6647758483886719, -0.10475540161132812, 1.455264925956726, 3.0152852535247803, 4.575305461883545, 6.135325908660889, 7.695346355438232, 9.255366325378418, 10.815386772155762, 12.375407218933105, 13.93542766571045, 15.495448112487793, 17.05546760559082, 18.615488052368164, 20.175508499145508, 21.73552894592285, 23.295549392700195, 24.85556983947754, 26.415590286254883, 27.975610733032227, 29.53563117980957, 31.095651626586914, 32.655670166015625, 34.21569061279297, 35.77571105957031, 37.335731506347656, 38.895751953125, 40.455772399902344, 42.01579284667969, 43.57581329345703, 45.135833740234375, 46.69585418701172, 48.25587463378906, 49.815895080566406]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 7.0, 14.0, 16.0, 23.0, 16.0, 24.0, 30.0, 30.0, 35.0, 44.0, 33.0, 37.0, 44.0, 64.0, 56.0, 59.0, 56.0, 49.0, 44.0, 30.0, 51.0, 31.0, 33.0, 22.0, 24.0, 13.0, 18.0, 21.0, 12.0, 14.0, 8.0, 9.0, 8.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.298492431640625, -19.64858055114746, -18.998666763305664, -18.3487548828125, -17.698843002319336, -17.048931121826172, -16.399017333984375, -15.749105453491211, -15.09919261932373, -14.44927978515625, -13.799367904663086, -13.149455070495605, -12.499542236328125, -11.849630355834961, -11.19971752166748, -10.5498046875, -9.899892807006836, -9.249979972839355, -8.600068092346191, -7.950155258178711, -7.300242900848389, -6.650330543518066, -6.000417709350586, -5.350505352020264, -4.700592994689941, -4.050680637359619, -3.4007680416107178, -2.7508554458618164, -2.100943088531494, -1.4510307312011719, -0.8011181354522705, -0.15120553970336914, 0.4987068176269531, 1.148619294166565, 1.7985317707061768, 2.448444366455078, 3.0983567237854004, 3.7482690811157227, 4.398181915283203, 5.048094272613525, 5.698006629943848, 6.34791898727417, 6.997831344604492, 7.647744178771973, 8.297657012939453, 8.947568893432617, 9.597481727600098, 10.247394561767578, 10.897306442260742, 11.547219276428223, 12.197131156921387, 12.847043991088867, 13.496955871582031, 14.146868705749512, 14.796781539916992, 15.446693420410156, 16.096607208251953, 16.746519088745117, 17.396432876586914, 18.046344757080078, 18.696256637573242, 19.346168518066406, 19.996082305908203, 20.645994186401367, 21.29590606689453]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 7.0, 8.0, 21.0, 20.0, 48.0, 36.0, 51.0, 72.0, 137.0, 208.0, 376.0, 693.0, 1420.0, 3039.0, 8448.0, 57313.0, 4083451.0, 27608.0, 6306.0, 2392.0, 1093.0, 600.0, 339.0, 199.0, 113.0, 53.0, 48.0, 47.0, 21.0, 17.0, 13.0, 10.0, 10.0, 6.0, 9.0, 5.0, 7.0, 0.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.05859375, -4.8802490234375, -4.701904296875, -4.5235595703125, -4.34521484375, -4.1668701171875, -3.988525390625, -3.8101806640625, -3.6318359375, -3.4534912109375, -3.275146484375, -3.0968017578125, -2.91845703125, -2.7401123046875, -2.561767578125, -2.3834228515625, -2.205078125, -2.0267333984375, -1.848388671875, -1.6700439453125, -1.49169921875, -1.3133544921875, -1.135009765625, -0.9566650390625, -0.7783203125, -0.5999755859375, -0.421630859375, -0.2432861328125, -0.06494140625, 0.1134033203125, 0.291748046875, 0.4700927734375, 0.6484375, 0.8267822265625, 1.005126953125, 1.1834716796875, 1.36181640625, 1.5401611328125, 1.718505859375, 1.8968505859375, 2.0751953125, 2.2535400390625, 2.431884765625, 2.6102294921875, 2.78857421875, 2.9669189453125, 3.145263671875, 3.3236083984375, 3.501953125, 3.6802978515625, 3.858642578125, 4.0369873046875, 4.21533203125, 4.3936767578125, 4.572021484375, 4.7503662109375, 4.9287109375, 5.1070556640625, 5.285400390625, 5.4637451171875, 5.64208984375, 5.8204345703125, 5.998779296875, 6.1771240234375, 6.35546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 12.0, 12.0, 22.0, 18.0, 30.0, 44.0, 51.0, 56.0, 56.0, 70.0, 86.0, 62.0, 50.0, 66.0, 59.0, 50.0, 64.0, 30.0, 26.0, 17.0, 25.0, 22.0, 11.0, 10.0, 5.0, 4.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.48828125, -1.45233154296875, -1.4163818359375, -1.38043212890625, -1.344482421875, -1.30853271484375, -1.2725830078125, -1.23663330078125, -1.20068359375, -1.16473388671875, -1.1287841796875, -1.09283447265625, -1.056884765625, -1.02093505859375, -0.9849853515625, -0.94903564453125, -0.9130859375, -0.87713623046875, -0.8411865234375, -0.80523681640625, -0.769287109375, -0.73333740234375, -0.6973876953125, -0.66143798828125, -0.62548828125, -0.58953857421875, -0.5535888671875, -0.51763916015625, -0.481689453125, -0.44573974609375, -0.4097900390625, -0.37384033203125, -0.337890625, -0.30194091796875, -0.2659912109375, -0.23004150390625, -0.194091796875, -0.15814208984375, -0.1221923828125, -0.08624267578125, -0.05029296875, -0.01434326171875, 0.0216064453125, 0.05755615234375, 0.093505859375, 0.12945556640625, 0.1654052734375, 0.20135498046875, 0.2373046875, 0.27325439453125, 0.3092041015625, 0.34515380859375, 0.381103515625, 0.41705322265625, 0.4530029296875, 0.48895263671875, 0.52490234375, 0.56085205078125, 0.5968017578125, 0.63275146484375, 0.668701171875, 0.70465087890625, 0.7406005859375, 0.77655029296875, 0.8125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 11.0, 6.0, 10.0, 10.0, 16.0, 20.0, 29.0, 46.0, 97.0, 142.0, 262.0, 461.0, 880.0, 1979.0, 4643.0, 14707.0, 943511.0, 3203770.0, 14842.0, 4757.0, 2008.0, 930.0, 433.0, 273.0, 152.0, 94.0, 66.0, 34.0, 21.0, 18.0, 7.0, 14.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.765625, -4.5584716796875, -4.351318359375, -4.1441650390625, -3.93701171875, -3.7298583984375, -3.522705078125, -3.3155517578125, -3.1083984375, -2.9012451171875, -2.694091796875, -2.4869384765625, -2.27978515625, -2.0726318359375, -1.865478515625, -1.6583251953125, -1.451171875, -1.2440185546875, -1.036865234375, -0.8297119140625, -0.62255859375, -0.4154052734375, -0.208251953125, -0.0010986328125, 0.2060546875, 0.4132080078125, 0.620361328125, 0.8275146484375, 1.03466796875, 1.2418212890625, 1.448974609375, 1.6561279296875, 1.86328125, 2.0704345703125, 2.277587890625, 2.4847412109375, 2.69189453125, 2.8990478515625, 3.106201171875, 3.3133544921875, 3.5205078125, 3.7276611328125, 3.934814453125, 4.1419677734375, 4.34912109375, 4.5562744140625, 4.763427734375, 4.9705810546875, 5.177734375, 5.3848876953125, 5.592041015625, 5.7991943359375, 6.00634765625, 6.2135009765625, 6.420654296875, 6.6278076171875, 6.8349609375, 7.0421142578125, 7.249267578125, 7.4564208984375, 7.66357421875, 7.8707275390625, 8.077880859375, 8.2850341796875, 8.4921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 9.0, 7.0, 21.0, 40.0, 106.0, 3472.0, 286.0, 63.0, 19.0, 15.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.661773681640625, -1.57745361328125, -1.493133544921875, -1.4088134765625, -1.324493408203125, -1.24017333984375, -1.155853271484375, -1.071533203125, -0.987213134765625, -0.90289306640625, -0.818572998046875, -0.7342529296875, -0.649932861328125, -0.56561279296875, -0.481292724609375, -0.39697265625, -0.312652587890625, -0.22833251953125, -0.144012451171875, -0.0596923828125, 0.024627685546875, 0.10894775390625, 0.193267822265625, 0.277587890625, 0.361907958984375, 0.44622802734375, 0.530548095703125, 0.6148681640625, 0.699188232421875, 0.78350830078125, 0.867828369140625, 0.9521484375, 1.036468505859375, 1.12078857421875, 1.205108642578125, 1.2894287109375, 1.373748779296875, 1.45806884765625, 1.542388916015625, 1.626708984375, 1.711029052734375, 1.79534912109375, 1.879669189453125, 1.9639892578125, 2.048309326171875, 2.13262939453125, 2.216949462890625, 2.30126953125, 2.385589599609375, 2.46990966796875, 2.554229736328125, 2.6385498046875, 2.722869873046875, 2.80718994140625, 2.891510009765625, 2.975830078125, 3.060150146484375, 3.14447021484375, 3.228790283203125, 3.3131103515625, 3.397430419921875, 3.48175048828125, 3.566070556640625, 3.650390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 15.0, 25.0, 55.0, 117.0, 233.0, 230.0, 154.0, 75.0, 45.0, 25.0, 11.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3701701164245605, -6.9570112228393555, -6.543852806091309, -6.130694389343262, -5.717535495758057, -5.304376602172852, -4.891218185424805, -4.478059768676758, -4.064900875091553, -3.6517422199249268, -3.238583564758301, -2.825424909591675, -2.412266254425049, -1.9991075992584229, -1.5859489440917969, -1.172790288925171, -0.7596316337585449, -0.34647297859191895, 0.06668567657470703, 0.479844331741333, 0.893002986907959, 1.306161642074585, 1.719320297241211, 2.132478952407837, 2.545637607574463, 2.958796262741089, 3.371954917907715, 3.785113573074341, 4.198272228240967, 4.611431121826172, 5.024589538574219, 5.437747955322266, 5.8509063720703125, 6.264064788818359, 6.6772236824035645, 7.0903825759887695, 7.503540992736816, 7.916699409484863, 8.329858779907227, 8.743017196655273, 9.15617561340332, 9.569334030151367, 9.982492446899414, 10.395651817321777, 10.808810234069824, 11.221968650817871, 11.635128021240234, 12.048286437988281, 12.461444854736328, 12.874603271484375, 13.287761688232422, 13.700921058654785, 14.114079475402832, 14.527237892150879, 14.940397262573242, 15.353555679321289, 15.766714096069336, 16.179872512817383, 16.59303092956543, 17.006189346313477, 17.419349670410156, 17.832508087158203, 18.24566650390625, 18.658824920654297, 19.071983337402344]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 15.0, 16.0, 31.0, 16.0, 32.0, 18.0, 25.0, 40.0, 40.0, 54.0, 52.0, 54.0, 52.0, 64.0, 57.0, 53.0, 55.0, 50.0, 55.0, 40.0, 35.0, 25.0, 20.0, 21.0, 13.0, 18.0, 11.0, 9.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.4573750495910645, -6.265223503112793, -6.073071479797363, -5.880919933319092, -5.68876838684082, -5.496616363525391, -5.304464817047119, -5.112313270568848, -4.920161247253418, -4.7280097007751465, -4.535857677459717, -4.343706130981445, -4.151554584503174, -3.9594027996063232, -3.7672510147094727, -3.575099468231201, -3.3829479217529297, -3.190796136856079, -2.9986445903778076, -2.806492805480957, -2.6143412590026855, -2.422189474105835, -2.2300376892089844, -2.037886142730713, -1.8457343578338623, -1.6535826921463013, -1.4614310264587402, -1.2692792415618896, -1.0771275758743286, -0.8849759101867676, -0.692824125289917, -0.500672459602356, -0.3085203170776367, -0.1163686215877533, 0.07578307390213013, 0.26793479919433594, 0.460086464881897, 0.652238130569458, 0.8443899154663086, 1.0365415811538696, 1.2286932468414307, 1.4208449125289917, 1.6129965782165527, 1.8051483631134033, 1.9973000288009644, 2.1894516944885254, 2.381603479385376, 2.5737552642822266, 2.765906810760498, 2.9580585956573486, 3.15021014213562, 3.3423619270324707, 3.534513473510742, 3.7266652584075928, 3.9188170433044434, 4.110968589782715, 4.3031206130981445, 4.495272159576416, 4.687424182891846, 4.879575729370117, 5.071727275848389, 5.26387882232666, 5.45603084564209, 5.648182392120361, 5.840333938598633]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 10.0, 17.0, 21.0, 27.0, 39.0, 55.0, 62.0, 114.0, 153.0, 250.0, 387.0, 663.0, 1106.0, 1936.0, 3419.0, 6827.0, 13381.0, 27934.0, 63393.0, 148278.0, 376135.0, 231305.0, 93521.0, 40966.0, 18643.0, 8989.0, 4748.0, 2455.0, 1423.0, 837.0, 523.0, 310.0, 189.0, 139.0, 80.0, 54.0, 39.0, 31.0, 18.0, 15.0, 13.0, 9.0, 8.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.423828125, -2.347442626953125, -2.27105712890625, -2.194671630859375, -2.1182861328125, -2.041900634765625, -1.96551513671875, -1.889129638671875, -1.812744140625, -1.736358642578125, -1.65997314453125, -1.583587646484375, -1.5072021484375, -1.430816650390625, -1.35443115234375, -1.278045654296875, -1.20166015625, -1.125274658203125, -1.04888916015625, -0.972503662109375, -0.8961181640625, -0.819732666015625, -0.74334716796875, -0.666961669921875, -0.590576171875, -0.514190673828125, -0.43780517578125, -0.361419677734375, -0.2850341796875, -0.208648681640625, -0.13226318359375, -0.055877685546875, 0.0205078125, 0.096893310546875, 0.17327880859375, 0.249664306640625, 0.3260498046875, 0.402435302734375, 0.47882080078125, 0.555206298828125, 0.631591796875, 0.707977294921875, 0.78436279296875, 0.860748291015625, 0.9371337890625, 1.013519287109375, 1.08990478515625, 1.166290283203125, 1.24267578125, 1.319061279296875, 1.39544677734375, 1.471832275390625, 1.5482177734375, 1.624603271484375, 1.70098876953125, 1.777374267578125, 1.853759765625, 1.930145263671875, 2.00653076171875, 2.082916259765625, 2.1593017578125, 2.235687255859375, 2.31207275390625, 2.388458251953125, 2.46484375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 12.0, 10.0, 22.0, 15.0, 29.0, 25.0, 35.0, 50.0, 49.0, 68.0, 84.0, 61.0, 68.0, 54.0, 66.0, 63.0, 52.0, 46.0, 36.0, 34.0, 31.0, 14.0, 17.0, 12.0, 11.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5419921875, -1.501953125, -1.4619140625, -1.421875, -1.3818359375, -1.341796875, -1.3017578125, -1.26171875, -1.2216796875, -1.181640625, -1.1416015625, -1.1015625, -1.0615234375, -1.021484375, -0.9814453125, -0.94140625, -0.9013671875, -0.861328125, -0.8212890625, -0.78125, -0.7412109375, -0.701171875, -0.6611328125, -0.62109375, -0.5810546875, -0.541015625, -0.5009765625, -0.4609375, -0.4208984375, -0.380859375, -0.3408203125, -0.30078125, -0.2607421875, -0.220703125, -0.1806640625, -0.140625, -0.1005859375, -0.060546875, -0.0205078125, 0.01953125, 0.0595703125, 0.099609375, 0.1396484375, 0.1796875, 0.2197265625, 0.259765625, 0.2998046875, 0.33984375, 0.3798828125, 0.419921875, 0.4599609375, 0.5, 0.5400390625, 0.580078125, 0.6201171875, 0.66015625, 0.7001953125, 0.740234375, 0.7802734375, 0.8203125, 0.8603515625, 0.900390625, 0.9404296875, 0.98046875, 1.0205078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 10.0, 21.0, 24.0, 32.0, 56.0, 51.0, 81.0, 123.0, 174.0, 295.0, 506.0, 1006.0, 2646.0, 13193.0, 160561.0, 807197.0, 52343.0, 6430.0, 1797.0, 761.0, 408.0, 261.0, 173.0, 109.0, 67.0, 56.0, 35.0, 26.0, 20.0, 21.0, 15.0, 10.0, 4.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.33203125, -7.11187744140625, -6.8917236328125, -6.67156982421875, -6.451416015625, -6.23126220703125, -6.0111083984375, -5.79095458984375, -5.57080078125, -5.35064697265625, -5.1304931640625, -4.91033935546875, -4.690185546875, -4.47003173828125, -4.2498779296875, -4.02972412109375, -3.8095703125, -3.58941650390625, -3.3692626953125, -3.14910888671875, -2.928955078125, -2.70880126953125, -2.4886474609375, -2.26849365234375, -2.04833984375, -1.82818603515625, -1.6080322265625, -1.38787841796875, -1.167724609375, -0.94757080078125, -0.7274169921875, -0.50726318359375, -0.287109375, -0.06695556640625, 0.1531982421875, 0.37335205078125, 0.593505859375, 0.81365966796875, 1.0338134765625, 1.25396728515625, 1.47412109375, 1.69427490234375, 1.9144287109375, 2.13458251953125, 2.354736328125, 2.57489013671875, 2.7950439453125, 3.01519775390625, 3.2353515625, 3.45550537109375, 3.6756591796875, 3.89581298828125, 4.115966796875, 4.33612060546875, 4.5562744140625, 4.77642822265625, 4.99658203125, 5.21673583984375, 5.4368896484375, 5.65704345703125, 5.877197265625, 6.09735107421875, 6.3175048828125, 6.53765869140625, 6.7578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 4.0, 2.0, 4.0, 6.0, 6.0, 3.0, 19.0, 10.0, 15.0, 26.0, 18.0, 35.0, 34.0, 44.0, 40.0, 32.0, 48.0, 51.0, 48.0, 47.0, 42.0, 46.0, 54.0, 40.0, 47.0, 39.0, 36.0, 29.0, 38.0, 22.0, 11.0, 23.0, 12.0, 12.0, 14.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.10272216796875, -3.9710693359375, -3.83941650390625, -3.707763671875, -3.57611083984375, -3.4444580078125, -3.31280517578125, -3.18115234375, -3.04949951171875, -2.9178466796875, -2.78619384765625, -2.654541015625, -2.52288818359375, -2.3912353515625, -2.25958251953125, -2.1279296875, -1.99627685546875, -1.8646240234375, -1.73297119140625, -1.601318359375, -1.46966552734375, -1.3380126953125, -1.20635986328125, -1.07470703125, -0.94305419921875, -0.8114013671875, -0.67974853515625, -0.548095703125, -0.41644287109375, -0.2847900390625, -0.15313720703125, -0.021484375, 0.11016845703125, 0.2418212890625, 0.37347412109375, 0.505126953125, 0.63677978515625, 0.7684326171875, 0.90008544921875, 1.03173828125, 1.16339111328125, 1.2950439453125, 1.42669677734375, 1.558349609375, 1.69000244140625, 1.8216552734375, 1.95330810546875, 2.0849609375, 2.21661376953125, 2.3482666015625, 2.47991943359375, 2.611572265625, 2.74322509765625, 2.8748779296875, 3.00653076171875, 3.13818359375, 3.26983642578125, 3.4014892578125, 3.53314208984375, 3.664794921875, 3.79644775390625, 3.9281005859375, 4.05975341796875, 4.19140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 9.0, 5.0, 10.0, 16.0, 23.0, 19.0, 33.0, 46.0, 61.0, 85.0, 144.0, 207.0, 377.0, 620.0, 1385.0, 3188.0, 9001.0, 35921.0, 253277.0, 637465.0, 81247.0, 16189.0, 5005.0, 2003.0, 971.0, 470.0, 270.0, 153.0, 101.0, 74.0, 47.0, 33.0, 27.0, 17.0, 10.0, 10.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.70703125, -1.6540679931640625, -1.601104736328125, -1.5481414794921875, -1.49517822265625, -1.4422149658203125, -1.389251708984375, -1.3362884521484375, -1.2833251953125, -1.2303619384765625, -1.177398681640625, -1.1244354248046875, -1.07147216796875, -1.0185089111328125, -0.965545654296875, -0.9125823974609375, -0.859619140625, -0.8066558837890625, -0.753692626953125, -0.7007293701171875, -0.64776611328125, -0.5948028564453125, -0.541839599609375, -0.4888763427734375, -0.4359130859375, -0.3829498291015625, -0.329986572265625, -0.2770233154296875, -0.22406005859375, -0.1710968017578125, -0.118133544921875, -0.0651702880859375, -0.01220703125, 0.0407562255859375, 0.093719482421875, 0.1466827392578125, 0.19964599609375, 0.2526092529296875, 0.305572509765625, 0.3585357666015625, 0.4114990234375, 0.4644622802734375, 0.517425537109375, 0.5703887939453125, 0.62335205078125, 0.6763153076171875, 0.729278564453125, 0.7822418212890625, 0.835205078125, 0.8881683349609375, 0.941131591796875, 0.9940948486328125, 1.04705810546875, 1.1000213623046875, 1.152984619140625, 1.2059478759765625, 1.2589111328125, 1.3118743896484375, 1.364837646484375, 1.4178009033203125, 1.47076416015625, 1.5237274169921875, 1.576690673828125, 1.6296539306640625, 1.6826171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 3.0, 14.0, 5.0, 18.0, 18.0, 34.0, 39.0, 57.0, 75.0, 132.0, 194.0, 111.0, 69.0, 61.0, 40.0, 36.0, 18.0, 19.0, 20.0, 11.0, 12.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000484466552734375, -0.0004711933434009552, -0.0004579201340675354, -0.0004446469247341156, -0.0004313737154006958, -0.000418100506067276, -0.0004048272967338562, -0.0003915540874004364, -0.0003782808780670166, -0.0003650076687335968, -0.000351734459400177, -0.0003384612500667572, -0.0003251880407333374, -0.0003119148313999176, -0.0002986416220664978, -0.000285368412733078, -0.0002720952033996582, -0.0002588219940662384, -0.0002455487847328186, -0.0002322755753993988, -0.000219002366065979, -0.0002057291567325592, -0.0001924559473991394, -0.0001791827380657196, -0.0001659095287322998, -0.00015263631939888, -0.0001393631100654602, -0.0001260899007320404, -0.0001128166913986206, -9.95434820652008e-05, -8.6270272731781e-05, -7.29970633983612e-05, -5.9723854064941406e-05, -4.6450644731521606e-05, -3.317743539810181e-05, -1.9904226064682007e-05, -6.631016731262207e-06, 6.642192602157593e-06, 1.9915401935577393e-05, 3.318861126899719e-05, 4.646182060241699e-05, 5.973502993583679e-05, 7.300823926925659e-05, 8.628144860267639e-05, 9.955465793609619e-05, 0.00011282786726951599, 0.0001261010766029358, 0.0001393742859363556, 0.0001526474952697754, 0.0001659207046031952, 0.000179193913936615, 0.0001924671232700348, 0.0002057403326034546, 0.0002190135419368744, 0.0002322867512702942, 0.000245559960603714, 0.0002588331699371338, 0.0002721063792705536, 0.0002853795886039734, 0.0002986527979373932, 0.000311926007270813, 0.0003251992166042328, 0.0003384724259376526, 0.0003517456352710724, 0.0003650188446044922]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 6.0, 5.0, 8.0, 11.0, 11.0, 31.0, 36.0, 65.0, 92.0, 151.0, 283.0, 537.0, 1345.0, 4352.0, 26642.0, 573373.0, 413786.0, 21432.0, 3857.0, 1300.0, 527.0, 258.0, 161.0, 75.0, 74.0, 43.0, 29.0, 20.0, 10.0, 7.0, 5.0, 9.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9990234375, -1.9155731201171875, -1.832122802734375, -1.7486724853515625, -1.66522216796875, -1.5817718505859375, -1.498321533203125, -1.4148712158203125, -1.3314208984375, -1.2479705810546875, -1.164520263671875, -1.0810699462890625, -0.99761962890625, -0.9141693115234375, -0.830718994140625, -0.7472686767578125, -0.663818359375, -0.5803680419921875, -0.496917724609375, -0.4134674072265625, -0.33001708984375, -0.2465667724609375, -0.163116455078125, -0.0796661376953125, 0.0037841796875, 0.0872344970703125, 0.170684814453125, 0.2541351318359375, 0.33758544921875, 0.4210357666015625, 0.504486083984375, 0.5879364013671875, 0.67138671875, 0.7548370361328125, 0.838287353515625, 0.9217376708984375, 1.00518798828125, 1.0886383056640625, 1.172088623046875, 1.2555389404296875, 1.3389892578125, 1.4224395751953125, 1.505889892578125, 1.5893402099609375, 1.67279052734375, 1.7562408447265625, 1.839691162109375, 1.9231414794921875, 2.006591796875, 2.0900421142578125, 2.173492431640625, 2.2569427490234375, 2.34039306640625, 2.4238433837890625, 2.507293701171875, 2.5907440185546875, 2.6741943359375, 2.7576446533203125, 2.841094970703125, 2.9245452880859375, 3.00799560546875, 3.0914459228515625, 3.174896240234375, 3.2583465576171875, 3.341796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 10.0, 12.0, 10.0, 9.0, 14.0, 24.0, 21.0, 37.0, 30.0, 51.0, 52.0, 76.0, 94.0, 81.0, 81.0, 80.0, 60.0, 47.0, 43.0, 28.0, 32.0, 24.0, 17.0, 15.0, 16.0, 6.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-1.533203125, -1.4913482666015625, -1.449493408203125, -1.4076385498046875, -1.36578369140625, -1.3239288330078125, -1.282073974609375, -1.2402191162109375, -1.1983642578125, -1.1565093994140625, -1.114654541015625, -1.0727996826171875, -1.03094482421875, -0.9890899658203125, -0.947235107421875, -0.9053802490234375, -0.863525390625, -0.8216705322265625, -0.779815673828125, -0.7379608154296875, -0.69610595703125, -0.6542510986328125, -0.612396240234375, -0.5705413818359375, -0.5286865234375, -0.4868316650390625, -0.444976806640625, -0.4031219482421875, -0.36126708984375, -0.3194122314453125, -0.277557373046875, -0.2357025146484375, -0.19384765625, -0.1519927978515625, -0.110137939453125, -0.0682830810546875, -0.02642822265625, 0.0154266357421875, 0.057281494140625, 0.0991363525390625, 0.1409912109375, 0.1828460693359375, 0.224700927734375, 0.2665557861328125, 0.30841064453125, 0.3502655029296875, 0.392120361328125, 0.4339752197265625, 0.475830078125, 0.5176849365234375, 0.559539794921875, 0.6013946533203125, 0.64324951171875, 0.6851043701171875, 0.726959228515625, 0.7688140869140625, 0.8106689453125, 0.8525238037109375, 0.894378662109375, 0.9362335205078125, 0.97808837890625, 1.0199432373046875, 1.061798095703125, 1.1036529541015625, 1.1455078125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 13.0, 22.0, 48.0, 79.0, 150.0, 199.0, 203.0, 136.0, 77.0, 41.0, 12.0, 10.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.99011993408203, -51.58573913574219, -50.181358337402344, -48.7769775390625, -47.372596740722656, -45.96821594238281, -44.56383514404297, -43.159454345703125, -41.75507354736328, -40.35069274902344, -38.946311950683594, -37.54193115234375, -36.137550354003906, -34.73316955566406, -33.32878875732422, -31.924407958984375, -30.520029067993164, -29.11564826965332, -27.711267471313477, -26.306886672973633, -24.90250587463379, -23.498125076293945, -22.093746185302734, -20.68936538696289, -19.284984588623047, -17.880603790283203, -16.47622299194336, -15.071842193603516, -13.667461395263672, -12.263080596923828, -10.8587007522583, -9.454319953918457, -8.049938201904297, -6.645557403564453, -5.241176605224609, -3.836796283721924, -2.43241548538208, -1.0280346870422363, 0.3763456344604492, 1.780726432800293, 3.1851072311401367, 4.5894880294799805, 5.993868827819824, 7.39824914932251, 8.802629470825195, 10.207010269165039, 11.611391067504883, 13.015771865844727, 14.42015266418457, 15.824533462524414, 17.228914260864258, 18.6332950592041, 20.037675857543945, 21.44205665588379, 22.846435546875, 24.250816345214844, 25.655197143554688, 27.05957794189453, 28.463958740234375, 29.86833953857422, 31.272720336914062, 32.677101135253906, 34.08148193359375, 35.485862731933594, 36.89024353027344]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 6.0, 13.0, 15.0, 7.0, 18.0, 20.0, 13.0, 28.0, 22.0, 32.0, 34.0, 26.0, 35.0, 43.0, 35.0, 55.0, 55.0, 48.0, 49.0, 46.0, 51.0, 42.0, 35.0, 39.0, 34.0, 27.0, 29.0, 18.0, 30.0, 22.0, 11.0, 8.0, 12.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.100662231445312, -20.487611770629883, -19.874563217163086, -19.261512756347656, -18.64846420288086, -18.03541374206543, -17.42236328125, -16.809314727783203, -16.196264266967773, -15.58321475982666, -14.970165252685547, -14.357114791870117, -13.744065284729004, -13.13101577758789, -12.517966270446777, -11.904916763305664, -11.29186725616455, -10.678817749023438, -10.065768241882324, -9.452718734741211, -8.839668273925781, -8.226618766784668, -7.613569259643555, -7.000519275665283, -6.38746976852417, -5.774420261383057, -5.161370277404785, -4.548320770263672, -3.9352710247039795, -3.322221279144287, -2.709171772003174, -2.0961217880249023, -1.483072280883789, -0.8700225949287415, -0.25697290897369385, 0.356076717376709, 0.9691264629364014, 1.5821762084960938, 2.195225715637207, 2.8082756996154785, 3.421325206756592, 4.034374713897705, 4.647424697875977, 5.26047420501709, 5.873523712158203, 6.486573696136475, 7.099623203277588, 7.712673187255859, 8.325722694396973, 8.938772201538086, 9.5518217086792, 10.164871215820312, 10.777921676635742, 11.390971183776855, 12.004020690917969, 12.617071151733398, 13.230119705200195, 13.843169212341309, 14.456218719482422, 15.069269180297852, 15.682318687438965, 16.295368194580078, 16.908416748046875, 17.521467208862305, 18.134517669677734]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 8.0, 14.0, 22.0, 31.0, 27.0, 50.0, 83.0, 95.0, 177.0, 285.0, 422.0, 697.0, 1221.0, 2004.0, 3819.0, 7628.0, 16692.0, 44953.0, 224424.0, 3463167.0, 335315.0, 54991.0, 19666.0, 8586.0, 4277.0, 2333.0, 1289.0, 763.0, 441.0, 284.0, 179.0, 124.0, 68.0, 51.0, 28.0, 29.0, 12.0, 9.0, 4.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.155059814453125, -2.07965087890625, -2.004241943359375, -1.9288330078125, -1.853424072265625, -1.77801513671875, -1.702606201171875, -1.627197265625, -1.551788330078125, -1.47637939453125, -1.400970458984375, -1.3255615234375, -1.250152587890625, -1.17474365234375, -1.099334716796875, -1.02392578125, -0.948516845703125, -0.87310791015625, -0.797698974609375, -0.7222900390625, -0.646881103515625, -0.57147216796875, -0.496063232421875, -0.420654296875, -0.345245361328125, -0.26983642578125, -0.194427490234375, -0.1190185546875, -0.043609619140625, 0.03179931640625, 0.107208251953125, 0.1826171875, 0.258026123046875, 0.33343505859375, 0.408843994140625, 0.4842529296875, 0.559661865234375, 0.63507080078125, 0.710479736328125, 0.785888671875, 0.861297607421875, 0.93670654296875, 1.012115478515625, 1.0875244140625, 1.162933349609375, 1.23834228515625, 1.313751220703125, 1.38916015625, 1.464569091796875, 1.53997802734375, 1.615386962890625, 1.6907958984375, 1.766204833984375, 1.84161376953125, 1.917022705078125, 1.992431640625, 2.067840576171875, 2.14324951171875, 2.218658447265625, 2.2940673828125, 2.369476318359375, 2.44488525390625, 2.520294189453125, 2.595703125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 5.0, 8.0, 10.0, 19.0, 27.0, 30.0, 25.0, 35.0, 38.0, 42.0, 47.0, 61.0, 62.0, 45.0, 48.0, 55.0, 58.0, 51.0, 52.0, 33.0, 36.0, 29.0, 36.0, 17.0, 19.0, 21.0, 11.0, 17.0, 10.0, 13.0, 7.0, 3.0, 6.0, 1.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9976882934570312, -0.9690093994140625, -0.9403305053710938, -0.911651611328125, -0.8829727172851562, -0.8542938232421875, -0.8256149291992188, -0.79693603515625, -0.7682571411132812, -0.7395782470703125, -0.7108993530273438, -0.682220458984375, -0.6535415649414062, -0.6248626708984375, -0.5961837768554688, -0.5675048828125, -0.5388259887695312, -0.5101470947265625, -0.48146820068359375, -0.452789306640625, -0.42411041259765625, -0.3954315185546875, -0.36675262451171875, -0.33807373046875, -0.30939483642578125, -0.2807159423828125, -0.25203704833984375, -0.223358154296875, -0.19467926025390625, -0.1660003662109375, -0.13732147216796875, -0.108642578125, -0.07996368408203125, -0.0512847900390625, -0.02260589599609375, 0.006072998046875, 0.03475189208984375, 0.0634307861328125, 0.09210968017578125, 0.12078857421875, 0.14946746826171875, 0.1781463623046875, 0.20682525634765625, 0.235504150390625, 0.26418304443359375, 0.2928619384765625, 0.32154083251953125, 0.3502197265625, 0.37889862060546875, 0.4075775146484375, 0.43625640869140625, 0.464935302734375, 0.49361419677734375, 0.5222930908203125, 0.5509719848632812, 0.57965087890625, 0.6083297729492188, 0.6370086669921875, 0.6656875610351562, 0.694366455078125, 0.7230453491210938, 0.7517242431640625, 0.7804031372070312, 0.80908203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 28.0, 28.0, 75.0, 123.0, 244.0, 602.0, 2126.0, 13547.0, 574803.0, 3579191.0, 19647.0, 2666.0, 685.0, 249.0, 121.0, 50.0, 32.0, 20.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.6348876953125, -8.347900390625, -8.0609130859375, -7.77392578125, -7.4869384765625, -7.199951171875, -6.9129638671875, -6.6259765625, -6.3389892578125, -6.052001953125, -5.7650146484375, -5.47802734375, -5.1910400390625, -4.904052734375, -4.6170654296875, -4.330078125, -4.0430908203125, -3.756103515625, -3.4691162109375, -3.18212890625, -2.8951416015625, -2.608154296875, -2.3211669921875, -2.0341796875, -1.7471923828125, -1.460205078125, -1.1732177734375, -0.88623046875, -0.5992431640625, -0.312255859375, -0.0252685546875, 0.26171875, 0.5487060546875, 0.835693359375, 1.1226806640625, 1.40966796875, 1.6966552734375, 1.983642578125, 2.2706298828125, 2.5576171875, 2.8446044921875, 3.131591796875, 3.4185791015625, 3.70556640625, 3.9925537109375, 4.279541015625, 4.5665283203125, 4.853515625, 5.1405029296875, 5.427490234375, 5.7144775390625, 6.00146484375, 6.2884521484375, 6.575439453125, 6.8624267578125, 7.1494140625, 7.4364013671875, 7.723388671875, 8.0103759765625, 8.29736328125, 8.5843505859375, 8.871337890625, 9.1583251953125, 9.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 13.0, 20.0, 17.0, 38.0, 50.0, 95.0, 257.0, 926.0, 1967.0, 405.0, 140.0, 52.0, 23.0, 17.0, 13.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.6451416015625, -5.458251953125, -5.2713623046875, -5.08447265625, -4.8975830078125, -4.710693359375, -4.5238037109375, -4.3369140625, -4.1500244140625, -3.963134765625, -3.7762451171875, -3.58935546875, -3.4024658203125, -3.215576171875, -3.0286865234375, -2.841796875, -2.6549072265625, -2.468017578125, -2.2811279296875, -2.09423828125, -1.9073486328125, -1.720458984375, -1.5335693359375, -1.3466796875, -1.1597900390625, -0.972900390625, -0.7860107421875, -0.59912109375, -0.4122314453125, -0.225341796875, -0.0384521484375, 0.1484375, 0.3353271484375, 0.522216796875, 0.7091064453125, 0.89599609375, 1.0828857421875, 1.269775390625, 1.4566650390625, 1.6435546875, 1.8304443359375, 2.017333984375, 2.2042236328125, 2.39111328125, 2.5780029296875, 2.764892578125, 2.9517822265625, 3.138671875, 3.3255615234375, 3.512451171875, 3.6993408203125, 3.88623046875, 4.0731201171875, 4.260009765625, 4.4468994140625, 4.6337890625, 4.8206787109375, 5.007568359375, 5.1944580078125, 5.38134765625, 5.5682373046875, 5.755126953125, 5.9420166015625, 6.12890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 13.0, 20.0, 39.0, 91.0, 202.0, 306.0, 193.0, 82.0, 21.0, 17.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.11920166015625, -62.41537094116211, -60.711544036865234, -59.007713317871094, -57.30388259887695, -55.60005187988281, -53.89622497558594, -52.1923942565918, -50.488563537597656, -48.784732818603516, -47.08090591430664, -45.3770751953125, -43.67324447631836, -41.96941375732422, -40.265586853027344, -38.5617561340332, -36.85792922973633, -35.15409851074219, -33.45027160644531, -31.746440887451172, -30.04261016845703, -28.338781356811523, -26.634952545166016, -24.931121826171875, -23.227293014526367, -21.52346420288086, -19.81963348388672, -18.11580467224121, -16.411975860595703, -14.708145141601562, -13.004316329956055, -11.30048656463623, -9.59665298461914, -7.892823219299316, -6.18899393081665, -4.485164642333984, -2.78133487701416, -1.077505111694336, 0.6263236999511719, 2.330153465270996, 4.03398323059082, 5.7378129959106445, 7.4416422843933105, 9.145471572875977, 10.8493013381958, 12.553131103515625, 14.256959915161133, 15.960789680480957, 17.66461944580078, 19.36844825744629, 21.07227897644043, 22.776107788085938, 24.479938507080078, 26.183767318725586, 27.887596130371094, 29.591426849365234, 31.295255661010742, 32.99908447265625, 34.70291519165039, 36.40674591064453, 38.110572814941406, 39.81440353393555, 41.51823425292969, 43.22206115722656, 44.9258918762207]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 15.0, 15.0, 29.0, 21.0, 34.0, 37.0, 37.0, 53.0, 54.0, 47.0, 55.0, 58.0, 55.0, 52.0, 56.0, 39.0, 68.0, 40.0, 31.0, 29.0, 25.0, 27.0, 28.0, 9.0, 19.0, 12.0, 9.0, 11.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.76620101928711, -21.130428314208984, -20.49465560913086, -19.8588809967041, -19.223108291625977, -18.58733558654785, -17.951562881469727, -17.3157901763916, -16.680015563964844, -16.04424285888672, -15.408469200134277, -14.772696495056152, -14.136922836303711, -13.501150131225586, -12.865377426147461, -12.229604721069336, -11.593832015991211, -10.958059310913086, -10.322285652160645, -9.68651294708252, -9.050739288330078, -8.414966583251953, -7.779193878173828, -7.143420696258545, -6.507647514343262, -5.8718743324279785, -5.236101150512695, -4.60032844543457, -3.964555263519287, -3.328782081604004, -2.6930091381073, -2.0572361946105957, -1.4214611053466797, -0.785688042640686, -0.14991497993469238, 0.48585808277130127, 1.121631145477295, 1.7574043273925781, 2.3931772708892822, 3.0289502143859863, 3.6647233963012695, 4.300496578216553, 4.936269760131836, 5.572042465209961, 6.207815647125244, 6.843588829040527, 7.479361534118652, 8.115135192871094, 8.750907897949219, 9.386680603027344, 10.022454261779785, 10.65822696685791, 11.294000625610352, 11.929773330688477, 12.565546035766602, 13.201318740844727, 13.837092399597168, 14.472865104675293, 15.108638763427734, 15.74441146850586, 16.380184173583984, 17.01595687866211, 17.651731491088867, 18.287504196166992, 18.923276901245117]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 13.0, 20.0, 31.0, 46.0, 41.0, 95.0, 127.0, 229.0, 401.0, 676.0, 1148.0, 2148.0, 4072.0, 8094.0, 17789.0, 43151.0, 125619.0, 491759.0, 236876.0, 66713.0, 26218.0, 11409.0, 5277.0, 2780.0, 1581.0, 875.0, 516.0, 317.0, 199.0, 118.0, 86.0, 43.0, 26.0, 24.0, 10.0, 4.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.7454833984375, -2.658935546875, -2.5723876953125, -2.48583984375, -2.3992919921875, -2.312744140625, -2.2261962890625, -2.1396484375, -2.0531005859375, -1.966552734375, -1.8800048828125, -1.79345703125, -1.7069091796875, -1.620361328125, -1.5338134765625, -1.447265625, -1.3607177734375, -1.274169921875, -1.1876220703125, -1.10107421875, -1.0145263671875, -0.927978515625, -0.8414306640625, -0.7548828125, -0.6683349609375, -0.581787109375, -0.4952392578125, -0.40869140625, -0.3221435546875, -0.235595703125, -0.1490478515625, -0.0625, 0.0240478515625, 0.110595703125, 0.1971435546875, 0.28369140625, 0.3702392578125, 0.456787109375, 0.5433349609375, 0.6298828125, 0.7164306640625, 0.802978515625, 0.8895263671875, 0.97607421875, 1.0626220703125, 1.149169921875, 1.2357177734375, 1.322265625, 1.4088134765625, 1.495361328125, 1.5819091796875, 1.66845703125, 1.7550048828125, 1.841552734375, 1.9281005859375, 2.0146484375, 2.1011962890625, 2.187744140625, 2.2742919921875, 2.36083984375, 2.4473876953125, 2.533935546875, 2.6204833984375, 2.70703125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 7.0, 4.0, 3.0, 6.0, 14.0, 8.0, 25.0, 26.0, 29.0, 26.0, 32.0, 40.0, 38.0, 48.0, 46.0, 57.0, 50.0, 58.0, 52.0, 50.0, 59.0, 40.0, 39.0, 34.0, 39.0, 17.0, 21.0, 21.0, 23.0, 15.0, 12.0, 7.0, 11.0, 10.0, 6.0, 8.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.056640625, -1.02545166015625, -0.9942626953125, -0.96307373046875, -0.931884765625, -0.90069580078125, -0.8695068359375, -0.83831787109375, -0.80712890625, -0.77593994140625, -0.7447509765625, -0.71356201171875, -0.682373046875, -0.65118408203125, -0.6199951171875, -0.58880615234375, -0.5576171875, -0.52642822265625, -0.4952392578125, -0.46405029296875, -0.432861328125, -0.40167236328125, -0.3704833984375, -0.33929443359375, -0.30810546875, -0.27691650390625, -0.2457275390625, -0.21453857421875, -0.183349609375, -0.15216064453125, -0.1209716796875, -0.08978271484375, -0.05859375, -0.02740478515625, 0.0037841796875, 0.03497314453125, 0.066162109375, 0.09735107421875, 0.1285400390625, 0.15972900390625, 0.19091796875, 0.22210693359375, 0.2532958984375, 0.28448486328125, 0.315673828125, 0.34686279296875, 0.3780517578125, 0.40924072265625, 0.4404296875, 0.47161865234375, 0.5028076171875, 0.53399658203125, 0.565185546875, 0.59637451171875, 0.6275634765625, 0.65875244140625, 0.68994140625, 0.72113037109375, 0.7523193359375, 0.78350830078125, 0.814697265625, 0.84588623046875, 0.8770751953125, 0.90826416015625, 0.939453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 10.0, 12.0, 6.0, 25.0, 37.0, 77.0, 97.0, 167.0, 330.0, 809.0, 2303.0, 15091.0, 861105.0, 158612.0, 7129.0, 1523.0, 551.0, 291.0, 136.0, 62.0, 54.0, 48.0, 26.0, 11.0, 7.0, 6.0, 5.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9609375, -10.6165771484375, -10.272216796875, -9.9278564453125, -9.58349609375, -9.2391357421875, -8.894775390625, -8.5504150390625, -8.2060546875, -7.8616943359375, -7.517333984375, -7.1729736328125, -6.82861328125, -6.4842529296875, -6.139892578125, -5.7955322265625, -5.451171875, -5.1068115234375, -4.762451171875, -4.4180908203125, -4.07373046875, -3.7293701171875, -3.385009765625, -3.0406494140625, -2.6962890625, -2.3519287109375, -2.007568359375, -1.6632080078125, -1.31884765625, -0.9744873046875, -0.630126953125, -0.2857666015625, 0.05859375, 0.4029541015625, 0.747314453125, 1.0916748046875, 1.43603515625, 1.7803955078125, 2.124755859375, 2.4691162109375, 2.8134765625, 3.1578369140625, 3.502197265625, 3.8465576171875, 4.19091796875, 4.5352783203125, 4.879638671875, 5.2239990234375, 5.568359375, 5.9127197265625, 6.257080078125, 6.6014404296875, 6.94580078125, 7.2901611328125, 7.634521484375, 7.9788818359375, 8.3232421875, 8.6676025390625, 9.011962890625, 9.3563232421875, 9.70068359375, 10.0450439453125, 10.389404296875, 10.7337646484375, 11.078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 5.0, 7.0, 8.0, 24.0, 18.0, 15.0, 23.0, 30.0, 32.0, 55.0, 54.0, 48.0, 68.0, 66.0, 77.0, 62.0, 64.0, 61.0, 43.0, 44.0, 31.0, 41.0, 33.0, 21.0, 10.0, 9.0, 8.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.875, -6.668701171875, -6.46240234375, -6.256103515625, -6.0498046875, -5.843505859375, -5.63720703125, -5.430908203125, -5.224609375, -5.018310546875, -4.81201171875, -4.605712890625, -4.3994140625, -4.193115234375, -3.98681640625, -3.780517578125, -3.57421875, -3.367919921875, -3.16162109375, -2.955322265625, -2.7490234375, -2.542724609375, -2.33642578125, -2.130126953125, -1.923828125, -1.717529296875, -1.51123046875, -1.304931640625, -1.0986328125, -0.892333984375, -0.68603515625, -0.479736328125, -0.2734375, -0.067138671875, 0.13916015625, 0.345458984375, 0.5517578125, 0.758056640625, 0.96435546875, 1.170654296875, 1.376953125, 1.583251953125, 1.78955078125, 1.995849609375, 2.2021484375, 2.408447265625, 2.61474609375, 2.821044921875, 3.02734375, 3.233642578125, 3.43994140625, 3.646240234375, 3.8525390625, 4.058837890625, 4.26513671875, 4.471435546875, 4.677734375, 4.884033203125, 5.09033203125, 5.296630859375, 5.5029296875, 5.709228515625, 5.91552734375, 6.121826171875, 6.328125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 7.0, 15.0, 10.0, 19.0, 30.0, 34.0, 61.0, 113.0, 202.0, 353.0, 909.0, 2561.0, 11248.0, 138087.0, 855825.0, 31388.0, 5110.0, 1386.0, 565.0, 246.0, 146.0, 81.0, 38.0, 37.0, 16.0, 8.0, 9.0, 13.0, 6.0, 4.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.8343505859375, -3.711669921875, -3.5889892578125, -3.46630859375, -3.3436279296875, -3.220947265625, -3.0982666015625, -2.9755859375, -2.8529052734375, -2.730224609375, -2.6075439453125, -2.48486328125, -2.3621826171875, -2.239501953125, -2.1168212890625, -1.994140625, -1.8714599609375, -1.748779296875, -1.6260986328125, -1.50341796875, -1.3807373046875, -1.258056640625, -1.1353759765625, -1.0126953125, -0.8900146484375, -0.767333984375, -0.6446533203125, -0.52197265625, -0.3992919921875, -0.276611328125, -0.1539306640625, -0.03125, 0.0914306640625, 0.214111328125, 0.3367919921875, 0.45947265625, 0.5821533203125, 0.704833984375, 0.8275146484375, 0.9501953125, 1.0728759765625, 1.195556640625, 1.3182373046875, 1.44091796875, 1.5635986328125, 1.686279296875, 1.8089599609375, 1.931640625, 2.0543212890625, 2.177001953125, 2.2996826171875, 2.42236328125, 2.5450439453125, 2.667724609375, 2.7904052734375, 2.9130859375, 3.0357666015625, 3.158447265625, 3.2811279296875, 3.40380859375, 3.5264892578125, 3.649169921875, 3.7718505859375, 3.89453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 13.0, 14.0, 8.0, 35.0, 46.0, 68.0, 96.0, 184.0, 212.0, 99.0, 75.0, 40.0, 28.0, 16.0, 10.0, 15.0, 8.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004703998565673828, -0.0004542432725429535, -0.00043808668851852417, -0.00042193010449409485, -0.00040577352046966553, -0.0003896169364452362, -0.0003734603524208069, -0.00035730376839637756, -0.00034114718437194824, -0.0003249906003475189, -0.0003088340163230896, -0.0002926774322986603, -0.00027652084827423096, -0.00026036426424980164, -0.0002442076802253723, -0.000228051096200943, -0.00021189451217651367, -0.00019573792815208435, -0.00017958134412765503, -0.0001634247601032257, -0.0001472681760787964, -0.00013111159205436707, -0.00011495500802993774, -9.879842400550842e-05, -8.26418399810791e-05, -6.648525595664978e-05, -5.032867193222046e-05, -3.417208790779114e-05, -1.8015503883361816e-05, -1.8589198589324951e-06, 1.4297664165496826e-05, 3.0454248189926147e-05, 4.661083221435547e-05, 6.276741623878479e-05, 7.892400026321411e-05, 9.508058428764343e-05, 0.00011123716831207275, 0.00012739375233650208, 0.0001435503363609314, 0.00015970692038536072, 0.00017586350440979004, 0.00019202008843421936, 0.00020817667245864868, 0.000224333256483078, 0.00024048984050750732, 0.00025664642453193665, 0.00027280300855636597, 0.0002889595925807953, 0.0003051161766052246, 0.00032127276062965393, 0.00033742934465408325, 0.0003535859286785126, 0.0003697425127029419, 0.0003858990967273712, 0.00040205568075180054, 0.00041821226477622986, 0.0004343688488006592, 0.0004505254328250885, 0.0004666820168495178, 0.00048283860087394714, 0.0004989951848983765, 0.0005151517689228058, 0.0005313083529472351, 0.0005474649369716644, 0.0005636215209960938]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 5.0, 13.0, 10.0, 13.0, 25.0, 37.0, 50.0, 98.0, 126.0, 251.0, 534.0, 1354.0, 5072.0, 47963.0, 933428.0, 51723.0, 5125.0, 1445.0, 576.0, 285.0, 166.0, 83.0, 54.0, 27.0, 24.0, 14.0, 10.0, 6.0, 7.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.58734130859375, -3.4520263671875, -3.31671142578125, -3.181396484375, -3.04608154296875, -2.9107666015625, -2.77545166015625, -2.64013671875, -2.50482177734375, -2.3695068359375, -2.23419189453125, -2.098876953125, -1.96356201171875, -1.8282470703125, -1.69293212890625, -1.5576171875, -1.42230224609375, -1.2869873046875, -1.15167236328125, -1.016357421875, -0.88104248046875, -0.7457275390625, -0.61041259765625, -0.47509765625, -0.33978271484375, -0.2044677734375, -0.06915283203125, 0.066162109375, 0.20147705078125, 0.3367919921875, 0.47210693359375, 0.607421875, 0.74273681640625, 0.8780517578125, 1.01336669921875, 1.148681640625, 1.28399658203125, 1.4193115234375, 1.55462646484375, 1.68994140625, 1.82525634765625, 1.9605712890625, 2.09588623046875, 2.231201171875, 2.36651611328125, 2.5018310546875, 2.63714599609375, 2.7724609375, 2.90777587890625, 3.0430908203125, 3.17840576171875, 3.313720703125, 3.44903564453125, 3.5843505859375, 3.71966552734375, 3.85498046875, 3.99029541015625, 4.1256103515625, 4.26092529296875, 4.396240234375, 4.53155517578125, 4.6668701171875, 4.80218505859375, 4.9375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 15.0, 16.0, 15.0, 15.0, 35.0, 51.0, 73.0, 79.0, 114.0, 112.0, 108.0, 89.0, 75.0, 47.0, 32.0, 32.0, 22.0, 12.0, 12.0, 8.0, 6.0, 3.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.03515625, -2.9583892822265625, -2.881622314453125, -2.8048553466796875, -2.72808837890625, -2.6513214111328125, -2.574554443359375, -2.4977874755859375, -2.4210205078125, -2.3442535400390625, -2.267486572265625, -2.1907196044921875, -2.11395263671875, -2.0371856689453125, -1.960418701171875, -1.8836517333984375, -1.806884765625, -1.7301177978515625, -1.653350830078125, -1.5765838623046875, -1.49981689453125, -1.4230499267578125, -1.346282958984375, -1.2695159912109375, -1.1927490234375, -1.1159820556640625, -1.039215087890625, -0.9624481201171875, -0.88568115234375, -0.8089141845703125, -0.732147216796875, -0.6553802490234375, -0.57861328125, -0.5018463134765625, -0.425079345703125, -0.3483123779296875, -0.27154541015625, -0.1947784423828125, -0.118011474609375, -0.0412445068359375, 0.0355224609375, 0.1122894287109375, 0.189056396484375, 0.2658233642578125, 0.34259033203125, 0.4193572998046875, 0.496124267578125, 0.5728912353515625, 0.649658203125, 0.7264251708984375, 0.803192138671875, 0.8799591064453125, 0.95672607421875, 1.0334930419921875, 1.110260009765625, 1.1870269775390625, 1.2637939453125, 1.3405609130859375, 1.417327880859375, 1.4940948486328125, 1.57086181640625, 1.6476287841796875, 1.724395751953125, 1.8011627197265625, 1.8779296875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 13.0, 7.0, 12.0, 27.0, 30.0, 81.0, 94.0, 139.0, 181.0, 147.0, 111.0, 65.0, 40.0, 19.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.732933044433594, -46.589378356933594, -45.445823669433594, -44.302268981933594, -43.158714294433594, -42.015159606933594, -40.871604919433594, -39.72805404663086, -38.58449935913086, -37.44094467163086, -36.29738998413086, -35.15383529663086, -34.01028060913086, -32.866729736328125, -31.723173141479492, -30.579620361328125, -29.436063766479492, -28.292509078979492, -27.148954391479492, -26.005401611328125, -24.861846923828125, -23.718292236328125, -22.574737548828125, -21.431182861328125, -20.287628173828125, -19.144073486328125, -18.000518798828125, -16.856964111328125, -15.713411331176758, -14.569856643676758, -13.426301956176758, -12.282748222351074, -11.13919448852539, -9.99563980102539, -8.852086067199707, -7.708531379699707, -6.564977169036865, -5.421422958374023, -4.277868270874023, -3.13431453704834, -1.9907598495483398, -0.8472055196762085, 0.29634881019592285, 1.4399032592773438, 2.5834574699401855, 3.7270116806030273, 4.870566368103027, 6.014120101928711, 7.157674789428711, 8.301229476928711, 9.444783210754395, 10.588337898254395, 11.731891632080078, 12.875446319580078, 14.019001007080078, 15.162554740905762, 16.306110382080078, 17.449665069580078, 18.593219757080078, 19.736774444580078, 20.880327224731445, 22.023881912231445, 23.167436599731445, 24.310989379882812, 25.454544067382812]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 13.0, 26.0, 30.0, 37.0, 53.0, 66.0, 79.0, 97.0, 122.0, 122.0, 88.0, 82.0, 67.0, 33.0, 39.0, 16.0, 18.0, 11.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.863380432128906, -59.53375244140625, -58.204124450683594, -56.87449645996094, -55.54486846923828, -54.215240478515625, -52.88561248779297, -51.55598449707031, -50.226356506347656, -48.896728515625, -47.567100524902344, -46.23747253417969, -44.90784454345703, -43.578216552734375, -42.24858856201172, -40.91896057128906, -39.589332580566406, -38.25970458984375, -36.930076599121094, -35.60044860839844, -34.27082061767578, -32.941192626953125, -31.61156463623047, -30.281936645507812, -28.952312469482422, -27.622684478759766, -26.29305648803711, -24.963428497314453, -23.633800506591797, -22.30417251586914, -20.974544525146484, -19.644916534423828, -18.315288543701172, -16.985660552978516, -15.65603256225586, -14.326404571533203, -12.996776580810547, -11.66714859008789, -10.33752155303955, -9.007893562316895, -7.678265571594238, -6.348637580871582, -5.019009590148926, -3.6893820762634277, -2.3597540855407715, -1.0301260948181152, 0.2995014190673828, 1.629129409790039, 2.9587574005126953, 4.288385391235352, 5.618013381958008, 6.947640895843506, 8.27726936340332, 9.606897354125977, 10.936524391174316, 12.266152381896973, 13.595780372619629, 14.925408363342285, 16.255035400390625, 17.58466339111328, 18.914291381835938, 20.243919372558594, 21.57354736328125, 22.903175354003906, 24.232803344726562]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 5.0, 2.0, 10.0, 8.0, 12.0, 12.0, 14.0, 28.0, 30.0, 31.0, 64.0, 78.0, 131.0, 223.0, 371.0, 703.0, 1444.0, 3726.0, 12838.0, 94691.0, 3891841.0, 162493.0, 17817.0, 4540.0, 1566.0, 686.0, 349.0, 195.0, 120.0, 62.0, 64.0, 37.0, 23.0, 19.0, 5.0, 15.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.28515625, -4.14501953125, -4.0048828125, -3.86474609375, -3.724609375, -3.58447265625, -3.4443359375, -3.30419921875, -3.1640625, -3.02392578125, -2.8837890625, -2.74365234375, -2.603515625, -2.46337890625, -2.3232421875, -2.18310546875, -2.04296875, -1.90283203125, -1.7626953125, -1.62255859375, -1.482421875, -1.34228515625, -1.2021484375, -1.06201171875, -0.921875, -0.78173828125, -0.6416015625, -0.50146484375, -0.361328125, -0.22119140625, -0.0810546875, 0.05908203125, 0.19921875, 0.33935546875, 0.4794921875, 0.61962890625, 0.759765625, 0.89990234375, 1.0400390625, 1.18017578125, 1.3203125, 1.46044921875, 1.6005859375, 1.74072265625, 1.880859375, 2.02099609375, 2.1611328125, 2.30126953125, 2.44140625, 2.58154296875, 2.7216796875, 2.86181640625, 3.001953125, 3.14208984375, 3.2822265625, 3.42236328125, 3.5625, 3.70263671875, 3.8427734375, 3.98291015625, 4.123046875, 4.26318359375, 4.4033203125, 4.54345703125, 4.68359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 12.0, 19.0, 27.0, 65.0, 99.0, 130.0, 152.0, 165.0, 122.0, 99.0, 51.0, 36.0, 16.0, 11.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -4.029388427734375, -3.93768310546875, -3.845977783203125, -3.7542724609375, -3.662567138671875, -3.57086181640625, -3.479156494140625, -3.387451171875, -3.295745849609375, -3.20404052734375, -3.112335205078125, -3.0206298828125, -2.928924560546875, -2.83721923828125, -2.745513916015625, -2.65380859375, -2.562103271484375, -2.47039794921875, -2.378692626953125, -2.2869873046875, -2.195281982421875, -2.10357666015625, -2.011871337890625, -1.920166015625, -1.828460693359375, -1.73675537109375, -1.645050048828125, -1.5533447265625, -1.461639404296875, -1.36993408203125, -1.278228759765625, -1.1865234375, -1.094818115234375, -1.00311279296875, -0.911407470703125, -0.8197021484375, -0.727996826171875, -0.63629150390625, -0.544586181640625, -0.452880859375, -0.361175537109375, -0.26947021484375, -0.177764892578125, -0.0860595703125, 0.005645751953125, 0.09735107421875, 0.189056396484375, 0.28076171875, 0.372467041015625, 0.46417236328125, 0.555877685546875, 0.6475830078125, 0.739288330078125, 0.83099365234375, 0.922698974609375, 1.014404296875, 1.106109619140625, 1.19781494140625, 1.289520263671875, 1.3812255859375, 1.472930908203125, 1.56463623046875, 1.656341552734375, 1.748046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 2.0, 8.0, 10.0, 9.0, 28.0, 54.0, 99.0, 177.0, 294.0, 532.0, 1028.0, 2236.0, 5745.0, 21488.0, 208896.0, 3832120.0, 98438.0, 14885.0, 4424.0, 1796.0, 901.0, 479.0, 286.0, 142.0, 92.0, 27.0, 18.0, 15.0, 4.0, 7.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.828125, -5.64813232421875, -5.4681396484375, -5.28814697265625, -5.108154296875, -4.92816162109375, -4.7481689453125, -4.56817626953125, -4.38818359375, -4.20819091796875, -4.0281982421875, -3.84820556640625, -3.668212890625, -3.48822021484375, -3.3082275390625, -3.12823486328125, -2.9482421875, -2.76824951171875, -2.5882568359375, -2.40826416015625, -2.228271484375, -2.04827880859375, -1.8682861328125, -1.68829345703125, -1.50830078125, -1.32830810546875, -1.1483154296875, -0.96832275390625, -0.788330078125, -0.60833740234375, -0.4283447265625, -0.24835205078125, -0.068359375, 0.11163330078125, 0.2916259765625, 0.47161865234375, 0.651611328125, 0.83160400390625, 1.0115966796875, 1.19158935546875, 1.37158203125, 1.55157470703125, 1.7315673828125, 1.91156005859375, 2.091552734375, 2.27154541015625, 2.4515380859375, 2.63153076171875, 2.8115234375, 2.99151611328125, 3.1715087890625, 3.35150146484375, 3.531494140625, 3.71148681640625, 3.8914794921875, 4.07147216796875, 4.25146484375, 4.43145751953125, 4.6114501953125, 4.79144287109375, 4.971435546875, 5.15142822265625, 5.3314208984375, 5.51141357421875, 5.69140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 14.0, 9.0, 23.0, 29.0, 52.0, 86.0, 187.0, 602.0, 1850.0, 742.0, 223.0, 88.0, 41.0, 31.0, 18.0, 13.0, 12.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.16168212890625, -4.9874267578125, -4.81317138671875, -4.638916015625, -4.46466064453125, -4.2904052734375, -4.11614990234375, -3.94189453125, -3.76763916015625, -3.5933837890625, -3.41912841796875, -3.244873046875, -3.07061767578125, -2.8963623046875, -2.72210693359375, -2.5478515625, -2.37359619140625, -2.1993408203125, -2.02508544921875, -1.850830078125, -1.67657470703125, -1.5023193359375, -1.32806396484375, -1.15380859375, -0.97955322265625, -0.8052978515625, -0.63104248046875, -0.456787109375, -0.28253173828125, -0.1082763671875, 0.06597900390625, 0.240234375, 0.41448974609375, 0.5887451171875, 0.76300048828125, 0.937255859375, 1.11151123046875, 1.2857666015625, 1.46002197265625, 1.63427734375, 1.80853271484375, 1.9827880859375, 2.15704345703125, 2.331298828125, 2.50555419921875, 2.6798095703125, 2.85406494140625, 3.0283203125, 3.20257568359375, 3.3768310546875, 3.55108642578125, 3.725341796875, 3.89959716796875, 4.0738525390625, 4.24810791015625, 4.42236328125, 4.59661865234375, 4.7708740234375, 4.94512939453125, 5.119384765625, 5.29364013671875, 5.4678955078125, 5.64215087890625, 5.81640625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 14.0, 24.0, 134.0, 526.0, 247.0, 38.0, 13.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-122.79389190673828, -119.70279693603516, -116.61170196533203, -113.5206069946289, -110.42951965332031, -107.33842468261719, -104.24732971191406, -101.15623474121094, -98.06513977050781, -94.97404479980469, -91.88294982910156, -88.79185485839844, -85.70075988769531, -82.60967254638672, -79.5185775756836, -76.42748260498047, -73.33638763427734, -70.24529266357422, -67.1541976928711, -64.06310272216797, -60.97201156616211, -57.880916595458984, -54.789825439453125, -51.69873046875, -48.607635498046875, -45.51654052734375, -42.425445556640625, -39.334354400634766, -36.24325942993164, -33.152164459228516, -30.061071395874023, -26.96997833251953, -23.878890991210938, -20.787796020507812, -17.69670295715332, -14.605608940124512, -11.514514923095703, -8.423420906066895, -5.332326889038086, -2.2412338256835938, 0.8498611450195312, 3.94095516204834, 7.032049179077148, 10.123143196105957, 13.214237213134766, 16.30533218383789, 19.396425247192383, 22.487518310546875, 25.57861328125, 28.669708251953125, 31.760801315307617, 34.85189437866211, 37.942989349365234, 41.03408432006836, 44.12517547607422, 47.216270446777344, 50.30736541748047, 53.398460388183594, 56.48955535888672, 59.58064651489258, 62.6717414855957, 65.76283264160156, 68.85392761230469, 71.94502258300781, 75.03611755371094]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 13.0, 12.0, 12.0, 19.0, 32.0, 28.0, 51.0, 43.0, 48.0, 63.0, 76.0, 73.0, 64.0, 59.0, 84.0, 59.0, 59.0, 46.0, 41.0, 34.0, 22.0, 16.0, 11.0, 4.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.458568572998047, -19.611988067626953, -18.76540756225586, -17.918827056884766, -17.072248458862305, -16.22566795349121, -15.379087448120117, -14.532506942749023, -13.68592643737793, -12.839345932006836, -11.992766380310059, -11.146185874938965, -10.299605369567871, -9.453025817871094, -8.6064453125, -7.759864807128906, -6.913285255432129, -6.066705226898193, -5.2201247215271, -4.373544692993164, -3.5269644260406494, -2.6803841590881348, -1.8338041305541992, -0.9872236251831055, -0.14064359664916992, 0.7059366106987, 1.5525168180465698, 2.399096965789795, 3.2456772327423096, 4.092257499694824, 4.93883752822876, 5.7854180335998535, 6.631998062133789, 7.478578090667725, 8.32515811920166, 9.171738624572754, 10.018319129943848, 10.864898681640625, 11.711479187011719, 12.558059692382812, 13.404640197753906, 14.251220703125, 15.097800254821777, 15.944380760192871, 16.79096031188965, 17.637540817260742, 18.484121322631836, 19.33070182800293, 20.17728042602539, 21.023860931396484, 21.870441436767578, 22.717021942138672, 23.563600540161133, 24.410181045532227, 25.25676155090332, 26.103342056274414, 26.949922561645508, 27.7965030670166, 28.643083572387695, 29.489662170410156, 30.33624267578125, 31.182823181152344, 32.02940368652344, 32.87598419189453, 33.722564697265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 11.0, 3.0, 7.0, 16.0, 25.0, 37.0, 74.0, 114.0, 220.0, 383.0, 713.0, 1590.0, 3392.0, 8623.0, 25088.0, 99629.0, 631743.0, 213975.0, 41108.0, 12880.0, 4802.0, 1983.0, 990.0, 460.0, 278.0, 175.0, 77.0, 48.0, 39.0, 16.0, 15.0, 14.0, 5.0, 3.0, 4.0, 2.0, 5.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26953125, -3.1514892578125, -3.033447265625, -2.9154052734375, -2.79736328125, -2.6793212890625, -2.561279296875, -2.4432373046875, -2.3251953125, -2.2071533203125, -2.089111328125, -1.9710693359375, -1.85302734375, -1.7349853515625, -1.616943359375, -1.4989013671875, -1.380859375, -1.2628173828125, -1.144775390625, -1.0267333984375, -0.90869140625, -0.7906494140625, -0.672607421875, -0.5545654296875, -0.4365234375, -0.3184814453125, -0.200439453125, -0.0823974609375, 0.03564453125, 0.1536865234375, 0.271728515625, 0.3897705078125, 0.5078125, 0.6258544921875, 0.743896484375, 0.8619384765625, 0.97998046875, 1.0980224609375, 1.216064453125, 1.3341064453125, 1.4521484375, 1.5701904296875, 1.688232421875, 1.8062744140625, 1.92431640625, 2.0423583984375, 2.160400390625, 2.2784423828125, 2.396484375, 2.5145263671875, 2.632568359375, 2.7506103515625, 2.86865234375, 2.9866943359375, 3.104736328125, 3.2227783203125, 3.3408203125, 3.4588623046875, 3.576904296875, 3.6949462890625, 3.81298828125, 3.9310302734375, 4.049072265625, 4.1671142578125, 4.28515625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 17.0, 18.0, 34.0, 43.0, 48.0, 85.0, 84.0, 97.0, 109.0, 87.0, 95.0, 75.0, 68.0, 34.0, 37.0, 26.0, 16.0, 6.0, 7.0, 4.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.5513916015625, -2.479736328125, -2.4080810546875, -2.33642578125, -2.2647705078125, -2.193115234375, -2.1214599609375, -2.0498046875, -1.9781494140625, -1.906494140625, -1.8348388671875, -1.76318359375, -1.6915283203125, -1.619873046875, -1.5482177734375, -1.4765625, -1.4049072265625, -1.333251953125, -1.2615966796875, -1.18994140625, -1.1182861328125, -1.046630859375, -0.9749755859375, -0.9033203125, -0.8316650390625, -0.760009765625, -0.6883544921875, -0.61669921875, -0.5450439453125, -0.473388671875, -0.4017333984375, -0.330078125, -0.2584228515625, -0.186767578125, -0.1151123046875, -0.04345703125, 0.0281982421875, 0.099853515625, 0.1715087890625, 0.2431640625, 0.3148193359375, 0.386474609375, 0.4581298828125, 0.52978515625, 0.6014404296875, 0.673095703125, 0.7447509765625, 0.81640625, 0.8880615234375, 0.959716796875, 1.0313720703125, 1.10302734375, 1.1746826171875, 1.246337890625, 1.3179931640625, 1.3896484375, 1.4613037109375, 1.532958984375, 1.6046142578125, 1.67626953125, 1.7479248046875, 1.819580078125, 1.8912353515625, 1.962890625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 17.0, 13.0, 15.0, 32.0, 28.0, 32.0, 60.0, 90.0, 88.0, 158.0, 263.0, 418.0, 786.0, 1647.0, 3969.0, 13414.0, 70992.0, 771060.0, 153039.0, 22090.0, 5618.0, 2252.0, 952.0, 518.0, 289.0, 203.0, 124.0, 110.0, 61.0, 48.0, 33.0, 33.0, 16.0, 8.0, 14.0, 10.0, 3.0, 5.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.765625, -4.6102294921875, -4.454833984375, -4.2994384765625, -4.14404296875, -3.9886474609375, -3.833251953125, -3.6778564453125, -3.5224609375, -3.3670654296875, -3.211669921875, -3.0562744140625, -2.90087890625, -2.7454833984375, -2.590087890625, -2.4346923828125, -2.279296875, -2.1239013671875, -1.968505859375, -1.8131103515625, -1.65771484375, -1.5023193359375, -1.346923828125, -1.1915283203125, -1.0361328125, -0.8807373046875, -0.725341796875, -0.5699462890625, -0.41455078125, -0.2591552734375, -0.103759765625, 0.0516357421875, 0.20703125, 0.3624267578125, 0.517822265625, 0.6732177734375, 0.82861328125, 0.9840087890625, 1.139404296875, 1.2947998046875, 1.4501953125, 1.6055908203125, 1.760986328125, 1.9163818359375, 2.07177734375, 2.2271728515625, 2.382568359375, 2.5379638671875, 2.693359375, 2.8487548828125, 3.004150390625, 3.1595458984375, 3.31494140625, 3.4703369140625, 3.625732421875, 3.7811279296875, 3.9365234375, 4.0919189453125, 4.247314453125, 4.4027099609375, 4.55810546875, 4.7135009765625, 4.868896484375, 5.0242919921875, 5.1796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 0.0, 7.0, 7.0, 9.0, 21.0, 18.0, 22.0, 26.0, 38.0, 50.0, 47.0, 86.0, 69.0, 83.0, 77.0, 61.0, 82.0, 60.0, 59.0, 36.0, 28.0, 23.0, 22.0, 14.0, 13.0, 9.0, 15.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12890625, -5.88519287109375, -5.6414794921875, -5.39776611328125, -5.154052734375, -4.91033935546875, -4.6666259765625, -4.42291259765625, -4.17919921875, -3.93548583984375, -3.6917724609375, -3.44805908203125, -3.204345703125, -2.96063232421875, -2.7169189453125, -2.47320556640625, -2.2294921875, -1.98577880859375, -1.7420654296875, -1.49835205078125, -1.254638671875, -1.01092529296875, -0.7672119140625, -0.52349853515625, -0.27978515625, -0.03607177734375, 0.2076416015625, 0.45135498046875, 0.695068359375, 0.93878173828125, 1.1824951171875, 1.42620849609375, 1.669921875, 1.91363525390625, 2.1573486328125, 2.40106201171875, 2.644775390625, 2.88848876953125, 3.1322021484375, 3.37591552734375, 3.61962890625, 3.86334228515625, 4.1070556640625, 4.35076904296875, 4.594482421875, 4.83819580078125, 5.0819091796875, 5.32562255859375, 5.5693359375, 5.81304931640625, 6.0567626953125, 6.30047607421875, 6.544189453125, 6.78790283203125, 7.0316162109375, 7.27532958984375, 7.51904296875, 7.76275634765625, 8.0064697265625, 8.25018310546875, 8.493896484375, 8.73760986328125, 8.9813232421875, 9.22503662109375, 9.46875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 8.0, 7.0, 7.0, 14.0, 9.0, 17.0, 24.0, 30.0, 59.0, 79.0, 139.0, 250.0, 659.0, 2085.0, 11948.0, 441526.0, 575727.0, 12451.0, 2116.0, 707.0, 302.0, 125.0, 69.0, 52.0, 28.0, 37.0, 17.0, 17.0, 8.0, 8.0, 8.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.03125, -4.89154052734375, -4.7518310546875, -4.61212158203125, -4.472412109375, -4.33270263671875, -4.1929931640625, -4.05328369140625, -3.91357421875, -3.77386474609375, -3.6341552734375, -3.49444580078125, -3.354736328125, -3.21502685546875, -3.0753173828125, -2.93560791015625, -2.7958984375, -2.65618896484375, -2.5164794921875, -2.37677001953125, -2.237060546875, -2.09735107421875, -1.9576416015625, -1.81793212890625, -1.67822265625, -1.53851318359375, -1.3988037109375, -1.25909423828125, -1.119384765625, -0.97967529296875, -0.8399658203125, -0.70025634765625, -0.560546875, -0.42083740234375, -0.2811279296875, -0.14141845703125, -0.001708984375, 0.13800048828125, 0.2777099609375, 0.41741943359375, 0.55712890625, 0.69683837890625, 0.8365478515625, 0.97625732421875, 1.115966796875, 1.25567626953125, 1.3953857421875, 1.53509521484375, 1.6748046875, 1.81451416015625, 1.9542236328125, 2.09393310546875, 2.233642578125, 2.37335205078125, 2.5130615234375, 2.65277099609375, 2.79248046875, 2.93218994140625, 3.0718994140625, 3.21160888671875, 3.351318359375, 3.49102783203125, 3.6307373046875, 3.77044677734375, 3.91015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 3.0, 11.0, 12.0, 13.0, 16.0, 29.0, 33.0, 49.0, 58.0, 104.0, 177.0, 156.0, 97.0, 74.0, 35.0, 27.0, 15.0, 17.0, 21.0, 3.0, 9.0, 5.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037407875061035156, -0.00036197155714035034, -0.0003498643636703491, -0.0003377571702003479, -0.0003256499767303467, -0.00031354278326034546, -0.00030143558979034424, -0.000289328396320343, -0.0002772212028503418, -0.0002651140093803406, -0.00025300681591033936, -0.00024089962244033813, -0.00022879242897033691, -0.0002166852355003357, -0.00020457804203033447, -0.00019247084856033325, -0.00018036365509033203, -0.0001682564616203308, -0.0001561492681503296, -0.00014404207468032837, -0.00013193488121032715, -0.00011982768774032593, -0.00010772049427032471, -9.561330080032349e-05, -8.350610733032227e-05, -7.139891386032104e-05, -5.9291720390319824e-05, -4.7184526920318604e-05, -3.507733345031738e-05, -2.2970139980316162e-05, -1.0862946510314941e-05, 1.2442469596862793e-06, 1.33514404296875e-05, 2.545863389968872e-05, 3.756582736968994e-05, 4.967302083969116e-05, 6.178021430969238e-05, 7.38874077796936e-05, 8.599460124969482e-05, 9.810179471969604e-05, 0.00011020898818969727, 0.00012231618165969849, 0.0001344233751296997, 0.00014653056859970093, 0.00015863776206970215, 0.00017074495553970337, 0.0001828521490097046, 0.0001949593424797058, 0.00020706653594970703, 0.00021917372941970825, 0.00023128092288970947, 0.0002433881163597107, 0.0002554953098297119, 0.00026760250329971313, 0.00027970969676971436, 0.0002918168902397156, 0.0003039240837097168, 0.000316031277179718, 0.00032813847064971924, 0.00034024566411972046, 0.0003523528575897217, 0.0003644600510597229, 0.0003765672445297241, 0.00038867443799972534, 0.00040078163146972656]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 10.0, 15.0, 21.0, 37.0, 69.0, 143.0, 331.0, 939.0, 4739.0, 250725.0, 782589.0, 7007.0, 1145.0, 382.0, 178.0, 73.0, 60.0, 31.0, 22.0, 7.0, 10.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.94921875, -5.7578125, -5.56640625, -5.375, -5.18359375, -4.9921875, -4.80078125, -4.609375, -4.41796875, -4.2265625, -4.03515625, -3.84375, -3.65234375, -3.4609375, -3.26953125, -3.078125, -2.88671875, -2.6953125, -2.50390625, -2.3125, -2.12109375, -1.9296875, -1.73828125, -1.546875, -1.35546875, -1.1640625, -0.97265625, -0.78125, -0.58984375, -0.3984375, -0.20703125, -0.015625, 0.17578125, 0.3671875, 0.55859375, 0.75, 0.94140625, 1.1328125, 1.32421875, 1.515625, 1.70703125, 1.8984375, 2.08984375, 2.28125, 2.47265625, 2.6640625, 2.85546875, 3.046875, 3.23828125, 3.4296875, 3.62109375, 3.8125, 4.00390625, 4.1953125, 4.38671875, 4.578125, 4.76953125, 4.9609375, 5.15234375, 5.34375, 5.53515625, 5.7265625, 5.91796875, 6.109375, 6.30078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 10.0, 10.0, 14.0, 15.0, 30.0, 46.0, 50.0, 70.0, 88.0, 96.0, 139.0, 120.0, 78.0, 61.0, 39.0, 34.0, 31.0, 19.0, 14.0, 11.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7119140625, -1.6443023681640625, -1.576690673828125, -1.5090789794921875, -1.44146728515625, -1.3738555908203125, -1.306243896484375, -1.2386322021484375, -1.1710205078125, -1.1034088134765625, -1.035797119140625, -0.9681854248046875, -0.90057373046875, -0.8329620361328125, -0.765350341796875, -0.6977386474609375, -0.630126953125, -0.5625152587890625, -0.494903564453125, -0.4272918701171875, -0.35968017578125, -0.2920684814453125, -0.224456787109375, -0.1568450927734375, -0.0892333984375, -0.0216217041015625, 0.045989990234375, 0.1136016845703125, 0.18121337890625, 0.2488250732421875, 0.316436767578125, 0.3840484619140625, 0.45166015625, 0.5192718505859375, 0.586883544921875, 0.6544952392578125, 0.72210693359375, 0.7897186279296875, 0.857330322265625, 0.9249420166015625, 0.9925537109375, 1.0601654052734375, 1.127777099609375, 1.1953887939453125, 1.26300048828125, 1.3306121826171875, 1.398223876953125, 1.4658355712890625, 1.533447265625, 1.6010589599609375, 1.668670654296875, 1.7362823486328125, 1.80389404296875, 1.8715057373046875, 1.939117431640625, 2.0067291259765625, 2.0743408203125, 2.1419525146484375, 2.209564208984375, 2.2771759033203125, 2.34478759765625, 2.4123992919921875, 2.480010986328125, 2.5476226806640625, 2.615234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 12.0, 22.0, 45.0, 82.0, 163.0, 275.0, 209.0, 110.0, 38.0, 17.0, 9.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.57830810546875, -68.12085723876953, -66.66339874267578, -65.20594787597656, -63.748497009277344, -62.29104232788086, -60.83359146118164, -59.376136779785156, -57.91868591308594, -56.46123123168945, -55.003780364990234, -53.54632568359375, -52.08887481689453, -50.63142013549805, -49.17396926879883, -47.716514587402344, -46.259063720703125, -44.80160903930664, -43.34415817260742, -41.88670349121094, -40.42925262451172, -38.971797943115234, -37.514347076416016, -36.05689239501953, -34.59943771362305, -33.14198303222656, -31.684532165527344, -30.227079391479492, -28.76962661743164, -27.31217384338379, -25.854721069335938, -24.397266387939453, -22.939817428588867, -21.482364654541016, -20.024911880493164, -18.567459106445312, -17.11000633239746, -15.65255355834961, -14.195099830627441, -12.73764705657959, -11.280194282531738, -9.822741508483887, -8.365288734436035, -6.907835483551025, -5.450382709503174, -3.9929299354553223, -2.5354766845703125, -1.078023910522461, 0.3794288635253906, 1.8368817567825317, 3.294334650039673, 4.7517876625061035, 6.209240436553955, 7.666693210601807, 9.124146461486816, 10.581599235534668, 12.03905200958252, 13.496504783630371, 14.953957557678223, 16.41141128540039, 17.868864059448242, 19.326316833496094, 20.783769607543945, 22.241222381591797, 23.69867515563965]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 12.0, 6.0, 14.0, 22.0, 21.0, 25.0, 33.0, 47.0, 50.0, 64.0, 59.0, 68.0, 90.0, 63.0, 62.0, 48.0, 59.0, 59.0, 31.0, 27.0, 30.0, 21.0, 20.0, 12.0, 12.0, 16.0, 5.0, 3.0, 2.0, 4.0, 2.0, 4.0], "bins": [-40.0952033996582, -39.2021484375, -38.30908966064453, -37.41603469848633, -36.52297592163086, -35.629920959472656, -34.73686218261719, -33.843807220458984, -32.950748443603516, -32.05769348144531, -31.164634704589844, -30.271577835083008, -29.378520965576172, -28.485464096069336, -27.5924072265625, -26.699352264404297, -25.80629539489746, -24.913238525390625, -24.02018165588379, -23.127124786376953, -22.234067916870117, -21.34101104736328, -20.447956085205078, -19.55489730834961, -18.661842346191406, -17.76878547668457, -16.875728607177734, -15.982671737670898, -15.089614868164062, -14.196557998657227, -13.303502082824707, -12.410445213317871, -11.517387390136719, -10.624330520629883, -9.731273651123047, -8.838216781616211, -7.945160388946533, -7.052103519439697, -6.1590471267700195, -5.265990257263184, -4.372933387756348, -3.4798765182495117, -2.586819887161255, -1.693763256072998, -0.8007063865661621, 0.09235048294067383, 0.9854068756103516, 1.8784637451171875, 2.7715206146240234, 3.6645774841308594, 4.557634353637695, 5.450690746307373, 6.343747615814209, 7.236804485321045, 8.129860877990723, 9.022917747497559, 9.915974617004395, 10.80903148651123, 11.702088356018066, 12.595144271850586, 13.488201141357422, 14.381258010864258, 15.274314880371094, 16.16737174987793, 17.060428619384766]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 5.0, 6.0, 6.0, 5.0, 3.0, 9.0, 11.0, 19.0, 30.0, 39.0, 74.0, 144.0, 330.0, 904.0, 2831.0, 11767.0, 94192.0, 3546455.0, 500398.0, 28185.0, 6082.0, 1824.0, 610.0, 193.0, 70.0, 37.0, 23.0, 10.0, 11.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.878509521484375, -4.74920654296875, -4.619903564453125, -4.4906005859375, -4.361297607421875, -4.23199462890625, -4.102691650390625, -3.973388671875, -3.844085693359375, -3.71478271484375, -3.585479736328125, -3.4561767578125, -3.326873779296875, -3.19757080078125, -3.068267822265625, -2.93896484375, -2.809661865234375, -2.68035888671875, -2.551055908203125, -2.4217529296875, -2.292449951171875, -2.16314697265625, -2.033843994140625, -1.904541015625, -1.775238037109375, -1.64593505859375, -1.516632080078125, -1.3873291015625, -1.258026123046875, -1.12872314453125, -0.999420166015625, -0.8701171875, -0.740814208984375, -0.61151123046875, -0.482208251953125, -0.3529052734375, -0.223602294921875, -0.09429931640625, 0.035003662109375, 0.164306640625, 0.293609619140625, 0.42291259765625, 0.552215576171875, 0.6815185546875, 0.810821533203125, 0.94012451171875, 1.069427490234375, 1.19873046875, 1.328033447265625, 1.45733642578125, 1.586639404296875, 1.7159423828125, 1.845245361328125, 1.97454833984375, 2.103851318359375, 2.233154296875, 2.362457275390625, 2.49176025390625, 2.621063232421875, 2.7503662109375, 2.879669189453125, 3.00897216796875, 3.138275146484375, 3.267578125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 29.0, 42.0, 63.0, 95.0, 112.0, 143.0, 136.0, 126.0, 88.0, 63.0, 54.0, 29.0, 17.0, 6.0], "bins": [-4.91796875, -4.830177307128906, -4.7423858642578125, -4.654594421386719, -4.566802978515625, -4.479011535644531, -4.3912200927734375, -4.303428649902344, -4.21563720703125, -4.127845764160156, -4.0400543212890625, -3.9522628784179688, -3.864471435546875, -3.7766799926757812, -3.6888885498046875, -3.6010971069335938, -3.5133056640625, -3.4255142211914062, -3.3377227783203125, -3.2499313354492188, -3.162139892578125, -3.0743484497070312, -2.9865570068359375, -2.8987655639648438, -2.81097412109375, -2.7231826782226562, -2.6353912353515625, -2.5475997924804688, -2.459808349609375, -2.3720169067382812, -2.2842254638671875, -2.1964340209960938, -2.108642578125, -2.0208511352539062, -1.9330596923828125, -1.8452682495117188, -1.757476806640625, -1.6696853637695312, -1.5818939208984375, -1.4941024780273438, -1.40631103515625, -1.3185195922851562, -1.2307281494140625, -1.1429367065429688, -1.055145263671875, -0.9673538208007812, -0.8795623779296875, -0.7917709350585938, -0.7039794921875, -0.6161880493164062, -0.5283966064453125, -0.44060516357421875, -0.352813720703125, -0.26502227783203125, -0.1772308349609375, -0.08943939208984375, -0.00164794921875, 0.08614349365234375, 0.1739349365234375, 0.26172637939453125, 0.349517822265625, 0.43730926513671875, 0.5251007080078125, 0.6128921508789062, 0.70068359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 16.0, 31.0, 39.0, 61.0, 135.0, 307.0, 777.0, 2518.0, 12456.0, 188476.0, 3910120.0, 67588.0, 8292.0, 2121.0, 752.0, 281.0, 120.0, 77.0, 34.0, 19.0, 8.0, 11.0, 11.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.9453125, -8.6922607421875, -8.439208984375, -8.1861572265625, -7.93310546875, -7.6800537109375, -7.427001953125, -7.1739501953125, -6.9208984375, -6.6678466796875, -6.414794921875, -6.1617431640625, -5.90869140625, -5.6556396484375, -5.402587890625, -5.1495361328125, -4.896484375, -4.6434326171875, -4.390380859375, -4.1373291015625, -3.88427734375, -3.6312255859375, -3.378173828125, -3.1251220703125, -2.8720703125, -2.6190185546875, -2.365966796875, -2.1129150390625, -1.85986328125, -1.6068115234375, -1.353759765625, -1.1007080078125, -0.84765625, -0.5946044921875, -0.341552734375, -0.0885009765625, 0.16455078125, 0.4176025390625, 0.670654296875, 0.9237060546875, 1.1767578125, 1.4298095703125, 1.682861328125, 1.9359130859375, 2.18896484375, 2.4420166015625, 2.695068359375, 2.9481201171875, 3.201171875, 3.4542236328125, 3.707275390625, 3.9603271484375, 4.21337890625, 4.4664306640625, 4.719482421875, 4.9725341796875, 5.2255859375, 5.4786376953125, 5.731689453125, 5.9847412109375, 6.23779296875, 6.4908447265625, 6.743896484375, 6.9969482421875, 7.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 14.0, 10.0, 17.0, 30.0, 64.0, 91.0, 159.0, 404.0, 968.0, 1268.0, 487.0, 235.0, 97.0, 66.0, 38.0, 17.0, 21.0, 15.0, 19.0, 10.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.56597900390625, -5.3819580078125, -5.19793701171875, -5.013916015625, -4.82989501953125, -4.6458740234375, -4.46185302734375, -4.27783203125, -4.09381103515625, -3.9097900390625, -3.72576904296875, -3.541748046875, -3.35772705078125, -3.1737060546875, -2.98968505859375, -2.8056640625, -2.62164306640625, -2.4376220703125, -2.25360107421875, -2.069580078125, -1.88555908203125, -1.7015380859375, -1.51751708984375, -1.33349609375, -1.14947509765625, -0.9654541015625, -0.78143310546875, -0.597412109375, -0.41339111328125, -0.2293701171875, -0.04534912109375, 0.138671875, 0.32269287109375, 0.5067138671875, 0.69073486328125, 0.874755859375, 1.05877685546875, 1.2427978515625, 1.42681884765625, 1.61083984375, 1.79486083984375, 1.9788818359375, 2.16290283203125, 2.346923828125, 2.53094482421875, 2.7149658203125, 2.89898681640625, 3.0830078125, 3.26702880859375, 3.4510498046875, 3.63507080078125, 3.819091796875, 4.00311279296875, 4.1871337890625, 4.37115478515625, 4.55517578125, 4.73919677734375, 4.9232177734375, 5.10723876953125, 5.291259765625, 5.47528076171875, 5.6593017578125, 5.84332275390625, 6.02734375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 19.0, 94.0, 490.0, 315.0, 60.0, 9.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.50341796875, -107.76128387451172, -104.01914978027344, -100.27701568603516, -96.53488159179688, -92.7927474975586, -89.05061340332031, -85.30847930908203, -81.56634521484375, -77.82421112060547, -74.08207702636719, -70.3399429321289, -66.59780883789062, -62.855674743652344, -59.11354064941406, -55.37140655517578, -51.6292724609375, -47.88713836669922, -44.14500427246094, -40.402870178222656, -36.660736083984375, -32.918601989746094, -29.176467895507812, -25.43433380126953, -21.69219970703125, -17.95006561279297, -14.207931518554688, -10.465797424316406, -6.723663330078125, -2.9815292358398438, 0.7606048583984375, 4.502738952636719, 8.244873046875, 11.987007141113281, 15.729141235351562, 19.471275329589844, 23.213409423828125, 26.955543518066406, 30.697677612304688, 34.43981170654297, 38.18194580078125, 41.92407989501953, 45.66621398925781, 49.408348083496094, 53.150482177734375, 56.892616271972656, 60.63475036621094, 64.37688446044922, 68.1190185546875, 71.86115264892578, 75.60328674316406, 79.34542083740234, 83.08755493164062, 86.8296890258789, 90.57182312011719, 94.31395721435547, 98.05609130859375, 101.79822540283203, 105.54035949707031, 109.2824935913086, 113.02462768554688, 116.76676177978516, 120.50889587402344, 124.25102996826172, 127.9931640625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 5.0, 18.0, 18.0, 27.0, 23.0, 37.0, 61.0, 61.0, 69.0, 76.0, 103.0, 91.0, 69.0, 55.0, 55.0, 61.0, 50.0, 34.0, 31.0, 22.0, 12.0, 6.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.06675148010254, -23.902523040771484, -22.73829460144043, -21.574066162109375, -20.40983772277832, -19.245609283447266, -18.081382751464844, -16.917152404785156, -15.752924919128418, -14.588696479797363, -13.424468040466309, -12.26024055480957, -11.096012115478516, -9.931783676147461, -8.767555236816406, -7.603326797485352, -6.439098358154297, -5.274869918823242, -4.1106414794921875, -2.946413516998291, -1.7821850776672363, -0.6179566383361816, 0.5462713241577148, 1.7104997634887695, 2.874728202819824, 4.038956642150879, 5.203185081481934, 6.36741304397583, 7.531641483306885, 8.695869445800781, 9.860097885131836, 11.02432632446289, 12.188552856445312, 13.352781295776367, 14.517009735107422, 15.681238174438477, 16.84546661376953, 18.009695053100586, 19.17392349243164, 20.338150024414062, 21.50238037109375, 22.666608810424805, 23.83083724975586, 24.995065689086914, 26.15929412841797, 27.323522567749023, 28.487751007080078, 29.6519775390625, 30.816205978393555, 31.98043441772461, 33.14466094970703, 34.30889129638672, 35.47311782836914, 36.63734817504883, 37.80157470703125, 38.96580505371094, 40.13003158569336, 41.29425811767578, 42.45848846435547, 43.62271499633789, 44.78694534301758, 45.951171875, 47.11540222167969, 48.27962875366211, 49.4438591003418]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 9.0, 7.0, 19.0, 36.0, 68.0, 83.0, 188.0, 335.0, 770.0, 1741.0, 4235.0, 11634.0, 35364.0, 126155.0, 502451.0, 266761.0, 66448.0, 20288.0, 6961.0, 2695.0, 1119.0, 526.0, 284.0, 146.0, 73.0, 39.0, 27.0, 16.0, 14.0, 11.0, 5.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.109375, -3.987640380859375, -3.86590576171875, -3.744171142578125, -3.6224365234375, -3.500701904296875, -3.37896728515625, -3.257232666015625, -3.135498046875, -3.013763427734375, -2.89202880859375, -2.770294189453125, -2.6485595703125, -2.526824951171875, -2.40509033203125, -2.283355712890625, -2.16162109375, -2.039886474609375, -1.91815185546875, -1.796417236328125, -1.6746826171875, -1.552947998046875, -1.43121337890625, -1.309478759765625, -1.187744140625, -1.066009521484375, -0.94427490234375, -0.822540283203125, -0.7008056640625, -0.579071044921875, -0.45733642578125, -0.335601806640625, -0.2138671875, -0.092132568359375, 0.02960205078125, 0.151336669921875, 0.2730712890625, 0.394805908203125, 0.51654052734375, 0.638275146484375, 0.760009765625, 0.881744384765625, 1.00347900390625, 1.125213623046875, 1.2469482421875, 1.368682861328125, 1.49041748046875, 1.612152099609375, 1.73388671875, 1.855621337890625, 1.97735595703125, 2.099090576171875, 2.2208251953125, 2.342559814453125, 2.46429443359375, 2.586029052734375, 2.707763671875, 2.829498291015625, 2.95123291015625, 3.072967529296875, 3.1947021484375, 3.316436767578125, 3.43817138671875, 3.559906005859375, 3.681640625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 2.0, 8.0, 9.0, 6.0, 9.0, 8.0, 15.0, 26.0, 25.0, 29.0, 23.0, 22.0, 37.0, 27.0, 48.0, 46.0, 49.0, 55.0, 41.0, 43.0, 40.0, 49.0, 50.0, 44.0, 34.0, 30.0, 32.0, 21.0, 26.0, 23.0, 20.0, 13.0, 21.0, 10.0, 11.0, 8.0, 10.0, 9.0, 9.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.080078125, -1.0476150512695312, -1.0151519775390625, -0.9826889038085938, -0.950225830078125, -0.9177627563476562, -0.8852996826171875, -0.8528366088867188, -0.82037353515625, -0.7879104614257812, -0.7554473876953125, -0.7229843139648438, -0.690521240234375, -0.6580581665039062, -0.6255950927734375, -0.5931320190429688, -0.5606689453125, -0.5282058715820312, -0.4957427978515625, -0.46327972412109375, -0.430816650390625, -0.39835357666015625, -0.3658905029296875, -0.33342742919921875, -0.30096435546875, -0.26850128173828125, -0.2360382080078125, -0.20357513427734375, -0.171112060546875, -0.13864898681640625, -0.1061859130859375, -0.07372283935546875, -0.041259765625, -0.00879669189453125, 0.0236663818359375, 0.05612945556640625, 0.088592529296875, 0.12105560302734375, 0.1535186767578125, 0.18598175048828125, 0.21844482421875, 0.25090789794921875, 0.2833709716796875, 0.31583404541015625, 0.348297119140625, 0.38076019287109375, 0.4132232666015625, 0.44568634033203125, 0.4781494140625, 0.5106124877929688, 0.5430755615234375, 0.5755386352539062, 0.608001708984375, 0.6404647827148438, 0.6729278564453125, 0.7053909301757812, 0.73785400390625, 0.7703170776367188, 0.8027801513671875, 0.8352432250976562, 0.867706298828125, 0.9001693725585938, 0.9326324462890625, 0.9650955200195312, 0.99755859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 7.0, 11.0, 18.0, 23.0, 24.0, 36.0, 50.0, 96.0, 147.0, 222.0, 395.0, 763.0, 1688.0, 5479.0, 34515.0, 830696.0, 156466.0, 12212.0, 3066.0, 1197.0, 558.0, 319.0, 181.0, 129.0, 67.0, 49.0, 34.0, 28.0, 14.0, 12.0, 8.0, 9.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.897216796875, -7.62255859375, -7.347900390625, -7.0732421875, -6.798583984375, -6.52392578125, -6.249267578125, -5.974609375, -5.699951171875, -5.42529296875, -5.150634765625, -4.8759765625, -4.601318359375, -4.32666015625, -4.052001953125, -3.77734375, -3.502685546875, -3.22802734375, -2.953369140625, -2.6787109375, -2.404052734375, -2.12939453125, -1.854736328125, -1.580078125, -1.305419921875, -1.03076171875, -0.756103515625, -0.4814453125, -0.206787109375, 0.06787109375, 0.342529296875, 0.6171875, 0.891845703125, 1.16650390625, 1.441162109375, 1.7158203125, 1.990478515625, 2.26513671875, 2.539794921875, 2.814453125, 3.089111328125, 3.36376953125, 3.638427734375, 3.9130859375, 4.187744140625, 4.46240234375, 4.737060546875, 5.01171875, 5.286376953125, 5.56103515625, 5.835693359375, 6.1103515625, 6.385009765625, 6.65966796875, 6.934326171875, 7.208984375, 7.483642578125, 7.75830078125, 8.032958984375, 8.3076171875, 8.582275390625, 8.85693359375, 9.131591796875, 9.40625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 10.0, 3.0, 8.0, 15.0, 21.0, 19.0, 18.0, 28.0, 42.0, 38.0, 51.0, 43.0, 57.0, 63.0, 71.0, 56.0, 62.0, 46.0, 58.0, 39.0, 52.0, 40.0, 33.0, 31.0, 18.0, 15.0, 22.0, 14.0, 12.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53515625, -6.32696533203125, -6.1187744140625, -5.91058349609375, -5.702392578125, -5.49420166015625, -5.2860107421875, -5.07781982421875, -4.86962890625, -4.66143798828125, -4.4532470703125, -4.24505615234375, -4.036865234375, -3.82867431640625, -3.6204833984375, -3.41229248046875, -3.2041015625, -2.99591064453125, -2.7877197265625, -2.57952880859375, -2.371337890625, -2.16314697265625, -1.9549560546875, -1.74676513671875, -1.53857421875, -1.33038330078125, -1.1221923828125, -0.91400146484375, -0.705810546875, -0.49761962890625, -0.2894287109375, -0.08123779296875, 0.126953125, 0.33514404296875, 0.5433349609375, 0.75152587890625, 0.959716796875, 1.16790771484375, 1.3760986328125, 1.58428955078125, 1.79248046875, 2.00067138671875, 2.2088623046875, 2.41705322265625, 2.625244140625, 2.83343505859375, 3.0416259765625, 3.24981689453125, 3.4580078125, 3.66619873046875, 3.8743896484375, 4.08258056640625, 4.290771484375, 4.49896240234375, 4.7071533203125, 4.91534423828125, 5.12353515625, 5.33172607421875, 5.5399169921875, 5.74810791015625, 5.956298828125, 6.16448974609375, 6.3726806640625, 6.58087158203125, 6.7890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 8.0, 6.0, 13.0, 26.0, 26.0, 31.0, 30.0, 61.0, 87.0, 159.0, 248.0, 444.0, 878.0, 2111.0, 6469.0, 32366.0, 351153.0, 601161.0, 41257.0, 7494.0, 2408.0, 916.0, 469.0, 278.0, 159.0, 92.0, 46.0, 43.0, 23.0, 22.0, 7.0, 8.0, 11.0, 5.0, 6.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.921875, -1.857940673828125, -1.79400634765625, -1.730072021484375, -1.6661376953125, -1.602203369140625, -1.53826904296875, -1.474334716796875, -1.410400390625, -1.346466064453125, -1.28253173828125, -1.218597412109375, -1.1546630859375, -1.090728759765625, -1.02679443359375, -0.962860107421875, -0.89892578125, -0.834991455078125, -0.77105712890625, -0.707122802734375, -0.6431884765625, -0.579254150390625, -0.51531982421875, -0.451385498046875, -0.387451171875, -0.323516845703125, -0.25958251953125, -0.195648193359375, -0.1317138671875, -0.067779541015625, -0.00384521484375, 0.060089111328125, 0.1240234375, 0.187957763671875, 0.25189208984375, 0.315826416015625, 0.3797607421875, 0.443695068359375, 0.50762939453125, 0.571563720703125, 0.635498046875, 0.699432373046875, 0.76336669921875, 0.827301025390625, 0.8912353515625, 0.955169677734375, 1.01910400390625, 1.083038330078125, 1.14697265625, 1.210906982421875, 1.27484130859375, 1.338775634765625, 1.4027099609375, 1.466644287109375, 1.53057861328125, 1.594512939453125, 1.658447265625, 1.722381591796875, 1.78631591796875, 1.850250244140625, 1.9141845703125, 1.978118896484375, 2.04205322265625, 2.105987548828125, 2.169921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 15.0, 11.0, 12.0, 19.0, 22.0, 36.0, 36.0, 57.0, 54.0, 103.0, 97.0, 110.0, 92.0, 63.0, 61.0, 53.0, 29.0, 29.0, 19.0, 14.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004248619079589844, -0.00041309744119644165, -0.0004013329744338989, -0.0003895685076713562, -0.0003778040409088135, -0.00036603957414627075, -0.00035427510738372803, -0.0003425106406211853, -0.0003307461738586426, -0.00031898170709609985, -0.00030721724033355713, -0.0002954527735710144, -0.0002836883068084717, -0.00027192384004592896, -0.00026015937328338623, -0.0002483949065208435, -0.00023663043975830078, -0.00022486597299575806, -0.00021310150623321533, -0.0002013370394706726, -0.00018957257270812988, -0.00017780810594558716, -0.00016604363918304443, -0.0001542791724205017, -0.00014251470565795898, -0.00013075023889541626, -0.00011898577213287354, -0.00010722130537033081, -9.545683860778809e-05, -8.369237184524536e-05, -7.192790508270264e-05, -6.016343832015991e-05, -4.839897155761719e-05, -3.663450479507446e-05, -2.4870038032531738e-05, -1.3105571269989014e-05, -1.341104507446289e-06, 1.0423362255096436e-05, 2.218782901763916e-05, 3.3952295780181885e-05, 4.571676254272461e-05, 5.7481229305267334e-05, 6.924569606781006e-05, 8.101016283035278e-05, 9.277462959289551e-05, 0.00010453909635543823, 0.00011630356311798096, 0.00012806802988052368, 0.0001398324966430664, 0.00015159696340560913, 0.00016336143016815186, 0.00017512589693069458, 0.0001868903636932373, 0.00019865483045578003, 0.00021041929721832275, 0.00022218376398086548, 0.0002339482307434082, 0.00024571269750595093, 0.00025747716426849365, 0.0002692416310310364, 0.0002810060977935791, 0.0002927705645561218, 0.00030453503131866455, 0.0003162994980812073, 0.00032806396484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 4.0, 7.0, 5.0, 11.0, 26.0, 31.0, 40.0, 83.0, 152.0, 327.0, 705.0, 2086.0, 11010.0, 578134.0, 441789.0, 10624.0, 2072.0, 745.0, 305.0, 165.0, 95.0, 51.0, 30.0, 21.0, 6.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.063751220703125, -3.95953369140625, -3.855316162109375, -3.7510986328125, -3.646881103515625, -3.54266357421875, -3.438446044921875, -3.334228515625, -3.230010986328125, -3.12579345703125, -3.021575927734375, -2.9173583984375, -2.813140869140625, -2.70892333984375, -2.604705810546875, -2.50048828125, -2.396270751953125, -2.29205322265625, -2.187835693359375, -2.0836181640625, -1.979400634765625, -1.87518310546875, -1.770965576171875, -1.666748046875, -1.562530517578125, -1.45831298828125, -1.354095458984375, -1.2498779296875, -1.145660400390625, -1.04144287109375, -0.937225341796875, -0.8330078125, -0.728790283203125, -0.62457275390625, -0.520355224609375, -0.4161376953125, -0.311920166015625, -0.20770263671875, -0.103485107421875, 0.000732421875, 0.104949951171875, 0.20916748046875, 0.313385009765625, 0.4176025390625, 0.521820068359375, 0.62603759765625, 0.730255126953125, 0.83447265625, 0.938690185546875, 1.04290771484375, 1.147125244140625, 1.2513427734375, 1.355560302734375, 1.45977783203125, 1.563995361328125, 1.668212890625, 1.772430419921875, 1.87664794921875, 1.980865478515625, 2.0850830078125, 2.189300537109375, 2.29351806640625, 2.397735595703125, 2.501953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 8.0, 3.0, 9.0, 3.0, 15.0, 16.0, 16.0, 31.0, 36.0, 43.0, 66.0, 69.0, 80.0, 89.0, 83.0, 75.0, 60.0, 59.0, 51.0, 43.0, 44.0, 32.0, 22.0, 13.0, 9.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8759765625, -1.8257293701171875, -1.775482177734375, -1.7252349853515625, -1.67498779296875, -1.6247406005859375, -1.574493408203125, -1.5242462158203125, -1.4739990234375, -1.4237518310546875, -1.373504638671875, -1.3232574462890625, -1.27301025390625, -1.2227630615234375, -1.172515869140625, -1.1222686767578125, -1.072021484375, -1.0217742919921875, -0.971527099609375, -0.9212799072265625, -0.87103271484375, -0.8207855224609375, -0.770538330078125, -0.7202911376953125, -0.6700439453125, -0.6197967529296875, -0.569549560546875, -0.5193023681640625, -0.46905517578125, -0.4188079833984375, -0.368560791015625, -0.3183135986328125, -0.26806640625, -0.2178192138671875, -0.167572021484375, -0.1173248291015625, -0.06707763671875, -0.0168304443359375, 0.033416748046875, 0.0836639404296875, 0.1339111328125, 0.1841583251953125, 0.234405517578125, 0.2846527099609375, 0.33489990234375, 0.3851470947265625, 0.435394287109375, 0.4856414794921875, 0.535888671875, 0.5861358642578125, 0.636383056640625, 0.6866302490234375, 0.73687744140625, 0.7871246337890625, 0.837371826171875, 0.8876190185546875, 0.9378662109375, 0.9881134033203125, 1.038360595703125, 1.0886077880859375, 1.13885498046875, 1.1891021728515625, 1.239349365234375, 1.2895965576171875, 1.33984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 25.0, 38.0, 108.0, 286.0, 306.0, 125.0, 77.0, 16.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.84762573242188, -77.90388488769531, -75.96013641357422, -74.01639556884766, -72.0726547241211, -70.12890625, -68.18516540527344, -66.24142456054688, -64.29768371582031, -62.353939056396484, -60.41019821166992, -58.466453552246094, -56.52271270751953, -54.5789680480957, -52.635223388671875, -50.69148254394531, -48.74773406982422, -46.80398941040039, -44.86024856567383, -42.91650390625, -40.97276306152344, -39.02901840209961, -37.08527374267578, -35.14153289794922, -33.19778823852539, -31.254045486450195, -29.310302734375, -27.366558074951172, -25.422815322875977, -23.47907257080078, -21.535327911376953, -19.591585159301758, -17.647842407226562, -15.704099655151367, -13.760355949401855, -11.816612243652344, -9.872869491577148, -7.929126739501953, -5.985383033752441, -4.04163932800293, -2.0978965759277344, -0.15415334701538086, 1.7895898818969727, 3.733333110809326, 5.67707633972168, 7.620819091796875, 9.564562797546387, 11.508306503295898, 13.452049255371094, 15.395792007446289, 17.339534759521484, 19.283279418945312, 21.227022171020508, 23.170764923095703, 25.11450958251953, 27.058252334594727, 29.001995086669922, 30.945737838745117, 32.88948059082031, 34.83322525024414, 36.77696990966797, 38.72071075439453, 40.66445541381836, 42.60820007324219, 44.55194091796875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 7.0, 11.0, 11.0, 14.0, 19.0, 20.0, 16.0, 24.0, 29.0, 35.0, 33.0, 41.0, 48.0, 56.0, 60.0, 70.0, 79.0, 58.0, 49.0, 28.0, 45.0, 43.0, 37.0, 28.0, 25.0, 20.0, 22.0, 13.0, 13.0, 14.0, 6.0, 9.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15326690673828, -18.427181243896484, -17.701095581054688, -16.97500991821289, -16.248924255371094, -15.522839546203613, -14.796754837036133, -14.070669174194336, -13.344583511352539, -12.618497848510742, -11.892412185668945, -11.166327476501465, -10.440241813659668, -9.714156150817871, -8.98807144165039, -8.261985778808594, -7.535900115966797, -6.809814453125, -6.083729267120361, -5.357644081115723, -4.631558418273926, -3.905472993850708, -3.1793875694274902, -2.4533023834228516, -1.7272167205810547, -1.001131296157837, -0.27504587173461914, 0.45103955268859863, 1.1771249771118164, 1.9032104015350342, 2.629295825958252, 3.3553810119628906, 4.0814666748046875, 4.807552337646484, 5.533637523651123, 6.259722709655762, 6.985808372497559, 7.7118940353393555, 8.437978744506836, 9.164064407348633, 9.89015007019043, 10.616235733032227, 11.342321395874023, 12.068406105041504, 12.7944917678833, 13.520577430725098, 14.246662139892578, 14.972747802734375, 15.698833465576172, 16.42491912841797, 17.151004791259766, 17.877090454101562, 18.60317611694336, 19.329259872436523, 20.05534553527832, 20.781431198120117, 21.507516860961914, 22.23360252380371, 22.959688186645508, 23.685773849487305, 24.41185760498047, 25.137943267822266, 25.864028930664062, 26.59011459350586, 27.316200256347656]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 19.0, 30.0, 50.0, 80.0, 159.0, 303.0, 667.0, 1308.0, 3327.0, 9584.0, 40505.0, 526263.0, 3397563.0, 180141.0, 23777.0, 6191.0, 2265.0, 1013.0, 461.0, 252.0, 140.0, 70.0, 35.0, 30.0, 13.0, 5.0, 12.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.32611083984375, -2.2264404296875, -2.12677001953125, -2.027099609375, -1.92742919921875, -1.8277587890625, -1.72808837890625, -1.62841796875, -1.52874755859375, -1.4290771484375, -1.32940673828125, -1.229736328125, -1.13006591796875, -1.0303955078125, -0.93072509765625, -0.8310546875, -0.73138427734375, -0.6317138671875, -0.53204345703125, -0.432373046875, -0.33270263671875, -0.2330322265625, -0.13336181640625, -0.03369140625, 0.06597900390625, 0.1656494140625, 0.26531982421875, 0.364990234375, 0.46466064453125, 0.5643310546875, 0.66400146484375, 0.763671875, 0.86334228515625, 0.9630126953125, 1.06268310546875, 1.162353515625, 1.26202392578125, 1.3616943359375, 1.46136474609375, 1.56103515625, 1.66070556640625, 1.7603759765625, 1.86004638671875, 1.959716796875, 2.05938720703125, 2.1590576171875, 2.25872802734375, 2.3583984375, 2.45806884765625, 2.5577392578125, 2.65740966796875, 2.757080078125, 2.85675048828125, 2.9564208984375, 3.05609130859375, 3.15576171875, 3.25543212890625, 3.3551025390625, 3.45477294921875, 3.554443359375, 3.65411376953125, 3.7537841796875, 3.85345458984375, 3.953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 9.0, 14.0, 24.0, 20.0, 38.0, 45.0, 42.0, 65.0, 72.0, 75.0, 79.0, 76.0, 82.0, 68.0, 61.0, 55.0, 37.0, 36.0, 27.0, 21.0, 18.0, 16.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.214447021484375, -1.15936279296875, -1.104278564453125, -1.0491943359375, -0.994110107421875, -0.93902587890625, -0.883941650390625, -0.828857421875, -0.773773193359375, -0.71868896484375, -0.663604736328125, -0.6085205078125, -0.553436279296875, -0.49835205078125, -0.443267822265625, -0.38818359375, -0.333099365234375, -0.27801513671875, -0.222930908203125, -0.1678466796875, -0.112762451171875, -0.05767822265625, -0.002593994140625, 0.052490234375, 0.107574462890625, 0.16265869140625, 0.217742919921875, 0.2728271484375, 0.327911376953125, 0.38299560546875, 0.438079833984375, 0.4931640625, 0.548248291015625, 0.60333251953125, 0.658416748046875, 0.7135009765625, 0.768585205078125, 0.82366943359375, 0.878753662109375, 0.933837890625, 0.988922119140625, 1.04400634765625, 1.099090576171875, 1.1541748046875, 1.209259033203125, 1.26434326171875, 1.319427490234375, 1.37451171875, 1.429595947265625, 1.48468017578125, 1.539764404296875, 1.5948486328125, 1.649932861328125, 1.70501708984375, 1.760101318359375, 1.815185546875, 1.870269775390625, 1.92535400390625, 1.980438232421875, 2.0355224609375, 2.090606689453125, 2.14569091796875, 2.200775146484375, 2.255859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 12.0, 18.0, 31.0, 49.0, 75.0, 165.0, 276.0, 549.0, 1228.0, 3345.0, 10322.0, 45142.0, 506827.0, 3485266.0, 113974.0, 18352.0, 5148.0, 1870.0, 762.0, 378.0, 182.0, 109.0, 64.0, 44.0, 22.0, 16.0, 10.0, 6.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.96136474609375, -3.8211669921875, -3.68096923828125, -3.540771484375, -3.40057373046875, -3.2603759765625, -3.12017822265625, -2.97998046875, -2.83978271484375, -2.6995849609375, -2.55938720703125, -2.419189453125, -2.27899169921875, -2.1387939453125, -1.99859619140625, -1.8583984375, -1.71820068359375, -1.5780029296875, -1.43780517578125, -1.297607421875, -1.15740966796875, -1.0172119140625, -0.87701416015625, -0.73681640625, -0.59661865234375, -0.4564208984375, -0.31622314453125, -0.176025390625, -0.03582763671875, 0.1043701171875, 0.24456787109375, 0.384765625, 0.52496337890625, 0.6651611328125, 0.80535888671875, 0.945556640625, 1.08575439453125, 1.2259521484375, 1.36614990234375, 1.50634765625, 1.64654541015625, 1.7867431640625, 1.92694091796875, 2.067138671875, 2.20733642578125, 2.3475341796875, 2.48773193359375, 2.6279296875, 2.76812744140625, 2.9083251953125, 3.04852294921875, 3.188720703125, 3.32891845703125, 3.4691162109375, 3.60931396484375, 3.74951171875, 3.88970947265625, 4.0299072265625, 4.17010498046875, 4.310302734375, 4.45050048828125, 4.5906982421875, 4.73089599609375, 4.87109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 4.0, 8.0, 13.0, 16.0, 17.0, 30.0, 20.0, 45.0, 60.0, 85.0, 149.0, 304.0, 736.0, 1119.0, 708.0, 298.0, 166.0, 85.0, 54.0, 37.0, 21.0, 26.0, 12.0, 8.0, 8.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.47174072265625, -4.3341064453125, -4.19647216796875, -4.058837890625, -3.92120361328125, -3.7835693359375, -3.64593505859375, -3.50830078125, -3.37066650390625, -3.2330322265625, -3.09539794921875, -2.957763671875, -2.82012939453125, -2.6824951171875, -2.54486083984375, -2.4072265625, -2.26959228515625, -2.1319580078125, -1.99432373046875, -1.856689453125, -1.71905517578125, -1.5814208984375, -1.44378662109375, -1.30615234375, -1.16851806640625, -1.0308837890625, -0.89324951171875, -0.755615234375, -0.61798095703125, -0.4803466796875, -0.34271240234375, -0.205078125, -0.06744384765625, 0.0701904296875, 0.20782470703125, 0.345458984375, 0.48309326171875, 0.6207275390625, 0.75836181640625, 0.89599609375, 1.03363037109375, 1.1712646484375, 1.30889892578125, 1.446533203125, 1.58416748046875, 1.7218017578125, 1.85943603515625, 1.9970703125, 2.13470458984375, 2.2723388671875, 2.40997314453125, 2.547607421875, 2.68524169921875, 2.8228759765625, 2.96051025390625, 3.09814453125, 3.23577880859375, 3.3734130859375, 3.51104736328125, 3.648681640625, 3.78631591796875, 3.9239501953125, 4.06158447265625, 4.19921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 9.0, 21.0, 39.0, 184.0, 377.0, 244.0, 77.0, 28.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.83332824707031, -41.71901321411133, -39.604698181152344, -37.490386962890625, -35.37607192993164, -33.261756896972656, -31.147443771362305, -29.033130645751953, -26.91881561279297, -24.804500579833984, -22.690187454223633, -20.57587432861328, -18.461559295654297, -16.347244262695312, -14.232931137084961, -12.118617057800293, -10.004302978515625, -7.889988899230957, -5.775674819946289, -3.661360740661621, -1.5470466613769531, 0.5672674179077148, 2.681581497192383, 4.795895576477051, 6.910209655761719, 9.024523735046387, 11.138837814331055, 13.253151893615723, 15.36746597290039, 17.481781005859375, 19.596094131469727, 21.710407257080078, 23.824722290039062, 25.939037322998047, 28.0533504486084, 30.16766357421875, 32.281978607177734, 34.39629364013672, 36.51060485839844, 38.62491989135742, 40.739234924316406, 42.85354995727539, 44.967864990234375, 47.082176208496094, 49.19649124145508, 51.31080627441406, 53.42511749267578, 55.539432525634766, 57.65374755859375, 59.768062591552734, 61.88237762451172, 63.99668884277344, 66.11100769042969, 68.2253189086914, 70.33963012695312, 72.45394897460938, 74.5682601928711, 76.68257141113281, 78.79689025878906, 80.91120147705078, 83.0255126953125, 85.13983154296875, 87.25414276123047, 89.36846160888672, 91.48277282714844]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 9.0, 9.0, 10.0, 7.0, 18.0, 22.0, 28.0, 19.0, 46.0, 33.0, 48.0, 42.0, 55.0, 56.0, 51.0, 52.0, 71.0, 65.0, 55.0, 36.0, 46.0, 39.0, 44.0, 39.0, 24.0, 16.0, 10.0, 7.0, 13.0, 6.0, 8.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.82343292236328, -16.198184967041016, -15.572936058044434, -14.947687149047852, -14.322439193725586, -13.697190284729004, -13.071941375732422, -12.446693420410156, -11.821444511413574, -11.196195602416992, -10.570947647094727, -9.945698738098145, -9.320449829101562, -8.695201873779297, -8.069952964782715, -7.444704532623291, -6.819456100463867, -6.194207668304443, -5.5689592361450195, -4.9437103271484375, -4.318461894989014, -3.69321346282959, -3.067964792251587, -2.442716121673584, -1.8174676895141602, -1.1922191381454468, -0.5669705867767334, 0.05827796459197998, 0.6835265159606934, 1.3087749481201172, 1.9340236186981201, 2.559272289276123, 3.184520721435547, 3.8097691535949707, 4.4350175857543945, 5.060266494750977, 5.6855149269104, 6.310763359069824, 6.936012268066406, 7.56126070022583, 8.186509132385254, 8.811758041381836, 9.437005996704102, 10.062254905700684, 10.687503814697266, 11.312751770019531, 11.938000679016113, 12.563249588012695, 13.188497543334961, 13.813746452331543, 14.438994407653809, 15.06424331665039, 15.689491271972656, 16.314739227294922, 16.93998908996582, 17.565237045288086, 18.190486907958984, 18.81573486328125, 19.44098472595215, 20.066232681274414, 20.69148063659668, 21.316730499267578, 21.941978454589844, 22.56722640991211, 23.192474365234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 4.0, 6.0, 6.0, 10.0, 23.0, 31.0, 72.0, 203.0, 564.0, 1864.0, 6321.0, 29898.0, 382261.0, 577470.0, 38988.0, 7571.0, 2140.0, 709.0, 225.0, 96.0, 44.0, 14.0, 13.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05078125, -4.84930419921875, -4.6478271484375, -4.44635009765625, -4.244873046875, -4.04339599609375, -3.8419189453125, -3.64044189453125, -3.43896484375, -3.23748779296875, -3.0360107421875, -2.83453369140625, -2.633056640625, -2.43157958984375, -2.2301025390625, -2.02862548828125, -1.8271484375, -1.62567138671875, -1.4241943359375, -1.22271728515625, -1.021240234375, -0.81976318359375, -0.6182861328125, -0.41680908203125, -0.21533203125, -0.01385498046875, 0.1876220703125, 0.38909912109375, 0.590576171875, 0.79205322265625, 0.9935302734375, 1.19500732421875, 1.396484375, 1.59796142578125, 1.7994384765625, 2.00091552734375, 2.202392578125, 2.40386962890625, 2.6053466796875, 2.80682373046875, 3.00830078125, 3.20977783203125, 3.4112548828125, 3.61273193359375, 3.814208984375, 4.01568603515625, 4.2171630859375, 4.41864013671875, 4.6201171875, 4.82159423828125, 5.0230712890625, 5.22454833984375, 5.426025390625, 5.62750244140625, 5.8289794921875, 6.03045654296875, 6.23193359375, 6.43341064453125, 6.6348876953125, 6.83636474609375, 7.037841796875, 7.23931884765625, 7.4407958984375, 7.64227294921875, 7.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 11.0, 10.0, 14.0, 16.0, 17.0, 18.0, 14.0, 32.0, 34.0, 27.0, 37.0, 33.0, 36.0, 41.0, 41.0, 40.0, 33.0, 45.0, 47.0, 53.0, 40.0, 34.0, 30.0, 34.0, 21.0, 25.0, 25.0, 29.0, 23.0, 15.0, 18.0, 18.0, 9.0, 6.0, 9.0, 5.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9691925048828125, -0.937408447265625, -0.9056243896484375, -0.87384033203125, -0.8420562744140625, -0.810272216796875, -0.7784881591796875, -0.7467041015625, -0.7149200439453125, -0.683135986328125, -0.6513519287109375, -0.61956787109375, -0.5877838134765625, -0.555999755859375, -0.5242156982421875, -0.492431640625, -0.4606475830078125, -0.428863525390625, -0.3970794677734375, -0.36529541015625, -0.3335113525390625, -0.301727294921875, -0.2699432373046875, -0.2381591796875, -0.2063751220703125, -0.174591064453125, -0.1428070068359375, -0.11102294921875, -0.0792388916015625, -0.047454833984375, -0.0156707763671875, 0.01611328125, 0.0478973388671875, 0.079681396484375, 0.1114654541015625, 0.14324951171875, 0.1750335693359375, 0.206817626953125, 0.2386016845703125, 0.2703857421875, 0.3021697998046875, 0.333953857421875, 0.3657379150390625, 0.39752197265625, 0.4293060302734375, 0.461090087890625, 0.4928741455078125, 0.524658203125, 0.5564422607421875, 0.588226318359375, 0.6200103759765625, 0.65179443359375, 0.6835784912109375, 0.715362548828125, 0.7471466064453125, 0.7789306640625, 0.8107147216796875, 0.842498779296875, 0.8742828369140625, 0.90606689453125, 0.9378509521484375, 0.969635009765625, 1.0014190673828125, 1.033203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 14.0, 29.0, 30.0, 86.0, 118.0, 189.0, 401.0, 775.0, 1943.0, 8227.0, 97130.0, 895492.0, 36328.0, 4951.0, 1484.0, 565.0, 319.0, 169.0, 87.0, 80.0, 49.0, 14.0, 12.0, 9.0, 7.0, 4.0, 7.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.60791015625, -7.3486328125, -7.08935546875, -6.830078125, -6.57080078125, -6.3115234375, -6.05224609375, -5.79296875, -5.53369140625, -5.2744140625, -5.01513671875, -4.755859375, -4.49658203125, -4.2373046875, -3.97802734375, -3.71875, -3.45947265625, -3.2001953125, -2.94091796875, -2.681640625, -2.42236328125, -2.1630859375, -1.90380859375, -1.64453125, -1.38525390625, -1.1259765625, -0.86669921875, -0.607421875, -0.34814453125, -0.0888671875, 0.17041015625, 0.4296875, 0.68896484375, 0.9482421875, 1.20751953125, 1.466796875, 1.72607421875, 1.9853515625, 2.24462890625, 2.50390625, 2.76318359375, 3.0224609375, 3.28173828125, 3.541015625, 3.80029296875, 4.0595703125, 4.31884765625, 4.578125, 4.83740234375, 5.0966796875, 5.35595703125, 5.615234375, 5.87451171875, 6.1337890625, 6.39306640625, 6.65234375, 6.91162109375, 7.1708984375, 7.43017578125, 7.689453125, 7.94873046875, 8.2080078125, 8.46728515625, 8.7265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 8.0, 8.0, 10.0, 11.0, 25.0, 16.0, 26.0, 23.0, 18.0, 35.0, 44.0, 58.0, 45.0, 49.0, 53.0, 57.0, 46.0, 58.0, 45.0, 51.0, 42.0, 40.0, 32.0, 26.0, 30.0, 16.0, 20.0, 17.0, 23.0, 12.0, 14.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.28662109375, -4.1279296875, -3.96923828125, -3.810546875, -3.65185546875, -3.4931640625, -3.33447265625, -3.17578125, -3.01708984375, -2.8583984375, -2.69970703125, -2.541015625, -2.38232421875, -2.2236328125, -2.06494140625, -1.90625, -1.74755859375, -1.5888671875, -1.43017578125, -1.271484375, -1.11279296875, -0.9541015625, -0.79541015625, -0.63671875, -0.47802734375, -0.3193359375, -0.16064453125, -0.001953125, 0.15673828125, 0.3154296875, 0.47412109375, 0.6328125, 0.79150390625, 0.9501953125, 1.10888671875, 1.267578125, 1.42626953125, 1.5849609375, 1.74365234375, 1.90234375, 2.06103515625, 2.2197265625, 2.37841796875, 2.537109375, 2.69580078125, 2.8544921875, 3.01318359375, 3.171875, 3.33056640625, 3.4892578125, 3.64794921875, 3.806640625, 3.96533203125, 4.1240234375, 4.28271484375, 4.44140625, 4.60009765625, 4.7587890625, 4.91748046875, 5.076171875, 5.23486328125, 5.3935546875, 5.55224609375, 5.7109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 9.0, 17.0, 29.0, 28.0, 58.0, 85.0, 123.0, 141.0, 254.0, 377.0, 682.0, 1410.0, 3687.0, 12912.0, 72205.0, 690958.0, 224435.0, 29637.0, 6742.0, 2345.0, 989.0, 522.0, 284.0, 190.0, 127.0, 85.0, 58.0, 33.0, 29.0, 15.0, 13.0, 15.0, 14.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3642578125, -1.3213043212890625, -1.278350830078125, -1.2353973388671875, -1.19244384765625, -1.1494903564453125, -1.106536865234375, -1.0635833740234375, -1.0206298828125, -0.9776763916015625, -0.934722900390625, -0.8917694091796875, -0.84881591796875, -0.8058624267578125, -0.762908935546875, -0.7199554443359375, -0.677001953125, -0.6340484619140625, -0.591094970703125, -0.5481414794921875, -0.50518798828125, -0.4622344970703125, -0.419281005859375, -0.3763275146484375, -0.3333740234375, -0.2904205322265625, -0.247467041015625, -0.2045135498046875, -0.16156005859375, -0.1186065673828125, -0.075653076171875, -0.0326995849609375, 0.01025390625, 0.0532073974609375, 0.096160888671875, 0.1391143798828125, 0.18206787109375, 0.2250213623046875, 0.267974853515625, 0.3109283447265625, 0.3538818359375, 0.3968353271484375, 0.439788818359375, 0.4827423095703125, 0.52569580078125, 0.5686492919921875, 0.611602783203125, 0.6545562744140625, 0.697509765625, 0.7404632568359375, 0.783416748046875, 0.8263702392578125, 0.86932373046875, 0.9122772216796875, 0.955230712890625, 0.9981842041015625, 1.0411376953125, 1.0840911865234375, 1.127044677734375, 1.1699981689453125, 1.21295166015625, 1.2559051513671875, 1.298858642578125, 1.3418121337890625, 1.384765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 14.0, 12.0, 17.0, 25.0, 38.0, 49.0, 67.0, 125.0, 162.0, 139.0, 107.0, 55.0, 36.0, 27.0, 24.0, 20.0, 11.0, 12.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00043320655822753906, -0.00042204558849334717, -0.0004108846187591553, -0.0003997236490249634, -0.0003885626792907715, -0.0003774017095565796, -0.0003662407398223877, -0.0003550797700881958, -0.0003439188003540039, -0.000332757830619812, -0.0003215968608856201, -0.0003104358911514282, -0.00029927492141723633, -0.00028811395168304443, -0.00027695298194885254, -0.00026579201221466064, -0.00025463104248046875, -0.00024347007274627686, -0.00023230910301208496, -0.00022114813327789307, -0.00020998716354370117, -0.00019882619380950928, -0.00018766522407531738, -0.0001765042543411255, -0.0001653432846069336, -0.0001541823148727417, -0.0001430213451385498, -0.0001318603754043579, -0.00012069940567016602, -0.00010953843593597412, -9.837746620178223e-05, -8.721649646759033e-05, -7.605552673339844e-05, -6.489455699920654e-05, -5.373358726501465e-05, -4.2572617530822754e-05, -3.141164779663086e-05, -2.0250678062438965e-05, -9.08970832824707e-06, 2.0712614059448242e-06, 1.3232231140136719e-05, 2.4393200874328613e-05, 3.555417060852051e-05, 4.67151403427124e-05, 5.78761100769043e-05, 6.903707981109619e-05, 8.019804954528809e-05, 9.135901927947998e-05, 0.00010251998901367188, 0.00011368095874786377, 0.00012484192848205566, 0.00013600289821624756, 0.00014716386795043945, 0.00015832483768463135, 0.00016948580741882324, 0.00018064677715301514, 0.00019180774688720703, 0.00020296871662139893, 0.00021412968635559082, 0.00022529065608978271, 0.0002364516258239746, 0.0002476125955581665, 0.0002587735652923584, 0.0002699345350265503, 0.0002810955047607422]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 8.0, 23.0, 23.0, 31.0, 43.0, 75.0, 123.0, 203.0, 323.0, 560.0, 1203.0, 2796.0, 8976.0, 49990.0, 650384.0, 292465.0, 30507.0, 6413.0, 2219.0, 950.0, 495.0, 297.0, 147.0, 116.0, 56.0, 28.0, 29.0, 25.0, 14.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2260894775390625, -1.183624267578125, -1.1411590576171875, -1.09869384765625, -1.0562286376953125, -1.013763427734375, -0.9712982177734375, -0.9288330078125, -0.8863677978515625, -0.843902587890625, -0.8014373779296875, -0.75897216796875, -0.7165069580078125, -0.674041748046875, -0.6315765380859375, -0.589111328125, -0.5466461181640625, -0.504180908203125, -0.4617156982421875, -0.41925048828125, -0.3767852783203125, -0.334320068359375, -0.2918548583984375, -0.2493896484375, -0.2069244384765625, -0.164459228515625, -0.1219940185546875, -0.07952880859375, -0.0370635986328125, 0.005401611328125, 0.0478668212890625, 0.09033203125, 0.1327972412109375, 0.175262451171875, 0.2177276611328125, 0.26019287109375, 0.3026580810546875, 0.345123291015625, 0.3875885009765625, 0.4300537109375, 0.4725189208984375, 0.514984130859375, 0.5574493408203125, 0.59991455078125, 0.6423797607421875, 0.684844970703125, 0.7273101806640625, 0.769775390625, 0.8122406005859375, 0.854705810546875, 0.8971710205078125, 0.93963623046875, 0.9821014404296875, 1.024566650390625, 1.0670318603515625, 1.1094970703125, 1.1519622802734375, 1.194427490234375, 1.2368927001953125, 1.27935791015625, 1.3218231201171875, 1.364288330078125, 1.4067535400390625, 1.44921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 10.0, 8.0, 7.0, 19.0, 18.0, 27.0, 33.0, 26.0, 39.0, 37.0, 34.0, 47.0, 51.0, 58.0, 61.0, 55.0, 57.0, 64.0, 44.0, 44.0, 35.0, 43.0, 26.0, 25.0, 24.0, 23.0, 14.0, 13.0, 10.0, 9.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.97802734375, -0.9501571655273438, -0.9222869873046875, -0.8944168090820312, -0.866546630859375, -0.8386764526367188, -0.8108062744140625, -0.7829360961914062, -0.75506591796875, -0.7271957397460938, -0.6993255615234375, -0.6714553833007812, -0.643585205078125, -0.6157150268554688, -0.5878448486328125, -0.5599746704101562, -0.5321044921875, -0.5042343139648438, -0.4763641357421875, -0.44849395751953125, -0.420623779296875, -0.39275360107421875, -0.3648834228515625, -0.33701324462890625, -0.30914306640625, -0.28127288818359375, -0.2534027099609375, -0.22553253173828125, -0.197662353515625, -0.16979217529296875, -0.1419219970703125, -0.11405181884765625, -0.086181640625, -0.05831146240234375, -0.0304412841796875, -0.00257110595703125, 0.025299072265625, 0.05316925048828125, 0.0810394287109375, 0.10890960693359375, 0.13677978515625, 0.16464996337890625, 0.1925201416015625, 0.22039031982421875, 0.248260498046875, 0.27613067626953125, 0.3040008544921875, 0.33187103271484375, 0.3597412109375, 0.38761138916015625, 0.4154815673828125, 0.44335174560546875, 0.471221923828125, 0.49909210205078125, 0.5269622802734375, 0.5548324584960938, 0.58270263671875, 0.6105728149414062, 0.6384429931640625, 0.6663131713867188, 0.694183349609375, 0.7220535278320312, 0.7499237060546875, 0.7777938842773438, 0.8056640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 9.0, 18.0, 33.0, 68.0, 173.0, 271.0, 224.0, 95.0, 54.0, 26.0, 19.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.96748352050781, -49.71733093261719, -48.4671745300293, -47.21702194213867, -45.96686553955078, -44.716712951660156, -43.466556549072266, -42.21640396118164, -40.96624755859375, -39.716094970703125, -38.465938568115234, -37.21578598022461, -35.96562957763672, -34.715476989746094, -33.4653205871582, -32.21516799926758, -30.965015411376953, -29.714860916137695, -28.464706420898438, -27.21455192565918, -25.964397430419922, -24.714244842529297, -23.46409034729004, -22.21393585205078, -20.963781356811523, -19.713626861572266, -18.463472366333008, -17.21331787109375, -15.963164329528809, -14.71300983428955, -13.46285629272461, -12.212701797485352, -10.96255111694336, -9.712396621704102, -8.462242126464844, -7.212088584899902, -5.9619340896606445, -4.711779594421387, -3.461625576019287, -2.2114715576171875, -0.9613170623779297, 0.288837194442749, 1.5389914512634277, 2.7891457080841064, 4.039299964904785, 5.289454460144043, 6.539608478546143, 7.789762496948242, 9.0399169921875, 10.290071487426758, 11.540225982666016, 12.790379524230957, 14.040534019470215, 15.290688514709473, 16.540842056274414, 17.790996551513672, 19.04115104675293, 20.291305541992188, 21.541460037231445, 22.791614532470703, 24.041767120361328, 25.29192352294922, 26.542076110839844, 27.7922306060791, 29.04238510131836]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 6.0, 16.0, 13.0, 16.0, 26.0, 24.0, 24.0, 29.0, 23.0, 26.0, 26.0, 37.0, 33.0, 45.0, 47.0, 49.0, 82.0, 60.0, 58.0, 45.0, 58.0, 23.0, 36.0, 28.0, 20.0, 27.0, 20.0, 11.0, 13.0, 16.0, 11.0, 8.0, 9.0, 7.0, 5.0, 8.0, 3.0, 4.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.763154983520508, -20.16584587097168, -19.56853675842285, -18.971227645874023, -18.373918533325195, -17.776609420776367, -17.17930030822754, -16.581989288330078, -15.984681129455566, -15.387372016906738, -14.79006290435791, -14.192753791809082, -13.595443725585938, -12.99813461303711, -12.400825500488281, -11.803516387939453, -11.206207275390625, -10.608898162841797, -10.011589050292969, -9.41427993774414, -8.816970825195312, -8.219661712646484, -7.62235164642334, -7.025042533874512, -6.427733421325684, -5.8304243087768555, -5.233115196228027, -4.635805606842041, -4.038496494293213, -3.4411873817443848, -2.8438780307769775, -2.2465686798095703, -1.6492595672607422, -1.0519503355026245, -0.45464110374450684, 0.14266812801361084, 0.7399773597717285, 1.3372864723205566, 1.9345958232879639, 2.531905174255371, 3.129214286804199, 3.7265233993530273, 4.3238325119018555, 4.921142101287842, 5.51845121383667, 6.115760326385498, 6.713069915771484, 7.3103790283203125, 7.907688140869141, 8.504997253417969, 9.102306365966797, 9.699615478515625, 10.296924591064453, 10.894233703613281, 11.491543769836426, 12.088852882385254, 12.686161994934082, 13.28347110748291, 13.880780220031738, 14.478089332580566, 15.075399398803711, 15.672708511352539, 16.270017623901367, 16.867326736450195, 17.464635848999023]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 12.0, 13.0, 24.0, 40.0, 61.0, 85.0, 166.0, 321.0, 541.0, 1072.0, 2146.0, 5188.0, 15636.0, 85999.0, 2478427.0, 1520464.0, 63049.0, 12769.0, 4425.0, 1860.0, 883.0, 460.0, 237.0, 148.0, 96.0, 53.0, 27.0, 13.0, 18.0, 11.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9404296875, -1.8519439697265625, -1.763458251953125, -1.6749725341796875, -1.58648681640625, -1.4980010986328125, -1.409515380859375, -1.3210296630859375, -1.2325439453125, -1.1440582275390625, -1.055572509765625, -0.9670867919921875, -0.87860107421875, -0.7901153564453125, -0.701629638671875, -0.6131439208984375, -0.524658203125, -0.4361724853515625, -0.347686767578125, -0.2592010498046875, -0.17071533203125, -0.0822296142578125, 0.006256103515625, 0.0947418212890625, 0.1832275390625, 0.2717132568359375, 0.360198974609375, 0.4486846923828125, 0.53717041015625, 0.6256561279296875, 0.714141845703125, 0.8026275634765625, 0.89111328125, 0.9795989990234375, 1.068084716796875, 1.1565704345703125, 1.24505615234375, 1.3335418701171875, 1.422027587890625, 1.5105133056640625, 1.5989990234375, 1.6874847412109375, 1.775970458984375, 1.8644561767578125, 1.95294189453125, 2.0414276123046875, 2.129913330078125, 2.2183990478515625, 2.306884765625, 2.3953704833984375, 2.483856201171875, 2.5723419189453125, 2.66082763671875, 2.7493133544921875, 2.837799072265625, 2.9262847900390625, 3.0147705078125, 3.1032562255859375, 3.191741943359375, 3.2802276611328125, 3.36871337890625, 3.4571990966796875, 3.545684814453125, 3.6341705322265625, 3.72265625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 6.0, 8.0, 12.0, 11.0, 13.0, 12.0, 16.0, 26.0, 18.0, 19.0, 29.0, 39.0, 31.0, 43.0, 56.0, 44.0, 43.0, 42.0, 55.0, 44.0, 35.0, 51.0, 37.0, 28.0, 43.0, 38.0, 17.0, 29.0, 20.0, 31.0, 23.0, 12.0, 17.0, 7.0, 11.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.961395263671875, -0.92962646484375, -0.897857666015625, -0.8660888671875, -0.834320068359375, -0.80255126953125, -0.770782470703125, -0.739013671875, -0.707244873046875, -0.67547607421875, -0.643707275390625, -0.6119384765625, -0.580169677734375, -0.54840087890625, -0.516632080078125, -0.48486328125, -0.453094482421875, -0.42132568359375, -0.389556884765625, -0.3577880859375, -0.326019287109375, -0.29425048828125, -0.262481689453125, -0.230712890625, -0.198944091796875, -0.16717529296875, -0.135406494140625, -0.1036376953125, -0.071868896484375, -0.04010009765625, -0.008331298828125, 0.0234375, 0.055206298828125, 0.08697509765625, 0.118743896484375, 0.1505126953125, 0.182281494140625, 0.21405029296875, 0.245819091796875, 0.277587890625, 0.309356689453125, 0.34112548828125, 0.372894287109375, 0.4046630859375, 0.436431884765625, 0.46820068359375, 0.499969482421875, 0.53173828125, 0.563507080078125, 0.59527587890625, 0.627044677734375, 0.6588134765625, 0.690582275390625, 0.72235107421875, 0.754119873046875, 0.785888671875, 0.817657470703125, 0.84942626953125, 0.881195068359375, 0.9129638671875, 0.944732666015625, 0.97650146484375, 1.008270263671875, 1.0400390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 9.0, 14.0, 20.0, 23.0, 53.0, 76.0, 181.0, 339.0, 855.0, 2012.0, 6042.0, 27351.0, 358254.0, 3684471.0, 93021.0, 14600.0, 4167.0, 1469.0, 601.0, 276.0, 166.0, 84.0, 69.0, 32.0, 22.0, 14.0, 8.0, 15.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.40606689453125, -4.2652587890625, -4.12445068359375, -3.983642578125, -3.84283447265625, -3.7020263671875, -3.56121826171875, -3.42041015625, -3.27960205078125, -3.1387939453125, -2.99798583984375, -2.857177734375, -2.71636962890625, -2.5755615234375, -2.43475341796875, -2.2939453125, -2.15313720703125, -2.0123291015625, -1.87152099609375, -1.730712890625, -1.58990478515625, -1.4490966796875, -1.30828857421875, -1.16748046875, -1.02667236328125, -0.8858642578125, -0.74505615234375, -0.604248046875, -0.46343994140625, -0.3226318359375, -0.18182373046875, -0.041015625, 0.09979248046875, 0.2406005859375, 0.38140869140625, 0.522216796875, 0.66302490234375, 0.8038330078125, 0.94464111328125, 1.08544921875, 1.22625732421875, 1.3670654296875, 1.50787353515625, 1.648681640625, 1.78948974609375, 1.9302978515625, 2.07110595703125, 2.2119140625, 2.35272216796875, 2.4935302734375, 2.63433837890625, 2.775146484375, 2.91595458984375, 3.0567626953125, 3.19757080078125, 3.33837890625, 3.47918701171875, 3.6199951171875, 3.76080322265625, 3.901611328125, 4.04241943359375, 4.1832275390625, 4.32403564453125, 4.46484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 12.0, 14.0, 17.0, 25.0, 41.0, 57.0, 86.0, 167.0, 424.0, 1121.0, 1109.0, 475.0, 203.0, 104.0, 76.0, 39.0, 22.0, 11.0, 12.0, 14.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.286895751953125, -3.14996337890625, -3.013031005859375, -2.8760986328125, -2.739166259765625, -2.60223388671875, -2.465301513671875, -2.328369140625, -2.191436767578125, -2.05450439453125, -1.917572021484375, -1.7806396484375, -1.643707275390625, -1.50677490234375, -1.369842529296875, -1.23291015625, -1.095977783203125, -0.95904541015625, -0.822113037109375, -0.6851806640625, -0.548248291015625, -0.41131591796875, -0.274383544921875, -0.137451171875, -0.000518798828125, 0.13641357421875, 0.273345947265625, 0.4102783203125, 0.547210693359375, 0.68414306640625, 0.821075439453125, 0.9580078125, 1.094940185546875, 1.23187255859375, 1.368804931640625, 1.5057373046875, 1.642669677734375, 1.77960205078125, 1.916534423828125, 2.053466796875, 2.190399169921875, 2.32733154296875, 2.464263916015625, 2.6011962890625, 2.738128662109375, 2.87506103515625, 3.011993408203125, 3.14892578125, 3.285858154296875, 3.42279052734375, 3.559722900390625, 3.6966552734375, 3.833587646484375, 3.97052001953125, 4.107452392578125, 4.244384765625, 4.381317138671875, 4.51824951171875, 4.655181884765625, 4.7921142578125, 4.929046630859375, 5.06597900390625, 5.202911376953125, 5.33984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 35.0, 151.0, 514.0, 223.0, 44.0, 18.0, 9.0, 1.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.74943542480469, -42.21086502075195, -39.672298431396484, -37.13372802734375, -34.59516143798828, -32.05659103393555, -29.518020629882812, -26.97945213317871, -24.44088363647461, -21.902315139770508, -19.363746643066406, -16.825176239013672, -14.28660774230957, -11.748039245605469, -9.20946979522705, -6.670900344848633, -4.132331848144531, -1.5937628746032715, 0.9448060989379883, 3.483375072479248, 6.021944046020508, 8.56051254272461, 11.099081993103027, 13.637651443481445, 16.176219940185547, 18.71478843688965, 21.25335693359375, 23.791927337646484, 26.330495834350586, 28.869064331054688, 31.407634735107422, 33.946205139160156, 36.484771728515625, 39.02334213256836, 41.56190872192383, 44.10047912597656, 46.63904571533203, 49.177616119384766, 51.7161865234375, 54.25475311279297, 56.7933235168457, 59.33189392089844, 61.870460510253906, 64.40902709960938, 66.94760131835938, 69.48616790771484, 72.02473449707031, 74.56330871582031, 77.10187530517578, 79.64044189453125, 82.17901611328125, 84.71758270263672, 87.25614929199219, 89.79472351074219, 92.33329010009766, 94.87185668945312, 97.41043090820312, 99.9489974975586, 102.4875717163086, 105.02613830566406, 107.56470489501953, 110.103271484375, 112.641845703125, 115.18041229248047, 117.71897888183594]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 9.0, 14.0, 11.0, 14.0, 21.0, 20.0, 35.0, 30.0, 46.0, 45.0, 59.0, 49.0, 69.0, 52.0, 65.0, 72.0, 62.0, 47.0, 38.0, 39.0, 42.0, 41.0, 32.0, 22.0, 14.0, 19.0, 12.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.11739158630371, -22.506160736083984, -21.894927978515625, -21.2836971282959, -20.672466278076172, -20.061233520507812, -19.450002670288086, -18.83877182006836, -18.2275390625, -17.616308212280273, -17.005075454711914, -16.393844604492188, -15.782612800598145, -15.171380996704102, -14.560150146484375, -13.948918342590332, -13.337687492370605, -12.726455688476562, -12.115224838256836, -11.503993034362793, -10.89276123046875, -10.281530380249023, -9.67029857635498, -9.059066772460938, -8.447835922241211, -7.836604595184326, -7.225372791290283, -6.614141464233398, -6.0029096603393555, -5.391678333282471, -4.780447006225586, -4.169215202331543, -3.5579833984375, -2.946751832962036, -2.3355202674865723, -1.7242889404296875, -1.1130573749542236, -0.5018258094787598, 0.109405517578125, 0.720637321472168, 1.3318686485290527, 1.9431002140045166, 2.5543317794799805, 3.1655631065368652, 3.776794672012329, 4.388026237487793, 4.999257564544678, 5.610489368438721, 6.2217206954956055, 6.83295202255249, 7.444183826446533, 8.055415153503418, 8.666646957397461, 9.277877807617188, 9.88910961151123, 10.500341415405273, 11.111572265625, 11.722804069519043, 12.33403491973877, 12.945266723632812, 13.556498527526855, 14.167730331420898, 14.778961181640625, 15.390192985534668, 16.00142478942871]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 10.0, 11.0, 13.0, 41.0, 87.0, 197.0, 449.0, 1293.0, 4709.0, 28993.0, 565326.0, 419110.0, 22450.0, 3976.0, 1162.0, 399.0, 177.0, 75.0, 34.0, 23.0, 11.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6484375, -5.49554443359375, -5.3426513671875, -5.18975830078125, -5.036865234375, -4.88397216796875, -4.7310791015625, -4.57818603515625, -4.42529296875, -4.27239990234375, -4.1195068359375, -3.96661376953125, -3.813720703125, -3.66082763671875, -3.5079345703125, -3.35504150390625, -3.2021484375, -3.04925537109375, -2.8963623046875, -2.74346923828125, -2.590576171875, -2.43768310546875, -2.2847900390625, -2.13189697265625, -1.97900390625, -1.82611083984375, -1.6732177734375, -1.52032470703125, -1.367431640625, -1.21453857421875, -1.0616455078125, -0.90875244140625, -0.755859375, -0.60296630859375, -0.4500732421875, -0.29718017578125, -0.144287109375, 0.00860595703125, 0.1614990234375, 0.31439208984375, 0.46728515625, 0.62017822265625, 0.7730712890625, 0.92596435546875, 1.078857421875, 1.23175048828125, 1.3846435546875, 1.53753662109375, 1.6904296875, 1.84332275390625, 1.9962158203125, 2.14910888671875, 2.302001953125, 2.45489501953125, 2.6077880859375, 2.76068115234375, 2.91357421875, 3.06646728515625, 3.2193603515625, 3.37225341796875, 3.525146484375, 3.67803955078125, 3.8309326171875, 3.98382568359375, 4.13671875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 8.0, 6.0, 8.0, 3.0, 8.0, 16.0, 20.0, 21.0, 17.0, 23.0, 35.0, 30.0, 33.0, 39.0, 47.0, 33.0, 55.0, 39.0, 45.0, 51.0, 46.0, 47.0, 36.0, 39.0, 46.0, 39.0, 30.0, 27.0, 32.0, 24.0, 17.0, 17.0, 12.0, 19.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1134490966796875, -1.077484130859375, -1.0415191650390625, -1.00555419921875, -0.9695892333984375, -0.933624267578125, -0.8976593017578125, -0.8616943359375, -0.8257293701171875, -0.789764404296875, -0.7537994384765625, -0.71783447265625, -0.6818695068359375, -0.645904541015625, -0.6099395751953125, -0.573974609375, -0.5380096435546875, -0.502044677734375, -0.4660797119140625, -0.43011474609375, -0.3941497802734375, -0.358184814453125, -0.3222198486328125, -0.2862548828125, -0.2502899169921875, -0.214324951171875, -0.1783599853515625, -0.14239501953125, -0.1064300537109375, -0.070465087890625, -0.0345001220703125, 0.00146484375, 0.0374298095703125, 0.073394775390625, 0.1093597412109375, 0.14532470703125, 0.1812896728515625, 0.217254638671875, 0.2532196044921875, 0.2891845703125, 0.3251495361328125, 0.361114501953125, 0.3970794677734375, 0.43304443359375, 0.4690093994140625, 0.504974365234375, 0.5409393310546875, 0.576904296875, 0.6128692626953125, 0.648834228515625, 0.6847991943359375, 0.72076416015625, 0.7567291259765625, 0.792694091796875, 0.8286590576171875, 0.8646240234375, 0.9005889892578125, 0.936553955078125, 0.9725189208984375, 1.00848388671875, 1.0444488525390625, 1.080413818359375, 1.1163787841796875, 1.15234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 8.0, 21.0, 21.0, 62.0, 83.0, 119.0, 255.0, 644.0, 1581.0, 4969.0, 32037.0, 810474.0, 182065.0, 11530.0, 2718.0, 1003.0, 429.0, 233.0, 99.0, 68.0, 37.0, 34.0, 19.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.53619384765625, -4.3887939453125, -4.24139404296875, -4.093994140625, -3.94659423828125, -3.7991943359375, -3.65179443359375, -3.50439453125, -3.35699462890625, -3.2095947265625, -3.06219482421875, -2.914794921875, -2.76739501953125, -2.6199951171875, -2.47259521484375, -2.3251953125, -2.17779541015625, -2.0303955078125, -1.88299560546875, -1.735595703125, -1.58819580078125, -1.4407958984375, -1.29339599609375, -1.14599609375, -0.99859619140625, -0.8511962890625, -0.70379638671875, -0.556396484375, -0.40899658203125, -0.2615966796875, -0.11419677734375, 0.033203125, 0.18060302734375, 0.3280029296875, 0.47540283203125, 0.622802734375, 0.77020263671875, 0.9176025390625, 1.06500244140625, 1.21240234375, 1.35980224609375, 1.5072021484375, 1.65460205078125, 1.802001953125, 1.94940185546875, 2.0968017578125, 2.24420166015625, 2.3916015625, 2.53900146484375, 2.6864013671875, 2.83380126953125, 2.981201171875, 3.12860107421875, 3.2760009765625, 3.42340087890625, 3.57080078125, 3.71820068359375, 3.8656005859375, 4.01300048828125, 4.160400390625, 4.30780029296875, 4.4552001953125, 4.60260009765625, 4.75]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 11.0, 18.0, 11.0, 23.0, 27.0, 29.0, 31.0, 32.0, 31.0, 45.0, 58.0, 61.0, 44.0, 55.0, 72.0, 59.0, 66.0, 47.0, 45.0, 29.0, 29.0, 35.0, 31.0, 22.0, 14.0, 19.0, 12.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.09765625, -4.9515380859375, -4.805419921875, -4.6593017578125, -4.51318359375, -4.3670654296875, -4.220947265625, -4.0748291015625, -3.9287109375, -3.7825927734375, -3.636474609375, -3.4903564453125, -3.34423828125, -3.1981201171875, -3.052001953125, -2.9058837890625, -2.759765625, -2.6136474609375, -2.467529296875, -2.3214111328125, -2.17529296875, -2.0291748046875, -1.883056640625, -1.7369384765625, -1.5908203125, -1.4447021484375, -1.298583984375, -1.1524658203125, -1.00634765625, -0.8602294921875, -0.714111328125, -0.5679931640625, -0.421875, -0.2757568359375, -0.129638671875, 0.0164794921875, 0.16259765625, 0.3087158203125, 0.454833984375, 0.6009521484375, 0.7470703125, 0.8931884765625, 1.039306640625, 1.1854248046875, 1.33154296875, 1.4776611328125, 1.623779296875, 1.7698974609375, 1.916015625, 2.0621337890625, 2.208251953125, 2.3543701171875, 2.50048828125, 2.6466064453125, 2.792724609375, 2.9388427734375, 3.0849609375, 3.2310791015625, 3.377197265625, 3.5233154296875, 3.66943359375, 3.8155517578125, 3.961669921875, 4.1077880859375, 4.25390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 11.0, 13.0, 15.0, 34.0, 49.0, 69.0, 128.0, 253.0, 508.0, 1409.0, 4049.0, 16482.0, 121568.0, 803805.0, 81680.0, 12896.0, 3316.0, 1214.0, 478.0, 240.0, 117.0, 79.0, 42.0, 23.0, 19.0, 9.0, 10.0, 8.0, 4.0, 0.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4150390625, -1.3726959228515625, -1.330352783203125, -1.2880096435546875, -1.24566650390625, -1.2033233642578125, -1.160980224609375, -1.1186370849609375, -1.0762939453125, -1.0339508056640625, -0.991607666015625, -0.9492645263671875, -0.90692138671875, -0.8645782470703125, -0.822235107421875, -0.7798919677734375, -0.737548828125, -0.6952056884765625, -0.652862548828125, -0.6105194091796875, -0.56817626953125, -0.5258331298828125, -0.483489990234375, -0.4411468505859375, -0.3988037109375, -0.3564605712890625, -0.314117431640625, -0.2717742919921875, -0.22943115234375, -0.1870880126953125, -0.144744873046875, -0.1024017333984375, -0.06005859375, -0.0177154541015625, 0.024627685546875, 0.0669708251953125, 0.10931396484375, 0.1516571044921875, 0.194000244140625, 0.2363433837890625, 0.2786865234375, 0.3210296630859375, 0.363372802734375, 0.4057159423828125, 0.44805908203125, 0.4904022216796875, 0.532745361328125, 0.5750885009765625, 0.617431640625, 0.6597747802734375, 0.702117919921875, 0.7444610595703125, 0.78680419921875, 0.8291473388671875, 0.871490478515625, 0.9138336181640625, 0.9561767578125, 0.9985198974609375, 1.040863037109375, 1.0832061767578125, 1.12554931640625, 1.1678924560546875, 1.210235595703125, 1.2525787353515625, 1.294921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 7.0, 17.0, 11.0, 20.0, 25.0, 55.0, 84.0, 115.0, 175.0, 134.0, 93.0, 68.0, 57.0, 36.0, 16.0, 17.0, 11.0, 14.0, 8.0, 4.0, 3.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002416372299194336, -0.00023382343351840973, -0.00022600963711738586, -0.000218195840716362, -0.00021038204431533813, -0.00020256824791431427, -0.0001947544515132904, -0.00018694065511226654, -0.00017912685871124268, -0.0001713130623102188, -0.00016349926590919495, -0.00015568546950817108, -0.00014787167310714722, -0.00014005787670612335, -0.0001322440803050995, -0.00012443028390407562, -0.00011661648750305176, -0.00010880269110202789, -0.00010098889470100403, -9.317509829998016e-05, -8.53613018989563e-05, -7.754750549793243e-05, -6.973370909690857e-05, -6.19199126958847e-05, -5.410611629486084e-05, -4.6292319893836975e-05, -3.847852349281311e-05, -3.0664727091789246e-05, -2.285093069076538e-05, -1.5037134289741516e-05, -7.223337888717651e-06, 5.904585123062134e-07, 8.404254913330078e-06, 1.6218051314353943e-05, 2.4031847715377808e-05, 3.184564411640167e-05, 3.965944051742554e-05, 4.74732369184494e-05, 5.5287033319473267e-05, 6.310082972049713e-05, 7.0914626121521e-05, 7.872842252254486e-05, 8.654221892356873e-05, 9.435601532459259e-05, 0.00010216981172561646, 0.00010998360812664032, 0.00011779740452766418, 0.00012561120092868805, 0.00013342499732971191, 0.00014123879373073578, 0.00014905259013175964, 0.0001568663865327835, 0.00016468018293380737, 0.00017249397933483124, 0.0001803077757358551, 0.00018812157213687897, 0.00019593536853790283, 0.0002037491649389267, 0.00021156296133995056, 0.00021937675774097443, 0.0002271905541419983, 0.00023500435054302216, 0.00024281814694404602, 0.0002506319433450699, 0.00025844573974609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 8.0, 13.0, 18.0, 33.0, 30.0, 62.0, 154.0, 325.0, 1141.0, 7030.0, 154204.0, 863075.0, 19243.0, 2251.0, 516.0, 216.0, 97.0, 53.0, 27.0, 24.0, 15.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.58984375, -3.508636474609375, -3.42742919921875, -3.346221923828125, -3.2650146484375, -3.183807373046875, -3.10260009765625, -3.021392822265625, -2.940185546875, -2.858978271484375, -2.77777099609375, -2.696563720703125, -2.6153564453125, -2.534149169921875, -2.45294189453125, -2.371734619140625, -2.29052734375, -2.209320068359375, -2.12811279296875, -2.046905517578125, -1.9656982421875, -1.884490966796875, -1.80328369140625, -1.722076416015625, -1.640869140625, -1.559661865234375, -1.47845458984375, -1.397247314453125, -1.3160400390625, -1.234832763671875, -1.15362548828125, -1.072418212890625, -0.9912109375, -0.910003662109375, -0.82879638671875, -0.747589111328125, -0.6663818359375, -0.585174560546875, -0.50396728515625, -0.422760009765625, -0.341552734375, -0.260345458984375, -0.17913818359375, -0.097930908203125, -0.0167236328125, 0.064483642578125, 0.14569091796875, 0.226898193359375, 0.30810546875, 0.389312744140625, 0.47052001953125, 0.551727294921875, 0.6329345703125, 0.714141845703125, 0.79534912109375, 0.876556396484375, 0.957763671875, 1.038970947265625, 1.12017822265625, 1.201385498046875, 1.2825927734375, 1.363800048828125, 1.44500732421875, 1.526214599609375, 1.607421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 6.0, 11.0, 20.0, 33.0, 51.0, 82.0, 127.0, 172.0, 179.0, 121.0, 62.0, 46.0, 35.0, 15.0, 17.0, 7.0, 3.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.62890625, -2.5740814208984375, -2.519256591796875, -2.4644317626953125, -2.40960693359375, -2.3547821044921875, -2.299957275390625, -2.2451324462890625, -2.1903076171875, -2.1354827880859375, -2.080657958984375, -2.0258331298828125, -1.97100830078125, -1.9161834716796875, -1.861358642578125, -1.8065338134765625, -1.751708984375, -1.6968841552734375, -1.642059326171875, -1.5872344970703125, -1.53240966796875, -1.4775848388671875, -1.422760009765625, -1.3679351806640625, -1.3131103515625, -1.2582855224609375, -1.203460693359375, -1.1486358642578125, -1.09381103515625, -1.0389862060546875, -0.984161376953125, -0.9293365478515625, -0.87451171875, -0.8196868896484375, -0.764862060546875, -0.7100372314453125, -0.65521240234375, -0.6003875732421875, -0.545562744140625, -0.4907379150390625, -0.4359130859375, -0.3810882568359375, -0.326263427734375, -0.2714385986328125, -0.21661376953125, -0.1617889404296875, -0.106964111328125, -0.0521392822265625, 0.002685546875, 0.0575103759765625, 0.112335205078125, 0.1671600341796875, 0.22198486328125, 0.2768096923828125, 0.331634521484375, 0.3864593505859375, 0.4412841796875, 0.4961090087890625, 0.550933837890625, 0.6057586669921875, 0.66058349609375, 0.7154083251953125, 0.770233154296875, 0.8250579833984375, 0.8798828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 16.0, 58.0, 199.0, 450.0, 187.0, 56.0, 13.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.20783615112305, -45.74612045288086, -44.284400939941406, -42.82268524169922, -41.36096954345703, -39.899253845214844, -38.43753433227539, -36.9758186340332, -35.51409912109375, -34.05238342285156, -32.59066390991211, -31.128948211669922, -29.667232513427734, -28.205514907836914, -26.743797302246094, -25.282081604003906, -23.82036590576172, -22.3586483001709, -20.89693260192871, -19.43521499633789, -17.973499298095703, -16.511781692504883, -15.050064086914062, -13.588347434997559, -12.126630783081055, -10.66491413116455, -9.203197479248047, -7.741479873657227, -6.279763221740723, -4.818046569824219, -3.3563289642333984, -1.8946123123168945, -0.43289947509765625, 1.0288174152374268, 2.4905343055725098, 3.952251434326172, 5.413968086242676, 6.87568473815918, 8.33740234375, 9.799118995666504, 11.260835647583008, 12.722552299499512, 14.184268951416016, 15.645986557006836, 17.107704162597656, 18.569419860839844, 20.031137466430664, 21.492855072021484, 22.954570770263672, 24.416288375854492, 25.87800407409668, 27.3397216796875, 28.801437377929688, 30.263154983520508, 31.724872589111328, 33.186588287353516, 34.64830780029297, 36.110023498535156, 37.57174301147461, 39.0334587097168, 40.495174407958984, 41.95689392089844, 43.418609619140625, 44.88032531738281, 46.342041015625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 7.0, 4.0, 8.0, 4.0, 13.0, 8.0, 13.0, 13.0, 24.0, 12.0, 24.0, 28.0, 25.0, 39.0, 40.0, 31.0, 49.0, 71.0, 80.0, 72.0, 68.0, 40.0, 37.0, 40.0, 34.0, 33.0, 35.0, 25.0, 23.0, 17.0, 14.0, 12.0, 10.0, 17.0, 7.0, 10.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.893497467041016, -16.367094039916992, -15.840689659118652, -15.314285278320312, -14.787881851196289, -14.261478424072266, -13.735074043273926, -13.208669662475586, -12.682266235351562, -12.155862808227539, -11.6294584274292, -11.10305404663086, -10.576650619506836, -10.050247192382812, -9.523842811584473, -8.997438430786133, -8.47103500366211, -7.944631099700928, -7.418227195739746, -6.8918232917785645, -6.365419387817383, -5.839015483856201, -5.3126115798950195, -4.786207675933838, -4.259803771972656, -3.7333998680114746, -3.206995964050293, -2.6805920600891113, -2.1541881561279297, -1.627784252166748, -1.1013803482055664, -0.5749764442443848, -0.04857063293457031, 0.47783327102661133, 1.004237174987793, 1.5306410789489746, 2.0570449829101562, 2.583448886871338, 3.1098527908325195, 3.636256694793701, 4.162660598754883, 4.6890645027160645, 5.215468406677246, 5.741872310638428, 6.268276214599609, 6.794680118560791, 7.321084022521973, 7.847487926483154, 8.373891830444336, 8.90029525756836, 9.4266996383667, 9.953104019165039, 10.479507446289062, 11.005910873413086, 11.532315254211426, 12.058719635009766, 12.585123062133789, 13.111526489257812, 13.637930870056152, 14.164335250854492, 14.690738677978516, 15.217142105102539, 15.743546485900879, 16.26995086669922, 16.796354293823242]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 20.0, 25.0, 37.0, 47.0, 93.0, 196.0, 396.0, 703.0, 1459.0, 3392.0, 8963.0, 34127.0, 592054.0, 3359763.0, 163403.0, 19266.0, 6012.0, 2287.0, 1025.0, 439.0, 258.0, 126.0, 68.0, 43.0, 17.0, 12.0, 17.0, 5.0, 4.0, 4.0, 6.0, 1.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.861328125, -1.77398681640625, -1.6866455078125, -1.59930419921875, -1.511962890625, -1.42462158203125, -1.3372802734375, -1.24993896484375, -1.16259765625, -1.07525634765625, -0.9879150390625, -0.90057373046875, -0.813232421875, -0.72589111328125, -0.6385498046875, -0.55120849609375, -0.4638671875, -0.37652587890625, -0.2891845703125, -0.20184326171875, -0.114501953125, -0.02716064453125, 0.0601806640625, 0.14752197265625, 0.23486328125, 0.32220458984375, 0.4095458984375, 0.49688720703125, 0.584228515625, 0.67156982421875, 0.7589111328125, 0.84625244140625, 0.93359375, 1.02093505859375, 1.1082763671875, 1.19561767578125, 1.282958984375, 1.37030029296875, 1.4576416015625, 1.54498291015625, 1.63232421875, 1.71966552734375, 1.8070068359375, 1.89434814453125, 1.981689453125, 2.06903076171875, 2.1563720703125, 2.24371337890625, 2.3310546875, 2.41839599609375, 2.5057373046875, 2.59307861328125, 2.680419921875, 2.76776123046875, 2.8551025390625, 2.94244384765625, 3.02978515625, 3.11712646484375, 3.2044677734375, 3.29180908203125, 3.379150390625, 3.46649169921875, 3.5538330078125, 3.64117431640625, 3.728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 8.0, 8.0, 8.0, 17.0, 17.0, 19.0, 31.0, 34.0, 42.0, 40.0, 45.0, 39.0, 49.0, 40.0, 66.0, 58.0, 53.0, 64.0, 39.0, 44.0, 47.0, 40.0, 31.0, 30.0, 26.0, 23.0, 24.0, 11.0, 8.0, 6.0, 3.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.28436279296875, -1.2454833984375, -1.20660400390625, -1.167724609375, -1.12884521484375, -1.0899658203125, -1.05108642578125, -1.01220703125, -0.97332763671875, -0.9344482421875, -0.89556884765625, -0.856689453125, -0.81781005859375, -0.7789306640625, -0.74005126953125, -0.701171875, -0.66229248046875, -0.6234130859375, -0.58453369140625, -0.545654296875, -0.50677490234375, -0.4678955078125, -0.42901611328125, -0.39013671875, -0.35125732421875, -0.3123779296875, -0.27349853515625, -0.234619140625, -0.19573974609375, -0.1568603515625, -0.11798095703125, -0.0791015625, -0.04022216796875, -0.0013427734375, 0.03753662109375, 0.076416015625, 0.11529541015625, 0.1541748046875, 0.19305419921875, 0.23193359375, 0.27081298828125, 0.3096923828125, 0.34857177734375, 0.387451171875, 0.42633056640625, 0.4652099609375, 0.50408935546875, 0.54296875, 0.58184814453125, 0.6207275390625, 0.65960693359375, 0.698486328125, 0.73736572265625, 0.7762451171875, 0.81512451171875, 0.85400390625, 0.89288330078125, 0.9317626953125, 0.97064208984375, 1.009521484375, 1.04840087890625, 1.0872802734375, 1.12615966796875, 1.1650390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 10.0, 16.0, 18.0, 35.0, 64.0, 140.0, 334.0, 999.0, 4292.0, 36849.0, 3898586.0, 239283.0, 10809.0, 1885.0, 535.0, 209.0, 99.0, 38.0, 22.0, 18.0, 14.0, 4.0, 9.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -4.9747314453125, -4.773681640625, -4.5726318359375, -4.37158203125, -4.1705322265625, -3.969482421875, -3.7684326171875, -3.5673828125, -3.3663330078125, -3.165283203125, -2.9642333984375, -2.76318359375, -2.5621337890625, -2.361083984375, -2.1600341796875, -1.958984375, -1.7579345703125, -1.556884765625, -1.3558349609375, -1.15478515625, -0.9537353515625, -0.752685546875, -0.5516357421875, -0.3505859375, -0.1495361328125, 0.051513671875, 0.2525634765625, 0.45361328125, 0.6546630859375, 0.855712890625, 1.0567626953125, 1.2578125, 1.4588623046875, 1.659912109375, 1.8609619140625, 2.06201171875, 2.2630615234375, 2.464111328125, 2.6651611328125, 2.8662109375, 3.0672607421875, 3.268310546875, 3.4693603515625, 3.67041015625, 3.8714599609375, 4.072509765625, 4.2735595703125, 4.474609375, 4.6756591796875, 4.876708984375, 5.0777587890625, 5.27880859375, 5.4798583984375, 5.680908203125, 5.8819580078125, 6.0830078125, 6.2840576171875, 6.485107421875, 6.6861572265625, 6.88720703125, 7.0882568359375, 7.289306640625, 7.4903564453125, 7.69140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 9.0, 13.0, 20.0, 19.0, 40.0, 67.0, 144.0, 261.0, 810.0, 1552.0, 656.0, 227.0, 90.0, 54.0, 33.0, 20.0, 9.0, 14.0, 6.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6875, -5.539306640625, -5.39111328125, -5.242919921875, -5.0947265625, -4.946533203125, -4.79833984375, -4.650146484375, -4.501953125, -4.353759765625, -4.20556640625, -4.057373046875, -3.9091796875, -3.760986328125, -3.61279296875, -3.464599609375, -3.31640625, -3.168212890625, -3.02001953125, -2.871826171875, -2.7236328125, -2.575439453125, -2.42724609375, -2.279052734375, -2.130859375, -1.982666015625, -1.83447265625, -1.686279296875, -1.5380859375, -1.389892578125, -1.24169921875, -1.093505859375, -0.9453125, -0.797119140625, -0.64892578125, -0.500732421875, -0.3525390625, -0.204345703125, -0.05615234375, 0.092041015625, 0.240234375, 0.388427734375, 0.53662109375, 0.684814453125, 0.8330078125, 0.981201171875, 1.12939453125, 1.277587890625, 1.42578125, 1.573974609375, 1.72216796875, 1.870361328125, 2.0185546875, 2.166748046875, 2.31494140625, 2.463134765625, 2.611328125, 2.759521484375, 2.90771484375, 3.055908203125, 3.2041015625, 3.352294921875, 3.50048828125, 3.648681640625, 3.796875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 17.0, 28.0, 57.0, 127.0, 194.0, 242.0, 177.0, 76.0, 25.0, 22.0, 9.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.468975067138672, -18.553943634033203, -17.638912200927734, -16.723880767822266, -15.808849334716797, -14.893817901611328, -13.97878646850586, -13.06375503540039, -12.148723602294922, -11.233692169189453, -10.318660736083984, -9.403629302978516, -8.488597869873047, -7.573566913604736, -6.658535480499268, -5.743504047393799, -4.828473091125488, -3.9134416580200195, -2.998410224914551, -2.083379030227661, -1.1683475971221924, -0.25331640243530273, 0.661715030670166, 1.5767464637756348, 2.4917778968811035, 3.4068093299865723, 4.321840763092041, 5.236871719360352, 6.15190315246582, 7.066934585571289, 7.981966018676758, 8.896997451782227, 9.812028884887695, 10.727060317993164, 11.642091751098633, 12.557123184204102, 13.47215461730957, 14.387186050415039, 15.302217483520508, 16.217248916625977, 17.132280349731445, 18.047311782836914, 18.962343215942383, 19.87737464904785, 20.79240608215332, 21.70743751525879, 22.622468948364258, 23.537500381469727, 24.452529907226562, 25.36756134033203, 26.2825927734375, 27.19762420654297, 28.112655639648438, 29.027687072753906, 29.942718505859375, 30.857749938964844, 31.772781372070312, 32.68781280517578, 33.60284423828125, 34.51787567138672, 35.43290710449219, 36.347938537597656, 37.262969970703125, 38.178001403808594, 39.09303283691406]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 9.0, 9.0, 16.0, 13.0, 10.0, 22.0, 18.0, 25.0, 14.0, 27.0, 33.0, 34.0, 41.0, 50.0, 49.0, 62.0, 62.0, 58.0, 39.0, 51.0, 45.0, 44.0, 42.0, 33.0, 31.0, 27.0, 23.0, 21.0, 13.0, 16.0, 11.0, 11.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.822197914123535, -11.449347496032715, -11.076498031616211, -10.70364761352539, -10.33079719543457, -9.95794677734375, -9.585097312927246, -9.212246894836426, -8.839397430419922, -8.466547012329102, -8.093697547912598, -7.720847129821777, -7.347996711730957, -6.975146770477295, -6.602296829223633, -6.2294464111328125, -5.856595993041992, -5.48374605178833, -5.11089563369751, -4.738045692443848, -4.365195274353027, -3.9923453330993652, -3.619495391845703, -3.246645212173462, -2.8737950325012207, -2.5009448528289795, -2.1280946731567383, -1.7552447319030762, -1.382394552230835, -1.0095443725585938, -0.6366944313049316, -0.26384425163269043, 0.10900592803955078, 0.4818560481071472, 0.8547061681747437, 1.2275562286376953, 1.6004064083099365, 1.9732565879821777, 2.34610652923584, 2.718956708908081, 3.0918068885803223, 3.4646570682525635, 3.8375072479248047, 4.210357189178467, 4.583207130432129, 4.956057548522949, 5.328907489776611, 5.701757431030273, 6.074607849121094, 6.447457790374756, 6.820308208465576, 7.193158149719238, 7.566008567810059, 7.938858509063721, 8.311708450317383, 8.684558868408203, 9.057409286499023, 9.430259704589844, 9.803109169006348, 10.175959587097168, 10.548810005187988, 10.921659469604492, 11.294509887695312, 11.667360305786133, 12.040209770202637]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 15.0, 18.0, 37.0, 84.0, 151.0, 339.0, 789.0, 2276.0, 8244.0, 40137.0, 357585.0, 561924.0, 61120.0, 11111.0, 2983.0, 971.0, 401.0, 191.0, 90.0, 47.0, 23.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646484375, -3.5482177734375, -3.449951171875, -3.3516845703125, -3.25341796875, -3.1551513671875, -3.056884765625, -2.9586181640625, -2.8603515625, -2.7620849609375, -2.663818359375, -2.5655517578125, -2.46728515625, -2.3690185546875, -2.270751953125, -2.1724853515625, -2.07421875, -1.9759521484375, -1.877685546875, -1.7794189453125, -1.68115234375, -1.5828857421875, -1.484619140625, -1.3863525390625, -1.2880859375, -1.1898193359375, -1.091552734375, -0.9932861328125, -0.89501953125, -0.7967529296875, -0.698486328125, -0.6002197265625, -0.501953125, -0.4036865234375, -0.305419921875, -0.2071533203125, -0.10888671875, -0.0106201171875, 0.087646484375, 0.1859130859375, 0.2841796875, 0.3824462890625, 0.480712890625, 0.5789794921875, 0.67724609375, 0.7755126953125, 0.873779296875, 0.9720458984375, 1.0703125, 1.1685791015625, 1.266845703125, 1.3651123046875, 1.46337890625, 1.5616455078125, 1.659912109375, 1.7581787109375, 1.8564453125, 1.9547119140625, 2.052978515625, 2.1512451171875, 2.24951171875, 2.3477783203125, 2.446044921875, 2.5443115234375, 2.642578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 9.0, 11.0, 4.0, 7.0, 11.0, 12.0, 14.0, 17.0, 14.0, 21.0, 25.0, 23.0, 30.0, 37.0, 39.0, 44.0, 58.0, 58.0, 62.0, 54.0, 49.0, 47.0, 52.0, 40.0, 28.0, 26.0, 31.0, 27.0, 25.0, 28.0, 24.0, 15.0, 16.0, 9.0, 10.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.21875, -1.1827392578125, -1.146728515625, -1.1107177734375, -1.07470703125, -1.0386962890625, -1.002685546875, -0.9666748046875, -0.9306640625, -0.8946533203125, -0.858642578125, -0.8226318359375, -0.78662109375, -0.7506103515625, -0.714599609375, -0.6785888671875, -0.642578125, -0.6065673828125, -0.570556640625, -0.5345458984375, -0.49853515625, -0.4625244140625, -0.426513671875, -0.3905029296875, -0.3544921875, -0.3184814453125, -0.282470703125, -0.2464599609375, -0.21044921875, -0.1744384765625, -0.138427734375, -0.1024169921875, -0.06640625, -0.0303955078125, 0.005615234375, 0.0416259765625, 0.07763671875, 0.1136474609375, 0.149658203125, 0.1856689453125, 0.2216796875, 0.2576904296875, 0.293701171875, 0.3297119140625, 0.36572265625, 0.4017333984375, 0.437744140625, 0.4737548828125, 0.509765625, 0.5457763671875, 0.581787109375, 0.6177978515625, 0.65380859375, 0.6898193359375, 0.725830078125, 0.7618408203125, 0.7978515625, 0.8338623046875, 0.869873046875, 0.9058837890625, 0.94189453125, 0.9779052734375, 1.013916015625, 1.0499267578125, 1.0859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 7.0, 13.0, 9.0, 12.0, 15.0, 27.0, 34.0, 40.0, 61.0, 82.0, 129.0, 194.0, 259.0, 552.0, 1185.0, 3150.0, 11765.0, 71325.0, 754962.0, 174097.0, 22230.0, 4980.0, 1683.0, 698.0, 371.0, 207.0, 129.0, 86.0, 66.0, 50.0, 42.0, 20.0, 21.0, 10.0, 15.0, 7.0, 3.0, 10.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.023956298828125, -1.93853759765625, -1.853118896484375, -1.7677001953125, -1.682281494140625, -1.59686279296875, -1.511444091796875, -1.426025390625, -1.340606689453125, -1.25518798828125, -1.169769287109375, -1.0843505859375, -0.998931884765625, -0.91351318359375, -0.828094482421875, -0.74267578125, -0.657257080078125, -0.57183837890625, -0.486419677734375, -0.4010009765625, -0.315582275390625, -0.23016357421875, -0.144744873046875, -0.059326171875, 0.026092529296875, 0.11151123046875, 0.196929931640625, 0.2823486328125, 0.367767333984375, 0.45318603515625, 0.538604736328125, 0.6240234375, 0.709442138671875, 0.79486083984375, 0.880279541015625, 0.9656982421875, 1.051116943359375, 1.13653564453125, 1.221954345703125, 1.307373046875, 1.392791748046875, 1.47821044921875, 1.563629150390625, 1.6490478515625, 1.734466552734375, 1.81988525390625, 1.905303955078125, 1.99072265625, 2.076141357421875, 2.16156005859375, 2.246978759765625, 2.3323974609375, 2.417816162109375, 2.50323486328125, 2.588653564453125, 2.674072265625, 2.759490966796875, 2.84490966796875, 2.930328369140625, 3.0157470703125, 3.101165771484375, 3.18658447265625, 3.272003173828125, 3.357421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 4.0, 15.0, 10.0, 19.0, 21.0, 23.0, 36.0, 40.0, 46.0, 53.0, 65.0, 65.0, 53.0, 63.0, 67.0, 53.0, 57.0, 38.0, 50.0, 49.0, 37.0, 25.0, 16.0, 14.0, 14.0, 17.0, 4.0, 10.0, 11.0, 6.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.1156005859375, -3.961669921875, -3.8077392578125, -3.65380859375, -3.4998779296875, -3.345947265625, -3.1920166015625, -3.0380859375, -2.8841552734375, -2.730224609375, -2.5762939453125, -2.42236328125, -2.2684326171875, -2.114501953125, -1.9605712890625, -1.806640625, -1.6527099609375, -1.498779296875, -1.3448486328125, -1.19091796875, -1.0369873046875, -0.883056640625, -0.7291259765625, -0.5751953125, -0.4212646484375, -0.267333984375, -0.1134033203125, 0.04052734375, 0.1944580078125, 0.348388671875, 0.5023193359375, 0.65625, 0.8101806640625, 0.964111328125, 1.1180419921875, 1.27197265625, 1.4259033203125, 1.579833984375, 1.7337646484375, 1.8876953125, 2.0416259765625, 2.195556640625, 2.3494873046875, 2.50341796875, 2.6573486328125, 2.811279296875, 2.9652099609375, 3.119140625, 3.2730712890625, 3.427001953125, 3.5809326171875, 3.73486328125, 3.8887939453125, 4.042724609375, 4.1966552734375, 4.3505859375, 4.5045166015625, 4.658447265625, 4.8123779296875, 4.96630859375, 5.1202392578125, 5.274169921875, 5.4281005859375, 5.58203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 13.0, 7.0, 18.0, 18.0, 31.0, 60.0, 78.0, 138.0, 285.0, 550.0, 1205.0, 3144.0, 9788.0, 44471.0, 669491.0, 274024.0, 32719.0, 7805.0, 2605.0, 1035.0, 498.0, 224.0, 130.0, 72.0, 46.0, 27.0, 30.0, 10.0, 8.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.01171875, -0.980010986328125, -0.94830322265625, -0.916595458984375, -0.8848876953125, -0.853179931640625, -0.82147216796875, -0.789764404296875, -0.758056640625, -0.726348876953125, -0.69464111328125, -0.662933349609375, -0.6312255859375, -0.599517822265625, -0.56781005859375, -0.536102294921875, -0.50439453125, -0.472686767578125, -0.44097900390625, -0.409271240234375, -0.3775634765625, -0.345855712890625, -0.31414794921875, -0.282440185546875, -0.250732421875, -0.219024658203125, -0.18731689453125, -0.155609130859375, -0.1239013671875, -0.092193603515625, -0.06048583984375, -0.028778076171875, 0.0029296875, 0.034637451171875, 0.06634521484375, 0.098052978515625, 0.1297607421875, 0.161468505859375, 0.19317626953125, 0.224884033203125, 0.256591796875, 0.288299560546875, 0.32000732421875, 0.351715087890625, 0.3834228515625, 0.415130615234375, 0.44683837890625, 0.478546142578125, 0.51025390625, 0.541961669921875, 0.57366943359375, 0.605377197265625, 0.6370849609375, 0.668792724609375, 0.70050048828125, 0.732208251953125, 0.763916015625, 0.795623779296875, 0.82733154296875, 0.859039306640625, 0.8907470703125, 0.922454833984375, 0.95416259765625, 0.985870361328125, 1.017578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 7.0, 18.0, 56.0, 123.0, 238.0, 287.0, 129.0, 49.0, 37.0, 12.0, 4.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004458427429199219, -0.00043195486068725586, -0.00041806697845458984, -0.00040417909622192383, -0.0003902912139892578, -0.0003764033317565918, -0.0003625154495239258, -0.00034862756729125977, -0.00033473968505859375, -0.00032085180282592773, -0.0003069639205932617, -0.0002930760383605957, -0.0002791881561279297, -0.00026530027389526367, -0.00025141239166259766, -0.00023752450942993164, -0.00022363662719726562, -0.0002097487449645996, -0.0001958608627319336, -0.00018197298049926758, -0.00016808509826660156, -0.00015419721603393555, -0.00014030933380126953, -0.00012642145156860352, -0.0001125335693359375, -9.864568710327148e-05, -8.475780487060547e-05, -7.086992263793945e-05, -5.698204040527344e-05, -4.309415817260742e-05, -2.9206275939941406e-05, -1.531839370727539e-05, -1.430511474609375e-06, 1.245737075805664e-05, 2.6345252990722656e-05, 4.023313522338867e-05, 5.412101745605469e-05, 6.80088996887207e-05, 8.189678192138672e-05, 9.578466415405273e-05, 0.00010967254638671875, 0.00012356042861938477, 0.00013744831085205078, 0.0001513361930847168, 0.0001652240753173828, 0.00017911195755004883, 0.00019299983978271484, 0.00020688772201538086, 0.00022077560424804688, 0.0002346634864807129, 0.0002485513687133789, 0.0002624392509460449, 0.00027632713317871094, 0.00029021501541137695, 0.00030410289764404297, 0.000317990779876709, 0.000331878662109375, 0.000345766544342041, 0.00035965442657470703, 0.00037354230880737305, 0.00038743019104003906, 0.0004013180732727051, 0.0004152059555053711, 0.0004290938377380371, 0.0004429817199707031]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 9.0, 17.0, 14.0, 17.0, 24.0, 46.0, 56.0, 92.0, 138.0, 233.0, 417.0, 771.0, 1540.0, 3619.0, 9886.0, 36353.0, 253151.0, 665755.0, 54552.0, 13324.0, 4501.0, 1912.0, 881.0, 468.0, 296.0, 147.0, 102.0, 63.0, 53.0, 28.0, 20.0, 16.0, 10.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.96923828125, -0.9399795532226562, -0.9107208251953125, -0.8814620971679688, -0.852203369140625, -0.8229446411132812, -0.7936859130859375, -0.7644271850585938, -0.73516845703125, -0.7059097290039062, -0.6766510009765625, -0.6473922729492188, -0.618133544921875, -0.5888748168945312, -0.5596160888671875, -0.5303573608398438, -0.5010986328125, -0.47183990478515625, -0.4425811767578125, -0.41332244873046875, -0.384063720703125, -0.35480499267578125, -0.3255462646484375, -0.29628753662109375, -0.26702880859375, -0.23777008056640625, -0.2085113525390625, -0.17925262451171875, -0.149993896484375, -0.12073516845703125, -0.0914764404296875, -0.06221771240234375, -0.032958984375, -0.00370025634765625, 0.0255584716796875, 0.05481719970703125, 0.084075927734375, 0.11333465576171875, 0.1425933837890625, 0.17185211181640625, 0.20111083984375, 0.23036956787109375, 0.2596282958984375, 0.28888702392578125, 0.318145751953125, 0.34740447998046875, 0.3766632080078125, 0.40592193603515625, 0.4351806640625, 0.46443939208984375, 0.4936981201171875, 0.5229568481445312, 0.552215576171875, 0.5814743041992188, 0.6107330322265625, 0.6399917602539062, 0.66925048828125, 0.6985092163085938, 0.7277679443359375, 0.7570266723632812, 0.786285400390625, 0.8155441284179688, 0.8448028564453125, 0.8740615844726562, 0.9033203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 6.0, 12.0, 10.0, 8.0, 12.0, 18.0, 25.0, 31.0, 26.0, 29.0, 65.0, 81.0, 78.0, 110.0, 92.0, 72.0, 66.0, 58.0, 33.0, 33.0, 23.0, 18.0, 14.0, 12.0, 13.0, 4.0, 10.0, 4.0, 5.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.6244888305664062, -0.6020050048828125, -0.5795211791992188, -0.557037353515625, -0.5345535278320312, -0.5120697021484375, -0.48958587646484375, -0.46710205078125, -0.44461822509765625, -0.4221343994140625, -0.39965057373046875, -0.377166748046875, -0.35468292236328125, -0.3321990966796875, -0.30971527099609375, -0.2872314453125, -0.26474761962890625, -0.2422637939453125, -0.21977996826171875, -0.197296142578125, -0.17481231689453125, -0.1523284912109375, -0.12984466552734375, -0.10736083984375, -0.08487701416015625, -0.0623931884765625, -0.03990936279296875, -0.017425537109375, 0.00505828857421875, 0.0275421142578125, 0.05002593994140625, 0.072509765625, 0.09499359130859375, 0.1174774169921875, 0.13996124267578125, 0.162445068359375, 0.18492889404296875, 0.2074127197265625, 0.22989654541015625, 0.25238037109375, 0.27486419677734375, 0.2973480224609375, 0.31983184814453125, 0.342315673828125, 0.36479949951171875, 0.3872833251953125, 0.40976715087890625, 0.4322509765625, 0.45473480224609375, 0.4772186279296875, 0.49970245361328125, 0.522186279296875, 0.5446701049804688, 0.5671539306640625, 0.5896377563476562, 0.61212158203125, 0.6346054077148438, 0.6570892333984375, 0.6795730590820312, 0.702056884765625, 0.7245407104492188, 0.7470245361328125, 0.7695083618164062, 0.7919921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 1.0, 2.0, 14.0, 25.0, 69.0, 142.0, 276.0, 237.0, 103.0, 64.0, 26.0, 16.0, 4.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.77892303466797, -21.050357818603516, -20.321792602539062, -19.59322738647461, -18.864662170410156, -18.136096954345703, -17.40753173828125, -16.678966522216797, -15.950401306152344, -15.22183609008789, -14.493270874023438, -13.764705657958984, -13.036140441894531, -12.307575225830078, -11.579010009765625, -10.850444793701172, -10.121879577636719, -9.393314361572266, -8.664749145507812, -7.936183929443359, -7.207618713378906, -6.479053497314453, -5.75048828125, -5.021923065185547, -4.293357849121094, -3.5647926330566406, -2.8362274169921875, -2.1076622009277344, -1.3790969848632812, -0.6505317687988281, 0.078033447265625, 0.8065986633300781, 1.5351619720458984, 2.2637271881103516, 2.9922924041748047, 3.720857620239258, 4.449422836303711, 5.177988052368164, 5.906553268432617, 6.63511848449707, 7.363683700561523, 8.092248916625977, 8.82081413269043, 9.549379348754883, 10.277944564819336, 11.006509780883789, 11.735074996948242, 12.463640213012695, 13.192205429077148, 13.920770645141602, 14.649335861206055, 15.377901077270508, 16.10646629333496, 16.835031509399414, 17.563596725463867, 18.29216194152832, 19.020727157592773, 19.749292373657227, 20.47785758972168, 21.206422805786133, 21.934988021850586, 22.66355323791504, 23.392118453979492, 24.120683670043945, 24.8492488861084]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 10.0, 1.0, 6.0, 7.0, 11.0, 8.0, 18.0, 9.0, 15.0, 21.0, 24.0, 26.0, 27.0, 22.0, 31.0, 30.0, 34.0, 55.0, 76.0, 97.0, 66.0, 60.0, 46.0, 30.0, 39.0, 29.0, 32.0, 28.0, 23.0, 25.0, 15.0, 9.0, 16.0, 9.0, 9.0, 5.0, 6.0, 8.0, 3.0, 5.0, 3.0, 0.0, 6.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0], "bins": [-14.920915603637695, -14.49063777923584, -14.060359954833984, -13.630083084106445, -13.19980525970459, -12.769527435302734, -12.339250564575195, -11.90897274017334, -11.478694915771484, -11.048417091369629, -10.618139266967773, -10.187862396240234, -9.757584571838379, -9.327306747436523, -8.897029876708984, -8.466752052307129, -8.036474227905273, -7.606196403503418, -7.175919055938721, -6.745641708374023, -6.315363883972168, -5.8850860595703125, -5.454808712005615, -5.024531364440918, -4.5942535400390625, -4.163975715637207, -3.7336983680725098, -3.3034207820892334, -2.873143196105957, -2.4428656101226807, -2.0125880241394043, -1.582310438156128, -1.1520318984985352, -0.7217543125152588, -0.2914767265319824, 0.13880085945129395, 0.5690784454345703, 0.9993560314178467, 1.429633617401123, 1.8599112033843994, 2.290188789367676, 2.720466375350952, 3.1507439613342285, 3.581021547317505, 4.011299133300781, 4.441576957702637, 4.871854305267334, 5.302131652832031, 5.732409477233887, 6.162687301635742, 6.5929646492004395, 7.023241996765137, 7.453519821166992, 7.883797645568848, 8.314075469970703, 8.744352340698242, 9.174630165100098, 9.604907989501953, 10.035184860229492, 10.465462684631348, 10.895740509033203, 11.326018333435059, 11.756296157836914, 12.186573028564453, 12.616850852966309]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 9.0, 25.0, 34.0, 54.0, 97.0, 144.0, 282.0, 532.0, 1207.0, 2615.0, 7063.0, 24373.0, 196994.0, 2855400.0, 1009589.0, 74230.0, 13702.0, 4385.0, 1745.0, 793.0, 409.0, 242.0, 128.0, 82.0, 54.0, 27.0, 17.0, 20.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2730560302734375, -1.205291748046875, -1.1375274658203125, -1.06976318359375, -1.0019989013671875, -0.934234619140625, -0.8664703369140625, -0.7987060546875, -0.7309417724609375, -0.663177490234375, -0.5954132080078125, -0.52764892578125, -0.4598846435546875, -0.392120361328125, -0.3243560791015625, -0.256591796875, -0.1888275146484375, -0.121063232421875, -0.0532989501953125, 0.01446533203125, 0.0822296142578125, 0.149993896484375, 0.2177581787109375, 0.2855224609375, 0.3532867431640625, 0.421051025390625, 0.4888153076171875, 0.55657958984375, 0.6243438720703125, 0.692108154296875, 0.7598724365234375, 0.82763671875, 0.8954010009765625, 0.963165283203125, 1.0309295654296875, 1.09869384765625, 1.1664581298828125, 1.234222412109375, 1.3019866943359375, 1.3697509765625, 1.4375152587890625, 1.505279541015625, 1.5730438232421875, 1.64080810546875, 1.7085723876953125, 1.776336669921875, 1.8441009521484375, 1.911865234375, 1.9796295166015625, 2.047393798828125, 2.1151580810546875, 2.18292236328125, 2.2506866455078125, 2.318450927734375, 2.3862152099609375, 2.4539794921875, 2.5217437744140625, 2.589508056640625, 2.6572723388671875, 2.72503662109375, 2.7928009033203125, 2.860565185546875, 2.9283294677734375, 2.99609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 8.0, 5.0, 3.0, 6.0, 9.0, 8.0, 14.0, 17.0, 16.0, 9.0, 19.0, 25.0, 34.0, 29.0, 32.0, 43.0, 47.0, 59.0, 45.0, 50.0, 55.0, 54.0, 43.0, 44.0, 31.0, 44.0, 40.0, 31.0, 24.0, 23.0, 28.0, 22.0, 14.0, 16.0, 17.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.115234375, -1.08172607421875, -1.0482177734375, -1.01470947265625, -0.981201171875, -0.94769287109375, -0.9141845703125, -0.88067626953125, -0.84716796875, -0.81365966796875, -0.7801513671875, -0.74664306640625, -0.713134765625, -0.67962646484375, -0.6461181640625, -0.61260986328125, -0.5791015625, -0.54559326171875, -0.5120849609375, -0.47857666015625, -0.445068359375, -0.41156005859375, -0.3780517578125, -0.34454345703125, -0.31103515625, -0.27752685546875, -0.2440185546875, -0.21051025390625, -0.177001953125, -0.14349365234375, -0.1099853515625, -0.07647705078125, -0.04296875, -0.00946044921875, 0.0240478515625, 0.05755615234375, 0.091064453125, 0.12457275390625, 0.1580810546875, 0.19158935546875, 0.22509765625, 0.25860595703125, 0.2921142578125, 0.32562255859375, 0.359130859375, 0.39263916015625, 0.4261474609375, 0.45965576171875, 0.4931640625, 0.52667236328125, 0.5601806640625, 0.59368896484375, 0.627197265625, 0.66070556640625, 0.6942138671875, 0.72772216796875, 0.76123046875, 0.79473876953125, 0.8282470703125, 0.86175537109375, 0.895263671875, 0.92877197265625, 0.9622802734375, 0.99578857421875, 1.029296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 20.0, 32.0, 40.0, 89.0, 176.0, 327.0, 861.0, 2942.0, 18000.0, 1539117.0, 2606671.0, 21153.0, 3131.0, 955.0, 379.0, 157.0, 98.0, 46.0, 23.0, 18.0, 14.0, 4.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.2198486328125, -5.056884765625, -4.8939208984375, -4.73095703125, -4.5679931640625, -4.405029296875, -4.2420654296875, -4.0791015625, -3.9161376953125, -3.753173828125, -3.5902099609375, -3.42724609375, -3.2642822265625, -3.101318359375, -2.9383544921875, -2.775390625, -2.6124267578125, -2.449462890625, -2.2864990234375, -2.12353515625, -1.9605712890625, -1.797607421875, -1.6346435546875, -1.4716796875, -1.3087158203125, -1.145751953125, -0.9827880859375, -0.81982421875, -0.6568603515625, -0.493896484375, -0.3309326171875, -0.16796875, -0.0050048828125, 0.157958984375, 0.3209228515625, 0.48388671875, 0.6468505859375, 0.809814453125, 0.9727783203125, 1.1357421875, 1.2987060546875, 1.461669921875, 1.6246337890625, 1.78759765625, 1.9505615234375, 2.113525390625, 2.2764892578125, 2.439453125, 2.6024169921875, 2.765380859375, 2.9283447265625, 3.09130859375, 3.2542724609375, 3.417236328125, 3.5802001953125, 3.7431640625, 3.9061279296875, 4.069091796875, 4.2320556640625, 4.39501953125, 4.5579833984375, 4.720947265625, 4.8839111328125, 5.046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 10.0, 17.0, 32.0, 51.0, 98.0, 216.0, 633.0, 1408.0, 930.0, 333.0, 136.0, 83.0, 40.0, 31.0, 15.0, 11.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.04693603515625, -2.9063720703125, -2.76580810546875, -2.625244140625, -2.48468017578125, -2.3441162109375, -2.20355224609375, -2.06298828125, -1.92242431640625, -1.7818603515625, -1.64129638671875, -1.500732421875, -1.36016845703125, -1.2196044921875, -1.07904052734375, -0.9384765625, -0.79791259765625, -0.6573486328125, -0.51678466796875, -0.376220703125, -0.23565673828125, -0.0950927734375, 0.04547119140625, 0.18603515625, 0.32659912109375, 0.4671630859375, 0.60772705078125, 0.748291015625, 0.88885498046875, 1.0294189453125, 1.16998291015625, 1.310546875, 1.45111083984375, 1.5916748046875, 1.73223876953125, 1.872802734375, 2.01336669921875, 2.1539306640625, 2.29449462890625, 2.43505859375, 2.57562255859375, 2.7161865234375, 2.85675048828125, 2.997314453125, 3.13787841796875, 3.2784423828125, 3.41900634765625, 3.5595703125, 3.70013427734375, 3.8406982421875, 3.98126220703125, 4.121826171875, 4.26239013671875, 4.4029541015625, 4.54351806640625, 4.68408203125, 4.82464599609375, 4.9652099609375, 5.10577392578125, 5.246337890625, 5.38690185546875, 5.5274658203125, 5.66802978515625, 5.80859375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 55.0, 138.0, 262.0, 279.0, 145.0, 47.0, 31.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.70498275756836, -21.61915397644043, -20.5333251953125, -19.447498321533203, -18.361669540405273, -17.275840759277344, -16.190013885498047, -15.104185104370117, -14.018356323242188, -12.932527542114258, -11.846699714660645, -10.760871887207031, -9.675043106079102, -8.589214324951172, -7.503386497497559, -6.417558193206787, -5.331729888916016, -4.245901584625244, -3.1600732803344727, -2.074244976043701, -0.9884166717529297, 0.0974116325378418, 1.1832399368286133, 2.2690682411193848, 3.3548965454101562, 4.440724849700928, 5.526553153991699, 6.612381458282471, 7.698209762573242, 8.784038543701172, 9.869866371154785, 10.955694198608398, 12.041519165039062, 13.127347946166992, 14.213175773620605, 15.299003601074219, 16.38483238220215, 17.470661163330078, 18.556488037109375, 19.642316818237305, 20.728145599365234, 21.813974380493164, 22.899803161621094, 23.98563003540039, 25.07145881652832, 26.15728759765625, 27.243114471435547, 28.328943252563477, 29.414772033691406, 30.500600814819336, 31.586429595947266, 32.67225646972656, 33.758087158203125, 34.84391403198242, 35.92974090576172, 37.01557159423828, 38.10139846801758, 39.187225341796875, 40.27305603027344, 41.358882904052734, 42.44470977783203, 43.530540466308594, 44.61636734008789, 45.70219802856445, 46.78802490234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 9.0, 3.0, 4.0, 12.0, 6.0, 12.0, 15.0, 23.0, 19.0, 23.0, 28.0, 44.0, 39.0, 48.0, 50.0, 55.0, 55.0, 53.0, 46.0, 62.0, 54.0, 49.0, 51.0, 32.0, 33.0, 34.0, 29.0, 24.0, 20.0, 18.0, 13.0, 10.0, 10.0, 11.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.540031433105469, -12.143294334411621, -11.74655818939209, -11.349821090698242, -10.953083992004395, -10.556346893310547, -10.159610748291016, -9.762873649597168, -9.36613655090332, -8.969399452209473, -8.572663307189941, -8.175926208496094, -7.779189109802246, -7.382452487945557, -6.985715866088867, -6.5889787673950195, -6.192242622375488, -5.795506000518799, -5.398768901824951, -5.002032279968262, -4.605295181274414, -4.208558559417725, -3.811821937561035, -3.4150850772857666, -3.018348217010498, -2.6216113567352295, -2.224874496459961, -1.8281378746032715, -1.431401014328003, -1.0346641540527344, -0.6379275321960449, -0.24119067192077637, 0.15554523468017578, 0.5522820353507996, 0.9490188360214233, 1.3457555770874023, 1.742492437362671, 2.1392292976379395, 2.535965919494629, 2.9327027797698975, 3.329439640045166, 3.7261765003204346, 4.122913360595703, 4.519649982452393, 4.916386604309082, 5.31312370300293, 5.709860324859619, 6.106596946716309, 6.503334045410156, 6.900070667266846, 7.296807765960693, 7.693544387817383, 8.09028148651123, 8.487018585205078, 8.88375473022461, 9.280491828918457, 9.677228927612305, 10.073966026306152, 10.470702171325684, 10.867439270019531, 11.264176368713379, 11.660913467407227, 12.057649612426758, 12.454386711120605, 12.851122856140137]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 10.0, 18.0, 22.0, 28.0, 58.0, 76.0, 131.0, 233.0, 361.0, 936.0, 2387.0, 7548.0, 30519.0, 211374.0, 675499.0, 94094.0, 17391.0, 4711.0, 1643.0, 709.0, 336.0, 158.0, 117.0, 67.0, 51.0, 33.0, 14.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.38671875, -3.29345703125, -3.2001953125, -3.10693359375, -3.013671875, -2.92041015625, -2.8271484375, -2.73388671875, -2.640625, -2.54736328125, -2.4541015625, -2.36083984375, -2.267578125, -2.17431640625, -2.0810546875, -1.98779296875, -1.89453125, -1.80126953125, -1.7080078125, -1.61474609375, -1.521484375, -1.42822265625, -1.3349609375, -1.24169921875, -1.1484375, -1.05517578125, -0.9619140625, -0.86865234375, -0.775390625, -0.68212890625, -0.5888671875, -0.49560546875, -0.40234375, -0.30908203125, -0.2158203125, -0.12255859375, -0.029296875, 0.06396484375, 0.1572265625, 0.25048828125, 0.34375, 0.43701171875, 0.5302734375, 0.62353515625, 0.716796875, 0.81005859375, 0.9033203125, 0.99658203125, 1.08984375, 1.18310546875, 1.2763671875, 1.36962890625, 1.462890625, 1.55615234375, 1.6494140625, 1.74267578125, 1.8359375, 1.92919921875, 2.0224609375, 2.11572265625, 2.208984375, 2.30224609375, 2.3955078125, 2.48876953125, 2.58203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 3.0, 12.0, 7.0, 15.0, 13.0, 13.0, 16.0, 26.0, 19.0, 21.0, 35.0, 28.0, 46.0, 37.0, 39.0, 44.0, 43.0, 49.0, 61.0, 51.0, 47.0, 31.0, 44.0, 37.0, 32.0, 34.0, 31.0, 26.0, 22.0, 16.0, 12.0, 16.0, 10.0, 11.0, 6.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.1748046875, -1.1412506103515625, -1.107696533203125, -1.0741424560546875, -1.04058837890625, -1.0070343017578125, -0.973480224609375, -0.9399261474609375, -0.9063720703125, -0.8728179931640625, -0.839263916015625, -0.8057098388671875, -0.77215576171875, -0.7386016845703125, -0.705047607421875, -0.6714935302734375, -0.637939453125, -0.6043853759765625, -0.570831298828125, -0.5372772216796875, -0.50372314453125, -0.4701690673828125, -0.436614990234375, -0.4030609130859375, -0.3695068359375, -0.3359527587890625, -0.302398681640625, -0.2688446044921875, -0.23529052734375, -0.2017364501953125, -0.168182373046875, -0.1346282958984375, -0.10107421875, -0.0675201416015625, -0.033966064453125, -0.0004119873046875, 0.03314208984375, 0.0666961669921875, 0.100250244140625, 0.1338043212890625, 0.1673583984375, 0.2009124755859375, 0.234466552734375, 0.2680206298828125, 0.30157470703125, 0.3351287841796875, 0.368682861328125, 0.4022369384765625, 0.435791015625, 0.4693450927734375, 0.502899169921875, 0.5364532470703125, 0.57000732421875, 0.6035614013671875, 0.637115478515625, 0.6706695556640625, 0.7042236328125, 0.7377777099609375, 0.771331787109375, 0.8048858642578125, 0.83843994140625, 0.8719940185546875, 0.905548095703125, 0.9391021728515625, 0.97265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 8.0, 6.0, 12.0, 15.0, 24.0, 32.0, 39.0, 85.0, 122.0, 222.0, 340.0, 638.0, 1411.0, 3910.0, 18472.0, 329220.0, 665791.0, 20864.0, 4232.0, 1466.0, 704.0, 357.0, 209.0, 125.0, 65.0, 48.0, 32.0, 34.0, 19.0, 8.0, 5.0, 4.0, 8.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.9281005859375, -3.801513671875, -3.6749267578125, -3.54833984375, -3.4217529296875, -3.295166015625, -3.1685791015625, -3.0419921875, -2.9154052734375, -2.788818359375, -2.6622314453125, -2.53564453125, -2.4090576171875, -2.282470703125, -2.1558837890625, -2.029296875, -1.9027099609375, -1.776123046875, -1.6495361328125, -1.52294921875, -1.3963623046875, -1.269775390625, -1.1431884765625, -1.0166015625, -0.8900146484375, -0.763427734375, -0.6368408203125, -0.51025390625, -0.3836669921875, -0.257080078125, -0.1304931640625, -0.00390625, 0.1226806640625, 0.249267578125, 0.3758544921875, 0.50244140625, 0.6290283203125, 0.755615234375, 0.8822021484375, 1.0087890625, 1.1353759765625, 1.261962890625, 1.3885498046875, 1.51513671875, 1.6417236328125, 1.768310546875, 1.8948974609375, 2.021484375, 2.1480712890625, 2.274658203125, 2.4012451171875, 2.52783203125, 2.6544189453125, 2.781005859375, 2.9075927734375, 3.0341796875, 3.1607666015625, 3.287353515625, 3.4139404296875, 3.54052734375, 3.6671142578125, 3.793701171875, 3.9202880859375, 4.046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 14.0, 13.0, 19.0, 24.0, 26.0, 39.0, 45.0, 48.0, 44.0, 70.0, 59.0, 75.0, 64.0, 85.0, 62.0, 59.0, 43.0, 43.0, 34.0, 19.0, 29.0, 20.0, 8.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.4140625, -6.23663330078125, -6.0592041015625, -5.88177490234375, -5.704345703125, -5.52691650390625, -5.3494873046875, -5.17205810546875, -4.99462890625, -4.81719970703125, -4.6397705078125, -4.46234130859375, -4.284912109375, -4.10748291015625, -3.9300537109375, -3.75262451171875, -3.5751953125, -3.39776611328125, -3.2203369140625, -3.04290771484375, -2.865478515625, -2.68804931640625, -2.5106201171875, -2.33319091796875, -2.15576171875, -1.97833251953125, -1.8009033203125, -1.62347412109375, -1.446044921875, -1.26861572265625, -1.0911865234375, -0.91375732421875, -0.736328125, -0.55889892578125, -0.3814697265625, -0.20404052734375, -0.026611328125, 0.15081787109375, 0.3282470703125, 0.50567626953125, 0.68310546875, 0.86053466796875, 1.0379638671875, 1.21539306640625, 1.392822265625, 1.57025146484375, 1.7476806640625, 1.92510986328125, 2.1025390625, 2.27996826171875, 2.4573974609375, 2.63482666015625, 2.812255859375, 2.98968505859375, 3.1671142578125, 3.34454345703125, 3.52197265625, 3.69940185546875, 3.8768310546875, 4.05426025390625, 4.231689453125, 4.40911865234375, 4.5865478515625, 4.76397705078125, 4.94140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 8.0, 9.0, 2.0, 7.0, 7.0, 26.0, 22.0, 36.0, 54.0, 99.0, 138.0, 243.0, 509.0, 984.0, 2231.0, 6317.0, 24983.0, 196823.0, 749976.0, 49811.0, 10291.0, 3182.0, 1306.0, 621.0, 322.0, 179.0, 118.0, 65.0, 39.0, 33.0, 22.0, 15.0, 15.0, 8.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.73138427734375, -0.7054443359375, -0.67950439453125, -0.653564453125, -0.62762451171875, -0.6016845703125, -0.57574462890625, -0.5498046875, -0.52386474609375, -0.4979248046875, -0.47198486328125, -0.446044921875, -0.42010498046875, -0.3941650390625, -0.36822509765625, -0.34228515625, -0.31634521484375, -0.2904052734375, -0.26446533203125, -0.238525390625, -0.21258544921875, -0.1866455078125, -0.16070556640625, -0.134765625, -0.10882568359375, -0.0828857421875, -0.05694580078125, -0.031005859375, -0.00506591796875, 0.0208740234375, 0.04681396484375, 0.07275390625, 0.09869384765625, 0.1246337890625, 0.15057373046875, 0.176513671875, 0.20245361328125, 0.2283935546875, 0.25433349609375, 0.2802734375, 0.30621337890625, 0.3321533203125, 0.35809326171875, 0.384033203125, 0.40997314453125, 0.4359130859375, 0.46185302734375, 0.48779296875, 0.51373291015625, 0.5396728515625, 0.56561279296875, 0.591552734375, 0.61749267578125, 0.6434326171875, 0.66937255859375, 0.6953125, 0.72125244140625, 0.7471923828125, 0.77313232421875, 0.799072265625, 0.82501220703125, 0.8509521484375, 0.87689208984375, 0.90283203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 9.0, 16.0, 13.0, 21.0, 39.0, 95.0, 186.0, 246.0, 163.0, 72.0, 50.0, 26.0, 17.0, 17.0, 7.0, 6.0, 4.0, 0.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002942085266113281, -0.0002848505973815918, -0.00027549266815185547, -0.00026613473892211914, -0.0002567768096923828, -0.0002474188804626465, -0.00023806095123291016, -0.00022870302200317383, -0.0002193450927734375, -0.00020998716354370117, -0.00020062923431396484, -0.00019127130508422852, -0.0001819133758544922, -0.00017255544662475586, -0.00016319751739501953, -0.0001538395881652832, -0.00014448165893554688, -0.00013512372970581055, -0.00012576580047607422, -0.00011640787124633789, -0.00010704994201660156, -9.769201278686523e-05, -8.83340835571289e-05, -7.897615432739258e-05, -6.961822509765625e-05, -6.026029586791992e-05, -5.0902366638183594e-05, -4.1544437408447266e-05, -3.218650817871094e-05, -2.282857894897461e-05, -1.3470649719238281e-05, -4.112720489501953e-06, 5.245208740234375e-06, 1.4603137969970703e-05, 2.396106719970703e-05, 3.331899642944336e-05, 4.267692565917969e-05, 5.2034854888916016e-05, 6.139278411865234e-05, 7.075071334838867e-05, 8.0108642578125e-05, 8.946657180786133e-05, 9.882450103759766e-05, 0.00010818243026733398, 0.00011754035949707031, 0.00012689828872680664, 0.00013625621795654297, 0.0001456141471862793, 0.00015497207641601562, 0.00016433000564575195, 0.00017368793487548828, 0.0001830458641052246, 0.00019240379333496094, 0.00020176172256469727, 0.0002111196517944336, 0.00022047758102416992, 0.00022983551025390625, 0.00023919343948364258, 0.0002485513687133789, 0.00025790929794311523, 0.00026726722717285156, 0.0002766251564025879, 0.0002859830856323242, 0.00029534101486206055, 0.0003046989440917969]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 11.0, 17.0, 14.0, 22.0, 36.0, 43.0, 65.0, 78.0, 151.0, 211.0, 414.0, 620.0, 1262.0, 2564.0, 6803.0, 22528.0, 110516.0, 750603.0, 117071.0, 22880.0, 6926.0, 2743.0, 1251.0, 640.0, 373.0, 238.0, 139.0, 100.0, 73.0, 48.0, 38.0, 27.0, 13.0, 9.0, 6.0, 3.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8056640625, -0.7841873168945312, -0.7627105712890625, -0.7412338256835938, -0.719757080078125, -0.6982803344726562, -0.6768035888671875, -0.6553268432617188, -0.63385009765625, -0.6123733520507812, -0.5908966064453125, -0.5694198608398438, -0.547943115234375, -0.5264663696289062, -0.5049896240234375, -0.48351287841796875, -0.4620361328125, -0.44055938720703125, -0.4190826416015625, -0.39760589599609375, -0.376129150390625, -0.35465240478515625, -0.3331756591796875, -0.31169891357421875, -0.29022216796875, -0.26874542236328125, -0.2472686767578125, -0.22579193115234375, -0.204315185546875, -0.18283843994140625, -0.1613616943359375, -0.13988494873046875, -0.118408203125, -0.09693145751953125, -0.0754547119140625, -0.05397796630859375, -0.032501220703125, -0.01102447509765625, 0.0104522705078125, 0.03192901611328125, 0.05340576171875, 0.07488250732421875, 0.0963592529296875, 0.11783599853515625, 0.139312744140625, 0.16078948974609375, 0.1822662353515625, 0.20374298095703125, 0.2252197265625, 0.24669647216796875, 0.2681732177734375, 0.28964996337890625, 0.311126708984375, 0.33260345458984375, 0.3540802001953125, 0.37555694580078125, 0.39703369140625, 0.41851043701171875, 0.4399871826171875, 0.46146392822265625, 0.482940673828125, 0.5044174194335938, 0.5258941650390625, 0.5473709106445312, 0.56884765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 5.0, 6.0, 7.0, 7.0, 16.0, 17.0, 26.0, 38.0, 41.0, 60.0, 77.0, 90.0, 96.0, 112.0, 91.0, 64.0, 52.0, 47.0, 37.0, 19.0, 19.0, 12.0, 10.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7417831420898438, -0.7159881591796875, -0.6901931762695312, -0.664398193359375, -0.6386032104492188, -0.6128082275390625, -0.5870132446289062, -0.56121826171875, -0.5354232788085938, -0.5096282958984375, -0.48383331298828125, -0.458038330078125, -0.43224334716796875, -0.4064483642578125, -0.38065338134765625, -0.3548583984375, -0.32906341552734375, -0.3032684326171875, -0.27747344970703125, -0.251678466796875, -0.22588348388671875, -0.2000885009765625, -0.17429351806640625, -0.14849853515625, -0.12270355224609375, -0.0969085693359375, -0.07111358642578125, -0.045318603515625, -0.01952362060546875, 0.0062713623046875, 0.03206634521484375, 0.057861328125, 0.08365631103515625, 0.1094512939453125, 0.13524627685546875, 0.161041259765625, 0.18683624267578125, 0.2126312255859375, 0.23842620849609375, 0.26422119140625, 0.29001617431640625, 0.3158111572265625, 0.34160614013671875, 0.367401123046875, 0.39319610595703125, 0.4189910888671875, 0.44478607177734375, 0.4705810546875, 0.49637603759765625, 0.5221710205078125, 0.5479660034179688, 0.573760986328125, 0.5995559692382812, 0.6253509521484375, 0.6511459350585938, 0.67694091796875, 0.7027359008789062, 0.7285308837890625, 0.7543258666992188, 0.780120849609375, 0.8059158325195312, 0.8317108154296875, 0.8575057983398438, 0.88330078125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 17.0, 27.0, 87.0, 192.0, 411.0, 138.0, 56.0, 25.0, 17.0, 9.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.05223846435547, -21.102924346923828, -20.15361213684082, -19.20429801940918, -18.254985809326172, -17.30567169189453, -16.356359481811523, -15.407045364379883, -14.457733154296875, -13.50841999053955, -12.559106826782227, -11.609793663024902, -10.660480499267578, -9.711166381835938, -8.76185417175293, -7.812540531158447, -6.863226890563965, -5.913913726806641, -4.964600563049316, -4.015287399291992, -3.065973997116089, -2.1166605949401855, -1.1673474311828613, -0.2180342674255371, 0.7312788963317871, 1.6805920600891113, 2.6299052238464355, 3.579218626022339, 4.528532028198242, 5.477845191955566, 6.427158355712891, 7.376471519470215, 8.325784683227539, 9.275097846984863, 10.224411010742188, 11.173724174499512, 12.123037338256836, 13.072351455688477, 14.021663665771484, 14.970977783203125, 15.920289993286133, 16.869604110717773, 17.81891632080078, 18.768230438232422, 19.71754264831543, 20.66685676574707, 21.616168975830078, 22.56548309326172, 23.51479721069336, 24.464111328125, 25.413423538208008, 26.36273765563965, 27.312049865722656, 28.261363983154297, 29.210676193237305, 30.159990310668945, 31.109302520751953, 32.058616638183594, 33.007930755615234, 33.95724105834961, 34.90655517578125, 35.85586929321289, 36.80518341064453, 37.754493713378906, 38.70380783081055]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 7.0, 3.0, 5.0, 10.0, 3.0, 17.0, 17.0, 21.0, 14.0, 17.0, 24.0, 27.0, 37.0, 40.0, 62.0, 72.0, 98.0, 92.0, 80.0, 59.0, 40.0, 31.0, 22.0, 26.0, 21.0, 33.0, 19.0, 21.0, 16.0, 14.0, 6.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.257675170898438, -17.72547721862793, -17.193279266357422, -16.661083221435547, -16.12888526916504, -15.596687316894531, -15.064489364624023, -14.532291412353516, -14.000094413757324, -13.467896461486816, -12.935699462890625, -12.403501510620117, -11.87130355834961, -11.339106559753418, -10.80690860748291, -10.274711608886719, -9.742513656616211, -9.210315704345703, -8.678118705749512, -8.145920753479004, -7.613723278045654, -7.081525802612305, -6.549327850341797, -6.017130374908447, -5.484932899475098, -4.952735424041748, -4.420537948608398, -3.8883399963378906, -3.356142520904541, -2.8239450454711914, -2.2917473316192627, -1.759549617767334, -1.227351188659668, -0.6951535940170288, -0.16295599937438965, 0.3692415952682495, 0.9014391899108887, 1.4336366653442383, 1.965834379196167, 2.4980320930480957, 3.0302295684814453, 3.562427043914795, 4.0946245193481445, 4.626822471618652, 5.159019947052002, 5.691217422485352, 6.223415374755859, 6.755612850189209, 7.287810325622559, 7.820007801055908, 8.352205276489258, 8.884403228759766, 9.416601181030273, 9.948798179626465, 10.480996131896973, 11.013193130493164, 11.545391082763672, 12.07758903503418, 12.609786033630371, 13.141983985900879, 13.67418098449707, 14.206378936767578, 14.738576889038086, 15.270774841308594, 15.802971839904785]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 1.0, 3.0, 4.0, 8.0, 7.0, 7.0, 13.0, 28.0, 32.0, 43.0, 72.0, 114.0, 145.0, 219.0, 341.0, 512.0, 899.0, 1569.0, 2630.0, 5037.0, 10790.0, 28480.0, 119388.0, 801469.0, 2369200.0, 689494.0, 114648.0, 27698.0, 10114.0, 4804.0, 2590.0, 1470.0, 858.0, 566.0, 336.0, 206.0, 150.0, 108.0, 68.0, 55.0, 34.0, 26.0, 18.0, 11.0, 5.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0], "bins": [-2.2890625, -2.226287841796875, -2.16351318359375, -2.100738525390625, -2.0379638671875, -1.975189208984375, -1.91241455078125, -1.849639892578125, -1.786865234375, -1.724090576171875, -1.66131591796875, -1.598541259765625, -1.5357666015625, -1.472991943359375, -1.41021728515625, -1.347442626953125, -1.28466796875, -1.221893310546875, -1.15911865234375, -1.096343994140625, -1.0335693359375, -0.970794677734375, -0.90802001953125, -0.845245361328125, -0.782470703125, -0.719696044921875, -0.65692138671875, -0.594146728515625, -0.5313720703125, -0.468597412109375, -0.40582275390625, -0.343048095703125, -0.2802734375, -0.217498779296875, -0.15472412109375, -0.091949462890625, -0.0291748046875, 0.033599853515625, 0.09637451171875, 0.159149169921875, 0.221923828125, 0.284698486328125, 0.34747314453125, 0.410247802734375, 0.4730224609375, 0.535797119140625, 0.59857177734375, 0.661346435546875, 0.72412109375, 0.786895751953125, 0.84967041015625, 0.912445068359375, 0.9752197265625, 1.037994384765625, 1.10076904296875, 1.163543701171875, 1.226318359375, 1.289093017578125, 1.35186767578125, 1.414642333984375, 1.4774169921875, 1.540191650390625, 1.60296630859375, 1.665740966796875, 1.728515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 3.0, 4.0, 2.0, 5.0, 10.0, 11.0, 11.0, 10.0, 9.0, 20.0, 28.0, 25.0, 29.0, 37.0, 43.0, 40.0, 45.0, 39.0, 43.0, 44.0, 54.0, 59.0, 51.0, 42.0, 50.0, 40.0, 36.0, 24.0, 31.0, 27.0, 33.0, 14.0, 21.0, 14.0, 8.0, 8.0, 8.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1728515625, -1.1395034790039062, -1.1061553955078125, -1.0728073120117188, -1.039459228515625, -1.0061111450195312, -0.9727630615234375, -0.9394149780273438, -0.90606689453125, -0.8727188110351562, -0.8393707275390625, -0.8060226440429688, -0.772674560546875, -0.7393264770507812, -0.7059783935546875, -0.6726303100585938, -0.6392822265625, -0.6059341430664062, -0.5725860595703125, -0.5392379760742188, -0.505889892578125, -0.47254180908203125, -0.4391937255859375, -0.40584564208984375, -0.37249755859375, -0.33914947509765625, -0.3058013916015625, -0.27245330810546875, -0.239105224609375, -0.20575714111328125, -0.1724090576171875, -0.13906097412109375, -0.105712890625, -0.07236480712890625, -0.0390167236328125, -0.00566864013671875, 0.027679443359375, 0.06102752685546875, 0.0943756103515625, 0.12772369384765625, 0.16107177734375, 0.19441986083984375, 0.2277679443359375, 0.26111602783203125, 0.294464111328125, 0.32781219482421875, 0.3611602783203125, 0.39450836181640625, 0.4278564453125, 0.46120452880859375, 0.4945526123046875, 0.5279006958007812, 0.561248779296875, 0.5945968627929688, 0.6279449462890625, 0.6612930297851562, 0.69464111328125, 0.7279891967773438, 0.7613372802734375, 0.7946853637695312, 0.828033447265625, 0.8613815307617188, 0.8947296142578125, 0.9280776977539062, 0.96142578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 14.0, 22.0, 20.0, 34.0, 77.0, 73.0, 138.0, 258.0, 542.0, 1385.0, 5858.0, 75841.0, 4029585.0, 72008.0, 5822.0, 1405.0, 539.0, 245.0, 118.0, 102.0, 54.0, 35.0, 17.0, 17.0, 17.0, 9.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.3359375, -9.0933837890625, -8.850830078125, -8.6082763671875, -8.36572265625, -8.1231689453125, -7.880615234375, -7.6380615234375, -7.3955078125, -7.1529541015625, -6.910400390625, -6.6678466796875, -6.42529296875, -6.1827392578125, -5.940185546875, -5.6976318359375, -5.455078125, -5.2125244140625, -4.969970703125, -4.7274169921875, -4.48486328125, -4.2423095703125, -3.999755859375, -3.7572021484375, -3.5146484375, -3.2720947265625, -3.029541015625, -2.7869873046875, -2.54443359375, -2.3018798828125, -2.059326171875, -1.8167724609375, -1.57421875, -1.3316650390625, -1.089111328125, -0.8465576171875, -0.60400390625, -0.3614501953125, -0.118896484375, 0.1236572265625, 0.3662109375, 0.6087646484375, 0.851318359375, 1.0938720703125, 1.33642578125, 1.5789794921875, 1.821533203125, 2.0640869140625, 2.306640625, 2.5491943359375, 2.791748046875, 3.0343017578125, 3.27685546875, 3.5194091796875, 3.761962890625, 4.0045166015625, 4.2470703125, 4.4896240234375, 4.732177734375, 4.9747314453125, 5.21728515625, 5.4598388671875, 5.702392578125, 5.9449462890625, 6.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 10.0, 8.0, 18.0, 19.0, 34.0, 39.0, 49.0, 97.0, 130.0, 251.0, 434.0, 763.0, 838.0, 495.0, 295.0, 194.0, 126.0, 71.0, 49.0, 44.0, 31.0, 11.0, 16.0, 11.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.54986572265625, -3.4083251953125, -3.26678466796875, -3.125244140625, -2.98370361328125, -2.8421630859375, -2.70062255859375, -2.55908203125, -2.41754150390625, -2.2760009765625, -2.13446044921875, -1.992919921875, -1.85137939453125, -1.7098388671875, -1.56829833984375, -1.4267578125, -1.28521728515625, -1.1436767578125, -1.00213623046875, -0.860595703125, -0.71905517578125, -0.5775146484375, -0.43597412109375, -0.29443359375, -0.15289306640625, -0.0113525390625, 0.13018798828125, 0.271728515625, 0.41326904296875, 0.5548095703125, 0.69635009765625, 0.837890625, 0.97943115234375, 1.1209716796875, 1.26251220703125, 1.404052734375, 1.54559326171875, 1.6871337890625, 1.82867431640625, 1.97021484375, 2.11175537109375, 2.2532958984375, 2.39483642578125, 2.536376953125, 2.67791748046875, 2.8194580078125, 2.96099853515625, 3.1025390625, 3.24407958984375, 3.3856201171875, 3.52716064453125, 3.668701171875, 3.81024169921875, 3.9517822265625, 4.09332275390625, 4.23486328125, 4.37640380859375, 4.5179443359375, 4.65948486328125, 4.801025390625, 4.94256591796875, 5.0841064453125, 5.22564697265625, 5.3671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 11.0, 23.0, 32.0, 63.0, 130.0, 221.0, 209.0, 121.0, 65.0, 41.0, 22.0, 20.0, 12.0, 3.0, 2.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.770538330078125, -34.20754623413086, -32.64455795288086, -31.081565856933594, -29.518573760986328, -27.955583572387695, -26.392593383789062, -24.829601287841797, -23.266611099243164, -21.70362091064453, -20.140628814697266, -18.577638626098633, -17.0146484375, -15.451656341552734, -13.888666152954102, -12.325675010681152, -10.762683868408203, -9.199692726135254, -7.636702060699463, -6.073711395263672, -4.510720252990723, -2.9477291107177734, -1.3847389221191406, 0.1782522201538086, 1.7412433624267578, 3.304234266281128, 4.867225170135498, 6.430215835571289, 7.993206977844238, 9.556198120117188, 11.11918830871582, 12.68217945098877, 14.245170593261719, 15.808161735534668, 17.371152877807617, 18.93414306640625, 20.497135162353516, 22.06012535095215, 23.62311553955078, 25.186107635498047, 26.74909782409668, 28.312088012695312, 29.875080108642578, 31.43807029724121, 33.001060485839844, 34.56405258178711, 36.127044677734375, 37.690032958984375, 39.25302505493164, 40.816017150878906, 42.379005432128906, 43.94199752807617, 45.50498962402344, 47.06797790527344, 48.6309700012207, 50.19396209716797, 51.75695037841797, 53.319942474365234, 54.882930755615234, 56.4459228515625, 58.008914947509766, 59.57190704345703, 61.13489532470703, 62.6978874206543, 64.26087951660156]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 13.0, 8.0, 8.0, 16.0, 18.0, 24.0, 27.0, 37.0, 32.0, 42.0, 38.0, 45.0, 68.0, 60.0, 79.0, 71.0, 58.0, 64.0, 42.0, 51.0, 28.0, 32.0, 23.0, 22.0, 18.0, 17.0, 18.0, 11.0, 9.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.577024459838867, -27.740110397338867, -26.903196334838867, -26.066280364990234, -25.229366302490234, -24.392452239990234, -23.555538177490234, -22.718624114990234, -21.881710052490234, -21.044795989990234, -20.207881927490234, -19.370967864990234, -18.5340518951416, -17.6971378326416, -16.8602237701416, -16.0233097076416, -15.186394691467285, -14.349480628967285, -13.512565612792969, -12.675651550292969, -11.838737487792969, -11.001823425292969, -10.164908409118652, -9.327994346618652, -8.491079330444336, -7.654164791107178, -6.817250728607178, -5.9803361892700195, -5.1434221267700195, -4.306507587432861, -3.469593048095703, -2.632678985595703, -1.7957649230957031, -0.9588505625724792, -0.12193620204925537, 0.7149782180786133, 1.5518925189971924, 2.3888068199157715, 3.2257213592529297, 4.06263542175293, 4.899549961090088, 5.736464500427246, 6.573378562927246, 7.410293102264404, 8.247207641601562, 9.084121704101562, 9.921035766601562, 10.757949829101562, 11.594864845275879, 12.431778907775879, 13.268693923950195, 14.105607986450195, 14.942522048950195, 15.779436111450195, 16.616352081298828, 17.453266143798828, 18.290180206298828, 19.127094268798828, 19.964008331298828, 20.800922393798828, 21.63783836364746, 22.47475242614746, 23.31166648864746, 24.14858055114746, 24.98549461364746]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 11.0, 21.0, 40.0, 64.0, 86.0, 188.0, 277.0, 476.0, 874.0, 1768.0, 3773.0, 8929.0, 25795.0, 113021.0, 719146.0, 128187.0, 28391.0, 9515.0, 3938.0, 1808.0, 1002.0, 495.0, 279.0, 177.0, 87.0, 69.0, 44.0, 27.0, 10.0, 13.0, 7.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.892578125, -1.830596923828125, -1.76861572265625, -1.706634521484375, -1.6446533203125, -1.582672119140625, -1.52069091796875, -1.458709716796875, -1.396728515625, -1.334747314453125, -1.27276611328125, -1.210784912109375, -1.1488037109375, -1.086822509765625, -1.02484130859375, -0.962860107421875, -0.90087890625, -0.838897705078125, -0.77691650390625, -0.714935302734375, -0.6529541015625, -0.590972900390625, -0.52899169921875, -0.467010498046875, -0.405029296875, -0.343048095703125, -0.28106689453125, -0.219085693359375, -0.1571044921875, -0.095123291015625, -0.03314208984375, 0.028839111328125, 0.0908203125, 0.152801513671875, 0.21478271484375, 0.276763916015625, 0.3387451171875, 0.400726318359375, 0.46270751953125, 0.524688720703125, 0.586669921875, 0.648651123046875, 0.71063232421875, 0.772613525390625, 0.8345947265625, 0.896575927734375, 0.95855712890625, 1.020538330078125, 1.08251953125, 1.144500732421875, 1.20648193359375, 1.268463134765625, 1.3304443359375, 1.392425537109375, 1.45440673828125, 1.516387939453125, 1.578369140625, 1.640350341796875, 1.70233154296875, 1.764312744140625, 1.8262939453125, 1.888275146484375, 1.95025634765625, 2.012237548828125, 2.07421875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 14.0, 12.0, 18.0, 11.0, 26.0, 19.0, 43.0, 49.0, 69.0, 75.0, 84.0, 92.0, 58.0, 106.0, 57.0, 60.0, 58.0, 48.0, 35.0, 19.0, 17.0, 15.0, 7.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.4911346435546875, -2.423675537109375, -2.3562164306640625, -2.28875732421875, -2.2212982177734375, -2.153839111328125, -2.0863800048828125, -2.0189208984375, -1.9514617919921875, -1.884002685546875, -1.8165435791015625, -1.74908447265625, -1.6816253662109375, -1.614166259765625, -1.5467071533203125, -1.479248046875, -1.4117889404296875, -1.344329833984375, -1.2768707275390625, -1.20941162109375, -1.1419525146484375, -1.074493408203125, -1.0070343017578125, -0.9395751953125, -0.8721160888671875, -0.804656982421875, -0.7371978759765625, -0.66973876953125, -0.6022796630859375, -0.534820556640625, -0.4673614501953125, -0.39990234375, -0.3324432373046875, -0.264984130859375, -0.1975250244140625, -0.13006591796875, -0.0626068115234375, 0.004852294921875, 0.0723114013671875, 0.1397705078125, 0.2072296142578125, 0.274688720703125, 0.3421478271484375, 0.40960693359375, 0.4770660400390625, 0.544525146484375, 0.6119842529296875, 0.679443359375, 0.7469024658203125, 0.814361572265625, 0.8818206787109375, 0.94927978515625, 1.0167388916015625, 1.084197998046875, 1.1516571044921875, 1.2191162109375, 1.2865753173828125, 1.354034423828125, 1.4214935302734375, 1.48895263671875, 1.5564117431640625, 1.623870849609375, 1.6913299560546875, 1.7587890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 5.0, 10.0, 9.0, 10.0, 16.0, 38.0, 46.0, 66.0, 114.0, 194.0, 421.0, 1086.0, 4261.0, 61350.0, 962101.0, 15284.0, 2075.0, 685.0, 314.0, 170.0, 104.0, 61.0, 40.0, 24.0, 15.0, 15.0, 13.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.3079833984375, -4.174560546875, -4.0411376953125, -3.90771484375, -3.7742919921875, -3.640869140625, -3.5074462890625, -3.3740234375, -3.2406005859375, -3.107177734375, -2.9737548828125, -2.84033203125, -2.7069091796875, -2.573486328125, -2.4400634765625, -2.306640625, -2.1732177734375, -2.039794921875, -1.9063720703125, -1.77294921875, -1.6395263671875, -1.506103515625, -1.3726806640625, -1.2392578125, -1.1058349609375, -0.972412109375, -0.8389892578125, -0.70556640625, -0.5721435546875, -0.438720703125, -0.3052978515625, -0.171875, -0.0384521484375, 0.094970703125, 0.2283935546875, 0.36181640625, 0.4952392578125, 0.628662109375, 0.7620849609375, 0.8955078125, 1.0289306640625, 1.162353515625, 1.2957763671875, 1.42919921875, 1.5626220703125, 1.696044921875, 1.8294677734375, 1.962890625, 2.0963134765625, 2.229736328125, 2.3631591796875, 2.49658203125, 2.6300048828125, 2.763427734375, 2.8968505859375, 3.0302734375, 3.1636962890625, 3.297119140625, 3.4305419921875, 3.56396484375, 3.6973876953125, 3.830810546875, 3.9642333984375, 4.09765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 5.0, 7.0, 8.0, 8.0, 12.0, 29.0, 23.0, 26.0, 33.0, 35.0, 49.0, 66.0, 98.0, 90.0, 113.0, 70.0, 63.0, 62.0, 39.0, 32.0, 26.0, 18.0, 18.0, 12.0, 13.0, 8.0, 5.0, 6.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-7.8046875, -7.5877685546875, -7.370849609375, -7.1539306640625, -6.93701171875, -6.7200927734375, -6.503173828125, -6.2862548828125, -6.0693359375, -5.8524169921875, -5.635498046875, -5.4185791015625, -5.20166015625, -4.9847412109375, -4.767822265625, -4.5509033203125, -4.333984375, -4.1170654296875, -3.900146484375, -3.6832275390625, -3.46630859375, -3.2493896484375, -3.032470703125, -2.8155517578125, -2.5986328125, -2.3817138671875, -2.164794921875, -1.9478759765625, -1.73095703125, -1.5140380859375, -1.297119140625, -1.0802001953125, -0.86328125, -0.6463623046875, -0.429443359375, -0.2125244140625, 0.00439453125, 0.2213134765625, 0.438232421875, 0.6551513671875, 0.8720703125, 1.0889892578125, 1.305908203125, 1.5228271484375, 1.73974609375, 1.9566650390625, 2.173583984375, 2.3905029296875, 2.607421875, 2.8243408203125, 3.041259765625, 3.2581787109375, 3.47509765625, 3.6920166015625, 3.908935546875, 4.1258544921875, 4.3427734375, 4.5596923828125, 4.776611328125, 4.9935302734375, 5.21044921875, 5.4273681640625, 5.644287109375, 5.8612060546875, 6.078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 1.0, 9.0, 9.0, 13.0, 22.0, 23.0, 43.0, 46.0, 83.0, 116.0, 239.0, 495.0, 925.0, 2573.0, 8770.0, 52266.0, 909248.0, 59273.0, 9581.0, 2758.0, 987.0, 473.0, 209.0, 146.0, 72.0, 47.0, 34.0, 26.0, 20.0, 9.0, 10.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4716796875, -0.4545440673828125, -0.437408447265625, -0.4202728271484375, -0.40313720703125, -0.3860015869140625, -0.368865966796875, -0.3517303466796875, -0.3345947265625, -0.3174591064453125, -0.300323486328125, -0.2831878662109375, -0.26605224609375, -0.2489166259765625, -0.231781005859375, -0.2146453857421875, -0.197509765625, -0.1803741455078125, -0.163238525390625, -0.1461029052734375, -0.12896728515625, -0.1118316650390625, -0.094696044921875, -0.0775604248046875, -0.0604248046875, -0.0432891845703125, -0.026153564453125, -0.0090179443359375, 0.00811767578125, 0.0252532958984375, 0.042388916015625, 0.0595245361328125, 0.07666015625, 0.0937957763671875, 0.110931396484375, 0.1280670166015625, 0.14520263671875, 0.1623382568359375, 0.179473876953125, 0.1966094970703125, 0.2137451171875, 0.2308807373046875, 0.248016357421875, 0.2651519775390625, 0.28228759765625, 0.2994232177734375, 0.316558837890625, 0.3336944580078125, 0.350830078125, 0.3679656982421875, 0.385101318359375, 0.4022369384765625, 0.41937255859375, 0.4365081787109375, 0.453643798828125, 0.4707794189453125, 0.4879150390625, 0.5050506591796875, 0.522186279296875, 0.5393218994140625, 0.55645751953125, 0.5735931396484375, 0.590728759765625, 0.6078643798828125, 0.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 3.0, 8.0, 8.0, 5.0, 11.0, 11.0, 17.0, 19.0, 30.0, 28.0, 44.0, 60.0, 72.0, 88.0, 141.0, 91.0, 91.0, 57.0, 45.0, 38.0, 27.0, 25.0, 18.0, 10.0, 9.0, 11.0, 4.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.410215377807617e-05, -8.11498612165451e-05, -7.819756865501404e-05, -7.524527609348297e-05, -7.22929835319519e-05, -6.934069097042084e-05, -6.638839840888977e-05, -6.34361058473587e-05, -6.048381328582764e-05, -5.753152072429657e-05, -5.45792281627655e-05, -5.1626935601234436e-05, -4.867464303970337e-05, -4.57223504781723e-05, -4.2770057916641235e-05, -3.981776535511017e-05, -3.68654727935791e-05, -3.3913180232048035e-05, -3.096088767051697e-05, -2.80085951089859e-05, -2.5056302547454834e-05, -2.2104009985923767e-05, -1.91517174243927e-05, -1.6199424862861633e-05, -1.3247132301330566e-05, -1.02948397397995e-05, -7.342547178268433e-06, -4.390254616737366e-06, -1.4379620552062988e-06, 1.514330506324768e-06, 4.466623067855835e-06, 7.418915629386902e-06, 1.0371208190917969e-05, 1.3323500752449036e-05, 1.6275793313980103e-05, 1.922808587551117e-05, 2.2180378437042236e-05, 2.5132670998573303e-05, 2.808496356010437e-05, 3.103725612163544e-05, 3.3989548683166504e-05, 3.694184124469757e-05, 3.989413380622864e-05, 4.2846426367759705e-05, 4.579871892929077e-05, 4.875101149082184e-05, 5.1703304052352905e-05, 5.465559661388397e-05, 5.760788917541504e-05, 6.0560181736946106e-05, 6.351247429847717e-05, 6.646476686000824e-05, 6.94170594215393e-05, 7.236935198307037e-05, 7.532164454460144e-05, 7.827393710613251e-05, 8.122622966766357e-05, 8.417852222919464e-05, 8.713081479072571e-05, 9.008310735225677e-05, 9.303539991378784e-05, 9.598769247531891e-05, 9.893998503684998e-05, 0.00010189227759838104, 0.00010484457015991211]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 4.0, 4.0, 8.0, 8.0, 11.0, 16.0, 22.0, 36.0, 72.0, 89.0, 175.0, 330.0, 811.0, 2185.0, 7855.0, 43413.0, 906126.0, 72060.0, 10758.0, 2704.0, 920.0, 382.0, 215.0, 113.0, 75.0, 53.0, 30.0, 22.0, 17.0, 13.0, 8.0, 4.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5807723999023438, -0.5604705810546875, -0.5401687622070312, -0.519866943359375, -0.49956512451171875, -0.4792633056640625, -0.45896148681640625, -0.43865966796875, -0.41835784912109375, -0.3980560302734375, -0.37775421142578125, -0.357452392578125, -0.33715057373046875, -0.3168487548828125, -0.29654693603515625, -0.2762451171875, -0.25594329833984375, -0.2356414794921875, -0.21533966064453125, -0.195037841796875, -0.17473602294921875, -0.1544342041015625, -0.13413238525390625, -0.11383056640625, -0.09352874755859375, -0.0732269287109375, -0.05292510986328125, -0.032623291015625, -0.01232147216796875, 0.0079803466796875, 0.02828216552734375, 0.048583984375, 0.06888580322265625, 0.0891876220703125, 0.10948944091796875, 0.129791259765625, 0.15009307861328125, 0.1703948974609375, 0.19069671630859375, 0.21099853515625, 0.23130035400390625, 0.2516021728515625, 0.27190399169921875, 0.292205810546875, 0.31250762939453125, 0.3328094482421875, 0.35311126708984375, 0.3734130859375, 0.39371490478515625, 0.4140167236328125, 0.43431854248046875, 0.454620361328125, 0.47492218017578125, 0.4952239990234375, 0.5155258178710938, 0.53582763671875, 0.5561294555664062, 0.5764312744140625, 0.5967330932617188, 0.617034912109375, 0.6373367309570312, 0.6576385498046875, 0.6779403686523438, 0.6982421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 9.0, 8.0, 2.0, 7.0, 9.0, 11.0, 19.0, 13.0, 24.0, 41.0, 44.0, 76.0, 117.0, 141.0, 142.0, 110.0, 67.0, 42.0, 30.0, 20.0, 14.0, 13.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376220703125, -0.3581123352050781, -0.34000396728515625, -0.3218955993652344, -0.3037872314453125, -0.2856788635253906, -0.26757049560546875, -0.24946212768554688, -0.231353759765625, -0.21324539184570312, -0.19513702392578125, -0.17702865600585938, -0.1589202880859375, -0.14081192016601562, -0.12270355224609375, -0.10459518432617188, -0.08648681640625, -0.06837844848632812, -0.05027008056640625, -0.032161712646484375, -0.0140533447265625, 0.004055023193359375, 0.02216339111328125, 0.040271759033203125, 0.058380126953125, 0.07648849487304688, 0.09459686279296875, 0.11270523071289062, 0.1308135986328125, 0.14892196655273438, 0.16703033447265625, 0.18513870239257812, 0.2032470703125, 0.22135543823242188, 0.23946380615234375, 0.2575721740722656, 0.2756805419921875, 0.2937889099121094, 0.31189727783203125, 0.3300056457519531, 0.348114013671875, 0.3662223815917969, 0.38433074951171875, 0.4024391174316406, 0.4205474853515625, 0.4386558532714844, 0.45676422119140625, 0.4748725891113281, 0.49298095703125, 0.5110893249511719, 0.5291976928710938, 0.5473060607910156, 0.5654144287109375, 0.5835227966308594, 0.6016311645507812, 0.6197395324707031, 0.637847900390625, 0.6559562683105469, 0.6740646362304688, 0.6921730041503906, 0.7102813720703125, 0.7283897399902344, 0.7464981079101562, 0.7646064758300781, 0.78271484375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 8.0, 17.0, 33.0, 76.0, 243.0, 494.0, 73.0, 39.0, 10.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.34946823120117, -31.34620475769043, -30.34294319152832, -29.339679718017578, -28.336416244506836, -27.333152770996094, -26.329891204833984, -25.326627731323242, -24.3233642578125, -23.320100784301758, -22.31683921813965, -21.313575744628906, -20.310312271118164, -19.307048797607422, -18.303787231445312, -17.30052375793457, -16.29726219177246, -15.293999671936035, -14.290736198425293, -13.287473678588867, -12.284210205078125, -11.2809476852417, -10.277685165405273, -9.274421691894531, -8.271159172058105, -7.2678961753845215, -6.2646331787109375, -5.261370658874512, -4.258107662200928, -3.2548446655273438, -2.251582145690918, -1.248319149017334, -0.24505615234375, 0.7582067251205444, 1.7614696025848389, 2.7647323608398438, 3.7679953575134277, 4.771258354187012, 5.7745208740234375, 6.7777838706970215, 7.7810468673706055, 8.784309387207031, 9.787572860717773, 10.7908353805542, 11.794097900390625, 12.797361373901367, 13.800623893737793, 14.803886413574219, 15.807149887084961, 16.810413360595703, 17.813674926757812, 18.816938400268555, 19.820201873779297, 20.823463439941406, 21.82672691345215, 22.82999038696289, 23.833251953125, 24.836515426635742, 25.83977699279785, 26.843040466308594, 27.846303939819336, 28.849567413330078, 29.852828979492188, 30.85609245300293, 31.859355926513672]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 8.0, 10.0, 14.0, 15.0, 11.0, 22.0, 25.0, 25.0, 53.0, 90.0, 160.0, 183.0, 131.0, 46.0, 40.0, 32.0, 26.0, 32.0, 18.0, 14.0, 8.0, 16.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.364177703857422, -22.718461990356445, -22.072744369506836, -21.42702865600586, -20.78131103515625, -20.135595321655273, -19.489879608154297, -18.844161987304688, -18.19844627380371, -17.552730560302734, -16.907012939453125, -16.26129722595215, -15.615580558776855, -14.969863891601562, -14.324148178100586, -13.678431510925293, -13.03271484375, -12.386998176574707, -11.741281509399414, -11.095565795898438, -10.449849128723145, -9.804132461547852, -9.158416748046875, -8.512700080871582, -7.866983413696289, -7.221266746520996, -6.575550556182861, -5.929834365844727, -5.284117698669434, -4.638401031494141, -3.992684841156006, -3.346968650817871, -2.701253890991211, -2.055537462234497, -1.4098210334777832, -0.7641046047210693, -0.11838817596435547, 0.5273282527923584, 1.1730446815490723, 1.818760871887207, 2.4644775390625, 3.110193967819214, 3.7559103965759277, 4.4016265869140625, 5.0473432540893555, 5.693059921264648, 6.338776111602783, 6.984492301940918, 7.630208969116211, 8.275925636291504, 8.921642303466797, 9.567358016967773, 10.213074684143066, 10.85879135131836, 11.504507064819336, 12.150223731994629, 12.795940399169922, 13.441657066345215, 14.087373733520508, 14.733089447021484, 15.378806114196777, 16.02452278137207, 16.670238494873047, 17.315956115722656, 17.961671829223633]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 8.0, 13.0, 12.0, 15.0, 19.0, 29.0, 31.0, 34.0, 30.0, 56.0, 202.0, 228.0, 68.0, 51.0, 43.0, 38.0, 17.0, 24.0, 15.0, 6.0, 8.0, 9.0, 11.0, 10.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.923828125, -1.870391845703125, -1.81695556640625, -1.763519287109375, -1.7100830078125, -1.656646728515625, -1.60321044921875, -1.549774169921875, -1.496337890625, -1.442901611328125, -1.38946533203125, -1.336029052734375, -1.2825927734375, -1.229156494140625, -1.17572021484375, -1.122283935546875, -1.06884765625, -1.015411376953125, -0.96197509765625, -0.908538818359375, -0.8551025390625, -0.801666259765625, -0.74822998046875, -0.694793701171875, -0.641357421875, -0.587921142578125, -0.53448486328125, -0.481048583984375, -0.4276123046875, -0.374176025390625, -0.32073974609375, -0.267303466796875, -0.2138671875, -0.160430908203125, -0.10699462890625, -0.053558349609375, -0.0001220703125, 0.053314208984375, 0.10675048828125, 0.160186767578125, 0.213623046875, 0.267059326171875, 0.32049560546875, 0.373931884765625, 0.4273681640625, 0.480804443359375, 0.53424072265625, 0.587677001953125, 0.64111328125, 0.694549560546875, 0.74798583984375, 0.801422119140625, 0.8548583984375, 0.908294677734375, 0.96173095703125, 1.015167236328125, 1.068603515625, 1.122039794921875, 1.17547607421875, 1.228912353515625, 1.2823486328125, 1.335784912109375, 1.38922119140625, 1.442657470703125, 1.49609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 12.0, 12.0, 16.0, 10.0, 32.0, 40.0, 100.0, 160.0, 360.0, 830.0, 2862.0, 18627.0, 8348735.0, 12993.0, 2387.0, 715.0, 324.0, 133.0, 74.0, 45.0, 36.0, 20.0, 12.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.696331024169922, -16.225074768066406, -15.753816604614258, -15.282560348510742, -14.81130313873291, -14.340045928955078, -13.868789672851562, -13.39753246307373, -12.926275253295898, -12.455018043518066, -11.983760833740234, -11.512504577636719, -11.041247367858887, -10.569990158081055, -10.098733901977539, -9.627476692199707, -9.156219482421875, -8.684962272644043, -8.213705062866211, -7.742448806762695, -7.271191596984863, -6.799934387207031, -6.328677654266357, -5.857420921325684, -5.386163711547852, -4.9149065017700195, -4.443649768829346, -3.9723927974700928, -3.50113582611084, -3.029878854751587, -2.558621883392334, -2.087364912033081, -1.6161069869995117, -1.1448500156402588, -0.6735930442810059, -0.20233607292175293, 0.2689208984375, 0.7401778697967529, 1.2114348411560059, 1.6826918125152588, 2.1539487838745117, 2.6252057552337646, 3.0964627265930176, 3.5677196979522705, 4.038976669311523, 4.5102338790893555, 4.981490612030029, 5.452747344970703, 5.924004554748535, 6.395261764526367, 6.866518497467041, 7.337775230407715, 7.809032440185547, 8.280289649963379, 8.751546859741211, 9.222803115844727, 9.694060325622559, 10.16531753540039, 10.636573791503906, 11.107831001281738, 11.57908821105957, 12.050345420837402, 12.521602630615234, 12.99285888671875, 13.464116096496582]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 7.0, 3.0, 8.0, 9.0, 9.0, 6.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.5355281829834, -22.650772094726562, -21.766014099121094, -20.881258010864258, -19.996501922607422, -19.111743927001953, -18.226987838745117, -17.34223175048828, -16.457473754882812, -15.57271671295166, -14.687959671020508, -13.803203582763672, -12.91844654083252, -12.033689498901367, -11.148933410644531, -10.264176368713379, -9.379419326782227, -8.494662284851074, -7.60990571975708, -6.725149154663086, -5.840392112731934, -4.955635070800781, -4.070878505706787, -3.186121940612793, -2.3013648986816406, -1.4166080951690674, -0.5318512916564941, 0.3529055118560791, 1.2376623153686523, 2.1224193572998047, 3.007175922393799, 3.891932487487793, 4.776691436767578, 5.6614484786987305, 6.546205043792725, 7.430961608886719, 8.315718650817871, 9.200475692749023, 10.08523178100586, 10.969988822937012, 11.854745864868164, 12.739502906799316, 13.624259948730469, 14.509016036987305, 15.393773078918457, 16.27853012084961, 17.163286209106445, 18.04804229736328, 18.93280029296875, 19.817556381225586, 20.702314376831055, 21.58707046508789, 22.47182846069336, 23.356584548950195, 24.24134063720703, 25.1260986328125, 26.010854721069336, 26.895610809326172, 27.78036880493164, 28.665124893188477, 29.549880981445312, 30.43463897705078, 31.319395065307617, 32.20415115356445, 33.08890914916992]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 12.0, 16.0, 20.0, 31.0, 35.0, 52.0, 82.0, 136.0, 170.0, 300.0, 532.0, 957.0, 2169.0, 5125.0, 14981.0, 53362.0, 207988.0, 173040.0, 43616.0, 12949.0, 4647.0, 1910.0, 903.0, 494.0, 258.0, 148.0, 103.0, 63.0, 41.0, 30.0, 23.0, 17.0, 10.0, 7.0, 11.0, 10.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8671875, -9.47119140625, -9.0751953125, -8.67919921875, -8.283203125, -7.88720703125, -7.4912109375, -7.09521484375, -6.69921875, -6.30322265625, -5.9072265625, -5.51123046875, -5.115234375, -4.71923828125, -4.3232421875, -3.92724609375, -3.53125, -3.13525390625, -2.7392578125, -2.34326171875, -1.947265625, -1.55126953125, -1.1552734375, -0.75927734375, -0.36328125, 0.03271484375, 0.4287109375, 0.82470703125, 1.220703125, 1.61669921875, 2.0126953125, 2.40869140625, 2.8046875, 3.20068359375, 3.5966796875, 3.99267578125, 4.388671875, 4.78466796875, 5.1806640625, 5.57666015625, 5.97265625, 6.36865234375, 6.7646484375, 7.16064453125, 7.556640625, 7.95263671875, 8.3486328125, 8.74462890625, 9.140625, 9.53662109375, 9.9326171875, 10.32861328125, 10.724609375, 11.12060546875, 11.5166015625, 11.91259765625, 12.30859375, 12.70458984375, 13.1005859375, 13.49658203125, 13.892578125, 14.28857421875, 14.6845703125, 15.08056640625, 15.4765625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 3.0, 7.0, 5.0, 12.0, 9.0, 11.0, 11.0, 17.0, 17.0, 26.0, 38.0, 27.0, 40.0, 64.0, 58.0, 66.0, 65.0, 67.0, 82.0, 46.0, 54.0, 49.0, 31.0, 39.0, 22.0, 18.0, 30.0, 21.0, 20.0, 11.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5244140625, -1.4751129150390625, -1.425811767578125, -1.3765106201171875, -1.32720947265625, -1.2779083251953125, -1.228607177734375, -1.1793060302734375, -1.1300048828125, -1.0807037353515625, -1.031402587890625, -0.9821014404296875, -0.93280029296875, -0.8834991455078125, -0.834197998046875, -0.7848968505859375, -0.735595703125, -0.6862945556640625, -0.636993408203125, -0.5876922607421875, -0.53839111328125, -0.4890899658203125, -0.439788818359375, -0.3904876708984375, -0.3411865234375, -0.2918853759765625, -0.242584228515625, -0.1932830810546875, -0.14398193359375, -0.0946807861328125, -0.045379638671875, 0.0039215087890625, 0.05322265625, 0.1025238037109375, 0.151824951171875, 0.2011260986328125, 0.25042724609375, 0.2997283935546875, 0.349029541015625, 0.3983306884765625, 0.4476318359375, 0.4969329833984375, 0.546234130859375, 0.5955352783203125, 0.64483642578125, 0.6941375732421875, 0.743438720703125, 0.7927398681640625, 0.842041015625, 0.8913421630859375, 0.940643310546875, 0.9899444580078125, 1.03924560546875, 1.0885467529296875, 1.137847900390625, 1.1871490478515625, 1.2364501953125, 1.2857513427734375, 1.335052490234375, 1.3843536376953125, 1.43365478515625, 1.4829559326171875, 1.532257080078125, 1.5815582275390625, 1.630859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 10.0, 9.0, 14.0, 15.0, 24.0, 40.0, 86.0, 88.0, 69.0, 44.0, 29.0, 12.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.313547134399414, -9.968452453613281, -9.623358726501465, -9.278264045715332, -8.933170318603516, -8.588075637817383, -8.24298095703125, -7.897887229919434, -7.552793025970459, -7.207698822021484, -6.86260461807251, -6.517510414123535, -6.172415733337402, -5.827322006225586, -5.482227325439453, -5.1371331214904785, -4.792038917541504, -4.446944713592529, -4.101850509643555, -3.756756067276001, -3.4116618633270264, -3.0665676593780518, -2.721473217010498, -2.3763790130615234, -2.031284809112549, -1.6861906051635742, -1.34109628200531, -0.9960019588470459, -0.6509077548980713, -0.3058135509490967, 0.03928089141845703, 0.38437509536743164, 0.7294692993164062, 1.0745635032653809, 1.419657826423645, 1.7647521495819092, 2.109846353530884, 2.4549405574798584, 2.800034999847412, 3.1451292037963867, 3.4902234077453613, 3.835317611694336, 4.1804118156433105, 4.525506019592285, 4.870600700378418, 5.215694427490234, 5.560789108276367, 5.905883312225342, 6.250977516174316, 6.596071720123291, 6.941165924072266, 7.286260604858398, 7.631354331970215, 7.976449012756348, 8.321542739868164, 8.666637420654297, 9.01173210144043, 9.356826782226562, 9.701920509338379, 10.047015190124512, 10.392108917236328, 10.737203598022461, 11.082298278808594, 11.42739200592041, 11.772485733032227]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 4.0, 8.0, 16.0, 9.0, 14.0, 19.0, 29.0, 51.0, 67.0, 63.0, 55.0, 33.0, 30.0, 19.0, 17.0, 12.0, 5.0, 3.0, 5.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.644369125366211, -9.361872673034668, -9.079376220703125, -8.796879768371582, -8.514383316040039, -8.231886863708496, -7.949390411376953, -7.66689395904541, -7.384397506713867, -7.101901054382324, -6.819404602050781, -6.536908149719238, -6.254411697387695, -5.971915245056152, -5.689418792724609, -5.406922340393066, -5.124426364898682, -4.841929912567139, -4.559433460235596, -4.276937007904053, -3.9944405555725098, -3.711944103240967, -3.429447889328003, -3.14695143699646, -2.864454984664917, -2.581958532333374, -2.299462080001831, -2.016965866088867, -1.7344692945480347, -1.4519728422164917, -1.1694765090942383, -0.8869800567626953, -0.6044836044311523, -0.32198718190193176, -0.03949075937271118, 0.243005633354187, 0.52550208568573, 0.807998538017273, 1.0904948711395264, 1.3729913234710693, 1.6554877758026123, 1.9379842281341553, 2.2204806804656982, 2.502976894378662, 2.785473346710205, 3.067969799041748, 3.350466251373291, 3.632962703704834, 3.915459156036377, 4.19795560836792, 4.480452060699463, 4.762948513031006, 5.045444965362549, 5.327941417694092, 5.610437393188477, 5.8929338455200195, 6.1754302978515625, 6.4579267501831055, 6.740423202514648, 7.022919654846191, 7.305416107177734, 7.587912559509277, 7.87040901184082, 8.152905464172363, 8.435401916503906]}, "eval/loss": 1.8662452697753906, "eval/wer": 1.0954184847282824, "eval/runtime": 1261.4937, "eval/samples_per_second": 2.094, "eval/steps_per_second": 0.262} \ No newline at end of file