{"train/loss": 4.3938, "train/learning_rate": 3.9800000000000005e-05, "train/epoch": 0.78, "train/global_step": 200, "_runtime": 3628, "_timestamp": 1646210825, "_step": 199, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 583.0, 429.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-214.20204162597656, -183.53944396972656, -152.87684631347656, -122.2142562866211, -91.5516586303711, -60.889068603515625, -30.226470947265625, 0.436126708984375, 31.098724365234375, 61.761322021484375, 92.42391967773438, 123.08650970458984, 153.74911499023438, 184.4116973876953, 215.0742950439453, 245.7368927001953, 276.39947509765625, 307.06207275390625, 337.72467041015625, 368.38726806640625, 399.04986572265625, 429.71246337890625, 460.37506103515625, 491.03765869140625, 521.7002563476562, 552.3628540039062, 583.0254516601562, 613.6880493164062, 644.3506469726562, 675.0132446289062, 705.6758422851562, 736.3384399414062, 767.0010375976562, 797.6636352539062, 828.3262329101562, 858.9888305664062, 889.6514282226562, 920.3140258789062, 950.9766235351562, 981.6392211914062, 1012.3018188476562, 1042.96435546875, 1073.626953125, 1104.28955078125, 1134.9521484375, 1165.61474609375, 1196.27734375, 1226.93994140625, 1257.6025390625, 1288.26513671875, 1318.927734375, 1349.59033203125, 1380.2529296875, 1410.91552734375, 1441.578125, 1472.24072265625, 1502.9033203125, 1533.56591796875, 1564.228515625, 1594.89111328125, 1625.5537109375, 1656.21630859375, 1686.87890625, 1717.54150390625, 1748.2041015625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 2.0, 7.0, 7.0, 8.0, 8.0, 14.0, 11.0, 18.0, 16.0, 24.0, 37.0, 40.0, 39.0, 33.0, 57.0, 44.0, 50.0, 56.0, 43.0, 46.0, 63.0, 54.0, 42.0, 57.0, 42.0, 23.0, 36.0, 23.0, 19.0, 17.0, 13.0, 12.0, 5.0, 9.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.32231140136719, -112.09468078613281, -107.86705017089844, -103.63941192626953, -99.41178131103516, -95.18415069580078, -90.95651245117188, -86.7288818359375, -82.50125122070312, -78.27362060546875, -74.04598999023438, -69.81835174560547, -65.5907211303711, -61.36309051513672, -57.13545608520508, -52.90782165527344, -48.68019104003906, -44.45256042480469, -40.22492599487305, -35.997291564941406, -31.76966094970703, -27.542028427124023, -23.314395904541016, -19.086763381958008, -14.859130859375, -10.631498336791992, -6.403865814208984, -2.1762332916259766, 2.0513992309570312, 6.279031753540039, 10.506664276123047, 14.734296798706055, 18.961944580078125, 23.189577102661133, 27.41720962524414, 31.64484214782715, 35.872474670410156, 40.10010528564453, 44.32773971557617, 48.55537414550781, 52.78300476074219, 57.01063537597656, 61.2382698059082, 65.46590423583984, 69.69353485107422, 73.9211654663086, 78.1488037109375, 82.37643432617188, 86.60406494140625, 90.83169555664062, 95.059326171875, 99.2869644165039, 103.51459503173828, 107.74222564697266, 111.96986389160156, 116.19749450683594, 120.42512512207031, 124.65275573730469, 128.88038635253906, 133.10801696777344, 137.33566284179688, 141.56329345703125, 145.79092407226562, 150.0185546875, 154.24618530273438]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 12.0, 7.0, 14.0, 17.0, 15.0, 9.0, 30.0, 46.0, 30.0, 43.0, 50.0, 40.0, 44.0, 43.0, 56.0, 54.0, 48.0, 55.0, 63.0, 45.0, 45.0, 42.0, 31.0, 34.0, 22.0, 19.0, 20.0, 15.0, 11.0, 6.0, 9.0, 4.0, 8.0, 1.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-10.2578125, -9.99139404296875, -9.7249755859375, -9.45855712890625, -9.192138671875, -8.92572021484375, -8.6593017578125, -8.39288330078125, -8.12646484375, -7.86004638671875, -7.5936279296875, -7.32720947265625, -7.060791015625, -6.79437255859375, -6.5279541015625, -6.26153564453125, -5.9951171875, -5.72869873046875, -5.4622802734375, -5.19586181640625, -4.929443359375, -4.66302490234375, -4.3966064453125, -4.13018798828125, -3.86376953125, -3.59735107421875, -3.3309326171875, -3.06451416015625, -2.798095703125, -2.53167724609375, -2.2652587890625, -1.99884033203125, -1.732421875, -1.46600341796875, -1.1995849609375, -0.93316650390625, -0.666748046875, -0.40032958984375, -0.1339111328125, 0.13250732421875, 0.39892578125, 0.66534423828125, 0.9317626953125, 1.19818115234375, 1.464599609375, 1.73101806640625, 1.9974365234375, 2.26385498046875, 2.5302734375, 2.79669189453125, 3.0631103515625, 3.32952880859375, 3.595947265625, 3.86236572265625, 4.1287841796875, 4.39520263671875, 4.66162109375, 4.92803955078125, 5.1944580078125, 5.46087646484375, 5.727294921875, 5.99371337890625, 6.2601318359375, 6.52655029296875, 6.79296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 7.0, 16.0, 15.0, 25.0, 53.0, 57.0, 105.0, 165.0, 292.0, 474.0, 770.0, 1503.0, 3132.0, 7687.0, 26624.0, 170288.0, 2646197.0, 1227234.0, 82122.0, 16824.0, 5668.0, 2336.0, 1130.0, 655.0, 309.0, 216.0, 155.0, 78.0, 50.0, 28.0, 23.0, 11.0, 10.0, 7.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.171875, -24.233642578125, -23.29541015625, -22.357177734375, -21.4189453125, -20.480712890625, -19.54248046875, -18.604248046875, -17.666015625, -16.727783203125, -15.78955078125, -14.851318359375, -13.9130859375, -12.974853515625, -12.03662109375, -11.098388671875, -10.16015625, -9.221923828125, -8.28369140625, -7.345458984375, -6.4072265625, -5.468994140625, -4.53076171875, -3.592529296875, -2.654296875, -1.716064453125, -0.77783203125, 0.160400390625, 1.0986328125, 2.036865234375, 2.97509765625, 3.913330078125, 4.8515625, 5.789794921875, 6.72802734375, 7.666259765625, 8.6044921875, 9.542724609375, 10.48095703125, 11.419189453125, 12.357421875, 13.295654296875, 14.23388671875, 15.172119140625, 16.1103515625, 17.048583984375, 17.98681640625, 18.925048828125, 19.86328125, 20.801513671875, 21.73974609375, 22.677978515625, 23.6162109375, 24.554443359375, 25.49267578125, 26.430908203125, 27.369140625, 28.307373046875, 29.24560546875, 30.183837890625, 31.1220703125, 32.060302734375, 32.99853515625, 33.936767578125, 34.875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 14.0, 33.0, 39.0, 63.0, 108.0, 164.0, 344.0, 652.0, 845.0, 726.0, 450.0, 243.0, 166.0, 86.0, 45.0, 29.0, 16.0, 10.0, 13.0, 4.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.375, -35.9697265625, -34.564453125, -33.1591796875, -31.75390625, -30.3486328125, -28.943359375, -27.5380859375, -26.1328125, -24.7275390625, -23.322265625, -21.9169921875, -20.51171875, -19.1064453125, -17.701171875, -16.2958984375, -14.890625, -13.4853515625, -12.080078125, -10.6748046875, -9.26953125, -7.8642578125, -6.458984375, -5.0537109375, -3.6484375, -2.2431640625, -0.837890625, 0.5673828125, 1.97265625, 3.3779296875, 4.783203125, 6.1884765625, 7.59375, 8.9990234375, 10.404296875, 11.8095703125, 13.21484375, 14.6201171875, 16.025390625, 17.4306640625, 18.8359375, 20.2412109375, 21.646484375, 23.0517578125, 24.45703125, 25.8623046875, 27.267578125, 28.6728515625, 30.078125, 31.4833984375, 32.888671875, 34.2939453125, 35.69921875, 37.1044921875, 38.509765625, 39.9150390625, 41.3203125, 42.7255859375, 44.130859375, 45.5361328125, 46.94140625, 48.3466796875, 49.751953125, 51.1572265625, 52.5625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 14.0, 18.0, 45.0, 99.0, 209.0, 430.0, 1069.0, 4562.0, 1943743.0, 2237006.0, 4944.0, 1199.0, 464.0, 193.0, 111.0, 61.0, 34.0, 16.0, 8.0, 12.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-180.375, -174.91015625, -169.4453125, -163.98046875, -158.515625, -153.05078125, -147.5859375, -142.12109375, -136.65625, -131.19140625, -125.7265625, -120.26171875, -114.796875, -109.33203125, -103.8671875, -98.40234375, -92.9375, -87.47265625, -82.0078125, -76.54296875, -71.078125, -65.61328125, -60.1484375, -54.68359375, -49.21875, -43.75390625, -38.2890625, -32.82421875, -27.359375, -21.89453125, -16.4296875, -10.96484375, -5.5, -0.03515625, 5.4296875, 10.89453125, 16.359375, 21.82421875, 27.2890625, 32.75390625, 38.21875, 43.68359375, 49.1484375, 54.61328125, 60.078125, 65.54296875, 71.0078125, 76.47265625, 81.9375, 87.40234375, 92.8671875, 98.33203125, 103.796875, 109.26171875, 114.7265625, 120.19140625, 125.65625, 131.12109375, 136.5859375, 142.05078125, 147.515625, 152.98046875, 158.4453125, 163.91015625, 169.375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 23.0, 781.0, 206.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1118.4102783203125, -1094.9495849609375, -1071.4888916015625, -1048.0281982421875, -1024.5675048828125, -1001.1068725585938, -977.6461791992188, -954.1854858398438, -930.724853515625, -907.26416015625, -883.803466796875, -860.3427734375, -836.8821411132812, -813.4214477539062, -789.9607543945312, -766.5000610351562, -743.0393676757812, -719.5786743164062, -696.1179809570312, -672.6573486328125, -649.1966552734375, -625.7359619140625, -602.2752685546875, -578.8145751953125, -555.3538818359375, -531.8931884765625, -508.4325256347656, -484.9718322753906, -461.51116943359375, -438.05047607421875, -414.58978271484375, -391.12908935546875, -367.66851806640625, -344.20782470703125, -320.7471618652344, -297.2864685058594, -273.8258056640625, -250.3651123046875, -226.9044189453125, -203.44374084472656, -179.98306274414062, -156.5223846435547, -133.06170654296875, -109.60101318359375, -86.14033508300781, -62.679656982421875, -39.218963623046875, -15.758285522460938, 7.702392578125, 31.163074493408203, 54.623756408691406, 78.08444213867188, 101.54512023925781, 125.00579833984375, 148.46649169921875, 171.9271697998047, 195.38784790039062, 218.84852600097656, 242.3092041015625, 265.7698974609375, 289.2305908203125, 312.6912536621094, 336.1519470214844, 359.61260986328125, 383.07330322265625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 14.0, 5.0, 14.0, 18.0, 19.0, 19.0, 22.0, 33.0, 21.0, 33.0, 27.0, 41.0, 40.0, 50.0, 50.0, 54.0, 40.0, 50.0, 50.0, 50.0, 48.0, 49.0, 45.0, 28.0, 35.0, 28.0, 16.0, 18.0, 10.0, 20.0, 11.0, 16.0, 8.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-133.56314086914062, -129.90260314941406, -126.2420654296875, -122.58152770996094, -118.92098999023438, -115.26045227050781, -111.59991455078125, -107.93937683105469, -104.27883911132812, -100.61830139160156, -96.957763671875, -93.29722595214844, -89.63668823242188, -85.97615051269531, -82.31561279296875, -78.65507507324219, -74.99454498291016, -71.3340072631836, -67.67346954345703, -64.01293182373047, -60.352394104003906, -56.691856384277344, -53.03132247924805, -49.370784759521484, -45.71024703979492, -42.04970932006836, -38.3891716003418, -34.7286376953125, -31.068098068237305, -27.407560348510742, -23.747024536132812, -20.08648681640625, -16.42595672607422, -12.765419006347656, -9.10488224029541, -5.444345474243164, -1.7838077545166016, 1.876729965209961, 5.537265777587891, 9.197803497314453, 12.858341217041016, 16.518878936767578, 20.17941665649414, 23.83995246887207, 27.500490188598633, 31.161027908325195, 34.821563720703125, 38.48210144042969, 42.14263916015625, 45.80317687988281, 49.463714599609375, 53.12425231933594, 56.7847900390625, 60.44532775878906, 64.10586547851562, 67.76640319824219, 71.42694091796875, 75.08747863769531, 78.74801635742188, 82.40855407714844, 86.069091796875, 89.72962951660156, 93.39016723632812, 97.05070495605469, 100.71123504638672]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 13.0, 21.0, 11.0, 21.0, 19.0, 22.0, 33.0, 38.0, 29.0, 29.0, 49.0, 43.0, 48.0, 50.0, 48.0, 56.0, 51.0, 44.0, 47.0, 37.0, 33.0, 38.0, 24.0, 23.0, 29.0, 19.0, 25.0, 13.0, 8.0, 9.0, 13.0, 6.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.0213623046875, -7.761474609375, -7.5015869140625, -7.24169921875, -6.9818115234375, -6.721923828125, -6.4620361328125, -6.2021484375, -5.9422607421875, -5.682373046875, -5.4224853515625, -5.16259765625, -4.9027099609375, -4.642822265625, -4.3829345703125, -4.123046875, -3.8631591796875, -3.603271484375, -3.3433837890625, -3.08349609375, -2.8236083984375, -2.563720703125, -2.3038330078125, -2.0439453125, -1.7840576171875, -1.524169921875, -1.2642822265625, -1.00439453125, -0.7445068359375, -0.484619140625, -0.2247314453125, 0.03515625, 0.2950439453125, 0.554931640625, 0.8148193359375, 1.07470703125, 1.3345947265625, 1.594482421875, 1.8543701171875, 2.1142578125, 2.3741455078125, 2.634033203125, 2.8939208984375, 3.15380859375, 3.4136962890625, 3.673583984375, 3.9334716796875, 4.193359375, 4.4532470703125, 4.713134765625, 4.9730224609375, 5.23291015625, 5.4927978515625, 5.752685546875, 6.0125732421875, 6.2724609375, 6.5323486328125, 6.792236328125, 7.0521240234375, 7.31201171875, 7.5718994140625, 7.831787109375, 8.0916748046875, 8.3515625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 13.0, 12.0, 28.0, 39.0, 52.0, 71.0, 136.0, 182.0, 304.0, 549.0, 720.0, 1089.0, 1787.0, 2881.0, 4592.0, 7319.0, 11702.0, 18498.0, 29483.0, 46885.0, 74587.0, 118110.0, 189724.0, 200551.0, 125900.0, 78712.0, 50013.0, 31632.0, 19521.0, 12382.0, 7880.0, 4758.0, 3048.0, 2014.0, 1184.0, 750.0, 511.0, 312.0, 210.0, 150.0, 90.0, 45.0, 31.0, 28.0, 24.0, 16.0, 6.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.947265625, -0.9186172485351562, -0.8899688720703125, -0.8613204956054688, -0.832672119140625, -0.8040237426757812, -0.7753753662109375, -0.7467269897460938, -0.71807861328125, -0.6894302368164062, -0.6607818603515625, -0.6321334838867188, -0.603485107421875, -0.5748367309570312, -0.5461883544921875, -0.5175399780273438, -0.4888916015625, -0.46024322509765625, -0.4315948486328125, -0.40294647216796875, -0.374298095703125, -0.34564971923828125, -0.3170013427734375, -0.28835296630859375, -0.25970458984375, -0.23105621337890625, -0.2024078369140625, -0.17375946044921875, -0.145111083984375, -0.11646270751953125, -0.0878143310546875, -0.05916595458984375, -0.030517578125, -0.00186920166015625, 0.0267791748046875, 0.05542755126953125, 0.084075927734375, 0.11272430419921875, 0.1413726806640625, 0.17002105712890625, 0.19866943359375, 0.22731781005859375, 0.2559661865234375, 0.28461456298828125, 0.313262939453125, 0.34191131591796875, 0.3705596923828125, 0.39920806884765625, 0.4278564453125, 0.45650482177734375, 0.4851531982421875, 0.5138015747070312, 0.542449951171875, 0.5710983276367188, 0.5997467041015625, 0.6283950805664062, 0.65704345703125, 0.6856918334960938, 0.7143402099609375, 0.7429885864257812, 0.771636962890625, 0.8002853393554688, 0.8289337158203125, 0.8575820922851562, 0.88623046875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 6.0, 9.0, 8.0, 7.0, 11.0, 20.0, 19.0, 20.0, 25.0, 19.0, 29.0, 44.0, 37.0, 32.0, 42.0, 54.0, 34.0, 38.0, 50.0, 1067.0, 36.0, 40.0, 40.0, 45.0, 41.0, 31.0, 31.0, 32.0, 19.0, 20.0, 16.0, 20.0, 9.0, 15.0, 8.0, 10.0, 15.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.47735595703125, -4.3179931640625, -4.15863037109375, -3.999267578125, -3.83990478515625, -3.6805419921875, -3.52117919921875, -3.36181640625, -3.20245361328125, -3.0430908203125, -2.88372802734375, -2.724365234375, -2.56500244140625, -2.4056396484375, -2.24627685546875, -2.0869140625, -1.92755126953125, -1.7681884765625, -1.60882568359375, -1.449462890625, -1.29010009765625, -1.1307373046875, -0.97137451171875, -0.81201171875, -0.65264892578125, -0.4932861328125, -0.33392333984375, -0.174560546875, -0.01519775390625, 0.1441650390625, 0.30352783203125, 0.462890625, 0.62225341796875, 0.7816162109375, 0.94097900390625, 1.100341796875, 1.25970458984375, 1.4190673828125, 1.57843017578125, 1.73779296875, 1.89715576171875, 2.0565185546875, 2.21588134765625, 2.375244140625, 2.53460693359375, 2.6939697265625, 2.85333251953125, 3.0126953125, 3.17205810546875, 3.3314208984375, 3.49078369140625, 3.650146484375, 3.80950927734375, 3.9688720703125, 4.12823486328125, 4.28759765625, 4.44696044921875, 4.6063232421875, 4.76568603515625, 4.925048828125, 5.08441162109375, 5.2437744140625, 5.40313720703125, 5.5625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 20.0, 27.0, 58.0, 68.0, 106.0, 159.0, 226.0, 339.0, 517.0, 871.0, 1326.0, 1920.0, 2963.0, 4378.0, 6751.0, 10170.0, 15807.0, 23631.0, 36379.0, 55610.0, 87691.0, 138618.0, 1247443.0, 165827.0, 104650.0, 66652.0, 42764.0, 28157.0, 18597.0, 12103.0, 7983.0, 5194.0, 3518.0, 2197.0, 1464.0, 1031.0, 643.0, 440.0, 307.0, 208.0, 96.0, 75.0, 60.0, 28.0, 17.0, 13.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.833984375, -0.8084793090820312, -0.7829742431640625, -0.7574691772460938, -0.731964111328125, -0.7064590454101562, -0.6809539794921875, -0.6554489135742188, -0.62994384765625, -0.6044387817382812, -0.5789337158203125, -0.5534286499023438, -0.527923583984375, -0.5024185180664062, -0.4769134521484375, -0.45140838623046875, -0.4259033203125, -0.40039825439453125, -0.3748931884765625, -0.34938812255859375, -0.323883056640625, -0.29837799072265625, -0.2728729248046875, -0.24736785888671875, -0.22186279296875, -0.19635772705078125, -0.1708526611328125, -0.14534759521484375, -0.119842529296875, -0.09433746337890625, -0.0688323974609375, -0.04332733154296875, -0.017822265625, 0.00768280029296875, 0.0331878662109375, 0.05869293212890625, 0.084197998046875, 0.10970306396484375, 0.1352081298828125, 0.16071319580078125, 0.18621826171875, 0.21172332763671875, 0.2372283935546875, 0.26273345947265625, 0.288238525390625, 0.31374359130859375, 0.3392486572265625, 0.36475372314453125, 0.3902587890625, 0.41576385498046875, 0.4412689208984375, 0.46677398681640625, 0.492279052734375, 0.5177841186523438, 0.5432891845703125, 0.5687942504882812, 0.59429931640625, 0.6198043823242188, 0.6453094482421875, 0.6708145141601562, 0.696319580078125, 0.7218246459960938, 0.7473297119140625, 0.7728347778320312, 0.79833984375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 13.0, 6.0, 6.0, 11.0, 14.0, 18.0, 24.0, 32.0, 45.0, 40.0, 56.0, 57.0, 83.0, 83.0, 90.0, 83.0, 70.0, 57.0, 44.0, 41.0, 32.0, 17.0, 14.0, 8.0, 9.0, 13.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016450881958007812, -0.00158749520778656, -0.0015299022197723389, -0.0014723092317581177, -0.0014147162437438965, -0.0013571232557296753, -0.001299530267715454, -0.001241937279701233, -0.0011843442916870117, -0.0011267513036727905, -0.0010691583156585693, -0.0010115653276443481, -0.000953972339630127, -0.0008963793516159058, -0.0008387863636016846, -0.0007811933755874634, -0.0007236003875732422, -0.000666007399559021, -0.0006084144115447998, -0.0005508214235305786, -0.0004932284355163574, -0.00043563544750213623, -0.00037804245948791504, -0.00032044947147369385, -0.00026285648345947266, -0.00020526349544525146, -0.00014767050743103027, -9.007751941680908e-05, -3.248453140258789e-05, 2.51084566116333e-05, 8.270144462585449e-05, 0.00014029443264007568, 0.00019788742065429688, 0.00025548040866851807, 0.00031307339668273926, 0.00037066638469696045, 0.00042825937271118164, 0.00048585236072540283, 0.000543445348739624, 0.0006010383367538452, 0.0006586313247680664, 0.0007162243127822876, 0.0007738173007965088, 0.00083141028881073, 0.0008890032768249512, 0.0009465962648391724, 0.0010041892528533936, 0.0010617822408676147, 0.001119375228881836, 0.0011769682168960571, 0.0012345612049102783, 0.0012921541929244995, 0.0013497471809387207, 0.001407340168952942, 0.001464933156967163, 0.0015225261449813843, 0.0015801191329956055, 0.0016377121210098267, 0.0016953051090240479, 0.001752898097038269, 0.0018104910850524902, 0.0018680840730667114, 0.0019256770610809326, 0.001983270049095154, 0.002040863037109375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 12.0, 23.0, 15.0, 24.0, 22.0, 25.0, 32.0, 63.0, 60.0, 107.0, 148.0, 206.0, 286.0, 509.0, 1076.0, 955967.0, 87623.0, 848.0, 467.0, 300.0, 184.0, 166.0, 103.0, 64.0, 50.0, 32.0, 22.0, 18.0, 13.0, 16.0, 11.0, 10.0, 8.0, 4.0, 7.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0300750732421875, -0.02903437614440918, -0.02799367904663086, -0.02695298194885254, -0.02591228485107422, -0.0248715877532959, -0.023830890655517578, -0.022790193557739258, -0.021749496459960938, -0.020708799362182617, -0.019668102264404297, -0.018627405166625977, -0.017586708068847656, -0.016546010971069336, -0.015505313873291016, -0.014464616775512695, -0.013423919677734375, -0.012383222579956055, -0.011342525482177734, -0.010301828384399414, -0.009261131286621094, -0.008220434188842773, -0.007179737091064453, -0.006139039993286133, -0.0050983428955078125, -0.004057645797729492, -0.003016948699951172, -0.0019762516021728516, -0.0009355545043945312, 0.00010514259338378906, 0.0011458396911621094, 0.0021865367889404297, 0.00322723388671875, 0.00426793098449707, 0.005308628082275391, 0.006349325180053711, 0.007390022277832031, 0.008430719375610352, 0.009471416473388672, 0.010512113571166992, 0.011552810668945312, 0.012593507766723633, 0.013634204864501953, 0.014674901962280273, 0.015715599060058594, 0.016756296157836914, 0.017796993255615234, 0.018837690353393555, 0.019878387451171875, 0.020919084548950195, 0.021959781646728516, 0.023000478744506836, 0.024041175842285156, 0.025081872940063477, 0.026122570037841797, 0.027163267135620117, 0.028203964233398438, 0.029244661331176758, 0.030285358428955078, 0.0313260555267334, 0.03236675262451172, 0.03340744972229004, 0.03444814682006836, 0.03548884391784668, 0.036529541015625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 12.0, 52.0, 120.0, 304.0, 331.0, 135.0, 40.0, 12.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006757056689821184, -0.0006336048245429993, -0.0005915040383115411, -0.0005494032520800829, -0.0005073024076409638, -0.00046520159230567515, -0.0004231007769703865, -0.00038099996163509786, -0.0003388991462998092, -0.0002967983309645206, -0.00025469751562923193, -0.00021259670029394329, -0.00017049588495865464, -0.000128395069623366, -8.629425428807735e-05, -4.419343895278871e-05, -2.0926236175000668e-06, 4.000819171778858e-05, 8.210900705307722e-05, 0.00012420982238836586, 0.0001663106377236545, 0.00020841145305894315, 0.0002505122683942318, 0.00029261308372952044, 0.0003347138990648091, 0.00037681471440009773, 0.00041891552973538637, 0.000461016345070675, 0.0005031171604059637, 0.0005452180048450828, 0.000587318791076541, 0.0006294195773079991, 0.0006715203635394573, 0.0007136211497709155, 0.0007557219942100346, 0.0007978228386491537, 0.0008399236248806119, 0.0008820244111120701, 0.0009241252555511892, 0.0009662260999903083, 0.0010083268862217665, 0.0010504276724532247, 0.0010925284586846828, 0.0011346293613314629, 0.001176730147562921, 0.0012188309337943792, 0.0012609318364411592, 0.0013030326226726174, 0.0013451334089040756, 0.0013872341951355338, 0.001429334981366992, 0.001471435884013772, 0.0015135366702452302, 0.0015556374564766884, 0.0015977383591234684, 0.0016398391453549266, 0.0016819399315863848, 0.001724040717817843, 0.0017661415040493011, 0.0018082424066960812, 0.0018503431929275393, 0.0018924439791589975, 0.0019345448818057775, 0.001976645551621914, 0.002018746454268694]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 10.0, 13.0, 14.0, 13.0, 14.0, 25.0, 25.0, 28.0, 21.0, 34.0, 34.0, 26.0, 31.0, 47.0, 47.0, 59.0, 46.0, 45.0, 34.0, 41.0, 48.0, 27.0, 40.0, 32.0, 26.0, 23.0, 17.0, 27.0, 22.0, 16.0, 15.0, 13.0, 10.0, 13.0, 11.0, 8.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.000709235668182373, -0.0006841253489255905, -0.000659015029668808, -0.0006339047104120255, -0.0006087943911552429, -0.0005836840718984604, -0.0005585737526416779, -0.0005334634333848953, -0.0005083531141281128, -0.00048324279487133026, -0.00045813247561454773, -0.0004330221563577652, -0.00040791183710098267, -0.00038280151784420013, -0.0003576911985874176, -0.00033258087933063507, -0.00030747056007385254, -0.00028236024081707, -0.0002572499215602875, -0.00023213960230350494, -0.0002070292830467224, -0.00018191896378993988, -0.00015680864453315735, -0.00013169832527637482, -0.00010658800601959229, -8.147768676280975e-05, -5.636736750602722e-05, -3.125704824924469e-05, -6.146728992462158e-06, 1.8963590264320374e-05, 4.4073909521102905e-05, 6.918422877788544e-05, 9.429454803466797e-05, 0.0001194048672914505, 0.00014451518654823303, 0.00016962550580501556, 0.0001947358250617981, 0.00021984614431858063, 0.00024495646357536316, 0.0002700667828321457, 0.0002951771020889282, 0.00032028742134571075, 0.0003453977406024933, 0.0003705080598592758, 0.00039561837911605835, 0.0004207286983728409, 0.0004458390176296234, 0.00047094933688640594, 0.0004960596561431885, 0.000521169975399971, 0.0005462802946567535, 0.0005713906139135361, 0.0005965009331703186, 0.0006216112524271011, 0.0006467215716838837, 0.0006718318909406662, 0.0006969422101974487, 0.0007220525294542313, 0.0007471628487110138, 0.0007722731679677963, 0.0007973834872245789, 0.0008224938064813614, 0.0008476041257381439, 0.0008727144449949265, 0.000897824764251709]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 13.0, 21.0, 11.0, 21.0, 19.0, 22.0, 33.0, 38.0, 29.0, 29.0, 49.0, 43.0, 48.0, 50.0, 48.0, 56.0, 51.0, 45.0, 46.0, 37.0, 33.0, 38.0, 24.0, 23.0, 29.0, 19.0, 25.0, 13.0, 8.0, 9.0, 13.0, 6.0, 12.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.0213623046875, -7.761474609375, -7.5015869140625, -7.24169921875, -6.9818115234375, -6.721923828125, -6.4620361328125, -6.2021484375, -5.9422607421875, -5.682373046875, -5.4224853515625, -5.16259765625, -4.9027099609375, -4.642822265625, -4.3829345703125, -4.123046875, -3.8631591796875, -3.603271484375, -3.3433837890625, -3.08349609375, -2.8236083984375, -2.563720703125, -2.3038330078125, -2.0439453125, -1.7840576171875, -1.524169921875, -1.2642822265625, -1.00439453125, -0.7445068359375, -0.484619140625, -0.2247314453125, 0.03515625, 0.2950439453125, 0.554931640625, 0.8148193359375, 1.07470703125, 1.3345947265625, 1.594482421875, 1.8543701171875, 2.1142578125, 2.3741455078125, 2.634033203125, 2.8939208984375, 3.15380859375, 3.4136962890625, 3.673583984375, 3.9334716796875, 4.193359375, 4.4532470703125, 4.713134765625, 4.9730224609375, 5.23291015625, 5.4927978515625, 5.752685546875, 6.0125732421875, 6.2724609375, 6.5323486328125, 6.792236328125, 7.0521240234375, 7.31201171875, 7.5718994140625, 7.831787109375, 8.0916748046875, 8.3515625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 8.0, 8.0, 7.0, 13.0, 15.0, 38.0, 38.0, 41.0, 70.0, 93.0, 134.0, 177.0, 244.0, 358.0, 484.0, 703.0, 1006.0, 1350.0, 2184.0, 3409.0, 6057.0, 12554.0, 44455.0, 780508.0, 153144.0, 20454.0, 8289.0, 4379.0, 2637.0, 1718.0, 1137.0, 796.0, 594.0, 403.0, 297.0, 208.0, 153.0, 107.0, 81.0, 55.0, 42.0, 31.0, 29.0, 12.0, 18.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.28125, -47.77587890625, -46.2705078125, -44.76513671875, -43.259765625, -41.75439453125, -40.2490234375, -38.74365234375, -37.23828125, -35.73291015625, -34.2275390625, -32.72216796875, -31.216796875, -29.71142578125, -28.2060546875, -26.70068359375, -25.1953125, -23.68994140625, -22.1845703125, -20.67919921875, -19.173828125, -17.66845703125, -16.1630859375, -14.65771484375, -13.15234375, -11.64697265625, -10.1416015625, -8.63623046875, -7.130859375, -5.62548828125, -4.1201171875, -2.61474609375, -1.109375, 0.39599609375, 1.9013671875, 3.40673828125, 4.912109375, 6.41748046875, 7.9228515625, 9.42822265625, 10.93359375, 12.43896484375, 13.9443359375, 15.44970703125, 16.955078125, 18.46044921875, 19.9658203125, 21.47119140625, 22.9765625, 24.48193359375, 25.9873046875, 27.49267578125, 28.998046875, 30.50341796875, 32.0087890625, 33.51416015625, 35.01953125, 36.52490234375, 38.0302734375, 39.53564453125, 41.041015625, 42.54638671875, 44.0517578125, 45.55712890625, 47.0625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 8.0, 4.0, 9.0, 10.0, 14.0, 11.0, 14.0, 24.0, 18.0, 30.0, 19.0, 36.0, 41.0, 39.0, 48.0, 53.0, 68.0, 96.0, 242.0, 1539.0, 191.0, 89.0, 64.0, 51.0, 40.0, 35.0, 26.0, 36.0, 31.0, 22.0, 21.0, 21.0, 15.0, 19.0, 15.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.108642578125, -22.37353515625, -21.638427734375, -20.9033203125, -20.168212890625, -19.43310546875, -18.697998046875, -17.962890625, -17.227783203125, -16.49267578125, -15.757568359375, -15.0224609375, -14.287353515625, -13.55224609375, -12.817138671875, -12.08203125, -11.346923828125, -10.61181640625, -9.876708984375, -9.1416015625, -8.406494140625, -7.67138671875, -6.936279296875, -6.201171875, -5.466064453125, -4.73095703125, -3.995849609375, -3.2607421875, -2.525634765625, -1.79052734375, -1.055419921875, -0.3203125, 0.414794921875, 1.14990234375, 1.885009765625, 2.6201171875, 3.355224609375, 4.09033203125, 4.825439453125, 5.560546875, 6.295654296875, 7.03076171875, 7.765869140625, 8.5009765625, 9.236083984375, 9.97119140625, 10.706298828125, 11.44140625, 12.176513671875, 12.91162109375, 13.646728515625, 14.3818359375, 15.116943359375, 15.85205078125, 16.587158203125, 17.322265625, 18.057373046875, 18.79248046875, 19.527587890625, 20.2626953125, 20.997802734375, 21.73291015625, 22.468017578125, 23.203125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 16.0, 8.0, 14.0, 24.0, 21.0, 24.0, 29.0, 34.0, 52.0, 52.0, 80.0, 163.0, 407.0, 1929.0, 2545150.0, 595146.0, 1575.0, 393.0, 174.0, 83.0, 61.0, 47.0, 29.0, 24.0, 29.0, 24.0, 12.0, 11.0, 12.0, 14.0, 12.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-115.4375, -111.9345703125, -108.431640625, -104.9287109375, -101.42578125, -97.9228515625, -94.419921875, -90.9169921875, -87.4140625, -83.9111328125, -80.408203125, -76.9052734375, -73.40234375, -69.8994140625, -66.396484375, -62.8935546875, -59.390625, -55.8876953125, -52.384765625, -48.8818359375, -45.37890625, -41.8759765625, -38.373046875, -34.8701171875, -31.3671875, -27.8642578125, -24.361328125, -20.8583984375, -17.35546875, -13.8525390625, -10.349609375, -6.8466796875, -3.34375, 0.1591796875, 3.662109375, 7.1650390625, 10.66796875, 14.1708984375, 17.673828125, 21.1767578125, 24.6796875, 28.1826171875, 31.685546875, 35.1884765625, 38.69140625, 42.1943359375, 45.697265625, 49.2001953125, 52.703125, 56.2060546875, 59.708984375, 63.2119140625, 66.71484375, 70.2177734375, 73.720703125, 77.2236328125, 80.7265625, 84.2294921875, 87.732421875, 91.2353515625, 94.73828125, 98.2412109375, 101.744140625, 105.2470703125, 108.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 139.0, 870.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.09609985351562, -209.5765380859375, -198.05697631835938, -186.53741455078125, -175.01785278320312, -163.498291015625, -151.97874450683594, -140.4591827392578, -128.9396209716797, -117.42005920410156, -105.90049743652344, -94.38094329833984, -82.86138153076172, -71.3418197631836, -59.822265625, -48.302703857421875, -36.78314208984375, -25.263582229614258, -13.744022369384766, -2.2244644165039062, 9.295097351074219, 20.814659118652344, 32.33421325683594, 43.85377502441406, 55.37333679199219, 66.89289855957031, 78.41246032714844, 89.93201446533203, 101.45157623291016, 112.97113800048828, 124.49069213867188, 136.01025390625, 147.52978515625, 159.04934692382812, 170.56890869140625, 182.08847045898438, 193.6080322265625, 205.12759399414062, 216.6471405029297, 228.1667022705078, 239.68626403808594, 251.20582580566406, 262.7253723144531, 274.24493408203125, 285.7644958496094, 297.2840576171875, 308.8036193847656, 320.32318115234375, 331.8427429199219, 343.3623046875, 354.8818664550781, 366.40142822265625, 377.9209899902344, 389.4405517578125, 400.9600830078125, 412.47967529296875, 423.99920654296875, 435.5187683105469, 447.038330078125, 458.5578918457031, 470.07745361328125, 481.5970153808594, 493.1165771484375, 504.6361083984375, 516.1557006835938]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 5.0, 8.0, 7.0, 14.0, 14.0, 22.0, 16.0, 23.0, 26.0, 29.0, 29.0, 25.0, 18.0, 36.0, 33.0, 32.0, 28.0, 45.0, 36.0, 44.0, 36.0, 40.0, 39.0, 43.0, 40.0, 41.0, 31.0, 39.0, 20.0, 18.0, 29.0, 20.0, 30.0, 14.0, 17.0, 8.0, 9.0, 7.0, 6.0, 5.0, 4.0, 5.0, 5.0], "bins": [-83.70170593261719, -81.44474792480469, -79.18778228759766, -76.93082427978516, -74.67386627197266, -72.41690826416016, -70.15994262695312, -67.90298461914062, -65.64602661132812, -63.38906478881836, -61.13210678100586, -58.875144958496094, -56.618186950683594, -54.36122512817383, -52.10426330566406, -49.84730529785156, -47.5903434753418, -45.33338165283203, -43.07642364501953, -40.819461822509766, -38.562503814697266, -36.3055419921875, -34.048583984375, -31.791622161865234, -29.5346622467041, -27.27770233154297, -25.020742416381836, -22.763782501220703, -20.506820678710938, -18.249862670898438, -15.992900848388672, -13.735940933227539, -11.478981018066406, -9.222021102905273, -6.965060710906982, -4.708100318908691, -2.4511404037475586, -0.19418048858642578, 2.0627803802490234, 4.319740295410156, 6.576700210571289, 8.833660125732422, 11.090620040893555, 13.347580909729004, 15.604540824890137, 17.861499786376953, 20.11846160888672, 22.37542152404785, 24.632381439208984, 26.889341354370117, 29.14630126953125, 31.403263092041016, 33.660221099853516, 35.91718292236328, 38.17414093017578, 40.43110275268555, 42.68806457519531, 44.94502639770508, 47.20198440551758, 49.458946228027344, 51.715904235839844, 53.97286605834961, 56.229827880859375, 58.486785888671875, 60.743743896484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 4.0, 10.0, 6.0, 10.0, 14.0, 10.0, 20.0, 12.0, 23.0, 18.0, 37.0, 24.0, 30.0, 31.0, 29.0, 40.0, 49.0, 47.0, 49.0, 44.0, 52.0, 54.0, 49.0, 33.0, 27.0, 47.0, 26.0, 21.0, 20.0, 31.0, 24.0, 17.0, 15.0, 10.0, 8.0, 13.0, 10.0, 9.0, 5.0, 5.0, 2.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.83203125, -7.57476806640625, -7.3175048828125, -7.06024169921875, -6.802978515625, -6.54571533203125, -6.2884521484375, -6.03118896484375, -5.77392578125, -5.51666259765625, -5.2593994140625, -5.00213623046875, -4.744873046875, -4.48760986328125, -4.2303466796875, -3.97308349609375, -3.7158203125, -3.45855712890625, -3.2012939453125, -2.94403076171875, -2.686767578125, -2.42950439453125, -2.1722412109375, -1.91497802734375, -1.65771484375, -1.40045166015625, -1.1431884765625, -0.88592529296875, -0.628662109375, -0.37139892578125, -0.1141357421875, 0.14312744140625, 0.400390625, 0.65765380859375, 0.9149169921875, 1.17218017578125, 1.429443359375, 1.68670654296875, 1.9439697265625, 2.20123291015625, 2.45849609375, 2.71575927734375, 2.9730224609375, 3.23028564453125, 3.487548828125, 3.74481201171875, 4.0020751953125, 4.25933837890625, 4.5166015625, 4.77386474609375, 5.0311279296875, 5.28839111328125, 5.545654296875, 5.80291748046875, 6.0601806640625, 6.31744384765625, 6.57470703125, 6.83197021484375, 7.0892333984375, 7.34649658203125, 7.603759765625, 7.86102294921875, 8.1182861328125, 8.37554931640625, 8.6328125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 9.0, 11.0, 10.0, 10.0, 17.0, 27.0, 37.0, 52.0, 80.0, 133.0, 184.0, 307.0, 537.0, 975.0, 2103.0, 4577.0, 11377.0, 39610.0, 417727.0, 3485306.0, 186577.0, 27679.0, 9098.0, 3852.0, 1773.0, 942.0, 477.0, 260.0, 171.0, 107.0, 68.0, 58.0, 28.0, 28.0, 20.0, 16.0, 12.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.46875, -48.91015625, -47.3515625, -45.79296875, -44.234375, -42.67578125, -41.1171875, -39.55859375, -38.0, -36.44140625, -34.8828125, -33.32421875, -31.765625, -30.20703125, -28.6484375, -27.08984375, -25.53125, -23.97265625, -22.4140625, -20.85546875, -19.296875, -17.73828125, -16.1796875, -14.62109375, -13.0625, -11.50390625, -9.9453125, -8.38671875, -6.828125, -5.26953125, -3.7109375, -2.15234375, -0.59375, 0.96484375, 2.5234375, 4.08203125, 5.640625, 7.19921875, 8.7578125, 10.31640625, 11.875, 13.43359375, 14.9921875, 16.55078125, 18.109375, 19.66796875, 21.2265625, 22.78515625, 24.34375, 25.90234375, 27.4609375, 29.01953125, 30.578125, 32.13671875, 33.6953125, 35.25390625, 36.8125, 38.37109375, 39.9296875, 41.48828125, 43.046875, 44.60546875, 46.1640625, 47.72265625, 49.28125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 11.0, 5.0, 8.0, 14.0, 15.0, 22.0, 39.0, 37.0, 67.0, 131.0, 173.0, 276.0, 425.0, 640.0, 735.0, 520.0, 325.0, 204.0, 126.0, 97.0, 67.0, 45.0, 25.0, 19.0, 20.0, 10.0, 10.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.03125, -55.537109375, -54.04296875, -52.548828125, -51.0546875, -49.560546875, -48.06640625, -46.572265625, -45.078125, -43.583984375, -42.08984375, -40.595703125, -39.1015625, -37.607421875, -36.11328125, -34.619140625, -33.125, -31.630859375, -30.13671875, -28.642578125, -27.1484375, -25.654296875, -24.16015625, -22.666015625, -21.171875, -19.677734375, -18.18359375, -16.689453125, -15.1953125, -13.701171875, -12.20703125, -10.712890625, -9.21875, -7.724609375, -6.23046875, -4.736328125, -3.2421875, -1.748046875, -0.25390625, 1.240234375, 2.734375, 4.228515625, 5.72265625, 7.216796875, 8.7109375, 10.205078125, 11.69921875, 13.193359375, 14.6875, 16.181640625, 17.67578125, 19.169921875, 20.6640625, 22.158203125, 23.65234375, 25.146484375, 26.640625, 28.134765625, 29.62890625, 31.123046875, 32.6171875, 34.111328125, 35.60546875, 37.099609375, 38.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 13.0, 29.0, 32.0, 53.0, 83.0, 120.0, 201.0, 407.0, 2137.0, 3956621.0, 232759.0, 1053.0, 304.0, 160.0, 105.0, 55.0, 42.0, 33.0, 17.0, 13.0, 4.0, 12.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.375, -180.478515625, -172.58203125, -164.685546875, -156.7890625, -148.892578125, -140.99609375, -133.099609375, -125.203125, -117.306640625, -109.41015625, -101.513671875, -93.6171875, -85.720703125, -77.82421875, -69.927734375, -62.03125, -54.134765625, -46.23828125, -38.341796875, -30.4453125, -22.548828125, -14.65234375, -6.755859375, 1.140625, 9.037109375, 16.93359375, 24.830078125, 32.7265625, 40.623046875, 48.51953125, 56.416015625, 64.3125, 72.208984375, 80.10546875, 88.001953125, 95.8984375, 103.794921875, 111.69140625, 119.587890625, 127.484375, 135.380859375, 143.27734375, 151.173828125, 159.0703125, 166.966796875, 174.86328125, 182.759765625, 190.65625, 198.552734375, 206.44921875, 214.345703125, 222.2421875, 230.138671875, 238.03515625, 245.931640625, 253.828125, 261.724609375, 269.62109375, 277.517578125, 285.4140625, 293.310546875, 301.20703125, 309.103515625, 317.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 89.0, 873.0, 52.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.8080139160156, -234.0271759033203, -209.24635314941406, -184.46551513671875, -159.6846923828125, -134.9038543701172, -110.12301635742188, -85.34219360351562, -60.56135559082031, -35.78052520751953, -10.999691009521484, 13.781143188476562, 38.561973571777344, 63.342803955078125, 88.12364196777344, 112.90446472167969, 137.685302734375, 162.4661407470703, 187.24696350097656, 212.02780151367188, 236.80862426757812, 261.5894775390625, 286.37030029296875, 311.151123046875, 335.93194580078125, 360.7127685546875, 385.4936218261719, 410.2744445800781, 435.0552673339844, 459.83612060546875, 484.616943359375, 509.39776611328125, 534.1786499023438, 558.95947265625, 583.7402954101562, 608.5211181640625, 633.302001953125, 658.0828247070312, 682.8636474609375, 707.6444702148438, 732.42529296875, 757.2061157226562, 781.9869384765625, 806.767822265625, 831.5486450195312, 856.3294677734375, 881.1102905273438, 905.89111328125, 930.6719970703125, 955.4528198242188, 980.233642578125, 1005.0145263671875, 1029.7952880859375, 1054.576171875, 1079.35693359375, 1104.1378173828125, 1128.9185791015625, 1153.699462890625, 1178.480224609375, 1203.2611083984375, 1228.0418701171875, 1252.82275390625, 1277.603515625, 1302.3843994140625, 1327.165283203125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 1.0, 5.0, 10.0, 7.0, 16.0, 11.0, 18.0, 13.0, 16.0, 16.0, 21.0, 32.0, 25.0, 39.0, 34.0, 30.0, 47.0, 37.0, 46.0, 42.0, 46.0, 33.0, 46.0, 37.0, 41.0, 33.0, 39.0, 43.0, 28.0, 33.0, 31.0, 12.0, 19.0, 16.0, 15.0, 12.0, 16.0, 11.0, 6.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.78587341308594, -98.97459411621094, -95.16332244873047, -91.35204315185547, -87.540771484375, -83.7294921875, -79.918212890625, -76.10694122314453, -72.29566192626953, -68.48438262939453, -64.67311096191406, -60.86183166503906, -57.05055618286133, -53.239280700683594, -49.42800521850586, -45.616729736328125, -41.80545425415039, -37.994178771972656, -34.18290328979492, -30.371625900268555, -26.560348510742188, -22.749073028564453, -18.93779754638672, -15.126520156860352, -11.315244674682617, -7.503968238830566, -3.692692279815674, 0.11858367919921875, 3.9298601150512695, 7.74113655090332, 11.552412033081055, 15.363689422607422, 19.174964904785156, 22.98624038696289, 26.797517776489258, 30.608793258666992, 34.42007064819336, 38.231346130371094, 42.04262161254883, 45.85389709472656, 49.66517639160156, 53.4764518737793, 57.28772735595703, 61.09900665283203, 64.9102783203125, 68.7215576171875, 72.5328369140625, 76.34410858154297, 80.15538024902344, 83.96665954589844, 87.7779312133789, 91.5892105102539, 95.40048217773438, 99.21176147460938, 103.02304077148438, 106.83431243896484, 110.64559173583984, 114.45687103271484, 118.26814270019531, 122.07942199707031, 125.89069366455078, 129.70196533203125, 133.51324462890625, 137.32452392578125, 141.13580322265625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 9.0, 10.0, 9.0, 6.0, 9.0, 15.0, 10.0, 14.0, 22.0, 25.0, 26.0, 31.0, 30.0, 28.0, 43.0, 35.0, 36.0, 48.0, 45.0, 49.0, 39.0, 52.0, 39.0, 35.0, 33.0, 36.0, 34.0, 35.0, 31.0, 21.0, 25.0, 19.0, 16.0, 15.0, 11.0, 12.0, 7.0, 10.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.875, -7.6202392578125, -7.365478515625, -7.1107177734375, -6.85595703125, -6.6011962890625, -6.346435546875, -6.0916748046875, -5.8369140625, -5.5821533203125, -5.327392578125, -5.0726318359375, -4.81787109375, -4.5631103515625, -4.308349609375, -4.0535888671875, -3.798828125, -3.5440673828125, -3.289306640625, -3.0345458984375, -2.77978515625, -2.5250244140625, -2.270263671875, -2.0155029296875, -1.7607421875, -1.5059814453125, -1.251220703125, -0.9964599609375, -0.74169921875, -0.4869384765625, -0.232177734375, 0.0225830078125, 0.27734375, 0.5321044921875, 0.786865234375, 1.0416259765625, 1.29638671875, 1.5511474609375, 1.805908203125, 2.0606689453125, 2.3154296875, 2.5701904296875, 2.824951171875, 3.0797119140625, 3.33447265625, 3.5892333984375, 3.843994140625, 4.0987548828125, 4.353515625, 4.6082763671875, 4.863037109375, 5.1177978515625, 5.37255859375, 5.6273193359375, 5.882080078125, 6.1368408203125, 6.3916015625, 6.6463623046875, 6.901123046875, 7.1558837890625, 7.41064453125, 7.6654052734375, 7.920166015625, 8.1749267578125, 8.4296875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 11.0, 9.0, 11.0, 28.0, 40.0, 51.0, 72.0, 135.0, 201.0, 276.0, 397.0, 607.0, 884.0, 1320.0, 1931.0, 2799.0, 4114.0, 6215.0, 9040.0, 13444.0, 19705.0, 29006.0, 43404.0, 63666.0, 93346.0, 140635.0, 190304.0, 138980.0, 92004.0, 63270.0, 43096.0, 28978.0, 19457.0, 13161.0, 8993.0, 6068.0, 4116.0, 2879.0, 1939.0, 1287.0, 839.0, 592.0, 390.0, 279.0, 199.0, 125.0, 75.0, 60.0, 30.0, 28.0, 18.0, 13.0, 8.0, 8.0, 5.0, 2.0, 4.0], "bins": [-0.87939453125, -0.8531341552734375, -0.826873779296875, -0.8006134033203125, -0.77435302734375, -0.7480926513671875, -0.721832275390625, -0.6955718994140625, -0.6693115234375, -0.6430511474609375, -0.616790771484375, -0.5905303955078125, -0.56427001953125, -0.5380096435546875, -0.511749267578125, -0.4854888916015625, -0.459228515625, -0.4329681396484375, -0.406707763671875, -0.3804473876953125, -0.35418701171875, -0.3279266357421875, -0.301666259765625, -0.2754058837890625, -0.2491455078125, -0.2228851318359375, -0.196624755859375, -0.1703643798828125, -0.14410400390625, -0.1178436279296875, -0.091583251953125, -0.0653228759765625, -0.0390625, -0.0128021240234375, 0.013458251953125, 0.0397186279296875, 0.06597900390625, 0.0922393798828125, 0.118499755859375, 0.1447601318359375, 0.1710205078125, 0.1972808837890625, 0.223541259765625, 0.2498016357421875, 0.27606201171875, 0.3023223876953125, 0.328582763671875, 0.3548431396484375, 0.381103515625, 0.4073638916015625, 0.433624267578125, 0.4598846435546875, 0.48614501953125, 0.5124053955078125, 0.538665771484375, 0.5649261474609375, 0.5911865234375, 0.6174468994140625, 0.643707275390625, 0.6699676513671875, 0.69622802734375, 0.7224884033203125, 0.748748779296875, 0.7750091552734375, 0.80126953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 12.0, 14.0, 23.0, 19.0, 36.0, 30.0, 33.0, 42.0, 24.0, 54.0, 38.0, 41.0, 53.0, 40.0, 1053.0, 43.0, 32.0, 46.0, 29.0, 38.0, 32.0, 25.0, 23.0, 35.0, 31.0, 15.0, 19.0, 20.0, 15.0, 12.0, 9.0, 12.0, 4.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73828125, -4.57525634765625, -4.4122314453125, -4.24920654296875, -4.086181640625, -3.92315673828125, -3.7601318359375, -3.59710693359375, -3.43408203125, -3.27105712890625, -3.1080322265625, -2.94500732421875, -2.781982421875, -2.61895751953125, -2.4559326171875, -2.29290771484375, -2.1298828125, -1.96685791015625, -1.8038330078125, -1.64080810546875, -1.477783203125, -1.31475830078125, -1.1517333984375, -0.98870849609375, -0.82568359375, -0.66265869140625, -0.4996337890625, -0.33660888671875, -0.173583984375, -0.01055908203125, 0.1524658203125, 0.31549072265625, 0.478515625, 0.64154052734375, 0.8045654296875, 0.96759033203125, 1.130615234375, 1.29364013671875, 1.4566650390625, 1.61968994140625, 1.78271484375, 1.94573974609375, 2.1087646484375, 2.27178955078125, 2.434814453125, 2.59783935546875, 2.7608642578125, 2.92388916015625, 3.0869140625, 3.24993896484375, 3.4129638671875, 3.57598876953125, 3.739013671875, 3.90203857421875, 4.0650634765625, 4.22808837890625, 4.39111328125, 4.55413818359375, 4.7171630859375, 4.88018798828125, 5.043212890625, 5.20623779296875, 5.3692626953125, 5.53228759765625, 5.6953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 17.0, 21.0, 27.0, 63.0, 69.0, 123.0, 177.0, 273.0, 373.0, 654.0, 941.0, 1396.0, 2173.0, 3414.0, 5157.0, 8119.0, 12447.0, 19537.0, 30645.0, 47440.0, 74372.0, 117101.0, 187868.0, 1240804.0, 124222.0, 78955.0, 50214.0, 32094.0, 20719.0, 13158.0, 8628.0, 5532.0, 3681.0, 2374.0, 1494.0, 1020.0, 617.0, 392.0, 298.0, 198.0, 106.0, 73.0, 48.0, 36.0, 23.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9115142822265625, -0.883087158203125, -0.8546600341796875, -0.82623291015625, -0.7978057861328125, -0.769378662109375, -0.7409515380859375, -0.7125244140625, -0.6840972900390625, -0.655670166015625, -0.6272430419921875, -0.59881591796875, -0.5703887939453125, -0.541961669921875, -0.5135345458984375, -0.485107421875, -0.4566802978515625, -0.428253173828125, -0.3998260498046875, -0.37139892578125, -0.3429718017578125, -0.314544677734375, -0.2861175537109375, -0.2576904296875, -0.2292633056640625, -0.200836181640625, -0.1724090576171875, -0.14398193359375, -0.1155548095703125, -0.087127685546875, -0.0587005615234375, -0.0302734375, -0.0018463134765625, 0.026580810546875, 0.0550079345703125, 0.08343505859375, 0.1118621826171875, 0.140289306640625, 0.1687164306640625, 0.1971435546875, 0.2255706787109375, 0.253997802734375, 0.2824249267578125, 0.31085205078125, 0.3392791748046875, 0.367706298828125, 0.3961334228515625, 0.424560546875, 0.4529876708984375, 0.481414794921875, 0.5098419189453125, 0.53826904296875, 0.5666961669921875, 0.595123291015625, 0.6235504150390625, 0.6519775390625, 0.6804046630859375, 0.708831787109375, 0.7372589111328125, 0.76568603515625, 0.7941131591796875, 0.822540283203125, 0.8509674072265625, 0.87939453125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 13.0, 13.0, 7.0, 11.0, 10.0, 19.0, 19.0, 31.0, 27.0, 30.0, 40.0, 40.0, 49.0, 50.0, 69.0, 55.0, 51.0, 54.0, 56.0, 49.0, 44.0, 33.0, 34.0, 39.0, 22.0, 23.0, 19.0, 10.0, 11.0, 10.0, 9.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.001800537109375, -0.0017470866441726685, -0.001693636178970337, -0.0016401857137680054, -0.0015867352485656738, -0.0015332847833633423, -0.0014798343181610107, -0.0014263838529586792, -0.0013729333877563477, -0.0013194829225540161, -0.0012660324573516846, -0.001212581992149353, -0.0011591315269470215, -0.00110568106174469, -0.0010522305965423584, -0.0009987801313400269, -0.0009453296661376953, -0.0008918792009353638, -0.0008384287357330322, -0.0007849782705307007, -0.0007315278053283691, -0.0006780773401260376, -0.0006246268749237061, -0.0005711764097213745, -0.000517725944519043, -0.0004642754793167114, -0.0004108250141143799, -0.00035737454891204834, -0.0003039240837097168, -0.00025047361850738525, -0.0001970231533050537, -0.00014357268810272217, -9.012222290039062e-05, -3.667175769805908e-05, 1.677870750427246e-05, 7.0229172706604e-05, 0.00012367963790893555, 0.0001771301031112671, 0.00023058056831359863, 0.0002840310335159302, 0.0003374814987182617, 0.00039093196392059326, 0.0004443824291229248, 0.0004978328943252563, 0.0005512833595275879, 0.0006047338247299194, 0.000658184289932251, 0.0007116347551345825, 0.0007650852203369141, 0.0008185356855392456, 0.0008719861507415771, 0.0009254366159439087, 0.0009788870811462402, 0.0010323375463485718, 0.0010857880115509033, 0.0011392384767532349, 0.0011926889419555664, 0.001246139407157898, 0.0012995898723602295, 0.001353040337562561, 0.0014064908027648926, 0.0014599412679672241, 0.0015133917331695557, 0.0015668421983718872, 0.0016202926635742188]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 12.0, 13.0, 27.0, 24.0, 35.0, 39.0, 80.0, 77.0, 90.0, 130.0, 183.0, 307.0, 786.0, 20123.0, 1023975.0, 1215.0, 480.0, 281.0, 177.0, 110.0, 92.0, 63.0, 62.0, 30.0, 27.0, 20.0, 19.0, 14.0, 9.0, 11.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03619384765625, -0.03491067886352539, -0.03362751007080078, -0.03234434127807617, -0.031061172485351562, -0.029778003692626953, -0.028494834899902344, -0.027211666107177734, -0.025928497314453125, -0.024645328521728516, -0.023362159729003906, -0.022078990936279297, -0.020795822143554688, -0.019512653350830078, -0.01822948455810547, -0.01694631576538086, -0.01566314697265625, -0.01437997817993164, -0.013096809387207031, -0.011813640594482422, -0.010530471801757812, -0.009247303009033203, -0.007964134216308594, -0.006680965423583984, -0.005397796630859375, -0.004114627838134766, -0.0028314590454101562, -0.0015482902526855469, -0.0002651214599609375, 0.0010180473327636719, 0.0023012161254882812, 0.0035843849182128906, 0.0048675537109375, 0.006150722503662109, 0.007433891296386719, 0.008717060089111328, 0.010000228881835938, 0.011283397674560547, 0.012566566467285156, 0.013849735260009766, 0.015132904052734375, 0.016416072845458984, 0.017699241638183594, 0.018982410430908203, 0.020265579223632812, 0.021548748016357422, 0.02283191680908203, 0.02411508560180664, 0.02539825439453125, 0.02668142318725586, 0.02796459197998047, 0.029247760772705078, 0.030530929565429688, 0.0318140983581543, 0.033097267150878906, 0.034380435943603516, 0.035663604736328125, 0.036946773529052734, 0.038229942321777344, 0.03951311111450195, 0.04079627990722656, 0.04207944869995117, 0.04336261749267578, 0.04464578628540039, 0.045928955078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 78.0, 881.0, 55.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00650307722389698, -0.006308676674962044, -0.00611427566036582, -0.005919875111430883, -0.005725474562495947, -0.005531073547899723, -0.0053366729989647865, -0.00514227245002985, -0.0049478719010949135, -0.004753471352159977, -0.004559070337563753, -0.004364669788628817, -0.00417026923969388, -0.003975868225097656, -0.0037814676761627197, -0.003587067127227783, -0.0033926661126315594, -0.003198265330865979, -0.0030038647819310427, -0.0028094640001654625, -0.002615063451230526, -0.002420662669464946, -0.0022262618876993656, -0.002031861338764429, -0.001837460556998849, -0.0016430598916485906, -0.0014486592262983322, -0.001254258444532752, -0.0010598577791824937, -0.0008654571138322353, -0.0006710563320666552, -0.0004766556667163968, -0.00028225453570485115, -8.785384125076234e-05, 0.00010654685320332646, 0.00030094757676124573, 0.0004953482421115041, 0.0006897489074617624, 0.0008841496892273426, 0.001078550354577601, 0.0012729510199278593, 0.0014673516852781177, 0.001661752350628376, 0.0018561531323939562, 0.0020505539141595364, 0.002244954463094473, 0.002439355244860053, 0.0026337560266256332, 0.0028281565755605698, 0.00302255735732615, 0.0032169579062610865, 0.0034113586880266666, 0.003605759236961603, 0.0038001600187271833, 0.0039945608004927635, 0.0041889613494277, 0.0043833618983626366, 0.004577762447297573, 0.004772163461893797, 0.0049665640108287334, 0.00516096455976367, 0.005355365574359894, 0.00554976612329483, 0.005744166672229767, 0.005938567686825991]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 7.0, 5.0, 14.0, 14.0, 14.0, 10.0, 12.0, 13.0, 21.0, 28.0, 27.0, 39.0, 34.0, 33.0, 46.0, 50.0, 40.0, 51.0, 47.0, 39.0, 41.0, 37.0, 45.0, 32.0, 39.0, 36.0, 32.0, 37.0, 23.0, 17.0, 16.0, 15.0, 12.0, 9.0, 22.0, 6.0, 8.0, 6.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009483098983764648, -0.0009173713624477386, -0.0008864328265190125, -0.0008554942905902863, -0.0008245557546615601, -0.0007936172187328339, -0.0007626786828041077, -0.0007317401468753815, -0.0007008016109466553, -0.0006698630750179291, -0.0006389245390892029, -0.0006079860031604767, -0.0005770474672317505, -0.0005461089313030243, -0.0005151703953742981, -0.0004842318594455719, -0.0004532933235168457, -0.0004223547875881195, -0.0003914162516593933, -0.0003604777157306671, -0.0003295391798019409, -0.0002986006438732147, -0.0002676621079444885, -0.00023672357201576233, -0.00020578503608703613, -0.00017484650015830994, -0.00014390796422958374, -0.00011296942830085754, -8.203089237213135e-05, -5.109235644340515e-05, -2.0153820514678955e-05, 1.0784715414047241e-05, 4.172325134277344e-05, 7.266178727149963e-05, 0.00010360032320022583, 0.00013453885912895203, 0.00016547739505767822, 0.00019641593098640442, 0.00022735446691513062, 0.0002582930028438568, 0.000289231538772583, 0.0003201700747013092, 0.0003511086106300354, 0.0003820471465587616, 0.0004129856824874878, 0.000443924218416214, 0.0004748627543449402, 0.0005058012902736664, 0.0005367398262023926, 0.0005676783621311188, 0.000598616898059845, 0.0006295554339885712, 0.0006604939699172974, 0.0006914325058460236, 0.0007223710417747498, 0.000753309577703476, 0.0007842481136322021, 0.0008151866495609283, 0.0008461251854896545, 0.0008770637214183807, 0.0009080022573471069, 0.0009389407932758331, 0.0009698793292045593, 0.0010008178651332855, 0.0010317564010620117]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 9.0, 10.0, 9.0, 6.0, 9.0, 15.0, 10.0, 14.0, 22.0, 25.0, 26.0, 31.0, 30.0, 28.0, 43.0, 35.0, 36.0, 48.0, 45.0, 49.0, 39.0, 52.0, 39.0, 35.0, 33.0, 36.0, 34.0, 35.0, 31.0, 21.0, 25.0, 19.0, 16.0, 15.0, 11.0, 12.0, 7.0, 10.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.875, -7.6202392578125, -7.365478515625, -7.1107177734375, -6.85595703125, -6.6011962890625, -6.346435546875, -6.0916748046875, -5.8369140625, -5.5821533203125, -5.327392578125, -5.0726318359375, -4.81787109375, -4.5631103515625, -4.308349609375, -4.0535888671875, -3.798828125, -3.5440673828125, -3.289306640625, -3.0345458984375, -2.77978515625, -2.5250244140625, -2.270263671875, -2.0155029296875, -1.7607421875, -1.5059814453125, -1.251220703125, -0.9964599609375, -0.74169921875, -0.4869384765625, -0.232177734375, 0.0225830078125, 0.27734375, 0.5321044921875, 0.786865234375, 1.0416259765625, 1.29638671875, 1.5511474609375, 1.805908203125, 2.0606689453125, 2.3154296875, 2.5701904296875, 2.824951171875, 3.0797119140625, 3.33447265625, 3.5892333984375, 3.843994140625, 4.0987548828125, 4.353515625, 4.6082763671875, 4.863037109375, 5.1177978515625, 5.37255859375, 5.6273193359375, 5.882080078125, 6.1368408203125, 6.3916015625, 6.6463623046875, 6.901123046875, 7.1558837890625, 7.41064453125, 7.6654052734375, 7.920166015625, 8.1749267578125, 8.4296875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 13.0, 6.0, 12.0, 8.0, 17.0, 26.0, 33.0, 58.0, 48.0, 75.0, 88.0, 139.0, 218.0, 265.0, 464.0, 722.0, 1268.0, 2554.0, 5513.0, 14596.0, 43417.0, 151043.0, 460625.0, 257565.0, 71460.0, 22387.0, 8153.0, 3497.0, 1655.0, 878.0, 598.0, 348.0, 225.0, 146.0, 117.0, 79.0, 62.0, 43.0, 37.0, 26.0, 26.0, 13.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.0625, -7.7999267578125, -7.537353515625, -7.2747802734375, -7.01220703125, -6.7496337890625, -6.487060546875, -6.2244873046875, -5.9619140625, -5.6993408203125, -5.436767578125, -5.1741943359375, -4.91162109375, -4.6490478515625, -4.386474609375, -4.1239013671875, -3.861328125, -3.5987548828125, -3.336181640625, -3.0736083984375, -2.81103515625, -2.5484619140625, -2.285888671875, -2.0233154296875, -1.7607421875, -1.4981689453125, -1.235595703125, -0.9730224609375, -0.71044921875, -0.4478759765625, -0.185302734375, 0.0772705078125, 0.33984375, 0.6024169921875, 0.864990234375, 1.1275634765625, 1.39013671875, 1.6527099609375, 1.915283203125, 2.1778564453125, 2.4404296875, 2.7030029296875, 2.965576171875, 3.2281494140625, 3.49072265625, 3.7532958984375, 4.015869140625, 4.2784423828125, 4.541015625, 4.8035888671875, 5.066162109375, 5.3287353515625, 5.59130859375, 5.8538818359375, 6.116455078125, 6.3790283203125, 6.6416015625, 6.9041748046875, 7.166748046875, 7.4293212890625, 7.69189453125, 7.9544677734375, 8.217041015625, 8.4796142578125, 8.7421875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 8.0, 1.0, 4.0, 4.0, 10.0, 8.0, 12.0, 14.0, 18.0, 23.0, 24.0, 29.0, 34.0, 35.0, 38.0, 35.0, 42.0, 44.0, 40.0, 79.0, 252.0, 1681.0, 158.0, 70.0, 49.0, 51.0, 33.0, 42.0, 37.0, 24.0, 23.0, 20.0, 13.0, 22.0, 15.0, 10.0, 13.0, 9.0, 10.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.296875, -27.363525390625, -26.43017578125, -25.496826171875, -24.5634765625, -23.630126953125, -22.69677734375, -21.763427734375, -20.830078125, -19.896728515625, -18.96337890625, -18.030029296875, -17.0966796875, -16.163330078125, -15.22998046875, -14.296630859375, -13.36328125, -12.429931640625, -11.49658203125, -10.563232421875, -9.6298828125, -8.696533203125, -7.76318359375, -6.829833984375, -5.896484375, -4.963134765625, -4.02978515625, -3.096435546875, -2.1630859375, -1.229736328125, -0.29638671875, 0.636962890625, 1.5703125, 2.503662109375, 3.43701171875, 4.370361328125, 5.3037109375, 6.237060546875, 7.17041015625, 8.103759765625, 9.037109375, 9.970458984375, 10.90380859375, 11.837158203125, 12.7705078125, 13.703857421875, 14.63720703125, 15.570556640625, 16.50390625, 17.437255859375, 18.37060546875, 19.303955078125, 20.2373046875, 21.170654296875, 22.10400390625, 23.037353515625, 23.970703125, 24.904052734375, 25.83740234375, 26.770751953125, 27.7041015625, 28.637451171875, 29.57080078125, 30.504150390625, 31.4375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 6.0, 2.0, 5.0, 10.0, 10.0, 11.0, 11.0, 20.0, 16.0, 22.0, 17.0, 34.0, 39.0, 48.0, 80.0, 105.0, 160.0, 396.0, 1199.0, 27698.0, 3105627.0, 8385.0, 879.0, 314.0, 155.0, 97.0, 70.0, 45.0, 54.0, 41.0, 27.0, 25.0, 17.0, 19.0, 14.0, 10.0, 9.0, 6.0, 8.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.9375, -69.783203125, -67.62890625, -65.474609375, -63.3203125, -61.166015625, -59.01171875, -56.857421875, -54.703125, -52.548828125, -50.39453125, -48.240234375, -46.0859375, -43.931640625, -41.77734375, -39.623046875, -37.46875, -35.314453125, -33.16015625, -31.005859375, -28.8515625, -26.697265625, -24.54296875, -22.388671875, -20.234375, -18.080078125, -15.92578125, -13.771484375, -11.6171875, -9.462890625, -7.30859375, -5.154296875, -3.0, -0.845703125, 1.30859375, 3.462890625, 5.6171875, 7.771484375, 9.92578125, 12.080078125, 14.234375, 16.388671875, 18.54296875, 20.697265625, 22.8515625, 25.005859375, 27.16015625, 29.314453125, 31.46875, 33.623046875, 35.77734375, 37.931640625, 40.0859375, 42.240234375, 44.39453125, 46.548828125, 48.703125, 50.857421875, 53.01171875, 55.166015625, 57.3203125, 59.474609375, 61.62890625, 63.783203125, 65.9375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 13.0, 977.0, 25.0, 2.0], "bins": [-599.9486694335938, -590.1962280273438, -580.4437255859375, -570.6912841796875, -560.9387817382812, -551.1863403320312, -541.433837890625, -531.681396484375, -521.9288940429688, -512.1764526367188, -502.4239501953125, -492.6714782714844, -482.91900634765625, -473.1665344238281, -463.4140625, -453.66162109375, -443.9091491699219, -434.15667724609375, -424.4042053222656, -414.6517333984375, -404.8992614746094, -395.14678955078125, -385.3943176269531, -375.641845703125, -365.889404296875, -356.1369323730469, -346.38446044921875, -336.6319885253906, -326.8795166015625, -317.1270446777344, -307.37457275390625, -297.62213134765625, -287.86962890625, -278.1171569824219, -268.36468505859375, -258.6122131347656, -248.8597412109375, -239.10726928710938, -229.3548126220703, -219.6023406982422, -209.849853515625, -200.09738159179688, -190.34490966796875, -180.59243774414062, -170.8399658203125, -161.08749389648438, -151.3350372314453, -141.5825653076172, -131.83009338378906, -122.07762145996094, -112.32514953613281, -102.57268524169922, -92.8202133178711, -83.06774139404297, -73.31527709960938, -63.56280517578125, -53.810333251953125, -44.057861328125, -34.30539321899414, -24.55292320251465, -14.800453186035156, -5.047981262207031, 4.704486846923828, 14.456954956054688, 24.209426879882812]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 6.0, 8.0, 4.0, 22.0, 17.0, 17.0, 17.0, 18.0, 27.0, 38.0, 25.0, 31.0, 35.0, 38.0, 40.0, 43.0, 49.0, 42.0, 42.0, 40.0, 42.0, 44.0, 26.0, 45.0, 47.0, 25.0, 31.0, 28.0, 21.0, 25.0, 20.0, 13.0, 12.0, 11.0, 11.0, 9.0, 3.0, 7.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.84872436523438, -82.8845443725586, -79.92037200927734, -76.95619201660156, -73.99201202392578, -71.02783966064453, -68.06365966796875, -65.0994873046875, -62.13530731201172, -59.1711311340332, -56.20695114135742, -53.242774963378906, -50.27859878540039, -47.314422607421875, -44.350242614746094, -41.38606643676758, -38.4218864440918, -35.45771026611328, -32.4935302734375, -29.529354095458984, -26.56517791748047, -23.60099983215332, -20.636821746826172, -17.672645568847656, -14.708467483520508, -11.744290351867676, -8.780113220214844, -5.815935134887695, -2.8517580032348633, 0.11241912841796875, 3.076597213745117, 6.040773391723633, 9.004951477050781, 11.969128608703613, 14.933305740356445, 17.897483825683594, 20.86166000366211, 23.825838088989258, 26.790016174316406, 29.754192352294922, 32.71836853027344, 35.68254470825195, 38.646724700927734, 41.61090087890625, 44.575077056884766, 47.53925323486328, 50.50343322753906, 53.46760940551758, 56.43178939819336, 59.395965576171875, 62.360145568847656, 65.32432556152344, 68.28849792480469, 71.25267791748047, 74.21685791015625, 77.1810302734375, 80.14521026611328, 83.10939025878906, 86.07356262207031, 89.0377426147461, 92.00192260742188, 94.96609497070312, 97.9302749633789, 100.89445495605469, 103.85862731933594]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 12.0, 9.0, 9.0, 9.0, 11.0, 7.0, 18.0, 21.0, 26.0, 24.0, 34.0, 31.0, 30.0, 34.0, 39.0, 44.0, 42.0, 51.0, 48.0, 41.0, 44.0, 46.0, 31.0, 41.0, 35.0, 46.0, 25.0, 30.0, 23.0, 25.0, 22.0, 17.0, 10.0, 11.0, 9.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.5390625, -8.2703857421875, -8.001708984375, -7.7330322265625, -7.46435546875, -7.1956787109375, -6.927001953125, -6.6583251953125, -6.3896484375, -6.1209716796875, -5.852294921875, -5.5836181640625, -5.31494140625, -5.0462646484375, -4.777587890625, -4.5089111328125, -4.240234375, -3.9715576171875, -3.702880859375, -3.4342041015625, -3.16552734375, -2.8968505859375, -2.628173828125, -2.3594970703125, -2.0908203125, -1.8221435546875, -1.553466796875, -1.2847900390625, -1.01611328125, -0.7474365234375, -0.478759765625, -0.2100830078125, 0.05859375, 0.3272705078125, 0.595947265625, 0.8646240234375, 1.13330078125, 1.4019775390625, 1.670654296875, 1.9393310546875, 2.2080078125, 2.4766845703125, 2.745361328125, 3.0140380859375, 3.28271484375, 3.5513916015625, 3.820068359375, 4.0887451171875, 4.357421875, 4.6260986328125, 4.894775390625, 5.1634521484375, 5.43212890625, 5.7008056640625, 5.969482421875, 6.2381591796875, 6.5068359375, 6.7755126953125, 7.044189453125, 7.3128662109375, 7.58154296875, 7.8502197265625, 8.118896484375, 8.3875732421875, 8.65625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 7.0, 9.0, 10.0, 16.0, 19.0, 33.0, 35.0, 46.0, 59.0, 77.0, 124.0, 200.0, 356.0, 900.0, 2883.0, 15464.0, 158522.0, 2604358.0, 1331113.0, 68053.0, 8621.0, 1898.0, 624.0, 286.0, 147.0, 119.0, 61.0, 56.0, 39.0, 34.0, 24.0, 29.0, 11.0, 11.0, 6.0, 5.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.71875, -28.755126953125, -27.79150390625, -26.827880859375, -25.8642578125, -24.900634765625, -23.93701171875, -22.973388671875, -22.009765625, -21.046142578125, -20.08251953125, -19.118896484375, -18.1552734375, -17.191650390625, -16.22802734375, -15.264404296875, -14.30078125, -13.337158203125, -12.37353515625, -11.409912109375, -10.4462890625, -9.482666015625, -8.51904296875, -7.555419921875, -6.591796875, -5.628173828125, -4.66455078125, -3.700927734375, -2.7373046875, -1.773681640625, -0.81005859375, 0.153564453125, 1.1171875, 2.080810546875, 3.04443359375, 4.008056640625, 4.9716796875, 5.935302734375, 6.89892578125, 7.862548828125, 8.826171875, 9.789794921875, 10.75341796875, 11.717041015625, 12.6806640625, 13.644287109375, 14.60791015625, 15.571533203125, 16.53515625, 17.498779296875, 18.46240234375, 19.426025390625, 20.3896484375, 21.353271484375, 22.31689453125, 23.280517578125, 24.244140625, 25.207763671875, 26.17138671875, 27.135009765625, 28.0986328125, 29.062255859375, 30.02587890625, 30.989501953125, 31.953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 8.0, 23.0, 40.0, 80.0, 112.0, 187.0, 335.0, 502.0, 786.0, 784.0, 483.0, 306.0, 156.0, 102.0, 75.0, 37.0, 20.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.71875, -61.10595703125, -59.4931640625, -57.88037109375, -56.267578125, -54.65478515625, -53.0419921875, -51.42919921875, -49.81640625, -48.20361328125, -46.5908203125, -44.97802734375, -43.365234375, -41.75244140625, -40.1396484375, -38.52685546875, -36.9140625, -35.30126953125, -33.6884765625, -32.07568359375, -30.462890625, -28.85009765625, -27.2373046875, -25.62451171875, -24.01171875, -22.39892578125, -20.7861328125, -19.17333984375, -17.560546875, -15.94775390625, -14.3349609375, -12.72216796875, -11.109375, -9.49658203125, -7.8837890625, -6.27099609375, -4.658203125, -3.04541015625, -1.4326171875, 0.18017578125, 1.79296875, 3.40576171875, 5.0185546875, 6.63134765625, 8.244140625, 9.85693359375, 11.4697265625, 13.08251953125, 14.6953125, 16.30810546875, 17.9208984375, 19.53369140625, 21.146484375, 22.75927734375, 24.3720703125, 25.98486328125, 27.59765625, 29.21044921875, 30.8232421875, 32.43603515625, 34.048828125, 35.66162109375, 37.2744140625, 38.88720703125, 40.5]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 10.0, 16.0, 39.0, 54.0, 83.0, 145.0, 278.0, 610.0, 5542.0, 3836707.0, 348027.0, 1822.0, 416.0, 217.0, 117.0, 69.0, 42.0, 26.0, 27.0, 9.0, 4.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-146.75, -141.66015625, -136.5703125, -131.48046875, -126.390625, -121.30078125, -116.2109375, -111.12109375, -106.03125, -100.94140625, -95.8515625, -90.76171875, -85.671875, -80.58203125, -75.4921875, -70.40234375, -65.3125, -60.22265625, -55.1328125, -50.04296875, -44.953125, -39.86328125, -34.7734375, -29.68359375, -24.59375, -19.50390625, -14.4140625, -9.32421875, -4.234375, 0.85546875, 5.9453125, 11.03515625, 16.125, 21.21484375, 26.3046875, 31.39453125, 36.484375, 41.57421875, 46.6640625, 51.75390625, 56.84375, 61.93359375, 67.0234375, 72.11328125, 77.203125, 82.29296875, 87.3828125, 92.47265625, 97.5625, 102.65234375, 107.7421875, 112.83203125, 117.921875, 123.01171875, 128.1015625, 133.19140625, 138.28125, 143.37109375, 148.4609375, 153.55078125, 158.640625, 163.73046875, 168.8203125, 173.91015625, 179.0]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 20.0, 90.0, 372.0, 389.0, 124.0, 16.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-438.0901184082031, -426.88385009765625, -415.6775817871094, -404.4713134765625, -393.2650146484375, -382.0587463378906, -370.85247802734375, -359.6462097167969, -348.43994140625, -337.2336730957031, -326.02740478515625, -314.8211364746094, -303.6148681640625, -292.4085693359375, -281.2023010253906, -269.99603271484375, -258.7897644042969, -247.58349609375, -236.37722778320312, -225.1709442138672, -213.9646759033203, -202.75840759277344, -191.5521240234375, -180.34585571289062, -169.13958740234375, -157.93331909179688, -146.72705078125, -135.52076721191406, -124.31449890136719, -113.10823059082031, -101.9019546508789, -90.6956787109375, -79.48941040039062, -68.28314208984375, -57.076866149902344, -45.8705940246582, -34.66432189941406, -23.458049774169922, -12.251777648925781, -1.045501708984375, 10.1607666015625, 21.36703872680664, 32.57331085205078, 43.77958297729492, 54.98585510253906, 66.19212341308594, 77.39839935302734, 88.60467529296875, 99.81094360351562, 111.0172119140625, 122.2234878540039, 133.4297637939453, 144.6360321044922, 155.84230041503906, 167.048583984375, 178.25485229492188, 189.46112060546875, 200.66738891601562, 211.8736572265625, 223.07994079589844, 234.2862091064453, 245.4924774169922, 256.6987609863281, 267.905029296875, 279.1112976074219]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 7.0, 8.0, 6.0, 6.0, 18.0, 23.0, 14.0, 19.0, 22.0, 27.0, 31.0, 27.0, 23.0, 33.0, 34.0, 32.0, 54.0, 50.0, 43.0, 34.0, 47.0, 38.0, 45.0, 50.0, 28.0, 30.0, 25.0, 27.0, 25.0, 22.0, 28.0, 15.0, 23.0, 21.0, 14.0, 10.0, 10.0, 11.0, 1.0, 6.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-107.93976593017578, -104.61256408691406, -101.28536224365234, -97.95816040039062, -94.6309585571289, -91.30375671386719, -87.97655487060547, -84.64935302734375, -81.32215118408203, -77.99494934082031, -74.6677474975586, -71.34054565429688, -68.01334381103516, -64.68614196777344, -61.35894012451172, -58.03173828125, -54.70453643798828, -51.37733459472656, -48.050132751464844, -44.722930908203125, -41.395729064941406, -38.06852722167969, -34.74132537841797, -31.41412353515625, -28.08692169189453, -24.759719848632812, -21.432518005371094, -18.105316162109375, -14.778114318847656, -11.450912475585938, -8.123710632324219, -4.7965087890625, -1.46929931640625, 1.8579025268554688, 5.1851043701171875, 8.512306213378906, 11.839508056640625, 15.166709899902344, 18.493911743164062, 21.82111358642578, 25.1483154296875, 28.47551727294922, 31.802719116210938, 35.129920959472656, 38.457122802734375, 41.784324645996094, 45.11152648925781, 48.43872833251953, 51.76593017578125, 55.09313201904297, 58.42033386230469, 61.747535705566406, 65.07473754882812, 68.40193939208984, 71.72914123535156, 75.05634307861328, 78.383544921875, 81.71074676513672, 85.03794860839844, 88.36515045166016, 91.69235229492188, 95.0195541381836, 98.34675598144531, 101.67395782470703, 105.00115966796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 13.0, 13.0, 11.0, 20.0, 18.0, 25.0, 28.0, 29.0, 31.0, 34.0, 37.0, 32.0, 51.0, 44.0, 53.0, 41.0, 43.0, 47.0, 42.0, 39.0, 37.0, 29.0, 43.0, 35.0, 26.0, 29.0, 15.0, 16.0, 21.0, 13.0, 12.0, 14.0, 3.0, 3.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.160888671875, -7.88427734375, -7.607666015625, -7.3310546875, -7.054443359375, -6.77783203125, -6.501220703125, -6.224609375, -5.947998046875, -5.67138671875, -5.394775390625, -5.1181640625, -4.841552734375, -4.56494140625, -4.288330078125, -4.01171875, -3.735107421875, -3.45849609375, -3.181884765625, -2.9052734375, -2.628662109375, -2.35205078125, -2.075439453125, -1.798828125, -1.522216796875, -1.24560546875, -0.968994140625, -0.6923828125, -0.415771484375, -0.13916015625, 0.137451171875, 0.4140625, 0.690673828125, 0.96728515625, 1.243896484375, 1.5205078125, 1.797119140625, 2.07373046875, 2.350341796875, 2.626953125, 2.903564453125, 3.18017578125, 3.456787109375, 3.7333984375, 4.010009765625, 4.28662109375, 4.563232421875, 4.83984375, 5.116455078125, 5.39306640625, 5.669677734375, 5.9462890625, 6.222900390625, 6.49951171875, 6.776123046875, 7.052734375, 7.329345703125, 7.60595703125, 7.882568359375, 8.1591796875, 8.435791015625, 8.71240234375, 8.989013671875, 9.265625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 12.0, 30.0, 36.0, 71.0, 71.0, 114.0, 171.0, 207.0, 336.0, 417.0, 662.0, 910.0, 1375.0, 1893.0, 2903.0, 4232.0, 6077.0, 8927.0, 13013.0, 19571.0, 28855.0, 41779.0, 60924.0, 88154.0, 129652.0, 180205.0, 146203.0, 97402.0, 67441.0, 46670.0, 32130.0, 21690.0, 14777.0, 10050.0, 6933.0, 4539.0, 3085.0, 2189.0, 1527.0, 1009.0, 704.0, 501.0, 331.0, 248.0, 159.0, 129.0, 82.0, 49.0, 35.0, 23.0, 12.0, 15.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0], "bins": [-0.83740234375, -0.8109359741210938, -0.7844696044921875, -0.7580032348632812, -0.731536865234375, -0.7050704956054688, -0.6786041259765625, -0.6521377563476562, -0.62567138671875, -0.5992050170898438, -0.5727386474609375, -0.5462722778320312, -0.519805908203125, -0.49333953857421875, -0.4668731689453125, -0.44040679931640625, -0.4139404296875, -0.38747406005859375, -0.3610076904296875, -0.33454132080078125, -0.308074951171875, -0.28160858154296875, -0.2551422119140625, -0.22867584228515625, -0.20220947265625, -0.17574310302734375, -0.1492767333984375, -0.12281036376953125, -0.096343994140625, -0.06987762451171875, -0.0434112548828125, -0.01694488525390625, 0.009521484375, 0.03598785400390625, 0.0624542236328125, 0.08892059326171875, 0.115386962890625, 0.14185333251953125, 0.1683197021484375, 0.19478607177734375, 0.22125244140625, 0.24771881103515625, 0.2741851806640625, 0.30065155029296875, 0.327117919921875, 0.35358428955078125, 0.3800506591796875, 0.40651702880859375, 0.4329833984375, 0.45944976806640625, 0.4859161376953125, 0.5123825073242188, 0.538848876953125, 0.5653152465820312, 0.5917816162109375, 0.6182479858398438, 0.64471435546875, 0.6711807250976562, 0.6976470947265625, 0.7241134643554688, 0.750579833984375, 0.7770462036132812, 0.8035125732421875, 0.8299789428710938, 0.8564453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 10.0, 9.0, 5.0, 12.0, 13.0, 18.0, 22.0, 19.0, 31.0, 33.0, 31.0, 36.0, 34.0, 36.0, 35.0, 56.0, 47.0, 41.0, 1059.0, 47.0, 41.0, 28.0, 37.0, 30.0, 33.0, 35.0, 36.0, 21.0, 23.0, 27.0, 12.0, 10.0, 16.0, 11.0, 12.0, 10.0, 9.0, 10.0, 3.0, 5.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.55859375, -5.38665771484375, -5.2147216796875, -5.04278564453125, -4.870849609375, -4.69891357421875, -4.5269775390625, -4.35504150390625, -4.18310546875, -4.01116943359375, -3.8392333984375, -3.66729736328125, -3.495361328125, -3.32342529296875, -3.1514892578125, -2.97955322265625, -2.8076171875, -2.63568115234375, -2.4637451171875, -2.29180908203125, -2.119873046875, -1.94793701171875, -1.7760009765625, -1.60406494140625, -1.43212890625, -1.26019287109375, -1.0882568359375, -0.91632080078125, -0.744384765625, -0.57244873046875, -0.4005126953125, -0.22857666015625, -0.056640625, 0.11529541015625, 0.2872314453125, 0.45916748046875, 0.631103515625, 0.80303955078125, 0.9749755859375, 1.14691162109375, 1.31884765625, 1.49078369140625, 1.6627197265625, 1.83465576171875, 2.006591796875, 2.17852783203125, 2.3504638671875, 2.52239990234375, 2.6943359375, 2.86627197265625, 3.0382080078125, 3.21014404296875, 3.382080078125, 3.55401611328125, 3.7259521484375, 3.89788818359375, 4.06982421875, 4.24176025390625, 4.4136962890625, 4.58563232421875, 4.757568359375, 4.92950439453125, 5.1014404296875, 5.27337646484375, 5.4453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 13.0, 8.0, 18.0, 31.0, 36.0, 59.0, 95.0, 140.0, 212.0, 360.0, 491.0, 820.0, 1245.0, 1807.0, 2848.0, 4376.0, 6639.0, 10405.0, 16168.0, 25620.0, 40513.0, 63814.0, 102028.0, 163117.0, 1258102.0, 147703.0, 91539.0, 57841.0, 36547.0, 22934.0, 14644.0, 9679.0, 6114.0, 3909.0, 2587.0, 1670.0, 1031.0, 650.0, 468.0, 297.0, 224.0, 107.0, 83.0, 50.0, 36.0, 25.0, 13.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-1.01953125, -0.9898834228515625, -0.960235595703125, -0.9305877685546875, -0.90093994140625, -0.8712921142578125, -0.841644287109375, -0.8119964599609375, -0.7823486328125, -0.7527008056640625, -0.723052978515625, -0.6934051513671875, -0.66375732421875, -0.6341094970703125, -0.604461669921875, -0.5748138427734375, -0.545166015625, -0.5155181884765625, -0.485870361328125, -0.4562225341796875, -0.42657470703125, -0.3969268798828125, -0.367279052734375, -0.3376312255859375, -0.3079833984375, -0.2783355712890625, -0.248687744140625, -0.2190399169921875, -0.18939208984375, -0.1597442626953125, -0.130096435546875, -0.1004486083984375, -0.07080078125, -0.0411529541015625, -0.011505126953125, 0.0181427001953125, 0.04779052734375, 0.0774383544921875, 0.107086181640625, 0.1367340087890625, 0.1663818359375, 0.1960296630859375, 0.225677490234375, 0.2553253173828125, 0.28497314453125, 0.3146209716796875, 0.344268798828125, 0.3739166259765625, 0.403564453125, 0.4332122802734375, 0.462860107421875, 0.4925079345703125, 0.52215576171875, 0.5518035888671875, 0.581451416015625, 0.6110992431640625, 0.6407470703125, 0.6703948974609375, 0.700042724609375, 0.7296905517578125, 0.75933837890625, 0.7889862060546875, 0.818634033203125, 0.8482818603515625, 0.8779296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 6.0, 0.0, 3.0, 4.0, 3.0, 7.0, 6.0, 10.0, 12.0, 5.0, 13.0, 17.0, 24.0, 23.0, 29.0, 36.0, 41.0, 37.0, 58.0, 61.0, 69.0, 58.0, 51.0, 55.0, 54.0, 54.0, 46.0, 44.0, 27.0, 26.0, 22.0, 9.0, 15.0, 12.0, 10.0, 6.0, 7.0, 4.0, 10.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00142669677734375, -0.0013808012008666992, -0.0013349056243896484, -0.0012890100479125977, -0.0012431144714355469, -0.001197218894958496, -0.0011513233184814453, -0.0011054277420043945, -0.0010595321655273438, -0.001013636589050293, -0.0009677410125732422, -0.0009218454360961914, -0.0008759498596191406, -0.0008300542831420898, -0.0007841587066650391, -0.0007382631301879883, -0.0006923675537109375, -0.0006464719772338867, -0.0006005764007568359, -0.0005546808242797852, -0.0005087852478027344, -0.0004628896713256836, -0.0004169940948486328, -0.00037109851837158203, -0.00032520294189453125, -0.00027930736541748047, -0.0002334117889404297, -0.0001875162124633789, -0.00014162063598632812, -9.572505950927734e-05, -4.982948303222656e-05, -3.933906555175781e-06, 4.1961669921875e-05, 8.785724639892578e-05, 0.00013375282287597656, 0.00017964839935302734, 0.00022554397583007812, 0.0002714395523071289, 0.0003173351287841797, 0.00036323070526123047, 0.00040912628173828125, 0.00045502185821533203, 0.0005009174346923828, 0.0005468130111694336, 0.0005927085876464844, 0.0006386041641235352, 0.0006844997406005859, 0.0007303953170776367, 0.0007762908935546875, 0.0008221864700317383, 0.0008680820465087891, 0.0009139776229858398, 0.0009598731994628906, 0.0010057687759399414, 0.0010516643524169922, 0.001097559928894043, 0.0011434555053710938, 0.0011893510818481445, 0.0012352466583251953, 0.001281142234802246, 0.0013270378112792969, 0.0013729333877563477, 0.0014188289642333984, 0.0014647245407104492, 0.0015106201171875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 4.0, 3.0, 2.0, 7.0, 2.0, 12.0, 14.0, 12.0, 23.0, 35.0, 32.0, 55.0, 61.0, 96.0, 128.0, 216.0, 264.0, 666.0, 7048.0, 1036687.0, 1814.0, 473.0, 272.0, 183.0, 105.0, 73.0, 61.0, 39.0, 30.0, 33.0, 14.0, 19.0, 8.0, 13.0, 6.0, 4.0, 3.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.037139892578125, -0.03595590591430664, -0.03477191925048828, -0.03358793258666992, -0.03240394592285156, -0.031219959259033203, -0.030035972595214844, -0.028851985931396484, -0.027667999267578125, -0.026484012603759766, -0.025300025939941406, -0.024116039276123047, -0.022932052612304688, -0.021748065948486328, -0.02056407928466797, -0.01938009262084961, -0.01819610595703125, -0.01701211929321289, -0.01582813262939453, -0.014644145965576172, -0.013460159301757812, -0.012276172637939453, -0.011092185974121094, -0.009908199310302734, -0.008724212646484375, -0.007540225982666016, -0.006356239318847656, -0.005172252655029297, -0.0039882659912109375, -0.002804279327392578, -0.0016202926635742188, -0.0004363059997558594, 0.0007476806640625, 0.0019316673278808594, 0.0031156539916992188, 0.004299640655517578, 0.0054836273193359375, 0.006667613983154297, 0.007851600646972656, 0.009035587310791016, 0.010219573974609375, 0.011403560638427734, 0.012587547302246094, 0.013771533966064453, 0.014955520629882812, 0.016139507293701172, 0.01732349395751953, 0.01850748062133789, 0.01969146728515625, 0.02087545394897461, 0.02205944061279297, 0.023243427276611328, 0.024427413940429688, 0.025611400604248047, 0.026795387268066406, 0.027979373931884766, 0.029163360595703125, 0.030347347259521484, 0.031531333923339844, 0.0327153205871582, 0.03389930725097656, 0.03508329391479492, 0.03626728057861328, 0.03745126724243164, 0.03863525390625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 10.0, 33.0, 165.0, 434.0, 290.0, 68.0, 14.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003726032329723239, -0.0036445967853069305, -0.003563161240890622, -0.00348172546364367, -0.0034002899192273617, -0.0033188543748110533, -0.003237418830394745, -0.003155983053147793, -0.0030745475087314844, -0.002993111964315176, -0.0029116764198988676, -0.0028302406426519156, -0.002748805098235607, -0.0026673695538192987, -0.0025859340094029903, -0.0025044982321560383, -0.0024230629205703735, -0.002341627376154065, -0.0022601918317377567, -0.0021787560544908047, -0.0020973205100744963, -0.002015884965658188, -0.0019344494212418795, -0.0018530137604102492, -0.001771578099578619, -0.0016901425551623106, -0.0016087068943306804, -0.001527271349914372, -0.0014458356890827417, -0.0013644001446664333, -0.001282964600250125, -0.0012015289394184947, -0.0011200933950021863, -0.001038657850585878, -0.0009572221897542477, -0.0008757866453379393, -0.000794350984506309, -0.0007129154400900006, -0.0006314798374660313, -0.000550044234842062, -0.0004686086322180927, -0.00038717302959412336, -0.00030573742697015405, -0.0002243018534500152, -0.00014286625082604587, -6.143064820207655e-05, 2.0004925318062305e-05, 0.00010144052794203162, 0.00018287613056600094, 0.00026431173318997025, 0.00034574733581393957, 0.00042718290933407843, 0.0005086185410618782, 0.0005900540854781866, 0.0006714896881021559, 0.0007529252907261252, 0.0008343608933500946, 0.0009157964959740639, 0.0009972320403903723, 0.0010786677012220025, 0.001160103245638311, 0.0012415389064699411, 0.0013229744508862495, 0.001404409995302558, 0.0014858456561341882]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 5.0, 5.0, 7.0, 7.0, 6.0, 8.0, 19.0, 10.0, 16.0, 22.0, 26.0, 18.0, 33.0, 24.0, 32.0, 34.0, 50.0, 31.0, 43.0, 38.0, 49.0, 36.0, 51.0, 28.0, 46.0, 44.0, 28.0, 28.0, 38.0, 35.0, 26.0, 26.0, 27.0, 15.0, 16.0, 17.0, 13.0, 10.0, 3.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0008644461631774902, -0.0008378894999623299, -0.0008113328367471695, -0.0007847761735320091, -0.0007582195103168488, -0.0007316628471016884, -0.000705106183886528, -0.0006785495206713676, -0.0006519928574562073, -0.0006254361942410469, -0.0005988795310258865, -0.0005723228678107262, -0.0005457662045955658, -0.0005192095413804054, -0.0004926528781652451, -0.0004660962149500847, -0.0004395395517349243, -0.00041298288851976395, -0.0003864262253046036, -0.0003598695620894432, -0.00033331289887428284, -0.00030675623565912247, -0.0002801995724439621, -0.00025364290922880173, -0.00022708624601364136, -0.000200529582798481, -0.00017397291958332062, -0.00014741625636816025, -0.00012085959315299988, -9.430292993783951e-05, -6.774626672267914e-05, -4.118960350751877e-05, -1.4632940292358398e-05, 1.1923722922801971e-05, 3.848038613796234e-05, 6.503704935312271e-05, 9.159371256828308e-05, 0.00011815037578344345, 0.00014470703899860382, 0.0001712637022137642, 0.00019782036542892456, 0.00022437702864408493, 0.0002509336918592453, 0.00027749035507440567, 0.00030404701828956604, 0.0003306036815047264, 0.0003571603447198868, 0.00038371700793504715, 0.0004102736711502075, 0.0004368303343653679, 0.00046338699758052826, 0.0004899436607956886, 0.000516500324010849, 0.0005430569872260094, 0.0005696136504411697, 0.0005961703136563301, 0.0006227269768714905, 0.0006492836400866508, 0.0006758403033018112, 0.0007023969665169716, 0.000728953629732132, 0.0007555102929472923, 0.0007820669561624527, 0.0008086236193776131, 0.0008351802825927734]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 13.0, 13.0, 11.0, 20.0, 18.0, 25.0, 28.0, 29.0, 31.0, 34.0, 37.0, 32.0, 51.0, 44.0, 53.0, 41.0, 43.0, 47.0, 42.0, 39.0, 37.0, 29.0, 43.0, 35.0, 26.0, 29.0, 15.0, 16.0, 21.0, 13.0, 12.0, 14.0, 3.0, 3.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.160888671875, -7.88427734375, -7.607666015625, -7.3310546875, -7.054443359375, -6.77783203125, -6.501220703125, -6.224609375, -5.947998046875, -5.67138671875, -5.394775390625, -5.1181640625, -4.841552734375, -4.56494140625, -4.288330078125, -4.01171875, -3.735107421875, -3.45849609375, -3.181884765625, -2.9052734375, -2.628662109375, -2.35205078125, -2.075439453125, -1.798828125, -1.522216796875, -1.24560546875, -0.968994140625, -0.6923828125, -0.415771484375, -0.13916015625, 0.137451171875, 0.4140625, 0.690673828125, 0.96728515625, 1.243896484375, 1.5205078125, 1.797119140625, 2.07373046875, 2.350341796875, 2.626953125, 2.903564453125, 3.18017578125, 3.456787109375, 3.7333984375, 4.010009765625, 4.28662109375, 4.563232421875, 4.83984375, 5.116455078125, 5.39306640625, 5.669677734375, 5.9462890625, 6.222900390625, 6.49951171875, 6.776123046875, 7.052734375, 7.329345703125, 7.60595703125, 7.882568359375, 8.1591796875, 8.435791015625, 8.71240234375, 8.989013671875, 9.265625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 4.0, 3.0, 9.0, 15.0, 14.0, 18.0, 26.0, 57.0, 72.0, 84.0, 149.0, 253.0, 306.0, 507.0, 753.0, 1148.0, 1745.0, 2988.0, 5232.0, 9780.0, 21820.0, 58882.0, 221468.0, 506256.0, 139483.0, 41409.0, 16579.0, 8125.0, 4273.0, 2573.0, 1562.0, 967.0, 639.0, 471.0, 279.0, 190.0, 123.0, 87.0, 68.0, 49.0, 27.0, 22.0, 15.0, 8.0, 2.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6484375, -7.3963623046875, -7.144287109375, -6.8922119140625, -6.64013671875, -6.3880615234375, -6.135986328125, -5.8839111328125, -5.6318359375, -5.3797607421875, -5.127685546875, -4.8756103515625, -4.62353515625, -4.3714599609375, -4.119384765625, -3.8673095703125, -3.615234375, -3.3631591796875, -3.111083984375, -2.8590087890625, -2.60693359375, -2.3548583984375, -2.102783203125, -1.8507080078125, -1.5986328125, -1.3465576171875, -1.094482421875, -0.8424072265625, -0.59033203125, -0.3382568359375, -0.086181640625, 0.1658935546875, 0.41796875, 0.6700439453125, 0.922119140625, 1.1741943359375, 1.42626953125, 1.6783447265625, 1.930419921875, 2.1824951171875, 2.4345703125, 2.6866455078125, 2.938720703125, 3.1907958984375, 3.44287109375, 3.6949462890625, 3.947021484375, 4.1990966796875, 4.451171875, 4.7032470703125, 4.955322265625, 5.2073974609375, 5.45947265625, 5.7115478515625, 5.963623046875, 6.2156982421875, 6.4677734375, 6.7198486328125, 6.971923828125, 7.2239990234375, 7.47607421875, 7.7281494140625, 7.980224609375, 8.2322998046875, 8.484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 9.0, 9.0, 9.0, 11.0, 17.0, 12.0, 19.0, 12.0, 14.0, 27.0, 30.0, 34.0, 26.0, 34.0, 41.0, 46.0, 46.0, 45.0, 69.0, 203.0, 1738.0, 89.0, 57.0, 46.0, 39.0, 40.0, 37.0, 37.0, 33.0, 31.0, 27.0, 23.0, 32.0, 19.0, 15.0, 8.0, 9.0, 5.0, 4.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0], "bins": [-30.71875, -29.848388671875, -28.97802734375, -28.107666015625, -27.2373046875, -26.366943359375, -25.49658203125, -24.626220703125, -23.755859375, -22.885498046875, -22.01513671875, -21.144775390625, -20.2744140625, -19.404052734375, -18.53369140625, -17.663330078125, -16.79296875, -15.922607421875, -15.05224609375, -14.181884765625, -13.3115234375, -12.441162109375, -11.57080078125, -10.700439453125, -9.830078125, -8.959716796875, -8.08935546875, -7.218994140625, -6.3486328125, -5.478271484375, -4.60791015625, -3.737548828125, -2.8671875, -1.996826171875, -1.12646484375, -0.256103515625, 0.6142578125, 1.484619140625, 2.35498046875, 3.225341796875, 4.095703125, 4.966064453125, 5.83642578125, 6.706787109375, 7.5771484375, 8.447509765625, 9.31787109375, 10.188232421875, 11.05859375, 11.928955078125, 12.79931640625, 13.669677734375, 14.5400390625, 15.410400390625, 16.28076171875, 17.151123046875, 18.021484375, 18.891845703125, 19.76220703125, 20.632568359375, 21.5029296875, 22.373291015625, 23.24365234375, 24.114013671875, 24.984375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 2.0, 6.0, 5.0, 6.0, 6.0, 7.0, 10.0, 13.0, 11.0, 23.0, 22.0, 32.0, 40.0, 43.0, 70.0, 75.0, 117.0, 172.0, 315.0, 749.0, 2736.0, 52890.0, 3039456.0, 44498.0, 2657.0, 721.0, 342.0, 170.0, 112.0, 74.0, 46.0, 51.0, 39.0, 32.0, 22.0, 22.0, 12.0, 25.0, 15.0, 15.0, 8.0, 9.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-45.125, -43.59423828125, -42.0634765625, -40.53271484375, -39.001953125, -37.47119140625, -35.9404296875, -34.40966796875, -32.87890625, -31.34814453125, -29.8173828125, -28.28662109375, -26.755859375, -25.22509765625, -23.6943359375, -22.16357421875, -20.6328125, -19.10205078125, -17.5712890625, -16.04052734375, -14.509765625, -12.97900390625, -11.4482421875, -9.91748046875, -8.38671875, -6.85595703125, -5.3251953125, -3.79443359375, -2.263671875, -0.73291015625, 0.7978515625, 2.32861328125, 3.859375, 5.39013671875, 6.9208984375, 8.45166015625, 9.982421875, 11.51318359375, 13.0439453125, 14.57470703125, 16.10546875, 17.63623046875, 19.1669921875, 20.69775390625, 22.228515625, 23.75927734375, 25.2900390625, 26.82080078125, 28.3515625, 29.88232421875, 31.4130859375, 32.94384765625, 34.474609375, 36.00537109375, 37.5361328125, 39.06689453125, 40.59765625, 42.12841796875, 43.6591796875, 45.18994140625, 46.720703125, 48.25146484375, 49.7822265625, 51.31298828125, 52.84375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 1008.0, 0.0, 1.0], "bins": [-1240.0467529296875, -1219.8519287109375, -1199.656982421875, -1179.462158203125, -1159.267333984375, -1139.0723876953125, -1118.8775634765625, -1098.6826171875, -1078.48779296875, -1058.29296875, -1038.0980224609375, -1017.9031982421875, -997.7083129882812, -977.513427734375, -957.318603515625, -937.1237182617188, -916.9288330078125, -896.7339477539062, -876.5390625, -856.34423828125, -836.1493530273438, -815.9544677734375, -795.7596435546875, -775.5647583007812, -755.369873046875, -735.1749877929688, -714.9801025390625, -694.7852783203125, -674.5903930664062, -654.3955078125, -634.20068359375, -614.0057983398438, -593.8109130859375, -573.6160278320312, -553.421142578125, -533.226318359375, -513.0314331054688, -492.8365478515625, -472.6416931152344, -452.44683837890625, -432.251953125, -412.05706787109375, -391.8622131347656, -371.6673583984375, -351.47247314453125, -331.277587890625, -311.0827331542969, -290.88787841796875, -270.6929931640625, -250.4981231689453, -230.30325317382812, -210.10838317871094, -189.91351318359375, -169.71864318847656, -149.52377319335938, -129.3289031982422, -109.13404083251953, -88.93917083740234, -68.74430084228516, -48.54943084716797, -28.35456085205078, -8.159690856933594, 12.035179138183594, 32.23004913330078, 52.42491912841797]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 6.0, 14.0, 7.0, 8.0, 16.0, 20.0, 19.0, 34.0, 22.0, 26.0, 31.0, 20.0, 28.0, 27.0, 36.0, 38.0, 34.0, 43.0, 35.0, 36.0, 25.0, 48.0, 28.0, 35.0, 47.0, 34.0, 28.0, 23.0, 31.0, 19.0, 24.0, 23.0, 22.0, 27.0, 20.0, 15.0, 10.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-91.7229232788086, -88.89141082763672, -86.05990600585938, -83.2283935546875, -80.39688110351562, -77.56536865234375, -74.7338638305664, -71.90235137939453, -69.07084655761719, -66.23933410644531, -63.4078254699707, -60.576316833496094, -57.74480438232422, -54.91329574584961, -52.081787109375, -49.250274658203125, -46.41876220703125, -43.58725357055664, -40.755741119384766, -37.924232482910156, -35.09272003173828, -32.26121139526367, -29.429702758789062, -26.59819221496582, -23.766681671142578, -20.935171127319336, -18.103660583496094, -15.272151947021484, -12.440641403198242, -9.609130859375, -6.777622222900391, -3.9461116790771484, -1.1146087646484375, 1.7169013023376465, 4.5484113693237305, 7.379920959472656, 10.211431503295898, 13.04294204711914, 15.87445068359375, 18.705961227416992, 21.537471771240234, 24.368982315063477, 27.20049285888672, 30.032001495361328, 32.86351013183594, 35.69502258300781, 38.52653121948242, 41.35803985595703, 44.189552307128906, 47.021060943603516, 49.85257339477539, 52.68408203125, 55.515594482421875, 58.347103118896484, 61.178611755371094, 64.01012420654297, 66.84162902832031, 69.67314147949219, 72.50464630126953, 75.3361587524414, 78.16767120361328, 80.99917602539062, 83.8306884765625, 86.66220092773438, 89.49371337890625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 10.0, 5.0, 10.0, 8.0, 12.0, 18.0, 18.0, 18.0, 25.0, 22.0, 31.0, 36.0, 38.0, 28.0, 49.0, 43.0, 45.0, 48.0, 49.0, 49.0, 43.0, 47.0, 39.0, 34.0, 44.0, 38.0, 27.0, 26.0, 19.0, 24.0, 21.0, 18.0, 9.0, 11.0, 7.0, 4.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -9.007080078125, -8.70947265625, -8.411865234375, -8.1142578125, -7.816650390625, -7.51904296875, -7.221435546875, -6.923828125, -6.626220703125, -6.32861328125, -6.031005859375, -5.7333984375, -5.435791015625, -5.13818359375, -4.840576171875, -4.54296875, -4.245361328125, -3.94775390625, -3.650146484375, -3.3525390625, -3.054931640625, -2.75732421875, -2.459716796875, -2.162109375, -1.864501953125, -1.56689453125, -1.269287109375, -0.9716796875, -0.674072265625, -0.37646484375, -0.078857421875, 0.21875, 0.516357421875, 0.81396484375, 1.111572265625, 1.4091796875, 1.706787109375, 2.00439453125, 2.302001953125, 2.599609375, 2.897216796875, 3.19482421875, 3.492431640625, 3.7900390625, 4.087646484375, 4.38525390625, 4.682861328125, 4.98046875, 5.278076171875, 5.57568359375, 5.873291015625, 6.1708984375, 6.468505859375, 6.76611328125, 7.063720703125, 7.361328125, 7.658935546875, 7.95654296875, 8.254150390625, 8.5517578125, 8.849365234375, 9.14697265625, 9.444580078125, 9.7421875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 2.0, 7.0, 2.0, 7.0, 14.0, 14.0, 10.0, 21.0, 19.0, 18.0, 27.0, 35.0, 33.0, 47.0, 55.0, 112.0, 327.0, 1723.0, 26262.0, 2539522.0, 1606848.0, 17244.0, 1255.0, 245.0, 95.0, 58.0, 39.0, 32.0, 38.0, 33.0, 24.0, 14.0, 17.0, 13.0, 10.0, 9.0, 11.0, 8.0, 9.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.46875, -49.80517578125, -48.1416015625, -46.47802734375, -44.814453125, -43.15087890625, -41.4873046875, -39.82373046875, -38.16015625, -36.49658203125, -34.8330078125, -33.16943359375, -31.505859375, -29.84228515625, -28.1787109375, -26.51513671875, -24.8515625, -23.18798828125, -21.5244140625, -19.86083984375, -18.197265625, -16.53369140625, -14.8701171875, -13.20654296875, -11.54296875, -9.87939453125, -8.2158203125, -6.55224609375, -4.888671875, -3.22509765625, -1.5615234375, 0.10205078125, 1.765625, 3.42919921875, 5.0927734375, 6.75634765625, 8.419921875, 10.08349609375, 11.7470703125, 13.41064453125, 15.07421875, 16.73779296875, 18.4013671875, 20.06494140625, 21.728515625, 23.39208984375, 25.0556640625, 26.71923828125, 28.3828125, 30.04638671875, 31.7099609375, 33.37353515625, 35.037109375, 36.70068359375, 38.3642578125, 40.02783203125, 41.69140625, 43.35498046875, 45.0185546875, 46.68212890625, 48.345703125, 50.00927734375, 51.6728515625, 53.33642578125, 55.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 9.0, 13.0, 23.0, 38.0, 56.0, 85.0, 129.0, 190.0, 329.0, 453.0, 635.0, 714.0, 474.0, 322.0, 233.0, 135.0, 79.0, 60.0, 40.0, 22.0, 15.0, 9.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.46337890625, -35.2080078125, -33.95263671875, -32.697265625, -31.44189453125, -30.1865234375, -28.93115234375, -27.67578125, -26.42041015625, -25.1650390625, -23.90966796875, -22.654296875, -21.39892578125, -20.1435546875, -18.88818359375, -17.6328125, -16.37744140625, -15.1220703125, -13.86669921875, -12.611328125, -11.35595703125, -10.1005859375, -8.84521484375, -7.58984375, -6.33447265625, -5.0791015625, -3.82373046875, -2.568359375, -1.31298828125, -0.0576171875, 1.19775390625, 2.453125, 3.70849609375, 4.9638671875, 6.21923828125, 7.474609375, 8.72998046875, 9.9853515625, 11.24072265625, 12.49609375, 13.75146484375, 15.0068359375, 16.26220703125, 17.517578125, 18.77294921875, 20.0283203125, 21.28369140625, 22.5390625, 23.79443359375, 25.0498046875, 26.30517578125, 27.560546875, 28.81591796875, 30.0712890625, 31.32666015625, 32.58203125, 33.83740234375, 35.0927734375, 36.34814453125, 37.603515625, 38.85888671875, 40.1142578125, 41.36962890625, 42.625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 16.0, 18.0, 29.0, 47.0, 71.0, 100.0, 186.0, 385.0, 1035.0, 97999.0, 4087978.0, 5239.0, 520.0, 273.0, 164.0, 88.0, 62.0, 32.0, 17.0, 12.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-190.25, -184.533203125, -178.81640625, -173.099609375, -167.3828125, -161.666015625, -155.94921875, -150.232421875, -144.515625, -138.798828125, -133.08203125, -127.365234375, -121.6484375, -115.931640625, -110.21484375, -104.498046875, -98.78125, -93.064453125, -87.34765625, -81.630859375, -75.9140625, -70.197265625, -64.48046875, -58.763671875, -53.046875, -47.330078125, -41.61328125, -35.896484375, -30.1796875, -24.462890625, -18.74609375, -13.029296875, -7.3125, -1.595703125, 4.12109375, 9.837890625, 15.5546875, 21.271484375, 26.98828125, 32.705078125, 38.421875, 44.138671875, 49.85546875, 55.572265625, 61.2890625, 67.005859375, 72.72265625, 78.439453125, 84.15625, 89.873046875, 95.58984375, 101.306640625, 107.0234375, 112.740234375, 118.45703125, 124.173828125, 129.890625, 135.607421875, 141.32421875, 147.041015625, 152.7578125, 158.474609375, 164.19140625, 169.908203125, 175.625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 16.0, 85.0, 184.0, 298.0, 261.0, 109.0, 46.0, 11.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-399.3083190917969, -391.5912170410156, -383.87408447265625, -376.156982421875, -368.43988037109375, -360.7227478027344, -353.0056457519531, -345.2885437011719, -337.5714111328125, -329.85430908203125, -322.1371765136719, -314.4200744628906, -306.7029724121094, -298.98583984375, -291.26873779296875, -283.5516357421875, -275.83453369140625, -268.117431640625, -260.4002990722656, -252.68319702148438, -244.96607971191406, -237.2489776611328, -229.5318603515625, -221.81475830078125, -214.09762573242188, -206.38050842285156, -198.6634063720703, -190.9462890625, -183.2291717529297, -175.51206970214844, -167.79495239257812, -160.07785034179688, -152.3607177734375, -144.6436004638672, -136.92649841308594, -129.20938110351562, -121.49227142333984, -113.77516174316406, -106.05804443359375, -98.34093475341797, -90.62382507324219, -82.9067153930664, -75.1895980834961, -67.47248840332031, -59.75537872314453, -52.038265228271484, -44.32115173339844, -36.604042053222656, -28.886932373046875, -21.16982078552246, -13.45270824432373, -5.735595703125, 1.981515884399414, 9.698627471923828, 17.415740966796875, 25.132850646972656, 32.8499641418457, 40.56707763671875, 48.28418731689453, 56.00130081176758, 63.718414306640625, 71.4355239868164, 79.15263366699219, 86.8697509765625, 94.58686065673828]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 8.0, 8.0, 16.0, 22.0, 22.0, 24.0, 29.0, 41.0, 45.0, 31.0, 46.0, 46.0, 46.0, 40.0, 34.0, 45.0, 50.0, 50.0, 43.0, 40.0, 39.0, 42.0, 31.0, 28.0, 27.0, 21.0, 21.0, 16.0, 16.0, 13.0, 18.0, 11.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.91848754882812, -92.65423583984375, -89.38998413085938, -86.125732421875, -82.86148071289062, -79.59722900390625, -76.33297729492188, -73.0687255859375, -69.80447387695312, -66.54022216796875, -63.275970458984375, -60.01171875, -56.747467041015625, -53.48321533203125, -50.21895980834961, -46.954708099365234, -43.690452575683594, -40.42620086669922, -37.161949157714844, -33.89769744873047, -30.63344383239746, -27.369192123413086, -24.104938507080078, -20.840686798095703, -17.576435089111328, -14.312183380126953, -11.047930717468262, -7.78367805480957, -4.519426345825195, -1.2551746368408203, 2.0090789794921875, 5.2733306884765625, 8.537582397460938, 11.801834106445312, 15.066086769104004, 18.330339431762695, 21.59459114074707, 24.858842849731445, 28.123096466064453, 31.387348175048828, 34.6515998840332, 37.91585159301758, 41.18010330200195, 44.444358825683594, 47.70861053466797, 50.972862243652344, 54.23711395263672, 57.501365661621094, 60.76561737060547, 64.02986907958984, 67.29412078857422, 70.5583724975586, 73.82262420654297, 77.08687591552734, 80.35113525390625, 83.61538696289062, 86.879638671875, 90.14389038085938, 93.40814208984375, 96.67239379882812, 99.9366455078125, 103.20089721679688, 106.46514892578125, 109.72940063476562, 112.99365234375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 4.0, 5.0, 4.0, 6.0, 15.0, 5.0, 10.0, 12.0, 21.0, 26.0, 20.0, 37.0, 25.0, 35.0, 37.0, 42.0, 46.0, 36.0, 53.0, 42.0, 35.0, 38.0, 54.0, 37.0, 35.0, 31.0, 40.0, 37.0, 26.0, 25.0, 29.0, 21.0, 22.0, 20.0, 9.0, 8.0, 16.0, 5.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.758056640625, -8.46923828125, -8.180419921875, -7.8916015625, -7.602783203125, -7.31396484375, -7.025146484375, -6.736328125, -6.447509765625, -6.15869140625, -5.869873046875, -5.5810546875, -5.292236328125, -5.00341796875, -4.714599609375, -4.42578125, -4.136962890625, -3.84814453125, -3.559326171875, -3.2705078125, -2.981689453125, -2.69287109375, -2.404052734375, -2.115234375, -1.826416015625, -1.53759765625, -1.248779296875, -0.9599609375, -0.671142578125, -0.38232421875, -0.093505859375, 0.1953125, 0.484130859375, 0.77294921875, 1.061767578125, 1.3505859375, 1.639404296875, 1.92822265625, 2.217041015625, 2.505859375, 2.794677734375, 3.08349609375, 3.372314453125, 3.6611328125, 3.949951171875, 4.23876953125, 4.527587890625, 4.81640625, 5.105224609375, 5.39404296875, 5.682861328125, 5.9716796875, 6.260498046875, 6.54931640625, 6.838134765625, 7.126953125, 7.415771484375, 7.70458984375, 7.993408203125, 8.2822265625, 8.571044921875, 8.85986328125, 9.148681640625, 9.4375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 15.0, 12.0, 22.0, 26.0, 56.0, 78.0, 113.0, 171.0, 263.0, 372.0, 557.0, 791.0, 1244.0, 1735.0, 2689.0, 4046.0, 5964.0, 8652.0, 12841.0, 19322.0, 28485.0, 42159.0, 60807.0, 89174.0, 135686.0, 187533.0, 146340.0, 95435.0, 65242.0, 44524.0, 30752.0, 20937.0, 13933.0, 9385.0, 6229.0, 4196.0, 2847.0, 1865.0, 1291.0, 878.0, 610.0, 418.0, 252.0, 198.0, 132.0, 88.0, 57.0, 51.0, 30.0, 24.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.91845703125, -0.8893814086914062, -0.8603057861328125, -0.8312301635742188, -0.802154541015625, -0.7730789184570312, -0.7440032958984375, -0.7149276733398438, -0.68585205078125, -0.6567764282226562, -0.6277008056640625, -0.5986251831054688, -0.569549560546875, -0.5404739379882812, -0.5113983154296875, -0.48232269287109375, -0.4532470703125, -0.42417144775390625, -0.3950958251953125, -0.36602020263671875, -0.336944580078125, -0.30786895751953125, -0.2787933349609375, -0.24971771240234375, -0.22064208984375, -0.19156646728515625, -0.1624908447265625, -0.13341522216796875, -0.104339599609375, -0.07526397705078125, -0.0461883544921875, -0.01711273193359375, 0.011962890625, 0.04103851318359375, 0.0701141357421875, 0.09918975830078125, 0.128265380859375, 0.15734100341796875, 0.1864166259765625, 0.21549224853515625, 0.24456787109375, 0.27364349365234375, 0.3027191162109375, 0.33179473876953125, 0.360870361328125, 0.38994598388671875, 0.4190216064453125, 0.44809722900390625, 0.4771728515625, 0.5062484741210938, 0.5353240966796875, 0.5643997192382812, 0.593475341796875, 0.6225509643554688, 0.6516265869140625, 0.6807022094726562, 0.70977783203125, 0.7388534545898438, 0.7679290771484375, 0.7970046997070312, 0.826080322265625, 0.8551559448242188, 0.8842315673828125, 0.9133071899414062, 0.9423828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 5.0, 7.0, 13.0, 9.0, 12.0, 20.0, 18.0, 15.0, 25.0, 30.0, 23.0, 24.0, 29.0, 31.0, 34.0, 33.0, 37.0, 44.0, 41.0, 1059.0, 48.0, 47.0, 37.0, 42.0, 33.0, 38.0, 32.0, 23.0, 28.0, 20.0, 23.0, 16.0, 17.0, 12.0, 13.0, 9.0, 8.0, 11.0, 11.0, 6.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.0703125, -4.90484619140625, -4.7393798828125, -4.57391357421875, -4.408447265625, -4.24298095703125, -4.0775146484375, -3.91204833984375, -3.74658203125, -3.58111572265625, -3.4156494140625, -3.25018310546875, -3.084716796875, -2.91925048828125, -2.7537841796875, -2.58831787109375, -2.4228515625, -2.25738525390625, -2.0919189453125, -1.92645263671875, -1.760986328125, -1.59552001953125, -1.4300537109375, -1.26458740234375, -1.09912109375, -0.93365478515625, -0.7681884765625, -0.60272216796875, -0.437255859375, -0.27178955078125, -0.1063232421875, 0.05914306640625, 0.224609375, 0.39007568359375, 0.5555419921875, 0.72100830078125, 0.886474609375, 1.05194091796875, 1.2174072265625, 1.38287353515625, 1.54833984375, 1.71380615234375, 1.8792724609375, 2.04473876953125, 2.210205078125, 2.37567138671875, 2.5411376953125, 2.70660400390625, 2.8720703125, 3.03753662109375, 3.2030029296875, 3.36846923828125, 3.533935546875, 3.69940185546875, 3.8648681640625, 4.03033447265625, 4.19580078125, 4.36126708984375, 4.5267333984375, 4.69219970703125, 4.857666015625, 5.02313232421875, 5.1885986328125, 5.35406494140625, 5.51953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 11.0, 9.0, 13.0, 28.0, 45.0, 74.0, 108.0, 148.0, 192.0, 283.0, 429.0, 620.0, 866.0, 1316.0, 1999.0, 3087.0, 4616.0, 7003.0, 10408.0, 16379.0, 24687.0, 37591.0, 58675.0, 92622.0, 148704.0, 1260285.0, 155088.0, 96466.0, 61335.0, 39197.0, 25512.0, 16896.0, 10818.0, 7292.0, 4756.0, 3199.0, 2173.0, 1408.0, 963.0, 600.0, 398.0, 273.0, 183.0, 132.0, 80.0, 56.0, 39.0, 29.0, 19.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.99755859375, -0.9678192138671875, -0.938079833984375, -0.9083404541015625, -0.87860107421875, -0.8488616943359375, -0.819122314453125, -0.7893829345703125, -0.7596435546875, -0.7299041748046875, -0.700164794921875, -0.6704254150390625, -0.64068603515625, -0.6109466552734375, -0.581207275390625, -0.5514678955078125, -0.521728515625, -0.4919891357421875, -0.462249755859375, -0.4325103759765625, -0.40277099609375, -0.3730316162109375, -0.343292236328125, -0.3135528564453125, -0.2838134765625, -0.2540740966796875, -0.224334716796875, -0.1945953369140625, -0.16485595703125, -0.1351165771484375, -0.105377197265625, -0.0756378173828125, -0.0458984375, -0.0161590576171875, 0.013580322265625, 0.0433197021484375, 0.07305908203125, 0.1027984619140625, 0.132537841796875, 0.1622772216796875, 0.1920166015625, 0.2217559814453125, 0.251495361328125, 0.2812347412109375, 0.31097412109375, 0.3407135009765625, 0.370452880859375, 0.4001922607421875, 0.429931640625, 0.4596710205078125, 0.489410400390625, 0.5191497802734375, 0.54888916015625, 0.5786285400390625, 0.608367919921875, 0.6381072998046875, 0.6678466796875, 0.6975860595703125, 0.727325439453125, 0.7570648193359375, 0.78680419921875, 0.8165435791015625, 0.846282958984375, 0.8760223388671875, 0.90576171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 14.0, 22.0, 24.0, 30.0, 31.0, 53.0, 42.0, 59.0, 65.0, 64.0, 75.0, 66.0, 66.0, 59.0, 65.0, 45.0, 39.0, 34.0, 26.0, 25.0, 18.0, 21.0, 8.0, 6.0, 1.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002208709716796875, -0.002143755555152893, -0.002078801393508911, -0.002013847231864929, -0.0019488930702209473, -0.0018839389085769653, -0.0018189847469329834, -0.0017540305852890015, -0.0016890764236450195, -0.0016241222620010376, -0.0015591681003570557, -0.0014942139387130737, -0.0014292597770690918, -0.0013643056154251099, -0.001299351453781128, -0.001234397292137146, -0.001169443130493164, -0.0011044889688491821, -0.0010395348072052002, -0.0009745806455612183, -0.0009096264839172363, -0.0008446723222732544, -0.0007797181606292725, -0.0007147639989852905, -0.0006498098373413086, -0.0005848556756973267, -0.0005199015140533447, -0.0004549473524093628, -0.00038999319076538086, -0.0003250390291213989, -0.000260084867477417, -0.00019513070583343506, -0.00013017654418945312, -6.522238254547119e-05, -2.682209014892578e-07, 6.468594074249268e-05, 0.0001296401023864746, 0.00019459426403045654, 0.0002595484256744385, 0.0003245025873184204, 0.00038945674896240234, 0.0004544109106063843, 0.0005193650722503662, 0.0005843192338943481, 0.0006492733955383301, 0.000714227557182312, 0.0007791817188262939, 0.0008441358804702759, 0.0009090900421142578, 0.0009740442037582397, 0.0010389983654022217, 0.0011039525270462036, 0.0011689066886901855, 0.0012338608503341675, 0.0012988150119781494, 0.0013637691736221313, 0.0014287233352661133, 0.0014936774969100952, 0.0015586316585540771, 0.001623585820198059, 0.001688539981842041, 0.001753494143486023, 0.0018184483051300049, 0.0018834024667739868, 0.0019483566284179688]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 0.0, 2.0, 6.0, 3.0, 11.0, 15.0, 14.0, 23.0, 27.0, 37.0, 51.0, 53.0, 90.0, 142.0, 236.0, 403.0, 1101.0, 969208.0, 75417.0, 758.0, 347.0, 182.0, 124.0, 80.0, 52.0, 44.0, 33.0, 18.0, 25.0, 15.0, 10.0, 7.0, 3.0, 2.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0511474609375, -0.049680233001708984, -0.04821300506591797, -0.04674577713012695, -0.04527854919433594, -0.04381132125854492, -0.042344093322753906, -0.04087686538696289, -0.039409637451171875, -0.03794240951538086, -0.036475181579589844, -0.03500795364379883, -0.03354072570800781, -0.0320734977722168, -0.03060626983642578, -0.029139041900634766, -0.02767181396484375, -0.026204586029052734, -0.02473735809326172, -0.023270130157470703, -0.021802902221679688, -0.020335674285888672, -0.018868446350097656, -0.01740121841430664, -0.015933990478515625, -0.01446676254272461, -0.012999534606933594, -0.011532306671142578, -0.010065078735351562, -0.008597850799560547, -0.007130622863769531, -0.005663394927978516, -0.0041961669921875, -0.0027289390563964844, -0.0012617111206054688, 0.00020551681518554688, 0.0016727447509765625, 0.003139972686767578, 0.004607200622558594, 0.006074428558349609, 0.007541656494140625, 0.00900888442993164, 0.010476112365722656, 0.011943340301513672, 0.013410568237304688, 0.014877796173095703, 0.01634502410888672, 0.017812252044677734, 0.01927947998046875, 0.020746707916259766, 0.02221393585205078, 0.023681163787841797, 0.025148391723632812, 0.026615619659423828, 0.028082847595214844, 0.02955007553100586, 0.031017303466796875, 0.03248453140258789, 0.033951759338378906, 0.03541898727416992, 0.03688621520996094, 0.03835344314575195, 0.03982067108154297, 0.041287899017333984, 0.042755126953125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.0, 318.0, 515.0, 125.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052827103063464165, -0.005151478108018637, -0.005020245909690857, -0.00488901324570179, -0.00475778104737401, -0.00462654884904623, -0.0044953166507184505, -0.004364084452390671, -0.004232851788401604, -0.004101619590073824, -0.003970387391746044, -0.0038391549605876207, -0.0037079225294291973, -0.0035766903311014175, -0.0034454581327736378, -0.003314225934445858, -0.0031829937361180782, -0.0030517615377902985, -0.002920529106631875, -0.0027892969083040953, -0.002658064477145672, -0.002526832278817892, -0.0023956000804901123, -0.0022643678821623325, -0.002133135451003909, -0.0020019032526761293, -0.001870670821517706, -0.0017394386231899261, -0.0016082063084468246, -0.001476973993703723, -0.0013457417953759432, -0.0012145094806328416, -0.0010832776315510273, -0.0009520453168079257, -0.000820813060272485, -0.0006895808037370443, -0.0005583484889939427, -0.00042711617425084114, -0.00029588391771540046, -0.00016465166117995977, -3.341934643685818e-05, 9.781293920241296e-05, 0.0002290452248416841, 0.00036027751048095524, 0.0004915097961202264, 0.000622742110863328, 0.0007539743673987687, 0.0008852066239342093, 0.001016438938677311, 0.0011476712534204125, 0.0012789035681635141, 0.001410135766491294, 0.0015413680812343955, 0.001672600395977497, 0.0018038325943052769, 0.0019350649090483785, 0.00206629722379148, 0.00219752942211926, 0.0023287618532776833, 0.002459994051605463, 0.002591226249933243, 0.0027224586810916662, 0.002853690879419446, 0.0029849233105778694, 0.003116155508905649]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 3.0, 4.0, 11.0, 1.0, 9.0, 10.0, 15.0, 20.0, 19.0, 30.0, 14.0, 17.0, 27.0, 17.0, 22.0, 27.0, 38.0, 35.0, 32.0, 30.0, 36.0, 43.0, 38.0, 30.0, 34.0, 30.0, 38.0, 43.0, 31.0, 22.0, 22.0, 30.0, 30.0, 14.0, 20.0, 23.0, 22.0, 12.0, 21.0, 13.0, 10.0, 6.0, 7.0, 7.0, 4.0, 6.0, 2.0, 5.0, 5.0, 1.0, 2.0, 0.0, 4.0, 4.0], "bins": [-0.0008194446563720703, -0.000794626772403717, -0.0007698088884353638, -0.0007449910044670105, -0.0007201731204986572, -0.000695355236530304, -0.0006705373525619507, -0.0006457194685935974, -0.0006209015846252441, -0.0005960837006568909, -0.0005712658166885376, -0.0005464479327201843, -0.0005216300487518311, -0.0004968121647834778, -0.0004719942808151245, -0.00044717639684677124, -0.00042235851287841797, -0.0003975406289100647, -0.0003727227449417114, -0.00034790486097335815, -0.0003230869770050049, -0.0002982690930366516, -0.00027345120906829834, -0.00024863332509994507, -0.0002238154411315918, -0.00019899755716323853, -0.00017417967319488525, -0.00014936178922653198, -0.0001245439052581787, -9.972602128982544e-05, -7.490813732147217e-05, -5.0090253353118896e-05, -2.5272369384765625e-05, -4.544854164123535e-07, 2.4363398551940918e-05, 4.918128252029419e-05, 7.399916648864746e-05, 9.881705045700073e-05, 0.000123634934425354, 0.00014845281839370728, 0.00017327070236206055, 0.00019808858633041382, 0.0002229064702987671, 0.00024772435426712036, 0.00027254223823547363, 0.0002973601222038269, 0.0003221780061721802, 0.00034699589014053345, 0.0003718137741088867, 0.00039663165807724, 0.00042144954204559326, 0.00044626742601394653, 0.0004710853099822998, 0.0004959031939506531, 0.0005207210779190063, 0.0005455389618873596, 0.0005703568458557129, 0.0005951747298240662, 0.0006199926137924194, 0.0006448104977607727, 0.000669628381729126, 0.0006944462656974792, 0.0007192641496658325, 0.0007440820336341858, 0.0007688999176025391]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 4.0, 5.0, 4.0, 6.0, 15.0, 5.0, 10.0, 12.0, 21.0, 26.0, 20.0, 37.0, 25.0, 35.0, 37.0, 42.0, 46.0, 36.0, 53.0, 42.0, 35.0, 38.0, 54.0, 37.0, 35.0, 31.0, 40.0, 37.0, 26.0, 25.0, 29.0, 21.0, 22.0, 20.0, 9.0, 8.0, 16.0, 5.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.758056640625, -8.46923828125, -8.180419921875, -7.8916015625, -7.602783203125, -7.31396484375, -7.025146484375, -6.736328125, -6.447509765625, -6.15869140625, -5.869873046875, -5.5810546875, -5.292236328125, -5.00341796875, -4.714599609375, -4.42578125, -4.136962890625, -3.84814453125, -3.559326171875, -3.2705078125, -2.981689453125, -2.69287109375, -2.404052734375, -2.115234375, -1.826416015625, -1.53759765625, -1.248779296875, -0.9599609375, -0.671142578125, -0.38232421875, -0.093505859375, 0.1953125, 0.484130859375, 0.77294921875, 1.061767578125, 1.3505859375, 1.639404296875, 1.92822265625, 2.217041015625, 2.505859375, 2.794677734375, 3.08349609375, 3.372314453125, 3.6611328125, 3.949951171875, 4.23876953125, 4.527587890625, 4.81640625, 5.105224609375, 5.39404296875, 5.682861328125, 5.9716796875, 6.260498046875, 6.54931640625, 6.838134765625, 7.126953125, 7.415771484375, 7.70458984375, 7.993408203125, 8.2822265625, 8.571044921875, 8.85986328125, 9.148681640625, 9.4375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 13.0, 17.0, 23.0, 36.0, 50.0, 83.0, 109.0, 170.0, 214.0, 356.0, 556.0, 985.0, 1795.0, 3604.0, 7959.0, 24015.0, 106702.0, 585630.0, 248270.0, 44527.0, 12522.0, 5034.0, 2490.0, 1313.0, 709.0, 467.0, 302.0, 185.0, 117.0, 88.0, 65.0, 36.0, 30.0, 23.0, 13.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7421875, -7.4525146484375, -7.162841796875, -6.8731689453125, -6.58349609375, -6.2938232421875, -6.004150390625, -5.7144775390625, -5.4248046875, -5.1351318359375, -4.845458984375, -4.5557861328125, -4.26611328125, -3.9764404296875, -3.686767578125, -3.3970947265625, -3.107421875, -2.8177490234375, -2.528076171875, -2.2384033203125, -1.94873046875, -1.6590576171875, -1.369384765625, -1.0797119140625, -0.7900390625, -0.5003662109375, -0.210693359375, 0.0789794921875, 0.36865234375, 0.6583251953125, 0.947998046875, 1.2376708984375, 1.52734375, 1.8170166015625, 2.106689453125, 2.3963623046875, 2.68603515625, 2.9757080078125, 3.265380859375, 3.5550537109375, 3.8447265625, 4.1343994140625, 4.424072265625, 4.7137451171875, 5.00341796875, 5.2930908203125, 5.582763671875, 5.8724365234375, 6.162109375, 6.4517822265625, 6.741455078125, 7.0311279296875, 7.32080078125, 7.6104736328125, 7.900146484375, 8.1898193359375, 8.4794921875, 8.7691650390625, 9.058837890625, 9.3485107421875, 9.63818359375, 9.9278564453125, 10.217529296875, 10.5072021484375, 10.796875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 10.0, 10.0, 12.0, 16.0, 12.0, 16.0, 22.0, 25.0, 26.0, 27.0, 38.0, 38.0, 30.0, 30.0, 44.0, 70.0, 101.0, 1696.0, 276.0, 94.0, 67.0, 47.0, 41.0, 41.0, 29.0, 32.0, 35.0, 18.0, 13.0, 21.0, 9.0, 9.0, 14.0, 9.0, 9.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-32.40625, -31.418212890625, -30.43017578125, -29.442138671875, -28.4541015625, -27.466064453125, -26.47802734375, -25.489990234375, -24.501953125, -23.513916015625, -22.52587890625, -21.537841796875, -20.5498046875, -19.561767578125, -18.57373046875, -17.585693359375, -16.59765625, -15.609619140625, -14.62158203125, -13.633544921875, -12.6455078125, -11.657470703125, -10.66943359375, -9.681396484375, -8.693359375, -7.705322265625, -6.71728515625, -5.729248046875, -4.7412109375, -3.753173828125, -2.76513671875, -1.777099609375, -0.7890625, 0.198974609375, 1.18701171875, 2.175048828125, 3.1630859375, 4.151123046875, 5.13916015625, 6.127197265625, 7.115234375, 8.103271484375, 9.09130859375, 10.079345703125, 11.0673828125, 12.055419921875, 13.04345703125, 14.031494140625, 15.01953125, 16.007568359375, 16.99560546875, 17.983642578125, 18.9716796875, 19.959716796875, 20.94775390625, 21.935791015625, 22.923828125, 23.911865234375, 24.89990234375, 25.887939453125, 26.8759765625, 27.864013671875, 28.85205078125, 29.840087890625, 30.828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 7.0, 14.0, 13.0, 11.0, 13.0, 23.0, 17.0, 31.0, 41.0, 56.0, 66.0, 109.0, 161.0, 269.0, 615.0, 2445.0, 42182.0, 3069248.0, 27000.0, 1894.0, 595.0, 243.0, 158.0, 117.0, 77.0, 51.0, 37.0, 43.0, 24.0, 21.0, 12.0, 14.0, 13.0, 14.0, 6.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.21875, -49.59033203125, -47.9619140625, -46.33349609375, -44.705078125, -43.07666015625, -41.4482421875, -39.81982421875, -38.19140625, -36.56298828125, -34.9345703125, -33.30615234375, -31.677734375, -30.04931640625, -28.4208984375, -26.79248046875, -25.1640625, -23.53564453125, -21.9072265625, -20.27880859375, -18.650390625, -17.02197265625, -15.3935546875, -13.76513671875, -12.13671875, -10.50830078125, -8.8798828125, -7.25146484375, -5.623046875, -3.99462890625, -2.3662109375, -0.73779296875, 0.890625, 2.51904296875, 4.1474609375, 5.77587890625, 7.404296875, 9.03271484375, 10.6611328125, 12.28955078125, 13.91796875, 15.54638671875, 17.1748046875, 18.80322265625, 20.431640625, 22.06005859375, 23.6884765625, 25.31689453125, 26.9453125, 28.57373046875, 30.2021484375, 31.83056640625, 33.458984375, 35.08740234375, 36.7158203125, 38.34423828125, 39.97265625, 41.60107421875, 43.2294921875, 44.85791015625, 46.486328125, 48.11474609375, 49.7431640625, 51.37158203125, 53.0]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 183.0, 829.0, 5.0], "bins": [-734.0596313476562, -722.255126953125, -710.4505615234375, -698.6460571289062, -686.841552734375, -675.0369873046875, -663.2324829101562, -651.4279174804688, -639.6234130859375, -627.8189086914062, -616.0143432617188, -604.2098388671875, -592.4052734375, -580.6007690429688, -568.7962646484375, -556.99169921875, -545.1871948242188, -533.3826904296875, -521.578125, -509.77362060546875, -497.9690856933594, -486.16455078125, -474.36004638671875, -462.5555114746094, -450.7509765625, -438.9464416503906, -427.14190673828125, -415.33740234375, -403.5328674316406, -391.72833251953125, -379.923828125, -368.1192932128906, -356.3147277832031, -344.51019287109375, -332.7056884765625, -320.9011535644531, -309.09661865234375, -297.2920837402344, -285.487548828125, -273.68304443359375, -261.8785095214844, -250.073974609375, -238.2694549560547, -226.46493530273438, -214.660400390625, -202.85586547851562, -191.0513458251953, -179.246826171875, -167.44229125976562, -155.63775634765625, -143.83323669433594, -132.02871704101562, -120.22418212890625, -108.4196548461914, -96.61512756347656, -84.81060028076172, -73.0060806274414, -61.20155334472656, -49.39702606201172, -37.592498779296875, -25.78797149658203, -13.983444213867188, -2.1789169311523438, 9.6256103515625, 21.430137634277344]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 7.0, 8.0, 6.0, 7.0, 13.0, 9.0, 12.0, 18.0, 18.0, 16.0, 19.0, 18.0, 20.0, 23.0, 30.0, 32.0, 26.0, 40.0, 34.0, 33.0, 36.0, 39.0, 47.0, 44.0, 34.0, 43.0, 41.0, 36.0, 40.0, 30.0, 25.0, 29.0, 23.0, 18.0, 24.0, 14.0, 11.0, 10.0, 15.0, 15.0, 10.0, 12.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-100.83224487304688, -97.67776489257812, -94.52328491210938, -91.36880493164062, -88.21432495117188, -85.05984497070312, -81.90536499023438, -78.7508773803711, -75.59639739990234, -72.4419174194336, -69.28743743896484, -66.1329574584961, -62.97847366333008, -59.82399368286133, -56.66951370239258, -53.51502990722656, -50.36055374145508, -47.20607376098633, -44.05159378051758, -40.89710998535156, -37.74263000488281, -34.58815002441406, -31.433670043945312, -28.27918815612793, -25.12470817565918, -21.97022819519043, -18.815746307373047, -15.661266326904297, -12.50678539276123, -9.352304458618164, -6.197824478149414, -3.0433425903320312, 0.11113739013671875, 3.265618085861206, 6.420098781585693, 9.574579238891602, 12.729060173034668, 15.883541107177734, 19.038021087646484, 22.192502975463867, 25.346982955932617, 28.501462936401367, 31.65594482421875, 34.8104248046875, 37.96490478515625, 41.119384765625, 44.27386474609375, 47.428348541259766, 50.582828521728516, 53.737308502197266, 56.891788482666016, 60.04627227783203, 63.20075225830078, 66.35523223876953, 69.50971221923828, 72.66419219970703, 75.81867218017578, 78.97315216064453, 82.12763214111328, 85.28211212158203, 88.43659210205078, 91.59107971191406, 94.74555969238281, 97.90003967285156, 101.05451965332031]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 4.0, 0.0, 9.0, 9.0, 10.0, 12.0, 14.0, 20.0, 21.0, 23.0, 25.0, 28.0, 35.0, 38.0, 45.0, 43.0, 44.0, 44.0, 46.0, 32.0, 38.0, 47.0, 31.0, 44.0, 42.0, 30.0, 34.0, 28.0, 20.0, 30.0, 35.0, 18.0, 16.0, 15.0, 10.0, 11.0, 9.0, 7.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1640625, -8.873046875, -8.58203125, -8.291015625, -8.0, -7.708984375, -7.41796875, -7.126953125, -6.8359375, -6.544921875, -6.25390625, -5.962890625, -5.671875, -5.380859375, -5.08984375, -4.798828125, -4.5078125, -4.216796875, -3.92578125, -3.634765625, -3.34375, -3.052734375, -2.76171875, -2.470703125, -2.1796875, -1.888671875, -1.59765625, -1.306640625, -1.015625, -0.724609375, -0.43359375, -0.142578125, 0.1484375, 0.439453125, 0.73046875, 1.021484375, 1.3125, 1.603515625, 1.89453125, 2.185546875, 2.4765625, 2.767578125, 3.05859375, 3.349609375, 3.640625, 3.931640625, 4.22265625, 4.513671875, 4.8046875, 5.095703125, 5.38671875, 5.677734375, 5.96875, 6.259765625, 6.55078125, 6.841796875, 7.1328125, 7.423828125, 7.71484375, 8.005859375, 8.296875, 8.587890625, 8.87890625, 9.169921875, 9.4609375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 3.0, 5.0, 11.0, 10.0, 11.0, 15.0, 24.0, 34.0, 53.0, 61.0, 85.0, 144.0, 264.0, 566.0, 1344.0, 3917.0, 13828.0, 64074.0, 510883.0, 2425170.0, 1022268.0, 120576.0, 22006.0, 5667.0, 1744.0, 669.0, 291.0, 169.0, 110.0, 71.0, 51.0, 39.0, 26.0, 23.0, 19.0, 11.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.234375, -18.5859375, -17.9375, -17.2890625, -16.640625, -15.9921875, -15.34375, -14.6953125, -14.046875, -13.3984375, -12.75, -12.1015625, -11.453125, -10.8046875, -10.15625, -9.5078125, -8.859375, -8.2109375, -7.5625, -6.9140625, -6.265625, -5.6171875, -4.96875, -4.3203125, -3.671875, -3.0234375, -2.375, -1.7265625, -1.078125, -0.4296875, 0.21875, 0.8671875, 1.515625, 2.1640625, 2.8125, 3.4609375, 4.109375, 4.7578125, 5.40625, 6.0546875, 6.703125, 7.3515625, 8.0, 8.6484375, 9.296875, 9.9453125, 10.59375, 11.2421875, 11.890625, 12.5390625, 13.1875, 13.8359375, 14.484375, 15.1328125, 15.78125, 16.4296875, 17.078125, 17.7265625, 18.375, 19.0234375, 19.671875, 20.3203125, 20.96875, 21.6171875, 22.265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 3.0, 9.0, 12.0, 22.0, 27.0, 33.0, 53.0, 67.0, 88.0, 137.0, 166.0, 264.0, 321.0, 444.0, 539.0, 507.0, 373.0, 287.0, 192.0, 147.0, 121.0, 64.0, 55.0, 35.0, 25.0, 20.0, 18.0, 8.0, 9.0, 6.0, 5.0, 7.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.0625, -33.134765625, -32.20703125, -31.279296875, -30.3515625, -29.423828125, -28.49609375, -27.568359375, -26.640625, -25.712890625, -24.78515625, -23.857421875, -22.9296875, -22.001953125, -21.07421875, -20.146484375, -19.21875, -18.291015625, -17.36328125, -16.435546875, -15.5078125, -14.580078125, -13.65234375, -12.724609375, -11.796875, -10.869140625, -9.94140625, -9.013671875, -8.0859375, -7.158203125, -6.23046875, -5.302734375, -4.375, -3.447265625, -2.51953125, -1.591796875, -0.6640625, 0.263671875, 1.19140625, 2.119140625, 3.046875, 3.974609375, 4.90234375, 5.830078125, 6.7578125, 7.685546875, 8.61328125, 9.541015625, 10.46875, 11.396484375, 12.32421875, 13.251953125, 14.1796875, 15.107421875, 16.03515625, 16.962890625, 17.890625, 18.818359375, 19.74609375, 20.673828125, 21.6015625, 22.529296875, 23.45703125, 24.384765625, 25.3125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 12.0, 6.0, 20.0, 24.0, 25.0, 49.0, 56.0, 96.0, 135.0, 224.0, 515.0, 2631.0, 314692.0, 3863149.0, 10883.0, 921.0, 295.0, 191.0, 102.0, 75.0, 46.0, 42.0, 22.0, 23.0, 12.0, 12.0, 12.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.0, -118.7890625, -114.578125, -110.3671875, -106.15625, -101.9453125, -97.734375, -93.5234375, -89.3125, -85.1015625, -80.890625, -76.6796875, -72.46875, -68.2578125, -64.046875, -59.8359375, -55.625, -51.4140625, -47.203125, -42.9921875, -38.78125, -34.5703125, -30.359375, -26.1484375, -21.9375, -17.7265625, -13.515625, -9.3046875, -5.09375, -0.8828125, 3.328125, 7.5390625, 11.75, 15.9609375, 20.171875, 24.3828125, 28.59375, 32.8046875, 37.015625, 41.2265625, 45.4375, 49.6484375, 53.859375, 58.0703125, 62.28125, 66.4921875, 70.703125, 74.9140625, 79.125, 83.3359375, 87.546875, 91.7578125, 95.96875, 100.1796875, 104.390625, 108.6015625, 112.8125, 117.0234375, 121.234375, 125.4453125, 129.65625, 133.8671875, 138.078125, 142.2890625, 146.5]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 48.0, 192.0, 402.0, 283.0, 74.0, 11.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.11192321777344, -213.69786071777344, -202.28379821777344, -190.8697509765625, -179.4556884765625, -168.0416259765625, -156.6275634765625, -145.2135009765625, -133.7994384765625, -122.3853759765625, -110.9713134765625, -99.55725860595703, -88.14319610595703, -76.72913360595703, -65.31507873535156, -53.90101623535156, -42.48695373535156, -31.072893142700195, -19.658832550048828, -8.244773864746094, 3.1692886352539062, 14.583351135253906, 25.997406005859375, 37.411468505859375, 48.825531005859375, 60.239593505859375, 71.65365600585938, 83.06771087646484, 94.48177337646484, 105.89583587646484, 117.30989074707031, 128.7239532470703, 140.13803100585938, 151.55209350585938, 162.96615600585938, 174.38021850585938, 185.79428100585938, 197.20834350585938, 208.6223907470703, 220.0364532470703, 231.4505157470703, 242.8645782470703, 254.2786407470703, 265.69268798828125, 277.10675048828125, 288.52081298828125, 299.93487548828125, 311.34893798828125, 322.76300048828125, 334.17706298828125, 345.59112548828125, 357.00518798828125, 368.41925048828125, 379.83331298828125, 391.24737548828125, 402.66143798828125, 414.07550048828125, 425.48956298828125, 436.90362548828125, 448.31768798828125, 459.73175048828125, 471.14581298828125, 482.55987548828125, 493.97393798828125, 505.3879699707031]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 4.0, 8.0, 12.0, 10.0, 20.0, 13.0, 11.0, 16.0, 16.0, 21.0, 30.0, 26.0, 26.0, 23.0, 33.0, 30.0, 25.0, 30.0, 39.0, 40.0, 34.0, 40.0, 36.0, 34.0, 37.0, 35.0, 36.0, 29.0, 25.0, 27.0, 23.0, 24.0, 23.0, 27.0, 14.0, 11.0, 15.0, 11.0, 11.0, 9.0, 9.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-79.11333465576172, -76.68402099609375, -74.25470733642578, -71.82539367675781, -69.39608001708984, -66.96676635742188, -64.5374526977539, -62.1081428527832, -59.678829193115234, -57.249515533447266, -54.8202018737793, -52.39088821411133, -49.961578369140625, -47.532264709472656, -45.10295104980469, -42.67363739013672, -40.24432373046875, -37.81501007080078, -35.38569641113281, -32.956382751464844, -30.527070999145508, -28.09775733947754, -25.668445587158203, -23.239131927490234, -20.809818267822266, -18.380504608154297, -15.951191902160645, -13.521879196166992, -11.092565536499023, -8.663251876831055, -6.233939170837402, -3.80462646484375, -1.3753204345703125, 1.053992748260498, 3.4833059310913086, 5.912619113922119, 8.34193229675293, 10.771245956420898, 13.20055866241455, 15.629871368408203, 18.059185028076172, 20.48849868774414, 22.91781234741211, 25.347124099731445, 27.776437759399414, 30.205751419067383, 32.63506317138672, 35.06437683105469, 37.493690490722656, 39.923004150390625, 42.352317810058594, 44.78163146972656, 47.21094512939453, 49.6402587890625, 52.0695686340332, 54.49888229370117, 56.92819595336914, 59.35750961303711, 61.78682327270508, 64.21613311767578, 66.64544677734375, 69.07476043701172, 71.50407409667969, 73.93338775634766, 76.36270141601562]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 12.0, 11.0, 17.0, 22.0, 12.0, 12.0, 22.0, 27.0, 37.0, 32.0, 32.0, 47.0, 25.0, 45.0, 44.0, 47.0, 37.0, 45.0, 32.0, 40.0, 41.0, 31.0, 40.0, 34.0, 30.0, 34.0, 20.0, 14.0, 20.0, 32.0, 16.0, 15.0, 9.0, 6.0, 6.0, 6.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.2618408203125, -8.968994140625, -8.6761474609375, -8.38330078125, -8.0904541015625, -7.797607421875, -7.5047607421875, -7.2119140625, -6.9190673828125, -6.626220703125, -6.3333740234375, -6.04052734375, -5.7476806640625, -5.454833984375, -5.1619873046875, -4.869140625, -4.5762939453125, -4.283447265625, -3.9906005859375, -3.69775390625, -3.4049072265625, -3.112060546875, -2.8192138671875, -2.5263671875, -2.2335205078125, -1.940673828125, -1.6478271484375, -1.35498046875, -1.0621337890625, -0.769287109375, -0.4764404296875, -0.18359375, 0.1092529296875, 0.402099609375, 0.6949462890625, 0.98779296875, 1.2806396484375, 1.573486328125, 1.8663330078125, 2.1591796875, 2.4520263671875, 2.744873046875, 3.0377197265625, 3.33056640625, 3.6234130859375, 3.916259765625, 4.2091064453125, 4.501953125, 4.7947998046875, 5.087646484375, 5.3804931640625, 5.67333984375, 5.9661865234375, 6.259033203125, 6.5518798828125, 6.8447265625, 7.1375732421875, 7.430419921875, 7.7232666015625, 8.01611328125, 8.3089599609375, 8.601806640625, 8.8946533203125, 9.1875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 11.0, 16.0, 21.0, 29.0, 49.0, 78.0, 103.0, 142.0, 225.0, 307.0, 438.0, 649.0, 950.0, 1345.0, 1932.0, 2838.0, 4080.0, 5794.0, 8621.0, 12511.0, 18160.0, 25893.0, 38557.0, 56351.0, 82567.0, 120799.0, 169766.0, 156241.0, 106870.0, 73473.0, 50231.0, 34358.0, 23206.0, 16131.0, 11183.0, 7595.0, 5325.0, 3651.0, 2506.0, 1713.0, 1211.0, 791.0, 611.0, 396.0, 239.0, 208.0, 137.0, 84.0, 63.0, 31.0, 28.0, 17.0, 8.0, 10.0, 4.0, 5.0, 0.0, 2.0], "bins": [-0.94775390625, -0.9188995361328125, -0.890045166015625, -0.8611907958984375, -0.83233642578125, -0.8034820556640625, -0.774627685546875, -0.7457733154296875, -0.7169189453125, -0.6880645751953125, -0.659210205078125, -0.6303558349609375, -0.60150146484375, -0.5726470947265625, -0.543792724609375, -0.5149383544921875, -0.486083984375, -0.4572296142578125, -0.428375244140625, -0.3995208740234375, -0.37066650390625, -0.3418121337890625, -0.312957763671875, -0.2841033935546875, -0.2552490234375, -0.2263946533203125, -0.197540283203125, -0.1686859130859375, -0.13983154296875, -0.1109771728515625, -0.082122802734375, -0.0532684326171875, -0.0244140625, 0.0044403076171875, 0.033294677734375, 0.0621490478515625, 0.09100341796875, 0.1198577880859375, 0.148712158203125, 0.1775665283203125, 0.2064208984375, 0.2352752685546875, 0.264129638671875, 0.2929840087890625, 0.32183837890625, 0.3506927490234375, 0.379547119140625, 0.4084014892578125, 0.437255859375, 0.4661102294921875, 0.494964599609375, 0.5238189697265625, 0.55267333984375, 0.5815277099609375, 0.610382080078125, 0.6392364501953125, 0.6680908203125, 0.6969451904296875, 0.725799560546875, 0.7546539306640625, 0.78350830078125, 0.8123626708984375, 0.841217041015625, 0.8700714111328125, 0.89892578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 17.0, 8.0, 14.0, 16.0, 17.0, 20.0, 29.0, 27.0, 36.0, 32.0, 37.0, 41.0, 38.0, 48.0, 30.0, 53.0, 1076.0, 42.0, 46.0, 44.0, 36.0, 38.0, 33.0, 22.0, 33.0, 22.0, 22.0, 24.0, 17.0, 10.0, 15.0, 20.0, 8.0, 5.0, 8.0, 10.0, 3.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.9296875, -6.72760009765625, -6.5255126953125, -6.32342529296875, -6.121337890625, -5.91925048828125, -5.7171630859375, -5.51507568359375, -5.31298828125, -5.11090087890625, -4.9088134765625, -4.70672607421875, -4.504638671875, -4.30255126953125, -4.1004638671875, -3.89837646484375, -3.6962890625, -3.49420166015625, -3.2921142578125, -3.09002685546875, -2.887939453125, -2.68585205078125, -2.4837646484375, -2.28167724609375, -2.07958984375, -1.87750244140625, -1.6754150390625, -1.47332763671875, -1.271240234375, -1.06915283203125, -0.8670654296875, -0.66497802734375, -0.462890625, -0.26080322265625, -0.0587158203125, 0.14337158203125, 0.345458984375, 0.54754638671875, 0.7496337890625, 0.95172119140625, 1.15380859375, 1.35589599609375, 1.5579833984375, 1.76007080078125, 1.962158203125, 2.16424560546875, 2.3663330078125, 2.56842041015625, 2.7705078125, 2.97259521484375, 3.1746826171875, 3.37677001953125, 3.578857421875, 3.78094482421875, 3.9830322265625, 4.18511962890625, 4.38720703125, 4.58929443359375, 4.7913818359375, 4.99346923828125, 5.195556640625, 5.39764404296875, 5.5997314453125, 5.80181884765625, 6.00390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 12.0, 26.0, 45.0, 52.0, 102.0, 136.0, 271.0, 341.0, 541.0, 793.0, 1268.0, 2006.0, 3188.0, 5018.0, 7824.0, 12401.0, 20142.0, 31996.0, 51218.0, 83057.0, 140001.0, 1266897.0, 182766.0, 110152.0, 66142.0, 41294.0, 25725.0, 16086.0, 10133.0, 6321.0, 4072.0, 2557.0, 1616.0, 1029.0, 682.0, 443.0, 277.0, 175.0, 100.0, 73.0, 47.0, 36.0, 17.0, 19.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0419921875, -1.006988525390625, -0.97198486328125, -0.936981201171875, -0.9019775390625, -0.866973876953125, -0.83197021484375, -0.796966552734375, -0.761962890625, -0.726959228515625, -0.69195556640625, -0.656951904296875, -0.6219482421875, -0.586944580078125, -0.55194091796875, -0.516937255859375, -0.48193359375, -0.446929931640625, -0.41192626953125, -0.376922607421875, -0.3419189453125, -0.306915283203125, -0.27191162109375, -0.236907958984375, -0.201904296875, -0.166900634765625, -0.13189697265625, -0.096893310546875, -0.0618896484375, -0.026885986328125, 0.00811767578125, 0.043121337890625, 0.078125, 0.113128662109375, 0.14813232421875, 0.183135986328125, 0.2181396484375, 0.253143310546875, 0.28814697265625, 0.323150634765625, 0.358154296875, 0.393157958984375, 0.42816162109375, 0.463165283203125, 0.4981689453125, 0.533172607421875, 0.56817626953125, 0.603179931640625, 0.63818359375, 0.673187255859375, 0.70819091796875, 0.743194580078125, 0.7781982421875, 0.813201904296875, 0.84820556640625, 0.883209228515625, 0.918212890625, 0.953216552734375, 0.98822021484375, 1.023223876953125, 1.0582275390625, 1.093231201171875, 1.12823486328125, 1.163238525390625, 1.1982421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 7.0, 5.0, 15.0, 8.0, 10.0, 13.0, 15.0, 22.0, 28.0, 35.0, 45.0, 43.0, 53.0, 70.0, 70.0, 75.0, 75.0, 53.0, 57.0, 59.0, 45.0, 36.0, 34.0, 26.0, 29.0, 10.0, 15.0, 12.0, 10.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002468109130859375, -0.002392321825027466, -0.0023165345191955566, -0.0022407472133636475, -0.0021649599075317383, -0.002089172601699829, -0.00201338529586792, -0.0019375979900360107, -0.0018618106842041016, -0.0017860233783721924, -0.0017102360725402832, -0.001634448766708374, -0.0015586614608764648, -0.0014828741550445557, -0.0014070868492126465, -0.0013312995433807373, -0.0012555122375488281, -0.001179724931716919, -0.0011039376258850098, -0.0010281503200531006, -0.0009523630142211914, -0.0008765757083892822, -0.000800788402557373, -0.0007250010967254639, -0.0006492137908935547, -0.0005734264850616455, -0.0004976391792297363, -0.00042185187339782715, -0.00034606456756591797, -0.0002702772617340088, -0.0001944899559020996, -0.00011870265007019043, -4.291534423828125e-05, 3.287196159362793e-05, 0.00010865926742553711, 0.0001844465732574463, 0.00026023387908935547, 0.00033602118492126465, 0.00041180849075317383, 0.000487595796585083, 0.0005633831024169922, 0.0006391704082489014, 0.0007149577140808105, 0.0007907450199127197, 0.0008665323257446289, 0.0009423196315765381, 0.0010181069374084473, 0.0010938942432403564, 0.0011696815490722656, 0.0012454688549041748, 0.001321256160736084, 0.0013970434665679932, 0.0014728307723999023, 0.0015486180782318115, 0.0016244053840637207, 0.0017001926898956299, 0.001775979995727539, 0.0018517673015594482, 0.0019275546073913574, 0.0020033419132232666, 0.0020791292190551758, 0.002154916524887085, 0.002230703830718994, 0.0023064911365509033, 0.0023822784423828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 6.0, 2.0, 8.0, 21.0, 22.0, 29.0, 30.0, 39.0, 47.0, 78.0, 101.0, 205.0, 334.0, 890.0, 521007.0, 523917.0, 916.0, 324.0, 194.0, 106.0, 80.0, 44.0, 36.0, 28.0, 15.0, 13.0, 8.0, 10.0, 7.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0584716796875, -0.056644439697265625, -0.05481719970703125, -0.052989959716796875, -0.0511627197265625, -0.049335479736328125, -0.04750823974609375, -0.045680999755859375, -0.043853759765625, -0.042026519775390625, -0.04019927978515625, -0.038372039794921875, -0.0365447998046875, -0.034717559814453125, -0.03289031982421875, -0.031063079833984375, -0.02923583984375, -0.027408599853515625, -0.02558135986328125, -0.023754119873046875, -0.0219268798828125, -0.020099639892578125, -0.01827239990234375, -0.016445159912109375, -0.014617919921875, -0.012790679931640625, -0.01096343994140625, -0.009136199951171875, -0.0073089599609375, -0.005481719970703125, -0.00365447998046875, -0.001827239990234375, 0.0, 0.001827239990234375, 0.00365447998046875, 0.005481719970703125, 0.0073089599609375, 0.009136199951171875, 0.01096343994140625, 0.012790679931640625, 0.014617919921875, 0.016445159912109375, 0.01827239990234375, 0.020099639892578125, 0.0219268798828125, 0.023754119873046875, 0.02558135986328125, 0.027408599853515625, 0.02923583984375, 0.031063079833984375, 0.03289031982421875, 0.034717559814453125, 0.0365447998046875, 0.038372039794921875, 0.04019927978515625, 0.042026519775390625, 0.043853759765625, 0.045680999755859375, 0.04750823974609375, 0.049335479736328125, 0.0511627197265625, 0.052989959716796875, 0.05481719970703125, 0.056644439697265625, 0.0584716796875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 28.0, 279.0, 607.0, 93.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027603129856288433, -0.0025665361899882555, -0.0023727596271783113, -0.0021789828315377235, -0.0019852062687277794, -0.0017914294730871916, -0.0015976526774466038, -0.0014038759982213378, -0.0012100993189960718, -0.0010163226397708058, -0.0008225459023378789, -0.000628769164904952, -0.00043499248567968607, -0.0002412158064544201, -4.743901081383228e-05, 0.0001463376684114337, 0.0003401143476366997, 0.0005338910268619657, 0.0007276677642948925, 0.0009214445017278194, 0.0011152211809530854, 0.0013089978601783514, 0.0015027746558189392, 0.0016965513350442052, 0.0018903280142694712, 0.002084104809910059, 0.002277881372720003, 0.002471658168360591, 0.0026654349640011787, 0.002859211526811123, 0.0030529883224517107, 0.0032467651180922985, 0.0034405412152409554, 0.003634318010881543, 0.0038280945736914873, 0.004021871369332075, 0.004215647932142019, 0.004409424960613251, 0.004603201523423195, 0.004796978086233139, 0.004990754649043083, 0.005184531211853027, 0.005378308240324259, 0.005572084803134203, 0.005765861365944147, 0.005959638394415379, 0.006153414957225323, 0.006347191520035267, 0.006540968548506498, 0.0067347451113164425, 0.006928522139787674, 0.007122298702597618, 0.007316075265407562, 0.007509851828217506, 0.007703628856688738, 0.00789740588515997, 0.008091182447969913, 0.008284959010779858, 0.008478735573589802, 0.00867251306772232, 0.008866289630532265, 0.009060066193342209, 0.009253842756152153, 0.009447619318962097, 0.009641395881772041]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 3.0, 9.0, 16.0, 7.0, 10.0, 8.0, 9.0, 20.0, 25.0, 14.0, 23.0, 33.0, 36.0, 23.0, 34.0, 35.0, 41.0, 37.0, 37.0, 45.0, 41.0, 44.0, 37.0, 43.0, 43.0, 31.0, 26.0, 32.0, 33.0, 20.0, 26.0, 18.0, 26.0, 15.0, 12.0, 18.0, 14.0, 6.0, 9.0, 4.0, 9.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.001100778579711914, -0.001066124066710472, -0.0010314695537090302, -0.0009968150407075882, -0.0009621605277061462, -0.0009275060147047043, -0.0008928515017032623, -0.0008581969887018204, -0.0008235424757003784, -0.0007888879626989365, -0.0007542334496974945, -0.0007195789366960526, -0.0006849244236946106, -0.0006502699106931686, -0.0006156153976917267, -0.0005809608846902847, -0.0005463063716888428, -0.0005116518586874008, -0.00047699734568595886, -0.0004423428326845169, -0.00040768831968307495, -0.000373033806681633, -0.00033837929368019104, -0.0003037247806787491, -0.00026907026767730713, -0.00023441575467586517, -0.00019976124167442322, -0.00016510672867298126, -0.0001304522156715393, -9.579770267009735e-05, -6.11431896686554e-05, -2.648867666721344e-05, 8.165836334228516e-06, 4.282034933567047e-05, 7.747486233711243e-05, 0.00011212937533855438, 0.00014678388833999634, 0.0001814384013414383, 0.00021609291434288025, 0.0002507474273443222, 0.00028540194034576416, 0.0003200564533472061, 0.00035471096634864807, 0.00038936547935009, 0.000424019992351532, 0.00045867450535297394, 0.0004933290183544159, 0.0005279835313558578, 0.0005626380443572998, 0.0005972925573587418, 0.0006319470703601837, 0.0006666015833616257, 0.0007012560963630676, 0.0007359106093645096, 0.0007705651223659515, 0.0008052196353673935, 0.0008398741483688354, 0.0008745286613702774, 0.0009091831743717194, 0.0009438376873731613, 0.0009784922003746033, 0.0010131467133760452, 0.0010478012263774872, 0.0010824557393789291, 0.001117110252380371]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 12.0, 11.0, 17.0, 22.0, 12.0, 12.0, 22.0, 27.0, 37.0, 32.0, 32.0, 48.0, 24.0, 45.0, 44.0, 47.0, 37.0, 46.0, 31.0, 41.0, 40.0, 31.0, 41.0, 35.0, 28.0, 34.0, 20.0, 14.0, 20.0, 33.0, 16.0, 14.0, 9.0, 6.0, 6.0, 7.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.26171875, -8.96875, -8.67578125, -8.3828125, -8.08984375, -7.796875, -7.50390625, -7.2109375, -6.91796875, -6.625, -6.33203125, -6.0390625, -5.74609375, -5.453125, -5.16015625, -4.8671875, -4.57421875, -4.28125, -3.98828125, -3.6953125, -3.40234375, -3.109375, -2.81640625, -2.5234375, -2.23046875, -1.9375, -1.64453125, -1.3515625, -1.05859375, -0.765625, -0.47265625, -0.1796875, 0.11328125, 0.40625, 0.69921875, 0.9921875, 1.28515625, 1.578125, 1.87109375, 2.1640625, 2.45703125, 2.75, 3.04296875, 3.3359375, 3.62890625, 3.921875, 4.21484375, 4.5078125, 4.80078125, 5.09375, 5.38671875, 5.6796875, 5.97265625, 6.265625, 6.55859375, 6.8515625, 7.14453125, 7.4375, 7.73046875, 8.0234375, 8.31640625, 8.609375, 8.90234375, 9.1953125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 10.0, 12.0, 16.0, 21.0, 35.0, 45.0, 72.0, 98.0, 154.0, 217.0, 293.0, 433.0, 693.0, 1020.0, 1576.0, 2622.0, 4616.0, 8802.0, 18525.0, 46576.0, 143571.0, 398867.0, 275266.0, 85650.0, 30200.0, 13036.0, 6580.0, 3584.0, 2053.0, 1296.0, 810.0, 569.0, 388.0, 242.0, 215.0, 112.0, 92.0, 65.0, 42.0, 25.0, 17.0, 19.0, 10.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.0555419921875, -5.864990234375, -5.6744384765625, -5.48388671875, -5.2933349609375, -5.102783203125, -4.9122314453125, -4.7216796875, -4.5311279296875, -4.340576171875, -4.1500244140625, -3.95947265625, -3.7689208984375, -3.578369140625, -3.3878173828125, -3.197265625, -3.0067138671875, -2.816162109375, -2.6256103515625, -2.43505859375, -2.2445068359375, -2.053955078125, -1.8634033203125, -1.6728515625, -1.4822998046875, -1.291748046875, -1.1011962890625, -0.91064453125, -0.7200927734375, -0.529541015625, -0.3389892578125, -0.1484375, 0.0421142578125, 0.232666015625, 0.4232177734375, 0.61376953125, 0.8043212890625, 0.994873046875, 1.1854248046875, 1.3759765625, 1.5665283203125, 1.757080078125, 1.9476318359375, 2.13818359375, 2.3287353515625, 2.519287109375, 2.7098388671875, 2.900390625, 3.0909423828125, 3.281494140625, 3.4720458984375, 3.66259765625, 3.8531494140625, 4.043701171875, 4.2342529296875, 4.4248046875, 4.6153564453125, 4.805908203125, 4.9964599609375, 5.18701171875, 5.3775634765625, 5.568115234375, 5.7586669921875, 5.94921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 11.0, 9.0, 14.0, 12.0, 12.0, 22.0, 17.0, 23.0, 24.0, 31.0, 24.0, 29.0, 33.0, 37.0, 33.0, 51.0, 57.0, 115.0, 1701.0, 281.0, 85.0, 55.0, 47.0, 49.0, 37.0, 31.0, 27.0, 30.0, 17.0, 18.0, 18.0, 14.0, 16.0, 7.0, 9.0, 7.0, 6.0, 10.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.75, -30.68359375, -29.6171875, -28.55078125, -27.484375, -26.41796875, -25.3515625, -24.28515625, -23.21875, -22.15234375, -21.0859375, -20.01953125, -18.953125, -17.88671875, -16.8203125, -15.75390625, -14.6875, -13.62109375, -12.5546875, -11.48828125, -10.421875, -9.35546875, -8.2890625, -7.22265625, -6.15625, -5.08984375, -4.0234375, -2.95703125, -1.890625, -0.82421875, 0.2421875, 1.30859375, 2.375, 3.44140625, 4.5078125, 5.57421875, 6.640625, 7.70703125, 8.7734375, 9.83984375, 10.90625, 11.97265625, 13.0390625, 14.10546875, 15.171875, 16.23828125, 17.3046875, 18.37109375, 19.4375, 20.50390625, 21.5703125, 22.63671875, 23.703125, 24.76953125, 25.8359375, 26.90234375, 27.96875, 29.03515625, 30.1015625, 31.16796875, 32.234375, 33.30078125, 34.3671875, 35.43359375, 36.5]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 9.0, 10.0, 7.0, 7.0, 6.0, 9.0, 15.0, 16.0, 23.0, 20.0, 23.0, 47.0, 50.0, 87.0, 101.0, 153.0, 242.0, 576.0, 2035.0, 54223.0, 3071162.0, 14386.0, 1233.0, 427.0, 240.0, 147.0, 101.0, 69.0, 56.0, 40.0, 34.0, 22.0, 21.0, 19.0, 17.0, 15.0, 10.0, 12.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-58.78125, -57.01904296875, -55.2568359375, -53.49462890625, -51.732421875, -49.97021484375, -48.2080078125, -46.44580078125, -44.68359375, -42.92138671875, -41.1591796875, -39.39697265625, -37.634765625, -35.87255859375, -34.1103515625, -32.34814453125, -30.5859375, -28.82373046875, -27.0615234375, -25.29931640625, -23.537109375, -21.77490234375, -20.0126953125, -18.25048828125, -16.48828125, -14.72607421875, -12.9638671875, -11.20166015625, -9.439453125, -7.67724609375, -5.9150390625, -4.15283203125, -2.390625, -0.62841796875, 1.1337890625, 2.89599609375, 4.658203125, 6.42041015625, 8.1826171875, 9.94482421875, 11.70703125, 13.46923828125, 15.2314453125, 16.99365234375, 18.755859375, 20.51806640625, 22.2802734375, 24.04248046875, 25.8046875, 27.56689453125, 29.3291015625, 31.09130859375, 32.853515625, 34.61572265625, 36.3779296875, 38.14013671875, 39.90234375, 41.66455078125, 43.4267578125, 45.18896484375, 46.951171875, 48.71337890625, 50.4755859375, 52.23779296875, 54.0]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 64.0, 306.0, 440.0, 162.0, 30.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.47980499267578, -37.180206298828125, -33.8806037902832, -30.581003189086914, -27.281402587890625, -23.981801986694336, -20.682201385498047, -17.382600784301758, -14.083000183105469, -10.78339958190918, -7.483798980712891, -4.184198379516602, -0.8845977783203125, 2.4150028228759766, 5.714603424072266, 9.014204025268555, 12.313804626464844, 15.613405227661133, 18.913005828857422, 22.21260643005371, 25.51220703125, 28.81180763244629, 32.11140823364258, 35.4110107421875, 38.710609436035156, 42.01020812988281, 45.309810638427734, 48.609413146972656, 51.90901184082031, 55.20861053466797, 58.50821304321289, 61.80781555175781, 65.10740661621094, 68.4070053100586, 71.70660400390625, 75.00621032714844, 78.3058090209961, 81.60540771484375, 84.90501403808594, 88.2046127319336, 91.50421142578125, 94.8038101196289, 98.10340881347656, 101.40301513671875, 104.7026138305664, 108.00221252441406, 111.30181884765625, 114.6014175415039, 117.90101623535156, 121.20061492919922, 124.50021362304688, 127.79981994628906, 131.09942626953125, 134.39901733398438, 137.69862365722656, 140.9982147216797, 144.29782104492188, 147.59742736816406, 150.8970184326172, 154.19662475585938, 157.4962158203125, 160.7958221435547, 164.09542846679688, 167.39501953125, 170.6946258544922]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 8.0, 20.0, 20.0, 20.0, 17.0, 16.0, 41.0, 32.0, 30.0, 41.0, 47.0, 31.0, 49.0, 49.0, 54.0, 51.0, 51.0, 51.0, 44.0, 41.0, 38.0, 35.0, 25.0, 29.0, 23.0, 26.0, 18.0, 13.0, 8.0, 12.0, 9.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-140.05441284179688, -136.0807647705078, -132.1071014404297, -128.13345336914062, -124.15980529785156, -120.18614959716797, -116.21249389648438, -112.23884582519531, -108.26519012451172, -104.29153442382812, -100.31788635253906, -96.34423065185547, -92.3705825805664, -88.39692687988281, -84.42327880859375, -80.44962310791016, -76.47596740722656, -72.50231170654297, -68.5286636352539, -64.55500793457031, -60.581356048583984, -56.607704162597656, -52.63405227661133, -48.660400390625, -44.68675231933594, -40.71310043334961, -36.73944854736328, -32.76579284667969, -28.79214096069336, -24.81848907470703, -20.844837188720703, -16.871183395385742, -12.897529602050781, -8.923876762390137, -4.95022439956665, -0.9765720367431641, 2.9970808029174805, 6.970733642578125, 10.944385528564453, 14.918039321899414, 18.891691207885742, 22.86534309387207, 26.83899688720703, 30.81264877319336, 34.78630065917969, 38.75995635986328, 42.733604431152344, 46.70726013183594, 50.680912017822266, 54.654563903808594, 58.62821578979492, 62.60186767578125, 66.57552337646484, 70.54917907714844, 74.5228271484375, 78.4964828491211, 82.47013092041016, 86.44378662109375, 90.41743469238281, 94.3910903930664, 98.36473846435547, 102.33839416503906, 106.31204223632812, 110.28569793701172, 114.25935363769531]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 6.0, 2.0, 3.0, 5.0, 9.0, 11.0, 11.0, 9.0, 24.0, 14.0, 22.0, 16.0, 20.0, 31.0, 35.0, 39.0, 26.0, 43.0, 35.0, 45.0, 46.0, 47.0, 41.0, 41.0, 33.0, 34.0, 36.0, 35.0, 44.0, 33.0, 27.0, 25.0, 21.0, 15.0, 27.0, 26.0, 10.0, 12.0, 6.0, 5.0, 10.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.6373291015625, -9.337158203125, -9.0369873046875, -8.73681640625, -8.4366455078125, -8.136474609375, -7.8363037109375, -7.5361328125, -7.2359619140625, -6.935791015625, -6.6356201171875, -6.33544921875, -6.0352783203125, -5.735107421875, -5.4349365234375, -5.134765625, -4.8345947265625, -4.534423828125, -4.2342529296875, -3.93408203125, -3.6339111328125, -3.333740234375, -3.0335693359375, -2.7333984375, -2.4332275390625, -2.133056640625, -1.8328857421875, -1.53271484375, -1.2325439453125, -0.932373046875, -0.6322021484375, -0.33203125, -0.0318603515625, 0.268310546875, 0.5684814453125, 0.86865234375, 1.1688232421875, 1.468994140625, 1.7691650390625, 2.0693359375, 2.3695068359375, 2.669677734375, 2.9698486328125, 3.27001953125, 3.5701904296875, 3.870361328125, 4.1705322265625, 4.470703125, 4.7708740234375, 5.071044921875, 5.3712158203125, 5.67138671875, 5.9715576171875, 6.271728515625, 6.5718994140625, 6.8720703125, 7.1722412109375, 7.472412109375, 7.7725830078125, 8.07275390625, 8.3729248046875, 8.673095703125, 8.9732666015625, 9.2734375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 8.0, 6.0, 9.0, 12.0, 8.0, 17.0, 19.0, 15.0, 20.0, 43.0, 58.0, 70.0, 122.0, 188.0, 417.0, 1097.0, 4249.0, 24331.0, 293518.0, 2963479.0, 844751.0, 51468.0, 7459.0, 1680.0, 522.0, 227.0, 135.0, 111.0, 49.0, 37.0, 28.0, 25.0, 21.0, 13.0, 14.0, 13.0, 11.0, 7.0, 6.0, 8.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.796875, -30.8525390625, -29.908203125, -28.9638671875, -28.01953125, -27.0751953125, -26.130859375, -25.1865234375, -24.2421875, -23.2978515625, -22.353515625, -21.4091796875, -20.46484375, -19.5205078125, -18.576171875, -17.6318359375, -16.6875, -15.7431640625, -14.798828125, -13.8544921875, -12.91015625, -11.9658203125, -11.021484375, -10.0771484375, -9.1328125, -8.1884765625, -7.244140625, -6.2998046875, -5.35546875, -4.4111328125, -3.466796875, -2.5224609375, -1.578125, -0.6337890625, 0.310546875, 1.2548828125, 2.19921875, 3.1435546875, 4.087890625, 5.0322265625, 5.9765625, 6.9208984375, 7.865234375, 8.8095703125, 9.75390625, 10.6982421875, 11.642578125, 12.5869140625, 13.53125, 14.4755859375, 15.419921875, 16.3642578125, 17.30859375, 18.2529296875, 19.197265625, 20.1416015625, 21.0859375, 22.0302734375, 22.974609375, 23.9189453125, 24.86328125, 25.8076171875, 26.751953125, 27.6962890625, 28.640625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 10.0, 11.0, 14.0, 26.0, 30.0, 48.0, 61.0, 81.0, 118.0, 153.0, 273.0, 348.0, 424.0, 548.0, 469.0, 400.0, 295.0, 193.0, 164.0, 117.0, 85.0, 60.0, 39.0, 27.0, 31.0, 12.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0625, -31.112548828125, -30.16259765625, -29.212646484375, -28.2626953125, -27.312744140625, -26.36279296875, -25.412841796875, -24.462890625, -23.512939453125, -22.56298828125, -21.613037109375, -20.6630859375, -19.713134765625, -18.76318359375, -17.813232421875, -16.86328125, -15.913330078125, -14.96337890625, -14.013427734375, -13.0634765625, -12.113525390625, -11.16357421875, -10.213623046875, -9.263671875, -8.313720703125, -7.36376953125, -6.413818359375, -5.4638671875, -4.513916015625, -3.56396484375, -2.614013671875, -1.6640625, -0.714111328125, 0.23583984375, 1.185791015625, 2.1357421875, 3.085693359375, 4.03564453125, 4.985595703125, 5.935546875, 6.885498046875, 7.83544921875, 8.785400390625, 9.7353515625, 10.685302734375, 11.63525390625, 12.585205078125, 13.53515625, 14.485107421875, 15.43505859375, 16.385009765625, 17.3349609375, 18.284912109375, 19.23486328125, 20.184814453125, 21.134765625, 22.084716796875, 23.03466796875, 23.984619140625, 24.9345703125, 25.884521484375, 26.83447265625, 27.784423828125, 28.734375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 13.0, 10.0, 26.0, 30.0, 51.0, 59.0, 89.0, 139.0, 232.0, 441.0, 995.0, 7063.0, 1483539.0, 2689938.0, 9347.0, 1150.0, 467.0, 237.0, 150.0, 92.0, 67.0, 41.0, 30.0, 15.0, 12.0, 15.0, 8.0, 11.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.6875, -91.0517578125, -87.416015625, -83.7802734375, -80.14453125, -76.5087890625, -72.873046875, -69.2373046875, -65.6015625, -61.9658203125, -58.330078125, -54.6943359375, -51.05859375, -47.4228515625, -43.787109375, -40.1513671875, -36.515625, -32.8798828125, -29.244140625, -25.6083984375, -21.97265625, -18.3369140625, -14.701171875, -11.0654296875, -7.4296875, -3.7939453125, -0.158203125, 3.4775390625, 7.11328125, 10.7490234375, 14.384765625, 18.0205078125, 21.65625, 25.2919921875, 28.927734375, 32.5634765625, 36.19921875, 39.8349609375, 43.470703125, 47.1064453125, 50.7421875, 54.3779296875, 58.013671875, 61.6494140625, 65.28515625, 68.9208984375, 72.556640625, 76.1923828125, 79.828125, 83.4638671875, 87.099609375, 90.7353515625, 94.37109375, 98.0068359375, 101.642578125, 105.2783203125, 108.9140625, 112.5498046875, 116.185546875, 119.8212890625, 123.45703125, 127.0927734375, 130.728515625, 134.3642578125, 138.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 10.0, 15.0, 42.0, 80.0, 135.0, 200.0, 204.0, 155.0, 73.0, 57.0, 20.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.28968811035156, -106.3785629272461, -100.46743774414062, -94.55632019042969, -88.64519500732422, -82.73406982421875, -76.82295227050781, -70.91182708740234, -65.00070190429688, -59.089576721191406, -53.1784553527832, -47.267333984375, -41.35620880126953, -35.44508361816406, -29.53396224975586, -23.622840881347656, -17.711715698242188, -11.800592422485352, -5.889469146728516, 0.021654129028320312, 5.932777404785156, 11.843900680541992, 17.755023956298828, 23.66614532470703, 29.5772705078125, 35.48839569091797, 41.39951705932617, 47.310638427734375, 53.221763610839844, 59.13288879394531, 65.04400634765625, 70.95513153076172, 76.86624145507812, 82.7773666381836, 88.68849182128906, 94.599609375, 100.51073455810547, 106.42185974121094, 112.33297729492188, 118.24410247802734, 124.15522766113281, 130.06634521484375, 135.97747802734375, 141.8885955810547, 147.79971313476562, 153.71084594726562, 159.62196350097656, 165.5330810546875, 171.4442138671875, 177.35533142089844, 183.26646423339844, 189.17758178710938, 195.08871459960938, 200.9998321533203, 206.91094970703125, 212.82208251953125, 218.7332000732422, 224.64431762695312, 230.55545043945312, 236.46656799316406, 242.377685546875, 248.288818359375, 254.19993591308594, 260.1110534667969, 266.0221862792969]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 6.0, 5.0, 9.0, 6.0, 23.0, 7.0, 19.0, 12.0, 20.0, 17.0, 34.0, 33.0, 36.0, 45.0, 36.0, 44.0, 33.0, 39.0, 48.0, 40.0, 43.0, 47.0, 30.0, 43.0, 30.0, 36.0, 49.0, 29.0, 28.0, 14.0, 30.0, 17.0, 12.0, 7.0, 8.0, 11.0, 13.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-98.94590759277344, -96.07748413085938, -93.20905303955078, -90.34062957763672, -87.47219848632812, -84.60377502441406, -81.7353515625, -78.86692810058594, -75.99849700927734, -73.13007354736328, -70.26164245605469, -67.39321899414062, -64.52479553222656, -61.65636444091797, -58.787940979003906, -55.91951370239258, -53.05108642578125, -50.18265914916992, -47.314231872558594, -44.44580841064453, -41.5773811340332, -38.708953857421875, -35.84053039550781, -32.972103118896484, -30.103675842285156, -27.235248565673828, -24.366823196411133, -21.498397827148438, -18.62997055053711, -15.761544227600098, -12.893117904663086, -10.02469253540039, -7.1562652587890625, -4.287838935852051, -1.419412612915039, 1.4490137100219727, 4.317440032958984, 7.185866355895996, 10.054292678833008, 12.922718048095703, 15.791145324707031, 18.65957260131836, 21.527997970581055, 24.39642333984375, 27.264850616455078, 30.133277893066406, 33.00170135498047, 35.8701286315918, 38.738555908203125, 41.60698318481445, 44.47541046142578, 47.343833923339844, 50.21226119995117, 53.0806884765625, 55.94911193847656, 58.81753921508789, 61.68596649169922, 64.55438995361328, 67.42282104492188, 70.29124450683594, 73.15966796875, 76.0280990600586, 78.89652252197266, 81.76495361328125, 84.63337707519531]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 5.0, 3.0, 7.0, 11.0, 13.0, 6.0, 4.0, 12.0, 14.0, 29.0, 18.0, 13.0, 45.0, 31.0, 28.0, 42.0, 40.0, 37.0, 31.0, 44.0, 54.0, 44.0, 47.0, 32.0, 37.0, 38.0, 36.0, 36.0, 37.0, 27.0, 20.0, 19.0, 23.0, 26.0, 16.0, 17.0, 10.0, 14.0, 5.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.75, -10.4354248046875, -10.120849609375, -9.8062744140625, -9.49169921875, -9.1771240234375, -8.862548828125, -8.5479736328125, -8.2333984375, -7.9188232421875, -7.604248046875, -7.2896728515625, -6.97509765625, -6.6605224609375, -6.345947265625, -6.0313720703125, -5.716796875, -5.4022216796875, -5.087646484375, -4.7730712890625, -4.45849609375, -4.1439208984375, -3.829345703125, -3.5147705078125, -3.2001953125, -2.8856201171875, -2.571044921875, -2.2564697265625, -1.94189453125, -1.6273193359375, -1.312744140625, -0.9981689453125, -0.68359375, -0.3690185546875, -0.054443359375, 0.2601318359375, 0.57470703125, 0.8892822265625, 1.203857421875, 1.5184326171875, 1.8330078125, 2.1475830078125, 2.462158203125, 2.7767333984375, 3.09130859375, 3.4058837890625, 3.720458984375, 4.0350341796875, 4.349609375, 4.6641845703125, 4.978759765625, 5.2933349609375, 5.60791015625, 5.9224853515625, 6.237060546875, 6.5516357421875, 6.8662109375, 7.1807861328125, 7.495361328125, 7.8099365234375, 8.12451171875, 8.4390869140625, 8.753662109375, 9.0682373046875, 9.3828125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 16.0, 20.0, 23.0, 26.0, 56.0, 66.0, 106.0, 144.0, 220.0, 327.0, 513.0, 828.0, 1216.0, 1777.0, 2580.0, 3832.0, 5814.0, 8481.0, 12775.0, 18458.0, 27173.0, 39387.0, 57793.0, 85766.0, 127131.0, 180532.0, 154089.0, 102445.0, 69165.0, 47144.0, 32448.0, 22216.0, 15057.0, 9991.0, 6831.0, 4618.0, 3081.0, 2026.0, 1385.0, 920.0, 697.0, 438.0, 299.0, 233.0, 139.0, 109.0, 48.0, 41.0, 25.0, 20.0, 14.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0], "bins": [-1.0400390625, -1.0082626342773438, -0.9764862060546875, -0.9447097778320312, -0.912933349609375, -0.8811569213867188, -0.8493804931640625, -0.8176040649414062, -0.78582763671875, -0.7540512084960938, -0.7222747802734375, -0.6904983520507812, -0.658721923828125, -0.6269454956054688, -0.5951690673828125, -0.5633926391601562, -0.5316162109375, -0.49983978271484375, -0.4680633544921875, -0.43628692626953125, -0.404510498046875, -0.37273406982421875, -0.3409576416015625, -0.30918121337890625, -0.27740478515625, -0.24562835693359375, -0.2138519287109375, -0.18207550048828125, -0.150299072265625, -0.11852264404296875, -0.0867462158203125, -0.05496978759765625, -0.023193359375, 0.00858306884765625, 0.0403594970703125, 0.07213592529296875, 0.103912353515625, 0.13568878173828125, 0.1674652099609375, 0.19924163818359375, 0.23101806640625, 0.26279449462890625, 0.2945709228515625, 0.32634735107421875, 0.358123779296875, 0.38990020751953125, 0.4216766357421875, 0.45345306396484375, 0.4852294921875, 0.5170059204101562, 0.5487823486328125, 0.5805587768554688, 0.612335205078125, 0.6441116333007812, 0.6758880615234375, 0.7076644897460938, 0.73944091796875, 0.7712173461914062, 0.8029937744140625, 0.8347702026367188, 0.866546630859375, 0.8983230590820312, 0.9300994873046875, 0.9618759155273438, 0.99365234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 14.0, 9.0, 10.0, 20.0, 28.0, 18.0, 36.0, 21.0, 29.0, 38.0, 39.0, 37.0, 55.0, 35.0, 64.0, 27.0, 1060.0, 44.0, 37.0, 51.0, 45.0, 37.0, 32.0, 37.0, 19.0, 22.0, 34.0, 20.0, 16.0, 17.0, 17.0, 9.0, 12.0, 9.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.94140625, -6.7247314453125, -6.508056640625, -6.2913818359375, -6.07470703125, -5.8580322265625, -5.641357421875, -5.4246826171875, -5.2080078125, -4.9913330078125, -4.774658203125, -4.5579833984375, -4.34130859375, -4.1246337890625, -3.907958984375, -3.6912841796875, -3.474609375, -3.2579345703125, -3.041259765625, -2.8245849609375, -2.60791015625, -2.3912353515625, -2.174560546875, -1.9578857421875, -1.7412109375, -1.5245361328125, -1.307861328125, -1.0911865234375, -0.87451171875, -0.6578369140625, -0.441162109375, -0.2244873046875, -0.0078125, 0.2088623046875, 0.425537109375, 0.6422119140625, 0.85888671875, 1.0755615234375, 1.292236328125, 1.5089111328125, 1.7255859375, 1.9422607421875, 2.158935546875, 2.3756103515625, 2.59228515625, 2.8089599609375, 3.025634765625, 3.2423095703125, 3.458984375, 3.6756591796875, 3.892333984375, 4.1090087890625, 4.32568359375, 4.5423583984375, 4.759033203125, 4.9757080078125, 5.1923828125, 5.4090576171875, 5.625732421875, 5.8424072265625, 6.05908203125, 6.2757568359375, 6.492431640625, 6.7091064453125, 6.92578125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 19.0, 29.0, 34.0, 43.0, 60.0, 101.0, 161.0, 257.0, 349.0, 496.0, 781.0, 1287.0, 1908.0, 3037.0, 4620.0, 7308.0, 11706.0, 18598.0, 29776.0, 48119.0, 77305.0, 126279.0, 1078181.0, 357875.0, 124513.0, 77037.0, 47588.0, 29412.0, 18265.0, 11544.0, 7299.0, 4649.0, 2996.0, 1931.0, 1222.0, 774.0, 513.0, 379.0, 224.0, 150.0, 86.0, 63.0, 50.0, 37.0, 19.0, 16.0, 8.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.171875, -1.1363525390625, -1.100830078125, -1.0653076171875, -1.02978515625, -0.9942626953125, -0.958740234375, -0.9232177734375, -0.8876953125, -0.8521728515625, -0.816650390625, -0.7811279296875, -0.74560546875, -0.7100830078125, -0.674560546875, -0.6390380859375, -0.603515625, -0.5679931640625, -0.532470703125, -0.4969482421875, -0.46142578125, -0.4259033203125, -0.390380859375, -0.3548583984375, -0.3193359375, -0.2838134765625, -0.248291015625, -0.2127685546875, -0.17724609375, -0.1417236328125, -0.106201171875, -0.0706787109375, -0.03515625, 0.0003662109375, 0.035888671875, 0.0714111328125, 0.10693359375, 0.1424560546875, 0.177978515625, 0.2135009765625, 0.2490234375, 0.2845458984375, 0.320068359375, 0.3555908203125, 0.39111328125, 0.4266357421875, 0.462158203125, 0.4976806640625, 0.533203125, 0.5687255859375, 0.604248046875, 0.6397705078125, 0.67529296875, 0.7108154296875, 0.746337890625, 0.7818603515625, 0.8173828125, 0.8529052734375, 0.888427734375, 0.9239501953125, 0.95947265625, 0.9949951171875, 1.030517578125, 1.0660400390625, 1.1015625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 14.0, 11.0, 17.0, 18.0, 15.0, 27.0, 32.0, 47.0, 34.0, 58.0, 54.0, 54.0, 72.0, 75.0, 64.0, 72.0, 59.0, 48.0, 44.0, 34.0, 24.0, 26.0, 20.0, 18.0, 13.0, 9.0, 9.0, 7.0, 1.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025463104248046875, -0.0024705231189727783, -0.002394735813140869, -0.00231894850730896, -0.0022431612014770508, -0.0021673738956451416, -0.0020915865898132324, -0.0020157992839813232, -0.001940011978149414, -0.0018642246723175049, -0.0017884373664855957, -0.0017126500606536865, -0.0016368627548217773, -0.0015610754489898682, -0.001485288143157959, -0.0014095008373260498, -0.0013337135314941406, -0.0012579262256622314, -0.0011821389198303223, -0.001106351613998413, -0.001030564308166504, -0.0009547770023345947, -0.0008789896965026855, -0.0008032023906707764, -0.0007274150848388672, -0.000651627779006958, -0.0005758404731750488, -0.0005000531673431396, -0.00042426586151123047, -0.0003484785556793213, -0.0002726912498474121, -0.00019690394401550293, -0.00012111663818359375, -4.532933235168457e-05, 3.045797348022461e-05, 0.00010624527931213379, 0.00018203258514404297, 0.00025781989097595215, 0.00033360719680786133, 0.0004093945026397705, 0.0004851818084716797, 0.0005609691143035889, 0.000636756420135498, 0.0007125437259674072, 0.0007883310317993164, 0.0008641183376312256, 0.0009399056434631348, 0.001015692949295044, 0.0010914802551269531, 0.0011672675609588623, 0.0012430548667907715, 0.0013188421726226807, 0.0013946294784545898, 0.001470416784286499, 0.0015462040901184082, 0.0016219913959503174, 0.0016977787017822266, 0.0017735660076141357, 0.001849353313446045, 0.001925140619277954, 0.0020009279251098633, 0.0020767152309417725, 0.0021525025367736816, 0.002228289842605591, 0.0023040771484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 6.0, 10.0, 16.0, 14.0, 17.0, 19.0, 27.0, 26.0, 42.0, 53.0, 85.0, 113.0, 167.0, 282.0, 528.0, 1956.0, 941703.0, 101103.0, 1126.0, 442.0, 235.0, 138.0, 119.0, 67.0, 53.0, 51.0, 25.0, 20.0, 28.0, 19.0, 10.0, 12.0, 6.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04296875, -0.04147911071777344, -0.039989471435546875, -0.03849983215332031, -0.03701019287109375, -0.03552055358886719, -0.034030914306640625, -0.03254127502441406, -0.0310516357421875, -0.029561996459960938, -0.028072357177734375, -0.026582717895507812, -0.02509307861328125, -0.023603439331054688, -0.022113800048828125, -0.020624160766601562, -0.019134521484375, -0.017644882202148438, -0.016155242919921875, -0.014665603637695312, -0.01317596435546875, -0.011686325073242188, -0.010196685791015625, -0.008707046508789062, -0.0072174072265625, -0.0057277679443359375, -0.004238128662109375, -0.0027484893798828125, -0.00125885009765625, 0.0002307891845703125, 0.001720428466796875, 0.0032100677490234375, 0.00469970703125, 0.0061893463134765625, 0.007678985595703125, 0.009168624877929688, 0.01065826416015625, 0.012147903442382812, 0.013637542724609375, 0.015127182006835938, 0.0166168212890625, 0.018106460571289062, 0.019596099853515625, 0.021085739135742188, 0.02257537841796875, 0.024065017700195312, 0.025554656982421875, 0.027044296264648438, 0.028533935546875, 0.030023574829101562, 0.031513214111328125, 0.03300285339355469, 0.03449249267578125, 0.03598213195800781, 0.037471771240234375, 0.03896141052246094, 0.0404510498046875, 0.04194068908691406, 0.043430328369140625, 0.04491996765136719, 0.04640960693359375, 0.04789924621582031, 0.049388885498046875, 0.05087852478027344, 0.0523681640625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 61.0, 385.0, 440.0, 107.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006576722953468561, -0.0064084515906870365, -0.006240180693566799, -0.0060719093307852745, -0.00590363796800375, -0.005735366605222225, -0.0055670952424407005, -0.005398824345320463, -0.0052305529825389385, -0.005062281619757414, -0.0048940107226371765, -0.004725739359855652, -0.004557467997074127, -0.0043891966342926025, -0.004220925271511078, -0.0040526543743908405, -0.003884383011609316, -0.003716111648827791, -0.00354784051887691, -0.003379569388926029, -0.0032112980261445045, -0.00304302666336298, -0.002874755533412099, -0.002706484403461218, -0.0025382130406796932, -0.0023699416778981686, -0.0022016705479472876, -0.0020333994179964066, -0.001865128055214882, -0.001696856808848679, -0.0015285855624824762, -0.0013603143161162734, -0.0011920435354113579, -0.001023772289045155, -0.0008555010426789522, -0.0006872297963127494, -0.0005189585499465466, -0.0003506873035803437, -0.0001824160572141409, -1.414481084793806e-05, 0.00015412643551826477, 0.0003223976818844676, 0.0004906689282506704, 0.0006589401746168733, 0.0008272114209830761, 0.000995482667349279, 0.0011637539137154818, 0.0013320251600816846, 0.0015002964064478874, 0.0016685676528140903, 0.001836838899180293, 0.002005110029131174, 0.0021733813919126987, 0.0023416527546942234, 0.0025099238846451044, 0.0026781950145959854, 0.00284646637737751, 0.0030147377401590347, 0.0031830088701099157, 0.0033512800000607967, 0.0035195513628423214, 0.003687822725623846, 0.003856093855574727, 0.004024364985525608, 0.004192636348307133]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 9.0, 8.0, 6.0, 14.0, 23.0, 14.0, 17.0, 23.0, 25.0, 26.0, 24.0, 39.0, 33.0, 47.0, 61.0, 43.0, 33.0, 41.0, 35.0, 41.0, 45.0, 48.0, 41.0, 29.0, 30.0, 41.0, 26.0, 31.0, 12.0, 27.0, 27.0, 17.0, 11.0, 10.0, 13.0, 8.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010998845100402832, -0.0010632015764713287, -0.0010265186429023743, -0.0009898357093334198, -0.0009531527757644653, -0.0009164698421955109, -0.0008797869086265564, -0.0008431039750576019, -0.0008064210414886475, -0.000769738107919693, -0.0007330551743507385, -0.0006963722407817841, -0.0006596893072128296, -0.0006230063736438751, -0.0005863234400749207, -0.0005496405065059662, -0.0005129575729370117, -0.00047627463936805725, -0.0004395917057991028, -0.0004029087722301483, -0.00036622583866119385, -0.0003295429050922394, -0.0002928599715232849, -0.00025617703795433044, -0.00021949410438537598, -0.0001828111708164215, -0.00014612823724746704, -0.00010944530367851257, -7.27623701095581e-05, -3.607943654060364e-05, 6.034970283508301e-07, 3.72864305973053e-05, 7.396936416625977e-05, 0.00011065229773521423, 0.0001473352313041687, 0.00018401816487312317, 0.00022070109844207764, 0.0002573840320110321, 0.00029406696557998657, 0.00033074989914894104, 0.0003674328327178955, 0.00040411576628685, 0.00044079869985580444, 0.0004774816334247589, 0.0005141645669937134, 0.0005508475005626678, 0.0005875304341316223, 0.0006242133677005768, 0.0006608963012695312, 0.0006975792348384857, 0.0007342621684074402, 0.0007709451019763947, 0.0008076280355453491, 0.0008443109691143036, 0.0008809939026832581, 0.0009176768362522125, 0.000954359769821167, 0.0009910427033901215, 0.001027725636959076, 0.0010644085705280304, 0.0011010915040969849, 0.0011377744376659393, 0.0011744573712348938, 0.0012111403048038483, 0.0012478232383728027]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 5.0, 3.0, 7.0, 11.0, 13.0, 6.0, 4.0, 12.0, 14.0, 29.0, 18.0, 13.0, 45.0, 31.0, 28.0, 42.0, 40.0, 37.0, 31.0, 44.0, 54.0, 44.0, 47.0, 32.0, 37.0, 38.0, 36.0, 36.0, 37.0, 27.0, 20.0, 19.0, 23.0, 26.0, 16.0, 17.0, 10.0, 14.0, 5.0, 10.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.75, -10.4354248046875, -10.120849609375, -9.8062744140625, -9.49169921875, -9.1771240234375, -8.862548828125, -8.5479736328125, -8.2333984375, -7.9188232421875, -7.604248046875, -7.2896728515625, -6.97509765625, -6.6605224609375, -6.345947265625, -6.0313720703125, -5.716796875, -5.4022216796875, -5.087646484375, -4.7730712890625, -4.45849609375, -4.1439208984375, -3.829345703125, -3.5147705078125, -3.2001953125, -2.8856201171875, -2.571044921875, -2.2564697265625, -1.94189453125, -1.6273193359375, -1.312744140625, -0.9981689453125, -0.68359375, -0.3690185546875, -0.054443359375, 0.2601318359375, 0.57470703125, 0.8892822265625, 1.203857421875, 1.5184326171875, 1.8330078125, 2.1475830078125, 2.462158203125, 2.7767333984375, 3.09130859375, 3.4058837890625, 3.720458984375, 4.0350341796875, 4.349609375, 4.6641845703125, 4.978759765625, 5.2933349609375, 5.60791015625, 5.9224853515625, 6.237060546875, 6.5516357421875, 6.8662109375, 7.1807861328125, 7.495361328125, 7.8099365234375, 8.12451171875, 8.4390869140625, 8.753662109375, 9.0682373046875, 9.3828125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 6.0, 5.0, 10.0, 9.0, 10.0, 25.0, 26.0, 34.0, 50.0, 73.0, 78.0, 132.0, 187.0, 267.0, 438.0, 688.0, 1082.0, 1798.0, 3057.0, 5130.0, 9492.0, 19378.0, 47111.0, 159332.0, 565161.0, 149337.0, 45013.0, 18648.0, 9139.0, 5043.0, 2890.0, 1773.0, 1071.0, 684.0, 419.0, 298.0, 186.0, 114.0, 110.0, 48.0, 61.0, 34.0, 35.0, 10.0, 18.0, 8.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0], "bins": [-10.65625, -10.34716796875, -10.0380859375, -9.72900390625, -9.419921875, -9.11083984375, -8.8017578125, -8.49267578125, -8.18359375, -7.87451171875, -7.5654296875, -7.25634765625, -6.947265625, -6.63818359375, -6.3291015625, -6.02001953125, -5.7109375, -5.40185546875, -5.0927734375, -4.78369140625, -4.474609375, -4.16552734375, -3.8564453125, -3.54736328125, -3.23828125, -2.92919921875, -2.6201171875, -2.31103515625, -2.001953125, -1.69287109375, -1.3837890625, -1.07470703125, -0.765625, -0.45654296875, -0.1474609375, 0.16162109375, 0.470703125, 0.77978515625, 1.0888671875, 1.39794921875, 1.70703125, 2.01611328125, 2.3251953125, 2.63427734375, 2.943359375, 3.25244140625, 3.5615234375, 3.87060546875, 4.1796875, 4.48876953125, 4.7978515625, 5.10693359375, 5.416015625, 5.72509765625, 6.0341796875, 6.34326171875, 6.65234375, 6.96142578125, 7.2705078125, 7.57958984375, 7.888671875, 8.19775390625, 8.5068359375, 8.81591796875, 9.125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 1.0, 9.0, 6.0, 6.0, 7.0, 8.0, 9.0, 5.0, 20.0, 23.0, 17.0, 20.0, 15.0, 28.0, 33.0, 31.0, 33.0, 33.0, 44.0, 48.0, 72.0, 113.0, 1751.0, 224.0, 74.0, 50.0, 44.0, 39.0, 36.0, 45.0, 25.0, 28.0, 18.0, 23.0, 26.0, 8.0, 15.0, 10.0, 12.0, 11.0, 8.0, 3.0, 4.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.78125, -36.66064453125, -35.5400390625, -34.41943359375, -33.298828125, -32.17822265625, -31.0576171875, -29.93701171875, -28.81640625, -27.69580078125, -26.5751953125, -25.45458984375, -24.333984375, -23.21337890625, -22.0927734375, -20.97216796875, -19.8515625, -18.73095703125, -17.6103515625, -16.48974609375, -15.369140625, -14.24853515625, -13.1279296875, -12.00732421875, -10.88671875, -9.76611328125, -8.6455078125, -7.52490234375, -6.404296875, -5.28369140625, -4.1630859375, -3.04248046875, -1.921875, -0.80126953125, 0.3193359375, 1.43994140625, 2.560546875, 3.68115234375, 4.8017578125, 5.92236328125, 7.04296875, 8.16357421875, 9.2841796875, 10.40478515625, 11.525390625, 12.64599609375, 13.7666015625, 14.88720703125, 16.0078125, 17.12841796875, 18.2490234375, 19.36962890625, 20.490234375, 21.61083984375, 22.7314453125, 23.85205078125, 24.97265625, 26.09326171875, 27.2138671875, 28.33447265625, 29.455078125, 30.57568359375, 31.6962890625, 32.81689453125, 33.9375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 9.0, 14.0, 9.0, 17.0, 27.0, 23.0, 44.0, 60.0, 103.0, 145.0, 258.0, 708.0, 5052.0, 3046025.0, 90369.0, 1778.0, 444.0, 194.0, 144.0, 82.0, 62.0, 44.0, 32.0, 20.0, 8.0, 10.0, 11.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.3125, -113.9404296875, -110.568359375, -107.1962890625, -103.82421875, -100.4521484375, -97.080078125, -93.7080078125, -90.3359375, -86.9638671875, -83.591796875, -80.2197265625, -76.84765625, -73.4755859375, -70.103515625, -66.7314453125, -63.359375, -59.9873046875, -56.615234375, -53.2431640625, -49.87109375, -46.4990234375, -43.126953125, -39.7548828125, -36.3828125, -33.0107421875, -29.638671875, -26.2666015625, -22.89453125, -19.5224609375, -16.150390625, -12.7783203125, -9.40625, -6.0341796875, -2.662109375, 0.7099609375, 4.08203125, 7.4541015625, 10.826171875, 14.1982421875, 17.5703125, 20.9423828125, 24.314453125, 27.6865234375, 31.05859375, 34.4306640625, 37.802734375, 41.1748046875, 44.546875, 47.9189453125, 51.291015625, 54.6630859375, 58.03515625, 61.4072265625, 64.779296875, 68.1513671875, 71.5234375, 74.8955078125, 78.267578125, 81.6396484375, 85.01171875, 88.3837890625, 91.755859375, 95.1279296875, 98.5]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 219.0, 634.0, 136.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.3973693847656, -319.3601379394531, -312.3228759765625, -305.28564453125, -298.2483825683594, -291.2111511230469, -284.17388916015625, -277.13665771484375, -270.09942626953125, -263.06219482421875, -256.0249328613281, -248.98770141601562, -241.95045471191406, -234.9132080078125, -227.87596130371094, -220.83871459960938, -213.8014678955078, -206.76422119140625, -199.7269744873047, -192.68972778320312, -185.65249633789062, -178.61524963378906, -171.5780029296875, -164.54075622558594, -157.50350952148438, -150.4662628173828, -143.42901611328125, -136.39178466796875, -129.3545379638672, -122.31729125976562, -115.28004455566406, -108.2427978515625, -101.20557403564453, -94.16832733154297, -87.13108825683594, -80.09384155273438, -73.05659484863281, -66.01935577392578, -58.98210906982422, -51.94486618041992, -44.907623291015625, -37.87038040161133, -30.8331356048584, -23.79589080810547, -16.758647918701172, -9.721405029296875, -2.6841583251953125, 4.353084564208984, 11.390327453613281, 18.427570343017578, 25.464815139770508, 32.50205993652344, 39.539302825927734, 46.57654571533203, 53.613792419433594, 60.65103530883789, 67.68827819824219, 74.72552490234375, 81.76276397705078, 88.80001068115234, 95.83724975585938, 102.87449645996094, 109.9117431640625, 116.94898986816406, 123.9862289428711]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 4.0, 9.0, 7.0, 11.0, 12.0, 12.0, 20.0, 21.0, 22.0, 16.0, 21.0, 23.0, 34.0, 37.0, 19.0, 35.0, 44.0, 38.0, 39.0, 42.0, 46.0, 36.0, 39.0, 25.0, 44.0, 32.0, 39.0, 31.0, 28.0, 29.0, 25.0, 23.0, 27.0, 19.0, 8.0, 12.0, 15.0, 9.0, 7.0, 6.0, 6.0, 6.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-99.8073959350586, -96.61431121826172, -93.42121887207031, -90.22813415527344, -87.03504180908203, -83.84195709228516, -80.64886474609375, -77.45578002929688, -74.2626953125, -71.06961059570312, -67.87651824951172, -64.68343353271484, -61.49034118652344, -58.29725646972656, -55.10416793823242, -51.91107940673828, -48.717987060546875, -45.524898529052734, -42.331809997558594, -39.13872528076172, -35.94563293457031, -32.75254821777344, -29.559459686279297, -26.366371154785156, -23.173282623291016, -19.980194091796875, -16.787105560302734, -13.594018936157227, -10.400930404663086, -7.207841873168945, -4.0147552490234375, -0.8216667175292969, 2.371429443359375, 5.564517498016357, 8.75760555267334, 11.950693130493164, 15.143781661987305, 18.336870193481445, 21.529956817626953, 24.723045349121094, 27.916133880615234, 31.109222412109375, 34.302310943603516, 37.495399475097656, 40.68848419189453, 43.88157653808594, 47.07466125488281, 50.26774978637695, 53.460838317871094, 56.653926849365234, 59.847015380859375, 63.04010009765625, 66.23319244384766, 69.42627716064453, 72.61936950683594, 75.81245422363281, 79.00553894042969, 82.19862365722656, 85.39171600341797, 88.58480072021484, 91.77789306640625, 94.97097778320312, 98.1640625, 101.3571548461914, 104.55024719238281]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 10.0, 9.0, 11.0, 9.0, 15.0, 13.0, 16.0, 18.0, 22.0, 32.0, 37.0, 34.0, 40.0, 45.0, 38.0, 31.0, 46.0, 51.0, 47.0, 46.0, 38.0, 37.0, 36.0, 30.0, 41.0, 27.0, 32.0, 22.0, 26.0, 26.0, 16.0, 16.0, 20.0, 11.0, 7.0, 8.0, 7.0, 3.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.2421875, -10.9129638671875, -10.583740234375, -10.2545166015625, -9.92529296875, -9.5960693359375, -9.266845703125, -8.9376220703125, -8.6083984375, -8.2791748046875, -7.949951171875, -7.6207275390625, -7.29150390625, -6.9622802734375, -6.633056640625, -6.3038330078125, -5.974609375, -5.6453857421875, -5.316162109375, -4.9869384765625, -4.65771484375, -4.3284912109375, -3.999267578125, -3.6700439453125, -3.3408203125, -3.0115966796875, -2.682373046875, -2.3531494140625, -2.02392578125, -1.6947021484375, -1.365478515625, -1.0362548828125, -0.70703125, -0.3778076171875, -0.048583984375, 0.2806396484375, 0.60986328125, 0.9390869140625, 1.268310546875, 1.5975341796875, 1.9267578125, 2.2559814453125, 2.585205078125, 2.9144287109375, 3.24365234375, 3.5728759765625, 3.902099609375, 4.2313232421875, 4.560546875, 4.8897705078125, 5.218994140625, 5.5482177734375, 5.87744140625, 6.2066650390625, 6.535888671875, 6.8651123046875, 7.1943359375, 7.5235595703125, 7.852783203125, 8.1820068359375, 8.51123046875, 8.8404541015625, 9.169677734375, 9.4989013671875, 9.828125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 9.0, 16.0, 19.0, 22.0, 36.0, 54.0, 63.0, 92.0, 146.0, 222.0, 398.0, 727.0, 1334.0, 2598.0, 5513.0, 12935.0, 32930.0, 103668.0, 395661.0, 1208945.0, 1531387.0, 637945.0, 174378.0, 51265.0, 18713.0, 7815.0, 3436.0, 1748.0, 891.0, 461.0, 276.0, 196.0, 114.0, 76.0, 51.0, 41.0, 34.0, 13.0, 16.0, 11.0, 6.0, 3.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.543212890625, -12.14111328125, -11.739013671875, -11.3369140625, -10.934814453125, -10.53271484375, -10.130615234375, -9.728515625, -9.326416015625, -8.92431640625, -8.522216796875, -8.1201171875, -7.718017578125, -7.31591796875, -6.913818359375, -6.51171875, -6.109619140625, -5.70751953125, -5.305419921875, -4.9033203125, -4.501220703125, -4.09912109375, -3.697021484375, -3.294921875, -2.892822265625, -2.49072265625, -2.088623046875, -1.6865234375, -1.284423828125, -0.88232421875, -0.480224609375, -0.078125, 0.323974609375, 0.72607421875, 1.128173828125, 1.5302734375, 1.932373046875, 2.33447265625, 2.736572265625, 3.138671875, 3.540771484375, 3.94287109375, 4.344970703125, 4.7470703125, 5.149169921875, 5.55126953125, 5.953369140625, 6.35546875, 6.757568359375, 7.15966796875, 7.561767578125, 7.9638671875, 8.365966796875, 8.76806640625, 9.170166015625, 9.572265625, 9.974365234375, 10.37646484375, 10.778564453125, 11.1806640625, 11.582763671875, 11.98486328125, 12.386962890625, 12.7890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 8.0, 10.0, 14.0, 21.0, 23.0, 33.0, 30.0, 44.0, 68.0, 85.0, 103.0, 140.0, 183.0, 210.0, 286.0, 367.0, 384.0, 429.0, 390.0, 267.0, 233.0, 172.0, 136.0, 98.0, 81.0, 69.0, 43.0, 37.0, 28.0, 29.0, 8.0, 10.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-31.828125, -31.070068359375, -30.31201171875, -29.553955078125, -28.7958984375, -28.037841796875, -27.27978515625, -26.521728515625, -25.763671875, -25.005615234375, -24.24755859375, -23.489501953125, -22.7314453125, -21.973388671875, -21.21533203125, -20.457275390625, -19.69921875, -18.941162109375, -18.18310546875, -17.425048828125, -16.6669921875, -15.908935546875, -15.15087890625, -14.392822265625, -13.634765625, -12.876708984375, -12.11865234375, -11.360595703125, -10.6025390625, -9.844482421875, -9.08642578125, -8.328369140625, -7.5703125, -6.812255859375, -6.05419921875, -5.296142578125, -4.5380859375, -3.780029296875, -3.02197265625, -2.263916015625, -1.505859375, -0.747802734375, 0.01025390625, 0.768310546875, 1.5263671875, 2.284423828125, 3.04248046875, 3.800537109375, 4.55859375, 5.316650390625, 6.07470703125, 6.832763671875, 7.5908203125, 8.348876953125, 9.10693359375, 9.864990234375, 10.623046875, 11.381103515625, 12.13916015625, 12.897216796875, 13.6552734375, 14.413330078125, 15.17138671875, 15.929443359375, 16.6875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 15.0, 11.0, 12.0, 28.0, 43.0, 41.0, 54.0, 64.0, 105.0, 148.0, 228.0, 429.0, 1569.0, 31187.0, 3752280.0, 401057.0, 5264.0, 734.0, 325.0, 174.0, 124.0, 94.0, 69.0, 42.0, 36.0, 37.0, 23.0, 14.0, 18.0, 14.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-81.4375, -78.275390625, -75.11328125, -71.951171875, -68.7890625, -65.626953125, -62.46484375, -59.302734375, -56.140625, -52.978515625, -49.81640625, -46.654296875, -43.4921875, -40.330078125, -37.16796875, -34.005859375, -30.84375, -27.681640625, -24.51953125, -21.357421875, -18.1953125, -15.033203125, -11.87109375, -8.708984375, -5.546875, -2.384765625, 0.77734375, 3.939453125, 7.1015625, 10.263671875, 13.42578125, 16.587890625, 19.75, 22.912109375, 26.07421875, 29.236328125, 32.3984375, 35.560546875, 38.72265625, 41.884765625, 45.046875, 48.208984375, 51.37109375, 54.533203125, 57.6953125, 60.857421875, 64.01953125, 67.181640625, 70.34375, 73.505859375, 76.66796875, 79.830078125, 82.9921875, 86.154296875, 89.31640625, 92.478515625, 95.640625, 98.802734375, 101.96484375, 105.126953125, 108.2890625, 111.451171875, 114.61328125, 117.775390625, 120.9375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 22.0, 76.0, 190.0, 319.0, 248.0, 112.0, 33.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-313.3824768066406, -303.8031311035156, -294.2237854003906, -284.6444091796875, -275.0650634765625, -265.4857177734375, -255.9063720703125, -246.3270263671875, -236.74766540527344, -227.16831970214844, -217.58895874023438, -208.00961303710938, -198.43026733398438, -188.8509063720703, -179.2715606689453, -169.69219970703125, -160.11285400390625, -150.53350830078125, -140.9541473388672, -131.3748016357422, -121.79544830322266, -112.21609497070312, -102.63674926757812, -93.0573959350586, -83.47804260253906, -73.89868927001953, -64.3193359375, -54.739990234375, -45.16063690185547, -35.58128356933594, -26.001934051513672, -16.422584533691406, -6.84326171875, 2.7360897064208984, 12.315441131591797, 21.894792556762695, 31.474143981933594, 41.053497314453125, 50.63284683227539, 60.212196350097656, 69.79154968261719, 79.37090301513672, 88.95025634765625, 98.52960205078125, 108.10895538330078, 117.68830871582031, 127.26765441894531, 136.84701538085938, 146.42636108398438, 156.00570678710938, 165.58506774902344, 175.16441345214844, 184.7437744140625, 194.3231201171875, 203.9024658203125, 213.4818115234375, 223.06117248535156, 232.64051818847656, 242.21987915039062, 251.79922485351562, 261.3785705566406, 270.95794677734375, 280.53729248046875, 290.11663818359375, 299.69598388671875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 4.0, 8.0, 6.0, 12.0, 16.0, 23.0, 21.0, 21.0, 20.0, 20.0, 31.0, 28.0, 33.0, 42.0, 51.0, 35.0, 33.0, 37.0, 44.0, 51.0, 40.0, 40.0, 33.0, 35.0, 34.0, 34.0, 34.0, 24.0, 23.0, 18.0, 21.0, 25.0, 18.0, 9.0, 12.0, 11.0, 11.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.7083740234375, -79.97003173828125, -77.23168182373047, -74.49333953857422, -71.75499725341797, -69.01664733886719, -66.27830505371094, -63.53996276855469, -60.80161666870117, -58.063270568847656, -55.324928283691406, -52.58658218383789, -49.848236083984375, -47.109893798828125, -44.37154769897461, -41.633201599121094, -38.894859313964844, -36.15651321411133, -33.41817092895508, -30.679824829101562, -27.94148063659668, -25.203136444091797, -22.46479034423828, -19.7264461517334, -16.988101959228516, -14.249757766723633, -11.511412620544434, -8.773067474365234, -6.034723281860352, -3.2963790893554688, -0.5580329895019531, 2.1803112030029297, 4.918663024902344, 7.657007694244385, 10.395352363586426, 13.133697509765625, 15.872041702270508, 18.61038589477539, 21.348731994628906, 24.08707618713379, 26.825420379638672, 29.563764572143555, 32.30210876464844, 35.04045486450195, 37.77880096435547, 40.51714324951172, 43.255489349365234, 45.99383544921875, 48.732177734375, 51.470523834228516, 54.208866119384766, 56.94721221923828, 59.68555450439453, 62.42390060424805, 65.16224670410156, 67.90058898925781, 70.63893127441406, 73.37727355957031, 76.1156234741211, 78.85396575927734, 81.5923080444336, 84.33065795898438, 87.06900024414062, 89.80734252929688, 92.54569244384766]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 7.0, 9.0, 7.0, 8.0, 9.0, 13.0, 14.0, 22.0, 21.0, 23.0, 22.0, 34.0, 32.0, 41.0, 39.0, 34.0, 39.0, 42.0, 50.0, 46.0, 41.0, 45.0, 28.0, 41.0, 36.0, 40.0, 31.0, 38.0, 29.0, 22.0, 19.0, 21.0, 12.0, 16.0, 16.0, 15.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5390625, -11.1961669921875, -10.853271484375, -10.5103759765625, -10.16748046875, -9.8245849609375, -9.481689453125, -9.1387939453125, -8.7958984375, -8.4530029296875, -8.110107421875, -7.7672119140625, -7.42431640625, -7.0814208984375, -6.738525390625, -6.3956298828125, -6.052734375, -5.7098388671875, -5.366943359375, -5.0240478515625, -4.68115234375, -4.3382568359375, -3.995361328125, -3.6524658203125, -3.3095703125, -2.9666748046875, -2.623779296875, -2.2808837890625, -1.93798828125, -1.5950927734375, -1.252197265625, -0.9093017578125, -0.56640625, -0.2235107421875, 0.119384765625, 0.4622802734375, 0.80517578125, 1.1480712890625, 1.490966796875, 1.8338623046875, 2.1767578125, 2.5196533203125, 2.862548828125, 3.2054443359375, 3.54833984375, 3.8912353515625, 4.234130859375, 4.5770263671875, 4.919921875, 5.2628173828125, 5.605712890625, 5.9486083984375, 6.29150390625, 6.6343994140625, 6.977294921875, 7.3201904296875, 7.6630859375, 8.0059814453125, 8.348876953125, 8.6917724609375, 9.03466796875, 9.3775634765625, 9.720458984375, 10.0633544921875, 10.40625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 22.0, 33.0, 37.0, 76.0, 95.0, 159.0, 208.0, 320.0, 485.0, 709.0, 976.0, 1583.0, 2367.0, 3427.0, 5207.0, 7868.0, 11451.0, 17088.0, 25878.0, 39433.0, 60666.0, 93376.0, 141719.0, 189255.0, 151423.0, 101000.0, 65657.0, 43045.0, 28234.0, 18932.0, 12358.0, 8333.0, 5591.0, 3841.0, 2536.0, 1695.0, 1089.0, 791.0, 533.0, 338.0, 239.0, 150.0, 122.0, 64.0, 46.0, 31.0, 15.0, 14.0, 9.0, 5.0, 2.0, 1.0, 9.0, 0.0, 0.0, 2.0], "bins": [-1.072265625, -1.038330078125, -1.00439453125, -0.970458984375, -0.9365234375, -0.902587890625, -0.86865234375, -0.834716796875, -0.80078125, -0.766845703125, -0.73291015625, -0.698974609375, -0.6650390625, -0.631103515625, -0.59716796875, -0.563232421875, -0.529296875, -0.495361328125, -0.46142578125, -0.427490234375, -0.3935546875, -0.359619140625, -0.32568359375, -0.291748046875, -0.2578125, -0.223876953125, -0.18994140625, -0.156005859375, -0.1220703125, -0.088134765625, -0.05419921875, -0.020263671875, 0.013671875, 0.047607421875, 0.08154296875, 0.115478515625, 0.1494140625, 0.183349609375, 0.21728515625, 0.251220703125, 0.28515625, 0.319091796875, 0.35302734375, 0.386962890625, 0.4208984375, 0.454833984375, 0.48876953125, 0.522705078125, 0.556640625, 0.590576171875, 0.62451171875, 0.658447265625, 0.6923828125, 0.726318359375, 0.76025390625, 0.794189453125, 0.828125, 0.862060546875, 0.89599609375, 0.929931640625, 0.9638671875, 0.997802734375, 1.03173828125, 1.065673828125, 1.099609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 9.0, 8.0, 14.0, 13.0, 14.0, 15.0, 26.0, 24.0, 18.0, 25.0, 30.0, 27.0, 36.0, 29.0, 39.0, 37.0, 40.0, 35.0, 33.0, 1052.0, 35.0, 24.0, 37.0, 45.0, 29.0, 18.0, 34.0, 32.0, 20.0, 22.0, 28.0, 25.0, 13.0, 18.0, 15.0, 10.0, 5.0, 10.0, 15.0, 8.0, 3.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-6.08984375, -5.9058837890625, -5.721923828125, -5.5379638671875, -5.35400390625, -5.1700439453125, -4.986083984375, -4.8021240234375, -4.6181640625, -4.4342041015625, -4.250244140625, -4.0662841796875, -3.88232421875, -3.6983642578125, -3.514404296875, -3.3304443359375, -3.146484375, -2.9625244140625, -2.778564453125, -2.5946044921875, -2.41064453125, -2.2266845703125, -2.042724609375, -1.8587646484375, -1.6748046875, -1.4908447265625, -1.306884765625, -1.1229248046875, -0.93896484375, -0.7550048828125, -0.571044921875, -0.3870849609375, -0.203125, -0.0191650390625, 0.164794921875, 0.3487548828125, 0.53271484375, 0.7166748046875, 0.900634765625, 1.0845947265625, 1.2685546875, 1.4525146484375, 1.636474609375, 1.8204345703125, 2.00439453125, 2.1883544921875, 2.372314453125, 2.5562744140625, 2.740234375, 2.9241943359375, 3.108154296875, 3.2921142578125, 3.47607421875, 3.6600341796875, 3.843994140625, 4.0279541015625, 4.2119140625, 4.3958740234375, 4.579833984375, 4.7637939453125, 4.94775390625, 5.1317138671875, 5.315673828125, 5.4996337890625, 5.68359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 7.0, 12.0, 18.0, 17.0, 48.0, 48.0, 86.0, 122.0, 160.0, 243.0, 368.0, 551.0, 801.0, 1237.0, 1803.0, 2587.0, 4060.0, 5945.0, 8960.0, 13562.0, 20833.0, 31800.0, 48952.0, 75438.0, 117791.0, 195848.0, 1214538.0, 123064.0, 79173.0, 51398.0, 33458.0, 21910.0, 14210.0, 9377.0, 6110.0, 4214.0, 2760.0, 1766.0, 1236.0, 835.0, 575.0, 395.0, 264.0, 176.0, 118.0, 112.0, 53.0, 35.0, 22.0, 11.0, 12.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0166015625, -0.9827728271484375, -0.948944091796875, -0.9151153564453125, -0.88128662109375, -0.8474578857421875, -0.813629150390625, -0.7798004150390625, -0.7459716796875, -0.7121429443359375, -0.678314208984375, -0.6444854736328125, -0.61065673828125, -0.5768280029296875, -0.542999267578125, -0.5091705322265625, -0.475341796875, -0.4415130615234375, -0.407684326171875, -0.3738555908203125, -0.34002685546875, -0.3061981201171875, -0.272369384765625, -0.2385406494140625, -0.2047119140625, -0.1708831787109375, -0.137054443359375, -0.1032257080078125, -0.06939697265625, -0.0355682373046875, -0.001739501953125, 0.0320892333984375, 0.06591796875, 0.0997467041015625, 0.133575439453125, 0.1674041748046875, 0.20123291015625, 0.2350616455078125, 0.268890380859375, 0.3027191162109375, 0.3365478515625, 0.3703765869140625, 0.404205322265625, 0.4380340576171875, 0.47186279296875, 0.5056915283203125, 0.539520263671875, 0.5733489990234375, 0.607177734375, 0.6410064697265625, 0.674835205078125, 0.7086639404296875, 0.74249267578125, 0.7763214111328125, 0.810150146484375, 0.8439788818359375, 0.8778076171875, 0.9116363525390625, 0.945465087890625, 0.9792938232421875, 1.01312255859375, 1.0469512939453125, 1.080780029296875, 1.1146087646484375, 1.1484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 6.0, 4.0, 8.0, 7.0, 11.0, 18.0, 17.0, 26.0, 30.0, 24.0, 41.0, 56.0, 62.0, 76.0, 93.0, 78.0, 78.0, 44.0, 48.0, 40.0, 43.0, 48.0, 16.0, 27.0, 17.0, 15.0, 17.0, 7.0, 12.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0033626556396484375, -0.0032573938369750977, -0.003152132034301758, -0.003046870231628418, -0.002941608428955078, -0.0028363466262817383, -0.0027310848236083984, -0.0026258230209350586, -0.0025205612182617188, -0.002415299415588379, -0.002310037612915039, -0.0022047758102416992, -0.0020995140075683594, -0.0019942522048950195, -0.0018889904022216797, -0.0017837285995483398, -0.001678466796875, -0.0015732049942016602, -0.0014679431915283203, -0.0013626813888549805, -0.0012574195861816406, -0.0011521577835083008, -0.001046895980834961, -0.0009416341781616211, -0.0008363723754882812, -0.0007311105728149414, -0.0006258487701416016, -0.0005205869674682617, -0.0004153251647949219, -0.00031006336212158203, -0.0002048015594482422, -9.953975677490234e-05, 5.7220458984375e-06, 0.00011098384857177734, 0.0002162456512451172, 0.00032150745391845703, 0.0004267692565917969, 0.0005320310592651367, 0.0006372928619384766, 0.0007425546646118164, 0.0008478164672851562, 0.0009530782699584961, 0.001058340072631836, 0.0011636018753051758, 0.0012688636779785156, 0.0013741254806518555, 0.0014793872833251953, 0.0015846490859985352, 0.001689910888671875, 0.0017951726913452148, 0.0019004344940185547, 0.0020056962966918945, 0.0021109580993652344, 0.0022162199020385742, 0.002321481704711914, 0.002426743507385254, 0.0025320053100585938, 0.0026372671127319336, 0.0027425289154052734, 0.0028477907180786133, 0.002953052520751953, 0.003058314323425293, 0.003163576126098633, 0.0032688379287719727, 0.0033740997314453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 4.0, 13.0, 15.0, 14.0, 26.0, 30.0, 40.0, 66.0, 106.0, 151.0, 316.0, 736.0, 29301.0, 1015381.0, 1332.0, 443.0, 211.0, 107.0, 67.0, 40.0, 39.0, 21.0, 11.0, 9.0, 9.0, 9.0, 9.0, 3.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.071044921875, -0.06852531433105469, -0.06600570678710938, -0.06348609924316406, -0.06096649169921875, -0.05844688415527344, -0.055927276611328125, -0.05340766906738281, -0.0508880615234375, -0.04836845397949219, -0.045848846435546875, -0.04332923889160156, -0.04080963134765625, -0.03829002380371094, -0.035770416259765625, -0.03325080871582031, -0.030731201171875, -0.028211593627929688, -0.025691986083984375, -0.023172378540039062, -0.02065277099609375, -0.018133163452148438, -0.015613555908203125, -0.013093948364257812, -0.0105743408203125, -0.008054733276367188, -0.005535125732421875, -0.0030155181884765625, -0.00049591064453125, 0.0020236968994140625, 0.004543304443359375, 0.0070629119873046875, 0.00958251953125, 0.012102127075195312, 0.014621734619140625, 0.017141342163085938, 0.01966094970703125, 0.022180557250976562, 0.024700164794921875, 0.027219772338867188, 0.0297393798828125, 0.03225898742675781, 0.034778594970703125, 0.03729820251464844, 0.03981781005859375, 0.04233741760253906, 0.044857025146484375, 0.04737663269042969, 0.049896240234375, 0.05241584777832031, 0.054935455322265625, 0.05745506286621094, 0.05997467041015625, 0.06249427795410156, 0.06501388549804688, 0.06753349304199219, 0.0700531005859375, 0.07257270812988281, 0.07509231567382812, 0.07761192321777344, 0.08013153076171875, 0.08265113830566406, 0.08517074584960938, 0.08769035339355469, 0.0902099609375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 260.0, 688.0, 52.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004649254493415356, -0.004322778899222612, -0.003996303305029869, -0.0036698277108371258, -0.0033433521166443825, -0.003016876522451639, -0.002690400928258896, -0.0023639253340661526, -0.0020374497398734093, -0.001710974145680666, -0.0013844985514879227, -0.0010580229572951794, -0.0007315473631024361, -0.00040507176890969276, -7.859617471694946e-05, 0.00024787941947579384, 0.0005743550136685371, 0.0009008306078612804, 0.0012273062020540237, 0.001553781796246767, 0.0018802573904395103, 0.0022067329846322536, 0.002533208578824997, 0.0028596841730177402, 0.0031861597672104836, 0.003512635361403227, 0.00383911095559597, 0.0041655865497887135, 0.004492062143981457, 0.0048185377381742, 0.005145013332366943, 0.005471488926559687, 0.005797963589429855, 0.006124439183622599, 0.006450914777815342, 0.006777390372008085, 0.0071038659662008286, 0.007430341560393572, 0.007756817154586315, 0.008083293214440346, 0.008409768342971802, 0.008736243471503258, 0.009062719531357288, 0.009389195591211319, 0.009715670719742775, 0.010042145848274231, 0.010368621908128262, 0.010695097967982292, 0.011021573096513748, 0.011348048225045204, 0.011674524284899235, 0.012001000344753265, 0.012327475473284721, 0.012653950601816177, 0.012980426661670208, 0.013306902721524239, 0.013633377850055695, 0.01395985297858715, 0.014286329038441181, 0.014612805098295212, 0.014939280226826668, 0.015265755355358124, 0.015592231415212154, 0.015918707475066185, 0.01624518260359764]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 10.0, 10.0, 8.0, 16.0, 21.0, 18.0, 14.0, 26.0, 18.0, 33.0, 37.0, 38.0, 50.0, 34.0, 27.0, 43.0, 29.0, 40.0, 34.0, 49.0, 45.0, 45.0, 37.0, 39.0, 28.0, 28.0, 27.0, 31.0, 14.0, 29.0, 20.0, 21.0, 18.0, 5.0, 13.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.001759648323059082, -0.0017096661031246185, -0.001659683883190155, -0.0016097016632556915, -0.001559719443321228, -0.0015097372233867645, -0.001459755003452301, -0.0014097727835178375, -0.001359790563583374, -0.0013098083436489105, -0.001259826123714447, -0.0012098439037799835, -0.00115986168384552, -0.0011098794639110565, -0.001059897243976593, -0.0010099150240421295, -0.000959932804107666, -0.0009099505841732025, -0.000859968364238739, -0.0008099861443042755, -0.000760003924369812, -0.0007100217044353485, -0.000660039484500885, -0.0006100572645664215, -0.000560075044631958, -0.0005100928246974945, -0.000460110604763031, -0.0004101283848285675, -0.000360146164894104, -0.0003101639449596405, -0.000260181725025177, -0.0002101995050907135, -0.00016021728515625, -0.0001102350652217865, -6.0252845287323e-05, -1.0270625352859497e-05, 3.9711594581604004e-05, 8.96938145160675e-05, 0.000139676034450531, 0.0001896582543849945, 0.000239640474319458, 0.0002896226942539215, 0.000339604914188385, 0.0003895871341228485, 0.000439569354057312, 0.0004895515739917755, 0.000539533793926239, 0.0005895160138607025, 0.000639498233795166, 0.0006894804537296295, 0.000739462673664093, 0.0007894448935985565, 0.00083942711353302, 0.0008894093334674835, 0.000939391553401947, 0.0009893737733364105, 0.001039355993270874, 0.0010893382132053375, 0.001139320433139801, 0.0011893026530742645, 0.001239284873008728, 0.0012892670929431915, 0.001339249312877655, 0.0013892315328121185, 0.001439213752746582]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 7.0, 9.0, 7.0, 8.0, 9.0, 13.0, 14.0, 22.0, 21.0, 23.0, 22.0, 34.0, 32.0, 41.0, 39.0, 34.0, 39.0, 42.0, 49.0, 47.0, 41.0, 45.0, 28.0, 41.0, 36.0, 40.0, 31.0, 38.0, 29.0, 22.0, 19.0, 21.0, 12.0, 16.0, 16.0, 15.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5390625, -11.1961669921875, -10.853271484375, -10.5103759765625, -10.16748046875, -9.8245849609375, -9.481689453125, -9.1387939453125, -8.7958984375, -8.4530029296875, -8.110107421875, -7.7672119140625, -7.42431640625, -7.0814208984375, -6.738525390625, -6.3956298828125, -6.052734375, -5.7098388671875, -5.366943359375, -5.0240478515625, -4.68115234375, -4.3382568359375, -3.995361328125, -3.6524658203125, -3.3095703125, -2.9666748046875, -2.623779296875, -2.2808837890625, -1.93798828125, -1.5950927734375, -1.252197265625, -0.9093017578125, -0.56640625, -0.2235107421875, 0.119384765625, 0.4622802734375, 0.80517578125, 1.1480712890625, 1.490966796875, 1.8338623046875, 2.1767578125, 2.5196533203125, 2.862548828125, 3.2054443359375, 3.54833984375, 3.8912353515625, 4.234130859375, 4.5770263671875, 4.919921875, 5.2628173828125, 5.605712890625, 5.9486083984375, 6.29150390625, 6.6343994140625, 6.977294921875, 7.3201904296875, 7.6630859375, 8.0059814453125, 8.348876953125, 8.6917724609375, 9.03466796875, 9.3775634765625, 9.720458984375, 10.0633544921875, 10.40625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 10.0, 12.0, 23.0, 23.0, 29.0, 47.0, 88.0, 121.0, 244.0, 397.0, 689.0, 1288.0, 2656.0, 5321.0, 11175.0, 25841.0, 69926.0, 262464.0, 468814.0, 126430.0, 41232.0, 16384.0, 7595.0, 3605.0, 1865.0, 967.0, 533.0, 298.0, 161.0, 86.0, 60.0, 52.0, 28.0, 30.0, 13.0, 10.0, 7.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.4854736328125, -9.181884765625, -8.8782958984375, -8.57470703125, -8.2711181640625, -7.967529296875, -7.6639404296875, -7.3603515625, -7.0567626953125, -6.753173828125, -6.4495849609375, -6.14599609375, -5.8424072265625, -5.538818359375, -5.2352294921875, -4.931640625, -4.6280517578125, -4.324462890625, -4.0208740234375, -3.71728515625, -3.4136962890625, -3.110107421875, -2.8065185546875, -2.5029296875, -2.1993408203125, -1.895751953125, -1.5921630859375, -1.28857421875, -0.9849853515625, -0.681396484375, -0.3778076171875, -0.07421875, 0.2293701171875, 0.532958984375, 0.8365478515625, 1.14013671875, 1.4437255859375, 1.747314453125, 2.0509033203125, 2.3544921875, 2.6580810546875, 2.961669921875, 3.2652587890625, 3.56884765625, 3.8724365234375, 4.176025390625, 4.4796142578125, 4.783203125, 5.0867919921875, 5.390380859375, 5.6939697265625, 5.99755859375, 6.3011474609375, 6.604736328125, 6.9083251953125, 7.2119140625, 7.5155029296875, 7.819091796875, 8.1226806640625, 8.42626953125, 8.7298583984375, 9.033447265625, 9.3370361328125, 9.640625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 2.0, 7.0, 7.0, 11.0, 6.0, 12.0, 16.0, 15.0, 17.0, 18.0, 30.0, 35.0, 48.0, 49.0, 51.0, 53.0, 57.0, 75.0, 173.0, 1651.0, 191.0, 69.0, 59.0, 53.0, 45.0, 55.0, 39.0, 28.0, 26.0, 19.0, 21.0, 24.0, 19.0, 7.0, 19.0, 13.0, 6.0, 5.0, 5.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-46.59375, -45.31640625, -44.0390625, -42.76171875, -41.484375, -40.20703125, -38.9296875, -37.65234375, -36.375, -35.09765625, -33.8203125, -32.54296875, -31.265625, -29.98828125, -28.7109375, -27.43359375, -26.15625, -24.87890625, -23.6015625, -22.32421875, -21.046875, -19.76953125, -18.4921875, -17.21484375, -15.9375, -14.66015625, -13.3828125, -12.10546875, -10.828125, -9.55078125, -8.2734375, -6.99609375, -5.71875, -4.44140625, -3.1640625, -1.88671875, -0.609375, 0.66796875, 1.9453125, 3.22265625, 4.5, 5.77734375, 7.0546875, 8.33203125, 9.609375, 10.88671875, 12.1640625, 13.44140625, 14.71875, 15.99609375, 17.2734375, 18.55078125, 19.828125, 21.10546875, 22.3828125, 23.66015625, 24.9375, 26.21484375, 27.4921875, 28.76953125, 30.046875, 31.32421875, 32.6015625, 33.87890625, 35.15625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 9.0, 6.0, 14.0, 19.0, 19.0, 23.0, 31.0, 38.0, 41.0, 60.0, 95.0, 147.0, 174.0, 269.0, 499.0, 1844.0, 43413.0, 3080469.0, 15937.0, 1321.0, 412.0, 248.0, 171.0, 115.0, 82.0, 46.0, 43.0, 34.0, 28.0, 27.0, 13.0, 13.0, 7.0, 7.0, 10.0, 7.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-89.625, -86.7705078125, -83.916015625, -81.0615234375, -78.20703125, -75.3525390625, -72.498046875, -69.6435546875, -66.7890625, -63.9345703125, -61.080078125, -58.2255859375, -55.37109375, -52.5166015625, -49.662109375, -46.8076171875, -43.953125, -41.0986328125, -38.244140625, -35.3896484375, -32.53515625, -29.6806640625, -26.826171875, -23.9716796875, -21.1171875, -18.2626953125, -15.408203125, -12.5537109375, -9.69921875, -6.8447265625, -3.990234375, -1.1357421875, 1.71875, 4.5732421875, 7.427734375, 10.2822265625, 13.13671875, 15.9912109375, 18.845703125, 21.7001953125, 24.5546875, 27.4091796875, 30.263671875, 33.1181640625, 35.97265625, 38.8271484375, 41.681640625, 44.5361328125, 47.390625, 50.2451171875, 53.099609375, 55.9541015625, 58.80859375, 61.6630859375, 64.517578125, 67.3720703125, 70.2265625, 73.0810546875, 75.935546875, 78.7900390625, 81.64453125, 84.4990234375, 87.353515625, 90.2080078125, 93.0625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 19.0, 108.0, 332.0, 367.0, 151.0, 26.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.08236694335938, -129.04515075683594, -125.00794219970703, -120.9707260131836, -116.93351745605469, -112.89630126953125, -108.85908508300781, -104.8218765258789, -100.78466796875, -96.74745178222656, -92.71024322509766, -88.67302703857422, -84.63581848144531, -80.59860229492188, -76.56138610839844, -72.52417755126953, -68.4869613647461, -64.44974517822266, -60.41253662109375, -56.37532043457031, -52.338111877441406, -48.30089569091797, -44.2636833190918, -40.226470947265625, -36.18925857543945, -32.15204620361328, -28.11483383178711, -24.077619552612305, -20.040407180786133, -16.00319480895996, -11.965980529785156, -7.928768157958984, -3.8915481567382812, 0.14566469192504883, 4.182877540588379, 8.220090866088867, 12.257303237915039, 16.29451560974121, 20.331729888916016, 24.368942260742188, 28.40615463256836, 32.44336700439453, 36.4805793762207, 40.517791748046875, 44.55500793457031, 48.59221649169922, 52.629432678222656, 56.66664505004883, 60.703857421875, 64.74107360839844, 68.77828216552734, 72.81549835205078, 76.85270690917969, 80.88992309570312, 84.92713928222656, 88.96434783935547, 93.00155639648438, 97.03877258300781, 101.07598114013672, 105.11319732666016, 109.15040588378906, 113.1876220703125, 117.22483825683594, 121.26204681396484, 125.29926300048828]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 4.0, 5.0, 11.0, 14.0, 6.0, 12.0, 18.0, 23.0, 25.0, 23.0, 22.0, 28.0, 44.0, 27.0, 33.0, 39.0, 44.0, 42.0, 33.0, 32.0, 32.0, 36.0, 43.0, 30.0, 35.0, 28.0, 39.0, 33.0, 39.0, 23.0, 21.0, 18.0, 22.0, 12.0, 14.0, 14.0, 14.0, 9.0, 6.0, 7.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-85.38558197021484, -82.61650848388672, -79.84744262695312, -77.078369140625, -74.30929565429688, -71.54022979736328, -68.77115631103516, -66.00209045410156, -63.23301696777344, -60.46394729614258, -57.69487762451172, -54.925804138183594, -52.156734466552734, -49.387664794921875, -46.61859130859375, -43.84952163696289, -41.08045196533203, -38.31138229370117, -35.54231262207031, -32.77323913574219, -30.004169464111328, -27.23509979248047, -24.466028213500977, -21.696956634521484, -18.927886962890625, -16.158817291259766, -13.389745712280273, -10.620675086975098, -7.851604461669922, -5.082533836364746, -2.3134632110595703, 0.4556083679199219, 3.2246856689453125, 5.993756294250488, 8.762826919555664, 11.53189754486084, 14.300968170166016, 17.070037841796875, 19.839109420776367, 22.60818099975586, 25.37725067138672, 28.146320343017578, 30.91539192199707, 33.68446350097656, 36.45353317260742, 39.22260284423828, 41.991676330566406, 44.760746002197266, 47.529815673828125, 50.298885345458984, 53.067955017089844, 55.83702850341797, 58.60609817504883, 61.37516784667969, 64.14424133300781, 66.91331481933594, 69.68238067626953, 72.45145416259766, 75.22052001953125, 77.98959350585938, 80.7586669921875, 83.5277328491211, 86.29680633544922, 89.06587219238281, 91.83494567871094]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 5.0, 4.0, 7.0, 7.0, 9.0, 7.0, 13.0, 14.0, 22.0, 21.0, 18.0, 27.0, 27.0, 34.0, 34.0, 36.0, 38.0, 41.0, 42.0, 44.0, 42.0, 45.0, 46.0, 36.0, 35.0, 36.0, 38.0, 44.0, 36.0, 26.0, 25.0, 22.0, 18.0, 23.0, 13.0, 9.0, 20.0, 12.0, 7.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3800048828125, -11.025634765625, -10.6712646484375, -10.31689453125, -9.9625244140625, -9.608154296875, -9.2537841796875, -8.8994140625, -8.5450439453125, -8.190673828125, -7.8363037109375, -7.48193359375, -7.1275634765625, -6.773193359375, -6.4188232421875, -6.064453125, -5.7100830078125, -5.355712890625, -5.0013427734375, -4.64697265625, -4.2926025390625, -3.938232421875, -3.5838623046875, -3.2294921875, -2.8751220703125, -2.520751953125, -2.1663818359375, -1.81201171875, -1.4576416015625, -1.103271484375, -0.7489013671875, -0.39453125, -0.0401611328125, 0.314208984375, 0.6685791015625, 1.02294921875, 1.3773193359375, 1.731689453125, 2.0860595703125, 2.4404296875, 2.7947998046875, 3.149169921875, 3.5035400390625, 3.85791015625, 4.2122802734375, 4.566650390625, 4.9210205078125, 5.275390625, 5.6297607421875, 5.984130859375, 6.3385009765625, 6.69287109375, 7.0472412109375, 7.401611328125, 7.7559814453125, 8.1103515625, 8.4647216796875, 8.819091796875, 9.1734619140625, 9.52783203125, 9.8822021484375, 10.236572265625, 10.5909423828125, 10.9453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 2.0, 5.0, 10.0, 6.0, 14.0, 15.0, 17.0, 9.0, 26.0, 30.0, 25.0, 49.0, 53.0, 57.0, 89.0, 103.0, 174.0, 385.0, 1779.0, 26958.0, 2401920.0, 1740852.0, 19218.0, 1443.0, 376.0, 160.0, 94.0, 66.0, 59.0, 41.0, 42.0, 38.0, 20.0, 21.0, 27.0, 24.0, 9.0, 4.0, 15.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-58.71875, -56.9892578125, -55.259765625, -53.5302734375, -51.80078125, -50.0712890625, -48.341796875, -46.6123046875, -44.8828125, -43.1533203125, -41.423828125, -39.6943359375, -37.96484375, -36.2353515625, -34.505859375, -32.7763671875, -31.046875, -29.3173828125, -27.587890625, -25.8583984375, -24.12890625, -22.3994140625, -20.669921875, -18.9404296875, -17.2109375, -15.4814453125, -13.751953125, -12.0224609375, -10.29296875, -8.5634765625, -6.833984375, -5.1044921875, -3.375, -1.6455078125, 0.083984375, 1.8134765625, 3.54296875, 5.2724609375, 7.001953125, 8.7314453125, 10.4609375, 12.1904296875, 13.919921875, 15.6494140625, 17.37890625, 19.1083984375, 20.837890625, 22.5673828125, 24.296875, 26.0263671875, 27.755859375, 29.4853515625, 31.21484375, 32.9443359375, 34.673828125, 36.4033203125, 38.1328125, 39.8623046875, 41.591796875, 43.3212890625, 45.05078125, 46.7802734375, 48.509765625, 50.2392578125, 51.96875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 9.0, 10.0, 19.0, 37.0, 36.0, 42.0, 82.0, 85.0, 151.0, 223.0, 286.0, 444.0, 529.0, 552.0, 436.0, 326.0, 236.0, 177.0, 105.0, 82.0, 75.0, 35.0, 25.0, 15.0, 15.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -32.15478515625, -31.1845703125, -30.21435546875, -29.244140625, -28.27392578125, -27.3037109375, -26.33349609375, -25.36328125, -24.39306640625, -23.4228515625, -22.45263671875, -21.482421875, -20.51220703125, -19.5419921875, -18.57177734375, -17.6015625, -16.63134765625, -15.6611328125, -14.69091796875, -13.720703125, -12.75048828125, -11.7802734375, -10.81005859375, -9.83984375, -8.86962890625, -7.8994140625, -6.92919921875, -5.958984375, -4.98876953125, -4.0185546875, -3.04833984375, -2.078125, -1.10791015625, -0.1376953125, 0.83251953125, 1.802734375, 2.77294921875, 3.7431640625, 4.71337890625, 5.68359375, 6.65380859375, 7.6240234375, 8.59423828125, 9.564453125, 10.53466796875, 11.5048828125, 12.47509765625, 13.4453125, 14.41552734375, 15.3857421875, 16.35595703125, 17.326171875, 18.29638671875, 19.2666015625, 20.23681640625, 21.20703125, 22.17724609375, 23.1474609375, 24.11767578125, 25.087890625, 26.05810546875, 27.0283203125, 27.99853515625, 28.96875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 6.0, 8.0, 9.0, 12.0, 12.0, 18.0, 20.0, 30.0, 40.0, 44.0, 46.0, 59.0, 115.0, 119.0, 160.0, 249.0, 404.0, 865.0, 3182.0, 77996.0, 3888551.0, 214867.0, 4991.0, 932.0, 464.0, 269.0, 212.0, 118.0, 97.0, 86.0, 74.0, 53.0, 39.0, 31.0, 17.0, 21.0, 16.0, 16.0, 8.0, 9.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-83.4375, -80.619140625, -77.80078125, -74.982421875, -72.1640625, -69.345703125, -66.52734375, -63.708984375, -60.890625, -58.072265625, -55.25390625, -52.435546875, -49.6171875, -46.798828125, -43.98046875, -41.162109375, -38.34375, -35.525390625, -32.70703125, -29.888671875, -27.0703125, -24.251953125, -21.43359375, -18.615234375, -15.796875, -12.978515625, -10.16015625, -7.341796875, -4.5234375, -1.705078125, 1.11328125, 3.931640625, 6.75, 9.568359375, 12.38671875, 15.205078125, 18.0234375, 20.841796875, 23.66015625, 26.478515625, 29.296875, 32.115234375, 34.93359375, 37.751953125, 40.5703125, 43.388671875, 46.20703125, 49.025390625, 51.84375, 54.662109375, 57.48046875, 60.298828125, 63.1171875, 65.935546875, 68.75390625, 71.572265625, 74.390625, 77.208984375, 80.02734375, 82.845703125, 85.6640625, 88.482421875, 91.30078125, 94.119140625, 96.9375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 19.0, 49.0, 79.0, 141.0, 183.0, 191.0, 146.0, 87.0, 68.0, 25.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.84791564941406, -71.0132064819336, -65.17849731445312, -59.343780517578125, -53.509071350097656, -47.67436218261719, -41.83964920043945, -36.00493621826172, -30.17022705078125, -24.33551597595215, -18.500804901123047, -12.666093826293945, -6.831382751464844, -0.9966716766357422, 4.838039398193359, 10.672752380371094, 16.507461547851562, 22.342172622680664, 28.176883697509766, 34.0115966796875, 39.84630584716797, 45.68101501464844, 51.51572799682617, 57.350440979003906, 63.185150146484375, 69.01985931396484, 74.85456848144531, 80.68928527832031, 86.52399444580078, 92.35870361328125, 98.19342041015625, 104.02812957763672, 109.86285400390625, 115.69756317138672, 121.53227233886719, 127.36698913574219, 133.20169067382812, 139.03640747070312, 144.87112426757812, 150.70584106445312, 156.54054260253906, 162.37525939941406, 168.2099609375, 174.044677734375, 179.87939453125, 185.71409606933594, 191.54881286621094, 197.38351440429688, 203.21823120117188, 209.05294799804688, 214.8876495361328, 220.7223663330078, 226.55706787109375, 232.39178466796875, 238.22650146484375, 244.06121826171875, 249.8959197998047, 255.7306365966797, 261.5653381347656, 267.4000549316406, 273.2347717285156, 279.0694885253906, 284.9041748046875, 290.7388916015625, 296.5736083984375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 1.0, 8.0, 4.0, 16.0, 10.0, 10.0, 24.0, 18.0, 18.0, 25.0, 31.0, 26.0, 29.0, 26.0, 44.0, 45.0, 29.0, 38.0, 38.0, 35.0, 35.0, 40.0, 44.0, 40.0, 35.0, 32.0, 34.0, 43.0, 31.0, 24.0, 20.0, 19.0, 21.0, 20.0, 14.0, 10.0, 14.0, 8.0, 8.0, 6.0, 7.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-91.09634399414062, -88.38265228271484, -85.6689682006836, -82.95527648925781, -80.24159240722656, -77.52790069580078, -74.814208984375, -72.10052490234375, -69.38683319091797, -66.67314147949219, -63.95945739746094, -61.245765686035156, -58.53207778930664, -55.818389892578125, -53.104698181152344, -50.39101028442383, -47.67732238769531, -44.9636344909668, -42.24994659423828, -39.5362548828125, -36.822566986083984, -34.10887908935547, -31.39518928527832, -28.681499481201172, -25.967811584472656, -23.25412368774414, -20.540433883666992, -17.826744079589844, -15.113056182861328, -12.399367332458496, -9.685678482055664, -6.971988677978516, -4.25830078125, -1.544611930847168, 1.169076919555664, 3.882765769958496, 6.596454620361328, 9.31014347076416, 12.023832321166992, 14.73752212524414, 17.451210021972656, 20.164897918701172, 22.87858772277832, 25.59227752685547, 28.305965423583984, 31.0196533203125, 33.73334503173828, 36.4470329284668, 39.16072082519531, 41.87440872192383, 44.588096618652344, 47.301788330078125, 50.01547622680664, 52.729164123535156, 55.44285583496094, 58.15654373168945, 60.87023162841797, 63.583919525146484, 66.297607421875, 69.01129913330078, 71.72499084472656, 74.43867492675781, 77.1523666381836, 79.86605834960938, 82.57974243164062]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 10.0, 11.0, 14.0, 13.0, 10.0, 12.0, 19.0, 18.0, 29.0, 30.0, 36.0, 33.0, 37.0, 45.0, 53.0, 42.0, 43.0, 39.0, 48.0, 40.0, 51.0, 39.0, 40.0, 37.0, 37.0, 36.0, 22.0, 24.0, 24.0, 15.0, 20.0, 13.0, 11.0, 15.0, 8.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.40625, -12.0289306640625, -11.651611328125, -11.2742919921875, -10.89697265625, -10.5196533203125, -10.142333984375, -9.7650146484375, -9.3876953125, -9.0103759765625, -8.633056640625, -8.2557373046875, -7.87841796875, -7.5010986328125, -7.123779296875, -6.7464599609375, -6.369140625, -5.9918212890625, -5.614501953125, -5.2371826171875, -4.85986328125, -4.4825439453125, -4.105224609375, -3.7279052734375, -3.3505859375, -2.9732666015625, -2.595947265625, -2.2186279296875, -1.84130859375, -1.4639892578125, -1.086669921875, -0.7093505859375, -0.33203125, 0.0452880859375, 0.422607421875, 0.7999267578125, 1.17724609375, 1.5545654296875, 1.931884765625, 2.3092041015625, 2.6865234375, 3.0638427734375, 3.441162109375, 3.8184814453125, 4.19580078125, 4.5731201171875, 4.950439453125, 5.3277587890625, 5.705078125, 6.0823974609375, 6.459716796875, 6.8370361328125, 7.21435546875, 7.5916748046875, 7.968994140625, 8.3463134765625, 8.7236328125, 9.1009521484375, 9.478271484375, 9.8555908203125, 10.23291015625, 10.6102294921875, 10.987548828125, 11.3648681640625, 11.7421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 16.0, 21.0, 27.0, 54.0, 71.0, 93.0, 135.0, 220.0, 300.0, 489.0, 779.0, 1073.0, 1655.0, 2362.0, 3494.0, 5196.0, 7752.0, 11590.0, 17188.0, 25858.0, 38429.0, 56418.0, 83575.0, 123385.0, 172497.0, 159196.0, 109571.0, 73311.0, 50281.0, 34192.0, 22614.0, 15492.0, 10227.0, 7042.0, 4585.0, 3076.0, 2028.0, 1380.0, 911.0, 641.0, 423.0, 283.0, 199.0, 122.0, 93.0, 77.0, 49.0, 28.0, 17.0, 13.0, 9.0, 7.0, 4.0, 2.0, 0.0, 2.0], "bins": [-1.1572265625, -1.1219940185546875, -1.086761474609375, -1.0515289306640625, -1.01629638671875, -0.9810638427734375, -0.945831298828125, -0.9105987548828125, -0.8753662109375, -0.8401336669921875, -0.804901123046875, -0.7696685791015625, -0.73443603515625, -0.6992034912109375, -0.663970947265625, -0.6287384033203125, -0.593505859375, -0.5582733154296875, -0.523040771484375, -0.4878082275390625, -0.45257568359375, -0.4173431396484375, -0.382110595703125, -0.3468780517578125, -0.3116455078125, -0.2764129638671875, -0.241180419921875, -0.2059478759765625, -0.17071533203125, -0.1354827880859375, -0.100250244140625, -0.0650177001953125, -0.02978515625, 0.0054473876953125, 0.040679931640625, 0.0759124755859375, 0.11114501953125, 0.1463775634765625, 0.181610107421875, 0.2168426513671875, 0.2520751953125, 0.2873077392578125, 0.322540283203125, 0.3577728271484375, 0.39300537109375, 0.4282379150390625, 0.463470458984375, 0.4987030029296875, 0.533935546875, 0.5691680908203125, 0.604400634765625, 0.6396331787109375, 0.67486572265625, 0.7100982666015625, 0.745330810546875, 0.7805633544921875, 0.8157958984375, 0.8510284423828125, 0.886260986328125, 0.9214935302734375, 0.95672607421875, 0.9919586181640625, 1.027191162109375, 1.0624237060546875, 1.09765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 10.0, 3.0, 6.0, 23.0, 11.0, 15.0, 17.0, 17.0, 25.0, 32.0, 28.0, 23.0, 37.0, 30.0, 44.0, 44.0, 47.0, 34.0, 1069.0, 38.0, 39.0, 39.0, 42.0, 34.0, 42.0, 23.0, 23.0, 35.0, 27.0, 33.0, 22.0, 20.0, 15.0, 13.0, 14.0, 6.0, 5.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.92578125, -6.7069091796875, -6.488037109375, -6.2691650390625, -6.05029296875, -5.8314208984375, -5.612548828125, -5.3936767578125, -5.1748046875, -4.9559326171875, -4.737060546875, -4.5181884765625, -4.29931640625, -4.0804443359375, -3.861572265625, -3.6427001953125, -3.423828125, -3.2049560546875, -2.986083984375, -2.7672119140625, -2.54833984375, -2.3294677734375, -2.110595703125, -1.8917236328125, -1.6728515625, -1.4539794921875, -1.235107421875, -1.0162353515625, -0.79736328125, -0.5784912109375, -0.359619140625, -0.1407470703125, 0.078125, 0.2969970703125, 0.515869140625, 0.7347412109375, 0.95361328125, 1.1724853515625, 1.391357421875, 1.6102294921875, 1.8291015625, 2.0479736328125, 2.266845703125, 2.4857177734375, 2.70458984375, 2.9234619140625, 3.142333984375, 3.3612060546875, 3.580078125, 3.7989501953125, 4.017822265625, 4.2366943359375, 4.45556640625, 4.6744384765625, 4.893310546875, 5.1121826171875, 5.3310546875, 5.5499267578125, 5.768798828125, 5.9876708984375, 6.20654296875, 6.4254150390625, 6.644287109375, 6.8631591796875, 7.08203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 10.0, 22.0, 35.0, 54.0, 83.0, 116.0, 179.0, 293.0, 424.0, 596.0, 967.0, 1446.0, 2224.0, 3340.0, 5193.0, 7817.0, 12277.0, 19065.0, 29730.0, 46332.0, 71979.0, 114149.0, 180754.0, 1244428.0, 128798.0, 81209.0, 51558.0, 33560.0, 21395.0, 13626.0, 8895.0, 5642.0, 3816.0, 2502.0, 1542.0, 1001.0, 730.0, 464.0, 297.0, 212.0, 115.0, 95.0, 57.0, 31.0, 25.0, 13.0, 10.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.2021484375, -1.165863037109375, -1.12957763671875, -1.093292236328125, -1.0570068359375, -1.020721435546875, -0.98443603515625, -0.948150634765625, -0.911865234375, -0.875579833984375, -0.83929443359375, -0.803009033203125, -0.7667236328125, -0.730438232421875, -0.69415283203125, -0.657867431640625, -0.62158203125, -0.585296630859375, -0.54901123046875, -0.512725830078125, -0.4764404296875, -0.440155029296875, -0.40386962890625, -0.367584228515625, -0.331298828125, -0.295013427734375, -0.25872802734375, -0.222442626953125, -0.1861572265625, -0.149871826171875, -0.11358642578125, -0.077301025390625, -0.041015625, -0.004730224609375, 0.03155517578125, 0.067840576171875, 0.1041259765625, 0.140411376953125, 0.17669677734375, 0.212982177734375, 0.249267578125, 0.285552978515625, 0.32183837890625, 0.358123779296875, 0.3944091796875, 0.430694580078125, 0.46697998046875, 0.503265380859375, 0.53955078125, 0.575836181640625, 0.61212158203125, 0.648406982421875, 0.6846923828125, 0.720977783203125, 0.75726318359375, 0.793548583984375, 0.829833984375, 0.866119384765625, 0.90240478515625, 0.938690185546875, 0.9749755859375, 1.011260986328125, 1.04754638671875, 1.083831787109375, 1.1201171875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 8.0, 7.0, 12.0, 10.0, 18.0, 19.0, 36.0, 42.0, 54.0, 70.0, 98.0, 106.0, 92.0, 102.0, 75.0, 71.0, 51.0, 19.0, 19.0, 22.0, 17.0, 14.0, 5.0, 9.0, 7.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003173828125, -0.0030379891395568848, -0.0029021501541137695, -0.0027663111686706543, -0.002630472183227539, -0.002494633197784424, -0.0023587942123413086, -0.0022229552268981934, -0.002087116241455078, -0.0019512772560119629, -0.0018154382705688477, -0.0016795992851257324, -0.0015437602996826172, -0.001407921314239502, -0.0012720823287963867, -0.0011362433433532715, -0.0010004043579101562, -0.000864565372467041, -0.0007287263870239258, -0.0005928874015808105, -0.0004570484161376953, -0.0003212094306945801, -0.00018537044525146484, -4.953145980834961e-05, 8.630752563476562e-05, 0.00022214651107788086, 0.0003579854965209961, 0.0004938244819641113, 0.0006296634674072266, 0.0007655024528503418, 0.000901341438293457, 0.0010371804237365723, 0.0011730194091796875, 0.0013088583946228027, 0.001444697380065918, 0.0015805363655090332, 0.0017163753509521484, 0.0018522143363952637, 0.001988053321838379, 0.002123892307281494, 0.0022597312927246094, 0.0023955702781677246, 0.00253140926361084, 0.002667248249053955, 0.0028030872344970703, 0.0029389262199401855, 0.0030747652053833008, 0.003210604190826416, 0.0033464431762695312, 0.0034822821617126465, 0.0036181211471557617, 0.003753960132598877, 0.003889799118041992, 0.004025638103485107, 0.004161477088928223, 0.004297316074371338, 0.004433155059814453, 0.004568994045257568, 0.004704833030700684, 0.004840672016143799, 0.004976511001586914, 0.005112349987030029, 0.0052481889724731445, 0.00538402795791626, 0.005519866943359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 15.0, 11.0, 13.0, 26.0, 25.0, 41.0, 81.0, 168.0, 438.0, 2024.0, 1042066.0, 2700.0, 483.0, 168.0, 90.0, 57.0, 29.0, 21.0, 18.0, 17.0, 10.0, 7.0, 5.0, 6.0, 8.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12279033660888672, -0.11960411071777344, -0.11641788482666016, -0.11323165893554688, -0.1100454330444336, -0.10685920715332031, -0.10367298126220703, -0.10048675537109375, -0.09730052947998047, -0.09411430358886719, -0.0909280776977539, -0.08774185180664062, -0.08455562591552734, -0.08136940002441406, -0.07818317413330078, -0.0749969482421875, -0.07181072235107422, -0.06862449645996094, -0.06543827056884766, -0.062252044677734375, -0.059065818786621094, -0.05587959289550781, -0.05269336700439453, -0.04950714111328125, -0.04632091522216797, -0.04313468933105469, -0.039948463439941406, -0.036762237548828125, -0.033576011657714844, -0.030389785766601562, -0.02720355987548828, -0.024017333984375, -0.02083110809326172, -0.017644882202148438, -0.014458656311035156, -0.011272430419921875, -0.008086204528808594, -0.0048999786376953125, -0.0017137527465820312, 0.00147247314453125, 0.004658699035644531, 0.007844924926757812, 0.011031150817871094, 0.014217376708984375, 0.017403602600097656, 0.020589828491210938, 0.02377605438232422, 0.0269622802734375, 0.03014850616455078, 0.03333473205566406, 0.036520957946777344, 0.039707183837890625, 0.042893409729003906, 0.04607963562011719, 0.04926586151123047, 0.05245208740234375, 0.05563831329345703, 0.05882453918457031, 0.062010765075683594, 0.06519699096679688, 0.06838321685791016, 0.07156944274902344, 0.07475566864013672, 0.07794189453125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 17.0, 138.0, 520.0, 294.0, 42.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011775626335293055, -0.0009695462067611516, -0.0007615297799929976, -0.0005535132950171828, -0.0003454968682490289, -0.00013748044148087502, 7.05360434949398e-05, 0.0002785524120554328, 0.0004865688970312476, 0.0006945853237994015, 0.0009026017505675554, 0.0011106182355433702, 0.001318634720519185, 0.001526651089079678, 0.0017346675740554929, 0.0019426839426159859, 0.0021507004275918007, 0.0023587169125676155, 0.0025667333975434303, 0.002774749882519245, 0.0029827661346644163, 0.003190782619640231, 0.003398799104616046, 0.003606815356761217, 0.003814831841737032, 0.004022848326712847, 0.004230864811688662, 0.004438881296664476, 0.004646897781640291, 0.004854913800954819, 0.0050629302859306335, 0.005270946770906448, 0.0054789637215435505, 0.005686980206519365, 0.00589499669149518, 0.006103013176470995, 0.00631102966144681, 0.006519045680761337, 0.006727062165737152, 0.006935078650712967, 0.007143095135688782, 0.0073511116206645966, 0.007559128105640411, 0.007767144590616226, 0.007975161075592041, 0.008183177560567856, 0.00839119404554367, 0.008599210530519485, 0.0088072270154953, 0.009015243500471115, 0.00922325998544693, 0.009431276470422745, 0.00963929295539856, 0.009847309440374374, 0.01005532592535019, 0.010263342410326004, 0.010471357963979244, 0.010679374448955059, 0.010887390933930874, 0.011095407418906689, 0.011303423903882504, 0.011511440388858318, 0.011719456873834133, 0.011927473358809948, 0.012135489843785763]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 3.0, 9.0, 10.0, 5.0, 11.0, 10.0, 17.0, 19.0, 14.0, 18.0, 21.0, 27.0, 34.0, 40.0, 34.0, 41.0, 45.0, 27.0, 27.0, 54.0, 39.0, 52.0, 40.0, 41.0, 48.0, 33.0, 37.0, 29.0, 34.0, 23.0, 25.0, 27.0, 19.0, 13.0, 14.0, 8.0, 15.0, 10.0, 7.0, 1.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.001589357852935791, -0.001538855955004692, -0.0014883540570735931, -0.0014378521591424942, -0.0013873502612113953, -0.0013368483632802963, -0.0012863464653491974, -0.0012358445674180984, -0.0011853426694869995, -0.0011348407715559006, -0.0010843388736248016, -0.0010338369756937027, -0.0009833350777626038, -0.0009328331798315048, -0.0008823312819004059, -0.000831829383969307, -0.000781327486038208, -0.0007308255881071091, -0.0006803236901760101, -0.0006298217922449112, -0.0005793198943138123, -0.0005288179963827133, -0.0004783160984516144, -0.00042781420052051544, -0.0003773123025894165, -0.00032681040465831757, -0.00027630850672721863, -0.0002258066087961197, -0.00017530471086502075, -0.00012480281293392181, -7.430091500282288e-05, -2.3799017071723938e-05, 2.6702880859375e-05, 7.720477879047394e-05, 0.00012770667672157288, 0.00017820857465267181, 0.00022871047258377075, 0.0002792123705148697, 0.00032971426844596863, 0.00038021616637706757, 0.0004307180643081665, 0.00048121996223926544, 0.0005317218601703644, 0.0005822237581014633, 0.0006327256560325623, 0.0006832275539636612, 0.0007337294518947601, 0.0007842313498258591, 0.000834733247756958, 0.000885235145688057, 0.0009357370436191559, 0.0009862389415502548, 0.0010367408394813538, 0.0010872427374124527, 0.0011377446353435516, 0.0011882465332746506, 0.0012387484312057495, 0.0012892503291368484, 0.0013397522270679474, 0.0013902541249990463, 0.0014407560229301453, 0.0014912579208612442, 0.0015417598187923431, 0.001592261716723442, 0.001642763614654541]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 10.0, 11.0, 14.0, 13.0, 10.0, 12.0, 19.0, 18.0, 29.0, 30.0, 36.0, 33.0, 37.0, 45.0, 53.0, 42.0, 43.0, 39.0, 48.0, 40.0, 51.0, 39.0, 40.0, 37.0, 37.0, 36.0, 22.0, 24.0, 24.0, 15.0, 20.0, 13.0, 11.0, 15.0, 8.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.40625, -12.0289306640625, -11.651611328125, -11.2742919921875, -10.89697265625, -10.5196533203125, -10.142333984375, -9.7650146484375, -9.3876953125, -9.0103759765625, -8.633056640625, -8.2557373046875, -7.87841796875, -7.5010986328125, -7.123779296875, -6.7464599609375, -6.369140625, -5.9918212890625, -5.614501953125, -5.2371826171875, -4.85986328125, -4.4825439453125, -4.105224609375, -3.7279052734375, -3.3505859375, -2.9732666015625, -2.595947265625, -2.2186279296875, -1.84130859375, -1.4639892578125, -1.086669921875, -0.7093505859375, -0.33203125, 0.0452880859375, 0.422607421875, 0.7999267578125, 1.17724609375, 1.5545654296875, 1.931884765625, 2.3092041015625, 2.6865234375, 3.0638427734375, 3.441162109375, 3.8184814453125, 4.19580078125, 4.5731201171875, 4.950439453125, 5.3277587890625, 5.705078125, 6.0823974609375, 6.459716796875, 6.8370361328125, 7.21435546875, 7.5916748046875, 7.968994140625, 8.3463134765625, 8.7236328125, 9.1009521484375, 9.478271484375, 9.8555908203125, 10.23291015625, 10.6102294921875, 10.987548828125, 11.3648681640625, 11.7421875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 2.0, 7.0, 10.0, 11.0, 15.0, 33.0, 47.0, 67.0, 102.0, 160.0, 240.0, 349.0, 546.0, 768.0, 1217.0, 1848.0, 2863.0, 4464.0, 7312.0, 12092.0, 21638.0, 42392.0, 95768.0, 258673.0, 353672.0, 127246.0, 53429.0, 26165.0, 14362.0, 8379.0, 5241.0, 3185.0, 2155.0, 1398.0, 886.0, 634.0, 409.0, 259.0, 174.0, 110.0, 89.0, 45.0, 37.0, 20.0, 15.0, 9.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.30120849609375, -5.0985107421875, -4.89581298828125, -4.693115234375, -4.49041748046875, -4.2877197265625, -4.08502197265625, -3.88232421875, -3.67962646484375, -3.4769287109375, -3.27423095703125, -3.071533203125, -2.86883544921875, -2.6661376953125, -2.46343994140625, -2.2607421875, -2.05804443359375, -1.8553466796875, -1.65264892578125, -1.449951171875, -1.24725341796875, -1.0445556640625, -0.84185791015625, -0.63916015625, -0.43646240234375, -0.2337646484375, -0.03106689453125, 0.171630859375, 0.37432861328125, 0.5770263671875, 0.77972412109375, 0.982421875, 1.18511962890625, 1.3878173828125, 1.59051513671875, 1.793212890625, 1.99591064453125, 2.1986083984375, 2.40130615234375, 2.60400390625, 2.80670166015625, 3.0093994140625, 3.21209716796875, 3.414794921875, 3.61749267578125, 3.8201904296875, 4.02288818359375, 4.2255859375, 4.42828369140625, 4.6309814453125, 4.83367919921875, 5.036376953125, 5.23907470703125, 5.4417724609375, 5.64447021484375, 5.84716796875, 6.04986572265625, 6.2525634765625, 6.45526123046875, 6.657958984375, 6.86065673828125, 7.0633544921875, 7.26605224609375, 7.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 4.0, 10.0, 8.0, 14.0, 8.0, 16.0, 18.0, 19.0, 23.0, 26.0, 39.0, 38.0, 47.0, 43.0, 43.0, 52.0, 105.0, 323.0, 1615.0, 124.0, 65.0, 45.0, 46.0, 49.0, 34.0, 40.0, 29.0, 25.0, 20.0, 32.0, 15.0, 16.0, 7.0, 9.0, 7.0, 7.0, 6.0, 2.0, 10.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.3359375, -34.890625, -33.4453125, -32.0, -30.5546875, -29.109375, -27.6640625, -26.21875, -24.7734375, -23.328125, -21.8828125, -20.4375, -18.9921875, -17.546875, -16.1015625, -14.65625, -13.2109375, -11.765625, -10.3203125, -8.875, -7.4296875, -5.984375, -4.5390625, -3.09375, -1.6484375, -0.203125, 1.2421875, 2.6875, 4.1328125, 5.578125, 7.0234375, 8.46875, 9.9140625, 11.359375, 12.8046875, 14.25, 15.6953125, 17.140625, 18.5859375, 20.03125, 21.4765625, 22.921875, 24.3671875, 25.8125, 27.2578125, 28.703125, 30.1484375, 31.59375, 33.0390625, 34.484375, 35.9296875, 37.375, 38.8203125, 40.265625, 41.7109375, 43.15625, 44.6015625, 46.046875, 47.4921875, 48.9375, 50.3828125, 51.828125, 53.2734375, 54.71875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 14.0, 18.0, 14.0, 30.0, 40.0, 62.0, 81.0, 113.0, 177.0, 339.0, 644.0, 4747.0, 3108542.0, 28899.0, 920.0, 400.0, 227.0, 143.0, 75.0, 62.0, 35.0, 29.0, 22.0, 16.0, 13.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-136.625, -132.443359375, -128.26171875, -124.080078125, -119.8984375, -115.716796875, -111.53515625, -107.353515625, -103.171875, -98.990234375, -94.80859375, -90.626953125, -86.4453125, -82.263671875, -78.08203125, -73.900390625, -69.71875, -65.537109375, -61.35546875, -57.173828125, -52.9921875, -48.810546875, -44.62890625, -40.447265625, -36.265625, -32.083984375, -27.90234375, -23.720703125, -19.5390625, -15.357421875, -11.17578125, -6.994140625, -2.8125, 1.369140625, 5.55078125, 9.732421875, 13.9140625, 18.095703125, 22.27734375, 26.458984375, 30.640625, 34.822265625, 39.00390625, 43.185546875, 47.3671875, 51.548828125, 55.73046875, 59.912109375, 64.09375, 68.275390625, 72.45703125, 76.638671875, 80.8203125, 85.001953125, 89.18359375, 93.365234375, 97.546875, 101.728515625, 105.91015625, 110.091796875, 114.2734375, 118.455078125, 122.63671875, 126.818359375, 131.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 19.0, 46.0, 63.0, 94.0, 134.0, 165.0, 155.0, 127.0, 105.0, 45.0, 21.0, 14.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.19178009033203, -45.420387268066406, -43.64899444580078, -41.87759780883789, -40.106204986572266, -38.33481216430664, -36.56341552734375, -34.792022705078125, -33.0206298828125, -31.249237060546875, -29.477842330932617, -27.70644760131836, -25.935054779052734, -24.16366195678711, -22.39226722717285, -20.620872497558594, -18.84947967529297, -17.078086853027344, -15.306692123413086, -13.535298347473145, -11.763904571533203, -9.992510795593262, -8.22111701965332, -6.449723243713379, -4.6783294677734375, -2.906935691833496, -1.1355419158935547, 0.6358518600463867, 2.407245635986328, 4.1786394119262695, 5.950033187866211, 7.721426963806152, 9.492820739746094, 11.264214515686035, 13.035608291625977, 14.807002067565918, 16.57839584350586, 18.349788665771484, 20.121183395385742, 21.892578125, 23.663970947265625, 25.43536376953125, 27.206758499145508, 28.978153228759766, 30.74954605102539, 32.520938873291016, 34.292335510253906, 36.06372833251953, 37.835121154785156, 39.60651397705078, 41.377906799316406, 43.1493034362793, 44.92069625854492, 46.69208908081055, 48.46348571777344, 50.23487854003906, 52.00627136230469, 53.77766418457031, 55.54905700683594, 57.32045364379883, 59.09184646606445, 60.86323928833008, 62.63463592529297, 64.4060287475586, 66.17742156982422]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 11.0, 10.0, 11.0, 11.0, 17.0, 14.0, 20.0, 31.0, 34.0, 27.0, 32.0, 35.0, 35.0, 35.0, 32.0, 40.0, 38.0, 43.0, 44.0, 36.0, 47.0, 32.0, 49.0, 41.0, 24.0, 34.0, 26.0, 27.0, 22.0, 19.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 4.0, 8.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-121.63163757324219, -117.97769927978516, -114.32376098632812, -110.66981506347656, -107.01587677001953, -103.3619384765625, -99.70800018310547, -96.05406188964844, -92.40011596679688, -88.74617767333984, -85.09223937988281, -81.43829345703125, -77.78435516357422, -74.13041687011719, -70.47647857666016, -66.82254028320312, -63.16859817504883, -59.5146598815918, -55.8607177734375, -52.20677947998047, -48.55283737182617, -44.89889907836914, -41.244956970214844, -37.59101867675781, -33.93708038330078, -30.283140182495117, -26.629199981689453, -22.975261688232422, -19.321319580078125, -15.667381286621094, -12.01344108581543, -8.359500885009766, -4.705558776855469, -1.0516188144683838, 2.602321147918701, 6.256260871887207, 9.910201072692871, 13.564140319824219, 17.218080520629883, 20.872020721435547, 24.52596092224121, 28.179901123046875, 31.83384132385254, 35.4877815246582, 39.141719818115234, 42.79566192626953, 46.44960021972656, 50.103538513183594, 53.75748062133789, 57.41141891479492, 61.06536102294922, 64.71929931640625, 68.37323760986328, 72.02717590332031, 75.68112182617188, 79.3350601196289, 82.98899841308594, 86.64293670654297, 90.296875, 93.95082092285156, 97.6047592163086, 101.25869750976562, 104.91263580322266, 108.56657409667969, 112.22052001953125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 10.0, 10.0, 17.0, 14.0, 9.0, 19.0, 23.0, 28.0, 31.0, 35.0, 38.0, 31.0, 33.0, 37.0, 48.0, 48.0, 45.0, 43.0, 42.0, 42.0, 38.0, 45.0, 35.0, 36.0, 39.0, 23.0, 25.0, 18.0, 20.0, 15.0, 18.0, 21.0, 14.0, 5.0, 11.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.328125, -11.9447021484375, -11.561279296875, -11.1778564453125, -10.79443359375, -10.4110107421875, -10.027587890625, -9.6441650390625, -9.2607421875, -8.8773193359375, -8.493896484375, -8.1104736328125, -7.72705078125, -7.3436279296875, -6.960205078125, -6.5767822265625, -6.193359375, -5.8099365234375, -5.426513671875, -5.0430908203125, -4.65966796875, -4.2762451171875, -3.892822265625, -3.5093994140625, -3.1259765625, -2.7425537109375, -2.359130859375, -1.9757080078125, -1.59228515625, -1.2088623046875, -0.825439453125, -0.4420166015625, -0.05859375, 0.3248291015625, 0.708251953125, 1.0916748046875, 1.47509765625, 1.8585205078125, 2.241943359375, 2.6253662109375, 3.0087890625, 3.3922119140625, 3.775634765625, 4.1590576171875, 4.54248046875, 4.9259033203125, 5.309326171875, 5.6927490234375, 6.076171875, 6.4595947265625, 6.843017578125, 7.2264404296875, 7.60986328125, 7.9932861328125, 8.376708984375, 8.7601318359375, 9.1435546875, 9.5269775390625, 9.910400390625, 10.2938232421875, 10.67724609375, 11.0606689453125, 11.444091796875, 11.8275146484375, 12.2109375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 7.0, 17.0, 26.0, 18.0, 22.0, 25.0, 30.0, 42.0, 57.0, 74.0, 124.0, 172.0, 241.0, 474.0, 838.0, 1964.0, 5176.0, 17032.0, 75139.0, 459146.0, 1718141.0, 1495289.0, 340831.0, 57638.0, 13743.0, 4455.0, 1599.0, 741.0, 379.0, 213.0, 142.0, 110.0, 87.0, 56.0, 56.0, 41.0, 28.0, 18.0, 20.0, 7.0, 14.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.478271484375, -16.89404296875, -16.309814453125, -15.7255859375, -15.141357421875, -14.55712890625, -13.972900390625, -13.388671875, -12.804443359375, -12.22021484375, -11.635986328125, -11.0517578125, -10.467529296875, -9.88330078125, -9.299072265625, -8.71484375, -8.130615234375, -7.54638671875, -6.962158203125, -6.3779296875, -5.793701171875, -5.20947265625, -4.625244140625, -4.041015625, -3.456787109375, -2.87255859375, -2.288330078125, -1.7041015625, -1.119873046875, -0.53564453125, 0.048583984375, 0.6328125, 1.217041015625, 1.80126953125, 2.385498046875, 2.9697265625, 3.553955078125, 4.13818359375, 4.722412109375, 5.306640625, 5.890869140625, 6.47509765625, 7.059326171875, 7.6435546875, 8.227783203125, 8.81201171875, 9.396240234375, 9.98046875, 10.564697265625, 11.14892578125, 11.733154296875, 12.3173828125, 12.901611328125, 13.48583984375, 14.070068359375, 14.654296875, 15.238525390625, 15.82275390625, 16.406982421875, 16.9912109375, 17.575439453125, 18.15966796875, 18.743896484375, 19.328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 18.0, 19.0, 32.0, 55.0, 127.0, 192.0, 311.0, 604.0, 811.0, 796.0, 492.0, 283.0, 161.0, 75.0, 57.0, 27.0, 14.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.21875, -46.6552734375, -45.091796875, -43.5283203125, -41.96484375, -40.4013671875, -38.837890625, -37.2744140625, -35.7109375, -34.1474609375, -32.583984375, -31.0205078125, -29.45703125, -27.8935546875, -26.330078125, -24.7666015625, -23.203125, -21.6396484375, -20.076171875, -18.5126953125, -16.94921875, -15.3857421875, -13.822265625, -12.2587890625, -10.6953125, -9.1318359375, -7.568359375, -6.0048828125, -4.44140625, -2.8779296875, -1.314453125, 0.2490234375, 1.8125, 3.3759765625, 4.939453125, 6.5029296875, 8.06640625, 9.6298828125, 11.193359375, 12.7568359375, 14.3203125, 15.8837890625, 17.447265625, 19.0107421875, 20.57421875, 22.1376953125, 23.701171875, 25.2646484375, 26.828125, 28.3916015625, 29.955078125, 31.5185546875, 33.08203125, 34.6455078125, 36.208984375, 37.7724609375, 39.3359375, 40.8994140625, 42.462890625, 44.0263671875, 45.58984375, 47.1533203125, 48.716796875, 50.2802734375, 51.84375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 12.0, 6.0, 10.0, 19.0, 24.0, 31.0, 37.0, 47.0, 82.0, 129.0, 178.0, 348.0, 668.0, 2993.0, 509907.0, 3666063.0, 11549.0, 994.0, 419.0, 235.0, 147.0, 124.0, 68.0, 59.0, 26.0, 25.0, 20.0, 24.0, 9.0, 11.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-114.75, -111.1845703125, -107.619140625, -104.0537109375, -100.48828125, -96.9228515625, -93.357421875, -89.7919921875, -86.2265625, -82.6611328125, -79.095703125, -75.5302734375, -71.96484375, -68.3994140625, -64.833984375, -61.2685546875, -57.703125, -54.1376953125, -50.572265625, -47.0068359375, -43.44140625, -39.8759765625, -36.310546875, -32.7451171875, -29.1796875, -25.6142578125, -22.048828125, -18.4833984375, -14.91796875, -11.3525390625, -7.787109375, -4.2216796875, -0.65625, 2.9091796875, 6.474609375, 10.0400390625, 13.60546875, 17.1708984375, 20.736328125, 24.3017578125, 27.8671875, 31.4326171875, 34.998046875, 38.5634765625, 42.12890625, 45.6943359375, 49.259765625, 52.8251953125, 56.390625, 59.9560546875, 63.521484375, 67.0869140625, 70.65234375, 74.2177734375, 77.783203125, 81.3486328125, 84.9140625, 88.4794921875, 92.044921875, 95.6103515625, 99.17578125, 102.7412109375, 106.306640625, 109.8720703125, 113.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 13.0, 41.0, 65.0, 87.0, 152.0, 177.0, 186.0, 130.0, 77.0, 46.0, 14.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.42098999023438, -128.0428924560547, -122.66481018066406, -117.28671264648438, -111.90862274169922, -106.53053283691406, -101.15243530273438, -95.77434539794922, -90.39625549316406, -85.0181655883789, -79.64007568359375, -74.26197814941406, -68.8838882446289, -63.50579833984375, -58.12770462036133, -52.749610900878906, -47.37152099609375, -41.993431091308594, -36.61533737182617, -31.237245559692383, -25.859153747558594, -20.481061935424805, -15.102970123291016, -9.724876403808594, -4.3467864990234375, 1.0313053131103516, 6.409397125244141, 11.78748893737793, 17.16558074951172, 22.543672561645508, 27.921764373779297, 33.29985809326172, 38.677947998046875, 44.05603790283203, 49.43413162231445, 54.812225341796875, 60.19031524658203, 65.56840515136719, 70.94650268554688, 76.32459259033203, 81.70268249511719, 87.08077239990234, 92.4588623046875, 97.83695983886719, 103.21504974365234, 108.5931396484375, 113.97123718261719, 119.34932708740234, 124.7274169921875, 130.1055145263672, 135.4835968017578, 140.8616943359375, 146.23977661132812, 151.6178741455078, 156.9959716796875, 162.37405395507812, 167.7521514892578, 173.1302490234375, 178.50833129882812, 183.8864288330078, 189.2645263671875, 194.64260864257812, 200.0207061767578, 205.3988037109375, 210.77688598632812]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 5.0, 14.0, 9.0, 14.0, 19.0, 11.0, 15.0, 26.0, 20.0, 34.0, 28.0, 33.0, 43.0, 30.0, 30.0, 35.0, 31.0, 30.0, 47.0, 25.0, 34.0, 42.0, 39.0, 31.0, 42.0, 38.0, 38.0, 33.0, 25.0, 25.0, 19.0, 23.0, 24.0, 12.0, 12.0, 12.0, 7.0, 7.0, 5.0, 7.0, 4.0, 3.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-87.049072265625, -84.43451690673828, -81.81996154785156, -79.20540618896484, -76.59085083007812, -73.9762954711914, -71.36174011230469, -68.74717712402344, -66.13262939453125, -63.51807403564453, -60.90351867675781, -58.288963317871094, -55.674407958984375, -53.059852600097656, -50.44529342651367, -47.83073806762695, -45.21617889404297, -42.60162353515625, -39.98706817626953, -37.37251281738281, -34.757957458496094, -32.143402099609375, -29.52884292602539, -26.914287567138672, -24.299732208251953, -21.685176849365234, -19.070621490478516, -16.456064224243164, -13.841508865356445, -11.226953506469727, -8.612397193908691, -5.997840881347656, -3.3832855224609375, -0.7687296867370605, 1.8458261489868164, 4.460381984710693, 7.07493782043457, 9.689493179321289, 12.304049491882324, 14.91860580444336, 17.533161163330078, 20.147716522216797, 22.762271881103516, 25.376829147338867, 27.991384506225586, 30.605939865112305, 33.220497131347656, 35.835052490234375, 38.449607849121094, 41.06416320800781, 43.67871856689453, 46.29327392578125, 48.90782928466797, 51.52238464355469, 54.13694381713867, 56.75149917602539, 59.36605453491211, 61.98060989379883, 64.59516906738281, 67.20972442626953, 69.82427978515625, 72.43883514404297, 75.05339050292969, 77.6679458618164, 80.28250122070312]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 14.0, 12.0, 10.0, 15.0, 20.0, 26.0, 17.0, 31.0, 37.0, 28.0, 39.0, 39.0, 30.0, 42.0, 33.0, 33.0, 51.0, 52.0, 45.0, 57.0, 27.0, 41.0, 36.0, 33.0, 23.0, 21.0, 26.0, 24.0, 23.0, 13.0, 12.0, 12.0, 12.0, 12.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.578125, -11.2012939453125, -10.824462890625, -10.4476318359375, -10.07080078125, -9.6939697265625, -9.317138671875, -8.9403076171875, -8.5634765625, -8.1866455078125, -7.809814453125, -7.4329833984375, -7.05615234375, -6.6793212890625, -6.302490234375, -5.9256591796875, -5.548828125, -5.1719970703125, -4.795166015625, -4.4183349609375, -4.04150390625, -3.6646728515625, -3.287841796875, -2.9110107421875, -2.5341796875, -2.1573486328125, -1.780517578125, -1.4036865234375, -1.02685546875, -0.6500244140625, -0.273193359375, 0.1036376953125, 0.48046875, 0.8572998046875, 1.234130859375, 1.6109619140625, 1.98779296875, 2.3646240234375, 2.741455078125, 3.1182861328125, 3.4951171875, 3.8719482421875, 4.248779296875, 4.6256103515625, 5.00244140625, 5.3792724609375, 5.756103515625, 6.1329345703125, 6.509765625, 6.8865966796875, 7.263427734375, 7.6402587890625, 8.01708984375, 8.3939208984375, 8.770751953125, 9.1475830078125, 9.5244140625, 9.9012451171875, 10.278076171875, 10.6549072265625, 11.03173828125, 11.4085693359375, 11.785400390625, 12.1622314453125, 12.5390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 0.0, 10.0, 11.0, 19.0, 30.0, 33.0, 67.0, 90.0, 124.0, 218.0, 297.0, 407.0, 658.0, 936.0, 1386.0, 2084.0, 3008.0, 4596.0, 6560.0, 10045.0, 14944.0, 22406.0, 33577.0, 50603.0, 74544.0, 108419.0, 159325.0, 176213.0, 121529.0, 83699.0, 57415.0, 38308.0, 25434.0, 17227.0, 11369.0, 7503.0, 4881.0, 3413.0, 2310.0, 1589.0, 1064.0, 733.0, 481.0, 341.0, 200.0, 161.0, 112.0, 55.0, 38.0, 35.0, 22.0, 16.0, 6.0, 7.0, 5.0, 2.0, 1.0], "bins": [-1.23046875, -1.1944427490234375, -1.158416748046875, -1.1223907470703125, -1.08636474609375, -1.0503387451171875, -1.014312744140625, -0.9782867431640625, -0.9422607421875, -0.9062347412109375, -0.870208740234375, -0.8341827392578125, -0.79815673828125, -0.7621307373046875, -0.726104736328125, -0.6900787353515625, -0.654052734375, -0.6180267333984375, -0.582000732421875, -0.5459747314453125, -0.50994873046875, -0.4739227294921875, -0.437896728515625, -0.4018707275390625, -0.3658447265625, -0.3298187255859375, -0.293792724609375, -0.2577667236328125, -0.22174072265625, -0.1857147216796875, -0.149688720703125, -0.1136627197265625, -0.07763671875, -0.0416107177734375, -0.005584716796875, 0.0304412841796875, 0.06646728515625, 0.1024932861328125, 0.138519287109375, 0.1745452880859375, 0.2105712890625, 0.2465972900390625, 0.282623291015625, 0.3186492919921875, 0.35467529296875, 0.3907012939453125, 0.426727294921875, 0.4627532958984375, 0.498779296875, 0.5348052978515625, 0.570831298828125, 0.6068572998046875, 0.64288330078125, 0.6789093017578125, 0.714935302734375, 0.7509613037109375, 0.7869873046875, 0.8230133056640625, 0.859039306640625, 0.8950653076171875, 0.93109130859375, 0.9671173095703125, 1.003143310546875, 1.0391693115234375, 1.0751953125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 7.0, 10.0, 5.0, 10.0, 13.0, 10.0, 21.0, 16.0, 30.0, 22.0, 22.0, 39.0, 29.0, 37.0, 42.0, 48.0, 46.0, 46.0, 30.0, 1064.0, 37.0, 38.0, 48.0, 38.0, 34.0, 38.0, 24.0, 24.0, 31.0, 29.0, 15.0, 13.0, 22.0, 18.0, 16.0, 12.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 0.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -6.9814453125, -6.736328125, -6.4912109375, -6.24609375, -6.0009765625, -5.755859375, -5.5107421875, -5.265625, -5.0205078125, -4.775390625, -4.5302734375, -4.28515625, -4.0400390625, -3.794921875, -3.5498046875, -3.3046875, -3.0595703125, -2.814453125, -2.5693359375, -2.32421875, -2.0791015625, -1.833984375, -1.5888671875, -1.34375, -1.0986328125, -0.853515625, -0.6083984375, -0.36328125, -0.1181640625, 0.126953125, 0.3720703125, 0.6171875, 0.8623046875, 1.107421875, 1.3525390625, 1.59765625, 1.8427734375, 2.087890625, 2.3330078125, 2.578125, 2.8232421875, 3.068359375, 3.3134765625, 3.55859375, 3.8037109375, 4.048828125, 4.2939453125, 4.5390625, 4.7841796875, 5.029296875, 5.2744140625, 5.51953125, 5.7646484375, 6.009765625, 6.2548828125, 6.5, 6.7451171875, 6.990234375, 7.2353515625, 7.48046875, 7.7255859375, 7.970703125, 8.2158203125, 8.4609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 13.0, 26.0, 27.0, 33.0, 67.0, 99.0, 151.0, 220.0, 333.0, 475.0, 787.0, 1135.0, 1795.0, 2762.0, 4161.0, 6584.0, 10478.0, 16319.0, 26066.0, 40940.0, 65247.0, 104939.0, 167810.0, 1253693.0, 147139.0, 90923.0, 56745.0, 35675.0, 22475.0, 14433.0, 9236.0, 5786.0, 3673.0, 2340.0, 1505.0, 1032.0, 716.0, 446.0, 269.0, 170.0, 133.0, 101.0, 58.0, 39.0, 24.0, 15.0, 13.0, 7.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3642578125, -1.3233489990234375, -1.282440185546875, -1.2415313720703125, -1.20062255859375, -1.1597137451171875, -1.118804931640625, -1.0778961181640625, -1.0369873046875, -0.9960784912109375, -0.955169677734375, -0.9142608642578125, -0.87335205078125, -0.8324432373046875, -0.791534423828125, -0.7506256103515625, -0.709716796875, -0.6688079833984375, -0.627899169921875, -0.5869903564453125, -0.54608154296875, -0.5051727294921875, -0.464263916015625, -0.4233551025390625, -0.3824462890625, -0.3415374755859375, -0.300628662109375, -0.2597198486328125, -0.21881103515625, -0.1779022216796875, -0.136993408203125, -0.0960845947265625, -0.05517578125, -0.0142669677734375, 0.026641845703125, 0.0675506591796875, 0.10845947265625, 0.1493682861328125, 0.190277099609375, 0.2311859130859375, 0.2720947265625, 0.3130035400390625, 0.353912353515625, 0.3948211669921875, 0.43572998046875, 0.4766387939453125, 0.517547607421875, 0.5584564208984375, 0.599365234375, 0.6402740478515625, 0.681182861328125, 0.7220916748046875, 0.76300048828125, 0.8039093017578125, 0.844818115234375, 0.8857269287109375, 0.9266357421875, 0.9675445556640625, 1.008453369140625, 1.0493621826171875, 1.09027099609375, 1.1311798095703125, 1.172088623046875, 1.2129974365234375, 1.25390625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 8.0, 6.0, 10.0, 11.0, 17.0, 15.0, 30.0, 30.0, 29.0, 40.0, 36.0, 53.0, 51.0, 44.0, 57.0, 65.0, 65.0, 67.0, 52.0, 41.0, 47.0, 40.0, 34.0, 19.0, 23.0, 22.0, 16.0, 8.0, 19.0, 10.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0020923614501953125, -0.00202980637550354, -0.0019672513008117676, -0.0019046962261199951, -0.0018421411514282227, -0.0017795860767364502, -0.0017170310020446777, -0.0016544759273529053, -0.0015919208526611328, -0.0015293657779693604, -0.0014668107032775879, -0.0014042556285858154, -0.001341700553894043, -0.0012791454792022705, -0.001216590404510498, -0.0011540353298187256, -0.0010914802551269531, -0.0010289251804351807, -0.0009663701057434082, -0.0009038150310516357, -0.0008412599563598633, -0.0007787048816680908, -0.0007161498069763184, -0.0006535947322845459, -0.0005910396575927734, -0.000528484582901001, -0.0004659295082092285, -0.00040337443351745605, -0.0003408193588256836, -0.00027826428413391113, -0.00021570920944213867, -0.0001531541347503662, -9.059906005859375e-05, -2.804398536682129e-05, 3.451108932495117e-05, 9.706616401672363e-05, 0.0001596212387084961, 0.00022217631340026855, 0.000284731388092041, 0.0003472864627838135, 0.00040984153747558594, 0.0004723966121673584, 0.0005349516868591309, 0.0005975067615509033, 0.0006600618362426758, 0.0007226169109344482, 0.0007851719856262207, 0.0008477270603179932, 0.0009102821350097656, 0.0009728372097015381, 0.0010353922843933105, 0.001097947359085083, 0.0011605024337768555, 0.001223057508468628, 0.0012856125831604004, 0.0013481676578521729, 0.0014107227325439453, 0.0014732778072357178, 0.0015358328819274902, 0.0015983879566192627, 0.0016609430313110352, 0.0017234981060028076, 0.00178605318069458, 0.0018486082553863525, 0.001911163330078125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 1.0, 5.0, 9.0, 10.0, 5.0, 14.0, 13.0, 17.0, 25.0, 29.0, 44.0, 51.0, 92.0, 145.0, 264.0, 665.0, 4362.0, 1032502.0, 8723.0, 800.0, 294.0, 143.0, 101.0, 59.0, 37.0, 31.0, 22.0, 14.0, 22.0, 10.0, 8.0, 9.0, 5.0, 3.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04803466796875, -0.0464630126953125, -0.044891357421875, -0.0433197021484375, -0.041748046875, -0.0401763916015625, -0.038604736328125, -0.0370330810546875, -0.03546142578125, -0.0338897705078125, -0.032318115234375, -0.0307464599609375, -0.0291748046875, -0.0276031494140625, -0.026031494140625, -0.0244598388671875, -0.02288818359375, -0.0213165283203125, -0.019744873046875, -0.0181732177734375, -0.0166015625, -0.0150299072265625, -0.013458251953125, -0.0118865966796875, -0.01031494140625, -0.0087432861328125, -0.007171630859375, -0.0055999755859375, -0.0040283203125, -0.0024566650390625, -0.000885009765625, 0.0006866455078125, 0.00225830078125, 0.0038299560546875, 0.005401611328125, 0.0069732666015625, 0.008544921875, 0.0101165771484375, 0.011688232421875, 0.0132598876953125, 0.01483154296875, 0.0164031982421875, 0.017974853515625, 0.0195465087890625, 0.0211181640625, 0.0226898193359375, 0.024261474609375, 0.0258331298828125, 0.02740478515625, 0.0289764404296875, 0.030548095703125, 0.0321197509765625, 0.03369140625, 0.0352630615234375, 0.036834716796875, 0.0384063720703125, 0.03997802734375, 0.0415496826171875, 0.043121337890625, 0.0446929931640625, 0.0462646484375, 0.0478363037109375, 0.049407958984375, 0.0509796142578125, 0.05255126953125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 15.0, 20.0, 39.0, 71.0, 120.0, 142.0, 146.0, 134.0, 122.0, 94.0, 44.0, 26.0, 16.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016483803046867251, -0.0015979146119207144, -0.0015474490355700254, -0.0014969834592193365, -0.0014465177664533257, -0.001396052073687315, -0.001345586497336626, -0.0012951209209859371, -0.0012446552282199264, -0.0011941895354539156, -0.0011437239591032267, -0.0010932583827525377, -0.001042792689986527, -0.0009923269972205162, -0.0009418614208698273, -0.0008913957863114774, -0.0008409301517531276, -0.0007904645171947777, -0.0007399988826364279, -0.000689533248078078, -0.0006390676135197282, -0.0005886019789613783, -0.0005381363444030285, -0.00048767070984467864, -0.0004372050752863288, -0.00038673944072797894, -0.0003362738061696291, -0.00028580817161127925, -0.0002353425370529294, -0.00018487690249457955, -0.0001344112679362297, -8.394563337787986e-05, -3.347988240420818e-05, 1.6985752154141665e-05, 6.745138671249151e-05, 0.00011791702127084136, 0.0001683826558291912, 0.00021884829038754106, 0.0002693139249458909, 0.00031977955950424075, 0.0003702451940625906, 0.00042071082862094045, 0.0004711764631792903, 0.0005216420977376401, 0.00057210773229599, 0.0006225733668543398, 0.0006730390014126897, 0.0007235046359710395, 0.0007739702705293894, 0.0008244359050877392, 0.0008749015396460891, 0.0009253671742044389, 0.0009758328087627888, 0.0010262983851134777, 0.0010767640778794885, 0.0011272297706454992, 0.0011776953469961882, 0.001228160923346877, 0.0012786266161128879, 0.0013290923088788986, 0.0013795578852295876, 0.0014300234615802765, 0.0014804891543462873, 0.001530954847112298, 0.001581420423462987]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 2.0, 9.0, 17.0, 8.0, 17.0, 15.0, 15.0, 23.0, 22.0, 23.0, 21.0, 22.0, 38.0, 27.0, 39.0, 36.0, 40.0, 40.0, 37.0, 26.0, 37.0, 33.0, 42.0, 27.0, 44.0, 30.0, 39.0, 31.0, 34.0, 22.0, 20.0, 13.0, 27.0, 17.0, 22.0, 13.0, 8.0, 11.0, 9.0, 9.0, 5.0, 9.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008800029754638672, -0.0008500795811414719, -0.0008201561868190765, -0.0007902327924966812, -0.0007603093981742859, -0.0007303860038518906, -0.0007004626095294952, -0.0006705392152070999, -0.0006406158208847046, -0.0006106924265623093, -0.0005807690322399139, -0.0005508456379175186, -0.0005209222435951233, -0.000490998849272728, -0.00046107545495033264, -0.0004311520606279373, -0.000401228666305542, -0.00037130527198314667, -0.00034138187766075134, -0.000311458483338356, -0.0002815350890159607, -0.00025161169469356537, -0.00022168830037117004, -0.00019176490604877472, -0.0001618415117263794, -0.00013191811740398407, -0.00010199472308158875, -7.207132875919342e-05, -4.2147934436798096e-05, -1.2224540114402771e-05, 1.7698854207992554e-05, 4.762224853038788e-05, 7.75456428527832e-05, 0.00010746903717517853, 0.00013739243149757385, 0.00016731582581996918, 0.0001972392201423645, 0.00022716261446475983, 0.00025708600878715515, 0.0002870094031095505, 0.0003169327974319458, 0.0003468561917543411, 0.00037677958607673645, 0.0004067029803991318, 0.0004366263747215271, 0.0004665497690439224, 0.0004964731633663177, 0.0005263965576887131, 0.0005563199520111084, 0.0005862433463335037, 0.000616166740655899, 0.0006460901349782944, 0.0006760135293006897, 0.000705936923623085, 0.0007358603179454803, 0.0007657837122678757, 0.000795707106590271, 0.0008256305009126663, 0.0008555538952350616, 0.000885477289557457, 0.0009154006838798523, 0.0009453240782022476, 0.0009752474725246429, 0.0010051708668470383, 0.0010350942611694336]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 5.0, 14.0, 12.0, 10.0, 15.0, 20.0, 26.0, 17.0, 31.0, 37.0, 29.0, 39.0, 38.0, 30.0, 42.0, 33.0, 33.0, 54.0, 49.0, 46.0, 56.0, 27.0, 41.0, 36.0, 33.0, 23.0, 21.0, 26.0, 24.0, 23.0, 13.0, 12.0, 12.0, 12.0, 12.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.578125, -11.201171875, -10.82421875, -10.447265625, -10.0703125, -9.693359375, -9.31640625, -8.939453125, -8.5625, -8.185546875, -7.80859375, -7.431640625, -7.0546875, -6.677734375, -6.30078125, -5.923828125, -5.546875, -5.169921875, -4.79296875, -4.416015625, -4.0390625, -3.662109375, -3.28515625, -2.908203125, -2.53125, -2.154296875, -1.77734375, -1.400390625, -1.0234375, -0.646484375, -0.26953125, 0.107421875, 0.484375, 0.861328125, 1.23828125, 1.615234375, 1.9921875, 2.369140625, 2.74609375, 3.123046875, 3.5, 3.876953125, 4.25390625, 4.630859375, 5.0078125, 5.384765625, 5.76171875, 6.138671875, 6.515625, 6.892578125, 7.26953125, 7.646484375, 8.0234375, 8.400390625, 8.77734375, 9.154296875, 9.53125, 9.908203125, 10.28515625, 10.662109375, 11.0390625, 11.416015625, 11.79296875, 12.169921875, 12.546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 17.0, 16.0, 23.0, 30.0, 37.0, 44.0, 60.0, 114.0, 121.0, 180.0, 283.0, 410.0, 595.0, 1074.0, 1826.0, 3328.0, 6147.0, 12050.0, 24951.0, 52409.0, 116662.0, 262604.0, 302353.0, 140756.0, 62540.0, 29294.0, 14103.0, 7215.0, 3858.0, 2075.0, 1213.0, 708.0, 413.0, 296.0, 208.0, 135.0, 86.0, 83.0, 69.0, 35.0, 26.0, 25.0, 15.0, 18.0, 6.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-7.1875, -6.96368408203125, -6.7398681640625, -6.51605224609375, -6.292236328125, -6.06842041015625, -5.8446044921875, -5.62078857421875, -5.39697265625, -5.17315673828125, -4.9493408203125, -4.72552490234375, -4.501708984375, -4.27789306640625, -4.0540771484375, -3.83026123046875, -3.6064453125, -3.38262939453125, -3.1588134765625, -2.93499755859375, -2.711181640625, -2.48736572265625, -2.2635498046875, -2.03973388671875, -1.81591796875, -1.59210205078125, -1.3682861328125, -1.14447021484375, -0.920654296875, -0.69683837890625, -0.4730224609375, -0.24920654296875, -0.025390625, 0.19842529296875, 0.4222412109375, 0.64605712890625, 0.869873046875, 1.09368896484375, 1.3175048828125, 1.54132080078125, 1.76513671875, 1.98895263671875, 2.2127685546875, 2.43658447265625, 2.660400390625, 2.88421630859375, 3.1080322265625, 3.33184814453125, 3.5556640625, 3.77947998046875, 4.0032958984375, 4.22711181640625, 4.450927734375, 4.67474365234375, 4.8985595703125, 5.12237548828125, 5.34619140625, 5.57000732421875, 5.7938232421875, 6.01763916015625, 6.241455078125, 6.46527099609375, 6.6890869140625, 6.91290283203125, 7.13671875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 9.0, 11.0, 10.0, 19.0, 13.0, 23.0, 30.0, 24.0, 36.0, 51.0, 58.0, 53.0, 74.0, 310.0, 1730.0, 125.0, 79.0, 62.0, 57.0, 53.0, 47.0, 39.0, 25.0, 29.0, 21.0, 7.0, 11.0, 3.0, 4.0, 10.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-75.625, -73.6962890625, -71.767578125, -69.8388671875, -67.91015625, -65.9814453125, -64.052734375, -62.1240234375, -60.1953125, -58.2666015625, -56.337890625, -54.4091796875, -52.48046875, -50.5517578125, -48.623046875, -46.6943359375, -44.765625, -42.8369140625, -40.908203125, -38.9794921875, -37.05078125, -35.1220703125, -33.193359375, -31.2646484375, -29.3359375, -27.4072265625, -25.478515625, -23.5498046875, -21.62109375, -19.6923828125, -17.763671875, -15.8349609375, -13.90625, -11.9775390625, -10.048828125, -8.1201171875, -6.19140625, -4.2626953125, -2.333984375, -0.4052734375, 1.5234375, 3.4521484375, 5.380859375, 7.3095703125, 9.23828125, 11.1669921875, 13.095703125, 15.0244140625, 16.953125, 18.8818359375, 20.810546875, 22.7392578125, 24.66796875, 26.5966796875, 28.525390625, 30.4541015625, 32.3828125, 34.3115234375, 36.240234375, 38.1689453125, 40.09765625, 42.0263671875, 43.955078125, 45.8837890625, 47.8125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 12.0, 14.0, 24.0, 30.0, 48.0, 74.0, 99.0, 126.0, 196.0, 303.0, 578.0, 2800.0, 3053944.0, 85124.0, 1156.0, 376.0, 234.0, 156.0, 99.0, 85.0, 46.0, 42.0, 39.0, 16.0, 13.0, 13.0, 8.0, 3.0, 9.0, 2.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.4375, -104.0673828125, -99.697265625, -95.3271484375, -90.95703125, -86.5869140625, -82.216796875, -77.8466796875, -73.4765625, -69.1064453125, -64.736328125, -60.3662109375, -55.99609375, -51.6259765625, -47.255859375, -42.8857421875, -38.515625, -34.1455078125, -29.775390625, -25.4052734375, -21.03515625, -16.6650390625, -12.294921875, -7.9248046875, -3.5546875, 0.8154296875, 5.185546875, 9.5556640625, 13.92578125, 18.2958984375, 22.666015625, 27.0361328125, 31.40625, 35.7763671875, 40.146484375, 44.5166015625, 48.88671875, 53.2568359375, 57.626953125, 61.9970703125, 66.3671875, 70.7373046875, 75.107421875, 79.4775390625, 83.84765625, 88.2177734375, 92.587890625, 96.9580078125, 101.328125, 105.6982421875, 110.068359375, 114.4384765625, 118.80859375, 123.1787109375, 127.548828125, 131.9189453125, 136.2890625, 140.6591796875, 145.029296875, 149.3994140625, 153.76953125, 158.1396484375, 162.509765625, 166.8798828125, 171.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 51.0, 323.0, 474.0, 145.0, 16.0, 4.0], "bins": [-308.0945129394531, -302.9800720214844, -297.86566162109375, -292.751220703125, -287.63677978515625, -282.5223693847656, -277.4079284667969, -272.2934875488281, -267.1790771484375, -262.06463623046875, -256.9502258300781, -251.83578491210938, -246.7213592529297, -241.60693359375, -236.49249267578125, -231.37806701660156, -226.2636260986328, -221.14920043945312, -216.03475952148438, -210.9203338623047, -205.805908203125, -200.69146728515625, -195.57704162597656, -190.46261596679688, -185.34817504882812, -180.23374938964844, -175.1193084716797, -170.0048828125, -164.8904571533203, -159.77603149414062, -154.66159057617188, -149.5471649169922, -144.4327392578125, -139.3183135986328, -134.20387268066406, -129.08944702148438, -123.97502136230469, -118.86058807373047, -113.74615478515625, -108.63172912597656, -103.51729583740234, -98.40286254882812, -93.28843688964844, -88.17400360107422, -83.0595703125, -77.94514465332031, -72.8307113647461, -67.71627807617188, -62.60185241699219, -57.487422943115234, -52.37299346923828, -47.25856018066406, -42.14413070678711, -37.029701232910156, -31.91526985168457, -26.800838470458984, -21.68640899658203, -16.571979522705078, -11.457548141479492, -6.343117713928223, -1.2286872863769531, 3.8857421875, 9.000173568725586, 14.114604949951172, 19.229034423828125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 8.0, 4.0, 5.0, 2.0, 11.0, 12.0, 12.0, 12.0, 20.0, 19.0, 28.0, 30.0, 29.0, 27.0, 31.0, 39.0, 39.0, 39.0, 52.0, 41.0, 28.0, 43.0, 43.0, 38.0, 49.0, 43.0, 37.0, 25.0, 29.0, 32.0, 31.0, 27.0, 22.0, 27.0, 10.0, 10.0, 12.0, 8.0, 5.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.20925903320312, -102.42353820800781, -98.63782501220703, -94.85210418701172, -91.06639099121094, -87.28067016601562, -83.49494934082031, -79.70923614501953, -75.92352294921875, -72.13780212402344, -68.35208892822266, -64.56636810302734, -60.78065490722656, -56.99493408203125, -53.2092170715332, -49.423500061035156, -45.637779235839844, -41.8520622253418, -38.06634521484375, -34.28062438964844, -30.494909286499023, -26.709192276000977, -22.923473358154297, -19.13775634765625, -15.352039337158203, -11.566322326660156, -7.780604362487793, -3.9948863983154297, -0.2091693878173828, 3.576547622680664, 7.362266540527344, 11.14798355102539, 14.933700561523438, 18.719417572021484, 22.50513458251953, 26.29085350036621, 30.076570510864258, 33.86228942871094, 37.648006439208984, 41.43372344970703, 45.21944046020508, 49.005157470703125, 52.79087448120117, 56.57659149169922, 60.36231231689453, 64.14802551269531, 67.93374633789062, 71.71946716308594, 75.50518035888672, 79.29090118408203, 83.07661437988281, 86.86233520507812, 90.6480484008789, 94.43376922607422, 98.219482421875, 102.00520324707031, 105.79092407226562, 109.57664489746094, 113.36235809326172, 117.14807891845703, 120.93379211425781, 124.71951293945312, 128.50523376464844, 132.29095458984375, 136.07666015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 6.0, 12.0, 14.0, 13.0, 15.0, 21.0, 25.0, 27.0, 26.0, 34.0, 43.0, 33.0, 39.0, 21.0, 45.0, 44.0, 37.0, 40.0, 65.0, 37.0, 41.0, 47.0, 45.0, 31.0, 26.0, 23.0, 27.0, 25.0, 19.0, 23.0, 12.0, 15.0, 7.0, 9.0, 14.0, 5.0, 4.0, 6.0, 4.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.4296875, -12.0328369140625, -11.635986328125, -11.2391357421875, -10.84228515625, -10.4454345703125, -10.048583984375, -9.6517333984375, -9.2548828125, -8.8580322265625, -8.461181640625, -8.0643310546875, -7.66748046875, -7.2706298828125, -6.873779296875, -6.4769287109375, -6.080078125, -5.6832275390625, -5.286376953125, -4.8895263671875, -4.49267578125, -4.0958251953125, -3.698974609375, -3.3021240234375, -2.9052734375, -2.5084228515625, -2.111572265625, -1.7147216796875, -1.31787109375, -0.9210205078125, -0.524169921875, -0.1273193359375, 0.26953125, 0.6663818359375, 1.063232421875, 1.4600830078125, 1.85693359375, 2.2537841796875, 2.650634765625, 3.0474853515625, 3.4443359375, 3.8411865234375, 4.238037109375, 4.6348876953125, 5.03173828125, 5.4285888671875, 5.825439453125, 6.2222900390625, 6.619140625, 7.0159912109375, 7.412841796875, 7.8096923828125, 8.20654296875, 8.6033935546875, 9.000244140625, 9.3970947265625, 9.7939453125, 10.1907958984375, 10.587646484375, 10.9844970703125, 11.38134765625, 11.7781982421875, 12.175048828125, 12.5718994140625, 12.96875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 7.0, 11.0, 8.0, 13.0, 13.0, 22.0, 22.0, 23.0, 34.0, 37.0, 51.0, 62.0, 114.0, 228.0, 711.0, 4520.0, 97244.0, 3316008.0, 759414.0, 13481.0, 1412.0, 342.0, 135.0, 88.0, 42.0, 42.0, 23.0, 20.0, 29.0, 20.0, 17.0, 18.0, 9.0, 10.0, 10.0, 7.0, 6.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.71875, -50.13818359375, -48.5576171875, -46.97705078125, -45.396484375, -43.81591796875, -42.2353515625, -40.65478515625, -39.07421875, -37.49365234375, -35.9130859375, -34.33251953125, -32.751953125, -31.17138671875, -29.5908203125, -28.01025390625, -26.4296875, -24.84912109375, -23.2685546875, -21.68798828125, -20.107421875, -18.52685546875, -16.9462890625, -15.36572265625, -13.78515625, -12.20458984375, -10.6240234375, -9.04345703125, -7.462890625, -5.88232421875, -4.3017578125, -2.72119140625, -1.140625, 0.43994140625, 2.0205078125, 3.60107421875, 5.181640625, 6.76220703125, 8.3427734375, 9.92333984375, 11.50390625, 13.08447265625, 14.6650390625, 16.24560546875, 17.826171875, 19.40673828125, 20.9873046875, 22.56787109375, 24.1484375, 25.72900390625, 27.3095703125, 28.89013671875, 30.470703125, 32.05126953125, 33.6318359375, 35.21240234375, 36.79296875, 38.37353515625, 39.9541015625, 41.53466796875, 43.115234375, 44.69580078125, 46.2763671875, 47.85693359375, 49.4375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 13.0, 23.0, 25.0, 44.0, 98.0, 146.0, 230.0, 383.0, 582.0, 724.0, 689.0, 446.0, 266.0, 156.0, 96.0, 57.0, 38.0, 21.0, 15.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.26708984375, -45.9404296875, -44.61376953125, -43.287109375, -41.96044921875, -40.6337890625, -39.30712890625, -37.98046875, -36.65380859375, -35.3271484375, -34.00048828125, -32.673828125, -31.34716796875, -30.0205078125, -28.69384765625, -27.3671875, -26.04052734375, -24.7138671875, -23.38720703125, -22.060546875, -20.73388671875, -19.4072265625, -18.08056640625, -16.75390625, -15.42724609375, -14.1005859375, -12.77392578125, -11.447265625, -10.12060546875, -8.7939453125, -7.46728515625, -6.140625, -4.81396484375, -3.4873046875, -2.16064453125, -0.833984375, 0.49267578125, 1.8193359375, 3.14599609375, 4.47265625, 5.79931640625, 7.1259765625, 8.45263671875, 9.779296875, 11.10595703125, 12.4326171875, 13.75927734375, 15.0859375, 16.41259765625, 17.7392578125, 19.06591796875, 20.392578125, 21.71923828125, 23.0458984375, 24.37255859375, 25.69921875, 27.02587890625, 28.3525390625, 29.67919921875, 31.005859375, 32.33251953125, 33.6591796875, 34.98583984375, 36.3125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 6.0, 11.0, 13.0, 19.0, 26.0, 34.0, 57.0, 80.0, 116.0, 148.0, 238.0, 525.0, 1448.0, 39333.0, 4101588.0, 47867.0, 1489.0, 481.0, 275.0, 144.0, 88.0, 65.0, 64.0, 52.0, 37.0, 17.0, 14.0, 9.0, 12.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-134.125, -130.123046875, -126.12109375, -122.119140625, -118.1171875, -114.115234375, -110.11328125, -106.111328125, -102.109375, -98.107421875, -94.10546875, -90.103515625, -86.1015625, -82.099609375, -78.09765625, -74.095703125, -70.09375, -66.091796875, -62.08984375, -58.087890625, -54.0859375, -50.083984375, -46.08203125, -42.080078125, -38.078125, -34.076171875, -30.07421875, -26.072265625, -22.0703125, -18.068359375, -14.06640625, -10.064453125, -6.0625, -2.060546875, 1.94140625, 5.943359375, 9.9453125, 13.947265625, 17.94921875, 21.951171875, 25.953125, 29.955078125, 33.95703125, 37.958984375, 41.9609375, 45.962890625, 49.96484375, 53.966796875, 57.96875, 61.970703125, 65.97265625, 69.974609375, 73.9765625, 77.978515625, 81.98046875, 85.982421875, 89.984375, 93.986328125, 97.98828125, 101.990234375, 105.9921875, 109.994140625, 113.99609375, 117.998046875, 122.0]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 19.0, 125.0, 356.0, 372.0, 116.0, 25.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-473.57769775390625, -460.76361083984375, -447.94952392578125, -435.13543701171875, -422.32135009765625, -409.50726318359375, -396.69317626953125, -383.87908935546875, -371.06500244140625, -358.25091552734375, -345.43682861328125, -332.62274169921875, -319.80865478515625, -306.99456787109375, -294.18048095703125, -281.36639404296875, -268.5523376464844, -255.73825073242188, -242.92416381835938, -230.11007690429688, -217.29598999023438, -204.48190307617188, -191.66783142089844, -178.85374450683594, -166.03965759277344, -153.22557067871094, -140.41148376464844, -127.59740447998047, -114.78331756591797, -101.96923065185547, -89.1551513671875, -76.341064453125, -63.527008056640625, -50.712921142578125, -37.89883804321289, -25.084754943847656, -12.270668029785156, 0.5434188842773438, 13.357498168945312, 26.171585083007812, 38.98567199707031, 51.79975891113281, 64.61384582519531, 77.42792510986328, 90.24201202392578, 103.05609893798828, 115.87017822265625, 128.68426513671875, 141.49835205078125, 154.31243896484375, 167.12652587890625, 179.94061279296875, 192.75469970703125, 205.56878662109375, 218.3828582763672, 231.1969451904297, 244.0110321044922, 256.8251037597656, 269.6391906738281, 282.4532775878906, 295.2673645019531, 308.0814514160156, 320.8955383300781, 333.7096252441406, 346.5237121582031]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 5.0, 8.0, 8.0, 7.0, 8.0, 15.0, 18.0, 10.0, 19.0, 28.0, 19.0, 23.0, 18.0, 25.0, 30.0, 27.0, 36.0, 24.0, 40.0, 35.0, 43.0, 34.0, 31.0, 31.0, 43.0, 40.0, 35.0, 34.0, 31.0, 44.0, 34.0, 20.0, 13.0, 17.0, 23.0, 15.0, 18.0, 12.0, 10.0, 9.0, 13.0, 9.0, 8.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-76.84820556640625, -74.42475891113281, -72.00131225585938, -69.57787322998047, -67.15442657470703, -64.7309799194336, -62.307533264160156, -59.88408660888672, -57.46064376831055, -55.03719711303711, -52.61375427246094, -50.1903076171875, -47.76686096191406, -45.34341812133789, -42.91997146606445, -40.49652862548828, -38.073081970214844, -35.649635314941406, -33.226192474365234, -30.802745819091797, -28.379301071166992, -25.955856323242188, -23.53240966796875, -21.108964920043945, -18.68552017211914, -16.262075424194336, -13.838629722595215, -11.415184020996094, -8.991739273071289, -6.568294525146484, -4.144848823547363, -1.7214031219482422, 0.7020416259765625, 3.1254868507385254, 5.548932075500488, 7.972377300262451, 10.395822525024414, 12.819267272949219, 15.24271297454834, 17.66615867614746, 20.089603424072266, 22.51304817199707, 24.936492919921875, 27.359939575195312, 29.783384323120117, 32.20682907104492, 34.63027572631836, 37.05371856689453, 39.47716522216797, 41.900611877441406, 44.32405471801758, 46.747501373291016, 49.17094421386719, 51.594390869140625, 54.01783752441406, 56.4412841796875, 58.86472702026367, 61.28817367553711, 63.71161651611328, 66.13506317138672, 68.55850982666016, 70.98194885253906, 73.4053955078125, 75.82884216308594, 78.25228881835938]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 6.0, 12.0, 11.0, 9.0, 15.0, 19.0, 26.0, 24.0, 34.0, 37.0, 27.0, 28.0, 35.0, 40.0, 37.0, 51.0, 45.0, 43.0, 57.0, 52.0, 45.0, 41.0, 39.0, 40.0, 23.0, 27.0, 23.0, 22.0, 23.0, 28.0, 21.0, 12.0, 15.0, 6.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.2952880859375, -11.879638671875, -11.4639892578125, -11.04833984375, -10.6326904296875, -10.217041015625, -9.8013916015625, -9.3857421875, -8.9700927734375, -8.554443359375, -8.1387939453125, -7.72314453125, -7.3074951171875, -6.891845703125, -6.4761962890625, -6.060546875, -5.6448974609375, -5.229248046875, -4.8135986328125, -4.39794921875, -3.9822998046875, -3.566650390625, -3.1510009765625, -2.7353515625, -2.3197021484375, -1.904052734375, -1.4884033203125, -1.07275390625, -0.6571044921875, -0.241455078125, 0.1741943359375, 0.58984375, 1.0054931640625, 1.421142578125, 1.8367919921875, 2.25244140625, 2.6680908203125, 3.083740234375, 3.4993896484375, 3.9150390625, 4.3306884765625, 4.746337890625, 5.1619873046875, 5.57763671875, 5.9932861328125, 6.408935546875, 6.8245849609375, 7.240234375, 7.6558837890625, 8.071533203125, 8.4871826171875, 8.90283203125, 9.3184814453125, 9.734130859375, 10.1497802734375, 10.5654296875, 10.9810791015625, 11.396728515625, 11.8123779296875, 12.22802734375, 12.6436767578125, 13.059326171875, 13.4749755859375, 13.890625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 15.0, 31.0, 47.0, 79.0, 105.0, 189.0, 285.0, 409.0, 749.0, 1110.0, 1784.0, 2835.0, 4491.0, 7158.0, 11356.0, 18292.0, 28540.0, 44680.0, 69459.0, 106582.0, 161643.0, 196285.0, 138879.0, 90902.0, 59384.0, 38239.0, 23945.0, 15183.0, 9607.0, 6023.0, 3738.0, 2428.0, 1482.0, 965.0, 627.0, 373.0, 224.0, 158.0, 100.0, 68.0, 37.0, 26.0, 16.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.3555145263671875, -1.313568115234375, -1.2716217041015625, -1.22967529296875, -1.1877288818359375, -1.145782470703125, -1.1038360595703125, -1.0618896484375, -1.0199432373046875, -0.977996826171875, -0.9360504150390625, -0.89410400390625, -0.8521575927734375, -0.810211181640625, -0.7682647705078125, -0.726318359375, -0.6843719482421875, -0.642425537109375, -0.6004791259765625, -0.55853271484375, -0.5165863037109375, -0.474639892578125, -0.4326934814453125, -0.3907470703125, -0.3488006591796875, -0.306854248046875, -0.2649078369140625, -0.22296142578125, -0.1810150146484375, -0.139068603515625, -0.0971221923828125, -0.05517578125, -0.0132293701171875, 0.028717041015625, 0.0706634521484375, 0.11260986328125, 0.1545562744140625, 0.196502685546875, 0.2384490966796875, 0.2803955078125, 0.3223419189453125, 0.364288330078125, 0.4062347412109375, 0.44818115234375, 0.4901275634765625, 0.532073974609375, 0.5740203857421875, 0.615966796875, 0.6579132080078125, 0.699859619140625, 0.7418060302734375, 0.78375244140625, 0.8256988525390625, 0.867645263671875, 0.9095916748046875, 0.9515380859375, 0.9934844970703125, 1.035430908203125, 1.0773773193359375, 1.11932373046875, 1.1612701416015625, 1.203216552734375, 1.2451629638671875, 1.287109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 7.0, 13.0, 19.0, 13.0, 16.0, 22.0, 29.0, 22.0, 26.0, 31.0, 35.0, 29.0, 47.0, 26.0, 36.0, 54.0, 38.0, 1059.0, 46.0, 45.0, 32.0, 45.0, 34.0, 35.0, 26.0, 26.0, 31.0, 21.0, 19.0, 25.0, 15.0, 14.0, 13.0, 11.0, 14.0, 9.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5625, -7.326904296875, -7.09130859375, -6.855712890625, -6.6201171875, -6.384521484375, -6.14892578125, -5.913330078125, -5.677734375, -5.442138671875, -5.20654296875, -4.970947265625, -4.7353515625, -4.499755859375, -4.26416015625, -4.028564453125, -3.79296875, -3.557373046875, -3.32177734375, -3.086181640625, -2.8505859375, -2.614990234375, -2.37939453125, -2.143798828125, -1.908203125, -1.672607421875, -1.43701171875, -1.201416015625, -0.9658203125, -0.730224609375, -0.49462890625, -0.259033203125, -0.0234375, 0.212158203125, 0.44775390625, 0.683349609375, 0.9189453125, 1.154541015625, 1.39013671875, 1.625732421875, 1.861328125, 2.096923828125, 2.33251953125, 2.568115234375, 2.8037109375, 3.039306640625, 3.27490234375, 3.510498046875, 3.74609375, 3.981689453125, 4.21728515625, 4.452880859375, 4.6884765625, 4.924072265625, 5.15966796875, 5.395263671875, 5.630859375, 5.866455078125, 6.10205078125, 6.337646484375, 6.5732421875, 6.808837890625, 7.04443359375, 7.280029296875, 7.515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 19.0, 17.0, 30.0, 26.0, 69.0, 77.0, 110.0, 179.0, 294.0, 457.0, 698.0, 997.0, 1477.0, 2257.0, 3339.0, 5059.0, 7751.0, 11645.0, 17947.0, 26704.0, 40513.0, 61160.0, 93937.0, 145612.0, 1243961.0, 149845.0, 96871.0, 63250.0, 41103.0, 27704.0, 18125.0, 12155.0, 8048.0, 5313.0, 3471.0, 2365.0, 1534.0, 995.0, 712.0, 480.0, 273.0, 203.0, 104.0, 83.0, 51.0, 46.0, 29.0, 18.0, 6.0, 5.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1.216796875, -1.1793975830078125, -1.141998291015625, -1.1045989990234375, -1.06719970703125, -1.0298004150390625, -0.992401123046875, -0.9550018310546875, -0.9176025390625, -0.8802032470703125, -0.842803955078125, -0.8054046630859375, -0.76800537109375, -0.7306060791015625, -0.693206787109375, -0.6558074951171875, -0.618408203125, -0.5810089111328125, -0.543609619140625, -0.5062103271484375, -0.46881103515625, -0.4314117431640625, -0.394012451171875, -0.3566131591796875, -0.3192138671875, -0.2818145751953125, -0.244415283203125, -0.2070159912109375, -0.16961669921875, -0.1322174072265625, -0.094818115234375, -0.0574188232421875, -0.02001953125, 0.0173797607421875, 0.054779052734375, 0.0921783447265625, 0.12957763671875, 0.1669769287109375, 0.204376220703125, 0.2417755126953125, 0.2791748046875, 0.3165740966796875, 0.353973388671875, 0.3913726806640625, 0.42877197265625, 0.4661712646484375, 0.503570556640625, 0.5409698486328125, 0.578369140625, 0.6157684326171875, 0.653167724609375, 0.6905670166015625, 0.72796630859375, 0.7653656005859375, 0.802764892578125, 0.8401641845703125, 0.8775634765625, 0.9149627685546875, 0.952362060546875, 0.9897613525390625, 1.02716064453125, 1.0645599365234375, 1.101959228515625, 1.1393585205078125, 1.1767578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 11.0, 11.0, 16.0, 16.0, 18.0, 22.0, 24.0, 18.0, 27.0, 39.0, 45.0, 49.0, 56.0, 64.0, 64.0, 75.0, 65.0, 47.0, 55.0, 37.0, 49.0, 34.0, 26.0, 27.0, 22.0, 16.0, 11.0, 8.0, 5.0, 7.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0038356781005859375, -0.003734409809112549, -0.00363314151763916, -0.0035318732261657715, -0.003430604934692383, -0.003329336643218994, -0.0032280683517456055, -0.003126800060272217, -0.003025531768798828, -0.0029242634773254395, -0.0028229951858520508, -0.002721726894378662, -0.0026204586029052734, -0.0025191903114318848, -0.002417922019958496, -0.0023166537284851074, -0.0022153854370117188, -0.00211411714553833, -0.0020128488540649414, -0.0019115805625915527, -0.001810312271118164, -0.0017090439796447754, -0.0016077756881713867, -0.001506507396697998, -0.0014052391052246094, -0.0013039708137512207, -0.001202702522277832, -0.0011014342308044434, -0.0010001659393310547, -0.000898897647857666, -0.0007976293563842773, -0.0006963610649108887, -0.0005950927734375, -0.0004938244819641113, -0.00039255619049072266, -0.000291287899017334, -0.0001900196075439453, -8.875131607055664e-05, 1.2516975402832031e-05, 0.0001137852668762207, 0.00021505355834960938, 0.00031632184982299805, 0.0004175901412963867, 0.0005188584327697754, 0.0006201267242431641, 0.0007213950157165527, 0.0008226633071899414, 0.0009239315986633301, 0.0010251998901367188, 0.0011264681816101074, 0.001227736473083496, 0.0013290047645568848, 0.0014302730560302734, 0.0015315413475036621, 0.0016328096389770508, 0.0017340779304504395, 0.0018353462219238281, 0.0019366145133972168, 0.0020378828048706055, 0.002139151096343994, 0.002240419387817383, 0.0023416876792907715, 0.00244295597076416, 0.002544224262237549, 0.0026454925537109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 4.0, 6.0, 7.0, 18.0, 17.0, 22.0, 34.0, 32.0, 41.0, 74.0, 96.0, 156.0, 255.0, 688.0, 6251.0, 1031618.0, 7664.0, 769.0, 269.0, 136.0, 98.0, 55.0, 47.0, 27.0, 23.0, 29.0, 23.0, 14.0, 11.0, 13.0, 8.0, 11.0, 11.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057769775390625, -0.055506229400634766, -0.05324268341064453, -0.0509791374206543, -0.04871559143066406, -0.04645204544067383, -0.044188499450683594, -0.04192495346069336, -0.039661407470703125, -0.03739786148071289, -0.035134315490722656, -0.03287076950073242, -0.030607223510742188, -0.028343677520751953, -0.02608013153076172, -0.023816585540771484, -0.02155303955078125, -0.019289493560791016, -0.01702594757080078, -0.014762401580810547, -0.012498855590820312, -0.010235309600830078, -0.007971763610839844, -0.005708217620849609, -0.003444671630859375, -0.0011811256408691406, 0.0010824203491210938, 0.003345966339111328, 0.0056095123291015625, 0.007873058319091797, 0.010136604309082031, 0.012400150299072266, 0.0146636962890625, 0.016927242279052734, 0.01919078826904297, 0.021454334259033203, 0.023717880249023438, 0.025981426239013672, 0.028244972229003906, 0.03050851821899414, 0.032772064208984375, 0.03503561019897461, 0.037299156188964844, 0.03956270217895508, 0.04182624816894531, 0.04408979415893555, 0.04635334014892578, 0.048616886138916016, 0.05088043212890625, 0.053143978118896484, 0.05540752410888672, 0.05767107009887695, 0.05993461608886719, 0.06219816207885742, 0.06446170806884766, 0.06672525405883789, 0.06898880004882812, 0.07125234603881836, 0.0735158920288086, 0.07577943801879883, 0.07804298400878906, 0.0803065299987793, 0.08257007598876953, 0.08483362197875977, 0.08709716796875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 58.0, 545.0, 384.0, 25.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028951370622962713, -0.002528177807107568, -0.0021612183190882206, -0.001794259063899517, -0.0014272998087108135, -0.00106034055352211, -0.0006933810655027628, -0.00032642181031405926, 4.053744487464428e-05, 0.00040749675827100873, 0.0007744560716673732, 0.0011414154432713985, 0.001508374698460102, 0.0018753339536488056, 0.002242293441668153, 0.0026092526968568563, 0.00297621195204556, 0.0033431712072342634, 0.0037101306952536106, 0.004077089950442314, 0.004444049205631018, 0.004811008460819721, 0.005177968181669712, 0.005544926971197128, 0.005911886692047119, 0.006278845947235823, 0.006645805202424526, 0.007012764923274517, 0.007379723712801933, 0.007746683433651924, 0.008113643154501915, 0.008480601944029331, 0.008847560733556747, 0.009214520454406738, 0.009581479243934155, 0.009948438964784145, 0.010315397754311562, 0.010682357475161552, 0.011049317196011543, 0.01141627598553896, 0.011783234775066376, 0.012150194495916367, 0.012517153285443783, 0.012884113006293774, 0.01325107179582119, 0.01361803151667118, 0.013984991237521172, 0.014351950027048588, 0.014718909747898579, 0.01508586946874857, 0.015452828258275986, 0.015819787979125977, 0.016186747699975967, 0.01655370555818081, 0.0169206652790308, 0.01728762499988079, 0.01765458472073078, 0.018021544441580772, 0.018388504162430763, 0.018755462020635605, 0.019122421741485596, 0.019489381462335587, 0.019856341183185577, 0.020223300904035568, 0.02059025876224041]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 1.0, 7.0, 5.0, 7.0, 10.0, 15.0, 11.0, 10.0, 17.0, 22.0, 18.0, 27.0, 34.0, 38.0, 24.0, 30.0, 29.0, 26.0, 34.0, 45.0, 51.0, 45.0, 32.0, 36.0, 33.0, 30.0, 28.0, 31.0, 51.0, 27.0, 28.0, 29.0, 33.0, 23.0, 23.0, 17.0, 8.0, 13.0, 13.0, 9.0, 5.0, 7.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014243125915527344, -0.0013732602819800377, -0.001322207972407341, -0.0012711556628346443, -0.0012201033532619476, -0.001169051043689251, -0.0011179987341165543, -0.0010669464245438576, -0.0010158941149711609, -0.0009648418053984642, -0.0009137894958257675, -0.0008627371862530708, -0.0008116848766803741, -0.0007606325671076775, -0.0007095802575349808, -0.0006585279479622841, -0.0006074756383895874, -0.0005564233288168907, -0.000505371019244194, -0.00045431870967149734, -0.00040326640009880066, -0.000352214090526104, -0.0003011617809534073, -0.0002501094713807106, -0.00019905716180801392, -0.00014800485223531723, -9.695254266262054e-05, -4.590023308992386e-05, 5.152076482772827e-06, 5.620438605546951e-05, 0.0001072566956281662, 0.00015830900520086288, 0.00020936131477355957, 0.00026041362434625626, 0.00031146593391895294, 0.00036251824349164963, 0.0004135705530643463, 0.000464622862637043, 0.0005156751722097397, 0.0005667274817824364, 0.0006177797913551331, 0.0006688321009278297, 0.0007198844105005264, 0.0007709367200732231, 0.0008219890296459198, 0.0008730413392186165, 0.0009240936487913132, 0.0009751459583640099, 0.0010261982679367065, 0.0010772505775094032, 0.0011283028870821, 0.0011793551966547966, 0.0012304075062274933, 0.00128145981580019, 0.0013325121253728867, 0.0013835644349455833, 0.00143461674451828, 0.0014856690540909767, 0.0015367213636636734, 0.00158777367323637, 0.0016388259828090668, 0.0016898782923817635, 0.0017409306019544601, 0.0017919829115271568, 0.0018430352210998535]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 6.0, 12.0, 11.0, 9.0, 15.0, 19.0, 26.0, 24.0, 34.0, 37.0, 27.0, 28.0, 35.0, 40.0, 37.0, 51.0, 45.0, 43.0, 57.0, 52.0, 45.0, 41.0, 39.0, 40.0, 23.0, 27.0, 23.0, 22.0, 23.0, 28.0, 21.0, 12.0, 15.0, 6.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.2952880859375, -11.879638671875, -11.4639892578125, -11.04833984375, -10.6326904296875, -10.217041015625, -9.8013916015625, -9.3857421875, -8.9700927734375, -8.554443359375, -8.1387939453125, -7.72314453125, -7.3074951171875, -6.891845703125, -6.4761962890625, -6.060546875, -5.6448974609375, -5.229248046875, -4.8135986328125, -4.39794921875, -3.9822998046875, -3.566650390625, -3.1510009765625, -2.7353515625, -2.3197021484375, -1.904052734375, -1.4884033203125, -1.07275390625, -0.6571044921875, -0.241455078125, 0.1741943359375, 0.58984375, 1.0054931640625, 1.421142578125, 1.8367919921875, 2.25244140625, 2.6680908203125, 3.083740234375, 3.4993896484375, 3.9150390625, 4.3306884765625, 4.746337890625, 5.1619873046875, 5.57763671875, 5.9932861328125, 6.408935546875, 6.8245849609375, 7.240234375, 7.6558837890625, 8.071533203125, 8.4871826171875, 8.90283203125, 9.3184814453125, 9.734130859375, 10.1497802734375, 10.5654296875, 10.9810791015625, 11.396728515625, 11.8123779296875, 12.22802734375, 12.6436767578125, 13.059326171875, 13.4749755859375, 13.890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 15.0, 9.0, 17.0, 30.0, 41.0, 32.0, 65.0, 83.0, 91.0, 130.0, 181.0, 260.0, 366.0, 568.0, 895.0, 1665.0, 3184.0, 6844.0, 16959.0, 45408.0, 129816.0, 459896.0, 250378.0, 80537.0, 29081.0, 11097.0, 4865.0, 2389.0, 1290.0, 795.0, 428.0, 282.0, 220.0, 150.0, 113.0, 93.0, 69.0, 51.0, 35.0, 37.0, 25.0, 21.0, 11.0, 8.0, 4.0, 6.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.703125, -10.3553466796875, -10.007568359375, -9.6597900390625, -9.31201171875, -8.9642333984375, -8.616455078125, -8.2686767578125, -7.9208984375, -7.5731201171875, -7.225341796875, -6.8775634765625, -6.52978515625, -6.1820068359375, -5.834228515625, -5.4864501953125, -5.138671875, -4.7908935546875, -4.443115234375, -4.0953369140625, -3.74755859375, -3.3997802734375, -3.052001953125, -2.7042236328125, -2.3564453125, -2.0086669921875, -1.660888671875, -1.3131103515625, -0.96533203125, -0.6175537109375, -0.269775390625, 0.0780029296875, 0.42578125, 0.7735595703125, 1.121337890625, 1.4691162109375, 1.81689453125, 2.1646728515625, 2.512451171875, 2.8602294921875, 3.2080078125, 3.5557861328125, 3.903564453125, 4.2513427734375, 4.59912109375, 4.9468994140625, 5.294677734375, 5.6424560546875, 5.990234375, 6.3380126953125, 6.685791015625, 7.0335693359375, 7.38134765625, 7.7291259765625, 8.076904296875, 8.4246826171875, 8.7724609375, 9.1202392578125, 9.468017578125, 9.8157958984375, 10.16357421875, 10.5113525390625, 10.859130859375, 11.2069091796875, 11.5546875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 4.0, 5.0, 7.0, 9.0, 12.0, 19.0, 17.0, 14.0, 28.0, 20.0, 27.0, 24.0, 34.0, 43.0, 34.0, 51.0, 50.0, 62.0, 121.0, 1572.0, 341.0, 104.0, 63.0, 50.0, 51.0, 49.0, 30.0, 37.0, 31.0, 24.0, 21.0, 20.0, 10.0, 15.0, 13.0, 9.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-44.875, -43.55078125, -42.2265625, -40.90234375, -39.578125, -38.25390625, -36.9296875, -35.60546875, -34.28125, -32.95703125, -31.6328125, -30.30859375, -28.984375, -27.66015625, -26.3359375, -25.01171875, -23.6875, -22.36328125, -21.0390625, -19.71484375, -18.390625, -17.06640625, -15.7421875, -14.41796875, -13.09375, -11.76953125, -10.4453125, -9.12109375, -7.796875, -6.47265625, -5.1484375, -3.82421875, -2.5, -1.17578125, 0.1484375, 1.47265625, 2.796875, 4.12109375, 5.4453125, 6.76953125, 8.09375, 9.41796875, 10.7421875, 12.06640625, 13.390625, 14.71484375, 16.0390625, 17.36328125, 18.6875, 20.01171875, 21.3359375, 22.66015625, 23.984375, 25.30859375, 26.6328125, 27.95703125, 29.28125, 30.60546875, 31.9296875, 33.25390625, 34.578125, 35.90234375, 37.2265625, 38.55078125, 39.875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 3.0, 4.0, 7.0, 18.0, 24.0, 45.0, 59.0, 106.0, 163.0, 297.0, 551.0, 3451.0, 3132244.0, 7274.0, 671.0, 318.0, 176.0, 105.0, 69.0, 60.0, 28.0, 16.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.75, -176.962890625, -171.17578125, -165.388671875, -159.6015625, -153.814453125, -148.02734375, -142.240234375, -136.453125, -130.666015625, -124.87890625, -119.091796875, -113.3046875, -107.517578125, -101.73046875, -95.943359375, -90.15625, -84.369140625, -78.58203125, -72.794921875, -67.0078125, -61.220703125, -55.43359375, -49.646484375, -43.859375, -38.072265625, -32.28515625, -26.498046875, -20.7109375, -14.923828125, -9.13671875, -3.349609375, 2.4375, 8.224609375, 14.01171875, 19.798828125, 25.5859375, 31.373046875, 37.16015625, 42.947265625, 48.734375, 54.521484375, 60.30859375, 66.095703125, 71.8828125, 77.669921875, 83.45703125, 89.244140625, 95.03125, 100.818359375, 106.60546875, 112.392578125, 118.1796875, 123.966796875, 129.75390625, 135.541015625, 141.328125, 147.115234375, 152.90234375, 158.689453125, 164.4765625, 170.263671875, 176.05078125, 181.837890625, 187.625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 617.0, 389.0, 5.0, 2.0], "bins": [-958.7362060546875, -942.990478515625, -927.2448120117188, -911.4990844726562, -895.75341796875, -880.0076904296875, -864.2620239257812, -848.5162963867188, -832.7706298828125, -817.02490234375, -801.2792358398438, -785.5335083007812, -769.787841796875, -754.0421142578125, -738.2964477539062, -722.5507202148438, -706.8050537109375, -691.059326171875, -675.3136596679688, -659.5679321289062, -643.822265625, -628.0765380859375, -612.3308715820312, -596.5851440429688, -580.8394165039062, -565.0936889648438, -549.3480224609375, -533.602294921875, -517.8566284179688, -502.1109313964844, -486.365234375, -470.6195068359375, -454.87384033203125, -439.1281433105469, -423.3824462890625, -407.6367492675781, -391.89105224609375, -376.1453552246094, -360.399658203125, -344.6539306640625, -328.9082336425781, -313.16253662109375, -297.4168395996094, -281.671142578125, -265.9254455566406, -250.17974853515625, -234.4340362548828, -218.68833923339844, -202.94264221191406, -187.1969451904297, -171.4512481689453, -155.70553588867188, -139.9598388671875, -124.21414947509766, -108.46844482421875, -92.72274780273438, -76.97705078125, -61.231353759765625, -45.485652923583984, -29.739952087402344, -13.994255065917969, 1.7514419555664062, 17.497146606445312, 33.24284362792969, 48.9885368347168]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 5.0, 10.0, 10.0, 10.0, 13.0, 13.0, 13.0, 19.0, 18.0, 22.0, 32.0, 35.0, 18.0, 29.0, 37.0, 40.0, 42.0, 44.0, 58.0, 41.0, 45.0, 38.0, 45.0, 42.0, 34.0, 36.0, 28.0, 32.0, 22.0, 33.0, 24.0, 22.0, 13.0, 9.0, 11.0, 8.0, 9.0, 5.0, 4.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-114.29349517822266, -110.54558563232422, -106.79767608642578, -103.04976654052734, -99.30184936523438, -95.55393981933594, -91.8060302734375, -88.05812072753906, -84.31021118164062, -80.56230163574219, -76.81439208984375, -73.06648254394531, -69.31857299804688, -65.57066345214844, -61.82274627685547, -58.07483673095703, -54.326927185058594, -50.579017639160156, -46.83110809326172, -43.083194732666016, -39.33528518676758, -35.58737564086914, -31.83946418762207, -28.091552734375, -24.343643188476562, -20.595733642578125, -16.847822189331055, -13.0999116897583, -9.352001190185547, -5.604091644287109, -1.856180191040039, 1.8917312622070312, 5.6396484375, 9.387558937072754, 13.135469436645508, 16.883380889892578, 20.631290435791016, 24.379199981689453, 28.127111434936523, 31.875022888183594, 35.62293243408203, 39.37084197998047, 43.118751525878906, 46.86666488647461, 50.61457443237305, 54.362483978271484, 58.11039733886719, 61.858306884765625, 65.60621643066406, 69.3541259765625, 73.10203552246094, 76.84994506835938, 80.59785461425781, 84.34576416015625, 88.09368133544922, 91.84159088134766, 95.5895004272461, 99.33740997314453, 103.08531951904297, 106.8332290649414, 110.58114624023438, 114.32905578613281, 118.07696533203125, 121.82487487792969, 125.57278442382812]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 12.0, 10.0, 7.0, 21.0, 11.0, 32.0, 27.0, 33.0, 30.0, 31.0, 28.0, 38.0, 45.0, 31.0, 57.0, 57.0, 37.0, 50.0, 52.0, 47.0, 47.0, 31.0, 41.0, 19.0, 21.0, 24.0, 21.0, 24.0, 26.0, 16.0, 17.0, 10.0, 7.0, 5.0, 6.0, 6.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.4000244140625, -12.956298828125, -12.5125732421875, -12.06884765625, -11.6251220703125, -11.181396484375, -10.7376708984375, -10.2939453125, -9.8502197265625, -9.406494140625, -8.9627685546875, -8.51904296875, -8.0753173828125, -7.631591796875, -7.1878662109375, -6.744140625, -6.3004150390625, -5.856689453125, -5.4129638671875, -4.96923828125, -4.5255126953125, -4.081787109375, -3.6380615234375, -3.1943359375, -2.7506103515625, -2.306884765625, -1.8631591796875, -1.41943359375, -0.9757080078125, -0.531982421875, -0.0882568359375, 0.35546875, 0.7991943359375, 1.242919921875, 1.6866455078125, 2.13037109375, 2.5740966796875, 3.017822265625, 3.4615478515625, 3.9052734375, 4.3489990234375, 4.792724609375, 5.2364501953125, 5.68017578125, 6.1239013671875, 6.567626953125, 7.0113525390625, 7.455078125, 7.8988037109375, 8.342529296875, 8.7862548828125, 9.22998046875, 9.6737060546875, 10.117431640625, 10.5611572265625, 11.0048828125, 11.4486083984375, 11.892333984375, 12.3360595703125, 12.77978515625, 13.2235107421875, 13.667236328125, 14.1109619140625, 14.5546875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 3.0, 8.0, 8.0, 10.0, 9.0, 12.0, 17.0, 16.0, 21.0, 22.0, 24.0, 30.0, 35.0, 39.0, 79.0, 137.0, 454.0, 1794.0, 19137.0, 1103636.0, 2986106.0, 77615.0, 3796.0, 692.0, 209.0, 85.0, 42.0, 32.0, 25.0, 25.0, 19.0, 26.0, 15.0, 27.0, 16.0, 12.0, 16.0, 6.0, 8.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.34375, -45.77587890625, -44.2080078125, -42.64013671875, -41.072265625, -39.50439453125, -37.9365234375, -36.36865234375, -34.80078125, -33.23291015625, -31.6650390625, -30.09716796875, -28.529296875, -26.96142578125, -25.3935546875, -23.82568359375, -22.2578125, -20.68994140625, -19.1220703125, -17.55419921875, -15.986328125, -14.41845703125, -12.8505859375, -11.28271484375, -9.71484375, -8.14697265625, -6.5791015625, -5.01123046875, -3.443359375, -1.87548828125, -0.3076171875, 1.26025390625, 2.828125, 4.39599609375, 5.9638671875, 7.53173828125, 9.099609375, 10.66748046875, 12.2353515625, 13.80322265625, 15.37109375, 16.93896484375, 18.5068359375, 20.07470703125, 21.642578125, 23.21044921875, 24.7783203125, 26.34619140625, 27.9140625, 29.48193359375, 31.0498046875, 32.61767578125, 34.185546875, 35.75341796875, 37.3212890625, 38.88916015625, 40.45703125, 42.02490234375, 43.5927734375, 45.16064453125, 46.728515625, 48.29638671875, 49.8642578125, 51.43212890625, 53.0]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 12.0, 5.0, 8.0, 13.0, 25.0, 27.0, 36.0, 54.0, 71.0, 81.0, 106.0, 173.0, 202.0, 276.0, 418.0, 437.0, 474.0, 398.0, 335.0, 245.0, 204.0, 117.0, 78.0, 74.0, 48.0, 44.0, 33.0, 23.0, 12.0, 11.0, 4.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.234375, -26.41455078125, -25.5947265625, -24.77490234375, -23.955078125, -23.13525390625, -22.3154296875, -21.49560546875, -20.67578125, -19.85595703125, -19.0361328125, -18.21630859375, -17.396484375, -16.57666015625, -15.7568359375, -14.93701171875, -14.1171875, -13.29736328125, -12.4775390625, -11.65771484375, -10.837890625, -10.01806640625, -9.1982421875, -8.37841796875, -7.55859375, -6.73876953125, -5.9189453125, -5.09912109375, -4.279296875, -3.45947265625, -2.6396484375, -1.81982421875, -1.0, -0.18017578125, 0.6396484375, 1.45947265625, 2.279296875, 3.09912109375, 3.9189453125, 4.73876953125, 5.55859375, 6.37841796875, 7.1982421875, 8.01806640625, 8.837890625, 9.65771484375, 10.4775390625, 11.29736328125, 12.1171875, 12.93701171875, 13.7568359375, 14.57666015625, 15.396484375, 16.21630859375, 17.0361328125, 17.85595703125, 18.67578125, 19.49560546875, 20.3154296875, 21.13525390625, 21.955078125, 22.77490234375, 23.5947265625, 24.41455078125, 25.234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 8.0, 12.0, 11.0, 11.0, 16.0, 24.0, 29.0, 37.0, 45.0, 72.0, 83.0, 102.0, 133.0, 148.0, 230.0, 362.0, 605.0, 2983.0, 157010.0, 3976423.0, 52178.0, 1844.0, 559.0, 300.0, 210.0, 174.0, 124.0, 131.0, 85.0, 59.0, 48.0, 53.0, 43.0, 30.0, 22.0, 11.0, 12.0, 11.0, 16.0, 7.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-89.75, -86.697265625, -83.64453125, -80.591796875, -77.5390625, -74.486328125, -71.43359375, -68.380859375, -65.328125, -62.275390625, -59.22265625, -56.169921875, -53.1171875, -50.064453125, -47.01171875, -43.958984375, -40.90625, -37.853515625, -34.80078125, -31.748046875, -28.6953125, -25.642578125, -22.58984375, -19.537109375, -16.484375, -13.431640625, -10.37890625, -7.326171875, -4.2734375, -1.220703125, 1.83203125, 4.884765625, 7.9375, 10.990234375, 14.04296875, 17.095703125, 20.1484375, 23.201171875, 26.25390625, 29.306640625, 32.359375, 35.412109375, 38.46484375, 41.517578125, 44.5703125, 47.623046875, 50.67578125, 53.728515625, 56.78125, 59.833984375, 62.88671875, 65.939453125, 68.9921875, 72.044921875, 75.09765625, 78.150390625, 81.203125, 84.255859375, 87.30859375, 90.361328125, 93.4140625, 96.466796875, 99.51953125, 102.572265625, 105.625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 44.0, 188.0, 391.0, 290.0, 80.0, 12.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-503.3935241699219, -491.60693359375, -479.82037353515625, -468.0337829589844, -456.2471923828125, -444.46063232421875, -432.6740417480469, -420.887451171875, -409.10089111328125, -397.3143005371094, -385.5277404785156, -373.74114990234375, -361.9545593261719, -350.1679992675781, -338.38140869140625, -326.5948486328125, -314.8082275390625, -303.0216369628906, -291.2350769042969, -279.448486328125, -267.6618957519531, -255.87533569335938, -244.0887451171875, -232.3021697998047, -220.51559448242188, -208.72901916503906, -196.9424285888672, -185.15585327148438, -173.36927795410156, -161.58270263671875, -149.79611206054688, -138.00953674316406, -126.22294616699219, -114.43636322021484, -102.64978790283203, -90.86320495605469, -79.07662963867188, -67.29004669189453, -55.50346374511719, -43.716888427734375, -31.93030548095703, -20.143726348876953, -8.357145309448242, 3.4294357299804688, 15.216014862060547, 27.002593994140625, 38.78917694091797, 50.57575225830078, 62.362335205078125, 74.14891815185547, 85.93549346923828, 97.72207641601562, 109.50865173339844, 121.29523468017578, 133.08181762695312, 144.86839294433594, 156.65496826171875, 168.44154357910156, 180.22813415527344, 192.01470947265625, 203.80128479003906, 215.58786010742188, 227.37445068359375, 239.16102600097656, 250.94761657714844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 2.0, 14.0, 9.0, 11.0, 11.0, 9.0, 18.0, 21.0, 19.0, 16.0, 30.0, 22.0, 29.0, 39.0, 45.0, 31.0, 35.0, 38.0, 41.0, 54.0, 43.0, 38.0, 42.0, 41.0, 29.0, 38.0, 27.0, 35.0, 31.0, 20.0, 27.0, 20.0, 20.0, 11.0, 18.0, 10.0, 12.0, 11.0, 14.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.47265625, -82.67277526855469, -79.87289428710938, -77.0730209350586, -74.27313995361328, -71.47325897216797, -68.67337799072266, -65.87350463867188, -63.07362365722656, -60.27374267578125, -57.4738655090332, -54.67398452758789, -51.874107360839844, -49.07422637939453, -46.27434539794922, -43.47446823120117, -40.67458724975586, -37.87470626831055, -35.0748291015625, -32.27494812011719, -29.47507095336914, -26.675189971923828, -23.87531089782715, -21.07543182373047, -18.27555274963379, -15.47567367553711, -12.67579460144043, -9.875914573669434, -7.076035499572754, -4.276156425476074, -1.4762763977050781, 1.3236026763916016, 4.123481750488281, 6.923360824584961, 9.72323989868164, 12.523119926452637, 15.322999000549316, 18.122879028320312, 20.922758102416992, 23.722637176513672, 26.52251625061035, 29.32239532470703, 32.122276306152344, 34.92215347290039, 37.7220344543457, 40.52191162109375, 43.32179260253906, 46.121673583984375, 48.92155075073242, 51.721431732177734, 54.52130889892578, 57.321189880371094, 60.12106704711914, 62.92094802856445, 65.7208251953125, 68.52070617675781, 71.32058715820312, 74.12046813964844, 76.92034912109375, 79.72022247314453, 82.52010345458984, 85.31998443603516, 88.11986541748047, 90.91973876953125, 93.71961975097656]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 22.0, 19.0, 13.0, 18.0, 22.0, 32.0, 35.0, 37.0, 29.0, 38.0, 43.0, 39.0, 36.0, 38.0, 50.0, 35.0, 50.0, 40.0, 42.0, 41.0, 28.0, 31.0, 32.0, 33.0, 24.0, 15.0, 17.0, 19.0, 23.0, 18.0, 11.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.7265625, -12.3148193359375, -11.903076171875, -11.4913330078125, -11.07958984375, -10.6678466796875, -10.256103515625, -9.8443603515625, -9.4326171875, -9.0208740234375, -8.609130859375, -8.1973876953125, -7.78564453125, -7.3739013671875, -6.962158203125, -6.5504150390625, -6.138671875, -5.7269287109375, -5.315185546875, -4.9034423828125, -4.49169921875, -4.0799560546875, -3.668212890625, -3.2564697265625, -2.8447265625, -2.4329833984375, -2.021240234375, -1.6094970703125, -1.19775390625, -0.7860107421875, -0.374267578125, 0.0374755859375, 0.44921875, 0.8609619140625, 1.272705078125, 1.6844482421875, 2.09619140625, 2.5079345703125, 2.919677734375, 3.3314208984375, 3.7431640625, 4.1549072265625, 4.566650390625, 4.9783935546875, 5.39013671875, 5.8018798828125, 6.213623046875, 6.6253662109375, 7.037109375, 7.4488525390625, 7.860595703125, 8.2723388671875, 8.68408203125, 9.0958251953125, 9.507568359375, 9.9193115234375, 10.3310546875, 10.7427978515625, 11.154541015625, 11.5662841796875, 11.97802734375, 12.3897705078125, 12.801513671875, 13.2132568359375, 13.625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 7.0, 5.0, 16.0, 13.0, 37.0, 41.0, 69.0, 125.0, 146.0, 233.0, 314.0, 488.0, 730.0, 1092.0, 1664.0, 2514.0, 3622.0, 5608.0, 7980.0, 12251.0, 17684.0, 26340.0, 38053.0, 55742.0, 79479.0, 115094.0, 159325.0, 157473.0, 113157.0, 78003.0, 54340.0, 37439.0, 25744.0, 17468.0, 11943.0, 7985.0, 5334.0, 3632.0, 2424.0, 1638.0, 1093.0, 715.0, 488.0, 339.0, 222.0, 153.0, 105.0, 58.0, 44.0, 37.0, 21.0, 16.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.103515625, -1.0654296875, -1.02734375, -0.9892578125, -0.951171875, -0.9130859375, -0.875, -0.8369140625, -0.798828125, -0.7607421875, -0.72265625, -0.6845703125, -0.646484375, -0.6083984375, -0.5703125, -0.5322265625, -0.494140625, -0.4560546875, -0.41796875, -0.3798828125, -0.341796875, -0.3037109375, -0.265625, -0.2275390625, -0.189453125, -0.1513671875, -0.11328125, -0.0751953125, -0.037109375, 0.0009765625, 0.0390625, 0.0771484375, 0.115234375, 0.1533203125, 0.19140625, 0.2294921875, 0.267578125, 0.3056640625, 0.34375, 0.3818359375, 0.419921875, 0.4580078125, 0.49609375, 0.5341796875, 0.572265625, 0.6103515625, 0.6484375, 0.6865234375, 0.724609375, 0.7626953125, 0.80078125, 0.8388671875, 0.876953125, 0.9150390625, 0.953125, 0.9912109375, 1.029296875, 1.0673828125, 1.10546875, 1.1435546875, 1.181640625, 1.2197265625, 1.2578125, 1.2958984375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 3.0, 7.0, 18.0, 13.0, 8.0, 16.0, 26.0, 11.0, 17.0, 26.0, 36.0, 24.0, 36.0, 32.0, 35.0, 37.0, 35.0, 49.0, 38.0, 1067.0, 36.0, 45.0, 42.0, 42.0, 37.0, 39.0, 30.0, 26.0, 32.0, 21.0, 27.0, 15.0, 15.0, 13.0, 10.0, 12.0, 4.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.85052490234375, -8.5838623046875, -8.31719970703125, -8.050537109375, -7.78387451171875, -7.5172119140625, -7.25054931640625, -6.98388671875, -6.71722412109375, -6.4505615234375, -6.18389892578125, -5.917236328125, -5.65057373046875, -5.3839111328125, -5.11724853515625, -4.8505859375, -4.58392333984375, -4.3172607421875, -4.05059814453125, -3.783935546875, -3.51727294921875, -3.2506103515625, -2.98394775390625, -2.71728515625, -2.45062255859375, -2.1839599609375, -1.91729736328125, -1.650634765625, -1.38397216796875, -1.1173095703125, -0.85064697265625, -0.583984375, -0.31732177734375, -0.0506591796875, 0.21600341796875, 0.482666015625, 0.74932861328125, 1.0159912109375, 1.28265380859375, 1.54931640625, 1.81597900390625, 2.0826416015625, 2.34930419921875, 2.615966796875, 2.88262939453125, 3.1492919921875, 3.41595458984375, 3.6826171875, 3.94927978515625, 4.2159423828125, 4.48260498046875, 4.749267578125, 5.01593017578125, 5.2825927734375, 5.54925537109375, 5.81591796875, 6.08258056640625, 6.3492431640625, 6.61590576171875, 6.882568359375, 7.14923095703125, 7.4158935546875, 7.68255615234375, 7.94921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 10.0, 29.0, 27.0, 61.0, 55.0, 124.0, 149.0, 260.0, 340.0, 515.0, 770.0, 1145.0, 1731.0, 2545.0, 3930.0, 5892.0, 8806.0, 13401.0, 20150.0, 30946.0, 47681.0, 73647.0, 117275.0, 186466.0, 1234562.0, 123423.0, 77543.0, 50100.0, 32549.0, 21399.0, 14147.0, 9132.0, 6079.0, 4119.0, 2699.0, 1706.0, 1185.0, 833.0, 537.0, 385.0, 264.0, 176.0, 100.0, 82.0, 38.0, 40.0, 25.0, 19.0, 16.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.3564453125, -1.3141326904296875, -1.271820068359375, -1.2295074462890625, -1.18719482421875, -1.1448822021484375, -1.102569580078125, -1.0602569580078125, -1.0179443359375, -0.9756317138671875, -0.933319091796875, -0.8910064697265625, -0.84869384765625, -0.8063812255859375, -0.764068603515625, -0.7217559814453125, -0.679443359375, -0.6371307373046875, -0.594818115234375, -0.5525054931640625, -0.51019287109375, -0.4678802490234375, -0.425567626953125, -0.3832550048828125, -0.3409423828125, -0.2986297607421875, -0.256317138671875, -0.2140045166015625, -0.17169189453125, -0.1293792724609375, -0.087066650390625, -0.0447540283203125, -0.00244140625, 0.0398712158203125, 0.082183837890625, 0.1244964599609375, 0.16680908203125, 0.2091217041015625, 0.251434326171875, 0.2937469482421875, 0.3360595703125, 0.3783721923828125, 0.420684814453125, 0.4629974365234375, 0.50531005859375, 0.5476226806640625, 0.589935302734375, 0.6322479248046875, 0.674560546875, 0.7168731689453125, 0.759185791015625, 0.8014984130859375, 0.84381103515625, 0.8861236572265625, 0.928436279296875, 0.9707489013671875, 1.0130615234375, 1.0553741455078125, 1.097686767578125, 1.1399993896484375, 1.18231201171875, 1.2246246337890625, 1.266937255859375, 1.3092498779296875, 1.3515625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 5.0, 3.0, 14.0, 10.0, 8.0, 22.0, 22.0, 23.0, 29.0, 37.0, 50.0, 53.0, 43.0, 73.0, 68.0, 54.0, 61.0, 61.0, 72.0, 50.0, 51.0, 38.0, 37.0, 19.0, 21.0, 17.0, 15.0, 11.0, 7.0, 6.0, 4.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019989013671875, -0.0019109547138214111, -0.0018230080604553223, -0.0017350614070892334, -0.0016471147537231445, -0.0015591681003570557, -0.0014712214469909668, -0.001383274793624878, -0.001295328140258789, -0.0012073814868927002, -0.0011194348335266113, -0.0010314881801605225, -0.0009435415267944336, -0.0008555948734283447, -0.0007676482200622559, -0.000679701566696167, -0.0005917549133300781, -0.0005038082599639893, -0.0004158616065979004, -0.0003279149532318115, -0.00023996829986572266, -0.0001520216464996338, -6.407499313354492e-05, 2.3871660232543945e-05, 0.00011181831359863281, 0.00019976496696472168, 0.00028771162033081055, 0.0003756582736968994, 0.0004636049270629883, 0.0005515515804290771, 0.000639498233795166, 0.0007274448871612549, 0.0008153915405273438, 0.0009033381938934326, 0.0009912848472595215, 0.0010792315006256104, 0.0011671781539916992, 0.001255124807357788, 0.001343071460723877, 0.0014310181140899658, 0.0015189647674560547, 0.0016069114208221436, 0.0016948580741882324, 0.0017828047275543213, 0.0018707513809204102, 0.001958698034286499, 0.002046644687652588, 0.0021345913410186768, 0.0022225379943847656, 0.0023104846477508545, 0.0023984313011169434, 0.0024863779544830322, 0.002574324607849121, 0.00266227126121521, 0.002750217914581299, 0.0028381645679473877, 0.0029261112213134766, 0.0030140578746795654, 0.0031020045280456543, 0.003189951181411743, 0.003277897834777832, 0.003365844488143921, 0.0034537911415100098, 0.0035417377948760986, 0.0036296844482421875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 6.0, 9.0, 10.0, 16.0, 15.0, 27.0, 23.0, 41.0, 57.0, 86.0, 114.0, 184.0, 537.0, 2724.0, 1029329.0, 13835.0, 802.0, 252.0, 126.0, 72.0, 61.0, 51.0, 35.0, 30.0, 28.0, 14.0, 9.0, 14.0, 10.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.08477783203125, -0.08269214630126953, -0.08060646057128906, -0.0785207748413086, -0.07643508911132812, -0.07434940338134766, -0.07226371765136719, -0.07017803192138672, -0.06809234619140625, -0.06600666046142578, -0.06392097473144531, -0.061835289001464844, -0.059749603271484375, -0.057663917541503906, -0.05557823181152344, -0.05349254608154297, -0.0514068603515625, -0.04932117462158203, -0.04723548889160156, -0.045149803161621094, -0.043064117431640625, -0.040978431701660156, -0.03889274597167969, -0.03680706024169922, -0.03472137451171875, -0.03263568878173828, -0.030550003051757812, -0.028464317321777344, -0.026378631591796875, -0.024292945861816406, -0.022207260131835938, -0.02012157440185547, -0.018035888671875, -0.01595020294189453, -0.013864517211914062, -0.011778831481933594, -0.009693145751953125, -0.007607460021972656, -0.0055217742919921875, -0.0034360885620117188, -0.00135040283203125, 0.0007352828979492188, 0.0028209686279296875, 0.004906654357910156, 0.006992340087890625, 0.009078025817871094, 0.011163711547851562, 0.013249397277832031, 0.0153350830078125, 0.01742076873779297, 0.019506454467773438, 0.021592140197753906, 0.023677825927734375, 0.025763511657714844, 0.027849197387695312, 0.02993488311767578, 0.03202056884765625, 0.03410625457763672, 0.03619194030761719, 0.038277626037597656, 0.040363311767578125, 0.042448997497558594, 0.04453468322753906, 0.04662036895751953, 0.0487060546875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 92.0, 723.0, 188.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002585046924650669, -0.0022451633121818304, -0.0019052796997129917, -0.001565396087244153, -0.0012255124747753143, -0.0008856288623064756, -0.000545745249837637, -0.00020586163736879826, 0.00013402197510004044, 0.00047390558756887913, 0.0008137892000377178, 0.0011536728125065565, 0.0014935564249753952, 0.001833440037444234, 0.0021733236499130726, 0.0025132072623819113, 0.00285309087485075, 0.0031929744873195887, 0.0035328580997884274, 0.003872741712257266, 0.004212625324726105, 0.0045525087043643, 0.004892392549663782, 0.0052322763949632645, 0.0055721597746014595, 0.0059120431542396545, 0.006251926999539137, 0.006591810844838619, 0.006931694224476814, 0.007271577604115009, 0.007611461449414492, 0.007951345294713974, 0.008291229605674744, 0.008631112985312939, 0.008970996364951134, 0.009310880675911903, 0.009650764055550098, 0.009990647435188293, 0.010330531746149063, 0.010670415125787258, 0.011010298505425453, 0.011350181885063648, 0.011690065264701843, 0.012029949575662613, 0.012369832955300808, 0.012709716334939003, 0.013049600645899773, 0.013389484025537968, 0.013729367405176163, 0.014069250784814358, 0.014409134164452553, 0.014749018475413322, 0.015088901855051517, 0.015428785234689713, 0.015768669545650482, 0.016108551993966103, 0.016448436304926872, 0.016788320615887642, 0.017128203064203262, 0.017468087375164032, 0.0178079716861248, 0.018147854134440422, 0.01848773844540119, 0.018827620893716812, 0.019167505204677582]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 1.0, 4.0, 8.0, 7.0, 8.0, 11.0, 11.0, 15.0, 19.0, 16.0, 21.0, 15.0, 28.0, 27.0, 35.0, 41.0, 33.0, 39.0, 41.0, 34.0, 29.0, 30.0, 43.0, 32.0, 41.0, 47.0, 32.0, 35.0, 16.0, 29.0, 35.0, 30.0, 21.0, 25.0, 16.0, 23.0, 22.0, 15.0, 12.0, 13.0, 5.0, 3.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0011688470840454102, -0.001131356693804264, -0.001093866303563118, -0.001056375913321972, -0.0010188855230808258, -0.0009813951328396797, -0.0009439047425985336, -0.0009064143523573875, -0.0008689239621162415, -0.0008314335718750954, -0.0007939431816339493, -0.0007564527913928032, -0.0007189624011516571, -0.000681472010910511, -0.0006439816206693649, -0.0006064912304282188, -0.0005690008401870728, -0.0005315104499459267, -0.0004940200597047806, -0.0004565296694636345, -0.0004190392792224884, -0.0003815488889813423, -0.00034405849874019623, -0.00030656810849905014, -0.00026907771825790405, -0.00023158732801675797, -0.00019409693777561188, -0.0001566065475344658, -0.0001191161572933197, -8.162576705217361e-05, -4.413537681102753e-05, -6.644986569881439e-06, 3.084540367126465e-05, 6.833579391241074e-05, 0.00010582618415355682, 0.0001433165743947029, 0.000180806964635849, 0.0002182973548769951, 0.0002557877451181412, 0.00029327813535928726, 0.00033076852560043335, 0.00036825891584157944, 0.0004057493060827255, 0.0004432396963238716, 0.0004807300865650177, 0.0005182204768061638, 0.0005557108670473099, 0.000593201257288456, 0.000630691647529602, 0.0006681820377707481, 0.0007056724280118942, 0.0007431628182530403, 0.0007806532084941864, 0.0008181435987353325, 0.0008556339889764786, 0.0008931243792176247, 0.0009306147694587708, 0.0009681051596999168, 0.001005595549941063, 0.001043085940182209, 0.001080576330423355, 0.0011180667206645012, 0.0011555571109056473, 0.0011930475011467934, 0.0012305378913879395]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 22.0, 19.0, 13.0, 18.0, 22.0, 32.0, 35.0, 37.0, 29.0, 38.0, 43.0, 39.0, 36.0, 38.0, 50.0, 35.0, 50.0, 40.0, 42.0, 41.0, 28.0, 31.0, 32.0, 33.0, 24.0, 15.0, 17.0, 19.0, 23.0, 18.0, 11.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.7265625, -12.3148193359375, -11.903076171875, -11.4913330078125, -11.07958984375, -10.6678466796875, -10.256103515625, -9.8443603515625, -9.4326171875, -9.0208740234375, -8.609130859375, -8.1973876953125, -7.78564453125, -7.3739013671875, -6.962158203125, -6.5504150390625, -6.138671875, -5.7269287109375, -5.315185546875, -4.9034423828125, -4.49169921875, -4.0799560546875, -3.668212890625, -3.2564697265625, -2.8447265625, -2.4329833984375, -2.021240234375, -1.6094970703125, -1.19775390625, -0.7860107421875, -0.374267578125, 0.0374755859375, 0.44921875, 0.8609619140625, 1.272705078125, 1.6844482421875, 2.09619140625, 2.5079345703125, 2.919677734375, 3.3314208984375, 3.7431640625, 4.1549072265625, 4.566650390625, 4.9783935546875, 5.39013671875, 5.8018798828125, 6.213623046875, 6.6253662109375, 7.037109375, 7.4488525390625, 7.860595703125, 8.2723388671875, 8.68408203125, 9.0958251953125, 9.507568359375, 9.9193115234375, 10.3310546875, 10.7427978515625, 11.154541015625, 11.5662841796875, 11.97802734375, 12.3897705078125, 12.801513671875, 13.2132568359375, 13.625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 10.0, 11.0, 15.0, 21.0, 36.0, 36.0, 52.0, 58.0, 83.0, 124.0, 181.0, 236.0, 318.0, 491.0, 677.0, 1168.0, 1973.0, 3333.0, 5758.0, 10739.0, 20041.0, 42329.0, 99552.0, 247033.0, 345755.0, 147596.0, 60859.0, 27643.0, 13905.0, 7532.0, 4155.0, 2487.0, 1473.0, 907.0, 593.0, 411.0, 258.0, 192.0, 133.0, 87.0, 75.0, 38.0, 39.0, 27.0, 35.0, 19.0, 12.0, 8.0, 9.0, 8.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-7.578125, -7.33538818359375, -7.0926513671875, -6.84991455078125, -6.607177734375, -6.36444091796875, -6.1217041015625, -5.87896728515625, -5.63623046875, -5.39349365234375, -5.1507568359375, -4.90802001953125, -4.665283203125, -4.42254638671875, -4.1798095703125, -3.93707275390625, -3.6943359375, -3.45159912109375, -3.2088623046875, -2.96612548828125, -2.723388671875, -2.48065185546875, -2.2379150390625, -1.99517822265625, -1.75244140625, -1.50970458984375, -1.2669677734375, -1.02423095703125, -0.781494140625, -0.53875732421875, -0.2960205078125, -0.05328369140625, 0.189453125, 0.43218994140625, 0.6749267578125, 0.91766357421875, 1.160400390625, 1.40313720703125, 1.6458740234375, 1.88861083984375, 2.13134765625, 2.37408447265625, 2.6168212890625, 2.85955810546875, 3.102294921875, 3.34503173828125, 3.5877685546875, 3.83050537109375, 4.0732421875, 4.31597900390625, 4.5587158203125, 4.80145263671875, 5.044189453125, 5.28692626953125, 5.5296630859375, 5.77239990234375, 6.01513671875, 6.25787353515625, 6.5006103515625, 6.74334716796875, 6.986083984375, 7.22882080078125, 7.4715576171875, 7.71429443359375, 7.95703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 14.0, 14.0, 16.0, 24.0, 22.0, 24.0, 28.0, 22.0, 34.0, 41.0, 56.0, 44.0, 70.0, 128.0, 1589.0, 343.0, 111.0, 55.0, 48.0, 52.0, 41.0, 34.0, 34.0, 30.0, 22.0, 27.0, 13.0, 15.0, 17.0, 9.0, 9.0, 8.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.125, -47.67578125, -46.2265625, -44.77734375, -43.328125, -41.87890625, -40.4296875, -38.98046875, -37.53125, -36.08203125, -34.6328125, -33.18359375, -31.734375, -30.28515625, -28.8359375, -27.38671875, -25.9375, -24.48828125, -23.0390625, -21.58984375, -20.140625, -18.69140625, -17.2421875, -15.79296875, -14.34375, -12.89453125, -11.4453125, -9.99609375, -8.546875, -7.09765625, -5.6484375, -4.19921875, -2.75, -1.30078125, 0.1484375, 1.59765625, 3.046875, 4.49609375, 5.9453125, 7.39453125, 8.84375, 10.29296875, 11.7421875, 13.19140625, 14.640625, 16.08984375, 17.5390625, 18.98828125, 20.4375, 21.88671875, 23.3359375, 24.78515625, 26.234375, 27.68359375, 29.1328125, 30.58203125, 32.03125, 33.48046875, 34.9296875, 36.37890625, 37.828125, 39.27734375, 40.7265625, 42.17578125, 43.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 6.0, 10.0, 23.0, 26.0, 24.0, 51.0, 48.0, 77.0, 94.0, 141.0, 188.0, 257.0, 413.0, 1039.0, 66156.0, 3072259.0, 3214.0, 560.0, 328.0, 184.0, 162.0, 127.0, 75.0, 58.0, 43.0, 36.0, 18.0, 16.0, 14.0, 13.0, 15.0, 6.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.25, -124.271484375, -120.29296875, -116.314453125, -112.3359375, -108.357421875, -104.37890625, -100.400390625, -96.421875, -92.443359375, -88.46484375, -84.486328125, -80.5078125, -76.529296875, -72.55078125, -68.572265625, -64.59375, -60.615234375, -56.63671875, -52.658203125, -48.6796875, -44.701171875, -40.72265625, -36.744140625, -32.765625, -28.787109375, -24.80859375, -20.830078125, -16.8515625, -12.873046875, -8.89453125, -4.916015625, -0.9375, 3.041015625, 7.01953125, 10.998046875, 14.9765625, 18.955078125, 22.93359375, 26.912109375, 30.890625, 34.869140625, 38.84765625, 42.826171875, 46.8046875, 50.783203125, 54.76171875, 58.740234375, 62.71875, 66.697265625, 70.67578125, 74.654296875, 78.6328125, 82.611328125, 86.58984375, 90.568359375, 94.546875, 98.525390625, 102.50390625, 106.482421875, 110.4609375, 114.439453125, 118.41796875, 122.396484375, 126.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [73.0, 656.0, 281.0, 11.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.60875129699707, -6.226749420166016, 2.155252456665039, 10.537254333496094, 18.91925621032715, 27.301259994506836, 35.683258056640625, 44.06526184082031, 52.447265625, 60.82926940917969, 69.21127319335938, 77.59326934814453, 85.97527313232422, 94.3572769165039, 102.73927307128906, 111.12127685546875, 119.50328063964844, 127.88528442382812, 136.2672882080078, 144.6492919921875, 153.03128051757812, 161.41329956054688, 169.7952880859375, 178.1772918701172, 186.55929565429688, 194.94129943847656, 203.32330322265625, 211.70530700683594, 220.08731079101562, 228.46929931640625, 236.85130310058594, 245.23330688476562, 253.61529541015625, 261.9972839355469, 270.3793029785156, 278.76129150390625, 287.143310546875, 295.5252990722656, 303.9073181152344, 312.289306640625, 320.67132568359375, 329.0533142089844, 337.4353332519531, 345.81732177734375, 354.1993408203125, 362.5813293457031, 370.9633483886719, 379.3453369140625, 387.7273254394531, 396.10931396484375, 404.4913330078125, 412.8733215332031, 421.2553405761719, 429.6373291015625, 438.01934814453125, 446.4013366699219, 454.7833251953125, 463.1653137207031, 471.5473327636719, 479.9293212890625, 488.31134033203125, 496.6933288574219, 505.0753479003906, 513.4573364257812, 521.83935546875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 11.0, 10.0, 7.0, 19.0, 19.0, 25.0, 26.0, 23.0, 24.0, 28.0, 34.0, 37.0, 27.0, 31.0, 40.0, 36.0, 32.0, 38.0, 31.0, 45.0, 35.0, 42.0, 42.0, 36.0, 41.0, 29.0, 31.0, 23.0, 16.0, 22.0, 20.0, 15.0, 12.0, 16.0, 8.0, 9.0, 6.0, 5.0, 7.0, 3.0, 7.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.27496337890625, -103.82782745361328, -100.38069152832031, -96.93354797363281, -93.48641204833984, -90.03927612304688, -86.5921401977539, -83.14500427246094, -79.69786834716797, -76.250732421875, -72.80359649658203, -69.35646057128906, -65.90931701660156, -62.462181091308594, -59.015045166015625, -55.567909240722656, -52.12076950073242, -48.67363357543945, -45.22649383544922, -41.77935791015625, -38.33222198486328, -34.88508605957031, -31.437946319580078, -27.99081039428711, -24.543672561645508, -21.096534729003906, -17.649398803710938, -14.202260971069336, -10.75512409210205, -7.307987213134766, -3.860849380493164, -0.4137134552001953, 3.0334243774414062, 6.480561256408691, 9.927698135375977, 13.374835968017578, 16.821971893310547, 20.26910972595215, 23.71624755859375, 27.16338348388672, 30.61052131652832, 34.05765914916992, 37.50479507446289, 40.951934814453125, 44.399070739746094, 47.84620666503906, 51.29334259033203, 54.740478515625, 58.187618255615234, 61.6347541809082, 65.08189392089844, 68.5290298461914, 71.97616577148438, 75.42330169677734, 78.87043762207031, 82.31758117675781, 85.76471710205078, 89.21185302734375, 92.65898895263672, 96.10612487792969, 99.55326843261719, 103.00040435791016, 106.44754028320312, 109.8946762084961, 113.34181213378906]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 8.0, 8.0, 11.0, 13.0, 19.0, 18.0, 21.0, 19.0, 25.0, 41.0, 24.0, 32.0, 47.0, 42.0, 34.0, 38.0, 48.0, 36.0, 49.0, 40.0, 47.0, 44.0, 28.0, 44.0, 29.0, 33.0, 24.0, 27.0, 26.0, 20.0, 19.0, 24.0, 11.0, 9.0, 7.0, 6.0, 10.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.09375, -12.6597900390625, -12.225830078125, -11.7918701171875, -11.35791015625, -10.9239501953125, -10.489990234375, -10.0560302734375, -9.6220703125, -9.1881103515625, -8.754150390625, -8.3201904296875, -7.88623046875, -7.4522705078125, -7.018310546875, -6.5843505859375, -6.150390625, -5.7164306640625, -5.282470703125, -4.8485107421875, -4.41455078125, -3.9805908203125, -3.546630859375, -3.1126708984375, -2.6787109375, -2.2447509765625, -1.810791015625, -1.3768310546875, -0.94287109375, -0.5089111328125, -0.074951171875, 0.3590087890625, 0.79296875, 1.2269287109375, 1.660888671875, 2.0948486328125, 2.52880859375, 2.9627685546875, 3.396728515625, 3.8306884765625, 4.2646484375, 4.6986083984375, 5.132568359375, 5.5665283203125, 6.00048828125, 6.4344482421875, 6.868408203125, 7.3023681640625, 7.736328125, 8.1702880859375, 8.604248046875, 9.0382080078125, 9.47216796875, 9.9061279296875, 10.340087890625, 10.7740478515625, 11.2080078125, 11.6419677734375, 12.075927734375, 12.5098876953125, 12.94384765625, 13.3778076171875, 13.811767578125, 14.2457275390625, 14.6796875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 9.0, 8.0, 5.0, 9.0, 14.0, 16.0, 25.0, 21.0, 20.0, 31.0, 38.0, 71.0, 85.0, 140.0, 269.0, 700.0, 2839.0, 24632.0, 609720.0, 3059120.0, 472515.0, 20218.0, 2437.0, 627.0, 229.0, 133.0, 74.0, 56.0, 45.0, 33.0, 26.0, 18.0, 19.0, 14.0, 10.0, 16.0, 8.0, 6.0, 2.0, 9.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.96875, -33.82080078125, -32.6728515625, -31.52490234375, -30.376953125, -29.22900390625, -28.0810546875, -26.93310546875, -25.78515625, -24.63720703125, -23.4892578125, -22.34130859375, -21.193359375, -20.04541015625, -18.8974609375, -17.74951171875, -16.6015625, -15.45361328125, -14.3056640625, -13.15771484375, -12.009765625, -10.86181640625, -9.7138671875, -8.56591796875, -7.41796875, -6.27001953125, -5.1220703125, -3.97412109375, -2.826171875, -1.67822265625, -0.5302734375, 0.61767578125, 1.765625, 2.91357421875, 4.0615234375, 5.20947265625, 6.357421875, 7.50537109375, 8.6533203125, 9.80126953125, 10.94921875, 12.09716796875, 13.2451171875, 14.39306640625, 15.541015625, 16.68896484375, 17.8369140625, 18.98486328125, 20.1328125, 21.28076171875, 22.4287109375, 23.57666015625, 24.724609375, 25.87255859375, 27.0205078125, 28.16845703125, 29.31640625, 30.46435546875, 31.6123046875, 32.76025390625, 33.908203125, 35.05615234375, 36.2041015625, 37.35205078125, 38.5]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 3.0, 9.0, 18.0, 16.0, 26.0, 29.0, 44.0, 72.0, 90.0, 115.0, 164.0, 239.0, 342.0, 455.0, 529.0, 523.0, 415.0, 299.0, 204.0, 136.0, 92.0, 61.0, 56.0, 39.0, 31.0, 15.0, 13.0, 8.0, 8.0, 6.0, 0.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.802734375, -31.88671875, -30.970703125, -30.0546875, -29.138671875, -28.22265625, -27.306640625, -26.390625, -25.474609375, -24.55859375, -23.642578125, -22.7265625, -21.810546875, -20.89453125, -19.978515625, -19.0625, -18.146484375, -17.23046875, -16.314453125, -15.3984375, -14.482421875, -13.56640625, -12.650390625, -11.734375, -10.818359375, -9.90234375, -8.986328125, -8.0703125, -7.154296875, -6.23828125, -5.322265625, -4.40625, -3.490234375, -2.57421875, -1.658203125, -0.7421875, 0.173828125, 1.08984375, 2.005859375, 2.921875, 3.837890625, 4.75390625, 5.669921875, 6.5859375, 7.501953125, 8.41796875, 9.333984375, 10.25, 11.166015625, 12.08203125, 12.998046875, 13.9140625, 14.830078125, 15.74609375, 16.662109375, 17.578125, 18.494140625, 19.41015625, 20.326171875, 21.2421875, 22.158203125, 23.07421875, 23.990234375, 24.90625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 11.0, 9.0, 16.0, 7.0, 14.0, 16.0, 20.0, 27.0, 41.0, 51.0, 72.0, 75.0, 101.0, 135.0, 175.0, 261.0, 388.0, 941.0, 18434.0, 3963438.0, 206287.0, 1971.0, 491.0, 323.0, 220.0, 150.0, 131.0, 104.0, 78.0, 70.0, 56.0, 34.0, 34.0, 28.0, 16.0, 14.0, 11.0, 9.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.75, -96.2744140625, -92.798828125, -89.3232421875, -85.84765625, -82.3720703125, -78.896484375, -75.4208984375, -71.9453125, -68.4697265625, -64.994140625, -61.5185546875, -58.04296875, -54.5673828125, -51.091796875, -47.6162109375, -44.140625, -40.6650390625, -37.189453125, -33.7138671875, -30.23828125, -26.7626953125, -23.287109375, -19.8115234375, -16.3359375, -12.8603515625, -9.384765625, -5.9091796875, -2.43359375, 1.0419921875, 4.517578125, 7.9931640625, 11.46875, 14.9443359375, 18.419921875, 21.8955078125, 25.37109375, 28.8466796875, 32.322265625, 35.7978515625, 39.2734375, 42.7490234375, 46.224609375, 49.7001953125, 53.17578125, 56.6513671875, 60.126953125, 63.6025390625, 67.078125, 70.5537109375, 74.029296875, 77.5048828125, 80.98046875, 84.4560546875, 87.931640625, 91.4072265625, 94.8828125, 98.3583984375, 101.833984375, 105.3095703125, 108.78515625, 112.2607421875, 115.736328125, 119.2119140625, 122.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 13.0, 16.0, 35.0, 56.0, 88.0, 114.0, 145.0, 165.0, 124.0, 101.0, 78.0, 41.0, 20.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.79792022705078, -88.779296875, -84.76066589355469, -80.7420425415039, -76.72341918945312, -72.70479583740234, -68.68617248535156, -64.66754150390625, -60.64891815185547, -56.63029479980469, -52.61166763305664, -48.593040466308594, -44.57441711425781, -40.55579376220703, -36.537166595458984, -32.51853942871094, -28.499916076660156, -24.481290817260742, -20.462665557861328, -16.444040298461914, -12.4254150390625, -8.406789779663086, -4.388164520263672, -0.3695392608642578, 3.6490859985351562, 7.66771125793457, 11.686336517333984, 15.704961776733398, 19.723587036132812, 23.742212295532227, 27.76083755493164, 31.779462814331055, 35.79808044433594, 39.81670379638672, 43.835330963134766, 47.85395812988281, 51.872581481933594, 55.891204833984375, 59.90983200073242, 63.92845916748047, 67.94708251953125, 71.96570587158203, 75.98432922363281, 80.00296020507812, 84.0215835571289, 88.04020690917969, 92.058837890625, 96.07746124267578, 100.09608459472656, 104.11470794677734, 108.13333129882812, 112.15196228027344, 116.17058563232422, 120.189208984375, 124.20783996582031, 128.22645568847656, 132.24508666992188, 136.2637176513672, 140.28233337402344, 144.30096435546875, 148.319580078125, 152.3382110595703, 156.35684204101562, 160.37545776367188, 164.3940887451172]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 15.0, 19.0, 18.0, 15.0, 24.0, 19.0, 21.0, 23.0, 44.0, 42.0, 36.0, 38.0, 33.0, 46.0, 40.0, 41.0, 35.0, 38.0, 45.0, 33.0, 37.0, 32.0, 26.0, 38.0, 35.0, 30.0, 28.0, 19.0, 11.0, 24.0, 19.0, 6.0, 13.0, 9.0, 7.0, 5.0, 9.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-85.63916015625, -83.06629943847656, -80.4934310913086, -77.92057037353516, -75.34770202636719, -72.77484130859375, -70.20198059082031, -67.62911987304688, -65.0562515258789, -62.4833869934082, -59.9105224609375, -57.33766174316406, -54.76479721069336, -52.191932678222656, -49.61907196044922, -47.046207427978516, -44.47334289550781, -41.90047836303711, -39.327613830566406, -36.75475311279297, -34.181888580322266, -31.609024047851562, -29.036161422729492, -26.463298797607422, -23.89043426513672, -21.317569732666016, -18.744707107543945, -16.171844482421875, -13.598979949951172, -11.026116371154785, -8.453252792358398, -5.880390167236328, -3.307525634765625, -0.7346620559692383, 1.8382015228271484, 4.411065101623535, 6.983928680419922, 9.556792259216309, 12.129655838012695, 14.702518463134766, 17.27538299560547, 19.848247528076172, 22.421110153198242, 24.993972778320312, 27.566837310791016, 30.13970184326172, 32.712562561035156, 35.28542709350586, 37.85829162597656, 40.431156158447266, 43.00402069091797, 45.576881408691406, 48.14974594116211, 50.72261047363281, 53.29547119140625, 55.86833572387695, 58.441200256347656, 61.01406478881836, 63.58692932128906, 66.1597900390625, 68.73265075683594, 71.3055191040039, 73.87837982177734, 76.45124816894531, 79.02410888671875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 12.0, 12.0, 13.0, 15.0, 15.0, 16.0, 23.0, 22.0, 23.0, 30.0, 24.0, 35.0, 31.0, 37.0, 38.0, 44.0, 46.0, 39.0, 43.0, 38.0, 33.0, 33.0, 32.0, 45.0, 32.0, 25.0, 33.0, 21.0, 33.0, 21.0, 26.0, 15.0, 12.0, 21.0, 10.0, 7.0, 7.0, 12.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-13.125, -12.73583984375, -12.3466796875, -11.95751953125, -11.568359375, -11.17919921875, -10.7900390625, -10.40087890625, -10.01171875, -9.62255859375, -9.2333984375, -8.84423828125, -8.455078125, -8.06591796875, -7.6767578125, -7.28759765625, -6.8984375, -6.50927734375, -6.1201171875, -5.73095703125, -5.341796875, -4.95263671875, -4.5634765625, -4.17431640625, -3.78515625, -3.39599609375, -3.0068359375, -2.61767578125, -2.228515625, -1.83935546875, -1.4501953125, -1.06103515625, -0.671875, -0.28271484375, 0.1064453125, 0.49560546875, 0.884765625, 1.27392578125, 1.6630859375, 2.05224609375, 2.44140625, 2.83056640625, 3.2197265625, 3.60888671875, 3.998046875, 4.38720703125, 4.7763671875, 5.16552734375, 5.5546875, 5.94384765625, 6.3330078125, 6.72216796875, 7.111328125, 7.50048828125, 7.8896484375, 8.27880859375, 8.66796875, 9.05712890625, 9.4462890625, 9.83544921875, 10.224609375, 10.61376953125, 11.0029296875, 11.39208984375, 11.78125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 7.0, 7.0, 17.0, 23.0, 26.0, 49.0, 72.0, 106.0, 167.0, 211.0, 353.0, 518.0, 769.0, 1194.0, 1804.0, 2675.0, 4141.0, 6095.0, 9253.0, 13695.0, 20168.0, 29775.0, 43730.0, 64622.0, 97528.0, 148555.0, 192997.0, 135876.0, 89682.0, 59596.0, 40627.0, 27630.0, 18647.0, 12771.0, 8410.0, 5710.0, 3768.0, 2468.0, 1603.0, 1062.0, 733.0, 461.0, 322.0, 191.0, 156.0, 111.0, 57.0, 46.0, 34.0, 17.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1461639404296875, -1.105804443359375, -1.0654449462890625, -1.02508544921875, -0.9847259521484375, -0.944366455078125, -0.9040069580078125, -0.8636474609375, -0.8232879638671875, -0.782928466796875, -0.7425689697265625, -0.70220947265625, -0.6618499755859375, -0.621490478515625, -0.5811309814453125, -0.540771484375, -0.5004119873046875, -0.460052490234375, -0.4196929931640625, -0.37933349609375, -0.3389739990234375, -0.298614501953125, -0.2582550048828125, -0.2178955078125, -0.1775360107421875, -0.137176513671875, -0.0968170166015625, -0.05645751953125, -0.0160980224609375, 0.024261474609375, 0.0646209716796875, 0.10498046875, 0.1453399658203125, 0.185699462890625, 0.2260589599609375, 0.26641845703125, 0.3067779541015625, 0.347137451171875, 0.3874969482421875, 0.4278564453125, 0.4682159423828125, 0.508575439453125, 0.5489349365234375, 0.58929443359375, 0.6296539306640625, 0.670013427734375, 0.7103729248046875, 0.750732421875, 0.7910919189453125, 0.831451416015625, 0.8718109130859375, 0.91217041015625, 0.9525299072265625, 0.992889404296875, 1.0332489013671875, 1.0736083984375, 1.1139678955078125, 1.154327392578125, 1.1946868896484375, 1.23504638671875, 1.2754058837890625, 1.315765380859375, 1.3561248779296875, 1.396484375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 14.0, 10.0, 15.0, 16.0, 19.0, 20.0, 19.0, 18.0, 31.0, 26.0, 35.0, 33.0, 39.0, 24.0, 25.0, 37.0, 39.0, 1072.0, 35.0, 43.0, 49.0, 40.0, 32.0, 42.0, 32.0, 23.0, 23.0, 26.0, 13.0, 17.0, 25.0, 12.0, 11.0, 17.0, 9.0, 4.0, 8.0, 6.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0], "bins": [-7.60546875, -7.3714599609375, -7.137451171875, -6.9034423828125, -6.66943359375, -6.4354248046875, -6.201416015625, -5.9674072265625, -5.7333984375, -5.4993896484375, -5.265380859375, -5.0313720703125, -4.79736328125, -4.5633544921875, -4.329345703125, -4.0953369140625, -3.861328125, -3.6273193359375, -3.393310546875, -3.1593017578125, -2.92529296875, -2.6912841796875, -2.457275390625, -2.2232666015625, -1.9892578125, -1.7552490234375, -1.521240234375, -1.2872314453125, -1.05322265625, -0.8192138671875, -0.585205078125, -0.3511962890625, -0.1171875, 0.1168212890625, 0.350830078125, 0.5848388671875, 0.81884765625, 1.0528564453125, 1.286865234375, 1.5208740234375, 1.7548828125, 1.9888916015625, 2.222900390625, 2.4569091796875, 2.69091796875, 2.9249267578125, 3.158935546875, 3.3929443359375, 3.626953125, 3.8609619140625, 4.094970703125, 4.3289794921875, 4.56298828125, 4.7969970703125, 5.031005859375, 5.2650146484375, 5.4990234375, 5.7330322265625, 5.967041015625, 6.2010498046875, 6.43505859375, 6.6690673828125, 6.903076171875, 7.1370849609375, 7.37109375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 12.0, 15.0, 24.0, 33.0, 33.0, 74.0, 126.0, 123.0, 200.0, 316.0, 432.0, 613.0, 918.0, 1445.0, 2074.0, 3020.0, 4581.0, 6853.0, 10344.0, 15519.0, 23491.0, 36068.0, 54937.0, 84824.0, 134353.0, 1238839.0, 167265.0, 108384.0, 69196.0, 45111.0, 29700.0, 19406.0, 12916.0, 8425.0, 5782.0, 3773.0, 2569.0, 1670.0, 1121.0, 816.0, 589.0, 341.0, 250.0, 165.0, 131.0, 84.0, 60.0, 36.0, 26.0, 23.0, 10.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.3125, -1.2724456787109375, -1.232391357421875, -1.1923370361328125, -1.15228271484375, -1.1122283935546875, -1.072174072265625, -1.0321197509765625, -0.9920654296875, -0.9520111083984375, -0.911956787109375, -0.8719024658203125, -0.83184814453125, -0.7917938232421875, -0.751739501953125, -0.7116851806640625, -0.671630859375, -0.6315765380859375, -0.591522216796875, -0.5514678955078125, -0.51141357421875, -0.4713592529296875, -0.431304931640625, -0.3912506103515625, -0.3511962890625, -0.3111419677734375, -0.271087646484375, -0.2310333251953125, -0.19097900390625, -0.1509246826171875, -0.110870361328125, -0.0708160400390625, -0.03076171875, 0.0092926025390625, 0.049346923828125, 0.0894012451171875, 0.12945556640625, 0.1695098876953125, 0.209564208984375, 0.2496185302734375, 0.2896728515625, 0.3297271728515625, 0.369781494140625, 0.4098358154296875, 0.44989013671875, 0.4899444580078125, 0.529998779296875, 0.5700531005859375, 0.610107421875, 0.6501617431640625, 0.690216064453125, 0.7302703857421875, 0.77032470703125, 0.8103790283203125, 0.850433349609375, 0.8904876708984375, 0.9305419921875, 0.9705963134765625, 1.010650634765625, 1.0507049560546875, 1.09075927734375, 1.1308135986328125, 1.170867919921875, 1.2109222412109375, 1.2509765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 8.0, 5.0, 7.0, 7.0, 6.0, 17.0, 17.0, 23.0, 22.0, 28.0, 30.0, 35.0, 41.0, 46.0, 66.0, 61.0, 69.0, 55.0, 70.0, 56.0, 56.0, 47.0, 39.0, 38.0, 24.0, 23.0, 12.0, 19.0, 18.0, 12.0, 8.0, 5.0, 3.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.003932952880859375, -0.0038246214389801025, -0.00371628999710083, -0.0036079585552215576, -0.003499627113342285, -0.0033912956714630127, -0.0032829642295837402, -0.0031746327877044678, -0.0030663013458251953, -0.002957969903945923, -0.0028496384620666504, -0.002741307020187378, -0.0026329755783081055, -0.002524644136428833, -0.0024163126945495605, -0.002307981252670288, -0.0021996498107910156, -0.002091318368911743, -0.0019829869270324707, -0.0018746554851531982, -0.0017663240432739258, -0.0016579926013946533, -0.0015496611595153809, -0.0014413297176361084, -0.001332998275756836, -0.0012246668338775635, -0.001116335391998291, -0.0010080039501190186, -0.0008996725082397461, -0.0007913410663604736, -0.0006830096244812012, -0.0005746781826019287, -0.00046634674072265625, -0.0003580152988433838, -0.00024968385696411133, -0.00014135241508483887, -3.3020973205566406e-05, 7.531046867370605e-05, 0.00018364191055297852, 0.000291973352432251, 0.00040030479431152344, 0.0005086362361907959, 0.0006169676780700684, 0.0007252991199493408, 0.0008336305618286133, 0.0009419620037078857, 0.0010502934455871582, 0.0011586248874664307, 0.0012669563293457031, 0.0013752877712249756, 0.001483619213104248, 0.0015919506549835205, 0.001700282096862793, 0.0018086135387420654, 0.0019169449806213379, 0.0020252764225006104, 0.002133607864379883, 0.0022419393062591553, 0.0023502707481384277, 0.0024586021900177, 0.0025669336318969727, 0.002675265073776245, 0.0027835965156555176, 0.00289192795753479, 0.0030002593994140625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 8.0, 10.0, 9.0, 22.0, 25.0, 34.0, 36.0, 54.0, 72.0, 130.0, 247.0, 792.0, 75769.0, 969297.0, 1167.0, 364.0, 130.0, 92.0, 69.0, 47.0, 31.0, 28.0, 30.0, 17.0, 6.0, 10.0, 6.0, 5.0, 4.0, 3.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.081787109375, -0.07887840270996094, -0.07596969604492188, -0.07306098937988281, -0.07015228271484375, -0.06724357604980469, -0.06433486938476562, -0.06142616271972656, -0.0585174560546875, -0.05560874938964844, -0.052700042724609375, -0.04979133605957031, -0.04688262939453125, -0.04397392272949219, -0.041065216064453125, -0.03815650939941406, -0.035247802734375, -0.03233909606933594, -0.029430389404296875, -0.026521682739257812, -0.02361297607421875, -0.020704269409179688, -0.017795562744140625, -0.014886856079101562, -0.0119781494140625, -0.009069442749023438, -0.006160736083984375, -0.0032520294189453125, -0.00034332275390625, 0.0025653839111328125, 0.005474090576171875, 0.008382797241210938, 0.01129150390625, 0.014200210571289062, 0.017108917236328125, 0.020017623901367188, 0.02292633056640625, 0.025835037231445312, 0.028743743896484375, 0.03165245056152344, 0.0345611572265625, 0.03746986389160156, 0.040378570556640625, 0.04328727722167969, 0.04619598388671875, 0.04910469055175781, 0.052013397216796875, 0.05492210388183594, 0.057830810546875, 0.06073951721191406, 0.06364822387695312, 0.06655693054199219, 0.06946563720703125, 0.07237434387207031, 0.07528305053710938, 0.07819175720214844, 0.0811004638671875, 0.08400917053222656, 0.08691787719726562, 0.08982658386230469, 0.09273529052734375, 0.09564399719238281, 0.09855270385742188, 0.10146141052246094, 0.1043701171875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 13.0, 45.0, 122.0, 277.0, 304.0, 168.0, 58.0, 7.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003455569501966238, -0.0033405963331460953, -0.0032256231643259525, -0.00311064999550581, -0.0029956770595163107, -0.002880703890696168, -0.002765730721876025, -0.0026507575530558825, -0.0025357843842357397, -0.002420811215415597, -0.002305838046595454, -0.002190865110605955, -0.0020758919417858124, -0.0019609187729656696, -0.0018459456041455269, -0.0017309724353253841, -0.0016159993829205632, -0.0015010262141004205, -0.0013860531616955996, -0.0012710799928754568, -0.001156106824055314, -0.0010411336552351713, -0.0009261606028303504, -0.0008111874340102077, -0.0006962143233977258, -0.000581241212785244, -0.00046626804396510124, -0.0003512949333526194, -0.00023632179363630712, -0.00012134865391999483, -6.375543307512999e-06, 0.00010859762551262975, 0.00022357073612511158, 0.00033854387584142387, 0.00045351701555773616, 0.000568490126170218, 0.0006834632949903607, 0.0007984364056028426, 0.0009134095162153244, 0.0010283826850354671, 0.00114335585385561, 0.0012583290226757526, 0.0013733020750805736, 0.0014882752439007163, 0.001603248412720859, 0.00171822146512568, 0.0018331946339458227, 0.0019481678027659655, 0.0020631407387554646, 0.0021781139075756073, 0.00229308707639575, 0.002408060245215893, 0.002523033181205392, 0.0026380063500255346, 0.0027529795188456774, 0.00286795268766582, 0.002982925856485963, 0.0030978990253061056, 0.0032128721941262484, 0.0033278451301157475, 0.00344281829893589, 0.003557791467756033, 0.0036727646365761757, 0.0037877378053963184, 0.003902710974216461]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 5.0, 9.0, 10.0, 8.0, 11.0, 13.0, 13.0, 22.0, 19.0, 31.0, 37.0, 36.0, 37.0, 22.0, 43.0, 43.0, 48.0, 46.0, 45.0, 39.0, 47.0, 57.0, 41.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 23.0, 16.0, 11.0, 14.0, 23.0, 9.0, 13.0, 6.0, 10.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001829385757446289, -0.0017669163644313812, -0.0017044469714164734, -0.0016419775784015656, -0.0015795081853866577, -0.0015170387923717499, -0.001454569399356842, -0.0013921000063419342, -0.0013296306133270264, -0.0012671612203121185, -0.0012046918272972107, -0.0011422224342823029, -0.001079753041267395, -0.0010172836482524872, -0.0009548142552375793, -0.0008923448622226715, -0.0008298754692077637, -0.0007674060761928558, -0.000704936683177948, -0.0006424672901630402, -0.0005799978971481323, -0.0005175285041332245, -0.00045505911111831665, -0.0003925897181034088, -0.000330120325088501, -0.00026765093207359314, -0.0002051815390586853, -0.00014271214604377747, -8.024275302886963e-05, -1.7773360013961792e-05, 4.4696033000946045e-05, 0.00010716542601585388, 0.00016963481903076172, 0.00023210421204566956, 0.0002945736050605774, 0.00035704299807548523, 0.00041951239109039307, 0.0004819817841053009, 0.0005444511771202087, 0.0006069205701351166, 0.0006693899631500244, 0.0007318593561649323, 0.0007943287491798401, 0.0008567981421947479, 0.0009192675352096558, 0.0009817369282245636, 0.0010442063212394714, 0.0011066757142543793, 0.0011691451072692871, 0.001231614500284195, 0.0012940838932991028, 0.0013565532863140106, 0.0014190226793289185, 0.0014814920723438263, 0.0015439614653587341, 0.001606430858373642, 0.0016689002513885498, 0.0017313696444034576, 0.0017938390374183655, 0.0018563084304332733, 0.0019187778234481812, 0.001981247216463089, 0.002043716609477997, 0.0021061860024929047, 0.0021686553955078125]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 12.0, 12.0, 13.0, 15.0, 15.0, 16.0, 23.0, 22.0, 23.0, 30.0, 24.0, 35.0, 31.0, 37.0, 38.0, 44.0, 46.0, 39.0, 43.0, 38.0, 33.0, 33.0, 32.0, 45.0, 32.0, 25.0, 33.0, 21.0, 33.0, 21.0, 26.0, 15.0, 12.0, 21.0, 10.0, 7.0, 7.0, 12.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-13.125, -12.73583984375, -12.3466796875, -11.95751953125, -11.568359375, -11.17919921875, -10.7900390625, -10.40087890625, -10.01171875, -9.62255859375, -9.2333984375, -8.84423828125, -8.455078125, -8.06591796875, -7.6767578125, -7.28759765625, -6.8984375, -6.50927734375, -6.1201171875, -5.73095703125, -5.341796875, -4.95263671875, -4.5634765625, -4.17431640625, -3.78515625, -3.39599609375, -3.0068359375, -2.61767578125, -2.228515625, -1.83935546875, -1.4501953125, -1.06103515625, -0.671875, -0.28271484375, 0.1064453125, 0.49560546875, 0.884765625, 1.27392578125, 1.6630859375, 2.05224609375, 2.44140625, 2.83056640625, 3.2197265625, 3.60888671875, 3.998046875, 4.38720703125, 4.7763671875, 5.16552734375, 5.5546875, 5.94384765625, 6.3330078125, 6.72216796875, 7.111328125, 7.50048828125, 7.8896484375, 8.27880859375, 8.66796875, 9.05712890625, 9.4462890625, 9.83544921875, 10.224609375, 10.61376953125, 11.0029296875, 11.39208984375, 11.78125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 3.0, 15.0, 13.0, 16.0, 26.0, 24.0, 31.0, 53.0, 66.0, 98.0, 157.0, 252.0, 421.0, 846.0, 1870.0, 4100.0, 10766.0, 33324.0, 128890.0, 524250.0, 253101.0, 60941.0, 17708.0, 6239.0, 2617.0, 1182.0, 606.0, 332.0, 170.0, 129.0, 65.0, 68.0, 40.0, 22.0, 33.0, 15.0, 8.0, 11.0, 17.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-12.7109375, -12.3341064453125, -11.957275390625, -11.5804443359375, -11.20361328125, -10.8267822265625, -10.449951171875, -10.0731201171875, -9.6962890625, -9.3194580078125, -8.942626953125, -8.5657958984375, -8.18896484375, -7.8121337890625, -7.435302734375, -7.0584716796875, -6.681640625, -6.3048095703125, -5.927978515625, -5.5511474609375, -5.17431640625, -4.7974853515625, -4.420654296875, -4.0438232421875, -3.6669921875, -3.2901611328125, -2.913330078125, -2.5364990234375, -2.15966796875, -1.7828369140625, -1.406005859375, -1.0291748046875, -0.65234375, -0.2755126953125, 0.101318359375, 0.4781494140625, 0.85498046875, 1.2318115234375, 1.608642578125, 1.9854736328125, 2.3623046875, 2.7391357421875, 3.115966796875, 3.4927978515625, 3.86962890625, 4.2464599609375, 4.623291015625, 5.0001220703125, 5.376953125, 5.7537841796875, 6.130615234375, 6.5074462890625, 6.88427734375, 7.2611083984375, 7.637939453125, 8.0147705078125, 8.3916015625, 8.7684326171875, 9.145263671875, 9.5220947265625, 9.89892578125, 10.2757568359375, 10.652587890625, 11.0294189453125, 11.40625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 10.0, 6.0, 12.0, 15.0, 27.0, 23.0, 31.0, 24.0, 40.0, 43.0, 38.0, 47.0, 40.0, 58.0, 167.0, 1866.0, 133.0, 61.0, 44.0, 47.0, 54.0, 41.0, 34.0, 24.0, 23.0, 24.0, 19.0, 25.0, 9.0, 8.0, 7.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.46875, -37.9716796875, -36.474609375, -34.9775390625, -33.48046875, -31.9833984375, -30.486328125, -28.9892578125, -27.4921875, -25.9951171875, -24.498046875, -23.0009765625, -21.50390625, -20.0068359375, -18.509765625, -17.0126953125, -15.515625, -14.0185546875, -12.521484375, -11.0244140625, -9.52734375, -8.0302734375, -6.533203125, -5.0361328125, -3.5390625, -2.0419921875, -0.544921875, 0.9521484375, 2.44921875, 3.9462890625, 5.443359375, 6.9404296875, 8.4375, 9.9345703125, 11.431640625, 12.9287109375, 14.42578125, 15.9228515625, 17.419921875, 18.9169921875, 20.4140625, 21.9111328125, 23.408203125, 24.9052734375, 26.40234375, 27.8994140625, 29.396484375, 30.8935546875, 32.390625, 33.8876953125, 35.384765625, 36.8818359375, 38.37890625, 39.8759765625, 41.373046875, 42.8701171875, 44.3671875, 45.8642578125, 47.361328125, 48.8583984375, 50.35546875, 51.8525390625, 53.349609375, 54.8466796875, 56.34375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 13.0, 10.0, 6.0, 19.0, 12.0, 29.0, 36.0, 43.0, 51.0, 75.0, 112.0, 175.0, 232.0, 375.0, 928.0, 14898.0, 3120005.0, 6882.0, 680.0, 351.0, 232.0, 141.0, 100.0, 77.0, 54.0, 40.0, 35.0, 20.0, 8.0, 14.0, 16.0, 3.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-124.25, -120.6396484375, -117.029296875, -113.4189453125, -109.80859375, -106.1982421875, -102.587890625, -98.9775390625, -95.3671875, -91.7568359375, -88.146484375, -84.5361328125, -80.92578125, -77.3154296875, -73.705078125, -70.0947265625, -66.484375, -62.8740234375, -59.263671875, -55.6533203125, -52.04296875, -48.4326171875, -44.822265625, -41.2119140625, -37.6015625, -33.9912109375, -30.380859375, -26.7705078125, -23.16015625, -19.5498046875, -15.939453125, -12.3291015625, -8.71875, -5.1083984375, -1.498046875, 2.1123046875, 5.72265625, 9.3330078125, 12.943359375, 16.5537109375, 20.1640625, 23.7744140625, 27.384765625, 30.9951171875, 34.60546875, 38.2158203125, 41.826171875, 45.4365234375, 49.046875, 52.6572265625, 56.267578125, 59.8779296875, 63.48828125, 67.0986328125, 70.708984375, 74.3193359375, 77.9296875, 81.5400390625, 85.150390625, 88.7607421875, 92.37109375, 95.9814453125, 99.591796875, 103.2021484375, 106.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 30.0, 592.0, 389.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-352.5506896972656, -345.6189270019531, -338.68719482421875, -331.75543212890625, -324.8236999511719, -317.8919372558594, -310.9601745605469, -304.0284423828125, -297.0966796875, -290.1649169921875, -283.2331848144531, -276.3014221191406, -269.36968994140625, -262.43792724609375, -255.5061798095703, -248.57443237304688, -241.64266967773438, -234.71092224121094, -227.7791748046875, -220.847412109375, -213.91566467285156, -206.98391723632812, -200.0521697998047, -193.12042236328125, -186.1886749267578, -179.25692749023438, -172.32518005371094, -165.39341735839844, -158.461669921875, -151.52992248535156, -144.59817504882812, -137.66641235351562, -130.73464965820312, -123.80290222167969, -116.87114715576172, -109.93939971923828, -103.00764465332031, -96.07589721679688, -89.14414978027344, -82.21239471435547, -75.28065490722656, -68.34890747070312, -61.417152404785156, -54.48540496826172, -47.55364990234375, -40.62190246582031, -33.69015121459961, -26.758399963378906, -19.826644897460938, -12.894893646240234, -5.963143348693848, 0.9686069488525391, 7.900358200073242, 14.832107543945312, 21.763858795166016, 28.69561004638672, 35.62736129760742, 42.559112548828125, 49.49086380004883, 56.42261505126953, 63.35436248779297, 70.28611755371094, 77.21786499023438, 84.14961242675781, 91.08136749267578]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 10.0, 12.0, 27.0, 17.0, 20.0, 21.0, 28.0, 21.0, 27.0, 40.0, 42.0, 45.0, 41.0, 42.0, 35.0, 42.0, 39.0, 47.0, 43.0, 50.0, 45.0, 29.0, 34.0, 32.0, 18.0, 27.0, 31.0, 24.0, 20.0, 11.0, 13.0, 8.0, 12.0, 7.0, 7.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.52529907226562, -105.02540588378906, -101.52552032470703, -98.025634765625, -94.52574157714844, -91.02584838867188, -87.52596282958984, -84.02607727050781, -80.52618408203125, -77.02629089355469, -73.52640533447266, -70.02651977539062, -66.52662658691406, -63.026737213134766, -59.52684783935547, -56.02695846557617, -52.527069091796875, -49.02717971801758, -45.52729034423828, -42.027400970458984, -38.52751159667969, -35.02762222290039, -31.527732849121094, -28.027843475341797, -24.5279541015625, -21.028064727783203, -17.528175354003906, -14.02828598022461, -10.528396606445312, -7.028507232666016, -3.5286178588867188, -0.028728485107421875, 3.4711685180664062, 6.971057891845703, 10.470947265625, 13.970836639404297, 17.470726013183594, 20.97061538696289, 24.470504760742188, 27.970394134521484, 31.47028350830078, 34.97017288208008, 38.470062255859375, 41.96995162963867, 45.46984100341797, 48.969730377197266, 52.46961975097656, 55.96950912475586, 59.469398498535156, 62.96928787231445, 66.46917724609375, 69.96907043457031, 73.46895599365234, 76.96884155273438, 80.46873474121094, 83.9686279296875, 87.46851348876953, 90.96839904785156, 94.46829223632812, 97.96818542480469, 101.46807098388672, 104.96795654296875, 108.46784973144531, 111.96774291992188, 115.4676284790039]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 11.0, 15.0, 10.0, 23.0, 15.0, 19.0, 25.0, 29.0, 17.0, 38.0, 37.0, 21.0, 42.0, 47.0, 49.0, 43.0, 39.0, 38.0, 25.0, 49.0, 39.0, 37.0, 41.0, 32.0, 25.0, 23.0, 28.0, 21.0, 25.0, 20.0, 15.0, 17.0, 17.0, 7.0, 7.0, 13.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0], "bins": [-14.0546875, -13.6458740234375, -13.237060546875, -12.8282470703125, -12.41943359375, -12.0106201171875, -11.601806640625, -11.1929931640625, -10.7841796875, -10.3753662109375, -9.966552734375, -9.5577392578125, -9.14892578125, -8.7401123046875, -8.331298828125, -7.9224853515625, -7.513671875, -7.1048583984375, -6.696044921875, -6.2872314453125, -5.87841796875, -5.4696044921875, -5.060791015625, -4.6519775390625, -4.2431640625, -3.8343505859375, -3.425537109375, -3.0167236328125, -2.60791015625, -2.1990966796875, -1.790283203125, -1.3814697265625, -0.97265625, -0.5638427734375, -0.155029296875, 0.2537841796875, 0.66259765625, 1.0714111328125, 1.480224609375, 1.8890380859375, 2.2978515625, 2.7066650390625, 3.115478515625, 3.5242919921875, 3.93310546875, 4.3419189453125, 4.750732421875, 5.1595458984375, 5.568359375, 5.9771728515625, 6.385986328125, 6.7947998046875, 7.20361328125, 7.6124267578125, 8.021240234375, 8.4300537109375, 8.8388671875, 9.2476806640625, 9.656494140625, 10.0653076171875, 10.47412109375, 10.8829345703125, 11.291748046875, 11.7005615234375, 12.109375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 3.0, 3.0, 2.0, 11.0, 11.0, 14.0, 21.0, 18.0, 27.0, 33.0, 34.0, 47.0, 53.0, 84.0, 76.0, 111.0, 143.0, 245.0, 424.0, 916.0, 3269.0, 20120.0, 355780.0, 2687969.0, 1060154.0, 55697.0, 6051.0, 1350.0, 532.0, 269.0, 163.0, 139.0, 95.0, 100.0, 63.0, 37.0, 37.0, 36.0, 22.0, 24.0, 25.0, 12.0, 18.0, 13.0, 10.0, 3.0, 6.0, 4.0, 1.0, 4.0, 3.0, 4.0], "bins": [-36.125, -35.113037109375, -34.10107421875, -33.089111328125, -32.0771484375, -31.065185546875, -30.05322265625, -29.041259765625, -28.029296875, -27.017333984375, -26.00537109375, -24.993408203125, -23.9814453125, -22.969482421875, -21.95751953125, -20.945556640625, -19.93359375, -18.921630859375, -17.90966796875, -16.897705078125, -15.8857421875, -14.873779296875, -13.86181640625, -12.849853515625, -11.837890625, -10.825927734375, -9.81396484375, -8.802001953125, -7.7900390625, -6.778076171875, -5.76611328125, -4.754150390625, -3.7421875, -2.730224609375, -1.71826171875, -0.706298828125, 0.3056640625, 1.317626953125, 2.32958984375, 3.341552734375, 4.353515625, 5.365478515625, 6.37744140625, 7.389404296875, 8.4013671875, 9.413330078125, 10.42529296875, 11.437255859375, 12.44921875, 13.461181640625, 14.47314453125, 15.485107421875, 16.4970703125, 17.509033203125, 18.52099609375, 19.532958984375, 20.544921875, 21.556884765625, 22.56884765625, 23.580810546875, 24.5927734375, 25.604736328125, 26.61669921875, 27.628662109375, 28.640625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 7.0, 4.0, 9.0, 14.0, 16.0, 18.0, 25.0, 45.0, 68.0, 104.0, 131.0, 186.0, 272.0, 364.0, 509.0, 581.0, 487.0, 389.0, 271.0, 158.0, 137.0, 78.0, 61.0, 39.0, 33.0, 23.0, 23.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.765625, -29.8466796875, -28.927734375, -28.0087890625, -27.08984375, -26.1708984375, -25.251953125, -24.3330078125, -23.4140625, -22.4951171875, -21.576171875, -20.6572265625, -19.73828125, -18.8193359375, -17.900390625, -16.9814453125, -16.0625, -15.1435546875, -14.224609375, -13.3056640625, -12.38671875, -11.4677734375, -10.548828125, -9.6298828125, -8.7109375, -7.7919921875, -6.873046875, -5.9541015625, -5.03515625, -4.1162109375, -3.197265625, -2.2783203125, -1.359375, -0.4404296875, 0.478515625, 1.3974609375, 2.31640625, 3.2353515625, 4.154296875, 5.0732421875, 5.9921875, 6.9111328125, 7.830078125, 8.7490234375, 9.66796875, 10.5869140625, 11.505859375, 12.4248046875, 13.34375, 14.2626953125, 15.181640625, 16.1005859375, 17.01953125, 17.9384765625, 18.857421875, 19.7763671875, 20.6953125, 21.6142578125, 22.533203125, 23.4521484375, 24.37109375, 25.2900390625, 26.208984375, 27.1279296875, 28.046875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 10.0, 9.0, 25.0, 37.0, 48.0, 55.0, 72.0, 89.0, 151.0, 211.0, 284.0, 415.0, 1044.0, 69654.0, 4112391.0, 7761.0, 715.0, 344.0, 258.0, 177.0, 149.0, 108.0, 82.0, 60.0, 31.0, 33.0, 18.0, 12.0, 12.0, 7.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.375, -133.814453125, -129.25390625, -124.693359375, -120.1328125, -115.572265625, -111.01171875, -106.451171875, -101.890625, -97.330078125, -92.76953125, -88.208984375, -83.6484375, -79.087890625, -74.52734375, -69.966796875, -65.40625, -60.845703125, -56.28515625, -51.724609375, -47.1640625, -42.603515625, -38.04296875, -33.482421875, -28.921875, -24.361328125, -19.80078125, -15.240234375, -10.6796875, -6.119140625, -1.55859375, 3.001953125, 7.5625, 12.123046875, 16.68359375, 21.244140625, 25.8046875, 30.365234375, 34.92578125, 39.486328125, 44.046875, 48.607421875, 53.16796875, 57.728515625, 62.2890625, 66.849609375, 71.41015625, 75.970703125, 80.53125, 85.091796875, 89.65234375, 94.212890625, 98.7734375, 103.333984375, 107.89453125, 112.455078125, 117.015625, 121.576171875, 126.13671875, 130.697265625, 135.2578125, 139.818359375, 144.37890625, 148.939453125, 153.5]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 113.0, 648.0, 234.0, 18.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-977.7388916015625, -959.5175170898438, -941.296142578125, -923.0747680664062, -904.8533935546875, -886.6320190429688, -868.41064453125, -850.1892700195312, -831.9678955078125, -813.7465209960938, -795.525146484375, -777.3037719726562, -759.0823974609375, -740.8610229492188, -722.6396484375, -704.4182739257812, -686.1968994140625, -667.9755249023438, -649.754150390625, -631.5327758789062, -613.3114013671875, -595.0900268554688, -576.86865234375, -558.6472778320312, -540.4259643554688, -522.20458984375, -503.98321533203125, -485.7618408203125, -467.54046630859375, -449.319091796875, -431.09771728515625, -412.8763427734375, -394.65496826171875, -376.43359375, -358.21221923828125, -339.9908447265625, -321.76947021484375, -303.548095703125, -285.32672119140625, -267.1053466796875, -248.88397216796875, -230.66259765625, -212.44122314453125, -194.2198486328125, -175.99847412109375, -157.777099609375, -139.5557403564453, -121.33436584472656, -103.11299133300781, -84.89161682128906, -66.67024230957031, -48.448875427246094, -30.227500915527344, -12.006126403808594, 6.215240478515625, 24.436614990234375, 42.657989501953125, 60.879364013671875, 79.10073852539062, 97.32210540771484, 115.5434799194336, 133.76486206054688, 151.98622131347656, 170.2075958251953, 188.42897033691406]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 10.0, 4.0, 8.0, 10.0, 8.0, 12.0, 18.0, 18.0, 20.0, 19.0, 19.0, 18.0, 31.0, 38.0, 31.0, 32.0, 36.0, 43.0, 43.0, 43.0, 49.0, 40.0, 56.0, 36.0, 33.0, 20.0, 30.0, 32.0, 31.0, 27.0, 25.0, 21.0, 22.0, 20.0, 19.0, 18.0, 12.0, 9.0, 11.0, 5.0, 5.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-79.32612609863281, -76.93557739257812, -74.54502868652344, -72.15448760986328, -69.7639389038086, -67.3733901977539, -64.98284149169922, -62.5922966003418, -60.201751708984375, -57.81120300292969, -55.420658111572266, -53.03010940551758, -50.639564514160156, -48.24901580810547, -45.85846710205078, -43.46792221069336, -41.07737350463867, -38.686824798583984, -36.29627990722656, -33.905731201171875, -31.515186309814453, -29.124637603759766, -26.73409080505371, -24.343544006347656, -21.9529972076416, -19.562450408935547, -17.171903610229492, -14.781355857849121, -12.390809059143066, -10.000262260437012, -7.609714508056641, -5.219167709350586, -2.8286209106445312, -0.43807387351989746, 1.9524731636047363, 4.343020439147949, 6.733567237854004, 9.124114036560059, 11.51466178894043, 13.905208587646484, 16.29575538635254, 18.686302185058594, 21.07684898376465, 23.467395782470703, 25.85794448852539, 28.248489379882812, 30.6390380859375, 33.02958679199219, 35.42013168334961, 37.8106803894043, 40.20122528076172, 42.591773986816406, 44.98231887817383, 47.372867584228516, 49.76341247558594, 52.153961181640625, 54.54450988769531, 56.93505859375, 59.32560348510742, 61.71615219116211, 64.10669708251953, 66.49724578857422, 68.8877944946289, 71.27833557128906, 73.66888427734375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 8.0, 4.0, 11.0, 17.0, 16.0, 19.0, 21.0, 11.0, 26.0, 20.0, 30.0, 28.0, 35.0, 36.0, 42.0, 44.0, 35.0, 45.0, 40.0, 44.0, 52.0, 41.0, 37.0, 40.0, 33.0, 32.0, 28.0, 25.0, 22.0, 24.0, 19.0, 18.0, 13.0, 13.0, 11.0, 13.0, 8.0, 7.0, 5.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.9609375, -12.5570068359375, -12.153076171875, -11.7491455078125, -11.34521484375, -10.9412841796875, -10.537353515625, -10.1334228515625, -9.7294921875, -9.3255615234375, -8.921630859375, -8.5177001953125, -8.11376953125, -7.7098388671875, -7.305908203125, -6.9019775390625, -6.498046875, -6.0941162109375, -5.690185546875, -5.2862548828125, -4.88232421875, -4.4783935546875, -4.074462890625, -3.6705322265625, -3.2666015625, -2.8626708984375, -2.458740234375, -2.0548095703125, -1.65087890625, -1.2469482421875, -0.843017578125, -0.4390869140625, -0.03515625, 0.3687744140625, 0.772705078125, 1.1766357421875, 1.58056640625, 1.9844970703125, 2.388427734375, 2.7923583984375, 3.1962890625, 3.6002197265625, 4.004150390625, 4.4080810546875, 4.81201171875, 5.2159423828125, 5.619873046875, 6.0238037109375, 6.427734375, 6.8316650390625, 7.235595703125, 7.6395263671875, 8.04345703125, 8.4473876953125, 8.851318359375, 9.2552490234375, 9.6591796875, 10.0631103515625, 10.467041015625, 10.8709716796875, 11.27490234375, 11.6788330078125, 12.082763671875, 12.4866943359375, 12.890625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 8.0, 10.0, 24.0, 25.0, 26.0, 47.0, 67.0, 132.0, 140.0, 228.0, 352.0, 487.0, 790.0, 1119.0, 1751.0, 2650.0, 4057.0, 6327.0, 9524.0, 14745.0, 22743.0, 34273.0, 51943.0, 79520.0, 121503.0, 181205.0, 176133.0, 116358.0, 76493.0, 50264.0, 33275.0, 21696.0, 14011.0, 9182.0, 5941.0, 3972.0, 2552.0, 1663.0, 1058.0, 785.0, 513.0, 312.0, 217.0, 142.0, 98.0, 65.0, 41.0, 38.0, 22.0, 12.0, 14.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1808929443359375, -1.140106201171875, -1.0993194580078125, -1.05853271484375, -1.0177459716796875, -0.976959228515625, -0.9361724853515625, -0.8953857421875, -0.8545989990234375, -0.813812255859375, -0.7730255126953125, -0.73223876953125, -0.6914520263671875, -0.650665283203125, -0.6098785400390625, -0.569091796875, -0.5283050537109375, -0.487518310546875, -0.4467315673828125, -0.40594482421875, -0.3651580810546875, -0.324371337890625, -0.2835845947265625, -0.2427978515625, -0.2020111083984375, -0.161224365234375, -0.1204376220703125, -0.07965087890625, -0.0388641357421875, 0.001922607421875, 0.0427093505859375, 0.08349609375, 0.1242828369140625, 0.165069580078125, 0.2058563232421875, 0.24664306640625, 0.2874298095703125, 0.328216552734375, 0.3690032958984375, 0.4097900390625, 0.4505767822265625, 0.491363525390625, 0.5321502685546875, 0.57293701171875, 0.6137237548828125, 0.654510498046875, 0.6952972412109375, 0.736083984375, 0.7768707275390625, 0.817657470703125, 0.8584442138671875, 0.89923095703125, 0.9400177001953125, 0.980804443359375, 1.0215911865234375, 1.0623779296875, 1.1031646728515625, 1.143951416015625, 1.1847381591796875, 1.22552490234375, 1.2663116455078125, 1.307098388671875, 1.3478851318359375, 1.388671875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 11.0, 12.0, 12.0, 18.0, 18.0, 19.0, 16.0, 27.0, 37.0, 34.0, 36.0, 30.0, 34.0, 36.0, 41.0, 63.0, 42.0, 1062.0, 39.0, 51.0, 26.0, 40.0, 32.0, 38.0, 26.0, 25.0, 30.0, 24.0, 22.0, 23.0, 15.0, 13.0, 13.0, 7.0, 8.0, 8.0, 10.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.765625, -7.501953125, -7.23828125, -6.974609375, -6.7109375, -6.447265625, -6.18359375, -5.919921875, -5.65625, -5.392578125, -5.12890625, -4.865234375, -4.6015625, -4.337890625, -4.07421875, -3.810546875, -3.546875, -3.283203125, -3.01953125, -2.755859375, -2.4921875, -2.228515625, -1.96484375, -1.701171875, -1.4375, -1.173828125, -0.91015625, -0.646484375, -0.3828125, -0.119140625, 0.14453125, 0.408203125, 0.671875, 0.935546875, 1.19921875, 1.462890625, 1.7265625, 1.990234375, 2.25390625, 2.517578125, 2.78125, 3.044921875, 3.30859375, 3.572265625, 3.8359375, 4.099609375, 4.36328125, 4.626953125, 4.890625, 5.154296875, 5.41796875, 5.681640625, 5.9453125, 6.208984375, 6.47265625, 6.736328125, 7.0, 7.263671875, 7.52734375, 7.791015625, 8.0546875, 8.318359375, 8.58203125, 8.845703125, 9.109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 11.0, 28.0, 37.0, 44.0, 81.0, 111.0, 146.0, 241.0, 352.0, 498.0, 762.0, 1207.0, 1793.0, 2676.0, 4238.0, 6634.0, 10294.0, 15939.0, 24927.0, 39621.0, 63883.0, 102565.0, 169214.0, 1263718.0, 146726.0, 89584.0, 55146.0, 35077.0, 21869.0, 13983.0, 8917.0, 5851.0, 3824.0, 2420.0, 1588.0, 1082.0, 681.0, 479.0, 283.0, 206.0, 111.0, 93.0, 63.0, 45.0, 25.0, 14.0, 9.0, 9.0, 9.0, 6.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.4306640625, -1.3877716064453125, -1.344879150390625, -1.3019866943359375, -1.25909423828125, -1.2162017822265625, -1.173309326171875, -1.1304168701171875, -1.0875244140625, -1.0446319580078125, -1.001739501953125, -0.9588470458984375, -0.91595458984375, -0.8730621337890625, -0.830169677734375, -0.7872772216796875, -0.744384765625, -0.7014923095703125, -0.658599853515625, -0.6157073974609375, -0.57281494140625, -0.5299224853515625, -0.487030029296875, -0.4441375732421875, -0.4012451171875, -0.3583526611328125, -0.315460205078125, -0.2725677490234375, -0.22967529296875, -0.1867828369140625, -0.143890380859375, -0.1009979248046875, -0.05810546875, -0.0152130126953125, 0.027679443359375, 0.0705718994140625, 0.11346435546875, 0.1563568115234375, 0.199249267578125, 0.2421417236328125, 0.2850341796875, 0.3279266357421875, 0.370819091796875, 0.4137115478515625, 0.45660400390625, 0.4994964599609375, 0.542388916015625, 0.5852813720703125, 0.628173828125, 0.6710662841796875, 0.713958740234375, 0.7568511962890625, 0.79974365234375, 0.8426361083984375, 0.885528564453125, 0.9284210205078125, 0.9713134765625, 1.0142059326171875, 1.057098388671875, 1.0999908447265625, 1.14288330078125, 1.1857757568359375, 1.228668212890625, 1.2715606689453125, 1.314453125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 10.0, 7.0, 10.0, 10.0, 29.0, 21.0, 41.0, 32.0, 47.0, 63.0, 84.0, 65.0, 75.0, 83.0, 82.0, 85.0, 54.0, 45.0, 31.0, 26.0, 19.0, 10.0, 8.0, 6.0, 7.0, 5.0, 3.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034961700439453125, -0.0033777058124542236, -0.0032592415809631348, -0.003140777349472046, -0.003022313117980957, -0.002903848886489868, -0.0027853846549987793, -0.0026669204235076904, -0.0025484561920166016, -0.0024299919605255127, -0.002311527729034424, -0.002193063497543335, -0.002074599266052246, -0.0019561350345611572, -0.0018376708030700684, -0.0017192065715789795, -0.0016007423400878906, -0.0014822781085968018, -0.0013638138771057129, -0.001245349645614624, -0.0011268854141235352, -0.0010084211826324463, -0.0008899569511413574, -0.0007714927196502686, -0.0006530284881591797, -0.0005345642566680908, -0.00041610002517700195, -0.0002976357936859131, -0.00017917156219482422, -6.070733070373535e-05, 5.7756900787353516e-05, 0.00017622113227844238, 0.00029468536376953125, 0.0004131495952606201, 0.000531613826751709, 0.0006500780582427979, 0.0007685422897338867, 0.0008870065212249756, 0.0010054707527160645, 0.0011239349842071533, 0.0012423992156982422, 0.001360863447189331, 0.00147932767868042, 0.0015977919101715088, 0.0017162561416625977, 0.0018347203731536865, 0.0019531846046447754, 0.0020716488361358643, 0.002190113067626953, 0.002308577299118042, 0.002427041530609131, 0.0025455057621002197, 0.0026639699935913086, 0.0027824342250823975, 0.0029008984565734863, 0.003019362688064575, 0.003137826919555664, 0.003256291151046753, 0.003374755382537842, 0.0034932196140289307, 0.0036116838455200195, 0.0037301480770111084, 0.0038486123085021973, 0.003967076539993286, 0.004085540771484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 10.0, 6.0, 13.0, 19.0, 23.0, 37.0, 47.0, 55.0, 107.0, 205.0, 477.0, 6743.0, 1038206.0, 1743.0, 334.0, 156.0, 86.0, 53.0, 41.0, 44.0, 21.0, 26.0, 16.0, 13.0, 4.0, 11.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09490966796875, -0.0921478271484375, -0.089385986328125, -0.0866241455078125, -0.0838623046875, -0.0811004638671875, -0.078338623046875, -0.0755767822265625, -0.07281494140625, -0.0700531005859375, -0.067291259765625, -0.0645294189453125, -0.061767578125, -0.0590057373046875, -0.056243896484375, -0.0534820556640625, -0.05072021484375, -0.0479583740234375, -0.045196533203125, -0.0424346923828125, -0.0396728515625, -0.0369110107421875, -0.034149169921875, -0.0313873291015625, -0.02862548828125, -0.0258636474609375, -0.023101806640625, -0.0203399658203125, -0.017578125, -0.0148162841796875, -0.012054443359375, -0.0092926025390625, -0.00653076171875, -0.0037689208984375, -0.001007080078125, 0.0017547607421875, 0.0045166015625, 0.0072784423828125, 0.010040283203125, 0.0128021240234375, 0.01556396484375, 0.0183258056640625, 0.021087646484375, 0.0238494873046875, 0.026611328125, 0.0293731689453125, 0.032135009765625, 0.0348968505859375, 0.03765869140625, 0.0404205322265625, 0.043182373046875, 0.0459442138671875, 0.0487060546875, 0.0514678955078125, 0.054229736328125, 0.0569915771484375, 0.05975341796875, 0.0625152587890625, 0.065277099609375, 0.0680389404296875, 0.07080078125, 0.0735626220703125, 0.076324462890625, 0.0790863037109375, 0.08184814453125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 59.0, 341.0, 488.0, 106.0, 13.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021171297412365675, -0.0019076892640441656, -0.0016982487868517637, -0.00148880819324404, -0.0012793677160516381, -0.0010699272388592362, -0.0008604866452515125, -0.0006510461680591106, -0.00044160569086670876, -0.0002321651845704764, -2.272467827424407e-05, 0.00018671585712581873, 0.0003961563343182206, 0.0006055968115106225, 0.0008150374051183462, 0.001024477882310748, 0.00123391835950315, 0.0014433588366955519, 0.0016527993138879538, 0.0018622399074956775, 0.002071680501103401, 0.002281120978295803, 0.002490561455488205, 0.002700001932680607, 0.0029094424098730087, 0.0031188828870654106, 0.0033283233642578125, 0.0035377638414502144, 0.0037472043186426163, 0.003956644795835018, 0.00416608527302742, 0.004375525750219822, 0.004584966227412224, 0.004794406704604626, 0.005003847181797028, 0.0052132876589894295, 0.005422728136181831, 0.005632168613374233, 0.005841609090566635, 0.006051049567759037, 0.006260490044951439, 0.006469930522143841, 0.006679370999336243, 0.0068888114765286446, 0.0070982519537210464, 0.007307692430913448, 0.00751713290810585, 0.007726573385298252, 0.007936013862490654, 0.008145454339683056, 0.008354894816875458, 0.00856433529406786, 0.008773775771260262, 0.008983216248452663, 0.009192656725645065, 0.009402097202837467, 0.009611538611352444, 0.009820979088544846, 0.010030419565737247, 0.01023986004292965, 0.010449300520122051, 0.010658740997314453, 0.010868181474506855, 0.011077621951699257, 0.011287062428891659]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 9.0, 3.0, 10.0, 15.0, 17.0, 21.0, 17.0, 15.0, 14.0, 25.0, 21.0, 36.0, 25.0, 36.0, 25.0, 33.0, 37.0, 29.0, 47.0, 44.0, 35.0, 42.0, 40.0, 39.0, 38.0, 38.0, 22.0, 36.0, 28.0, 27.0, 22.0, 17.0, 18.0, 22.0, 13.0, 13.0, 10.0, 13.0, 7.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014216899871826172, -0.0013732193037867546, -0.001324748620390892, -0.0012762779369950294, -0.0012278072535991669, -0.0011793365702033043, -0.0011308658868074417, -0.0010823952034115791, -0.0010339245200157166, -0.000985453836619854, -0.0009369831532239914, -0.0008885124698281288, -0.0008400417864322662, -0.0007915711030364037, -0.0007431004196405411, -0.0006946297362446785, -0.0006461590528488159, -0.0005976883694529533, -0.0005492176860570908, -0.0005007470026612282, -0.0004522763192653656, -0.000403805635869503, -0.00035533495247364044, -0.00030686426907777786, -0.0002583935856819153, -0.0002099229022860527, -0.00016145221889019012, -0.00011298153549432755, -6.451085209846497e-05, -1.6040168702602386e-05, 3.243051469326019e-05, 8.090119808912277e-05, 0.00012937188148498535, 0.00017784256488084793, 0.0002263132482767105, 0.0002747839316725731, 0.00032325461506843567, 0.00037172529846429825, 0.00042019598186016083, 0.0004686666652560234, 0.000517137348651886, 0.0005656080320477486, 0.0006140787154436111, 0.0006625493988394737, 0.0007110200822353363, 0.0007594907656311989, 0.0008079614490270615, 0.000856432132422924, 0.0009049028158187866, 0.0009533734992146492, 0.0010018441826105118, 0.0010503148660063744, 0.001098785549402237, 0.0011472562327980995, 0.001195726916193962, 0.0012441975995898247, 0.0012926682829856873, 0.0013411389663815498, 0.0013896096497774124, 0.001438080333173275, 0.0014865510165691376, 0.0015350216999650002, 0.0015834923833608627, 0.0016319630667567253, 0.0016804337501525879]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 8.0, 4.0, 11.0, 17.0, 16.0, 19.0, 21.0, 11.0, 26.0, 20.0, 30.0, 28.0, 35.0, 36.0, 42.0, 44.0, 35.0, 45.0, 40.0, 44.0, 52.0, 41.0, 37.0, 40.0, 33.0, 32.0, 28.0, 25.0, 22.0, 24.0, 19.0, 18.0, 13.0, 13.0, 12.0, 12.0, 8.0, 7.0, 5.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.9609375, -12.5570068359375, -12.153076171875, -11.7491455078125, -11.34521484375, -10.9412841796875, -10.537353515625, -10.1334228515625, -9.7294921875, -9.3255615234375, -8.921630859375, -8.5177001953125, -8.11376953125, -7.7098388671875, -7.305908203125, -6.9019775390625, -6.498046875, -6.0941162109375, -5.690185546875, -5.2862548828125, -4.88232421875, -4.4783935546875, -4.074462890625, -3.6705322265625, -3.2666015625, -2.8626708984375, -2.458740234375, -2.0548095703125, -1.65087890625, -1.2469482421875, -0.843017578125, -0.4390869140625, -0.03515625, 0.3687744140625, 0.772705078125, 1.1766357421875, 1.58056640625, 1.9844970703125, 2.388427734375, 2.7923583984375, 3.1962890625, 3.6002197265625, 4.004150390625, 4.4080810546875, 4.81201171875, 5.2159423828125, 5.619873046875, 6.0238037109375, 6.427734375, 6.8316650390625, 7.235595703125, 7.6395263671875, 8.04345703125, 8.4473876953125, 8.851318359375, 9.2552490234375, 9.6591796875, 10.0631103515625, 10.467041015625, 10.8709716796875, 11.27490234375, 11.6788330078125, 12.082763671875, 12.4866943359375, 12.890625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 16.0, 15.0, 17.0, 20.0, 33.0, 50.0, 85.0, 141.0, 252.0, 477.0, 889.0, 1764.0, 3654.0, 7354.0, 15216.0, 33192.0, 79677.0, 222485.0, 417672.0, 156461.0, 59582.0, 25777.0, 11995.0, 5749.0, 2832.0, 1420.0, 720.0, 388.0, 230.0, 101.0, 80.0, 59.0, 34.0, 18.0, 20.0, 19.0, 17.0, 5.0, 4.0, 3.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-8.5390625, -8.2750244140625, -8.010986328125, -7.7469482421875, -7.48291015625, -7.2188720703125, -6.954833984375, -6.6907958984375, -6.4267578125, -6.1627197265625, -5.898681640625, -5.6346435546875, -5.37060546875, -5.1065673828125, -4.842529296875, -4.5784912109375, -4.314453125, -4.0504150390625, -3.786376953125, -3.5223388671875, -3.25830078125, -2.9942626953125, -2.730224609375, -2.4661865234375, -2.2021484375, -1.9381103515625, -1.674072265625, -1.4100341796875, -1.14599609375, -0.8819580078125, -0.617919921875, -0.3538818359375, -0.08984375, 0.1741943359375, 0.438232421875, 0.7022705078125, 0.96630859375, 1.2303466796875, 1.494384765625, 1.7584228515625, 2.0224609375, 2.2864990234375, 2.550537109375, 2.8145751953125, 3.07861328125, 3.3426513671875, 3.606689453125, 3.8707275390625, 4.134765625, 4.3988037109375, 4.662841796875, 4.9268798828125, 5.19091796875, 5.4549560546875, 5.718994140625, 5.9830322265625, 6.2470703125, 6.5111083984375, 6.775146484375, 7.0391845703125, 7.30322265625, 7.5672607421875, 7.831298828125, 8.0953369140625, 8.359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 1.0, 6.0, 7.0, 8.0, 11.0, 12.0, 11.0, 9.0, 21.0, 27.0, 22.0, 35.0, 43.0, 46.0, 40.0, 36.0, 55.0, 81.0, 307.0, 1676.0, 119.0, 69.0, 61.0, 45.0, 44.0, 38.0, 34.0, 30.0, 27.0, 22.0, 24.0, 15.0, 14.0, 11.0, 8.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.25, -51.6484375, -50.046875, -48.4453125, -46.84375, -45.2421875, -43.640625, -42.0390625, -40.4375, -38.8359375, -37.234375, -35.6328125, -34.03125, -32.4296875, -30.828125, -29.2265625, -27.625, -26.0234375, -24.421875, -22.8203125, -21.21875, -19.6171875, -18.015625, -16.4140625, -14.8125, -13.2109375, -11.609375, -10.0078125, -8.40625, -6.8046875, -5.203125, -3.6015625, -2.0, -0.3984375, 1.203125, 2.8046875, 4.40625, 6.0078125, 7.609375, 9.2109375, 10.8125, 12.4140625, 14.015625, 15.6171875, 17.21875, 18.8203125, 20.421875, 22.0234375, 23.625, 25.2265625, 26.828125, 28.4296875, 30.03125, 31.6328125, 33.234375, 34.8359375, 36.4375, 38.0390625, 39.640625, 41.2421875, 42.84375, 44.4453125, 46.046875, 47.6484375, 49.25]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 10.0, 10.0, 16.0, 18.0, 26.0, 39.0, 39.0, 44.0, 82.0, 93.0, 128.0, 172.0, 256.0, 327.0, 813.0, 15049.0, 3118245.0, 8408.0, 732.0, 356.0, 202.0, 155.0, 108.0, 96.0, 54.0, 48.0, 37.0, 28.0, 23.0, 12.0, 14.0, 10.0, 10.0, 7.0, 5.0, 4.0, 1.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-122.6875, -118.7861328125, -114.884765625, -110.9833984375, -107.08203125, -103.1806640625, -99.279296875, -95.3779296875, -91.4765625, -87.5751953125, -83.673828125, -79.7724609375, -75.87109375, -71.9697265625, -68.068359375, -64.1669921875, -60.265625, -56.3642578125, -52.462890625, -48.5615234375, -44.66015625, -40.7587890625, -36.857421875, -32.9560546875, -29.0546875, -25.1533203125, -21.251953125, -17.3505859375, -13.44921875, -9.5478515625, -5.646484375, -1.7451171875, 2.15625, 6.0576171875, 9.958984375, 13.8603515625, 17.76171875, 21.6630859375, 25.564453125, 29.4658203125, 33.3671875, 37.2685546875, 41.169921875, 45.0712890625, 48.97265625, 52.8740234375, 56.775390625, 60.6767578125, 64.578125, 68.4794921875, 72.380859375, 76.2822265625, 80.18359375, 84.0849609375, 87.986328125, 91.8876953125, 95.7890625, 99.6904296875, 103.591796875, 107.4931640625, 111.39453125, 115.2958984375, 119.197265625, 123.0986328125, 127.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 15.0, 40.0, 119.0, 201.0, 240.0, 223.0, 112.0, 41.0, 17.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.34346008300781, -58.22357177734375, -56.10367965698242, -53.98379135131836, -51.86389923095703, -49.74401092529297, -47.624122619628906, -45.50423049926758, -43.38433837890625, -41.26445007324219, -39.14455795288086, -37.0246696472168, -34.90477752685547, -32.784889221191406, -30.66499900817871, -28.545108795166016, -26.425220489501953, -24.305330276489258, -22.185440063476562, -20.0655517578125, -17.945659637451172, -15.825770378112793, -13.705881118774414, -11.585990905761719, -9.466100692749023, -7.346210479736328, -5.226320743560791, -3.106431007385254, -0.9865407943725586, 1.1333494186401367, 3.2532386779785156, 5.373128890991211, 7.493019104003906, 9.612909317016602, 11.732799530029297, 13.852688789367676, 15.972579002380371, 18.09246826171875, 20.212358474731445, 22.33224868774414, 24.452138900756836, 26.57202911376953, 28.691919326782227, 30.811809539794922, 32.931697845458984, 35.05158996582031, 37.171478271484375, 39.29136657714844, 41.411258697509766, 43.53114700317383, 45.651039123535156, 47.77092742919922, 49.89081954956055, 52.01070785522461, 54.13059997558594, 56.25048828125, 58.37037658691406, 60.490264892578125, 62.61015701293945, 64.73004913330078, 66.84993743896484, 68.9698257446289, 71.08971405029297, 73.20960998535156, 75.32949829101562]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 15.0, 14.0, 6.0, 13.0, 16.0, 19.0, 22.0, 26.0, 19.0, 18.0, 19.0, 30.0, 29.0, 27.0, 30.0, 26.0, 42.0, 38.0, 34.0, 28.0, 41.0, 43.0, 40.0, 35.0, 31.0, 22.0, 29.0, 28.0, 24.0, 24.0, 30.0, 20.0, 16.0, 22.0, 23.0, 12.0, 11.0, 10.0, 13.0, 8.0, 7.0, 6.0, 2.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0], "bins": [-103.20541381835938, -100.02490234375, -96.84439849853516, -93.66388702392578, -90.4833755493164, -87.30287170410156, -84.12236022949219, -80.94184875488281, -77.76133728027344, -74.58082580566406, -71.40032196044922, -68.21981048583984, -65.03929901123047, -61.85879135131836, -58.67828369140625, -55.497772216796875, -52.31726837158203, -49.13676071166992, -45.95624923706055, -42.77574157714844, -39.59523010253906, -36.41472244262695, -33.234214782714844, -30.0537052154541, -26.87319564819336, -23.692686080932617, -20.512176513671875, -17.331668853759766, -14.151159286499023, -10.970649719238281, -7.790142059326172, -4.60963249206543, -1.4291229248046875, 1.7513861656188965, 4.9318952560424805, 8.112403869628906, 11.292913436889648, 14.47342300415039, 17.6539306640625, 20.834440231323242, 24.014949798583984, 27.195459365844727, 30.37596893310547, 33.55647659301758, 36.73698425292969, 39.91749572753906, 43.09800338745117, 46.27851104736328, 49.459022521972656, 52.639530181884766, 55.82004165649414, 59.00054931640625, 62.181060791015625, 65.361572265625, 68.54207611083984, 71.72258758544922, 74.90309143066406, 78.08360290527344, 81.26410675048828, 84.44461822509766, 87.62512969970703, 90.80563354492188, 93.98614501953125, 97.16665649414062, 100.34716796875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 8.0, 11.0, 12.0, 18.0, 10.0, 16.0, 15.0, 21.0, 26.0, 23.0, 24.0, 31.0, 35.0, 32.0, 37.0, 42.0, 37.0, 45.0, 44.0, 40.0, 38.0, 35.0, 41.0, 41.0, 46.0, 27.0, 24.0, 29.0, 28.0, 27.0, 18.0, 14.0, 14.0, 9.0, 12.0, 12.0, 10.0, 7.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-13.4140625, -13.0093994140625, -12.604736328125, -12.2000732421875, -11.79541015625, -11.3907470703125, -10.986083984375, -10.5814208984375, -10.1767578125, -9.7720947265625, -9.367431640625, -8.9627685546875, -8.55810546875, -8.1534423828125, -7.748779296875, -7.3441162109375, -6.939453125, -6.5347900390625, -6.130126953125, -5.7254638671875, -5.32080078125, -4.9161376953125, -4.511474609375, -4.1068115234375, -3.7021484375, -3.2974853515625, -2.892822265625, -2.4881591796875, -2.08349609375, -1.6788330078125, -1.274169921875, -0.8695068359375, -0.46484375, -0.0601806640625, 0.344482421875, 0.7491455078125, 1.15380859375, 1.5584716796875, 1.963134765625, 2.3677978515625, 2.7724609375, 3.1771240234375, 3.581787109375, 3.9864501953125, 4.39111328125, 4.7957763671875, 5.200439453125, 5.6051025390625, 6.009765625, 6.4144287109375, 6.819091796875, 7.2237548828125, 7.62841796875, 8.0330810546875, 8.437744140625, 8.8424072265625, 9.2470703125, 9.6517333984375, 10.056396484375, 10.4610595703125, 10.86572265625, 11.2703857421875, 11.675048828125, 12.0797119140625, 12.484375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 15.0, 20.0, 10.0, 15.0, 13.0, 21.0, 20.0, 26.0, 43.0, 56.0, 84.0, 153.0, 318.0, 860.0, 4433.0, 67469.0, 2500117.0, 1582538.0, 33878.0, 2754.0, 677.0, 276.0, 124.0, 75.0, 54.0, 36.0, 31.0, 18.0, 21.0, 16.0, 14.0, 15.0, 11.0, 11.0, 9.0, 7.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.1875, -45.75341796875, -44.3193359375, -42.88525390625, -41.451171875, -40.01708984375, -38.5830078125, -37.14892578125, -35.71484375, -34.28076171875, -32.8466796875, -31.41259765625, -29.978515625, -28.54443359375, -27.1103515625, -25.67626953125, -24.2421875, -22.80810546875, -21.3740234375, -19.93994140625, -18.505859375, -17.07177734375, -15.6376953125, -14.20361328125, -12.76953125, -11.33544921875, -9.9013671875, -8.46728515625, -7.033203125, -5.59912109375, -4.1650390625, -2.73095703125, -1.296875, 0.13720703125, 1.5712890625, 3.00537109375, 4.439453125, 5.87353515625, 7.3076171875, 8.74169921875, 10.17578125, 11.60986328125, 13.0439453125, 14.47802734375, 15.912109375, 17.34619140625, 18.7802734375, 20.21435546875, 21.6484375, 23.08251953125, 24.5166015625, 25.95068359375, 27.384765625, 28.81884765625, 30.2529296875, 31.68701171875, 33.12109375, 34.55517578125, 35.9892578125, 37.42333984375, 38.857421875, 40.29150390625, 41.7255859375, 43.15966796875, 44.59375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 11.0, 14.0, 18.0, 28.0, 24.0, 51.0, 56.0, 86.0, 101.0, 154.0, 178.0, 235.0, 284.0, 368.0, 411.0, 418.0, 381.0, 304.0, 222.0, 157.0, 123.0, 94.0, 76.0, 56.0, 44.0, 28.0, 25.0, 15.0, 23.0, 20.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.875, -21.2119140625, -20.548828125, -19.8857421875, -19.22265625, -18.5595703125, -17.896484375, -17.2333984375, -16.5703125, -15.9072265625, -15.244140625, -14.5810546875, -13.91796875, -13.2548828125, -12.591796875, -11.9287109375, -11.265625, -10.6025390625, -9.939453125, -9.2763671875, -8.61328125, -7.9501953125, -7.287109375, -6.6240234375, -5.9609375, -5.2978515625, -4.634765625, -3.9716796875, -3.30859375, -2.6455078125, -1.982421875, -1.3193359375, -0.65625, 0.0068359375, 0.669921875, 1.3330078125, 1.99609375, 2.6591796875, 3.322265625, 3.9853515625, 4.6484375, 5.3115234375, 5.974609375, 6.6376953125, 7.30078125, 7.9638671875, 8.626953125, 9.2900390625, 9.953125, 10.6162109375, 11.279296875, 11.9423828125, 12.60546875, 13.2685546875, 13.931640625, 14.5947265625, 15.2578125, 15.9208984375, 16.583984375, 17.2470703125, 17.91015625, 18.5732421875, 19.236328125, 19.8994140625, 20.5625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 5.0, 6.0, 9.0, 12.0, 11.0, 18.0, 24.0, 26.0, 38.0, 34.0, 39.0, 56.0, 67.0, 74.0, 111.0, 130.0, 153.0, 181.0, 276.0, 396.0, 973.0, 15758.0, 3856875.0, 314365.0, 2575.0, 520.0, 326.0, 236.0, 203.0, 140.0, 138.0, 105.0, 82.0, 55.0, 53.0, 37.0, 36.0, 24.0, 18.0, 22.0, 21.0, 12.0, 14.0, 7.0, 8.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-97.8125, -94.6318359375, -91.451171875, -88.2705078125, -85.08984375, -81.9091796875, -78.728515625, -75.5478515625, -72.3671875, -69.1865234375, -66.005859375, -62.8251953125, -59.64453125, -56.4638671875, -53.283203125, -50.1025390625, -46.921875, -43.7412109375, -40.560546875, -37.3798828125, -34.19921875, -31.0185546875, -27.837890625, -24.6572265625, -21.4765625, -18.2958984375, -15.115234375, -11.9345703125, -8.75390625, -5.5732421875, -2.392578125, 0.7880859375, 3.96875, 7.1494140625, 10.330078125, 13.5107421875, 16.69140625, 19.8720703125, 23.052734375, 26.2333984375, 29.4140625, 32.5947265625, 35.775390625, 38.9560546875, 42.13671875, 45.3173828125, 48.498046875, 51.6787109375, 54.859375, 58.0400390625, 61.220703125, 64.4013671875, 67.58203125, 70.7626953125, 73.943359375, 77.1240234375, 80.3046875, 83.4853515625, 86.666015625, 89.8466796875, 93.02734375, 96.2080078125, 99.388671875, 102.5693359375, 105.75]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 29.0, 328.0, 537.0, 118.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-436.3837890625, -421.9413757324219, -407.4989318847656, -393.0565185546875, -378.6141052246094, -364.1716613769531, -349.729248046875, -335.28680419921875, -320.8443908691406, -306.4019775390625, -291.95953369140625, -277.5171203613281, -263.07470703125, -248.63226318359375, -234.18984985351562, -219.74742126464844, -205.3050079345703, -190.86257934570312, -176.420166015625, -161.9777374267578, -147.53530883789062, -133.0928955078125, -118.65046691894531, -104.20803833007812, -89.76561737060547, -75.32319641113281, -60.880767822265625, -46.43834686279297, -31.995922088623047, -17.553497314453125, -3.1110763549804688, 11.331352233886719, 25.773773193359375, 40.2161979675293, 54.65862274169922, 69.10104370117188, 83.54347229003906, 97.98589324951172, 112.42831420898438, 126.87074279785156, 141.31317138671875, 155.75559997558594, 170.19801330566406, 184.64044189453125, 199.08287048339844, 213.52529907226562, 227.96771240234375, 242.41014099121094, 256.8525390625, 271.2949523925781, 285.7373962402344, 300.1798095703125, 314.6222229003906, 329.0646667480469, 343.507080078125, 357.94952392578125, 372.3919372558594, 386.8343505859375, 401.27679443359375, 415.7192077636719, 430.16162109375, 444.60406494140625, 459.0464782714844, 473.4888916015625, 487.93133544921875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 13.0, 5.0, 5.0, 7.0, 9.0, 10.0, 12.0, 17.0, 18.0, 17.0, 21.0, 21.0, 24.0, 32.0, 25.0, 31.0, 24.0, 31.0, 30.0, 40.0, 44.0, 44.0, 44.0, 37.0, 30.0, 30.0, 38.0, 31.0, 20.0, 32.0, 37.0, 28.0, 21.0, 31.0, 13.0, 13.0, 22.0, 16.0, 11.0, 11.0, 13.0, 9.0, 3.0, 2.0, 13.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-69.1353759765625, -66.96306610107422, -64.79075622558594, -62.618446350097656, -60.446136474609375, -58.273826599121094, -56.10151672363281, -53.92920684814453, -51.75689697265625, -49.58458709716797, -47.41227722167969, -45.239967346191406, -43.067657470703125, -40.895347595214844, -38.72303771972656, -36.55072784423828, -34.37841796875, -32.20610809326172, -30.033798217773438, -27.861488342285156, -25.689178466796875, -23.516868591308594, -21.344558715820312, -19.17224884033203, -16.99993896484375, -14.827629089355469, -12.655319213867188, -10.483009338378906, -8.310699462890625, -6.138389587402344, -3.9660797119140625, -1.7937698364257812, 0.3785400390625, 2.5508499145507812, 4.7231597900390625, 6.895469665527344, 9.067779541015625, 11.240089416503906, 13.412399291992188, 15.584709167480469, 17.75701904296875, 19.92932891845703, 22.101638793945312, 24.273948669433594, 26.446258544921875, 28.618568420410156, 30.790878295898438, 32.96318817138672, 35.135498046875, 37.30780792236328, 39.48011779785156, 41.652427673339844, 43.824737548828125, 45.997047424316406, 48.16935729980469, 50.34166717529297, 52.51397705078125, 54.68628692626953, 56.85859680175781, 59.030906677246094, 61.203216552734375, 63.375526428222656, 65.54783630371094, 67.72014617919922, 69.8924560546875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 4.0, 7.0, 7.0, 14.0, 16.0, 17.0, 7.0, 19.0, 21.0, 22.0, 22.0, 28.0, 27.0, 39.0, 27.0, 34.0, 33.0, 40.0, 47.0, 42.0, 45.0, 49.0, 43.0, 31.0, 36.0, 40.0, 30.0, 37.0, 34.0, 25.0, 17.0, 21.0, 19.0, 10.0, 12.0, 12.0, 12.0, 13.0, 9.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.71875, -12.3233642578125, -11.927978515625, -11.5325927734375, -11.13720703125, -10.7418212890625, -10.346435546875, -9.9510498046875, -9.5556640625, -9.1602783203125, -8.764892578125, -8.3695068359375, -7.97412109375, -7.5787353515625, -7.183349609375, -6.7879638671875, -6.392578125, -5.9971923828125, -5.601806640625, -5.2064208984375, -4.81103515625, -4.4156494140625, -4.020263671875, -3.6248779296875, -3.2294921875, -2.8341064453125, -2.438720703125, -2.0433349609375, -1.64794921875, -1.2525634765625, -0.857177734375, -0.4617919921875, -0.06640625, 0.3289794921875, 0.724365234375, 1.1197509765625, 1.51513671875, 1.9105224609375, 2.305908203125, 2.7012939453125, 3.0966796875, 3.4920654296875, 3.887451171875, 4.2828369140625, 4.67822265625, 5.0736083984375, 5.468994140625, 5.8643798828125, 6.259765625, 6.6551513671875, 7.050537109375, 7.4459228515625, 7.84130859375, 8.2366943359375, 8.632080078125, 9.0274658203125, 9.4228515625, 9.8182373046875, 10.213623046875, 10.6090087890625, 11.00439453125, 11.3997802734375, 11.795166015625, 12.1905517578125, 12.5859375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 3.0, 10.0, 14.0, 18.0, 37.0, 58.0, 81.0, 91.0, 161.0, 260.0, 354.0, 619.0, 966.0, 1432.0, 2381.0, 3702.0, 5904.0, 9080.0, 14620.0, 23678.0, 38278.0, 61334.0, 97455.0, 155719.0, 213661.0, 156526.0, 98200.0, 61379.0, 38412.0, 23832.0, 14857.0, 9324.0, 5924.0, 3727.0, 2312.0, 1480.0, 938.0, 615.0, 385.0, 253.0, 177.0, 101.0, 57.0, 42.0, 32.0, 21.0, 14.0, 17.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5048828125, -1.458587646484375, -1.41229248046875, -1.365997314453125, -1.3197021484375, -1.273406982421875, -1.22711181640625, -1.180816650390625, -1.134521484375, -1.088226318359375, -1.04193115234375, -0.995635986328125, -0.9493408203125, -0.903045654296875, -0.85675048828125, -0.810455322265625, -0.76416015625, -0.717864990234375, -0.67156982421875, -0.625274658203125, -0.5789794921875, -0.532684326171875, -0.48638916015625, -0.440093994140625, -0.393798828125, -0.347503662109375, -0.30120849609375, -0.254913330078125, -0.2086181640625, -0.162322998046875, -0.11602783203125, -0.069732666015625, -0.0234375, 0.022857666015625, 0.06915283203125, 0.115447998046875, 0.1617431640625, 0.208038330078125, 0.25433349609375, 0.300628662109375, 0.346923828125, 0.393218994140625, 0.43951416015625, 0.485809326171875, 0.5321044921875, 0.578399658203125, 0.62469482421875, 0.670989990234375, 0.71728515625, 0.763580322265625, 0.80987548828125, 0.856170654296875, 0.9024658203125, 0.948760986328125, 0.99505615234375, 1.041351318359375, 1.087646484375, 1.133941650390625, 1.18023681640625, 1.226531982421875, 1.2728271484375, 1.319122314453125, 1.36541748046875, 1.411712646484375, 1.4580078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 8.0, 6.0, 15.0, 17.0, 23.0, 19.0, 24.0, 23.0, 29.0, 33.0, 32.0, 33.0, 36.0, 33.0, 35.0, 39.0, 50.0, 1073.0, 31.0, 39.0, 38.0, 34.0, 29.0, 30.0, 39.0, 29.0, 31.0, 24.0, 24.0, 23.0, 22.0, 15.0, 11.0, 19.0, 13.0, 6.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.109375, -7.853759765625, -7.59814453125, -7.342529296875, -7.0869140625, -6.831298828125, -6.57568359375, -6.320068359375, -6.064453125, -5.808837890625, -5.55322265625, -5.297607421875, -5.0419921875, -4.786376953125, -4.53076171875, -4.275146484375, -4.01953125, -3.763916015625, -3.50830078125, -3.252685546875, -2.9970703125, -2.741455078125, -2.48583984375, -2.230224609375, -1.974609375, -1.718994140625, -1.46337890625, -1.207763671875, -0.9521484375, -0.696533203125, -0.44091796875, -0.185302734375, 0.0703125, 0.325927734375, 0.58154296875, 0.837158203125, 1.0927734375, 1.348388671875, 1.60400390625, 1.859619140625, 2.115234375, 2.370849609375, 2.62646484375, 2.882080078125, 3.1376953125, 3.393310546875, 3.64892578125, 3.904541015625, 4.16015625, 4.415771484375, 4.67138671875, 4.927001953125, 5.1826171875, 5.438232421875, 5.69384765625, 5.949462890625, 6.205078125, 6.460693359375, 6.71630859375, 6.971923828125, 7.2275390625, 7.483154296875, 7.73876953125, 7.994384765625, 8.25]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 7.0, 10.0, 10.0, 13.0, 30.0, 39.0, 51.0, 108.0, 141.0, 223.0, 356.0, 612.0, 1009.0, 1497.0, 2445.0, 3900.0, 6331.0, 10435.0, 17106.0, 27743.0, 45247.0, 74043.0, 123632.0, 233277.0, 1223987.0, 127329.0, 76641.0, 46414.0, 28955.0, 17510.0, 10765.0, 6598.0, 4001.0, 2538.0, 1505.0, 964.0, 617.0, 405.0, 231.0, 138.0, 100.0, 57.0, 37.0, 27.0, 17.0, 12.0, 14.0, 4.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5126953125, -1.4654693603515625, -1.418243408203125, -1.3710174560546875, -1.32379150390625, -1.2765655517578125, -1.229339599609375, -1.1821136474609375, -1.1348876953125, -1.0876617431640625, -1.040435791015625, -0.9932098388671875, -0.94598388671875, -0.8987579345703125, -0.851531982421875, -0.8043060302734375, -0.757080078125, -0.7098541259765625, -0.662628173828125, -0.6154022216796875, -0.56817626953125, -0.5209503173828125, -0.473724365234375, -0.4264984130859375, -0.3792724609375, -0.3320465087890625, -0.284820556640625, -0.2375946044921875, -0.19036865234375, -0.1431427001953125, -0.095916748046875, -0.0486907958984375, -0.00146484375, 0.0457611083984375, 0.092987060546875, 0.1402130126953125, 0.18743896484375, 0.2346649169921875, 0.281890869140625, 0.3291168212890625, 0.3763427734375, 0.4235687255859375, 0.470794677734375, 0.5180206298828125, 0.56524658203125, 0.6124725341796875, 0.659698486328125, 0.7069244384765625, 0.754150390625, 0.8013763427734375, 0.848602294921875, 0.8958282470703125, 0.94305419921875, 0.9902801513671875, 1.037506103515625, 1.0847320556640625, 1.1319580078125, 1.1791839599609375, 1.226409912109375, 1.2736358642578125, 1.32086181640625, 1.3680877685546875, 1.415313720703125, 1.4625396728515625, 1.509765625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 4.0, 9.0, 10.0, 4.0, 12.0, 7.0, 11.0, 11.0, 27.0, 29.0, 31.0, 50.0, 73.0, 72.0, 77.0, 72.0, 76.0, 66.0, 61.0, 63.0, 52.0, 30.0, 27.0, 21.0, 19.0, 17.0, 13.0, 13.0, 9.0, 11.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032958984375, -0.003184497356414795, -0.00307309627532959, -0.0029616951942443848, -0.0028502941131591797, -0.0027388930320739746, -0.0026274919509887695, -0.0025160908699035645, -0.0024046897888183594, -0.0022932887077331543, -0.0021818876266479492, -0.002070486545562744, -0.001959085464477539, -0.001847684383392334, -0.001736283302307129, -0.0016248822212219238, -0.0015134811401367188, -0.0014020800590515137, -0.0012906789779663086, -0.0011792778968811035, -0.0010678768157958984, -0.0009564757347106934, -0.0008450746536254883, -0.0007336735725402832, -0.0006222724914550781, -0.000510871410369873, -0.00039947032928466797, -0.0002880692481994629, -0.0001766681671142578, -6.526708602905273e-05, 4.6133995056152344e-05, 0.00015753507614135742, 0.0002689361572265625, 0.0003803372383117676, 0.0004917383193969727, 0.0006031394004821777, 0.0007145404815673828, 0.0008259415626525879, 0.000937342643737793, 0.001048743724822998, 0.0011601448059082031, 0.0012715458869934082, 0.0013829469680786133, 0.0014943480491638184, 0.0016057491302490234, 0.0017171502113342285, 0.0018285512924194336, 0.0019399523735046387, 0.0020513534545898438, 0.002162754535675049, 0.002274155616760254, 0.002385556697845459, 0.002496957778930664, 0.002608358860015869, 0.0027197599411010742, 0.0028311610221862793, 0.0029425621032714844, 0.0030539631843566895, 0.0031653642654418945, 0.0032767653465270996, 0.0033881664276123047, 0.0034995675086975098, 0.003610968589782715, 0.00372236967086792, 0.003833770751953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 6.0, 5.0, 13.0, 13.0, 16.0, 16.0, 30.0, 23.0, 44.0, 58.0, 89.0, 149.0, 306.0, 991.0, 895111.0, 150326.0, 741.0, 249.0, 105.0, 78.0, 45.0, 33.0, 25.0, 13.0, 12.0, 8.0, 9.0, 9.0, 3.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0987548828125, -0.09584331512451172, -0.09293174743652344, -0.09002017974853516, -0.08710861206054688, -0.0841970443725586, -0.08128547668457031, -0.07837390899658203, -0.07546234130859375, -0.07255077362060547, -0.06963920593261719, -0.0667276382446289, -0.06381607055664062, -0.060904502868652344, -0.05799293518066406, -0.05508136749267578, -0.0521697998046875, -0.04925823211669922, -0.04634666442871094, -0.043435096740722656, -0.040523529052734375, -0.037611961364746094, -0.03470039367675781, -0.03178882598876953, -0.02887725830078125, -0.02596569061279297, -0.023054122924804688, -0.020142555236816406, -0.017230987548828125, -0.014319419860839844, -0.011407852172851562, -0.008496284484863281, -0.005584716796875, -0.0026731491088867188, 0.0002384185791015625, 0.0031499862670898438, 0.006061553955078125, 0.008973121643066406, 0.011884689331054688, 0.014796257019042969, 0.01770782470703125, 0.02061939239501953, 0.023530960083007812, 0.026442527770996094, 0.029354095458984375, 0.032265663146972656, 0.03517723083496094, 0.03808879852294922, 0.0410003662109375, 0.04391193389892578, 0.04682350158691406, 0.049735069274902344, 0.052646636962890625, 0.055558204650878906, 0.05846977233886719, 0.06138134002685547, 0.06429290771484375, 0.06720447540283203, 0.07011604309082031, 0.0730276107788086, 0.07593917846679688, 0.07885074615478516, 0.08176231384277344, 0.08467388153076172, 0.08758544921875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 63.0, 441.0, 420.0, 68.0, 11.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019389829831197858, -0.0016962802037596703, -0.0014535775408148766, -0.0012108748778700829, -0.0009681720985099673, -0.0007254694355651736, -0.0004827666562050581, -0.00024006387684494257, 2.6387860998511314e-06, 0.00024534150725230575, 0.00048804422840476036, 0.000730746949557215, 0.0009734496707096696, 0.0012161523336544633, 0.0014588551130145788, 0.0017015578923746943, 0.001944260555319488, 0.0021869633346796036, 0.0024296659976243973, 0.002672368660569191, 0.0029150713235139847, 0.0031577739864587784, 0.0034004768822342157, 0.003643179778009653, 0.003885882440954447, 0.0041285851038992405, 0.004371287766844034, 0.004613990429788828, 0.004856693558394909, 0.005099396221339703, 0.005342098884284496, 0.00558480154722929, 0.005827504210174084, 0.006070206873118877, 0.006312909536063671, 0.006555612199008465, 0.0067983148619532585, 0.007041017524898052, 0.007283720653504133, 0.007526423316448927, 0.007769125979393721, 0.008011829107999802, 0.008254531770944595, 0.008497234433889389, 0.008739937096834183, 0.008982639759778976, 0.00922534242272377, 0.009468045085668564, 0.009710747748613358, 0.009953450411558151, 0.010196153074502945, 0.010438855737447739, 0.010681558400392532, 0.010924261063337326, 0.01116696372628212, 0.011409666389226913, 0.011652369052171707, 0.0118950717151165, 0.012137774378061295, 0.012380477041006088, 0.012623179703950882, 0.012865882366895676, 0.01310858502984047, 0.013351287692785263, 0.013593991287052631]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 2.0, 7.0, 8.0, 13.0, 14.0, 16.0, 11.0, 29.0, 23.0, 28.0, 33.0, 27.0, 33.0, 47.0, 39.0, 43.0, 41.0, 32.0, 40.0, 55.0, 41.0, 54.0, 44.0, 47.0, 34.0, 41.0, 27.0, 24.0, 23.0, 28.0, 7.0, 11.0, 11.0, 17.0, 6.0, 12.0, 10.0, 1.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00161820650100708, -0.0015616370365023613, -0.0015050675719976425, -0.0014484981074929237, -0.001391928642988205, -0.0013353591784834862, -0.0012787897139787674, -0.0012222202494740486, -0.0011656507849693298, -0.001109081320464611, -0.0010525118559598923, -0.0009959423914551735, -0.0009393729269504547, -0.0008828034624457359, -0.0008262339979410172, -0.0007696645334362984, -0.0007130950689315796, -0.0006565256044268608, -0.000599956139922142, -0.0005433866754174232, -0.00048681721091270447, -0.0004302477464079857, -0.0003736782819032669, -0.0003171088173985481, -0.00026053935289382935, -0.00020396988838911057, -0.00014740042388439178, -9.0830959379673e-05, -3.4261494874954224e-05, 2.2307969629764557e-05, 7.887743413448334e-05, 0.00013544689863920212, 0.0001920163631439209, 0.0002485858276486397, 0.00030515529215335846, 0.00036172475665807724, 0.000418294221162796, 0.0004748636856675148, 0.0005314331501722336, 0.0005880026146769524, 0.0006445720791816711, 0.0007011415436863899, 0.0007577110081911087, 0.0008142804726958275, 0.0008708499372005463, 0.000927419401705265, 0.0009839888662099838, 0.0010405583307147026, 0.0010971277952194214, 0.0011536972597241402, 0.001210266724228859, 0.0012668361887335777, 0.0013234056532382965, 0.0013799751177430153, 0.001436544582247734, 0.0014931140467524529, 0.0015496835112571716, 0.0016062529757618904, 0.0016628224402666092, 0.001719391904771328, 0.0017759613692760468, 0.0018325308337807655, 0.0018891002982854843, 0.001945669762790203, 0.002002239227294922]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 4.0, 7.0, 7.0, 14.0, 16.0, 17.0, 7.0, 19.0, 21.0, 22.0, 22.0, 28.0, 27.0, 39.0, 27.0, 34.0, 33.0, 40.0, 47.0, 42.0, 45.0, 49.0, 43.0, 31.0, 36.0, 40.0, 30.0, 37.0, 34.0, 25.0, 17.0, 21.0, 19.0, 10.0, 12.0, 12.0, 12.0, 13.0, 9.0, 8.0, 3.0, 3.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.71875, -12.3233642578125, -11.927978515625, -11.5325927734375, -11.13720703125, -10.7418212890625, -10.346435546875, -9.9510498046875, -9.5556640625, -9.1602783203125, -8.764892578125, -8.3695068359375, -7.97412109375, -7.5787353515625, -7.183349609375, -6.7879638671875, -6.392578125, -5.9971923828125, -5.601806640625, -5.2064208984375, -4.81103515625, -4.4156494140625, -4.020263671875, -3.6248779296875, -3.2294921875, -2.8341064453125, -2.438720703125, -2.0433349609375, -1.64794921875, -1.2525634765625, -0.857177734375, -0.4617919921875, -0.06640625, 0.3289794921875, 0.724365234375, 1.1197509765625, 1.51513671875, 1.9105224609375, 2.305908203125, 2.7012939453125, 3.0966796875, 3.4920654296875, 3.887451171875, 4.2828369140625, 4.67822265625, 5.0736083984375, 5.468994140625, 5.8643798828125, 6.259765625, 6.6551513671875, 7.050537109375, 7.4459228515625, 7.84130859375, 8.2366943359375, 8.632080078125, 9.0274658203125, 9.4228515625, 9.8182373046875, 10.213623046875, 10.6090087890625, 11.00439453125, 11.3997802734375, 11.795166015625, 12.1905517578125, 12.5859375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 6.0, 5.0, 10.0, 14.0, 20.0, 24.0, 32.0, 30.0, 50.0, 74.0, 94.0, 120.0, 187.0, 270.0, 466.0, 900.0, 1942.0, 5159.0, 14265.0, 41359.0, 131818.0, 494734.0, 250386.0, 69305.0, 22974.0, 8185.0, 3137.0, 1276.0, 614.0, 325.0, 214.0, 151.0, 96.0, 74.0, 59.0, 45.0, 26.0, 18.0, 22.0, 17.0, 12.0, 8.0, 9.0, 3.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-13.984375, -13.55712890625, -13.1298828125, -12.70263671875, -12.275390625, -11.84814453125, -11.4208984375, -10.99365234375, -10.56640625, -10.13916015625, -9.7119140625, -9.28466796875, -8.857421875, -8.43017578125, -8.0029296875, -7.57568359375, -7.1484375, -6.72119140625, -6.2939453125, -5.86669921875, -5.439453125, -5.01220703125, -4.5849609375, -4.15771484375, -3.73046875, -3.30322265625, -2.8759765625, -2.44873046875, -2.021484375, -1.59423828125, -1.1669921875, -0.73974609375, -0.3125, 0.11474609375, 0.5419921875, 0.96923828125, 1.396484375, 1.82373046875, 2.2509765625, 2.67822265625, 3.10546875, 3.53271484375, 3.9599609375, 4.38720703125, 4.814453125, 5.24169921875, 5.6689453125, 6.09619140625, 6.5234375, 6.95068359375, 7.3779296875, 7.80517578125, 8.232421875, 8.65966796875, 9.0869140625, 9.51416015625, 9.94140625, 10.36865234375, 10.7958984375, 11.22314453125, 11.650390625, 12.07763671875, 12.5048828125, 12.93212890625, 13.359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 7.0, 6.0, 14.0, 9.0, 11.0, 12.0, 19.0, 19.0, 27.0, 24.0, 30.0, 24.0, 36.0, 37.0, 29.0, 48.0, 39.0, 86.0, 202.0, 1608.0, 230.0, 91.0, 55.0, 41.0, 34.0, 30.0, 39.0, 32.0, 25.0, 31.0, 19.0, 15.0, 13.0, 18.0, 11.0, 13.0, 11.0, 4.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-38.40625, -37.22509765625, -36.0439453125, -34.86279296875, -33.681640625, -32.50048828125, -31.3193359375, -30.13818359375, -28.95703125, -27.77587890625, -26.5947265625, -25.41357421875, -24.232421875, -23.05126953125, -21.8701171875, -20.68896484375, -19.5078125, -18.32666015625, -17.1455078125, -15.96435546875, -14.783203125, -13.60205078125, -12.4208984375, -11.23974609375, -10.05859375, -8.87744140625, -7.6962890625, -6.51513671875, -5.333984375, -4.15283203125, -2.9716796875, -1.79052734375, -0.609375, 0.57177734375, 1.7529296875, 2.93408203125, 4.115234375, 5.29638671875, 6.4775390625, 7.65869140625, 8.83984375, 10.02099609375, 11.2021484375, 12.38330078125, 13.564453125, 14.74560546875, 15.9267578125, 17.10791015625, 18.2890625, 19.47021484375, 20.6513671875, 21.83251953125, 23.013671875, 24.19482421875, 25.3759765625, 26.55712890625, 27.73828125, 28.91943359375, 30.1005859375, 31.28173828125, 32.462890625, 33.64404296875, 34.8251953125, 36.00634765625, 37.1875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 12.0, 13.0, 31.0, 35.0, 47.0, 59.0, 81.0, 138.0, 214.0, 365.0, 839.0, 10266.0, 3123882.0, 7921.0, 790.0, 345.0, 195.0, 149.0, 92.0, 58.0, 47.0, 38.0, 19.0, 17.0, 10.0, 8.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.0, -141.50390625, -137.0078125, -132.51171875, -128.015625, -123.51953125, -119.0234375, -114.52734375, -110.03125, -105.53515625, -101.0390625, -96.54296875, -92.046875, -87.55078125, -83.0546875, -78.55859375, -74.0625, -69.56640625, -65.0703125, -60.57421875, -56.078125, -51.58203125, -47.0859375, -42.58984375, -38.09375, -33.59765625, -29.1015625, -24.60546875, -20.109375, -15.61328125, -11.1171875, -6.62109375, -2.125, 2.37109375, 6.8671875, 11.36328125, 15.859375, 20.35546875, 24.8515625, 29.34765625, 33.84375, 38.33984375, 42.8359375, 47.33203125, 51.828125, 56.32421875, 60.8203125, 65.31640625, 69.8125, 74.30859375, 78.8046875, 83.30078125, 87.796875, 92.29296875, 96.7890625, 101.28515625, 105.78125, 110.27734375, 114.7734375, 119.26953125, 123.765625, 128.26171875, 132.7578125, 137.25390625, 141.75]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 15.0, 136.0, 398.0, 352.0, 103.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.9329071044922, -153.5359344482422, -149.13894653320312, -144.74197387695312, -140.34500122070312, -135.94802856445312, -131.55104064941406, -127.15406799316406, -122.75708770751953, -118.360107421875, -113.963134765625, -109.56615447998047, -105.16917419433594, -100.77220153808594, -96.3752212524414, -91.97824096679688, -87.58126831054688, -83.18428802490234, -78.78731536865234, -74.39033508300781, -69.99336242675781, -65.59638214111328, -61.19940185546875, -56.802425384521484, -52.40544891357422, -48.00847244262695, -43.61149597167969, -39.214515686035156, -34.81753921508789, -30.420562744140625, -26.023584365844727, -21.626605987548828, -17.229629516601562, -12.83265209197998, -8.435674667358398, -4.038697242736816, 0.3582801818847656, 4.755256652832031, 9.15223503112793, 13.549213409423828, 17.946189880371094, 22.34316635131836, 26.740144729614258, 31.137123107910156, 35.53409957885742, 39.93107604980469, 44.32805633544922, 48.725032806396484, 53.12200927734375, 57.518985748291016, 61.91596221923828, 66.31294250488281, 70.70991516113281, 75.10689544677734, 79.50387573242188, 83.90084838867188, 88.2978286743164, 92.69480895996094, 97.09178161621094, 101.48876190185547, 105.8857421875, 110.28271484375, 114.67969512939453, 119.07667541503906, 123.47364807128906]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 7.0, 2.0, 5.0, 5.0, 8.0, 11.0, 9.0, 17.0, 15.0, 17.0, 19.0, 14.0, 33.0, 23.0, 25.0, 28.0, 34.0, 37.0, 47.0, 36.0, 35.0, 42.0, 39.0, 36.0, 39.0, 32.0, 34.0, 33.0, 35.0, 33.0, 32.0, 32.0, 26.0, 26.0, 19.0, 18.0, 12.0, 11.0, 13.0, 11.0, 6.0, 10.0, 10.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0], "bins": [-102.71715545654297, -99.72340393066406, -96.72965240478516, -93.73590087890625, -90.74214935302734, -87.74839782714844, -84.754638671875, -81.76089477539062, -78.76713562011719, -75.77338409423828, -72.77963256835938, -69.78588104248047, -66.79212951660156, -63.798377990722656, -60.804622650146484, -57.81087112426758, -54.81712341308594, -51.82337188720703, -48.829620361328125, -45.83586883544922, -42.84211730957031, -39.848365783691406, -36.854610443115234, -33.86085891723633, -30.867107391357422, -27.873355865478516, -24.87960433959961, -21.88585090637207, -18.892099380493164, -15.898347854614258, -12.904594421386719, -9.910842895507812, -6.917083740234375, -3.9233317375183105, -0.9295797348022461, 2.0641727447509766, 5.057924270629883, 8.051675796508789, 11.045429229736328, 14.039180755615234, 17.03293228149414, 20.026683807373047, 23.020435333251953, 26.014188766479492, 29.0079402923584, 32.00169372558594, 34.995445251464844, 37.98919677734375, 40.982948303222656, 43.97669982910156, 46.97045135498047, 49.964202880859375, 52.95795440673828, 55.95170593261719, 58.94546127319336, 61.939212799072266, 64.93296813964844, 67.92671966552734, 70.92047119140625, 73.91422271728516, 76.90797424316406, 79.90172576904297, 82.89547729492188, 85.88923645019531, 88.88298034667969]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 11.0, 13.0, 14.0, 19.0, 19.0, 14.0, 23.0, 33.0, 30.0, 26.0, 30.0, 44.0, 38.0, 28.0, 39.0, 41.0, 39.0, 56.0, 50.0, 39.0, 44.0, 42.0, 45.0, 26.0, 31.0, 35.0, 21.0, 21.0, 10.0, 17.0, 13.0, 13.0, 12.0, 11.0, 10.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4453125, -14.005126953125, -13.56494140625, -13.124755859375, -12.6845703125, -12.244384765625, -11.80419921875, -11.364013671875, -10.923828125, -10.483642578125, -10.04345703125, -9.603271484375, -9.1630859375, -8.722900390625, -8.28271484375, -7.842529296875, -7.40234375, -6.962158203125, -6.52197265625, -6.081787109375, -5.6416015625, -5.201416015625, -4.76123046875, -4.321044921875, -3.880859375, -3.440673828125, -3.00048828125, -2.560302734375, -2.1201171875, -1.679931640625, -1.23974609375, -0.799560546875, -0.359375, 0.080810546875, 0.52099609375, 0.961181640625, 1.4013671875, 1.841552734375, 2.28173828125, 2.721923828125, 3.162109375, 3.602294921875, 4.04248046875, 4.482666015625, 4.9228515625, 5.363037109375, 5.80322265625, 6.243408203125, 6.68359375, 7.123779296875, 7.56396484375, 8.004150390625, 8.4443359375, 8.884521484375, 9.32470703125, 9.764892578125, 10.205078125, 10.645263671875, 11.08544921875, 11.525634765625, 11.9658203125, 12.406005859375, 12.84619140625, 13.286376953125, 13.7265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 1.0, 5.0, 8.0, 12.0, 8.0, 10.0, 17.0, 14.0, 14.0, 22.0, 34.0, 48.0, 51.0, 60.0, 94.0, 136.0, 206.0, 384.0, 965.0, 5142.0, 92173.0, 2966208.0, 1101889.0, 23001.0, 2279.0, 599.0, 287.0, 157.0, 111.0, 87.0, 59.0, 42.0, 32.0, 26.0, 22.0, 20.0, 18.0, 6.0, 10.0, 8.0, 3.0, 8.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-50.6875, -49.23095703125, -47.7744140625, -46.31787109375, -44.861328125, -43.40478515625, -41.9482421875, -40.49169921875, -39.03515625, -37.57861328125, -36.1220703125, -34.66552734375, -33.208984375, -31.75244140625, -30.2958984375, -28.83935546875, -27.3828125, -25.92626953125, -24.4697265625, -23.01318359375, -21.556640625, -20.10009765625, -18.6435546875, -17.18701171875, -15.73046875, -14.27392578125, -12.8173828125, -11.36083984375, -9.904296875, -8.44775390625, -6.9912109375, -5.53466796875, -4.078125, -2.62158203125, -1.1650390625, 0.29150390625, 1.748046875, 3.20458984375, 4.6611328125, 6.11767578125, 7.57421875, 9.03076171875, 10.4873046875, 11.94384765625, 13.400390625, 14.85693359375, 16.3134765625, 17.77001953125, 19.2265625, 20.68310546875, 22.1396484375, 23.59619140625, 25.052734375, 26.50927734375, 27.9658203125, 29.42236328125, 30.87890625, 32.33544921875, 33.7919921875, 35.24853515625, 36.705078125, 38.16162109375, 39.6181640625, 41.07470703125, 42.53125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 9.0, 12.0, 29.0, 40.0, 55.0, 111.0, 140.0, 278.0, 482.0, 774.0, 876.0, 521.0, 301.0, 179.0, 117.0, 49.0, 33.0, 26.0, 12.0, 10.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.46875, -26.1669921875, -24.865234375, -23.5634765625, -22.26171875, -20.9599609375, -19.658203125, -18.3564453125, -17.0546875, -15.7529296875, -14.451171875, -13.1494140625, -11.84765625, -10.5458984375, -9.244140625, -7.9423828125, -6.640625, -5.3388671875, -4.037109375, -2.7353515625, -1.43359375, -0.1318359375, 1.169921875, 2.4716796875, 3.7734375, 5.0751953125, 6.376953125, 7.6787109375, 8.98046875, 10.2822265625, 11.583984375, 12.8857421875, 14.1875, 15.4892578125, 16.791015625, 18.0927734375, 19.39453125, 20.6962890625, 21.998046875, 23.2998046875, 24.6015625, 25.9033203125, 27.205078125, 28.5068359375, 29.80859375, 31.1103515625, 32.412109375, 33.7138671875, 35.015625, 36.3173828125, 37.619140625, 38.9208984375, 40.22265625, 41.5244140625, 42.826171875, 44.1279296875, 45.4296875, 46.7314453125, 48.033203125, 49.3349609375, 50.63671875, 51.9384765625, 53.240234375, 54.5419921875, 55.84375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 14.0, 21.0, 37.0, 58.0, 94.0, 132.0, 247.0, 354.0, 670.0, 10504.0, 4177181.0, 3444.0, 590.0, 302.0, 230.0, 165.0, 98.0, 57.0, 23.0, 31.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-315.5, -308.060546875, -300.62109375, -293.181640625, -285.7421875, -278.302734375, -270.86328125, -263.423828125, -255.984375, -248.544921875, -241.10546875, -233.666015625, -226.2265625, -218.787109375, -211.34765625, -203.908203125, -196.46875, -189.029296875, -181.58984375, -174.150390625, -166.7109375, -159.271484375, -151.83203125, -144.392578125, -136.953125, -129.513671875, -122.07421875, -114.634765625, -107.1953125, -99.755859375, -92.31640625, -84.876953125, -77.4375, -69.998046875, -62.55859375, -55.119140625, -47.6796875, -40.240234375, -32.80078125, -25.361328125, -17.921875, -10.482421875, -3.04296875, 4.396484375, 11.8359375, 19.275390625, 26.71484375, 34.154296875, 41.59375, 49.033203125, 56.47265625, 63.912109375, 71.3515625, 78.791015625, 86.23046875, 93.669921875, 101.109375, 108.548828125, 115.98828125, 123.427734375, 130.8671875, 138.306640625, 145.74609375, 153.185546875, 160.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 10.0, 24.0, 34.0, 46.0, 94.0, 127.0, 138.0, 152.0, 120.0, 101.0, 72.0, 45.0, 17.0, 14.0, 8.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.55813598632812, -122.10962677001953, -118.6611099243164, -115.21260070800781, -111.76408386230469, -108.3155746459961, -104.8670654296875, -101.41854858398438, -97.97003173828125, -94.52152252197266, -91.07300567626953, -87.62449645996094, -84.17597961425781, -80.72747039794922, -77.27896118164062, -73.8304443359375, -70.3819351196289, -66.93342590332031, -63.48490905761719, -60.036399841308594, -56.58788299560547, -53.139373779296875, -49.690860748291016, -46.242347717285156, -42.7938346862793, -39.34532165527344, -35.89680862426758, -32.44829559326172, -28.999784469604492, -25.551271438598633, -22.102760314941406, -18.654247283935547, -15.205726623535156, -11.757213592529297, -8.308701515197754, -4.860189437866211, -1.4116764068603516, 2.036836624145508, 5.485347747802734, 8.933860778808594, 12.382373809814453, 15.830886840820312, 19.279399871826172, 22.7279109954834, 26.176424026489258, 29.624937057495117, 33.073448181152344, 36.5219612121582, 39.97047424316406, 43.41898727416992, 46.86750030517578, 50.316009521484375, 53.7645263671875, 57.213035583496094, 60.66154861450195, 64.11006164550781, 67.55857849121094, 71.00708770751953, 74.45560455322266, 77.90411376953125, 81.35263061523438, 84.80113983154297, 88.24964904785156, 91.69816589355469, 95.14667510986328]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 8.0, 13.0, 6.0, 11.0, 14.0, 18.0, 25.0, 21.0, 18.0, 29.0, 27.0, 34.0, 36.0, 43.0, 36.0, 37.0, 41.0, 42.0, 56.0, 41.0, 39.0, 42.0, 34.0, 34.0, 46.0, 29.0, 32.0, 19.0, 28.0, 28.0, 20.0, 16.0, 14.0, 15.0, 8.0, 9.0, 7.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.1434326171875, -70.69056701660156, -68.23770141601562, -65.78483581542969, -63.33197021484375, -60.87910461425781, -58.426239013671875, -55.97337341308594, -53.5205078125, -51.06764221191406, -48.614776611328125, -46.16191101074219, -43.70904541015625, -41.25617980957031, -38.803314208984375, -36.35044860839844, -33.897579193115234, -31.444713592529297, -28.99184799194336, -26.538982391357422, -24.086116790771484, -21.633251190185547, -19.180383682250977, -16.72751808166504, -14.274652481079102, -11.821786880493164, -9.368921279907227, -6.916054725646973, -4.463189125061035, -2.0103235244750977, 0.44254302978515625, 2.8954086303710938, 5.348274230957031, 7.801139831542969, 10.254005432128906, 12.70687198638916, 15.159737586975098, 17.61260223388672, 20.06546974182129, 22.518335342407227, 24.971200942993164, 27.4240665435791, 29.87693214416504, 32.32979965209961, 34.78266525268555, 37.235530853271484, 39.68839645385742, 42.14126205444336, 44.5941276550293, 47.046993255615234, 49.49985885620117, 51.95272445678711, 54.40559005737305, 56.858455657958984, 59.31132507324219, 61.764190673828125, 64.21705627441406, 66.669921875, 69.12278747558594, 71.57565307617188, 74.02851867675781, 76.48138427734375, 78.93424987792969, 81.38711547851562, 83.83998107910156]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 9.0, 5.0, 14.0, 18.0, 13.0, 18.0, 12.0, 26.0, 24.0, 35.0, 34.0, 37.0, 37.0, 38.0, 41.0, 40.0, 57.0, 33.0, 46.0, 47.0, 45.0, 43.0, 38.0, 36.0, 28.0, 30.0, 29.0, 26.0, 25.0, 20.0, 15.0, 11.0, 14.0, 14.0, 2.0, 5.0, 8.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.046875, -13.5921630859375, -13.137451171875, -12.6827392578125, -12.22802734375, -11.7733154296875, -11.318603515625, -10.8638916015625, -10.4091796875, -9.9544677734375, -9.499755859375, -9.0450439453125, -8.59033203125, -8.1356201171875, -7.680908203125, -7.2261962890625, -6.771484375, -6.3167724609375, -5.862060546875, -5.4073486328125, -4.95263671875, -4.4979248046875, -4.043212890625, -3.5885009765625, -3.1337890625, -2.6790771484375, -2.224365234375, -1.7696533203125, -1.31494140625, -0.8602294921875, -0.405517578125, 0.0491943359375, 0.50390625, 0.9586181640625, 1.413330078125, 1.8680419921875, 2.32275390625, 2.7774658203125, 3.232177734375, 3.6868896484375, 4.1416015625, 4.5963134765625, 5.051025390625, 5.5057373046875, 5.96044921875, 6.4151611328125, 6.869873046875, 7.3245849609375, 7.779296875, 8.2340087890625, 8.688720703125, 9.1434326171875, 9.59814453125, 10.0528564453125, 10.507568359375, 10.9622802734375, 11.4169921875, 11.8717041015625, 12.326416015625, 12.7811279296875, 13.23583984375, 13.6905517578125, 14.145263671875, 14.5999755859375, 15.0546875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 16.0, 13.0, 29.0, 34.0, 65.0, 102.0, 144.0, 200.0, 280.0, 386.0, 602.0, 768.0, 1146.0, 1614.0, 2339.0, 3410.0, 5082.0, 7212.0, 10347.0, 15100.0, 22265.0, 32702.0, 49073.0, 72423.0, 107703.0, 160847.0, 175581.0, 123090.0, 82638.0, 55587.0, 37407.0, 25311.0, 17077.0, 11569.0, 8120.0, 5563.0, 3816.0, 2676.0, 1819.0, 1365.0, 976.0, 577.0, 484.0, 285.0, 210.0, 168.0, 106.0, 71.0, 47.0, 34.0, 25.0, 20.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.2568359375, -1.2177581787109375, -1.178680419921875, -1.1396026611328125, -1.10052490234375, -1.0614471435546875, -1.022369384765625, -0.9832916259765625, -0.9442138671875, -0.9051361083984375, -0.866058349609375, -0.8269805908203125, -0.78790283203125, -0.7488250732421875, -0.709747314453125, -0.6706695556640625, -0.631591796875, -0.5925140380859375, -0.553436279296875, -0.5143585205078125, -0.47528076171875, -0.4362030029296875, -0.397125244140625, -0.3580474853515625, -0.3189697265625, -0.2798919677734375, -0.240814208984375, -0.2017364501953125, -0.16265869140625, -0.1235809326171875, -0.084503173828125, -0.0454254150390625, -0.00634765625, 0.0327301025390625, 0.071807861328125, 0.1108856201171875, 0.14996337890625, 0.1890411376953125, 0.228118896484375, 0.2671966552734375, 0.3062744140625, 0.3453521728515625, 0.384429931640625, 0.4235076904296875, 0.46258544921875, 0.5016632080078125, 0.540740966796875, 0.5798187255859375, 0.618896484375, 0.6579742431640625, 0.697052001953125, 0.7361297607421875, 0.77520751953125, 0.8142852783203125, 0.853363037109375, 0.8924407958984375, 0.9315185546875, 0.9705963134765625, 1.009674072265625, 1.0487518310546875, 1.08782958984375, 1.1269073486328125, 1.165985107421875, 1.2050628662109375, 1.244140625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 8.0, 8.0, 6.0, 12.0, 16.0, 20.0, 14.0, 24.0, 23.0, 28.0, 33.0, 25.0, 34.0, 41.0, 53.0, 33.0, 50.0, 33.0, 1065.0, 60.0, 43.0, 29.0, 31.0, 35.0, 28.0, 34.0, 26.0, 27.0, 20.0, 23.0, 28.0, 16.0, 9.0, 15.0, 12.0, 11.0, 12.0, 7.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.79248046875, -8.5146484375, -8.23681640625, -7.958984375, -7.68115234375, -7.4033203125, -7.12548828125, -6.84765625, -6.56982421875, -6.2919921875, -6.01416015625, -5.736328125, -5.45849609375, -5.1806640625, -4.90283203125, -4.625, -4.34716796875, -4.0693359375, -3.79150390625, -3.513671875, -3.23583984375, -2.9580078125, -2.68017578125, -2.40234375, -2.12451171875, -1.8466796875, -1.56884765625, -1.291015625, -1.01318359375, -0.7353515625, -0.45751953125, -0.1796875, 0.09814453125, 0.3759765625, 0.65380859375, 0.931640625, 1.20947265625, 1.4873046875, 1.76513671875, 2.04296875, 2.32080078125, 2.5986328125, 2.87646484375, 3.154296875, 3.43212890625, 3.7099609375, 3.98779296875, 4.265625, 4.54345703125, 4.8212890625, 5.09912109375, 5.376953125, 5.65478515625, 5.9326171875, 6.21044921875, 6.48828125, 6.76611328125, 7.0439453125, 7.32177734375, 7.599609375, 7.87744140625, 8.1552734375, 8.43310546875, 8.7109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 2.0, 12.0, 12.0, 23.0, 31.0, 36.0, 54.0, 95.0, 124.0, 229.0, 296.0, 487.0, 675.0, 1060.0, 1642.0, 2415.0, 3572.0, 5348.0, 8152.0, 12737.0, 19654.0, 30416.0, 47592.0, 72686.0, 114818.0, 176645.0, 1238749.0, 127625.0, 81772.0, 53147.0, 33959.0, 21779.0, 14309.0, 9365.0, 6004.0, 3873.0, 2607.0, 1719.0, 1096.0, 740.0, 521.0, 312.0, 234.0, 190.0, 114.0, 73.0, 49.0, 31.0, 17.0, 19.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.2998046875, -1.25665283203125, -1.2135009765625, -1.17034912109375, -1.127197265625, -1.08404541015625, -1.0408935546875, -0.99774169921875, -0.95458984375, -0.91143798828125, -0.8682861328125, -0.82513427734375, -0.781982421875, -0.73883056640625, -0.6956787109375, -0.65252685546875, -0.609375, -0.56622314453125, -0.5230712890625, -0.47991943359375, -0.436767578125, -0.39361572265625, -0.3504638671875, -0.30731201171875, -0.26416015625, -0.22100830078125, -0.1778564453125, -0.13470458984375, -0.091552734375, -0.04840087890625, -0.0052490234375, 0.03790283203125, 0.0810546875, 0.12420654296875, 0.1673583984375, 0.21051025390625, 0.253662109375, 0.29681396484375, 0.3399658203125, 0.38311767578125, 0.42626953125, 0.46942138671875, 0.5125732421875, 0.55572509765625, 0.598876953125, 0.64202880859375, 0.6851806640625, 0.72833251953125, 0.771484375, 0.81463623046875, 0.8577880859375, 0.90093994140625, 0.944091796875, 0.98724365234375, 1.0303955078125, 1.07354736328125, 1.11669921875, 1.15985107421875, 1.2030029296875, 1.24615478515625, 1.289306640625, 1.33245849609375, 1.3756103515625, 1.41876220703125, 1.4619140625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 12.0, 8.0, 9.0, 8.0, 17.0, 22.0, 16.0, 32.0, 38.0, 54.0, 44.0, 76.0, 71.0, 83.0, 82.0, 79.0, 63.0, 62.0, 45.0, 32.0, 37.0, 27.0, 15.0, 17.0, 6.0, 13.0, 4.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00377655029296875, -0.00364530086517334, -0.0035140514373779297, -0.0033828020095825195, -0.0032515525817871094, -0.0031203031539916992, -0.002989053726196289, -0.002857804298400879, -0.0027265548706054688, -0.0025953054428100586, -0.0024640560150146484, -0.0023328065872192383, -0.002201557159423828, -0.002070307731628418, -0.0019390583038330078, -0.0018078088760375977, -0.0016765594482421875, -0.0015453100204467773, -0.0014140605926513672, -0.001282811164855957, -0.0011515617370605469, -0.0010203123092651367, -0.0008890628814697266, -0.0007578134536743164, -0.0006265640258789062, -0.0004953145980834961, -0.00036406517028808594, -0.00023281574249267578, -0.00010156631469726562, 2.968311309814453e-05, 0.0001609325408935547, 0.00029218196868896484, 0.000423431396484375, 0.0005546808242797852, 0.0006859302520751953, 0.0008171796798706055, 0.0009484291076660156, 0.0010796785354614258, 0.001210927963256836, 0.001342177391052246, 0.0014734268188476562, 0.0016046762466430664, 0.0017359256744384766, 0.0018671751022338867, 0.001998424530029297, 0.002129673957824707, 0.002260923385620117, 0.0023921728134155273, 0.0025234222412109375, 0.0026546716690063477, 0.002785921096801758, 0.002917170524597168, 0.003048419952392578, 0.0031796693801879883, 0.0033109188079833984, 0.0034421682357788086, 0.0035734176635742188, 0.003704667091369629, 0.003835916519165039, 0.003967165946960449, 0.004098415374755859, 0.0042296648025512695, 0.00436091423034668, 0.00449216365814209, 0.0046234130859375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 2.0, 3.0, 7.0, 6.0, 12.0, 11.0, 24.0, 27.0, 36.0, 46.0, 56.0, 89.0, 108.0, 262.0, 644.0, 59958.0, 985485.0, 989.0, 302.0, 136.0, 78.0, 67.0, 52.0, 32.0, 25.0, 18.0, 16.0, 14.0, 13.0, 5.0, 11.0, 5.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.109130859375, -0.10602474212646484, -0.10291862487792969, -0.09981250762939453, -0.09670639038085938, -0.09360027313232422, -0.09049415588378906, -0.0873880386352539, -0.08428192138671875, -0.0811758041381836, -0.07806968688964844, -0.07496356964111328, -0.07185745239257812, -0.06875133514404297, -0.06564521789550781, -0.06253910064697266, -0.0594329833984375, -0.056326866149902344, -0.05322074890136719, -0.05011463165283203, -0.047008514404296875, -0.04390239715576172, -0.04079627990722656, -0.037690162658691406, -0.03458404541015625, -0.031477928161621094, -0.028371810913085938, -0.02526569366455078, -0.022159576416015625, -0.01905345916748047, -0.015947341918945312, -0.012841224670410156, -0.009735107421875, -0.006628990173339844, -0.0035228729248046875, -0.00041675567626953125, 0.002689361572265625, 0.005795478820800781, 0.008901596069335938, 0.012007713317871094, 0.01511383056640625, 0.018219947814941406, 0.021326065063476562, 0.02443218231201172, 0.027538299560546875, 0.03064441680908203, 0.03375053405761719, 0.036856651306152344, 0.0399627685546875, 0.043068885803222656, 0.04617500305175781, 0.04928112030029297, 0.052387237548828125, 0.05549335479736328, 0.05859947204589844, 0.061705589294433594, 0.06481170654296875, 0.0679178237915039, 0.07102394104003906, 0.07413005828857422, 0.07723617553710938, 0.08034229278564453, 0.08344841003417969, 0.08655452728271484, 0.08966064453125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 39.0, 106.0, 268.0, 334.0, 167.0, 65.0, 14.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014605483738705516, -0.0013296190882101655, -0.0011986899189651012, -0.0010677606333047152, -0.0009368313476443291, -0.000805902061983943, -0.0006749728345312178, -0.0005440436070784926, -0.00041311432141810656, -0.00028218506486155093, -0.0001512558083049953, -2.032655174843967e-05, 0.00011060270480811596, 0.00024153199046850204, 0.0003724612179212272, 0.0005033904453739524, 0.0006343197310343385, 0.0007652490166947246, 0.0008961782441474497, 0.001027107471600175, 0.001158036757260561, 0.001288966042920947, 0.0014198953285813332, 0.0015508244978263974, 0.0016817537834867835, 0.0018126830691471696, 0.0019436122383922338, 0.00207454152405262, 0.002205470809713006, 0.002336400095373392, 0.002467329381033778, 0.0025982586666941643, 0.002729188185185194, 0.00286011747084558, 0.002991046756505966, 0.0031219760421663523, 0.0032529053278267384, 0.003383834380656481, 0.003514763666316867, 0.003645692951977253, 0.003776622237637639, 0.003907551523298025, 0.0040384805761277676, 0.004169410094618797, 0.00430033914744854, 0.0044312686659395695, 0.004562197718769312, 0.004693127237260342, 0.004824056290090084, 0.0049549853429198265, 0.005085914861410856, 0.005216843914240599, 0.005347773432731628, 0.005478702485561371, 0.005609632004052401, 0.005740561056882143, 0.005871490575373173, 0.006002419628202915, 0.006133349146693945, 0.006264278199523687, 0.006395207718014717, 0.0065261367708444595, 0.006657066289335489, 0.006787995342165232, 0.006918924394994974]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 16.0, 6.0, 5.0, 17.0, 26.0, 21.0, 13.0, 27.0, 32.0, 25.0, 26.0, 16.0, 27.0, 38.0, 20.0, 37.0, 49.0, 43.0, 24.0, 38.0, 29.0, 43.0, 29.0, 43.0, 20.0, 32.0, 34.0, 25.0, 25.0, 23.0, 23.0, 12.0, 20.0, 21.0, 18.0, 14.0, 15.0, 5.0, 12.0, 7.0, 7.0, 6.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0], "bins": [-0.001606285572052002, -0.0015572886914014816, -0.0015082918107509613, -0.001459294930100441, -0.0014102980494499207, -0.0013613011687994003, -0.00131230428814888, -0.0012633074074983597, -0.0012143105268478394, -0.001165313646197319, -0.0011163167655467987, -0.0010673198848962784, -0.001018323004245758, -0.0009693261235952377, -0.0009203292429447174, -0.0008713323622941971, -0.0008223354816436768, -0.0007733386009931564, -0.0007243417203426361, -0.0006753448396921158, -0.0006263479590415955, -0.0005773510783910751, -0.0005283541977405548, -0.0004793573170900345, -0.00043036043643951416, -0.00038136355578899384, -0.0003323666751384735, -0.0002833697944879532, -0.00023437291383743286, -0.00018537603318691254, -0.0001363791525363922, -8.738227188587189e-05, -3.838539123535156e-05, 1.0611489415168762e-05, 5.960837006568909e-05, 0.00010860525071620941, 0.00015760213136672974, 0.00020659901201725006, 0.0002555958926677704, 0.0003045927733182907, 0.00035358965396881104, 0.00040258653461933136, 0.0004515834152698517, 0.000500580295920372, 0.0005495771765708923, 0.0005985740572214127, 0.000647570937871933, 0.0006965678185224533, 0.0007455646991729736, 0.000794561579823494, 0.0008435584604740143, 0.0008925553411245346, 0.0009415522217750549, 0.0009905491024255753, 0.0010395459830760956, 0.001088542863726616, 0.0011375397443771362, 0.0011865366250276566, 0.0012355335056781769, 0.0012845303863286972, 0.0013335272669792175, 0.0013825241476297379, 0.0014315210282802582, 0.0014805179089307785, 0.0015295147895812988]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 9.0, 5.0, 14.0, 18.0, 13.0, 18.0, 12.0, 26.0, 24.0, 35.0, 34.0, 37.0, 37.0, 38.0, 41.0, 40.0, 57.0, 33.0, 46.0, 47.0, 45.0, 43.0, 38.0, 36.0, 28.0, 30.0, 29.0, 27.0, 24.0, 20.0, 15.0, 11.0, 14.0, 14.0, 2.0, 5.0, 8.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.046875, -13.5921630859375, -13.137451171875, -12.6827392578125, -12.22802734375, -11.7733154296875, -11.318603515625, -10.8638916015625, -10.4091796875, -9.9544677734375, -9.499755859375, -9.0450439453125, -8.59033203125, -8.1356201171875, -7.680908203125, -7.2261962890625, -6.771484375, -6.3167724609375, -5.862060546875, -5.4073486328125, -4.95263671875, -4.4979248046875, -4.043212890625, -3.5885009765625, -3.1337890625, -2.6790771484375, -2.224365234375, -1.7696533203125, -1.31494140625, -0.8602294921875, -0.405517578125, 0.0491943359375, 0.50390625, 0.9586181640625, 1.413330078125, 1.8680419921875, 2.32275390625, 2.7774658203125, 3.232177734375, 3.6868896484375, 4.1416015625, 4.5963134765625, 5.051025390625, 5.5057373046875, 5.96044921875, 6.4151611328125, 6.869873046875, 7.3245849609375, 7.779296875, 8.2340087890625, 8.688720703125, 9.1434326171875, 9.59814453125, 10.0528564453125, 10.507568359375, 10.9622802734375, 11.4169921875, 11.8717041015625, 12.326416015625, 12.7811279296875, 13.23583984375, 13.6905517578125, 14.145263671875, 14.5999755859375, 15.0546875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 13.0, 8.0, 13.0, 27.0, 29.0, 37.0, 32.0, 59.0, 76.0, 123.0, 154.0, 222.0, 374.0, 634.0, 1259.0, 4733.0, 35766.0, 632701.0, 342190.0, 23804.0, 3553.0, 1108.0, 528.0, 355.0, 210.0, 130.0, 105.0, 69.0, 56.0, 35.0, 34.0, 34.0, 16.0, 13.0, 6.0, 9.0, 9.0, 7.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.375, -25.521728515625, -24.66845703125, -23.815185546875, -22.9619140625, -22.108642578125, -21.25537109375, -20.402099609375, -19.548828125, -18.695556640625, -17.84228515625, -16.989013671875, -16.1357421875, -15.282470703125, -14.42919921875, -13.575927734375, -12.72265625, -11.869384765625, -11.01611328125, -10.162841796875, -9.3095703125, -8.456298828125, -7.60302734375, -6.749755859375, -5.896484375, -5.043212890625, -4.18994140625, -3.336669921875, -2.4833984375, -1.630126953125, -0.77685546875, 0.076416015625, 0.9296875, 1.782958984375, 2.63623046875, 3.489501953125, 4.3427734375, 5.196044921875, 6.04931640625, 6.902587890625, 7.755859375, 8.609130859375, 9.46240234375, 10.315673828125, 11.1689453125, 12.022216796875, 12.87548828125, 13.728759765625, 14.58203125, 15.435302734375, 16.28857421875, 17.141845703125, 17.9951171875, 18.848388671875, 19.70166015625, 20.554931640625, 21.408203125, 22.261474609375, 23.11474609375, 23.968017578125, 24.8212890625, 25.674560546875, 26.52783203125, 27.381103515625, 28.234375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 4.0, 6.0, 6.0, 13.0, 10.0, 9.0, 19.0, 14.0, 23.0, 23.0, 26.0, 35.0, 35.0, 42.0, 42.0, 47.0, 69.0, 88.0, 408.0, 1606.0, 95.0, 45.0, 45.0, 36.0, 41.0, 37.0, 38.0, 21.0, 26.0, 21.0, 23.0, 18.0, 12.0, 17.0, 18.0, 4.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.15625, -48.63818359375, -47.1201171875, -45.60205078125, -44.083984375, -42.56591796875, -41.0478515625, -39.52978515625, -38.01171875, -36.49365234375, -34.9755859375, -33.45751953125, -31.939453125, -30.42138671875, -28.9033203125, -27.38525390625, -25.8671875, -24.34912109375, -22.8310546875, -21.31298828125, -19.794921875, -18.27685546875, -16.7587890625, -15.24072265625, -13.72265625, -12.20458984375, -10.6865234375, -9.16845703125, -7.650390625, -6.13232421875, -4.6142578125, -3.09619140625, -1.578125, -0.06005859375, 1.4580078125, 2.97607421875, 4.494140625, 6.01220703125, 7.5302734375, 9.04833984375, 10.56640625, 12.08447265625, 13.6025390625, 15.12060546875, 16.638671875, 18.15673828125, 19.6748046875, 21.19287109375, 22.7109375, 24.22900390625, 25.7470703125, 27.26513671875, 28.783203125, 30.30126953125, 31.8193359375, 33.33740234375, 34.85546875, 36.37353515625, 37.8916015625, 39.40966796875, 40.927734375, 42.44580078125, 43.9638671875, 45.48193359375, 47.0]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 16.0, 13.0, 19.0, 18.0, 26.0, 21.0, 26.0, 28.0, 47.0, 58.0, 76.0, 102.0, 223.0, 401.0, 1219.0, 2732779.0, 408549.0, 1036.0, 342.0, 210.0, 123.0, 68.0, 64.0, 38.0, 38.0, 26.0, 28.0, 13.0, 21.0, 7.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-141.625, -137.048828125, -132.47265625, -127.896484375, -123.3203125, -118.744140625, -114.16796875, -109.591796875, -105.015625, -100.439453125, -95.86328125, -91.287109375, -86.7109375, -82.134765625, -77.55859375, -72.982421875, -68.40625, -63.830078125, -59.25390625, -54.677734375, -50.1015625, -45.525390625, -40.94921875, -36.373046875, -31.796875, -27.220703125, -22.64453125, -18.068359375, -13.4921875, -8.916015625, -4.33984375, 0.236328125, 4.8125, 9.388671875, 13.96484375, 18.541015625, 23.1171875, 27.693359375, 32.26953125, 36.845703125, 41.421875, 45.998046875, 50.57421875, 55.150390625, 59.7265625, 64.302734375, 68.87890625, 73.455078125, 78.03125, 82.607421875, 87.18359375, 91.759765625, 96.3359375, 100.912109375, 105.48828125, 110.064453125, 114.640625, 119.216796875, 123.79296875, 128.369140625, 132.9453125, 137.521484375, 142.09765625, 146.673828125, 151.25]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 18.0, 77.0, 181.0, 285.0, 249.0, 141.0, 43.0, 13.0, 6.0], "bins": [-121.4266586303711, -119.35983276367188, -117.29300689697266, -115.22618103027344, -113.15935516357422, -111.092529296875, -109.02570343017578, -106.95887756347656, -104.89205932617188, -102.82523345947266, -100.75840759277344, -98.69158172607422, -96.624755859375, -94.55792999267578, -92.49110412597656, -90.42428588867188, -88.35745239257812, -86.2906265258789, -84.22380065917969, -82.15697479248047, -80.09014892578125, -78.02332305908203, -75.95649719238281, -73.88967895507812, -71.82284545898438, -69.75601959228516, -67.68919372558594, -65.62236785888672, -63.5555419921875, -61.48871612548828, -59.42189407348633, -57.35506820678711, -55.288246154785156, -53.22142028808594, -51.15459442138672, -49.0877685546875, -47.02094268798828, -44.95411682128906, -42.88729476928711, -40.82046890258789, -38.75364303588867, -36.68681716918945, -34.619991302490234, -32.553165435791016, -30.48634147644043, -28.41951560974121, -26.352691650390625, -24.285865783691406, -22.219039916992188, -20.15221405029297, -18.08538818359375, -16.018564224243164, -13.951738357543945, -11.884912490844727, -9.818087577819824, -7.751262664794922, -5.6844377517700195, -3.617612361907959, -1.5507869720458984, 0.5160384178161621, 2.5828638076782227, 4.649689674377441, 6.716514587402344, 8.783339500427246, 10.850165367126465]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 10.0, 8.0, 15.0, 15.0, 14.0, 23.0, 14.0, 21.0, 23.0, 34.0, 36.0, 42.0, 37.0, 32.0, 42.0, 41.0, 46.0, 46.0, 35.0, 32.0, 39.0, 34.0, 24.0, 37.0, 36.0, 16.0, 24.0, 24.0, 35.0, 18.0, 15.0, 17.0, 18.0, 16.0, 20.0, 9.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.99846649169922, -115.9561767578125, -111.91388702392578, -107.87159729003906, -103.82930755615234, -99.78701782226562, -95.74473571777344, -91.70243835449219, -87.66015625, -83.61786651611328, -79.57557678222656, -75.53328704833984, -71.49099731445312, -67.4487075805664, -63.40642166137695, -59.364131927490234, -55.32183837890625, -51.27954864501953, -47.23725891113281, -43.194969177246094, -39.152679443359375, -35.110389709472656, -31.068103790283203, -27.025814056396484, -22.983524322509766, -18.941234588623047, -14.898945808410645, -10.856657028198242, -6.814367294311523, -2.7720775604248047, 1.2702102661132812, 5.3125, 9.35479736328125, 13.397087097167969, 17.439376831054688, 21.481664657592773, 25.523954391479492, 29.56624412536621, 33.6085319519043, 37.650821685791016, 41.693111419677734, 45.73540115356445, 49.77769088745117, 53.819976806640625, 57.862266540527344, 61.90455627441406, 65.94684600830078, 69.9891357421875, 74.03142547607422, 78.07371520996094, 82.11600494384766, 86.15829467773438, 90.2005844116211, 94.24287414550781, 98.28515625, 102.32745361328125, 106.36973571777344, 110.41202545166016, 114.45431518554688, 118.4966049194336, 122.53889465332031, 126.58118438720703, 130.62347412109375, 134.66575622558594, 138.7080535888672]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 7.0, 5.0, 17.0, 14.0, 12.0, 17.0, 21.0, 18.0, 21.0, 24.0, 34.0, 35.0, 28.0, 40.0, 44.0, 40.0, 51.0, 40.0, 35.0, 51.0, 45.0, 42.0, 40.0, 30.0, 36.0, 32.0, 32.0, 26.0, 16.0, 26.0, 22.0, 16.0, 14.0, 15.0, 10.0, 10.0, 6.0, 4.0, 5.0, 8.0, 9.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3046875, -13.8402099609375, -13.375732421875, -12.9112548828125, -12.44677734375, -11.9822998046875, -11.517822265625, -11.0533447265625, -10.5888671875, -10.1243896484375, -9.659912109375, -9.1954345703125, -8.73095703125, -8.2664794921875, -7.802001953125, -7.3375244140625, -6.873046875, -6.4085693359375, -5.944091796875, -5.4796142578125, -5.01513671875, -4.5506591796875, -4.086181640625, -3.6217041015625, -3.1572265625, -2.6927490234375, -2.228271484375, -1.7637939453125, -1.29931640625, -0.8348388671875, -0.370361328125, 0.0941162109375, 0.55859375, 1.0230712890625, 1.487548828125, 1.9520263671875, 2.41650390625, 2.8809814453125, 3.345458984375, 3.8099365234375, 4.2744140625, 4.7388916015625, 5.203369140625, 5.6678466796875, 6.13232421875, 6.5968017578125, 7.061279296875, 7.5257568359375, 7.990234375, 8.4547119140625, 8.919189453125, 9.3836669921875, 9.84814453125, 10.3126220703125, 10.777099609375, 11.2415771484375, 11.7060546875, 12.1705322265625, 12.635009765625, 13.0994873046875, 13.56396484375, 14.0284423828125, 14.492919921875, 14.9573974609375, 15.421875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 3.0, 8.0, 11.0, 14.0, 20.0, 23.0, 28.0, 46.0, 58.0, 81.0, 107.0, 127.0, 197.0, 347.0, 574.0, 1025.0, 2098.0, 4867.0, 13543.0, 47498.0, 202285.0, 766236.0, 1537291.0, 1134144.0, 365005.0, 84302.0, 21332.0, 7020.0, 2787.0, 1292.0, 709.0, 380.0, 224.0, 164.0, 97.0, 98.0, 66.0, 45.0, 34.0, 24.0, 17.0, 14.0, 11.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.109375, -15.584716796875, -15.06005859375, -14.535400390625, -14.0107421875, -13.486083984375, -12.96142578125, -12.436767578125, -11.912109375, -11.387451171875, -10.86279296875, -10.338134765625, -9.8134765625, -9.288818359375, -8.76416015625, -8.239501953125, -7.71484375, -7.190185546875, -6.66552734375, -6.140869140625, -5.6162109375, -5.091552734375, -4.56689453125, -4.042236328125, -3.517578125, -2.992919921875, -2.46826171875, -1.943603515625, -1.4189453125, -0.894287109375, -0.36962890625, 0.155029296875, 0.6796875, 1.204345703125, 1.72900390625, 2.253662109375, 2.7783203125, 3.302978515625, 3.82763671875, 4.352294921875, 4.876953125, 5.401611328125, 5.92626953125, 6.450927734375, 6.9755859375, 7.500244140625, 8.02490234375, 8.549560546875, 9.07421875, 9.598876953125, 10.12353515625, 10.648193359375, 11.1728515625, 11.697509765625, 12.22216796875, 12.746826171875, 13.271484375, 13.796142578125, 14.32080078125, 14.845458984375, 15.3701171875, 15.894775390625, 16.41943359375, 16.944091796875, 17.46875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 11.0, 18.0, 21.0, 34.0, 47.0, 89.0, 116.0, 163.0, 266.0, 428.0, 525.0, 652.0, 556.0, 389.0, 253.0, 182.0, 113.0, 78.0, 52.0, 37.0, 18.0, 10.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.8125, -48.641357421875, -47.47021484375, -46.299072265625, -45.1279296875, -43.956787109375, -42.78564453125, -41.614501953125, -40.443359375, -39.272216796875, -38.10107421875, -36.929931640625, -35.7587890625, -34.587646484375, -33.41650390625, -32.245361328125, -31.07421875, -29.903076171875, -28.73193359375, -27.560791015625, -26.3896484375, -25.218505859375, -24.04736328125, -22.876220703125, -21.705078125, -20.533935546875, -19.36279296875, -18.191650390625, -17.0205078125, -15.849365234375, -14.67822265625, -13.507080078125, -12.3359375, -11.164794921875, -9.99365234375, -8.822509765625, -7.6513671875, -6.480224609375, -5.30908203125, -4.137939453125, -2.966796875, -1.795654296875, -0.62451171875, 0.546630859375, 1.7177734375, 2.888916015625, 4.06005859375, 5.231201171875, 6.40234375, 7.573486328125, 8.74462890625, 9.915771484375, 11.0869140625, 12.258056640625, 13.42919921875, 14.600341796875, 15.771484375, 16.942626953125, 18.11376953125, 19.284912109375, 20.4560546875, 21.627197265625, 22.79833984375, 23.969482421875, 25.140625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 14.0, 8.0, 13.0, 28.0, 47.0, 50.0, 85.0, 134.0, 175.0, 203.0, 317.0, 530.0, 1369.0, 49474.0, 4127564.0, 11573.0, 1091.0, 503.0, 316.0, 210.0, 159.0, 117.0, 104.0, 48.0, 47.0, 31.0, 22.0, 23.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.0, -110.470703125, -105.94140625, -101.412109375, -96.8828125, -92.353515625, -87.82421875, -83.294921875, -78.765625, -74.236328125, -69.70703125, -65.177734375, -60.6484375, -56.119140625, -51.58984375, -47.060546875, -42.53125, -38.001953125, -33.47265625, -28.943359375, -24.4140625, -19.884765625, -15.35546875, -10.826171875, -6.296875, -1.767578125, 2.76171875, 7.291015625, 11.8203125, 16.349609375, 20.87890625, 25.408203125, 29.9375, 34.466796875, 38.99609375, 43.525390625, 48.0546875, 52.583984375, 57.11328125, 61.642578125, 66.171875, 70.701171875, 75.23046875, 79.759765625, 84.2890625, 88.818359375, 93.34765625, 97.876953125, 102.40625, 106.935546875, 111.46484375, 115.994140625, 120.5234375, 125.052734375, 129.58203125, 134.111328125, 138.640625, 143.169921875, 147.69921875, 152.228515625, 156.7578125, 161.287109375, 165.81640625, 170.345703125, 174.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 35.0, 155.0, 385.0, 318.0, 102.0, 13.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-511.6800231933594, -502.3577575683594, -493.0354919433594, -483.7132263183594, -474.3909606933594, -465.0686950683594, -455.7464294433594, -446.42413330078125, -437.10186767578125, -427.77960205078125, -418.45733642578125, -409.13507080078125, -399.81280517578125, -390.49053955078125, -381.16827392578125, -371.84600830078125, -362.52374267578125, -353.20147705078125, -343.87921142578125, -334.55694580078125, -325.23468017578125, -315.91241455078125, -306.59014892578125, -297.26788330078125, -287.94561767578125, -278.62335205078125, -269.30108642578125, -259.97882080078125, -250.65655517578125, -241.33428955078125, -232.0120086669922, -222.6897430419922, -213.367431640625, -204.045166015625, -194.722900390625, -185.400634765625, -176.078369140625, -166.756103515625, -157.43382263183594, -148.11155700683594, -138.789306640625, -129.467041015625, -120.144775390625, -110.82250213623047, -101.50023651123047, -92.17797088623047, -82.85569763183594, -73.53343200683594, -64.2111587524414, -54.888893127441406, -45.56662368774414, -36.244354248046875, -26.922088623046875, -17.599822998046875, -8.27755355834961, 1.0447158813476562, 10.366981506347656, 19.68924903869629, 29.011516571044922, 38.33378601074219, 47.65605163574219, 56.97831726074219, 66.30058288574219, 75.62285614013672, 84.94512176513672]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 10.0, 9.0, 17.0, 14.0, 15.0, 22.0, 14.0, 18.0, 18.0, 31.0, 30.0, 31.0, 41.0, 35.0, 39.0, 47.0, 34.0, 43.0, 37.0, 44.0, 42.0, 42.0, 48.0, 33.0, 29.0, 34.0, 43.0, 25.0, 24.0, 26.0, 19.0, 10.0, 13.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.5745849609375, -92.62934875488281, -89.68411254882812, -86.73887634277344, -83.79363250732422, -80.84839630126953, -77.90316009521484, -74.95792388916016, -72.01268005371094, -69.06744384765625, -66.12220764160156, -63.17696762084961, -60.231727600097656, -57.28649139404297, -54.34125518798828, -51.396018981933594, -48.450782775878906, -45.50554656982422, -42.560306549072266, -39.61507034301758, -36.669830322265625, -33.72459411621094, -30.77935791015625, -27.83411979675293, -24.88888168334961, -21.94364356994629, -18.99840545654297, -16.05316925048828, -13.107931137084961, -10.16269302368164, -7.217456817626953, -4.272218704223633, -1.3269805908203125, 1.6182570457458496, 4.563494682312012, 7.508731842041016, 10.453969955444336, 13.399208068847656, 16.344444274902344, 19.289682388305664, 22.234920501708984, 25.180158615112305, 28.125396728515625, 31.070632934570312, 34.015869140625, 36.96110916137695, 39.90634536743164, 42.851585388183594, 45.79682159423828, 48.74205780029297, 51.68729782104492, 54.63253402709961, 57.57777404785156, 60.52301025390625, 63.46824645996094, 66.41348266601562, 69.35871887207031, 72.303955078125, 75.24919128417969, 78.19442749023438, 81.1396713256836, 84.08490753173828, 87.03014373779297, 89.97537994384766, 92.92062377929688]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 10.0, 8.0, 14.0, 9.0, 12.0, 21.0, 14.0, 21.0, 31.0, 28.0, 32.0, 36.0, 42.0, 42.0, 39.0, 39.0, 40.0, 64.0, 34.0, 47.0, 58.0, 38.0, 41.0, 34.0, 36.0, 29.0, 23.0, 20.0, 20.0, 9.0, 23.0, 14.0, 18.0, 14.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.1275634765625, -12.653564453125, -12.1795654296875, -11.70556640625, -11.2315673828125, -10.757568359375, -10.2835693359375, -9.8095703125, -9.3355712890625, -8.861572265625, -8.3875732421875, -7.91357421875, -7.4395751953125, -6.965576171875, -6.4915771484375, -6.017578125, -5.5435791015625, -5.069580078125, -4.5955810546875, -4.12158203125, -3.6475830078125, -3.173583984375, -2.6995849609375, -2.2255859375, -1.7515869140625, -1.277587890625, -0.8035888671875, -0.32958984375, 0.1444091796875, 0.618408203125, 1.0924072265625, 1.56640625, 2.0404052734375, 2.514404296875, 2.9884033203125, 3.46240234375, 3.9364013671875, 4.410400390625, 4.8843994140625, 5.3583984375, 5.8323974609375, 6.306396484375, 6.7803955078125, 7.25439453125, 7.7283935546875, 8.202392578125, 8.6763916015625, 9.150390625, 9.6243896484375, 10.098388671875, 10.5723876953125, 11.04638671875, 11.5203857421875, 11.994384765625, 12.4683837890625, 12.9423828125, 13.4163818359375, 13.890380859375, 14.3643798828125, 14.83837890625, 15.3123779296875, 15.786376953125, 16.2603759765625, 16.734375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 11.0, 24.0, 29.0, 37.0, 65.0, 89.0, 161.0, 241.0, 368.0, 543.0, 831.0, 1295.0, 1920.0, 2972.0, 4525.0, 6953.0, 10709.0, 16182.0, 26049.0, 40733.0, 65245.0, 103418.0, 163862.0, 208581.0, 144366.0, 91295.0, 57318.0, 36019.0, 22635.0, 14910.0, 9433.0, 6117.0, 4009.0, 2669.0, 1724.0, 1097.0, 719.0, 462.0, 307.0, 226.0, 125.0, 86.0, 65.0, 46.0, 33.0, 12.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.513671875, -1.4654083251953125, -1.417144775390625, -1.3688812255859375, -1.32061767578125, -1.2723541259765625, -1.224090576171875, -1.1758270263671875, -1.1275634765625, -1.0792999267578125, -1.031036376953125, -0.9827728271484375, -0.93450927734375, -0.8862457275390625, -0.837982177734375, -0.7897186279296875, -0.741455078125, -0.6931915283203125, -0.644927978515625, -0.5966644287109375, -0.54840087890625, -0.5001373291015625, -0.451873779296875, -0.4036102294921875, -0.3553466796875, -0.3070831298828125, -0.258819580078125, -0.2105560302734375, -0.16229248046875, -0.1140289306640625, -0.065765380859375, -0.0175018310546875, 0.03076171875, 0.0790252685546875, 0.127288818359375, 0.1755523681640625, 0.22381591796875, 0.2720794677734375, 0.320343017578125, 0.3686065673828125, 0.4168701171875, 0.4651336669921875, 0.513397216796875, 0.5616607666015625, 0.60992431640625, 0.6581878662109375, 0.706451416015625, 0.7547149658203125, 0.802978515625, 0.8512420654296875, 0.899505615234375, 0.9477691650390625, 0.99603271484375, 1.0442962646484375, 1.092559814453125, 1.1408233642578125, 1.1890869140625, 1.2373504638671875, 1.285614013671875, 1.3338775634765625, 1.38214111328125, 1.4304046630859375, 1.478668212890625, 1.5269317626953125, 1.5751953125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 5.0, 6.0, 7.0, 8.0, 12.0, 19.0, 20.0, 20.0, 21.0, 20.0, 26.0, 20.0, 32.0, 17.0, 26.0, 25.0, 29.0, 34.0, 34.0, 30.0, 33.0, 31.0, 1063.0, 38.0, 34.0, 35.0, 37.0, 24.0, 36.0, 25.0, 11.0, 34.0, 22.0, 21.0, 21.0, 19.0, 20.0, 13.0, 10.0, 9.0, 11.0, 7.0, 8.0, 5.0, 10.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0], "bins": [-8.0390625, -7.80316162109375, -7.5672607421875, -7.33135986328125, -7.095458984375, -6.85955810546875, -6.6236572265625, -6.38775634765625, -6.15185546875, -5.91595458984375, -5.6800537109375, -5.44415283203125, -5.208251953125, -4.97235107421875, -4.7364501953125, -4.50054931640625, -4.2646484375, -4.02874755859375, -3.7928466796875, -3.55694580078125, -3.321044921875, -3.08514404296875, -2.8492431640625, -2.61334228515625, -2.37744140625, -2.14154052734375, -1.9056396484375, -1.66973876953125, -1.433837890625, -1.19793701171875, -0.9620361328125, -0.72613525390625, -0.490234375, -0.25433349609375, -0.0184326171875, 0.21746826171875, 0.453369140625, 0.68927001953125, 0.9251708984375, 1.16107177734375, 1.39697265625, 1.63287353515625, 1.8687744140625, 2.10467529296875, 2.340576171875, 2.57647705078125, 2.8123779296875, 3.04827880859375, 3.2841796875, 3.52008056640625, 3.7559814453125, 3.99188232421875, 4.227783203125, 4.46368408203125, 4.6995849609375, 4.93548583984375, 5.17138671875, 5.40728759765625, 5.6431884765625, 5.87908935546875, 6.114990234375, 6.35089111328125, 6.5867919921875, 6.82269287109375, 7.05859375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 18.0, 18.0, 48.0, 62.0, 93.0, 106.0, 182.0, 292.0, 397.0, 637.0, 956.0, 1290.0, 1893.0, 2801.0, 3996.0, 5724.0, 8515.0, 12503.0, 18458.0, 27521.0, 40009.0, 59729.0, 89267.0, 135297.0, 1234717.0, 149805.0, 99014.0, 66080.0, 43628.0, 30054.0, 20434.0, 13803.0, 9391.0, 6388.0, 4382.0, 3105.0, 2013.0, 1368.0, 997.0, 696.0, 449.0, 314.0, 225.0, 155.0, 108.0, 66.0, 53.0, 25.0, 11.0, 11.0, 4.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.2744140625, -1.2341156005859375, -1.193817138671875, -1.1535186767578125, -1.11322021484375, -1.0729217529296875, -1.032623291015625, -0.9923248291015625, -0.9520263671875, -0.9117279052734375, -0.871429443359375, -0.8311309814453125, -0.79083251953125, -0.7505340576171875, -0.710235595703125, -0.6699371337890625, -0.629638671875, -0.5893402099609375, -0.549041748046875, -0.5087432861328125, -0.46844482421875, -0.4281463623046875, -0.387847900390625, -0.3475494384765625, -0.3072509765625, -0.2669525146484375, -0.226654052734375, -0.1863555908203125, -0.14605712890625, -0.1057586669921875, -0.065460205078125, -0.0251617431640625, 0.01513671875, 0.0554351806640625, 0.095733642578125, 0.1360321044921875, 0.17633056640625, 0.2166290283203125, 0.256927490234375, 0.2972259521484375, 0.3375244140625, 0.3778228759765625, 0.418121337890625, 0.4584197998046875, 0.49871826171875, 0.5390167236328125, 0.579315185546875, 0.6196136474609375, 0.659912109375, 0.7002105712890625, 0.740509033203125, 0.7808074951171875, 0.82110595703125, 0.8614044189453125, 0.901702880859375, 0.9420013427734375, 0.9822998046875, 1.0225982666015625, 1.062896728515625, 1.1031951904296875, 1.14349365234375, 1.1837921142578125, 1.224090576171875, 1.2643890380859375, 1.3046875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 4.0, 11.0, 14.0, 11.0, 19.0, 24.0, 53.0, 46.0, 50.0, 62.0, 116.0, 101.0, 105.0, 68.0, 80.0, 62.0, 44.0, 34.0, 25.0, 15.0, 15.0, 11.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003940582275390625, -0.003789365291595459, -0.003638148307800293, -0.003486931324005127, -0.003335714340209961, -0.003184497356414795, -0.003033280372619629, -0.002882063388824463, -0.002730846405029297, -0.002579629421234131, -0.002428412437438965, -0.002277195453643799, -0.002125978469848633, -0.001974761486053467, -0.0018235445022583008, -0.0016723275184631348, -0.0015211105346679688, -0.0013698935508728027, -0.0012186765670776367, -0.0010674595832824707, -0.0009162425994873047, -0.0007650256156921387, -0.0006138086318969727, -0.00046259164810180664, -0.0003113746643066406, -0.0001601576805114746, -8.940696716308594e-06, 0.00014227628707885742, 0.00029349327087402344, 0.00044471025466918945, 0.0005959272384643555, 0.0007471442222595215, 0.0008983612060546875, 0.0010495781898498535, 0.0012007951736450195, 0.0013520121574401855, 0.0015032291412353516, 0.0016544461250305176, 0.0018056631088256836, 0.0019568800926208496, 0.0021080970764160156, 0.0022593140602111816, 0.0024105310440063477, 0.0025617480278015137, 0.0027129650115966797, 0.0028641819953918457, 0.0030153989791870117, 0.0031666159629821777, 0.0033178329467773438, 0.0034690499305725098, 0.0036202669143676758, 0.003771483898162842, 0.003922700881958008, 0.004073917865753174, 0.00422513484954834, 0.004376351833343506, 0.004527568817138672, 0.004678785800933838, 0.004830002784729004, 0.00498121976852417, 0.005132436752319336, 0.005283653736114502, 0.005434870719909668, 0.005586087703704834, 0.0057373046875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 12.0, 34.0, 26.0, 58.0, 98.0, 161.0, 319.0, 1652.0, 1043676.0, 1649.0, 384.0, 155.0, 96.0, 59.0, 51.0, 29.0, 15.0, 13.0, 9.0, 7.0, 1.0, 9.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1435546875, -0.1397256851196289, -0.1358966827392578, -0.13206768035888672, -0.12823867797851562, -0.12440967559814453, -0.12058067321777344, -0.11675167083740234, -0.11292266845703125, -0.10909366607666016, -0.10526466369628906, -0.10143566131591797, -0.09760665893554688, -0.09377765655517578, -0.08994865417480469, -0.0861196517944336, -0.0822906494140625, -0.0784616470336914, -0.07463264465332031, -0.07080364227294922, -0.06697463989257812, -0.06314563751220703, -0.05931663513183594, -0.055487632751464844, -0.05165863037109375, -0.047829627990722656, -0.04400062561035156, -0.04017162322998047, -0.036342620849609375, -0.03251361846923828, -0.028684616088867188, -0.024855613708496094, -0.021026611328125, -0.017197608947753906, -0.013368606567382812, -0.009539604187011719, -0.005710601806640625, -0.0018815994262695312, 0.0019474029541015625, 0.005776405334472656, 0.00960540771484375, 0.013434410095214844, 0.017263412475585938, 0.02109241485595703, 0.024921417236328125, 0.02875041961669922, 0.03257942199707031, 0.036408424377441406, 0.0402374267578125, 0.044066429138183594, 0.04789543151855469, 0.05172443389892578, 0.055553436279296875, 0.05938243865966797, 0.06321144104003906, 0.06704044342041016, 0.07086944580078125, 0.07469844818115234, 0.07852745056152344, 0.08235645294189453, 0.08618545532226562, 0.09001445770263672, 0.09384346008300781, 0.0976724624633789, 0.10150146484375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 20.0, 691.0, 300.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002911006798967719, -0.002484816126525402, -0.002058625454083085, -0.0016324346652254462, -0.0012062439927831292, -0.0007800532039254904, -0.00035386253148317337, 7.232814095914364e-05, 0.0004985188134014606, 0.0009247094858437777, 0.0013509001582860947, 0.0017770909471437335, 0.0022032815031707287, 0.0026294724084436893, 0.0030556630808860064, 0.0034818537533283234, 0.003908044658601284, 0.004334235563874245, 0.004760426003485918, 0.005186616908758879, 0.005612807348370552, 0.006038998253643513, 0.006465189158916473, 0.006891379598528147, 0.00731757003813982, 0.007743760943412781, 0.008169951848685741, 0.008596141822636127, 0.009022332727909088, 0.009448523633182049, 0.00987471453845501, 0.010300904512405396, 0.010727095417678356, 0.011153286322951317, 0.011579477228224277, 0.012005667202174664, 0.012431858107447624, 0.012858049012720585, 0.013284239917993546, 0.013710429891943932, 0.014136620797216892, 0.014562811702489853, 0.014989002607762814, 0.0154151925817132, 0.01584138348698616, 0.016267575323581696, 0.01669376529753208, 0.017119955271482468, 0.017546147108078003, 0.01797233708202839, 0.018398528918623924, 0.01882471889257431, 0.019250910729169846, 0.01967710070312023, 0.020103290677070618, 0.020529482513666153, 0.02095567248761654, 0.021381862461566925, 0.02180805429816246, 0.022234244272112846, 0.02266043610870838, 0.023086626082658768, 0.023512816056609154, 0.02393900789320469, 0.024365197867155075]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 7.0, 9.0, 7.0, 7.0, 8.0, 13.0, 13.0, 25.0, 15.0, 13.0, 19.0, 30.0, 25.0, 24.0, 31.0, 41.0, 36.0, 36.0, 37.0, 33.0, 37.0, 39.0, 28.0, 39.0, 36.0, 35.0, 42.0, 29.0, 30.0, 27.0, 31.0, 21.0, 22.0, 18.0, 24.0, 23.0, 12.0, 17.0, 10.0, 11.0, 7.0, 10.0, 2.0, 8.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.001588284969329834, -0.0015390831977128983, -0.0014898814260959625, -0.0014406796544790268, -0.001391477882862091, -0.0013422761112451553, -0.0012930743396282196, -0.0012438725680112839, -0.0011946707963943481, -0.0011454690247774124, -0.0010962672531604767, -0.001047065481543541, -0.0009978637099266052, -0.0009486619383096695, -0.0008994601666927338, -0.000850258395075798, -0.0008010566234588623, -0.0007518548518419266, -0.0007026530802249908, -0.0006534513086080551, -0.0006042495369911194, -0.0005550477653741837, -0.0005058459937572479, -0.0004566442221403122, -0.00040744245052337646, -0.00035824067890644073, -0.000309038907289505, -0.0002598371356725693, -0.00021063536405563354, -0.00016143359243869781, -0.00011223182082176208, -6.303004920482635e-05, -1.3828277587890625e-05, 3.5373494029045105e-05, 8.457526564598083e-05, 0.00013377703726291656, 0.0001829788088798523, 0.00023218058049678802, 0.00028138235211372375, 0.0003305841237306595, 0.0003797858953475952, 0.00042898766696453094, 0.0004781894385814667, 0.0005273912101984024, 0.0005765929818153381, 0.0006257947534322739, 0.0006749965250492096, 0.0007241982966661453, 0.0007734000682830811, 0.0008226018399000168, 0.0008718036115169525, 0.0009210053831338882, 0.000970207154750824, 0.0010194089263677597, 0.0010686106979846954, 0.0011178124696016312, 0.001167014241218567, 0.0012162160128355026, 0.0012654177844524384, 0.001314619556069374, 0.0013638213276863098, 0.0014130230993032455, 0.0014622248709201813, 0.001511426642537117, 0.0015606284141540527]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 10.0, 8.0, 14.0, 9.0, 12.0, 21.0, 14.0, 21.0, 31.0, 28.0, 32.0, 36.0, 42.0, 42.0, 39.0, 40.0, 39.0, 64.0, 34.0, 47.0, 58.0, 38.0, 41.0, 34.0, 36.0, 29.0, 23.0, 20.0, 20.0, 9.0, 23.0, 14.0, 18.0, 14.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.1275634765625, -12.653564453125, -12.1795654296875, -11.70556640625, -11.2315673828125, -10.757568359375, -10.2835693359375, -9.8095703125, -9.3355712890625, -8.861572265625, -8.3875732421875, -7.91357421875, -7.4395751953125, -6.965576171875, -6.4915771484375, -6.017578125, -5.5435791015625, -5.069580078125, -4.5955810546875, -4.12158203125, -3.6475830078125, -3.173583984375, -2.6995849609375, -2.2255859375, -1.7515869140625, -1.277587890625, -0.8035888671875, -0.32958984375, 0.1444091796875, 0.618408203125, 1.0924072265625, 1.56640625, 2.0404052734375, 2.514404296875, 2.9884033203125, 3.46240234375, 3.9364013671875, 4.410400390625, 4.8843994140625, 5.3583984375, 5.8323974609375, 6.306396484375, 6.7803955078125, 7.25439453125, 7.7283935546875, 8.202392578125, 8.6763916015625, 9.150390625, 9.6243896484375, 10.098388671875, 10.5723876953125, 11.04638671875, 11.5203857421875, 11.994384765625, 12.4683837890625, 12.9423828125, 13.4163818359375, 13.890380859375, 14.3643798828125, 14.83837890625, 15.3123779296875, 15.786376953125, 16.2603759765625, 16.734375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 5.0, 12.0, 14.0, 13.0, 15.0, 23.0, 32.0, 34.0, 37.0, 83.0, 150.0, 244.0, 520.0, 1293.0, 3021.0, 7427.0, 18473.0, 48062.0, 140511.0, 419270.0, 273377.0, 84306.0, 30889.0, 12164.0, 4823.0, 1975.0, 855.0, 375.0, 187.0, 110.0, 62.0, 44.0, 36.0, 28.0, 25.0, 17.0, 15.0, 7.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9765625, -11.560302734375, -11.14404296875, -10.727783203125, -10.3115234375, -9.895263671875, -9.47900390625, -9.062744140625, -8.646484375, -8.230224609375, -7.81396484375, -7.397705078125, -6.9814453125, -6.565185546875, -6.14892578125, -5.732666015625, -5.31640625, -4.900146484375, -4.48388671875, -4.067626953125, -3.6513671875, -3.235107421875, -2.81884765625, -2.402587890625, -1.986328125, -1.570068359375, -1.15380859375, -0.737548828125, -0.3212890625, 0.094970703125, 0.51123046875, 0.927490234375, 1.34375, 1.760009765625, 2.17626953125, 2.592529296875, 3.0087890625, 3.425048828125, 3.84130859375, 4.257568359375, 4.673828125, 5.090087890625, 5.50634765625, 5.922607421875, 6.3388671875, 6.755126953125, 7.17138671875, 7.587646484375, 8.00390625, 8.420166015625, 8.83642578125, 9.252685546875, 9.6689453125, 10.085205078125, 10.50146484375, 10.917724609375, 11.333984375, 11.750244140625, 12.16650390625, 12.582763671875, 12.9990234375, 13.415283203125, 13.83154296875, 14.247802734375, 14.6640625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 1.0, 6.0, 8.0, 9.0, 7.0, 11.0, 16.0, 11.0, 13.0, 18.0, 17.0, 25.0, 25.0, 26.0, 30.0, 27.0, 32.0, 33.0, 39.0, 58.0, 87.0, 256.0, 1556.0, 208.0, 91.0, 51.0, 42.0, 37.0, 36.0, 31.0, 32.0, 24.0, 28.0, 18.0, 19.0, 18.0, 13.0, 17.0, 11.0, 14.0, 4.0, 8.0, 3.0, 5.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-41.09375, -39.828125, -38.5625, -37.296875, -36.03125, -34.765625, -33.5, -32.234375, -30.96875, -29.703125, -28.4375, -27.171875, -25.90625, -24.640625, -23.375, -22.109375, -20.84375, -19.578125, -18.3125, -17.046875, -15.78125, -14.515625, -13.25, -11.984375, -10.71875, -9.453125, -8.1875, -6.921875, -5.65625, -4.390625, -3.125, -1.859375, -0.59375, 0.671875, 1.9375, 3.203125, 4.46875, 5.734375, 7.0, 8.265625, 9.53125, 10.796875, 12.0625, 13.328125, 14.59375, 15.859375, 17.125, 18.390625, 19.65625, 20.921875, 22.1875, 23.453125, 24.71875, 25.984375, 27.25, 28.515625, 29.78125, 31.046875, 32.3125, 33.578125, 34.84375, 36.109375, 37.375, 38.640625, 39.90625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 10.0, 8.0, 5.0, 9.0, 12.0, 25.0, 19.0, 19.0, 27.0, 38.0, 39.0, 66.0, 79.0, 110.0, 123.0, 204.0, 272.0, 416.0, 1029.0, 11944.0, 2887215.0, 238631.0, 3445.0, 681.0, 341.0, 218.0, 143.0, 133.0, 105.0, 69.0, 58.0, 43.0, 29.0, 20.0, 26.0, 18.0, 17.0, 10.0, 12.0, 7.0, 4.0, 4.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-79.5, -77.2158203125, -74.931640625, -72.6474609375, -70.36328125, -68.0791015625, -65.794921875, -63.5107421875, -61.2265625, -58.9423828125, -56.658203125, -54.3740234375, -52.08984375, -49.8056640625, -47.521484375, -45.2373046875, -42.953125, -40.6689453125, -38.384765625, -36.1005859375, -33.81640625, -31.5322265625, -29.248046875, -26.9638671875, -24.6796875, -22.3955078125, -20.111328125, -17.8271484375, -15.54296875, -13.2587890625, -10.974609375, -8.6904296875, -6.40625, -4.1220703125, -1.837890625, 0.4462890625, 2.73046875, 5.0146484375, 7.298828125, 9.5830078125, 11.8671875, 14.1513671875, 16.435546875, 18.7197265625, 21.00390625, 23.2880859375, 25.572265625, 27.8564453125, 30.140625, 32.4248046875, 34.708984375, 36.9931640625, 39.27734375, 41.5615234375, 43.845703125, 46.1298828125, 48.4140625, 50.6982421875, 52.982421875, 55.2666015625, 57.55078125, 59.8349609375, 62.119140625, 64.4033203125, 66.6875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [514.0, 504.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.902969360351562, -0.14458084106445312, 17.613807678222656, 35.372196197509766, 53.130584716796875, 70.88897705078125, 88.6473617553711, 106.40574645996094, 124.16413879394531, 141.9225311279297, 159.680908203125, 177.43930053710938, 195.19769287109375, 212.95608520507812, 230.7144775390625, 248.4728546142578, 266.23126220703125, 283.9896545410156, 301.748046875, 319.5064392089844, 337.26483154296875, 355.023193359375, 372.7815856933594, 390.53997802734375, 408.29833984375, 426.0567321777344, 443.81512451171875, 461.5735168457031, 479.3319091796875, 497.09027099609375, 514.8486938476562, 532.6070556640625, 550.365478515625, 568.1238403320312, 585.8822631835938, 603.640625, 621.3990478515625, 639.1574096679688, 656.9158325195312, 674.6741943359375, 692.4326171875, 710.1909790039062, 727.9494018554688, 745.707763671875, 763.4661865234375, 781.2245483398438, 798.9829711914062, 816.7413330078125, 834.4996948242188, 852.258056640625, 870.0164794921875, 887.7748413085938, 905.5332641601562, 923.2916259765625, 941.050048828125, 958.8084106445312, 976.5667724609375, 994.3251342773438, 1012.0835571289062, 1029.8419189453125, 1047.600341796875, 1065.3587646484375, 1083.1170654296875, 1100.87548828125, 1118.6339111328125]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 2.0, 8.0, 12.0, 12.0, 15.0, 10.0, 17.0, 16.0, 18.0, 28.0, 23.0, 35.0, 29.0, 46.0, 42.0, 38.0, 35.0, 33.0, 44.0, 44.0, 53.0, 50.0, 41.0, 33.0, 39.0, 37.0, 31.0, 28.0, 22.0, 30.0, 20.0, 20.0, 14.0, 13.0, 10.0, 15.0, 4.0, 2.0, 7.0, 8.0, 6.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-121.51361083984375, -117.98515319824219, -114.4566879272461, -110.92822265625, -107.39976501464844, -103.87130737304688, -100.34284210205078, -96.81437683105469, -93.28591918945312, -89.75746154785156, -86.22899627685547, -82.70053100585938, -79.17207336425781, -75.64361572265625, -72.11515045166016, -68.58668518066406, -65.0582275390625, -61.52976608276367, -58.001304626464844, -54.472843170166016, -50.94438171386719, -47.41592025756836, -43.88745880126953, -40.3589973449707, -36.830535888671875, -33.30207443237305, -29.77361297607422, -26.24515151977539, -22.716690063476562, -19.188228607177734, -15.659767150878906, -12.131305694580078, -8.60284423828125, -5.074382781982422, -1.5459213256835938, 1.9825401306152344, 5.5110015869140625, 9.03946304321289, 12.567924499511719, 16.096385955810547, 19.624847412109375, 23.153308868408203, 26.68177032470703, 30.21023178100586, 33.73869323730469, 37.267154693603516, 40.795616149902344, 44.32407760620117, 47.8525390625, 51.38100051879883, 54.909461975097656, 58.437923431396484, 61.96638488769531, 65.49484252929688, 69.02330780029297, 72.55177307128906, 76.08023071289062, 79.60868835449219, 83.13715362548828, 86.66561889648438, 90.19407653808594, 93.7225341796875, 97.2509994506836, 100.77946472167969, 104.30792236328125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 3.0, 3.0, 4.0, 12.0, 13.0, 11.0, 12.0, 16.0, 21.0, 25.0, 22.0, 35.0, 31.0, 36.0, 40.0, 37.0, 39.0, 45.0, 48.0, 53.0, 47.0, 46.0, 50.0, 41.0, 35.0, 42.0, 42.0, 27.0, 21.0, 25.0, 16.0, 17.0, 17.0, 14.0, 16.0, 15.0, 10.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.578125, -14.07177734375, -13.5654296875, -13.05908203125, -12.552734375, -12.04638671875, -11.5400390625, -11.03369140625, -10.52734375, -10.02099609375, -9.5146484375, -9.00830078125, -8.501953125, -7.99560546875, -7.4892578125, -6.98291015625, -6.4765625, -5.97021484375, -5.4638671875, -4.95751953125, -4.451171875, -3.94482421875, -3.4384765625, -2.93212890625, -2.42578125, -1.91943359375, -1.4130859375, -0.90673828125, -0.400390625, 0.10595703125, 0.6123046875, 1.11865234375, 1.625, 2.13134765625, 2.6376953125, 3.14404296875, 3.650390625, 4.15673828125, 4.6630859375, 5.16943359375, 5.67578125, 6.18212890625, 6.6884765625, 7.19482421875, 7.701171875, 8.20751953125, 8.7138671875, 9.22021484375, 9.7265625, 10.23291015625, 10.7392578125, 11.24560546875, 11.751953125, 12.25830078125, 12.7646484375, 13.27099609375, 13.77734375, 14.28369140625, 14.7900390625, 15.29638671875, 15.802734375, 16.30908203125, 16.8154296875, 17.32177734375, 17.828125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 5.0, 6.0, 4.0, 10.0, 12.0, 9.0, 14.0, 24.0, 27.0, 22.0, 43.0, 45.0, 57.0, 67.0, 85.0, 113.0, 221.0, 564.0, 4313.0, 153846.0, 3594068.0, 431292.0, 7741.0, 839.0, 265.0, 139.0, 95.0, 71.0, 55.0, 44.0, 21.0, 33.0, 34.0, 15.0, 12.0, 20.0, 13.0, 7.0, 6.0, 6.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.25, -44.57470703125, -42.8994140625, -41.22412109375, -39.548828125, -37.87353515625, -36.1982421875, -34.52294921875, -32.84765625, -31.17236328125, -29.4970703125, -27.82177734375, -26.146484375, -24.47119140625, -22.7958984375, -21.12060546875, -19.4453125, -17.77001953125, -16.0947265625, -14.41943359375, -12.744140625, -11.06884765625, -9.3935546875, -7.71826171875, -6.04296875, -4.36767578125, -2.6923828125, -1.01708984375, 0.658203125, 2.33349609375, 4.0087890625, 5.68408203125, 7.359375, 9.03466796875, 10.7099609375, 12.38525390625, 14.060546875, 15.73583984375, 17.4111328125, 19.08642578125, 20.76171875, 22.43701171875, 24.1123046875, 25.78759765625, 27.462890625, 29.13818359375, 30.8134765625, 32.48876953125, 34.1640625, 35.83935546875, 37.5146484375, 39.18994140625, 40.865234375, 42.54052734375, 44.2158203125, 45.89111328125, 47.56640625, 49.24169921875, 50.9169921875, 52.59228515625, 54.267578125, 55.94287109375, 57.6181640625, 59.29345703125, 60.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 9.0, 15.0, 16.0, 29.0, 46.0, 72.0, 82.0, 98.0, 132.0, 203.0, 288.0, 383.0, 512.0, 502.0, 474.0, 325.0, 243.0, 162.0, 121.0, 90.0, 64.0, 56.0, 30.0, 25.0, 13.0, 15.0, 14.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.703125, -25.875, -25.046875, -24.21875, -23.390625, -22.5625, -21.734375, -20.90625, -20.078125, -19.25, -18.421875, -17.59375, -16.765625, -15.9375, -15.109375, -14.28125, -13.453125, -12.625, -11.796875, -10.96875, -10.140625, -9.3125, -8.484375, -7.65625, -6.828125, -6.0, -5.171875, -4.34375, -3.515625, -2.6875, -1.859375, -1.03125, -0.203125, 0.625, 1.453125, 2.28125, 3.109375, 3.9375, 4.765625, 5.59375, 6.421875, 7.25, 8.078125, 8.90625, 9.734375, 10.5625, 11.390625, 12.21875, 13.046875, 13.875, 14.703125, 15.53125, 16.359375, 17.1875, 18.015625, 18.84375, 19.671875, 20.5, 21.328125, 22.15625, 22.984375, 23.8125, 24.640625, 25.46875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 4.0, 10.0, 9.0, 16.0, 14.0, 21.0, 23.0, 25.0, 42.0, 65.0, 83.0, 123.0, 146.0, 198.0, 304.0, 582.0, 2134.0, 268496.0, 3912577.0, 7329.0, 770.0, 370.0, 246.0, 180.0, 103.0, 103.0, 81.0, 57.0, 50.0, 17.0, 29.0, 19.0, 11.0, 9.0, 10.0, 3.0, 8.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.0, -130.673828125, -126.34765625, -122.021484375, -117.6953125, -113.369140625, -109.04296875, -104.716796875, -100.390625, -96.064453125, -91.73828125, -87.412109375, -83.0859375, -78.759765625, -74.43359375, -70.107421875, -65.78125, -61.455078125, -57.12890625, -52.802734375, -48.4765625, -44.150390625, -39.82421875, -35.498046875, -31.171875, -26.845703125, -22.51953125, -18.193359375, -13.8671875, -9.541015625, -5.21484375, -0.888671875, 3.4375, 7.763671875, 12.08984375, 16.416015625, 20.7421875, 25.068359375, 29.39453125, 33.720703125, 38.046875, 42.373046875, 46.69921875, 51.025390625, 55.3515625, 59.677734375, 64.00390625, 68.330078125, 72.65625, 76.982421875, 81.30859375, 85.634765625, 89.9609375, 94.287109375, 98.61328125, 102.939453125, 107.265625, 111.591796875, 115.91796875, 120.244140625, 124.5703125, 128.896484375, 133.22265625, 137.548828125, 141.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 100.0, 296.0, 331.0, 204.0, 53.0, 15.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.96385192871094, -217.29205322265625, -209.62026977539062, -201.94847106933594, -194.27667236328125, -186.60487365722656, -178.93307495117188, -171.26129150390625, -163.58949279785156, -155.91769409179688, -148.24591064453125, -140.57411193847656, -132.90231323242188, -125.23051452636719, -117.55872344970703, -109.88693237304688, -102.21513366699219, -94.5433349609375, -86.87154388427734, -79.19975280761719, -71.5279541015625, -63.85615921020508, -56.184364318847656, -48.512569427490234, -40.84077453613281, -33.16897964477539, -25.49718475341797, -17.825389862060547, -10.153594970703125, -2.481800079345703, 5.189994812011719, 12.86178970336914, 20.5335693359375, 28.205364227294922, 35.877159118652344, 43.548954010009766, 51.22074890136719, 58.89254379272461, 66.56433868408203, 74.23612976074219, 81.90792846679688, 89.57972717285156, 97.25151824951172, 104.92330932617188, 112.59510803222656, 120.26690673828125, 127.9386978149414, 135.61048889160156, 143.28228759765625, 150.95408630371094, 158.62588500976562, 166.29766845703125, 173.96946716308594, 181.64126586914062, 189.31304931640625, 196.98484802246094, 204.65664672851562, 212.3284454345703, 220.000244140625, 227.67202758789062, 235.3438262939453, 243.015625, 250.68740844726562, 258.3592224121094, 266.031005859375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 12.0, 9.0, 10.0, 14.0, 18.0, 17.0, 28.0, 26.0, 27.0, 22.0, 32.0, 49.0, 49.0, 51.0, 48.0, 56.0, 50.0, 41.0, 35.0, 41.0, 46.0, 42.0, 34.0, 37.0, 29.0, 25.0, 21.0, 23.0, 23.0, 15.0, 15.0, 11.0, 14.0, 8.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.64910888671875, -82.68594360351562, -79.7227783203125, -76.75960540771484, -73.79644012451172, -70.8332748413086, -67.87010192871094, -64.90693664550781, -61.94377136230469, -58.98060607910156, -56.01743698120117, -53.05426788330078, -50.091102600097656, -47.12793731689453, -44.16476821899414, -41.20159912109375, -38.238433837890625, -35.2752685546875, -32.31209945678711, -29.34893226623535, -26.385765075683594, -23.422597885131836, -20.459430694580078, -17.49626350402832, -14.533096313476562, -11.569929122924805, -8.606761932373047, -5.643594741821289, -2.6804275512695312, 0.28273963928222656, 3.2459068298339844, 6.209074020385742, 9.1722412109375, 12.135408401489258, 15.098575592041016, 18.061742782592773, 21.02490997314453, 23.98807716369629, 26.951244354248047, 29.914411544799805, 32.87757873535156, 35.84074401855469, 38.80391311645508, 41.76708221435547, 44.730247497558594, 47.69341278076172, 50.65658187866211, 53.6197509765625, 56.582916259765625, 59.54608154296875, 62.50925064086914, 65.47241973876953, 68.43558502197266, 71.39875030517578, 74.36192321777344, 77.32508850097656, 80.28825378417969, 83.25141906738281, 86.21458435058594, 89.1777572631836, 92.14092254638672, 95.10408782958984, 98.0672607421875, 101.03042602539062, 103.99359130859375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 6.0, 8.0, 16.0, 19.0, 16.0, 18.0, 20.0, 12.0, 30.0, 21.0, 38.0, 34.0, 48.0, 25.0, 50.0, 48.0, 32.0, 52.0, 46.0, 49.0, 43.0, 42.0, 51.0, 36.0, 30.0, 27.0, 26.0, 28.0, 19.0, 20.0, 19.0, 11.0, 11.0, 6.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.640625, -14.14990234375, -13.6591796875, -13.16845703125, -12.677734375, -12.18701171875, -11.6962890625, -11.20556640625, -10.71484375, -10.22412109375, -9.7333984375, -9.24267578125, -8.751953125, -8.26123046875, -7.7705078125, -7.27978515625, -6.7890625, -6.29833984375, -5.8076171875, -5.31689453125, -4.826171875, -4.33544921875, -3.8447265625, -3.35400390625, -2.86328125, -2.37255859375, -1.8818359375, -1.39111328125, -0.900390625, -0.40966796875, 0.0810546875, 0.57177734375, 1.0625, 1.55322265625, 2.0439453125, 2.53466796875, 3.025390625, 3.51611328125, 4.0068359375, 4.49755859375, 4.98828125, 5.47900390625, 5.9697265625, 6.46044921875, 6.951171875, 7.44189453125, 7.9326171875, 8.42333984375, 8.9140625, 9.40478515625, 9.8955078125, 10.38623046875, 10.876953125, 11.36767578125, 11.8583984375, 12.34912109375, 12.83984375, 13.33056640625, 13.8212890625, 14.31201171875, 14.802734375, 15.29345703125, 15.7841796875, 16.27490234375, 16.765625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 9.0, 21.0, 15.0, 36.0, 69.0, 116.0, 161.0, 244.0, 365.0, 580.0, 925.0, 1437.0, 2307.0, 3721.0, 5851.0, 9431.0, 14997.0, 24130.0, 39073.0, 64010.0, 107684.0, 180950.0, 224266.0, 144993.0, 86568.0, 51984.0, 31749.0, 19860.0, 12423.0, 7586.0, 4726.0, 3026.0, 1946.0, 1191.0, 746.0, 475.0, 301.0, 194.0, 135.0, 73.0, 64.0, 48.0, 23.0, 11.0, 10.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.5789031982421875, -1.524993896484375, -1.4710845947265625, -1.41717529296875, -1.3632659912109375, -1.309356689453125, -1.2554473876953125, -1.2015380859375, -1.1476287841796875, -1.093719482421875, -1.0398101806640625, -0.98590087890625, -0.9319915771484375, -0.878082275390625, -0.8241729736328125, -0.770263671875, -0.7163543701171875, -0.662445068359375, -0.6085357666015625, -0.55462646484375, -0.5007171630859375, -0.446807861328125, -0.3928985595703125, -0.3389892578125, -0.2850799560546875, -0.231170654296875, -0.1772613525390625, -0.12335205078125, -0.0694427490234375, -0.015533447265625, 0.0383758544921875, 0.09228515625, 0.1461944580078125, 0.200103759765625, 0.2540130615234375, 0.30792236328125, 0.3618316650390625, 0.415740966796875, 0.4696502685546875, 0.5235595703125, 0.5774688720703125, 0.631378173828125, 0.6852874755859375, 0.73919677734375, 0.7931060791015625, 0.847015380859375, 0.9009246826171875, 0.954833984375, 1.0087432861328125, 1.062652587890625, 1.1165618896484375, 1.17047119140625, 1.2243804931640625, 1.278289794921875, 1.3321990966796875, 1.3861083984375, 1.4400177001953125, 1.493927001953125, 1.5478363037109375, 1.60174560546875, 1.6556549072265625, 1.709564208984375, 1.7634735107421875, 1.8173828125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 12.0, 8.0, 12.0, 14.0, 17.0, 23.0, 17.0, 20.0, 35.0, 27.0, 28.0, 32.0, 40.0, 36.0, 28.0, 41.0, 32.0, 1073.0, 39.0, 38.0, 31.0, 39.0, 37.0, 37.0, 34.0, 31.0, 31.0, 23.0, 20.0, 19.0, 18.0, 27.0, 18.0, 13.0, 11.0, 10.0, 10.0, 7.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.7012939453125, -8.426025390625, -8.1507568359375, -7.87548828125, -7.6002197265625, -7.324951171875, -7.0496826171875, -6.7744140625, -6.4991455078125, -6.223876953125, -5.9486083984375, -5.67333984375, -5.3980712890625, -5.122802734375, -4.8475341796875, -4.572265625, -4.2969970703125, -4.021728515625, -3.7464599609375, -3.47119140625, -3.1959228515625, -2.920654296875, -2.6453857421875, -2.3701171875, -2.0948486328125, -1.819580078125, -1.5443115234375, -1.26904296875, -0.9937744140625, -0.718505859375, -0.4432373046875, -0.16796875, 0.1072998046875, 0.382568359375, 0.6578369140625, 0.93310546875, 1.2083740234375, 1.483642578125, 1.7589111328125, 2.0341796875, 2.3094482421875, 2.584716796875, 2.8599853515625, 3.13525390625, 3.4105224609375, 3.685791015625, 3.9610595703125, 4.236328125, 4.5115966796875, 4.786865234375, 5.0621337890625, 5.33740234375, 5.6126708984375, 5.887939453125, 6.1632080078125, 6.4384765625, 6.7137451171875, 6.989013671875, 7.2642822265625, 7.53955078125, 7.8148193359375, 8.090087890625, 8.3653564453125, 8.640625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 18.0, 19.0, 24.0, 46.0, 74.0, 110.0, 179.0, 253.0, 407.0, 556.0, 829.0, 1345.0, 2043.0, 2969.0, 4746.0, 7159.0, 11378.0, 17388.0, 27025.0, 41798.0, 64877.0, 104149.0, 163074.0, 1248262.0, 145120.0, 90844.0, 57698.0, 37029.0, 24026.0, 15488.0, 10000.0, 6198.0, 4293.0, 2654.0, 1760.0, 1115.0, 727.0, 503.0, 323.0, 205.0, 140.0, 85.0, 58.0, 44.0, 39.0, 16.0, 18.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4384765625, -1.392608642578125, -1.34674072265625, -1.300872802734375, -1.2550048828125, -1.209136962890625, -1.16326904296875, -1.117401123046875, -1.071533203125, -1.025665283203125, -0.97979736328125, -0.933929443359375, -0.8880615234375, -0.842193603515625, -0.79632568359375, -0.750457763671875, -0.70458984375, -0.658721923828125, -0.61285400390625, -0.566986083984375, -0.5211181640625, -0.475250244140625, -0.42938232421875, -0.383514404296875, -0.337646484375, -0.291778564453125, -0.24591064453125, -0.200042724609375, -0.1541748046875, -0.108306884765625, -0.06243896484375, -0.016571044921875, 0.029296875, 0.075164794921875, 0.12103271484375, 0.166900634765625, 0.2127685546875, 0.258636474609375, 0.30450439453125, 0.350372314453125, 0.396240234375, 0.442108154296875, 0.48797607421875, 0.533843994140625, 0.5797119140625, 0.625579833984375, 0.67144775390625, 0.717315673828125, 0.76318359375, 0.809051513671875, 0.85491943359375, 0.900787353515625, 0.9466552734375, 0.992523193359375, 1.03839111328125, 1.084259033203125, 1.130126953125, 1.175994873046875, 1.22186279296875, 1.267730712890625, 1.3135986328125, 1.359466552734375, 1.40533447265625, 1.451202392578125, 1.4970703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 11.0, 11.0, 12.0, 21.0, 25.0, 24.0, 38.0, 54.0, 59.0, 65.0, 75.0, 74.0, 81.0, 89.0, 61.0, 57.0, 48.0, 42.0, 20.0, 25.0, 28.0, 14.0, 15.0, 8.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00310516357421875, -0.0029949545860290527, -0.0028847455978393555, -0.002774536609649658, -0.002664327621459961, -0.0025541186332702637, -0.0024439096450805664, -0.002333700656890869, -0.002223491668701172, -0.0021132826805114746, -0.0020030736923217773, -0.00189286470413208, -0.0017826557159423828, -0.0016724467277526855, -0.0015622377395629883, -0.001452028751373291, -0.0013418197631835938, -0.0012316107749938965, -0.0011214017868041992, -0.001011192798614502, -0.0009009838104248047, -0.0007907748222351074, -0.0006805658340454102, -0.0005703568458557129, -0.0004601478576660156, -0.00034993886947631836, -0.0002397298812866211, -0.00012952089309692383, -1.9311904907226562e-05, 9.08970832824707e-05, 0.00020110607147216797, 0.00031131505966186523, 0.0004215240478515625, 0.0005317330360412598, 0.000641942024230957, 0.0007521510124206543, 0.0008623600006103516, 0.0009725689888000488, 0.001082777976989746, 0.0011929869651794434, 0.0013031959533691406, 0.0014134049415588379, 0.0015236139297485352, 0.0016338229179382324, 0.0017440319061279297, 0.001854240894317627, 0.0019644498825073242, 0.0020746588706970215, 0.0021848678588867188, 0.002295076847076416, 0.0024052858352661133, 0.0025154948234558105, 0.002625703811645508, 0.002735912799835205, 0.0028461217880249023, 0.0029563307762145996, 0.003066539764404297, 0.003176748752593994, 0.0032869577407836914, 0.0033971667289733887, 0.003507375717163086, 0.003617584705352783, 0.0037277936935424805, 0.0038380026817321777, 0.003948211669921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 9.0, 9.0, 15.0, 17.0, 29.0, 19.0, 36.0, 79.0, 101.0, 173.0, 417.0, 2185.0, 1042543.0, 1967.0, 415.0, 189.0, 98.0, 60.0, 54.0, 33.0, 28.0, 23.0, 13.0, 5.0, 4.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10467529296875, -0.10172557830810547, -0.09877586364746094, -0.0958261489868164, -0.09287643432617188, -0.08992671966552734, -0.08697700500488281, -0.08402729034423828, -0.08107757568359375, -0.07812786102294922, -0.07517814636230469, -0.07222843170166016, -0.06927871704101562, -0.0663290023803711, -0.06337928771972656, -0.06042957305908203, -0.0574798583984375, -0.05453014373779297, -0.05158042907714844, -0.048630714416503906, -0.045680999755859375, -0.042731285095214844, -0.03978157043457031, -0.03683185577392578, -0.03388214111328125, -0.03093242645263672, -0.027982711791992188, -0.025032997131347656, -0.022083282470703125, -0.019133567810058594, -0.016183853149414062, -0.013234138488769531, -0.010284423828125, -0.007334709167480469, -0.0043849945068359375, -0.0014352798461914062, 0.001514434814453125, 0.004464149475097656, 0.0074138641357421875, 0.010363578796386719, 0.01331329345703125, 0.01626300811767578, 0.019212722778320312, 0.022162437438964844, 0.025112152099609375, 0.028061866760253906, 0.031011581420898438, 0.03396129608154297, 0.0369110107421875, 0.03986072540283203, 0.04281044006347656, 0.045760154724121094, 0.048709869384765625, 0.051659584045410156, 0.05460929870605469, 0.05755901336669922, 0.06050872802734375, 0.06345844268798828, 0.06640815734863281, 0.06935787200927734, 0.07230758666992188, 0.0752573013305664, 0.07820701599121094, 0.08115673065185547, 0.0841064453125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 20.0, 267.0, 618.0, 102.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018993988633155823, -0.0016395584680140018, -0.0013797181891277432, -0.0011198779102414846, -0.0008600375149399042, -0.0006001971196383238, -0.0003403568407520652, -8.051656186580658e-05, 0.00017932383343577385, 0.00043916417052969337, 0.0006990045076236129, 0.0009588448447175324, 0.001218685181811452, 0.0014785255771130323, 0.001738365855999291, 0.0019982061348855495, 0.00225804653018713, 0.0025178869254887104, 0.002777727320790291, 0.0030375674832612276, 0.003297407878562808, 0.0035572482738643885, 0.0038170884363353252, 0.004076928831636906, 0.004336769226938486, 0.0045966096222400665, 0.004856450017541647, 0.005116290412843227, 0.0053761303424835205, 0.005635971203446388, 0.005895811133086681, 0.006155651528388262, 0.006415490992367268, 0.006675331387668848, 0.0069351717829704285, 0.007195012178272009, 0.007454852573573589, 0.0077146925032138824, 0.00797453336417675, 0.008234373293817043, 0.008494213223457336, 0.00875405315309763, 0.009013894014060497, 0.00927373394370079, 0.009533574804663658, 0.009793414734303951, 0.010053255595266819, 0.010313095524907112, 0.01057293638586998, 0.010832776315510273, 0.01109261717647314, 0.011352457106113434, 0.011612297967076302, 0.011872137896716595, 0.012131978757679462, 0.012391818687319756, 0.012651659548282623, 0.012911499477922916, 0.013171340338885784, 0.013431180268526077, 0.013691021129488945, 0.013950861059129238, 0.014210701920092106, 0.014470541849732399, 0.014730381779372692]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 5.0, 8.0, 8.0, 9.0, 13.0, 16.0, 13.0, 11.0, 23.0, 24.0, 28.0, 26.0, 30.0, 30.0, 31.0, 42.0, 44.0, 45.0, 33.0, 49.0, 32.0, 37.0, 40.0, 40.0, 33.0, 32.0, 27.0, 29.0, 32.0, 28.0, 26.0, 21.0, 17.0, 18.0, 18.0, 12.0, 8.0, 3.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.001431882381439209, -0.0013854308053851128, -0.0013389792293310165, -0.0012925276532769203, -0.001246076077222824, -0.0011996245011687279, -0.0011531729251146317, -0.0011067213490605354, -0.0010602697730064392, -0.001013818196952343, -0.0009673666208982468, -0.0009209150448441505, -0.0008744634687900543, -0.0008280118927359581, -0.0007815603166818619, -0.0007351087406277657, -0.0006886571645736694, -0.0006422055885195732, -0.000595754012465477, -0.0005493024364113808, -0.0005028508603572845, -0.0004563992843031883, -0.0004099477082490921, -0.0003634961321949959, -0.00031704455614089966, -0.00027059298008680344, -0.00022414140403270721, -0.000177689827978611, -0.00013123825192451477, -8.478667587041855e-05, -3.833509981632233e-05, 8.116476237773895e-06, 5.456805229187012e-05, 0.00010101962834596634, 0.00014747120440006256, 0.00019392278045415878, 0.000240374356508255, 0.0002868259325623512, 0.00033327750861644745, 0.00037972908467054367, 0.0004261806607246399, 0.0004726322367787361, 0.0005190838128328323, 0.0005655353888869286, 0.0006119869649410248, 0.000658438540995121, 0.0007048901170492172, 0.0007513416931033134, 0.0007977932691574097, 0.0008442448452115059, 0.0008906964212656021, 0.0009371479973196983, 0.0009835995733737946, 0.0010300511494278908, 0.001076502725481987, 0.0011229543015360832, 0.0011694058775901794, 0.0012158574536442757, 0.0012623090296983719, 0.0013087606057524681, 0.0013552121818065643, 0.0014016637578606606, 0.0014481153339147568, 0.001494566909968853, 0.0015410184860229492]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 6.0, 8.0, 16.0, 19.0, 16.0, 18.0, 20.0, 12.0, 30.0, 21.0, 38.0, 34.0, 48.0, 25.0, 50.0, 48.0, 32.0, 52.0, 46.0, 49.0, 43.0, 42.0, 51.0, 36.0, 30.0, 27.0, 26.0, 28.0, 19.0, 20.0, 19.0, 11.0, 11.0, 6.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.640625, -14.14990234375, -13.6591796875, -13.16845703125, -12.677734375, -12.18701171875, -11.6962890625, -11.20556640625, -10.71484375, -10.22412109375, -9.7333984375, -9.24267578125, -8.751953125, -8.26123046875, -7.7705078125, -7.27978515625, -6.7890625, -6.29833984375, -5.8076171875, -5.31689453125, -4.826171875, -4.33544921875, -3.8447265625, -3.35400390625, -2.86328125, -2.37255859375, -1.8818359375, -1.39111328125, -0.900390625, -0.40966796875, 0.0810546875, 0.57177734375, 1.0625, 1.55322265625, 2.0439453125, 2.53466796875, 3.025390625, 3.51611328125, 4.0068359375, 4.49755859375, 4.98828125, 5.47900390625, 5.9697265625, 6.46044921875, 6.951171875, 7.44189453125, 7.9326171875, 8.42333984375, 8.9140625, 9.40478515625, 9.8955078125, 10.38623046875, 10.876953125, 11.36767578125, 11.8583984375, 12.34912109375, 12.83984375, 13.33056640625, 13.8212890625, 14.31201171875, 14.802734375, 15.29345703125, 15.7841796875, 16.27490234375, 16.765625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 15.0, 15.0, 23.0, 20.0, 34.0, 38.0, 37.0, 76.0, 68.0, 159.0, 200.0, 347.0, 653.0, 1910.0, 10639.0, 82681.0, 713854.0, 208948.0, 23166.0, 3507.0, 913.0, 415.0, 243.0, 167.0, 95.0, 83.0, 55.0, 39.0, 33.0, 25.0, 16.0, 13.0, 8.0, 8.0, 13.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.296875, -27.343994140625, -26.39111328125, -25.438232421875, -24.4853515625, -23.532470703125, -22.57958984375, -21.626708984375, -20.673828125, -19.720947265625, -18.76806640625, -17.815185546875, -16.8623046875, -15.909423828125, -14.95654296875, -14.003662109375, -13.05078125, -12.097900390625, -11.14501953125, -10.192138671875, -9.2392578125, -8.286376953125, -7.33349609375, -6.380615234375, -5.427734375, -4.474853515625, -3.52197265625, -2.569091796875, -1.6162109375, -0.663330078125, 0.28955078125, 1.242431640625, 2.1953125, 3.148193359375, 4.10107421875, 5.053955078125, 6.0068359375, 6.959716796875, 7.91259765625, 8.865478515625, 9.818359375, 10.771240234375, 11.72412109375, 12.677001953125, 13.6298828125, 14.582763671875, 15.53564453125, 16.488525390625, 17.44140625, 18.394287109375, 19.34716796875, 20.300048828125, 21.2529296875, 22.205810546875, 23.15869140625, 24.111572265625, 25.064453125, 26.017333984375, 26.97021484375, 27.923095703125, 28.8759765625, 29.828857421875, 30.78173828125, 31.734619140625, 32.6875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 5.0, 11.0, 8.0, 12.0, 14.0, 11.0, 19.0, 20.0, 18.0, 40.0, 36.0, 45.0, 36.0, 58.0, 59.0, 73.0, 140.0, 1484.0, 419.0, 109.0, 58.0, 48.0, 34.0, 40.0, 20.0, 33.0, 30.0, 31.0, 24.0, 18.0, 28.0, 14.0, 9.0, 4.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.71875, -47.14599609375, -45.5732421875, -44.00048828125, -42.427734375, -40.85498046875, -39.2822265625, -37.70947265625, -36.13671875, -34.56396484375, -32.9912109375, -31.41845703125, -29.845703125, -28.27294921875, -26.7001953125, -25.12744140625, -23.5546875, -21.98193359375, -20.4091796875, -18.83642578125, -17.263671875, -15.69091796875, -14.1181640625, -12.54541015625, -10.97265625, -9.39990234375, -7.8271484375, -6.25439453125, -4.681640625, -3.10888671875, -1.5361328125, 0.03662109375, 1.609375, 3.18212890625, 4.7548828125, 6.32763671875, 7.900390625, 9.47314453125, 11.0458984375, 12.61865234375, 14.19140625, 15.76416015625, 17.3369140625, 18.90966796875, 20.482421875, 22.05517578125, 23.6279296875, 25.20068359375, 26.7734375, 28.34619140625, 29.9189453125, 31.49169921875, 33.064453125, 34.63720703125, 36.2099609375, 37.78271484375, 39.35546875, 40.92822265625, 42.5009765625, 44.07373046875, 45.646484375, 47.21923828125, 48.7919921875, 50.36474609375, 51.9375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 12.0, 8.0, 7.0, 26.0, 26.0, 43.0, 57.0, 53.0, 60.0, 103.0, 131.0, 278.0, 613.0, 3430.0, 1991797.0, 1144329.0, 3171.0, 671.0, 262.0, 170.0, 107.0, 90.0, 62.0, 46.0, 24.0, 22.0, 16.0, 20.0, 6.0, 12.0, 7.0, 7.0, 2.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-140.25, -136.123046875, -131.99609375, -127.869140625, -123.7421875, -119.615234375, -115.48828125, -111.361328125, -107.234375, -103.107421875, -98.98046875, -94.853515625, -90.7265625, -86.599609375, -82.47265625, -78.345703125, -74.21875, -70.091796875, -65.96484375, -61.837890625, -57.7109375, -53.583984375, -49.45703125, -45.330078125, -41.203125, -37.076171875, -32.94921875, -28.822265625, -24.6953125, -20.568359375, -16.44140625, -12.314453125, -8.1875, -4.060546875, 0.06640625, 4.193359375, 8.3203125, 12.447265625, 16.57421875, 20.701171875, 24.828125, 28.955078125, 33.08203125, 37.208984375, 41.3359375, 45.462890625, 49.58984375, 53.716796875, 57.84375, 61.970703125, 66.09765625, 70.224609375, 74.3515625, 78.478515625, 82.60546875, 86.732421875, 90.859375, 94.986328125, 99.11328125, 103.240234375, 107.3671875, 111.494140625, 115.62109375, 119.748046875, 123.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 419.0, 574.0, 19.0], "bins": [-936.6903076171875, -921.5911865234375, -906.4920654296875, -891.3929443359375, -876.2937622070312, -861.1946411132812, -846.0955200195312, -830.9963989257812, -815.8972778320312, -800.7981567382812, -785.6990356445312, -770.599853515625, -755.500732421875, -740.401611328125, -725.302490234375, -710.203369140625, -695.104248046875, -680.005126953125, -664.906005859375, -649.806884765625, -634.7077026367188, -619.6085815429688, -604.5094604492188, -589.4103393554688, -574.3111572265625, -559.2120361328125, -544.1129150390625, -529.0137939453125, -513.9146118164062, -498.81549072265625, -483.71636962890625, -468.61724853515625, -453.51812744140625, -438.41900634765625, -423.3198547363281, -408.2207336425781, -393.1216125488281, -378.0224609375, -362.92333984375, -347.82421875, -332.7250671386719, -317.6259460449219, -302.52679443359375, -287.42767333984375, -272.32855224609375, -257.22943115234375, -242.13027954101562, -227.03115844726562, -211.93203735351562, -196.83290100097656, -181.73377990722656, -166.6346435546875, -151.5355224609375, -136.43638610839844, -121.33724975585938, -106.23812103271484, -91.13898468017578, -76.03985595703125, -60.94072341918945, -45.841590881347656, -30.742462158203125, -15.643333435058594, -0.5441970825195312, 14.554931640625, 29.6540584564209]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 11.0, 10.0, 5.0, 9.0, 14.0, 25.0, 19.0, 25.0, 21.0, 18.0, 24.0, 33.0, 33.0, 39.0, 36.0, 38.0, 46.0, 47.0, 42.0, 47.0, 54.0, 33.0, 32.0, 39.0, 40.0, 32.0, 21.0, 22.0, 30.0, 27.0, 19.0, 18.0, 15.0, 5.0, 11.0, 14.0, 8.0, 5.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.52316284179688, -109.79229736328125, -106.0614242553711, -102.33055877685547, -98.59968566894531, -94.86882019042969, -91.13795471191406, -87.40708923339844, -83.67621612548828, -79.94535064697266, -76.2144775390625, -72.48361206054688, -68.75274658203125, -65.0218734741211, -61.29100799560547, -57.56013870239258, -53.82926940917969, -50.0984001159668, -46.367530822753906, -42.63666534423828, -38.90579605102539, -35.1749267578125, -31.444059371948242, -27.713191986083984, -23.982322692871094, -20.251453399658203, -16.520586013793945, -12.789717674255371, -9.058849334716797, -5.327980041503906, -1.5971126556396484, 2.1337547302246094, 5.8646240234375, 9.595492362976074, 13.326360702514648, 17.057228088378906, 20.788097381591797, 24.518966674804688, 28.249834060668945, 31.980701446533203, 35.711570739746094, 39.442440032958984, 43.173309326171875, 46.9041748046875, 50.63504409790039, 54.36591339111328, 58.096778869628906, 61.8276481628418, 65.55851745605469, 69.28938293457031, 73.02025604248047, 76.7511215209961, 80.48199462890625, 84.21286010742188, 87.9437255859375, 91.67459106445312, 95.40546417236328, 99.1363296508789, 102.86720275878906, 106.59806823730469, 110.32893371582031, 114.05980682373047, 117.7906723022461, 121.52154541015625, 125.25241088867188]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 10.0, 3.0, 8.0, 8.0, 14.0, 16.0, 18.0, 14.0, 20.0, 20.0, 21.0, 27.0, 25.0, 39.0, 34.0, 32.0, 49.0, 51.0, 36.0, 39.0, 34.0, 47.0, 43.0, 44.0, 39.0, 32.0, 33.0, 22.0, 31.0, 32.0, 20.0, 14.0, 17.0, 14.0, 19.0, 19.0, 10.0, 7.0, 13.0, 7.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.046875, -14.579833984375, -14.11279296875, -13.645751953125, -13.1787109375, -12.711669921875, -12.24462890625, -11.777587890625, -11.310546875, -10.843505859375, -10.37646484375, -9.909423828125, -9.4423828125, -8.975341796875, -8.50830078125, -8.041259765625, -7.57421875, -7.107177734375, -6.64013671875, -6.173095703125, -5.7060546875, -5.239013671875, -4.77197265625, -4.304931640625, -3.837890625, -3.370849609375, -2.90380859375, -2.436767578125, -1.9697265625, -1.502685546875, -1.03564453125, -0.568603515625, -0.1015625, 0.365478515625, 0.83251953125, 1.299560546875, 1.7666015625, 2.233642578125, 2.70068359375, 3.167724609375, 3.634765625, 4.101806640625, 4.56884765625, 5.035888671875, 5.5029296875, 5.969970703125, 6.43701171875, 6.904052734375, 7.37109375, 7.838134765625, 8.30517578125, 8.772216796875, 9.2392578125, 9.706298828125, 10.17333984375, 10.640380859375, 11.107421875, 11.574462890625, 12.04150390625, 12.508544921875, 12.9755859375, 13.442626953125, 13.90966796875, 14.376708984375, 14.84375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 7.0, 9.0, 9.0, 8.0, 13.0, 9.0, 17.0, 18.0, 31.0, 27.0, 34.0, 50.0, 50.0, 84.0, 111.0, 165.0, 279.0, 505.0, 1383.0, 7863.0, 163736.0, 2728247.0, 1243195.0, 42947.0, 3503.0, 800.0, 359.0, 207.0, 152.0, 95.0, 86.0, 48.0, 39.0, 27.0, 28.0, 29.0, 25.0, 18.0, 5.0, 12.0, 13.0, 12.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.125, -36.845703125, -35.56640625, -34.287109375, -33.0078125, -31.728515625, -30.44921875, -29.169921875, -27.890625, -26.611328125, -25.33203125, -24.052734375, -22.7734375, -21.494140625, -20.21484375, -18.935546875, -17.65625, -16.376953125, -15.09765625, -13.818359375, -12.5390625, -11.259765625, -9.98046875, -8.701171875, -7.421875, -6.142578125, -4.86328125, -3.583984375, -2.3046875, -1.025390625, 0.25390625, 1.533203125, 2.8125, 4.091796875, 5.37109375, 6.650390625, 7.9296875, 9.208984375, 10.48828125, 11.767578125, 13.046875, 14.326171875, 15.60546875, 16.884765625, 18.1640625, 19.443359375, 20.72265625, 22.001953125, 23.28125, 24.560546875, 25.83984375, 27.119140625, 28.3984375, 29.677734375, 30.95703125, 32.236328125, 33.515625, 34.794921875, 36.07421875, 37.353515625, 38.6328125, 39.912109375, 41.19140625, 42.470703125, 43.75]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 8.0, 12.0, 33.0, 32.0, 41.0, 61.0, 98.0, 143.0, 187.0, 287.0, 416.0, 578.0, 628.0, 499.0, 342.0, 242.0, 165.0, 103.0, 60.0, 38.0, 32.0, 19.0, 9.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.625, -34.64013671875, -33.6552734375, -32.67041015625, -31.685546875, -30.70068359375, -29.7158203125, -28.73095703125, -27.74609375, -26.76123046875, -25.7763671875, -24.79150390625, -23.806640625, -22.82177734375, -21.8369140625, -20.85205078125, -19.8671875, -18.88232421875, -17.8974609375, -16.91259765625, -15.927734375, -14.94287109375, -13.9580078125, -12.97314453125, -11.98828125, -11.00341796875, -10.0185546875, -9.03369140625, -8.048828125, -7.06396484375, -6.0791015625, -5.09423828125, -4.109375, -3.12451171875, -2.1396484375, -1.15478515625, -0.169921875, 0.81494140625, 1.7998046875, 2.78466796875, 3.76953125, 4.75439453125, 5.7392578125, 6.72412109375, 7.708984375, 8.69384765625, 9.6787109375, 10.66357421875, 11.6484375, 12.63330078125, 13.6181640625, 14.60302734375, 15.587890625, 16.57275390625, 17.5576171875, 18.54248046875, 19.52734375, 20.51220703125, 21.4970703125, 22.48193359375, 23.466796875, 24.45166015625, 25.4365234375, 26.42138671875, 27.40625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 7.0, 12.0, 13.0, 14.0, 20.0, 22.0, 26.0, 48.0, 43.0, 72.0, 109.0, 125.0, 213.0, 315.0, 657.0, 2239.0, 58287.0, 4067723.0, 60332.0, 2269.0, 609.0, 303.0, 183.0, 163.0, 108.0, 77.0, 68.0, 43.0, 37.0, 36.0, 26.0, 26.0, 11.0, 11.0, 5.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-107.4375, -104.02734375, -100.6171875, -97.20703125, -93.796875, -90.38671875, -86.9765625, -83.56640625, -80.15625, -76.74609375, -73.3359375, -69.92578125, -66.515625, -63.10546875, -59.6953125, -56.28515625, -52.875, -49.46484375, -46.0546875, -42.64453125, -39.234375, -35.82421875, -32.4140625, -29.00390625, -25.59375, -22.18359375, -18.7734375, -15.36328125, -11.953125, -8.54296875, -5.1328125, -1.72265625, 1.6875, 5.09765625, 8.5078125, 11.91796875, 15.328125, 18.73828125, 22.1484375, 25.55859375, 28.96875, 32.37890625, 35.7890625, 39.19921875, 42.609375, 46.01953125, 49.4296875, 52.83984375, 56.25, 59.66015625, 63.0703125, 66.48046875, 69.890625, 73.30078125, 76.7109375, 80.12109375, 83.53125, 86.94140625, 90.3515625, 93.76171875, 97.171875, 100.58203125, 103.9921875, 107.40234375, 110.8125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 26.0, 462.0, 500.0, 28.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-705.7628173828125, -687.2308959960938, -668.698974609375, -650.1670532226562, -631.6351318359375, -613.1032104492188, -594.5712890625, -576.039306640625, -557.5074462890625, -538.9755249023438, -520.443603515625, -501.91168212890625, -483.3797607421875, -464.84783935546875, -446.3158874511719, -427.7839660644531, -409.25201416015625, -390.7200927734375, -372.18817138671875, -353.65625, -335.12432861328125, -316.5924072265625, -298.0604553222656, -279.5285339355469, -260.9966125488281, -242.46469116210938, -223.93276977539062, -205.4008331298828, -186.86891174316406, -168.3369903564453, -149.8050537109375, -131.27313232421875, -112.74114990234375, -94.209228515625, -75.67729949951172, -57.1453742980957, -38.61344909667969, -20.081527709960938, -1.5495986938476562, 16.982330322265625, 35.514251708984375, 54.04617691040039, 72.5781021118164, 91.11003112792969, 109.64195251464844, 128.1738739013672, 146.705810546875, 165.23773193359375, 183.7696533203125, 202.30157470703125, 220.83349609375, 239.3654327392578, 257.8973388671875, 276.42926025390625, 294.9612121582031, 313.4931335449219, 332.0250549316406, 350.5569763183594, 369.0888977050781, 387.6208190917969, 406.15277099609375, 424.6846923828125, 443.21661376953125, 461.74853515625, 480.28045654296875]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 4.0, 9.0, 11.0, 6.0, 20.0, 13.0, 13.0, 21.0, 21.0, 20.0, 20.0, 32.0, 26.0, 24.0, 42.0, 43.0, 39.0, 42.0, 41.0, 40.0, 34.0, 39.0, 43.0, 33.0, 39.0, 34.0, 30.0, 41.0, 29.0, 17.0, 26.0, 32.0, 11.0, 18.0, 18.0, 16.0, 9.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-85.25485229492188, -82.76126861572266, -80.26768493652344, -77.77409362792969, -75.28050994873047, -72.78692626953125, -70.29334259033203, -67.79975891113281, -65.30616760253906, -62.812583923339844, -60.31899642944336, -57.82541275024414, -55.331825256347656, -52.83824157714844, -50.34465789794922, -47.85107421875, -45.35749053955078, -42.86390686035156, -40.37031936645508, -37.87673568725586, -35.383148193359375, -32.889564514160156, -30.395980834960938, -27.902395248413086, -25.408809661865234, -22.915224075317383, -20.42163848876953, -17.928054809570312, -15.434469223022461, -12.94088363647461, -10.447299003601074, -7.953714370727539, -5.4601287841796875, -2.966543674468994, -0.4729585647583008, 2.0206265449523926, 4.514211654663086, 7.0077972412109375, 9.501381874084473, 11.994966506958008, 14.48855209350586, 16.98213768005371, 19.475723266601562, 21.96930694580078, 24.462892532348633, 26.956478118896484, 29.450061798095703, 31.943647384643555, 34.437232971191406, 36.930816650390625, 39.42440414428711, 41.91798782348633, 44.41157531738281, 46.90515899658203, 49.39874267578125, 51.89232635498047, 54.38591384887695, 56.87949752807617, 59.373085021972656, 61.866668701171875, 64.3602523803711, 66.85383605957031, 69.34742736816406, 71.84101104736328, 74.3345947265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 6.0, 9.0, 14.0, 12.0, 19.0, 18.0, 16.0, 18.0, 28.0, 22.0, 31.0, 41.0, 39.0, 48.0, 60.0, 51.0, 43.0, 45.0, 47.0, 50.0, 42.0, 53.0, 37.0, 29.0, 40.0, 26.0, 27.0, 20.0, 21.0, 16.0, 18.0, 12.0, 13.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.95458984375, -16.3935546875, -15.83251953125, -15.271484375, -14.71044921875, -14.1494140625, -13.58837890625, -13.02734375, -12.46630859375, -11.9052734375, -11.34423828125, -10.783203125, -10.22216796875, -9.6611328125, -9.10009765625, -8.5390625, -7.97802734375, -7.4169921875, -6.85595703125, -6.294921875, -5.73388671875, -5.1728515625, -4.61181640625, -4.05078125, -3.48974609375, -2.9287109375, -2.36767578125, -1.806640625, -1.24560546875, -0.6845703125, -0.12353515625, 0.4375, 0.99853515625, 1.5595703125, 2.12060546875, 2.681640625, 3.24267578125, 3.8037109375, 4.36474609375, 4.92578125, 5.48681640625, 6.0478515625, 6.60888671875, 7.169921875, 7.73095703125, 8.2919921875, 8.85302734375, 9.4140625, 9.97509765625, 10.5361328125, 11.09716796875, 11.658203125, 12.21923828125, 12.7802734375, 13.34130859375, 13.90234375, 14.46337890625, 15.0244140625, 15.58544921875, 16.146484375, 16.70751953125, 17.2685546875, 17.82958984375, 18.390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 12.0, 14.0, 12.0, 26.0, 29.0, 51.0, 90.0, 138.0, 218.0, 374.0, 590.0, 982.0, 1610.0, 2680.0, 4675.0, 7759.0, 13201.0, 22280.0, 38258.0, 65577.0, 116072.0, 203380.0, 235035.0, 142815.0, 80378.0, 46038.0, 27056.0, 15873.0, 9286.0, 5607.0, 3366.0, 2003.0, 1238.0, 700.0, 443.0, 257.0, 183.0, 102.0, 58.0, 33.0, 30.0, 11.0, 10.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.9510955810546875, -1.888519287109375, -1.8259429931640625, -1.76336669921875, -1.7007904052734375, -1.638214111328125, -1.5756378173828125, -1.5130615234375, -1.4504852294921875, -1.387908935546875, -1.3253326416015625, -1.26275634765625, -1.2001800537109375, -1.137603759765625, -1.0750274658203125, -1.012451171875, -0.9498748779296875, -0.887298583984375, -0.8247222900390625, -0.76214599609375, -0.6995697021484375, -0.636993408203125, -0.5744171142578125, -0.5118408203125, -0.4492645263671875, -0.386688232421875, -0.3241119384765625, -0.26153564453125, -0.1989593505859375, -0.136383056640625, -0.0738067626953125, -0.01123046875, 0.0513458251953125, 0.113922119140625, 0.1764984130859375, 0.23907470703125, 0.3016510009765625, 0.364227294921875, 0.4268035888671875, 0.4893798828125, 0.5519561767578125, 0.614532470703125, 0.6771087646484375, 0.73968505859375, 0.8022613525390625, 0.864837646484375, 0.9274139404296875, 0.989990234375, 1.0525665283203125, 1.115142822265625, 1.1777191162109375, 1.24029541015625, 1.3028717041015625, 1.365447998046875, 1.4280242919921875, 1.4906005859375, 1.5531768798828125, 1.615753173828125, 1.6783294677734375, 1.74090576171875, 1.8034820556640625, 1.866058349609375, 1.9286346435546875, 1.9912109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 8.0, 5.0, 9.0, 14.0, 17.0, 22.0, 19.0, 27.0, 30.0, 29.0, 42.0, 41.0, 39.0, 49.0, 49.0, 42.0, 56.0, 1073.0, 45.0, 37.0, 38.0, 46.0, 38.0, 32.0, 24.0, 25.0, 23.0, 30.0, 24.0, 26.0, 16.0, 10.0, 6.0, 6.0, 6.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6953125, -10.3193359375, -9.943359375, -9.5673828125, -9.19140625, -8.8154296875, -8.439453125, -8.0634765625, -7.6875, -7.3115234375, -6.935546875, -6.5595703125, -6.18359375, -5.8076171875, -5.431640625, -5.0556640625, -4.6796875, -4.3037109375, -3.927734375, -3.5517578125, -3.17578125, -2.7998046875, -2.423828125, -2.0478515625, -1.671875, -1.2958984375, -0.919921875, -0.5439453125, -0.16796875, 0.2080078125, 0.583984375, 0.9599609375, 1.3359375, 1.7119140625, 2.087890625, 2.4638671875, 2.83984375, 3.2158203125, 3.591796875, 3.9677734375, 4.34375, 4.7197265625, 5.095703125, 5.4716796875, 5.84765625, 6.2236328125, 6.599609375, 6.9755859375, 7.3515625, 7.7275390625, 8.103515625, 8.4794921875, 8.85546875, 9.2314453125, 9.607421875, 9.9833984375, 10.359375, 10.7353515625, 11.111328125, 11.4873046875, 11.86328125, 12.2392578125, 12.615234375, 12.9912109375, 13.3671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 9.0, 4.0, 11.0, 24.0, 25.0, 34.0, 67.0, 106.0, 157.0, 288.0, 460.0, 742.0, 1250.0, 2003.0, 3390.0, 5574.0, 9516.0, 16154.0, 27514.0, 47523.0, 83003.0, 146358.0, 1287623.0, 197822.0, 112953.0, 64167.0, 37146.0, 21821.0, 12541.0, 7502.0, 4434.0, 2698.0, 1663.0, 964.0, 612.0, 368.0, 224.0, 148.0, 93.0, 57.0, 34.0, 24.0, 13.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.9882049560546875, -1.925628662109375, -1.8630523681640625, -1.80047607421875, -1.7378997802734375, -1.675323486328125, -1.6127471923828125, -1.5501708984375, -1.4875946044921875, -1.425018310546875, -1.3624420166015625, -1.29986572265625, -1.2372894287109375, -1.174713134765625, -1.1121368408203125, -1.049560546875, -0.9869842529296875, -0.924407958984375, -0.8618316650390625, -0.79925537109375, -0.7366790771484375, -0.674102783203125, -0.6115264892578125, -0.5489501953125, -0.4863739013671875, -0.423797607421875, -0.3612213134765625, -0.29864501953125, -0.2360687255859375, -0.173492431640625, -0.1109161376953125, -0.04833984375, 0.0142364501953125, 0.076812744140625, 0.1393890380859375, 0.20196533203125, 0.2645416259765625, 0.327117919921875, 0.3896942138671875, 0.4522705078125, 0.5148468017578125, 0.577423095703125, 0.6399993896484375, 0.70257568359375, 0.7651519775390625, 0.827728271484375, 0.8903045654296875, 0.952880859375, 1.0154571533203125, 1.078033447265625, 1.1406097412109375, 1.20318603515625, 1.2657623291015625, 1.328338623046875, 1.3909149169921875, 1.4534912109375, 1.5160675048828125, 1.578643798828125, 1.6412200927734375, 1.70379638671875, 1.7663726806640625, 1.828948974609375, 1.8915252685546875, 1.9541015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 11.0, 17.0, 14.0, 23.0, 27.0, 39.0, 37.0, 43.0, 78.0, 63.0, 87.0, 86.0, 66.0, 80.0, 52.0, 57.0, 44.0, 26.0, 37.0, 19.0, 11.0, 13.0, 12.0, 9.0, 6.0, 11.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003604888916015625, -0.0034918487071990967, -0.0033788084983825684, -0.00326576828956604, -0.0031527280807495117, -0.0030396878719329834, -0.002926647663116455, -0.0028136074542999268, -0.0027005672454833984, -0.00258752703666687, -0.002474486827850342, -0.0023614466190338135, -0.002248406410217285, -0.002135366201400757, -0.0020223259925842285, -0.0019092857837677002, -0.0017962455749511719, -0.0016832053661346436, -0.0015701651573181152, -0.001457124948501587, -0.0013440847396850586, -0.0012310445308685303, -0.001118004322052002, -0.0010049641132354736, -0.0008919239044189453, -0.000778883695602417, -0.0006658434867858887, -0.0005528032779693604, -0.00043976306915283203, -0.0003267228603363037, -0.0002136826515197754, -0.00010064244270324707, 1.239776611328125e-05, 0.00012543797492980957, 0.0002384781837463379, 0.0003515183925628662, 0.00046455860137939453, 0.0005775988101959229, 0.0006906390190124512, 0.0008036792278289795, 0.0009167194366455078, 0.0010297596454620361, 0.0011427998542785645, 0.0012558400630950928, 0.001368880271911621, 0.0014819204807281494, 0.0015949606895446777, 0.001708000898361206, 0.0018210411071777344, 0.0019340813159942627, 0.002047121524810791, 0.0021601617336273193, 0.0022732019424438477, 0.002386242151260376, 0.0024992823600769043, 0.0026123225688934326, 0.002725362777709961, 0.0028384029865264893, 0.0029514431953430176, 0.003064483404159546, 0.0031775236129760742, 0.0032905638217926025, 0.003403604030609131, 0.003516644239425659, 0.0036296844482421875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 5.0, 2.0, 7.0, 8.0, 11.0, 9.0, 14.0, 17.0, 27.0, 42.0, 68.0, 58.0, 88.0, 129.0, 321.0, 762.0, 64108.0, 980605.0, 1221.0, 389.0, 203.0, 121.0, 89.0, 66.0, 40.0, 30.0, 24.0, 18.0, 19.0, 11.0, 9.0, 3.0, 0.0, 1.0, 6.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.07977294921875, -0.07729148864746094, -0.07481002807617188, -0.07232856750488281, -0.06984710693359375, -0.06736564636230469, -0.06488418579101562, -0.06240272521972656, -0.0599212646484375, -0.05743980407714844, -0.054958343505859375, -0.05247688293457031, -0.04999542236328125, -0.04751396179199219, -0.045032501220703125, -0.04255104064941406, -0.040069580078125, -0.03758811950683594, -0.035106658935546875, -0.03262519836425781, -0.03014373779296875, -0.027662277221679688, -0.025180816650390625, -0.022699356079101562, -0.0202178955078125, -0.017736434936523438, -0.015254974365234375, -0.012773513793945312, -0.01029205322265625, -0.0078105926513671875, -0.005329132080078125, -0.0028476715087890625, -0.0003662109375, 0.0021152496337890625, 0.004596710205078125, 0.0070781707763671875, 0.00955963134765625, 0.012041091918945312, 0.014522552490234375, 0.017004013061523438, 0.0194854736328125, 0.021966934204101562, 0.024448394775390625, 0.026929855346679688, 0.02941131591796875, 0.03189277648925781, 0.034374237060546875, 0.03685569763183594, 0.039337158203125, 0.04181861877441406, 0.044300079345703125, 0.04678153991699219, 0.04926300048828125, 0.05174446105957031, 0.054225921630859375, 0.05670738220214844, 0.0591888427734375, 0.06167030334472656, 0.06415176391601562, 0.06663322448730469, 0.06911468505859375, 0.07159614562988281, 0.07407760620117188, 0.07655906677246094, 0.07904052734375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 24.0, 99.0, 311.0, 391.0, 154.0, 23.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007985332980751991, -0.00782609824091196, -0.007666863966733217, -0.007507629226893187, -0.007348394487053156, -0.0071891602128744125, -0.007029925473034382, -0.006870690733194351, -0.0067114559933543205, -0.00655222125351429, -0.0063929869793355465, -0.006233752239495516, -0.006074517499655485, -0.005915283225476742, -0.005756048485636711, -0.0055968137457966805, -0.005437579471617937, -0.005278344731777906, -0.005119110457599163, -0.004959875717759132, -0.004800640977919102, -0.004641406238079071, -0.004482171963900328, -0.004322937224060297, -0.004163702949881554, -0.004004468210041523, -0.003845233703032136, -0.003685999196022749, -0.0035267644561827183, -0.0033675299491733313, -0.0032082954421639442, -0.0030490607023239136, -0.002889825962483883, -0.002730591455474496, -0.0025713567156344652, -0.002412122208625078, -0.0022528874687850475, -0.0020936529617756605, -0.0019344184547662735, -0.0017751838313415647, -0.0016159492079168558, -0.001456714584492147, -0.0012974799610674381, -0.0011382454540580511, -0.0009790108306333423, -0.0008197762072086334, -0.0006605416419915855, -0.0005013070767745376, -0.0003420724533498287, -0.00018283785902895033, -2.3603264708071947e-05, 0.00013563132961280644, 0.0002948659239336848, 0.00045410054735839367, 0.0006133351125754416, 0.0007725696777924895, 0.0009318043012171984, 0.0010910389246419072, 0.001250273548066616, 0.001409508055076003, 0.001568742678500712, 0.0017279773019254208, 0.0018872118089348078, 0.002046446315944195, 0.0022056810557842255]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 8.0, 11.0, 8.0, 11.0, 15.0, 11.0, 10.0, 16.0, 32.0, 26.0, 28.0, 22.0, 28.0, 36.0, 40.0, 39.0, 24.0, 32.0, 43.0, 36.0, 28.0, 36.0, 50.0, 30.0, 32.0, 28.0, 33.0, 40.0, 28.0, 22.0, 18.0, 23.0, 18.0, 18.0, 13.0, 19.0, 17.0, 11.0, 12.0, 5.0, 9.0, 10.0, 6.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0013865232467651367, -0.0013429252430796623, -0.001299327239394188, -0.0012557292357087135, -0.0012121312320232391, -0.0011685332283377647, -0.0011249352246522903, -0.001081337220966816, -0.0010377392172813416, -0.0009941412135958672, -0.0009505432099103928, -0.0009069452062249184, -0.000863347202539444, -0.0008197491988539696, -0.0007761511951684952, -0.0007325531914830208, -0.0006889551877975464, -0.000645357184112072, -0.0006017591804265976, -0.0005581611767411232, -0.0005145631730556488, -0.0004709651693701744, -0.0004273671656847, -0.0003837691619992256, -0.0003401711583137512, -0.0002965731546282768, -0.00025297515094280243, -0.00020937714725732803, -0.00016577914357185364, -0.00012218113988637924, -7.858313620090485e-05, -3.498513251543045e-05, 8.612871170043945e-06, 5.221087485551834e-05, 9.580887854099274e-05, 0.00013940688222646713, 0.00018300488591194153, 0.00022660288959741592, 0.0002702008932828903, 0.0003137988969683647, 0.0003573969006538391, 0.0004009949043393135, 0.0004445929080247879, 0.0004881909117102623, 0.0005317889153957367, 0.0005753869190812111, 0.0006189849227666855, 0.0006625829264521599, 0.0007061809301376343, 0.0007497789338231087, 0.0007933769375085831, 0.0008369749411940575, 0.0008805729448795319, 0.0009241709485650063, 0.0009677689522504807, 0.001011366955935955, 0.0010549649596214294, 0.0010985629633069038, 0.0011421609669923782, 0.0011857589706778526, 0.001229356974363327, 0.0012729549780488014, 0.0013165529817342758, 0.0013601509854197502, 0.0014037489891052246]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 6.0, 9.0, 14.0, 12.0, 19.0, 18.0, 16.0, 18.0, 28.0, 22.0, 31.0, 41.0, 39.0, 48.0, 60.0, 51.0, 43.0, 45.0, 47.0, 50.0, 42.0, 53.0, 37.0, 29.0, 40.0, 26.0, 27.0, 20.0, 21.0, 16.0, 18.0, 12.0, 13.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.95458984375, -16.3935546875, -15.83251953125, -15.271484375, -14.71044921875, -14.1494140625, -13.58837890625, -13.02734375, -12.46630859375, -11.9052734375, -11.34423828125, -10.783203125, -10.22216796875, -9.6611328125, -9.10009765625, -8.5390625, -7.97802734375, -7.4169921875, -6.85595703125, -6.294921875, -5.73388671875, -5.1728515625, -4.61181640625, -4.05078125, -3.48974609375, -2.9287109375, -2.36767578125, -1.806640625, -1.24560546875, -0.6845703125, -0.12353515625, 0.4375, 0.99853515625, 1.5595703125, 2.12060546875, 2.681640625, 3.24267578125, 3.8037109375, 4.36474609375, 4.92578125, 5.48681640625, 6.0478515625, 6.60888671875, 7.169921875, 7.73095703125, 8.2919921875, 8.85302734375, 9.4140625, 9.97509765625, 10.5361328125, 11.09716796875, 11.658203125, 12.21923828125, 12.7802734375, 13.34130859375, 13.90234375, 14.46337890625, 15.0244140625, 15.58544921875, 16.146484375, 16.70751953125, 17.2685546875, 17.82958984375, 18.390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 9.0, 11.0, 24.0, 25.0, 24.0, 47.0, 46.0, 58.0, 90.0, 120.0, 183.0, 293.0, 404.0, 555.0, 829.0, 1982.0, 11593.0, 161240.0, 829147.0, 34214.0, 4248.0, 1189.0, 625.0, 438.0, 322.0, 243.0, 161.0, 108.0, 83.0, 55.0, 49.0, 43.0, 23.0, 20.0, 14.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.40625, -42.98486328125, -41.5634765625, -40.14208984375, -38.720703125, -37.29931640625, -35.8779296875, -34.45654296875, -33.03515625, -31.61376953125, -30.1923828125, -28.77099609375, -27.349609375, -25.92822265625, -24.5068359375, -23.08544921875, -21.6640625, -20.24267578125, -18.8212890625, -17.39990234375, -15.978515625, -14.55712890625, -13.1357421875, -11.71435546875, -10.29296875, -8.87158203125, -7.4501953125, -6.02880859375, -4.607421875, -3.18603515625, -1.7646484375, -0.34326171875, 1.078125, 2.49951171875, 3.9208984375, 5.34228515625, 6.763671875, 8.18505859375, 9.6064453125, 11.02783203125, 12.44921875, 13.87060546875, 15.2919921875, 16.71337890625, 18.134765625, 19.55615234375, 20.9775390625, 22.39892578125, 23.8203125, 25.24169921875, 26.6630859375, 28.08447265625, 29.505859375, 30.92724609375, 32.3486328125, 33.77001953125, 35.19140625, 36.61279296875, 38.0341796875, 39.45556640625, 40.876953125, 42.29833984375, 43.7197265625, 45.14111328125, 46.5625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 4.0, 12.0, 7.0, 11.0, 9.0, 12.0, 17.0, 19.0, 23.0, 34.0, 35.0, 32.0, 35.0, 39.0, 42.0, 34.0, 44.0, 95.0, 379.0, 1606.0, 119.0, 60.0, 45.0, 49.0, 43.0, 38.0, 30.0, 28.0, 20.0, 16.0, 17.0, 16.0, 15.0, 15.0, 13.0, 10.0, 10.0, 6.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.53125, -50.99072265625, -49.4501953125, -47.90966796875, -46.369140625, -44.82861328125, -43.2880859375, -41.74755859375, -40.20703125, -38.66650390625, -37.1259765625, -35.58544921875, -34.044921875, -32.50439453125, -30.9638671875, -29.42333984375, -27.8828125, -26.34228515625, -24.8017578125, -23.26123046875, -21.720703125, -20.18017578125, -18.6396484375, -17.09912109375, -15.55859375, -14.01806640625, -12.4775390625, -10.93701171875, -9.396484375, -7.85595703125, -6.3154296875, -4.77490234375, -3.234375, -1.69384765625, -0.1533203125, 1.38720703125, 2.927734375, 4.46826171875, 6.0087890625, 7.54931640625, 9.08984375, 10.63037109375, 12.1708984375, 13.71142578125, 15.251953125, 16.79248046875, 18.3330078125, 19.87353515625, 21.4140625, 22.95458984375, 24.4951171875, 26.03564453125, 27.576171875, 29.11669921875, 30.6572265625, 32.19775390625, 33.73828125, 35.27880859375, 36.8193359375, 38.35986328125, 39.900390625, 41.44091796875, 42.9814453125, 44.52197265625, 46.0625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 14.0, 14.0, 21.0, 13.0, 19.0, 18.0, 24.0, 22.0, 30.0, 32.0, 60.0, 82.0, 138.0, 211.0, 453.0, 2120.0, 2468107.0, 671462.0, 1693.0, 473.0, 183.0, 115.0, 78.0, 55.0, 45.0, 45.0, 24.0, 32.0, 23.0, 14.0, 11.0, 12.0, 13.0, 5.0, 12.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.75, -123.486328125, -119.22265625, -114.958984375, -110.6953125, -106.431640625, -102.16796875, -97.904296875, -93.640625, -89.376953125, -85.11328125, -80.849609375, -76.5859375, -72.322265625, -68.05859375, -63.794921875, -59.53125, -55.267578125, -51.00390625, -46.740234375, -42.4765625, -38.212890625, -33.94921875, -29.685546875, -25.421875, -21.158203125, -16.89453125, -12.630859375, -8.3671875, -4.103515625, 0.16015625, 4.423828125, 8.6875, 12.951171875, 17.21484375, 21.478515625, 25.7421875, 30.005859375, 34.26953125, 38.533203125, 42.796875, 47.060546875, 51.32421875, 55.587890625, 59.8515625, 64.115234375, 68.37890625, 72.642578125, 76.90625, 81.169921875, 85.43359375, 89.697265625, 93.9609375, 98.224609375, 102.48828125, 106.751953125, 111.015625, 115.279296875, 119.54296875, 123.806640625, 128.0703125, 132.333984375, 136.59765625, 140.861328125, 145.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 44.0, 595.0, 356.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.111148834228516, -27.849672317504883, -20.58819580078125, -13.32672119140625, -6.065244674682617, 1.1962318420410156, 8.457706451416016, 15.719184875488281, 22.98065948486328, 30.242136001586914, 37.50361251831055, 44.76508712768555, 52.02656555175781, 59.28804016113281, 66.54951477050781, 73.81098937988281, 81.07246398925781, 88.33393859863281, 95.59541320800781, 102.85688781738281, 110.11837005615234, 117.37984466552734, 124.64131927490234, 131.90280151367188, 139.16427612304688, 146.42575073242188, 153.68722534179688, 160.94869995117188, 168.21017456054688, 175.47164916992188, 182.73312377929688, 189.99461364746094, 197.25608825683594, 204.51756286621094, 211.77903747558594, 219.04051208496094, 226.30198669433594, 233.5634765625, 240.824951171875, 248.08642578125, 255.347900390625, 262.609375, 269.870849609375, 277.13232421875, 284.393798828125, 291.6552734375, 298.916748046875, 306.17822265625, 313.439697265625, 320.701171875, 327.962646484375, 335.22412109375, 342.485595703125, 349.7470703125, 357.008544921875, 364.27001953125, 371.5315246582031, 378.7929992675781, 386.0544738769531, 393.3159484863281, 400.5774230957031, 407.8388977050781, 415.1003723144531, 422.3618469238281, 429.6233215332031]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 9.0, 16.0, 13.0, 13.0, 12.0, 20.0, 16.0, 27.0, 16.0, 22.0, 27.0, 26.0, 22.0, 30.0, 27.0, 30.0, 35.0, 44.0, 36.0, 40.0, 31.0, 31.0, 41.0, 40.0, 42.0, 27.0, 26.0, 33.0, 29.0, 29.0, 29.0, 28.0, 20.0, 17.0, 17.0, 8.0, 16.0, 9.0, 4.0, 10.0, 6.0, 3.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-105.90666198730469, -102.45897674560547, -99.01129913330078, -95.56361389160156, -92.11593627929688, -88.66825103759766, -85.22056579589844, -81.77288818359375, -78.32521057128906, -74.87752532958984, -71.42984771728516, -67.98216247558594, -64.53448486328125, -61.08679962158203, -57.63911819458008, -54.191436767578125, -50.743751525878906, -47.29607009887695, -43.848388671875, -40.40070343017578, -36.953025817871094, -33.505340576171875, -30.057659149169922, -26.60997772216797, -23.162296295166016, -19.714614868164062, -16.26693344116211, -12.819250106811523, -9.37156867980957, -5.923887252807617, -2.4762039184570312, 0.9714775085449219, 4.419158935546875, 7.866840839385986, 11.314522743225098, 14.762205123901367, 18.20988655090332, 21.657567977905273, 25.10525131225586, 28.552932739257812, 32.000614166259766, 35.44829559326172, 38.89597702026367, 42.343658447265625, 45.791343688964844, 49.23902130126953, 52.68670654296875, 56.1343879699707, 59.582069396972656, 63.02975082397461, 66.47743225097656, 69.92511749267578, 73.37279510498047, 76.82048034667969, 80.26815795898438, 83.7158432006836, 87.16352844238281, 90.61121368408203, 94.05889129638672, 97.50657653808594, 100.95425415039062, 104.40193939208984, 107.84962463378906, 111.29730224609375, 114.74497985839844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 12.0, 16.0, 9.0, 14.0, 18.0, 17.0, 23.0, 33.0, 18.0, 30.0, 33.0, 53.0, 41.0, 49.0, 50.0, 51.0, 44.0, 60.0, 50.0, 33.0, 47.0, 42.0, 34.0, 43.0, 31.0, 25.0, 23.0, 16.0, 23.0, 9.0, 14.0, 13.0, 5.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.6259765625, -18.048828125, -17.4716796875, -16.89453125, -16.3173828125, -15.740234375, -15.1630859375, -14.5859375, -14.0087890625, -13.431640625, -12.8544921875, -12.27734375, -11.7001953125, -11.123046875, -10.5458984375, -9.96875, -9.3916015625, -8.814453125, -8.2373046875, -7.66015625, -7.0830078125, -6.505859375, -5.9287109375, -5.3515625, -4.7744140625, -4.197265625, -3.6201171875, -3.04296875, -2.4658203125, -1.888671875, -1.3115234375, -0.734375, -0.1572265625, 0.419921875, 0.9970703125, 1.57421875, 2.1513671875, 2.728515625, 3.3056640625, 3.8828125, 4.4599609375, 5.037109375, 5.6142578125, 6.19140625, 6.7685546875, 7.345703125, 7.9228515625, 8.5, 9.0771484375, 9.654296875, 10.2314453125, 10.80859375, 11.3857421875, 11.962890625, 12.5400390625, 13.1171875, 13.6943359375, 14.271484375, 14.8486328125, 15.42578125, 16.0029296875, 16.580078125, 17.1572265625, 17.734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 8.0, 7.0, 5.0, 10.0, 14.0, 15.0, 26.0, 37.0, 44.0, 39.0, 52.0, 81.0, 93.0, 146.0, 168.0, 248.0, 283.0, 496.0, 873.0, 1998.0, 7635.0, 67189.0, 1127248.0, 2616715.0, 341439.0, 22095.0, 3818.0, 1314.0, 642.0, 417.0, 282.0, 196.0, 155.0, 126.0, 84.0, 72.0, 40.0, 42.0, 25.0, 31.0, 30.0, 9.0, 13.0, 8.0, 9.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.875, -33.79443359375, -32.7138671875, -31.63330078125, -30.552734375, -29.47216796875, -28.3916015625, -27.31103515625, -26.23046875, -25.14990234375, -24.0693359375, -22.98876953125, -21.908203125, -20.82763671875, -19.7470703125, -18.66650390625, -17.5859375, -16.50537109375, -15.4248046875, -14.34423828125, -13.263671875, -12.18310546875, -11.1025390625, -10.02197265625, -8.94140625, -7.86083984375, -6.7802734375, -5.69970703125, -4.619140625, -3.53857421875, -2.4580078125, -1.37744140625, -0.296875, 0.78369140625, 1.8642578125, 2.94482421875, 4.025390625, 5.10595703125, 6.1865234375, 7.26708984375, 8.34765625, 9.42822265625, 10.5087890625, 11.58935546875, 12.669921875, 13.75048828125, 14.8310546875, 15.91162109375, 16.9921875, 18.07275390625, 19.1533203125, 20.23388671875, 21.314453125, 22.39501953125, 23.4755859375, 24.55615234375, 25.63671875, 26.71728515625, 27.7978515625, 28.87841796875, 29.958984375, 31.03955078125, 32.1201171875, 33.20068359375, 34.28125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 14.0, 22.0, 42.0, 57.0, 128.0, 223.0, 346.0, 647.0, 876.0, 720.0, 434.0, 229.0, 144.0, 74.0, 41.0, 28.0, 20.0, 9.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-54.125, -52.72314453125, -51.3212890625, -49.91943359375, -48.517578125, -47.11572265625, -45.7138671875, -44.31201171875, -42.91015625, -41.50830078125, -40.1064453125, -38.70458984375, -37.302734375, -35.90087890625, -34.4990234375, -33.09716796875, -31.6953125, -30.29345703125, -28.8916015625, -27.48974609375, -26.087890625, -24.68603515625, -23.2841796875, -21.88232421875, -20.48046875, -19.07861328125, -17.6767578125, -16.27490234375, -14.873046875, -13.47119140625, -12.0693359375, -10.66748046875, -9.265625, -7.86376953125, -6.4619140625, -5.06005859375, -3.658203125, -2.25634765625, -0.8544921875, 0.54736328125, 1.94921875, 3.35107421875, 4.7529296875, 6.15478515625, 7.556640625, 8.95849609375, 10.3603515625, 11.76220703125, 13.1640625, 14.56591796875, 15.9677734375, 17.36962890625, 18.771484375, 20.17333984375, 21.5751953125, 22.97705078125, 24.37890625, 25.78076171875, 27.1826171875, 28.58447265625, 29.986328125, 31.38818359375, 32.7900390625, 34.19189453125, 35.59375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 15.0, 15.0, 26.0, 30.0, 39.0, 74.0, 112.0, 175.0, 325.0, 663.0, 2159.0, 49478.0, 4107845.0, 30050.0, 1879.0, 607.0, 283.0, 153.0, 91.0, 68.0, 58.0, 35.0, 26.0, 22.0, 12.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.625, -129.5078125, -125.390625, -121.2734375, -117.15625, -113.0390625, -108.921875, -104.8046875, -100.6875, -96.5703125, -92.453125, -88.3359375, -84.21875, -80.1015625, -75.984375, -71.8671875, -67.75, -63.6328125, -59.515625, -55.3984375, -51.28125, -47.1640625, -43.046875, -38.9296875, -34.8125, -30.6953125, -26.578125, -22.4609375, -18.34375, -14.2265625, -10.109375, -5.9921875, -1.875, 2.2421875, 6.359375, 10.4765625, 14.59375, 18.7109375, 22.828125, 26.9453125, 31.0625, 35.1796875, 39.296875, 43.4140625, 47.53125, 51.6484375, 55.765625, 59.8828125, 64.0, 68.1171875, 72.234375, 76.3515625, 80.46875, 84.5859375, 88.703125, 92.8203125, 96.9375, 101.0546875, 105.171875, 109.2890625, 113.40625, 117.5234375, 121.640625, 125.7578125, 129.875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 37.0, 343.0, 504.0, 118.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-424.31805419921875, -411.1553039550781, -397.9925842285156, -384.829833984375, -371.6670837402344, -358.5043640136719, -345.34161376953125, -332.17889404296875, -319.0161437988281, -305.8533935546875, -292.690673828125, -279.5279235839844, -266.36517333984375, -253.20245361328125, -240.03970336914062, -226.87696838378906, -213.71421813964844, -200.55148315429688, -187.38873291015625, -174.2259979248047, -161.06326293945312, -147.9005126953125, -134.73777770996094, -121.57504272460938, -108.41230010986328, -95.24955749511719, -82.08682250976562, -68.92407989501953, -55.7613410949707, -42.598602294921875, -29.43585968017578, -16.27312469482422, -3.110382080078125, 10.05235767364502, 23.215097427368164, 36.377838134765625, 49.54057693481445, 62.70331573486328, 75.86605834960938, 89.02879333496094, 102.19153594970703, 115.35427856445312, 128.5170135498047, 141.67974853515625, 154.84249877929688, 168.00523376464844, 181.16796875, 194.33071899414062, 207.4934539794922, 220.65618896484375, 233.81893920898438, 246.98167419433594, 260.1444091796875, 273.3071594238281, 286.46990966796875, 299.63262939453125, 312.7953796386719, 325.9581298828125, 339.120849609375, 352.2835998535156, 365.44635009765625, 378.60906982421875, 391.7718200683594, 404.9345703125, 418.0972900390625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 9.0, 6.0, 7.0, 10.0, 12.0, 12.0, 11.0, 18.0, 32.0, 19.0, 30.0, 33.0, 30.0, 41.0, 38.0, 43.0, 50.0, 45.0, 48.0, 42.0, 46.0, 52.0, 39.0, 43.0, 44.0, 35.0, 46.0, 27.0, 28.0, 23.0, 17.0, 13.0, 14.0, 8.0, 9.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.2860107421875, -103.18708801269531, -100.0881576538086, -96.9892349243164, -93.89030456542969, -90.7913818359375, -87.69245910644531, -84.59353637695312, -81.4946060180664, -78.39568328857422, -75.2967529296875, -72.19783020019531, -69.09890747070312, -65.9999771118164, -62.90105438232422, -59.802127838134766, -56.70320129394531, -53.60427474975586, -50.505348205566406, -47.40642547607422, -44.307498931884766, -41.20857238769531, -38.109649658203125, -35.01072311401367, -31.91179656982422, -28.812870025634766, -25.713945388793945, -22.615020751953125, -19.516094207763672, -16.41716766357422, -13.318243026733398, -10.219318389892578, -7.120391845703125, -4.021466255187988, -0.9225406646728516, 2.176384925842285, 5.275310516357422, 8.374236106872559, 11.473161697387695, 14.572086334228516, 17.67101287841797, 20.769939422607422, 23.868864059448242, 26.967788696289062, 30.066715240478516, 33.16564178466797, 36.264564514160156, 39.36349105834961, 42.46241760253906, 45.561344146728516, 48.66027069091797, 51.759193420410156, 54.85811996459961, 57.95704650878906, 61.05596923828125, 64.15489196777344, 67.25382232666016, 70.35274505615234, 73.45167541503906, 76.55059814453125, 79.64952087402344, 82.74845123291016, 85.84737396240234, 88.94630432128906, 92.04522705078125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 10.0, 15.0, 3.0, 12.0, 10.0, 22.0, 17.0, 25.0, 25.0, 32.0, 32.0, 34.0, 47.0, 39.0, 32.0, 32.0, 51.0, 48.0, 41.0, 37.0, 46.0, 39.0, 52.0, 36.0, 30.0, 22.0, 29.0, 38.0, 20.0, 27.0, 14.0, 19.0, 14.0, 4.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0390625, -14.5018310546875, -13.964599609375, -13.4273681640625, -12.89013671875, -12.3529052734375, -11.815673828125, -11.2784423828125, -10.7412109375, -10.2039794921875, -9.666748046875, -9.1295166015625, -8.59228515625, -8.0550537109375, -7.517822265625, -6.9805908203125, -6.443359375, -5.9061279296875, -5.368896484375, -4.8316650390625, -4.29443359375, -3.7572021484375, -3.219970703125, -2.6827392578125, -2.1455078125, -1.6082763671875, -1.071044921875, -0.5338134765625, 0.00341796875, 0.5406494140625, 1.077880859375, 1.6151123046875, 2.15234375, 2.6895751953125, 3.226806640625, 3.7640380859375, 4.30126953125, 4.8385009765625, 5.375732421875, 5.9129638671875, 6.4501953125, 6.9874267578125, 7.524658203125, 8.0618896484375, 8.59912109375, 9.1363525390625, 9.673583984375, 10.2108154296875, 10.748046875, 11.2852783203125, 11.822509765625, 12.3597412109375, 12.89697265625, 13.4342041015625, 13.971435546875, 14.5086669921875, 15.0458984375, 15.5831298828125, 16.120361328125, 16.6575927734375, 17.19482421875, 17.7320556640625, 18.269287109375, 18.8065185546875, 19.34375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 15.0, 15.0, 23.0, 48.0, 56.0, 98.0, 138.0, 202.0, 280.0, 457.0, 739.0, 1114.0, 1727.0, 2794.0, 4190.0, 6734.0, 10512.0, 16966.0, 27119.0, 43475.0, 71623.0, 117262.0, 187117.0, 206074.0, 134453.0, 81857.0, 49969.0, 31130.0, 19308.0, 12110.0, 7470.0, 4955.0, 3014.0, 1913.0, 1236.0, 806.0, 540.0, 341.0, 218.0, 144.0, 98.0, 71.0, 59.0, 25.0, 17.0, 18.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.80859375, -1.7523193359375, -1.696044921875, -1.6397705078125, -1.58349609375, -1.5272216796875, -1.470947265625, -1.4146728515625, -1.3583984375, -1.3021240234375, -1.245849609375, -1.1895751953125, -1.13330078125, -1.0770263671875, -1.020751953125, -0.9644775390625, -0.908203125, -0.8519287109375, -0.795654296875, -0.7393798828125, -0.68310546875, -0.6268310546875, -0.570556640625, -0.5142822265625, -0.4580078125, -0.4017333984375, -0.345458984375, -0.2891845703125, -0.23291015625, -0.1766357421875, -0.120361328125, -0.0640869140625, -0.0078125, 0.0484619140625, 0.104736328125, 0.1610107421875, 0.21728515625, 0.2735595703125, 0.329833984375, 0.3861083984375, 0.4423828125, 0.4986572265625, 0.554931640625, 0.6112060546875, 0.66748046875, 0.7237548828125, 0.780029296875, 0.8363037109375, 0.892578125, 0.9488525390625, 1.005126953125, 1.0614013671875, 1.11767578125, 1.1739501953125, 1.230224609375, 1.2864990234375, 1.3427734375, 1.3990478515625, 1.455322265625, 1.5115966796875, 1.56787109375, 1.6241455078125, 1.680419921875, 1.7366943359375, 1.79296875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 13.0, 8.0, 14.0, 13.0, 21.0, 16.0, 20.0, 27.0, 14.0, 29.0, 29.0, 34.0, 27.0, 42.0, 33.0, 34.0, 48.0, 34.0, 1073.0, 38.0, 40.0, 38.0, 44.0, 39.0, 38.0, 32.0, 32.0, 40.0, 22.0, 18.0, 17.0, 15.0, 13.0, 11.0, 9.0, 8.0, 8.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-11.4296875, -11.1068115234375, -10.783935546875, -10.4610595703125, -10.13818359375, -9.8153076171875, -9.492431640625, -9.1695556640625, -8.8466796875, -8.5238037109375, -8.200927734375, -7.8780517578125, -7.55517578125, -7.2322998046875, -6.909423828125, -6.5865478515625, -6.263671875, -5.9407958984375, -5.617919921875, -5.2950439453125, -4.97216796875, -4.6492919921875, -4.326416015625, -4.0035400390625, -3.6806640625, -3.3577880859375, -3.034912109375, -2.7120361328125, -2.38916015625, -2.0662841796875, -1.743408203125, -1.4205322265625, -1.09765625, -0.7747802734375, -0.451904296875, -0.1290283203125, 0.19384765625, 0.5167236328125, 0.839599609375, 1.1624755859375, 1.4853515625, 1.8082275390625, 2.131103515625, 2.4539794921875, 2.77685546875, 3.0997314453125, 3.422607421875, 3.7454833984375, 4.068359375, 4.3912353515625, 4.714111328125, 5.0369873046875, 5.35986328125, 5.6827392578125, 6.005615234375, 6.3284912109375, 6.6513671875, 6.9742431640625, 7.297119140625, 7.6199951171875, 7.94287109375, 8.2657470703125, 8.588623046875, 8.9114990234375, 9.234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 11.0, 7.0, 17.0, 33.0, 41.0, 82.0, 86.0, 140.0, 188.0, 331.0, 496.0, 767.0, 1155.0, 1639.0, 2700.0, 4338.0, 6668.0, 10415.0, 16903.0, 26943.0, 43073.0, 69662.0, 114047.0, 183837.0, 1255546.0, 137160.0, 83340.0, 51211.0, 31884.0, 19930.0, 12355.0, 7954.0, 4983.0, 3332.0, 2075.0, 1347.0, 840.0, 549.0, 331.0, 243.0, 155.0, 119.0, 61.0, 40.0, 35.0, 16.0, 21.0, 17.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.78125, -1.727569580078125, -1.67388916015625, -1.620208740234375, -1.5665283203125, -1.512847900390625, -1.45916748046875, -1.405487060546875, -1.351806640625, -1.298126220703125, -1.24444580078125, -1.190765380859375, -1.1370849609375, -1.083404541015625, -1.02972412109375, -0.976043701171875, -0.92236328125, -0.868682861328125, -0.81500244140625, -0.761322021484375, -0.7076416015625, -0.653961181640625, -0.60028076171875, -0.546600341796875, -0.492919921875, -0.439239501953125, -0.38555908203125, -0.331878662109375, -0.2781982421875, -0.224517822265625, -0.17083740234375, -0.117156982421875, -0.0634765625, -0.009796142578125, 0.04388427734375, 0.097564697265625, 0.1512451171875, 0.204925537109375, 0.25860595703125, 0.312286376953125, 0.365966796875, 0.419647216796875, 0.47332763671875, 0.527008056640625, 0.5806884765625, 0.634368896484375, 0.68804931640625, 0.741729736328125, 0.79541015625, 0.849090576171875, 0.90277099609375, 0.956451416015625, 1.0101318359375, 1.063812255859375, 1.11749267578125, 1.171173095703125, 1.224853515625, 1.278533935546875, 1.33221435546875, 1.385894775390625, 1.4395751953125, 1.493255615234375, 1.54693603515625, 1.600616455078125, 1.654296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 12.0, 10.0, 15.0, 18.0, 28.0, 40.0, 37.0, 61.0, 66.0, 74.0, 91.0, 87.0, 90.0, 85.0, 70.0, 55.0, 49.0, 28.0, 19.0, 14.0, 10.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004901885986328125, -0.004735291004180908, -0.004568696022033691, -0.004402101039886475, -0.004235506057739258, -0.004068911075592041, -0.0039023160934448242, -0.0037357211112976074, -0.0035691261291503906, -0.003402531147003174, -0.003235936164855957, -0.0030693411827087402, -0.0029027462005615234, -0.0027361512184143066, -0.00256955623626709, -0.002402961254119873, -0.0022363662719726562, -0.0020697712898254395, -0.0019031763076782227, -0.0017365813255310059, -0.001569986343383789, -0.0014033913612365723, -0.0012367963790893555, -0.0010702013969421387, -0.0009036064147949219, -0.0007370114326477051, -0.0005704164505004883, -0.0004038214683532715, -0.0002372264862060547, -7.063150405883789e-05, 9.59634780883789e-05, 0.0002625584602355957, 0.0004291534423828125, 0.0005957484245300293, 0.0007623434066772461, 0.0009289383888244629, 0.0010955333709716797, 0.0012621283531188965, 0.0014287233352661133, 0.00159531831741333, 0.0017619132995605469, 0.0019285082817077637, 0.0020951032638549805, 0.0022616982460021973, 0.002428293228149414, 0.002594888210296631, 0.0027614831924438477, 0.0029280781745910645, 0.0030946731567382812, 0.003261268138885498, 0.003427863121032715, 0.0035944581031799316, 0.0037610530853271484, 0.003927648067474365, 0.004094243049621582, 0.004260838031768799, 0.004427433013916016, 0.004594027996063232, 0.004760622978210449, 0.004927217960357666, 0.005093812942504883, 0.0052604079246521, 0.005427002906799316, 0.005593597888946533, 0.00576019287109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 4.0, 10.0, 16.0, 12.0, 25.0, 31.0, 48.0, 62.0, 139.0, 202.0, 449.0, 1669.0, 1042054.0, 2712.0, 484.0, 213.0, 135.0, 94.0, 44.0, 53.0, 20.0, 19.0, 13.0, 17.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.12411022186279297, -0.12041282653808594, -0.1167154312133789, -0.11301803588867188, -0.10932064056396484, -0.10562324523925781, -0.10192584991455078, -0.09822845458984375, -0.09453105926513672, -0.09083366394042969, -0.08713626861572266, -0.08343887329101562, -0.0797414779663086, -0.07604408264160156, -0.07234668731689453, -0.0686492919921875, -0.06495189666748047, -0.06125450134277344, -0.057557106018066406, -0.053859710693359375, -0.050162315368652344, -0.04646492004394531, -0.04276752471923828, -0.03907012939453125, -0.03537273406982422, -0.03167533874511719, -0.027977943420410156, -0.024280548095703125, -0.020583152770996094, -0.016885757446289062, -0.013188362121582031, -0.009490966796875, -0.005793571472167969, -0.0020961761474609375, 0.0016012191772460938, 0.005298614501953125, 0.008996009826660156, 0.012693405151367188, 0.01639080047607422, 0.02008819580078125, 0.02378559112548828, 0.027482986450195312, 0.031180381774902344, 0.034877777099609375, 0.038575172424316406, 0.04227256774902344, 0.04596996307373047, 0.0496673583984375, 0.05336475372314453, 0.05706214904785156, 0.060759544372558594, 0.06445693969726562, 0.06815433502197266, 0.07185173034667969, 0.07554912567138672, 0.07924652099609375, 0.08294391632080078, 0.08664131164550781, 0.09033870697021484, 0.09403610229492188, 0.0977334976196289, 0.10143089294433594, 0.10512828826904297, 0.10882568359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [108.0, 827.0, 80.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007027438259683549, -0.00020967214368283749, 0.00028339953860267997, 0.0007764711626805365, 0.001269542844966054, 0.0017626145854592323, 0.002255686093121767, 0.0027487578336149454, 0.0032418295741081238, 0.003734901314601302, 0.0042279730550944805, 0.004721044562757015, 0.005214116536080837, 0.005707188043743372, 0.006200259551405907, 0.006693331524729729, 0.007186403032392263, 0.007679474540054798, 0.00817254651337862, 0.008665617555379868, 0.00915868952870369, 0.009651761502027512, 0.010144833475351334, 0.010637904517352581, 0.011130976490676403, 0.011624048464000225, 0.012117119506001472, 0.012610191479325294, 0.013103263452649117, 0.013596335425972939, 0.014089406467974186, 0.014582478441298008, 0.015075549483299255, 0.015568621456623077, 0.0160616934299469, 0.01655476540327072, 0.017047835513949394, 0.017540907487273216, 0.01803397946059704, 0.01852705143392086, 0.019020123407244682, 0.019513195380568504, 0.020006267353892326, 0.020499337464571, 0.02099240943789482, 0.021485481411218643, 0.021978553384542465, 0.022471625357866287, 0.02296469733119011, 0.02345776930451393, 0.023950841277837753, 0.024443913251161575, 0.024936983361840248, 0.02543005533516407, 0.025923127308487892, 0.026416199281811714, 0.026909269392490387, 0.02740234136581421, 0.02789541333913803, 0.028388485312461853, 0.028881555423140526, 0.029374627396464348, 0.02986769936978817, 0.030360771343111992, 0.030853843316435814]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 7.0, 10.0, 10.0, 10.0, 12.0, 7.0, 20.0, 17.0, 21.0, 26.0, 21.0, 13.0, 33.0, 27.0, 28.0, 35.0, 36.0, 38.0, 44.0, 45.0, 46.0, 45.0, 33.0, 33.0, 38.0, 31.0, 30.0, 36.0, 34.0, 33.0, 24.0, 40.0, 18.0, 14.0, 11.0, 9.0, 14.0, 9.0, 9.0, 12.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0020775198936462402, -0.0020182253792881966, -0.001958930864930153, -0.0018996363505721092, -0.0018403418362140656, -0.0017810473218560219, -0.0017217528074979782, -0.0016624582931399345, -0.0016031637787818909, -0.0015438692644238472, -0.0014845747500658035, -0.0014252802357077599, -0.0013659857213497162, -0.0013066912069916725, -0.0012473966926336288, -0.0011881021782755852, -0.0011288076639175415, -0.0010695131495594978, -0.0010102186352014542, -0.0009509241208434105, -0.0008916296064853668, -0.0008323350921273232, -0.0007730405777692795, -0.0007137460634112358, -0.0006544515490531921, -0.0005951570346951485, -0.0005358625203371048, -0.0004765680059790611, -0.00041727349162101746, -0.0003579789772629738, -0.0002986844629049301, -0.00023938994854688644, -0.00018009543418884277, -0.0001208009198307991, -6.150640547275543e-05, -2.2118911147117615e-06, 5.708262324333191e-05, 0.00011637713760137558, 0.00017567165195941925, 0.00023496616631746292, 0.0002942606806755066, 0.00035355519503355026, 0.00041284970939159393, 0.0004721442237496376, 0.0005314387381076813, 0.0005907332524657249, 0.0006500277668237686, 0.0007093222811818123, 0.000768616795539856, 0.0008279113098978996, 0.0008872058242559433, 0.000946500338613987, 0.0010057948529720306, 0.0010650893673300743, 0.001124383881688118, 0.0011836783960461617, 0.0012429729104042053, 0.001302267424762249, 0.0013615619391202927, 0.0014208564534783363, 0.00148015096783638, 0.0015394454821944237, 0.0015987399965524673, 0.001658034510910511, 0.0017173290252685547]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 10.0, 15.0, 3.0, 12.0, 10.0, 22.0, 17.0, 25.0, 25.0, 32.0, 32.0, 34.0, 47.0, 39.0, 32.0, 32.0, 51.0, 48.0, 41.0, 37.0, 46.0, 39.0, 52.0, 36.0, 30.0, 22.0, 29.0, 38.0, 20.0, 27.0, 14.0, 19.0, 14.0, 4.0, 10.0, 6.0, 4.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0390625, -14.5018310546875, -13.964599609375, -13.4273681640625, -12.89013671875, -12.3529052734375, -11.815673828125, -11.2784423828125, -10.7412109375, -10.2039794921875, -9.666748046875, -9.1295166015625, -8.59228515625, -8.0550537109375, -7.517822265625, -6.9805908203125, -6.443359375, -5.9061279296875, -5.368896484375, -4.8316650390625, -4.29443359375, -3.7572021484375, -3.219970703125, -2.6827392578125, -2.1455078125, -1.6082763671875, -1.071044921875, -0.5338134765625, 0.00341796875, 0.5406494140625, 1.077880859375, 1.6151123046875, 2.15234375, 2.6895751953125, 3.226806640625, 3.7640380859375, 4.30126953125, 4.8385009765625, 5.375732421875, 5.9129638671875, 6.4501953125, 6.9874267578125, 7.524658203125, 8.0618896484375, 8.59912109375, 9.1363525390625, 9.673583984375, 10.2108154296875, 10.748046875, 11.2852783203125, 11.822509765625, 12.3597412109375, 12.89697265625, 13.4342041015625, 13.971435546875, 14.5086669921875, 15.0458984375, 15.5831298828125, 16.120361328125, 16.6575927734375, 17.19482421875, 17.7320556640625, 18.269287109375, 18.8065185546875, 19.34375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 6.0, 14.0, 14.0, 21.0, 22.0, 32.0, 41.0, 54.0, 67.0, 77.0, 125.0, 182.0, 282.0, 514.0, 1060.0, 2580.0, 7346.0, 23675.0, 88336.0, 371354.0, 412772.0, 99860.0, 26638.0, 7984.0, 2852.0, 1105.0, 525.0, 320.0, 178.0, 149.0, 88.0, 69.0, 44.0, 43.0, 27.0, 21.0, 17.0, 14.0, 8.0, 10.0, 3.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.89501953125, -18.1962890625, -17.49755859375, -16.798828125, -16.10009765625, -15.4013671875, -14.70263671875, -14.00390625, -13.30517578125, -12.6064453125, -11.90771484375, -11.208984375, -10.51025390625, -9.8115234375, -9.11279296875, -8.4140625, -7.71533203125, -7.0166015625, -6.31787109375, -5.619140625, -4.92041015625, -4.2216796875, -3.52294921875, -2.82421875, -2.12548828125, -1.4267578125, -0.72802734375, -0.029296875, 0.66943359375, 1.3681640625, 2.06689453125, 2.765625, 3.46435546875, 4.1630859375, 4.86181640625, 5.560546875, 6.25927734375, 6.9580078125, 7.65673828125, 8.35546875, 9.05419921875, 9.7529296875, 10.45166015625, 11.150390625, 11.84912109375, 12.5478515625, 13.24658203125, 13.9453125, 14.64404296875, 15.3427734375, 16.04150390625, 16.740234375, 17.43896484375, 18.1376953125, 18.83642578125, 19.53515625, 20.23388671875, 20.9326171875, 21.63134765625, 22.330078125, 23.02880859375, 23.7275390625, 24.42626953125, 25.125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 1.0, 5.0, 8.0, 13.0, 7.0, 24.0, 17.0, 14.0, 23.0, 27.0, 34.0, 35.0, 30.0, 31.0, 48.0, 50.0, 54.0, 90.0, 116.0, 209.0, 1470.0, 177.0, 88.0, 64.0, 54.0, 50.0, 38.0, 46.0, 29.0, 30.0, 28.0, 20.0, 16.0, 17.0, 23.0, 10.0, 6.0, 11.0, 16.0, 0.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-41.3125, -39.90234375, -38.4921875, -37.08203125, -35.671875, -34.26171875, -32.8515625, -31.44140625, -30.03125, -28.62109375, -27.2109375, -25.80078125, -24.390625, -22.98046875, -21.5703125, -20.16015625, -18.75, -17.33984375, -15.9296875, -14.51953125, -13.109375, -11.69921875, -10.2890625, -8.87890625, -7.46875, -6.05859375, -4.6484375, -3.23828125, -1.828125, -0.41796875, 0.9921875, 2.40234375, 3.8125, 5.22265625, 6.6328125, 8.04296875, 9.453125, 10.86328125, 12.2734375, 13.68359375, 15.09375, 16.50390625, 17.9140625, 19.32421875, 20.734375, 22.14453125, 23.5546875, 24.96484375, 26.375, 27.78515625, 29.1953125, 30.60546875, 32.015625, 33.42578125, 34.8359375, 36.24609375, 37.65625, 39.06640625, 40.4765625, 41.88671875, 43.296875, 44.70703125, 46.1171875, 47.52734375, 48.9375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 8.0, 0.0, 1.0, 4.0, 4.0, 9.0, 8.0, 13.0, 15.0, 14.0, 34.0, 41.0, 43.0, 67.0, 87.0, 122.0, 179.0, 246.0, 436.0, 850.0, 4000.0, 96791.0, 2953506.0, 83441.0, 3658.0, 812.0, 418.0, 235.0, 188.0, 136.0, 96.0, 67.0, 45.0, 41.0, 31.0, 16.0, 18.0, 8.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-63.96875, -61.64111328125, -59.3134765625, -56.98583984375, -54.658203125, -52.33056640625, -50.0029296875, -47.67529296875, -45.34765625, -43.02001953125, -40.6923828125, -38.36474609375, -36.037109375, -33.70947265625, -31.3818359375, -29.05419921875, -26.7265625, -24.39892578125, -22.0712890625, -19.74365234375, -17.416015625, -15.08837890625, -12.7607421875, -10.43310546875, -8.10546875, -5.77783203125, -3.4501953125, -1.12255859375, 1.205078125, 3.53271484375, 5.8603515625, 8.18798828125, 10.515625, 12.84326171875, 15.1708984375, 17.49853515625, 19.826171875, 22.15380859375, 24.4814453125, 26.80908203125, 29.13671875, 31.46435546875, 33.7919921875, 36.11962890625, 38.447265625, 40.77490234375, 43.1025390625, 45.43017578125, 47.7578125, 50.08544921875, 52.4130859375, 54.74072265625, 57.068359375, 59.39599609375, 61.7236328125, 64.05126953125, 66.37890625, 68.70654296875, 71.0341796875, 73.36181640625, 75.689453125, 78.01708984375, 80.3447265625, 82.67236328125, 85.0]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 29.0, 65.0, 130.0, 225.0, 231.0, 177.0, 72.0, 43.0, 19.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.59333801269531, -88.8408432006836, -86.0883560180664, -83.33586120605469, -80.5833740234375, -77.83087921142578, -75.0783920288086, -72.32589721679688, -69.57341003417969, -66.82091522216797, -64.06842803955078, -61.31593704223633, -58.563446044921875, -55.81095504760742, -53.05846405029297, -50.30596923828125, -47.5534782409668, -44.800987243652344, -42.04849624633789, -39.29600524902344, -36.543514251708984, -33.79102325439453, -31.038530349731445, -28.286039352416992, -25.53354835510254, -22.781057357788086, -20.028566360473633, -17.276073455810547, -14.52358341217041, -11.771092414855957, -9.018600463867188, -6.266109466552734, -3.5136184692382812, -0.761127233505249, 1.9913640022277832, 4.7438554763793945, 7.496346473693848, 10.2488374710083, 13.00132942199707, 15.753820419311523, 18.506311416625977, 21.25880241394043, 24.011293411254883, 26.76378631591797, 29.516277313232422, 32.268768310546875, 35.02125930786133, 37.77375030517578, 40.526241302490234, 43.27873229980469, 46.03122329711914, 48.783714294433594, 51.53620529174805, 54.2886962890625, 57.04119110107422, 59.793678283691406, 62.546173095703125, 65.29866790771484, 68.05115509033203, 70.80364990234375, 73.55613708496094, 76.30863189697266, 79.06111907958984, 81.81361389160156, 84.56610107421875]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 11.0, 9.0, 7.0, 10.0, 8.0, 13.0, 16.0, 19.0, 17.0, 16.0, 19.0, 32.0, 28.0, 28.0, 26.0, 25.0, 34.0, 27.0, 35.0, 33.0, 46.0, 36.0, 40.0, 34.0, 32.0, 41.0, 28.0, 39.0, 26.0, 24.0, 29.0, 27.0, 25.0, 23.0, 18.0, 17.0, 16.0, 9.0, 14.0, 10.0, 5.0, 4.0, 7.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0], "bins": [-100.16975402832031, -97.17277526855469, -94.1758041381836, -91.17882537841797, -88.18185424804688, -85.18487548828125, -82.18790435791016, -79.19092559814453, -76.19395446777344, -73.19697570800781, -70.20000457763672, -67.2030258178711, -64.2060546875, -61.20907974243164, -58.21210479736328, -55.215126037597656, -52.2181510925293, -49.22117614746094, -46.22420120239258, -43.22722625732422, -40.23025131225586, -37.2332763671875, -34.236297607421875, -31.23932456970215, -28.24234962463379, -25.24537467956543, -22.24839973449707, -19.251422882080078, -16.25444793701172, -13.257473945617676, -10.260498046875, -7.263523101806641, -4.266548156738281, -1.2695729732513428, 1.7274022102355957, 4.724377632141113, 7.721352577209473, 10.718327522277832, 13.715303421020508, 16.712278366088867, 19.709253311157227, 22.706228256225586, 25.703203201293945, 28.700180053710938, 31.697154998779297, 34.694129943847656, 37.691104888916016, 40.688079833984375, 43.685054779052734, 46.682029724121094, 49.67900466918945, 52.67597961425781, 55.67295455932617, 58.66992950439453, 61.666908264160156, 64.66387939453125, 67.66085815429688, 70.6578369140625, 73.6548080444336, 76.65178680419922, 79.64875793457031, 82.64573669433594, 85.64270782470703, 88.63968658447266, 91.63665771484375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 2.0, 9.0, 11.0, 16.0, 9.0, 12.0, 16.0, 22.0, 25.0, 24.0, 17.0, 27.0, 30.0, 35.0, 35.0, 35.0, 39.0, 46.0, 33.0, 43.0, 35.0, 59.0, 39.0, 25.0, 47.0, 35.0, 34.0, 27.0, 29.0, 28.0, 28.0, 25.0, 14.0, 20.0, 10.0, 10.0, 7.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-16.046875, -15.526611328125, -15.00634765625, -14.486083984375, -13.9658203125, -13.445556640625, -12.92529296875, -12.405029296875, -11.884765625, -11.364501953125, -10.84423828125, -10.323974609375, -9.8037109375, -9.283447265625, -8.76318359375, -8.242919921875, -7.72265625, -7.202392578125, -6.68212890625, -6.161865234375, -5.6416015625, -5.121337890625, -4.60107421875, -4.080810546875, -3.560546875, -3.040283203125, -2.52001953125, -1.999755859375, -1.4794921875, -0.959228515625, -0.43896484375, 0.081298828125, 0.6015625, 1.121826171875, 1.64208984375, 2.162353515625, 2.6826171875, 3.202880859375, 3.72314453125, 4.243408203125, 4.763671875, 5.283935546875, 5.80419921875, 6.324462890625, 6.8447265625, 7.364990234375, 7.88525390625, 8.405517578125, 8.92578125, 9.446044921875, 9.96630859375, 10.486572265625, 11.0068359375, 11.527099609375, 12.04736328125, 12.567626953125, 13.087890625, 13.608154296875, 14.12841796875, 14.648681640625, 15.1689453125, 15.689208984375, 16.20947265625, 16.729736328125, 17.25]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 15.0, 9.0, 7.0, 14.0, 8.0, 13.0, 9.0, 20.0, 23.0, 28.0, 30.0, 41.0, 55.0, 104.0, 159.0, 303.0, 782.0, 3461.0, 38287.0, 1175189.0, 2793801.0, 171675.0, 7754.0, 1331.0, 483.0, 201.0, 124.0, 83.0, 56.0, 34.0, 28.0, 24.0, 14.0, 12.0, 15.0, 14.0, 5.0, 11.0, 11.0, 7.0, 8.0, 8.0, 1.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-44.21875, -42.80224609375, -41.3857421875, -39.96923828125, -38.552734375, -37.13623046875, -35.7197265625, -34.30322265625, -32.88671875, -31.47021484375, -30.0537109375, -28.63720703125, -27.220703125, -25.80419921875, -24.3876953125, -22.97119140625, -21.5546875, -20.13818359375, -18.7216796875, -17.30517578125, -15.888671875, -14.47216796875, -13.0556640625, -11.63916015625, -10.22265625, -8.80615234375, -7.3896484375, -5.97314453125, -4.556640625, -3.14013671875, -1.7236328125, -0.30712890625, 1.109375, 2.52587890625, 3.9423828125, 5.35888671875, 6.775390625, 8.19189453125, 9.6083984375, 11.02490234375, 12.44140625, 13.85791015625, 15.2744140625, 16.69091796875, 18.107421875, 19.52392578125, 20.9404296875, 22.35693359375, 23.7734375, 25.18994140625, 26.6064453125, 28.02294921875, 29.439453125, 30.85595703125, 32.2724609375, 33.68896484375, 35.10546875, 36.52197265625, 37.9384765625, 39.35498046875, 40.771484375, 42.18798828125, 43.6044921875, 45.02099609375, 46.4375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 12.0, 14.0, 22.0, 34.0, 40.0, 67.0, 101.0, 153.0, 251.0, 394.0, 525.0, 624.0, 564.0, 405.0, 279.0, 181.0, 130.0, 71.0, 54.0, 38.0, 26.0, 15.0, 20.0, 12.0, 5.0, 2.0, 7.0, 9.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.546875, -25.706298828125, -24.86572265625, -24.025146484375, -23.1845703125, -22.343994140625, -21.50341796875, -20.662841796875, -19.822265625, -18.981689453125, -18.14111328125, -17.300537109375, -16.4599609375, -15.619384765625, -14.77880859375, -13.938232421875, -13.09765625, -12.257080078125, -11.41650390625, -10.575927734375, -9.7353515625, -8.894775390625, -8.05419921875, -7.213623046875, -6.373046875, -5.532470703125, -4.69189453125, -3.851318359375, -3.0107421875, -2.170166015625, -1.32958984375, -0.489013671875, 0.3515625, 1.192138671875, 2.03271484375, 2.873291015625, 3.7138671875, 4.554443359375, 5.39501953125, 6.235595703125, 7.076171875, 7.916748046875, 8.75732421875, 9.597900390625, 10.4384765625, 11.279052734375, 12.11962890625, 12.960205078125, 13.80078125, 14.641357421875, 15.48193359375, 16.322509765625, 17.1630859375, 18.003662109375, 18.84423828125, 19.684814453125, 20.525390625, 21.365966796875, 22.20654296875, 23.047119140625, 23.8876953125, 24.728271484375, 25.56884765625, 26.409423828125, 27.25]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 7.0, 12.0, 12.0, 17.0, 6.0, 34.0, 21.0, 31.0, 59.0, 66.0, 136.0, 210.0, 459.0, 948.0, 3058.0, 19211.0, 378256.0, 3614195.0, 161897.0, 11734.0, 2257.0, 720.0, 403.0, 186.0, 91.0, 66.0, 46.0, 30.0, 22.0, 16.0, 18.0, 7.0, 9.0, 6.0, 8.0, 6.0, 8.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.4375, -42.6865234375, -40.935546875, -39.1845703125, -37.43359375, -35.6826171875, -33.931640625, -32.1806640625, -30.4296875, -28.6787109375, -26.927734375, -25.1767578125, -23.42578125, -21.6748046875, -19.923828125, -18.1728515625, -16.421875, -14.6708984375, -12.919921875, -11.1689453125, -9.41796875, -7.6669921875, -5.916015625, -4.1650390625, -2.4140625, -0.6630859375, 1.087890625, 2.8388671875, 4.58984375, 6.3408203125, 8.091796875, 9.8427734375, 11.59375, 13.3447265625, 15.095703125, 16.8466796875, 18.59765625, 20.3486328125, 22.099609375, 23.8505859375, 25.6015625, 27.3525390625, 29.103515625, 30.8544921875, 32.60546875, 34.3564453125, 36.107421875, 37.8583984375, 39.609375, 41.3603515625, 43.111328125, 44.8623046875, 46.61328125, 48.3642578125, 50.115234375, 51.8662109375, 53.6171875, 55.3681640625, 57.119140625, 58.8701171875, 60.62109375, 62.3720703125, 64.123046875, 65.8740234375, 67.625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 59.0, 761.0, 193.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1019.1182250976562, -998.5784301757812, -978.0386352539062, -957.4988403320312, -936.9590454101562, -916.4192504882812, -895.8794555664062, -875.339599609375, -854.7998046875, -834.260009765625, -813.72021484375, -793.180419921875, -772.640625, -752.100830078125, -731.56103515625, -711.021240234375, -690.4814453125, -669.941650390625, -649.40185546875, -628.862060546875, -608.322265625, -587.782470703125, -567.24267578125, -546.702880859375, -526.1630859375, -505.623291015625, -485.08349609375, -464.543701171875, -444.00390625, -423.464111328125, -402.9242858886719, -382.3844909667969, -361.8446350097656, -341.3048400878906, -320.7650451660156, -300.2252502441406, -279.6854248046875, -259.1456298828125, -238.6058349609375, -218.0660400390625, -197.5262451171875, -176.9864501953125, -156.4466552734375, -135.90684509277344, -115.36705017089844, -94.82725524902344, -74.2874526977539, -53.747650146484375, -33.207855224609375, -12.66805648803711, 7.871742248535156, 28.411540985107422, 48.95133972167969, 69.49113464355469, 90.03093719482422, 110.57073974609375, 131.11053466796875, 151.65032958984375, 172.19012451171875, 192.7299346923828, 213.2697296142578, 233.8095245361328, 254.34933471679688, 274.8891296386719, 295.4289245605469]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 5.0, 4.0, 11.0, 7.0, 13.0, 14.0, 24.0, 23.0, 33.0, 30.0, 35.0, 39.0, 42.0, 40.0, 52.0, 32.0, 50.0, 32.0, 49.0, 55.0, 45.0, 41.0, 35.0, 27.0, 36.0, 27.0, 35.0, 22.0, 37.0, 19.0, 15.0, 19.0, 9.0, 3.0, 4.0, 7.0, 3.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-79.953857421875, -77.24220275878906, -74.53054809570312, -71.81889343261719, -69.10723876953125, -66.39558410644531, -63.68393325805664, -60.9722785949707, -58.260623931884766, -55.54896926879883, -52.83731460571289, -50.12566375732422, -47.41400909423828, -44.702354431152344, -41.990699768066406, -39.27904510498047, -36.56739044189453, -33.855735778808594, -31.144081115722656, -28.43242835998535, -25.720773696899414, -23.009119033813477, -20.297466278076172, -17.585811614990234, -14.874156951904297, -12.16250228881836, -9.450848579406738, -6.739194869995117, -4.02754020690918, -1.3158855438232422, 1.3957672119140625, 4.107421875, 6.8190765380859375, 9.530731201171875, 12.242384910583496, 14.954038619995117, 17.665693283081055, 20.377347946166992, 23.089000701904297, 25.800655364990234, 28.512310028076172, 31.22396469116211, 33.93561935424805, 36.64727020263672, 39.358924865722656, 42.070579528808594, 44.78223419189453, 47.49388885498047, 50.205543518066406, 52.917198181152344, 55.62885284423828, 58.34050750732422, 61.052162170410156, 63.763816833496094, 66.4754638671875, 69.18711853027344, 71.89877319335938, 74.61042785644531, 77.32208251953125, 80.03373718261719, 82.74539184570312, 85.45704650878906, 88.168701171875, 90.88035583496094, 93.59201049804688]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 7.0, 10.0, 10.0, 14.0, 16.0, 18.0, 19.0, 20.0, 28.0, 27.0, 23.0, 32.0, 30.0, 34.0, 44.0, 50.0, 44.0, 40.0, 47.0, 54.0, 47.0, 31.0, 31.0, 38.0, 41.0, 36.0, 25.0, 39.0, 27.0, 25.0, 20.0, 16.0, 9.0, 10.0, 7.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6015625, -15.0321044921875, -14.462646484375, -13.8931884765625, -13.32373046875, -12.7542724609375, -12.184814453125, -11.6153564453125, -11.0458984375, -10.4764404296875, -9.906982421875, -9.3375244140625, -8.76806640625, -8.1986083984375, -7.629150390625, -7.0596923828125, -6.490234375, -5.9207763671875, -5.351318359375, -4.7818603515625, -4.21240234375, -3.6429443359375, -3.073486328125, -2.5040283203125, -1.9345703125, -1.3651123046875, -0.795654296875, -0.2261962890625, 0.34326171875, 0.9127197265625, 1.482177734375, 2.0516357421875, 2.62109375, 3.1905517578125, 3.760009765625, 4.3294677734375, 4.89892578125, 5.4683837890625, 6.037841796875, 6.6072998046875, 7.1767578125, 7.7462158203125, 8.315673828125, 8.8851318359375, 9.45458984375, 10.0240478515625, 10.593505859375, 11.1629638671875, 11.732421875, 12.3018798828125, 12.871337890625, 13.4407958984375, 14.01025390625, 14.5797119140625, 15.149169921875, 15.7186279296875, 16.2880859375, 16.8575439453125, 17.427001953125, 17.9964599609375, 18.56591796875, 19.1353759765625, 19.704833984375, 20.2742919921875, 20.84375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 18.0, 29.0, 41.0, 52.0, 97.0, 136.0, 195.0, 287.0, 477.0, 757.0, 1226.0, 1944.0, 3019.0, 4914.0, 7651.0, 12494.0, 19813.0, 32059.0, 50939.0, 82554.0, 135408.0, 207521.0, 185569.0, 114507.0, 70118.0, 43938.0, 27316.0, 17107.0, 10636.0, 6531.0, 4010.0, 2643.0, 1630.0, 1017.0, 672.0, 443.0, 264.0, 155.0, 106.0, 98.0, 43.0, 40.0, 23.0, 18.0, 5.0, 6.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.79296875, -1.7348175048828125, -1.676666259765625, -1.6185150146484375, -1.56036376953125, -1.5022125244140625, -1.444061279296875, -1.3859100341796875, -1.3277587890625, -1.2696075439453125, -1.211456298828125, -1.1533050537109375, -1.09515380859375, -1.0370025634765625, -0.978851318359375, -0.9207000732421875, -0.862548828125, -0.8043975830078125, -0.746246337890625, -0.6880950927734375, -0.62994384765625, -0.5717926025390625, -0.513641357421875, -0.4554901123046875, -0.3973388671875, -0.3391876220703125, -0.281036376953125, -0.2228851318359375, -0.16473388671875, -0.1065826416015625, -0.048431396484375, 0.0097198486328125, 0.06787109375, 0.1260223388671875, 0.184173583984375, 0.2423248291015625, 0.30047607421875, 0.3586273193359375, 0.416778564453125, 0.4749298095703125, 0.5330810546875, 0.5912322998046875, 0.649383544921875, 0.7075347900390625, 0.76568603515625, 0.8238372802734375, 0.881988525390625, 0.9401397705078125, 0.998291015625, 1.0564422607421875, 1.114593505859375, 1.1727447509765625, 1.23089599609375, 1.2890472412109375, 1.347198486328125, 1.4053497314453125, 1.4635009765625, 1.5216522216796875, 1.579803466796875, 1.6379547119140625, 1.69610595703125, 1.7542572021484375, 1.812408447265625, 1.8705596923828125, 1.9287109375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 9.0, 14.0, 4.0, 19.0, 17.0, 17.0, 20.0, 25.0, 30.0, 24.0, 32.0, 31.0, 28.0, 35.0, 37.0, 44.0, 38.0, 1069.0, 48.0, 41.0, 50.0, 44.0, 42.0, 32.0, 37.0, 22.0, 27.0, 19.0, 14.0, 20.0, 15.0, 24.0, 12.0, 17.0, 10.0, 12.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.5390625, -11.1849365234375, -10.830810546875, -10.4766845703125, -10.12255859375, -9.7684326171875, -9.414306640625, -9.0601806640625, -8.7060546875, -8.3519287109375, -7.997802734375, -7.6436767578125, -7.28955078125, -6.9354248046875, -6.581298828125, -6.2271728515625, -5.873046875, -5.5189208984375, -5.164794921875, -4.8106689453125, -4.45654296875, -4.1024169921875, -3.748291015625, -3.3941650390625, -3.0400390625, -2.6859130859375, -2.331787109375, -1.9776611328125, -1.62353515625, -1.2694091796875, -0.915283203125, -0.5611572265625, -0.20703125, 0.1470947265625, 0.501220703125, 0.8553466796875, 1.20947265625, 1.5635986328125, 1.917724609375, 2.2718505859375, 2.6259765625, 2.9801025390625, 3.334228515625, 3.6883544921875, 4.04248046875, 4.3966064453125, 4.750732421875, 5.1048583984375, 5.458984375, 5.8131103515625, 6.167236328125, 6.5213623046875, 6.87548828125, 7.2296142578125, 7.583740234375, 7.9378662109375, 8.2919921875, 8.6461181640625, 9.000244140625, 9.3543701171875, 9.70849609375, 10.0626220703125, 10.416748046875, 10.7708740234375, 11.125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 8.0, 15.0, 22.0, 36.0, 54.0, 84.0, 114.0, 150.0, 245.0, 353.0, 518.0, 770.0, 1116.0, 1608.0, 2449.0, 3673.0, 5714.0, 8738.0, 13518.0, 20695.0, 32456.0, 50593.0, 81968.0, 133400.0, 1251260.0, 181547.0, 113372.0, 69447.0, 43763.0, 27603.0, 17788.0, 11434.0, 7704.0, 4922.0, 3400.0, 2141.0, 1428.0, 946.0, 677.0, 433.0, 300.0, 191.0, 143.0, 106.0, 59.0, 49.0, 36.0, 35.0, 10.0, 13.0, 4.0, 3.0, 8.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7646484375, -1.7092132568359375, -1.653778076171875, -1.5983428955078125, -1.54290771484375, -1.4874725341796875, -1.432037353515625, -1.3766021728515625, -1.3211669921875, -1.2657318115234375, -1.210296630859375, -1.1548614501953125, -1.09942626953125, -1.0439910888671875, -0.988555908203125, -0.9331207275390625, -0.877685546875, -0.8222503662109375, -0.766815185546875, -0.7113800048828125, -0.65594482421875, -0.6005096435546875, -0.545074462890625, -0.4896392822265625, -0.4342041015625, -0.3787689208984375, -0.323333740234375, -0.2678985595703125, -0.21246337890625, -0.1570281982421875, -0.101593017578125, -0.0461578369140625, 0.00927734375, 0.0647125244140625, 0.120147705078125, 0.1755828857421875, 0.23101806640625, 0.2864532470703125, 0.341888427734375, 0.3973236083984375, 0.4527587890625, 0.5081939697265625, 0.563629150390625, 0.6190643310546875, 0.67449951171875, 0.7299346923828125, 0.785369873046875, 0.8408050537109375, 0.896240234375, 0.9516754150390625, 1.007110595703125, 1.0625457763671875, 1.11798095703125, 1.1734161376953125, 1.228851318359375, 1.2842864990234375, 1.3397216796875, 1.3951568603515625, 1.450592041015625, 1.5060272216796875, 1.56146240234375, 1.6168975830078125, 1.672332763671875, 1.7277679443359375, 1.783203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 5.0, 5.0, 9.0, 4.0, 4.0, 7.0, 12.0, 23.0, 12.0, 9.0, 19.0, 20.0, 30.0, 35.0, 36.0, 51.0, 40.0, 51.0, 49.0, 55.0, 39.0, 49.0, 63.0, 42.0, 60.0, 37.0, 33.0, 37.0, 39.0, 21.0, 17.0, 20.0, 12.0, 10.0, 9.0, 9.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0033779144287109375, -0.0032731294631958008, -0.003168344497680664, -0.0030635595321655273, -0.0029587745666503906, -0.002853989601135254, -0.002749204635620117, -0.0026444196701049805, -0.0025396347045898438, -0.002434849739074707, -0.0023300647735595703, -0.0022252798080444336, -0.002120494842529297, -0.00201570987701416, -0.0019109249114990234, -0.0018061399459838867, -0.00170135498046875, -0.0015965700149536133, -0.0014917850494384766, -0.0013870000839233398, -0.0012822151184082031, -0.0011774301528930664, -0.0010726451873779297, -0.000967860221862793, -0.0008630752563476562, -0.0007582902908325195, -0.0006535053253173828, -0.0005487203598022461, -0.0004439353942871094, -0.00033915042877197266, -0.00023436546325683594, -0.00012958049774169922, -2.47955322265625e-05, 7.998943328857422e-05, 0.00018477439880371094, 0.00028955936431884766, 0.0003943443298339844, 0.0004991292953491211, 0.0006039142608642578, 0.0007086992263793945, 0.0008134841918945312, 0.000918269157409668, 0.0010230541229248047, 0.0011278390884399414, 0.0012326240539550781, 0.0013374090194702148, 0.0014421939849853516, 0.0015469789505004883, 0.001651763916015625, 0.0017565488815307617, 0.0018613338470458984, 0.001966118812561035, 0.002070903778076172, 0.0021756887435913086, 0.0022804737091064453, 0.002385258674621582, 0.0024900436401367188, 0.0025948286056518555, 0.002699613571166992, 0.002804398536682129, 0.0029091835021972656, 0.0030139684677124023, 0.003118753433227539, 0.0032235383987426758, 0.0033283233642578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 4.0, 6.0, 9.0, 8.0, 10.0, 17.0, 24.0, 27.0, 26.0, 37.0, 30.0, 68.0, 74.0, 104.0, 154.0, 219.0, 347.0, 710.0, 4900.0, 1029167.0, 10646.0, 743.0, 363.0, 229.0, 155.0, 103.0, 62.0, 53.0, 50.0, 44.0, 29.0, 17.0, 22.0, 20.0, 17.0, 8.0, 7.0, 5.0, 4.0, 4.0, 6.0, 2.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.072021484375, -0.0698099136352539, -0.06759834289550781, -0.06538677215576172, -0.06317520141601562, -0.06096363067626953, -0.05875205993652344, -0.056540489196777344, -0.05432891845703125, -0.052117347717285156, -0.04990577697753906, -0.04769420623779297, -0.045482635498046875, -0.04327106475830078, -0.04105949401855469, -0.038847923278808594, -0.0366363525390625, -0.034424781799316406, -0.03221321105957031, -0.03000164031982422, -0.027790069580078125, -0.02557849884033203, -0.023366928100585938, -0.021155357360839844, -0.01894378662109375, -0.016732215881347656, -0.014520645141601562, -0.012309074401855469, -0.010097503662109375, -0.007885932922363281, -0.0056743621826171875, -0.0034627914428710938, -0.001251220703125, 0.0009603500366210938, 0.0031719207763671875, 0.005383491516113281, 0.007595062255859375, 0.009806632995605469, 0.012018203735351562, 0.014229774475097656, 0.01644134521484375, 0.018652915954589844, 0.020864486694335938, 0.02307605743408203, 0.025287628173828125, 0.02749919891357422, 0.029710769653320312, 0.031922340393066406, 0.0341339111328125, 0.036345481872558594, 0.03855705261230469, 0.04076862335205078, 0.042980194091796875, 0.04519176483154297, 0.04740333557128906, 0.049614906311035156, 0.05182647705078125, 0.054038047790527344, 0.05624961853027344, 0.05846118927001953, 0.060672760009765625, 0.06288433074951172, 0.06509590148925781, 0.0673074722290039, 0.06951904296875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 4.0, 12.0, 33.0, 38.0, 71.0, 141.0, 181.0, 207.0, 135.0, 83.0, 46.0, 23.0, 13.0, 10.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002235602820292115, -0.0021529877558350563, -0.0020703724585473537, -0.001987757394090295, -0.001905142213217914, -0.0018225270323455334, -0.0017399118514731526, -0.001657296670600772, -0.001574681606143713, -0.0014920664252713323, -0.0014094512443989515, -0.0013268361799418926, -0.0012442209990695119, -0.0011616058181971312, -0.0010789906373247504, -0.0009963754564523697, -0.000913760275579989, -0.0008311450947076082, -0.0007485299720428884, -0.0006659147911705077, -0.0005832996685057878, -0.0005006844876334071, -0.0004180693067610264, -0.00033545418409630656, -0.00025283900322392583, -0.00017022385145537555, -8.760868513491005e-05, -4.993518814444542e-06, 7.762163295410573e-05, 0.000160236784722656, 0.00024285196559503675, 0.00032546708825975657, 0.0004080822691321373, 0.000490697450004518, 0.0005733125726692379, 0.0006559277535416186, 0.0007385428762063384, 0.0008211580570787191, 0.0009037732379510999, 0.0009863884188234806, 0.0010690034832805395, 0.0011516186641529202, 0.001234233845025301, 0.0013168489094823599, 0.0013994640903547406, 0.0014820792712271214, 0.001564694452099502, 0.0016473096329718828, 0.0017299248138442636, 0.0018125399947166443, 0.001895155175589025, 0.0019777703564614058, 0.0020603854209184647, 0.0021430007182061672, 0.002225615782663226, 0.002308230847120285, 0.0023908461444079876, 0.0024734612088650465, 0.002556076506152749, 0.002638691570609808, 0.0027213068678975105, 0.0028039219323545694, 0.0028865369968116283, 0.002969152294099331, 0.00305176735855639]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 1.0, 3.0, 8.0, 11.0, 5.0, 13.0, 14.0, 21.0, 13.0, 23.0, 31.0, 23.0, 36.0, 26.0, 36.0, 39.0, 40.0, 42.0, 40.0, 39.0, 36.0, 56.0, 31.0, 49.0, 44.0, 45.0, 34.0, 30.0, 33.0, 31.0, 21.0, 23.0, 17.0, 14.0, 14.0, 12.0, 11.0, 7.0, 6.0, 4.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018064379692077637, -0.0017452612519264221, -0.0016840845346450806, -0.001622907817363739, -0.0015617311000823975, -0.001500554382801056, -0.0014393776655197144, -0.0013782009482383728, -0.0013170242309570312, -0.0012558475136756897, -0.0011946707963943481, -0.0011334940791130066, -0.001072317361831665, -0.0010111406445503235, -0.0009499639272689819, -0.0008887872099876404, -0.0008276104927062988, -0.0007664337754249573, -0.0007052570581436157, -0.0006440803408622742, -0.0005829036235809326, -0.0005217269062995911, -0.0004605501890182495, -0.00039937347173690796, -0.0003381967544555664, -0.00027702003717422485, -0.0002158433198928833, -0.00015466660261154175, -9.34898853302002e-05, -3.231316804885864e-05, 2.886354923248291e-05, 9.004026651382446e-05, 0.00015121698379516602, 0.00021239370107650757, 0.0002735704183578491, 0.0003347471356391907, 0.0003959238529205322, 0.0004571005702018738, 0.0005182772874832153, 0.0005794540047645569, 0.0006406307220458984, 0.00070180743932724, 0.0007629841566085815, 0.0008241608738899231, 0.0008853375911712646, 0.0009465143084526062, 0.0010076910257339478, 0.0010688677430152893, 0.0011300444602966309, 0.0011912211775779724, 0.001252397894859314, 0.0013135746121406555, 0.001374751329421997, 0.0014359280467033386, 0.0014971047639846802, 0.0015582814812660217, 0.0016194581985473633, 0.0016806349158287048, 0.0017418116331100464, 0.001802988350391388, 0.0018641650676727295, 0.001925341784954071, 0.0019865185022354126, 0.002047695219516754, 0.0021088719367980957]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 7.0, 10.0, 10.0, 14.0, 16.0, 18.0, 19.0, 20.0, 28.0, 27.0, 23.0, 32.0, 30.0, 34.0, 44.0, 50.0, 44.0, 40.0, 47.0, 54.0, 47.0, 31.0, 31.0, 38.0, 41.0, 36.0, 25.0, 39.0, 27.0, 25.0, 20.0, 16.0, 9.0, 10.0, 7.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6015625, -15.0321044921875, -14.462646484375, -13.8931884765625, -13.32373046875, -12.7542724609375, -12.184814453125, -11.6153564453125, -11.0458984375, -10.4764404296875, -9.906982421875, -9.3375244140625, -8.76806640625, -8.1986083984375, -7.629150390625, -7.0596923828125, -6.490234375, -5.9207763671875, -5.351318359375, -4.7818603515625, -4.21240234375, -3.6429443359375, -3.073486328125, -2.5040283203125, -1.9345703125, -1.3651123046875, -0.795654296875, -0.2261962890625, 0.34326171875, 0.9127197265625, 1.482177734375, 2.0516357421875, 2.62109375, 3.1905517578125, 3.760009765625, 4.3294677734375, 4.89892578125, 5.4683837890625, 6.037841796875, 6.6072998046875, 7.1767578125, 7.7462158203125, 8.315673828125, 8.8851318359375, 9.45458984375, 10.0240478515625, 10.593505859375, 11.1629638671875, 11.732421875, 12.3018798828125, 12.871337890625, 13.4407958984375, 14.01025390625, 14.5797119140625, 15.149169921875, 15.7186279296875, 16.2880859375, 16.8575439453125, 17.427001953125, 17.9964599609375, 18.56591796875, 19.1353759765625, 19.704833984375, 20.2742919921875, 20.84375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 10.0, 15.0, 13.0, 19.0, 21.0, 45.0, 49.0, 67.0, 119.0, 148.0, 224.0, 291.0, 441.0, 746.0, 1417.0, 2995.0, 8406.0, 29566.0, 114989.0, 415936.0, 346452.0, 90317.0, 23543.0, 6829.0, 2567.0, 1244.0, 659.0, 446.0, 297.0, 182.0, 142.0, 97.0, 70.0, 52.0, 36.0, 34.0, 25.0, 16.0, 9.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.265625, -23.570556640625, -22.87548828125, -22.180419921875, -21.4853515625, -20.790283203125, -20.09521484375, -19.400146484375, -18.705078125, -18.010009765625, -17.31494140625, -16.619873046875, -15.9248046875, -15.229736328125, -14.53466796875, -13.839599609375, -13.14453125, -12.449462890625, -11.75439453125, -11.059326171875, -10.3642578125, -9.669189453125, -8.97412109375, -8.279052734375, -7.583984375, -6.888916015625, -6.19384765625, -5.498779296875, -4.8037109375, -4.108642578125, -3.41357421875, -2.718505859375, -2.0234375, -1.328369140625, -0.63330078125, 0.061767578125, 0.7568359375, 1.451904296875, 2.14697265625, 2.842041015625, 3.537109375, 4.232177734375, 4.92724609375, 5.622314453125, 6.3173828125, 7.012451171875, 7.70751953125, 8.402587890625, 9.09765625, 9.792724609375, 10.48779296875, 11.182861328125, 11.8779296875, 12.572998046875, 13.26806640625, 13.963134765625, 14.658203125, 15.353271484375, 16.04833984375, 16.743408203125, 17.4384765625, 18.133544921875, 18.82861328125, 19.523681640625, 20.21875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 11.0, 6.0, 6.0, 14.0, 14.0, 14.0, 25.0, 19.0, 25.0, 41.0, 38.0, 45.0, 49.0, 68.0, 81.0, 156.0, 1514.0, 349.0, 147.0, 77.0, 65.0, 57.0, 47.0, 34.0, 20.0, 26.0, 23.0, 17.0, 11.0, 19.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-67.4375, -65.560546875, -63.68359375, -61.806640625, -59.9296875, -58.052734375, -56.17578125, -54.298828125, -52.421875, -50.544921875, -48.66796875, -46.791015625, -44.9140625, -43.037109375, -41.16015625, -39.283203125, -37.40625, -35.529296875, -33.65234375, -31.775390625, -29.8984375, -28.021484375, -26.14453125, -24.267578125, -22.390625, -20.513671875, -18.63671875, -16.759765625, -14.8828125, -13.005859375, -11.12890625, -9.251953125, -7.375, -5.498046875, -3.62109375, -1.744140625, 0.1328125, 2.009765625, 3.88671875, 5.763671875, 7.640625, 9.517578125, 11.39453125, 13.271484375, 15.1484375, 17.025390625, 18.90234375, 20.779296875, 22.65625, 24.533203125, 26.41015625, 28.287109375, 30.1640625, 32.041015625, 33.91796875, 35.794921875, 37.671875, 39.548828125, 41.42578125, 43.302734375, 45.1796875, 47.056640625, 48.93359375, 50.810546875, 52.6875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 6.0, 7.0, 15.0, 13.0, 27.0, 22.0, 42.0, 48.0, 80.0, 87.0, 157.0, 184.0, 310.0, 589.0, 1714.0, 67706.0, 3043156.0, 28638.0, 1336.0, 511.0, 312.0, 203.0, 138.0, 111.0, 64.0, 61.0, 47.0, 28.0, 23.0, 20.0, 12.0, 15.0, 11.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.8125, -82.0244140625, -79.236328125, -76.4482421875, -73.66015625, -70.8720703125, -68.083984375, -65.2958984375, -62.5078125, -59.7197265625, -56.931640625, -54.1435546875, -51.35546875, -48.5673828125, -45.779296875, -42.9912109375, -40.203125, -37.4150390625, -34.626953125, -31.8388671875, -29.05078125, -26.2626953125, -23.474609375, -20.6865234375, -17.8984375, -15.1103515625, -12.322265625, -9.5341796875, -6.74609375, -3.9580078125, -1.169921875, 1.6181640625, 4.40625, 7.1943359375, 9.982421875, 12.7705078125, 15.55859375, 18.3466796875, 21.134765625, 23.9228515625, 26.7109375, 29.4990234375, 32.287109375, 35.0751953125, 37.86328125, 40.6513671875, 43.439453125, 46.2275390625, 49.015625, 51.8037109375, 54.591796875, 57.3798828125, 60.16796875, 62.9560546875, 65.744140625, 68.5322265625, 71.3203125, 74.1083984375, 76.896484375, 79.6845703125, 82.47265625, 85.2607421875, 88.048828125, 90.8369140625, 93.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 463.0, 554.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-455.4273986816406, -425.091064453125, -394.7547302246094, -364.41839599609375, -334.08209228515625, -303.7457580566406, -273.409423828125, -243.07310485839844, -212.7367706298828, -182.4004364013672, -152.06411743164062, -121.727783203125, -91.3914566040039, -61.05513000488281, -30.718795776367188, -0.382476806640625, 29.953857421875, 60.290184020996094, 90.62651062011719, 120.96284484863281, 151.29916381835938, 181.635498046875, 211.97183227539062, 242.3081512451172, 272.64447021484375, 302.9808044433594, 333.317138671875, 363.6534423828125, 393.9897766113281, 424.32611083984375, 454.6624450683594, 484.998779296875, 515.3351440429688, 545.6714477539062, 576.0078125, 606.3441162109375, 636.6804809570312, 667.0167846679688, 697.3531494140625, 727.689453125, 758.0257568359375, 788.362060546875, 818.6984252929688, 849.0347290039062, 879.37109375, 909.7073974609375, 940.043701171875, 970.3800659179688, 1000.7164306640625, 1031.052734375, 1061.3890380859375, 1091.7254638671875, 1122.061767578125, 1152.3980712890625, 1182.734375, 1213.0706787109375, 1243.406982421875, 1273.7432861328125, 1304.07958984375, 1334.416015625, 1364.7523193359375, 1395.088623046875, 1425.4249267578125, 1455.76123046875, 1486.09765625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 9.0, 7.0, 17.0, 21.0, 22.0, 29.0, 18.0, 23.0, 32.0, 28.0, 44.0, 30.0, 39.0, 38.0, 56.0, 32.0, 40.0, 33.0, 46.0, 48.0, 33.0, 47.0, 30.0, 37.0, 37.0, 26.0, 24.0, 24.0, 20.0, 23.0, 17.0, 11.0, 10.0, 5.0, 10.0, 4.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-144.21868896484375, -140.26858520507812, -136.3184814453125, -132.36837768554688, -128.41827392578125, -124.46817016601562, -120.51805877685547, -116.56795501708984, -112.61785125732422, -108.6677474975586, -104.71764373779297, -100.76753997802734, -96.81742858886719, -92.86732482910156, -88.91722106933594, -84.96711730957031, -81.01701354980469, -77.06690979003906, -73.11680603027344, -69.16670227050781, -65.21659851074219, -61.2664909362793, -57.316383361816406, -53.36627960205078, -49.416175842285156, -45.46607208251953, -41.515968322753906, -37.565860748291016, -33.61575698852539, -29.665653228759766, -25.715547561645508, -21.76544189453125, -17.815338134765625, -13.865233421325684, -9.915128707885742, -5.965023994445801, -2.0149192810058594, 1.9351844787597656, 5.885290145874023, 9.835395812988281, 13.785499572753906, 17.73560333251953, 21.68570899963379, 25.635814666748047, 29.585918426513672, 33.5360221862793, 37.48612976074219, 41.43623352050781, 45.38633728027344, 49.33644104003906, 53.28654479980469, 57.23665237426758, 61.1867561340332, 65.13685607910156, 69.08696746826172, 73.03707122802734, 76.98717498779297, 80.9372787475586, 84.88738250732422, 88.83748626708984, 92.78759765625, 96.73770141601562, 100.68780517578125, 104.63790893554688, 108.5880126953125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 10.0, 4.0, 9.0, 8.0, 8.0, 15.0, 8.0, 20.0, 16.0, 21.0, 24.0, 24.0, 26.0, 25.0, 33.0, 29.0, 26.0, 35.0, 33.0, 52.0, 34.0, 41.0, 40.0, 33.0, 54.0, 34.0, 37.0, 36.0, 24.0, 27.0, 34.0, 30.0, 24.0, 30.0, 19.0, 13.0, 13.0, 15.0, 9.0, 6.0, 2.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6953125, -14.1815185546875, -13.667724609375, -13.1539306640625, -12.64013671875, -12.1263427734375, -11.612548828125, -11.0987548828125, -10.5849609375, -10.0711669921875, -9.557373046875, -9.0435791015625, -8.52978515625, -8.0159912109375, -7.502197265625, -6.9884033203125, -6.474609375, -5.9608154296875, -5.447021484375, -4.9332275390625, -4.41943359375, -3.9056396484375, -3.391845703125, -2.8780517578125, -2.3642578125, -1.8504638671875, -1.336669921875, -0.8228759765625, -0.30908203125, 0.2047119140625, 0.718505859375, 1.2322998046875, 1.74609375, 2.2598876953125, 2.773681640625, 3.2874755859375, 3.80126953125, 4.3150634765625, 4.828857421875, 5.3426513671875, 5.8564453125, 6.3702392578125, 6.884033203125, 7.3978271484375, 7.91162109375, 8.4254150390625, 8.939208984375, 9.4530029296875, 9.966796875, 10.4805908203125, 10.994384765625, 11.5081787109375, 12.02197265625, 12.5357666015625, 13.049560546875, 13.5633544921875, 14.0771484375, 14.5909423828125, 15.104736328125, 15.6185302734375, 16.13232421875, 16.6461181640625, 17.159912109375, 17.6737060546875, 18.1875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 14.0, 8.0, 12.0, 15.0, 13.0, 16.0, 25.0, 31.0, 43.0, 41.0, 58.0, 80.0, 110.0, 157.0, 176.0, 224.0, 306.0, 383.0, 713.0, 2102068.0, 2087353.0, 662.0, 405.0, 318.0, 212.0, 174.0, 152.0, 119.0, 66.0, 72.0, 46.0, 44.0, 23.0, 22.0, 16.0, 15.0, 13.0, 11.0, 15.0, 9.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-379.25, -367.3984375, -355.546875, -343.6953125, -331.84375, -319.9921875, -308.140625, -296.2890625, -284.4375, -272.5859375, -260.734375, -248.8828125, -237.03125, -225.1796875, -213.328125, -201.4765625, -189.625, -177.7734375, -165.921875, -154.0703125, -142.21875, -130.3671875, -118.515625, -106.6640625, -94.8125, -82.9609375, -71.109375, -59.2578125, -47.40625, -35.5546875, -23.703125, -11.8515625, 0.0, 11.8515625, 23.703125, 35.5546875, 47.40625, 59.2578125, 71.109375, 82.9609375, 94.8125, 106.6640625, 118.515625, 130.3671875, 142.21875, 154.0703125, 165.921875, 177.7734375, 189.625, 201.4765625, 213.328125, 225.1796875, 237.03125, 248.8828125, 260.734375, 272.5859375, 284.4375, 296.2890625, 308.140625, 319.9921875, 331.84375, 343.6953125, 355.546875, 367.3984375, 379.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 8.0, 5.0, 20.0, 25.0, 25.0, 39.0, 67.0, 103.0, 166.0, 253.0, 498.0, 801.0, 767.0, 527.0, 313.0, 153.0, 98.0, 66.0, 44.0, 32.0, 16.0, 16.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.90625, -33.7431640625, -32.580078125, -31.4169921875, -30.25390625, -29.0908203125, -27.927734375, -26.7646484375, -25.6015625, -24.4384765625, -23.275390625, -22.1123046875, -20.94921875, -19.7861328125, -18.623046875, -17.4599609375, -16.296875, -15.1337890625, -13.970703125, -12.8076171875, -11.64453125, -10.4814453125, -9.318359375, -8.1552734375, -6.9921875, -5.8291015625, -4.666015625, -3.5029296875, -2.33984375, -1.1767578125, -0.013671875, 1.1494140625, 2.3125, 3.4755859375, 4.638671875, 5.8017578125, 6.96484375, 8.1279296875, 9.291015625, 10.4541015625, 11.6171875, 12.7802734375, 13.943359375, 15.1064453125, 16.26953125, 17.4326171875, 18.595703125, 19.7587890625, 20.921875, 22.0849609375, 23.248046875, 24.4111328125, 25.57421875, 26.7373046875, 27.900390625, 29.0634765625, 30.2265625, 31.3896484375, 32.552734375, 33.7158203125, 34.87890625, 36.0419921875, 37.205078125, 38.3681640625, 39.53125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 1.0, 5.0, 1.0, 7.0, 5.0, 10.0, 7.0, 12.0, 14.0, 13.0, 21.0, 28.0, 29.0, 30.0, 39.0, 41.0, 55.0, 79.0, 121.0, 474.0, 6109.0, 4128247.0, 57385.0, 896.0, 200.0, 88.0, 54.0, 49.0, 44.0, 35.0, 22.0, 22.0, 24.0, 20.0, 19.0, 13.0, 4.0, 12.0, 9.0, 10.0, 5.0, 6.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-178.625, -172.607421875, -166.58984375, -160.572265625, -154.5546875, -148.537109375, -142.51953125, -136.501953125, -130.484375, -124.466796875, -118.44921875, -112.431640625, -106.4140625, -100.396484375, -94.37890625, -88.361328125, -82.34375, -76.326171875, -70.30859375, -64.291015625, -58.2734375, -52.255859375, -46.23828125, -40.220703125, -34.203125, -28.185546875, -22.16796875, -16.150390625, -10.1328125, -4.115234375, 1.90234375, 7.919921875, 13.9375, 19.955078125, 25.97265625, 31.990234375, 38.0078125, 44.025390625, 50.04296875, 56.060546875, 62.078125, 68.095703125, 74.11328125, 80.130859375, 86.1484375, 92.166015625, 98.18359375, 104.201171875, 110.21875, 116.236328125, 122.25390625, 128.271484375, 134.2890625, 140.306640625, 146.32421875, 152.341796875, 158.359375, 164.376953125, 170.39453125, 176.412109375, 182.4296875, 188.447265625, 194.46484375, 200.482421875, 206.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 11.0, 338.0, 623.0, 40.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1047.48828125, -1027.42041015625, -1007.3526611328125, -987.2847900390625, -967.2169799804688, -947.149169921875, -927.0813598632812, -907.0135498046875, -886.9456787109375, -866.8778686523438, -846.81005859375, -826.7421875, -806.6743774414062, -786.6065673828125, -766.5387573242188, -746.470947265625, -726.403076171875, -706.3352661132812, -686.2674560546875, -666.1995849609375, -646.1317749023438, -626.06396484375, -605.9961547851562, -585.9283447265625, -565.8605346679688, -545.792724609375, -525.7249145507812, -505.6570739746094, -485.5892333984375, -465.52142333984375, -445.45361328125, -425.3857727050781, -405.31793212890625, -385.2501220703125, -365.1822814941406, -345.1144714355469, -325.046630859375, -304.97882080078125, -284.9110107421875, -264.8431701660156, -244.77536010742188, -224.70753479003906, -204.63970947265625, -184.5718994140625, -164.50405883789062, -144.43624877929688, -124.36842346191406, -104.30059814453125, -84.23277282714844, -64.16494750976562, -44.09712600708008, -24.02930450439453, -3.9614791870117188, 16.106346130371094, 36.174163818359375, 56.24198913574219, 76.309814453125, 96.37763977050781, 116.44546508789062, 136.51327514648438, 156.58111572265625, 176.64892578125, 196.7167510986328, 216.78457641601562, 236.85240173339844]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 3.0, 7.0, 7.0, 12.0, 25.0, 17.0, 14.0, 22.0, 13.0, 23.0, 25.0, 33.0, 21.0, 33.0, 28.0, 40.0, 30.0, 29.0, 32.0, 37.0, 37.0, 42.0, 41.0, 31.0, 40.0, 34.0, 40.0, 38.0, 37.0, 20.0, 23.0, 14.0, 26.0, 18.0, 20.0, 12.0, 10.0, 15.0, 6.0, 6.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-78.3214340209961, -75.7307357788086, -73.14002990722656, -70.54933166503906, -67.95863342285156, -65.36792755126953, -62.77722930908203, -60.186527252197266, -57.5958251953125, -55.005123138427734, -52.41442108154297, -49.82372283935547, -47.2330207824707, -44.64231872558594, -42.05162048339844, -39.46091842651367, -36.870216369628906, -34.27951431274414, -31.688814163208008, -29.098114013671875, -26.50741195678711, -23.916709899902344, -21.32600975036621, -18.735309600830078, -16.144607543945312, -13.553906440734863, -10.963205337524414, -8.372504234313965, -5.781803131103516, -3.1911020278930664, -0.6004009246826172, 1.9902992248535156, 4.58099365234375, 7.171694755554199, 9.762395858764648, 12.353096961975098, 14.943798065185547, 17.534500122070312, 20.125200271606445, 22.715900421142578, 25.306602478027344, 27.89730453491211, 30.488004684448242, 33.078704833984375, 35.66940689086914, 38.260108947753906, 40.850807189941406, 43.44150924682617, 46.03221130371094, 48.6229133605957, 51.21361541748047, 53.80431365966797, 56.395015716552734, 58.9857177734375, 61.576416015625, 64.1671142578125, 66.75782012939453, 69.34851837158203, 71.93922424316406, 74.52992248535156, 77.12062072753906, 79.7113265991211, 82.3020248413086, 84.89273071289062, 87.48342895507812]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 3.0, 9.0, 9.0, 8.0, 16.0, 14.0, 13.0, 13.0, 26.0, 13.0, 11.0, 25.0, 30.0, 36.0, 31.0, 20.0, 34.0, 40.0, 41.0, 40.0, 52.0, 51.0, 42.0, 47.0, 40.0, 38.0, 45.0, 22.0, 33.0, 32.0, 22.0, 25.0, 17.0, 16.0, 16.0, 16.0, 18.0, 5.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.3671875, -14.8199462890625, -14.272705078125, -13.7254638671875, -13.17822265625, -12.6309814453125, -12.083740234375, -11.5364990234375, -10.9892578125, -10.4420166015625, -9.894775390625, -9.3475341796875, -8.80029296875, -8.2530517578125, -7.705810546875, -7.1585693359375, -6.611328125, -6.0640869140625, -5.516845703125, -4.9696044921875, -4.42236328125, -3.8751220703125, -3.327880859375, -2.7806396484375, -2.2333984375, -1.6861572265625, -1.138916015625, -0.5916748046875, -0.04443359375, 0.5028076171875, 1.050048828125, 1.5972900390625, 2.14453125, 2.6917724609375, 3.239013671875, 3.7862548828125, 4.33349609375, 4.8807373046875, 5.427978515625, 5.9752197265625, 6.5224609375, 7.0697021484375, 7.616943359375, 8.1641845703125, 8.71142578125, 9.2586669921875, 9.805908203125, 10.3531494140625, 10.900390625, 11.4476318359375, 11.994873046875, 12.5421142578125, 13.08935546875, 13.6365966796875, 14.183837890625, 14.7310791015625, 15.2783203125, 15.8255615234375, 16.372802734375, 16.9200439453125, 17.46728515625, 18.0145263671875, 18.561767578125, 19.1090087890625, 19.65625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 10.0, 12.0, 33.0, 34.0, 44.0, 94.0, 110.0, 197.0, 348.0, 555.0, 909.0, 1525.0, 2519.0, 4152.0, 6896.0, 11399.0, 18994.0, 31915.0, 55294.0, 96999.0, 177853.0, 260383.0, 163667.0, 89685.0, 51210.0, 29557.0, 17569.0, 10411.0, 6389.0, 3793.0, 2321.0, 1327.0, 904.0, 510.0, 321.0, 198.0, 164.0, 88.0, 52.0, 42.0, 21.0, 21.0, 9.0, 5.0, 1.0, 3.0, 4.0, 3.0], "bins": [-2.6328125, -2.562469482421875, -2.49212646484375, -2.421783447265625, -2.3514404296875, -2.281097412109375, -2.21075439453125, -2.140411376953125, -2.070068359375, -1.999725341796875, -1.92938232421875, -1.859039306640625, -1.7886962890625, -1.718353271484375, -1.64801025390625, -1.577667236328125, -1.50732421875, -1.436981201171875, -1.36663818359375, -1.296295166015625, -1.2259521484375, -1.155609130859375, -1.08526611328125, -1.014923095703125, -0.944580078125, -0.874237060546875, -0.80389404296875, -0.733551025390625, -0.6632080078125, -0.592864990234375, -0.52252197265625, -0.452178955078125, -0.3818359375, -0.311492919921875, -0.24114990234375, -0.170806884765625, -0.1004638671875, -0.030120849609375, 0.04022216796875, 0.110565185546875, 0.180908203125, 0.251251220703125, 0.32159423828125, 0.391937255859375, 0.4622802734375, 0.532623291015625, 0.60296630859375, 0.673309326171875, 0.74365234375, 0.813995361328125, 0.88433837890625, 0.954681396484375, 1.0250244140625, 1.095367431640625, 1.16571044921875, 1.236053466796875, 1.306396484375, 1.376739501953125, 1.44708251953125, 1.517425537109375, 1.5877685546875, 1.658111572265625, 1.72845458984375, 1.798797607421875, 1.869140625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 2.0, 8.0, 12.0, 13.0, 11.0, 6.0, 14.0, 18.0, 11.0, 20.0, 18.0, 32.0, 32.0, 27.0, 28.0, 31.0, 36.0, 45.0, 51.0, 51.0, 35.0, 1061.0, 40.0, 36.0, 43.0, 34.0, 27.0, 38.0, 21.0, 29.0, 18.0, 23.0, 26.0, 17.0, 22.0, 17.0, 21.0, 10.0, 11.0, 3.0, 2.0, 3.0, 6.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.8736572265625, -9.536376953125, -9.1990966796875, -8.86181640625, -8.5245361328125, -8.187255859375, -7.8499755859375, -7.5126953125, -7.1754150390625, -6.838134765625, -6.5008544921875, -6.16357421875, -5.8262939453125, -5.489013671875, -5.1517333984375, -4.814453125, -4.4771728515625, -4.139892578125, -3.8026123046875, -3.46533203125, -3.1280517578125, -2.790771484375, -2.4534912109375, -2.1162109375, -1.7789306640625, -1.441650390625, -1.1043701171875, -0.76708984375, -0.4298095703125, -0.092529296875, 0.2447509765625, 0.58203125, 0.9193115234375, 1.256591796875, 1.5938720703125, 1.93115234375, 2.2684326171875, 2.605712890625, 2.9429931640625, 3.2802734375, 3.6175537109375, 3.954833984375, 4.2921142578125, 4.62939453125, 4.9666748046875, 5.303955078125, 5.6412353515625, 5.978515625, 6.3157958984375, 6.653076171875, 6.9903564453125, 7.32763671875, 7.6649169921875, 8.002197265625, 8.3394775390625, 8.6767578125, 9.0140380859375, 9.351318359375, 9.6885986328125, 10.02587890625, 10.3631591796875, 10.700439453125, 11.0377197265625, 11.375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 6.0, 15.0, 21.0, 40.0, 57.0, 77.0, 138.0, 193.0, 268.0, 433.0, 695.0, 1003.0, 1523.0, 2464.0, 3794.0, 6051.0, 9529.0, 14653.0, 22967.0, 36276.0, 58010.0, 93580.0, 154476.0, 1265854.0, 162086.0, 97685.0, 60487.0, 38058.0, 24026.0, 15273.0, 9950.0, 6044.0, 4058.0, 2600.0, 1699.0, 1029.0, 719.0, 449.0, 277.0, 212.0, 104.0, 79.0, 56.0, 40.0, 26.0, 16.0, 12.0, 7.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-1.9267578125, -1.86932373046875, -1.8118896484375, -1.75445556640625, -1.697021484375, -1.63958740234375, -1.5821533203125, -1.52471923828125, -1.46728515625, -1.40985107421875, -1.3524169921875, -1.29498291015625, -1.237548828125, -1.18011474609375, -1.1226806640625, -1.06524658203125, -1.0078125, -0.95037841796875, -0.8929443359375, -0.83551025390625, -0.778076171875, -0.72064208984375, -0.6632080078125, -0.60577392578125, -0.54833984375, -0.49090576171875, -0.4334716796875, -0.37603759765625, -0.318603515625, -0.26116943359375, -0.2037353515625, -0.14630126953125, -0.0888671875, -0.03143310546875, 0.0260009765625, 0.08343505859375, 0.140869140625, 0.19830322265625, 0.2557373046875, 0.31317138671875, 0.37060546875, 0.42803955078125, 0.4854736328125, 0.54290771484375, 0.600341796875, 0.65777587890625, 0.7152099609375, 0.77264404296875, 0.830078125, 0.88751220703125, 0.9449462890625, 1.00238037109375, 1.059814453125, 1.11724853515625, 1.1746826171875, 1.23211669921875, 1.28955078125, 1.34698486328125, 1.4044189453125, 1.46185302734375, 1.519287109375, 1.57672119140625, 1.6341552734375, 1.69158935546875, 1.7490234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 6.0, 5.0, 7.0, 9.0, 15.0, 18.0, 20.0, 25.0, 20.0, 31.0, 40.0, 53.0, 71.0, 88.0, 93.0, 72.0, 58.0, 67.0, 60.0, 42.0, 38.0, 24.0, 25.0, 22.0, 18.0, 11.0, 14.0, 8.0, 4.0, 11.0, 6.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004520416259765625, -0.004369974136352539, -0.004219532012939453, -0.004069089889526367, -0.003918647766113281, -0.0037682056427001953, -0.0036177635192871094, -0.0034673213958740234, -0.0033168792724609375, -0.0031664371490478516, -0.0030159950256347656, -0.0028655529022216797, -0.0027151107788085938, -0.002564668655395508, -0.002414226531982422, -0.002263784408569336, -0.00211334228515625, -0.001962900161743164, -0.0018124580383300781, -0.0016620159149169922, -0.0015115737915039062, -0.0013611316680908203, -0.0012106895446777344, -0.0010602474212646484, -0.0009098052978515625, -0.0007593631744384766, -0.0006089210510253906, -0.0004584789276123047, -0.00030803680419921875, -0.0001575946807861328, -7.152557373046875e-06, 0.00014328956604003906, 0.000293731689453125, 0.00044417381286621094, 0.0005946159362792969, 0.0007450580596923828, 0.0008955001831054688, 0.0010459423065185547, 0.0011963844299316406, 0.0013468265533447266, 0.0014972686767578125, 0.0016477108001708984, 0.0017981529235839844, 0.0019485950469970703, 0.0020990371704101562, 0.002249479293823242, 0.002399921417236328, 0.002550363540649414, 0.0027008056640625, 0.002851247787475586, 0.003001689910888672, 0.003152132034301758, 0.0033025741577148438, 0.0034530162811279297, 0.0036034584045410156, 0.0037539005279541016, 0.0039043426513671875, 0.0040547847747802734, 0.004205226898193359, 0.004355669021606445, 0.004506111145019531, 0.004656553268432617, 0.004806995391845703, 0.004957437515258789, 0.005107879638671875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 3.0, 6.0, 2.0, 11.0, 13.0, 18.0, 17.0, 27.0, 34.0, 53.0, 65.0, 99.0, 112.0, 201.0, 334.0, 538.0, 1192.0, 875687.0, 167682.0, 1067.0, 507.0, 279.0, 171.0, 109.0, 81.0, 65.0, 37.0, 35.0, 21.0, 22.0, 9.0, 7.0, 10.0, 8.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09857177734375, -0.09566593170166016, -0.09276008605957031, -0.08985424041748047, -0.08694839477539062, -0.08404254913330078, -0.08113670349121094, -0.0782308578491211, -0.07532501220703125, -0.0724191665649414, -0.06951332092285156, -0.06660747528076172, -0.06370162963867188, -0.06079578399658203, -0.05788993835449219, -0.054984092712402344, -0.0520782470703125, -0.049172401428222656, -0.04626655578613281, -0.04336071014404297, -0.040454864501953125, -0.03754901885986328, -0.03464317321777344, -0.031737327575683594, -0.02883148193359375, -0.025925636291503906, -0.023019790649414062, -0.02011394500732422, -0.017208099365234375, -0.014302253723144531, -0.011396408081054688, -0.008490562438964844, -0.005584716796875, -0.0026788711547851562, 0.0002269744873046875, 0.0031328201293945312, 0.006038665771484375, 0.008944511413574219, 0.011850357055664062, 0.014756202697753906, 0.01766204833984375, 0.020567893981933594, 0.023473739624023438, 0.02637958526611328, 0.029285430908203125, 0.03219127655029297, 0.03509712219238281, 0.038002967834472656, 0.0409088134765625, 0.043814659118652344, 0.04672050476074219, 0.04962635040283203, 0.052532196044921875, 0.05543804168701172, 0.05834388732910156, 0.061249732971191406, 0.06415557861328125, 0.0670614242553711, 0.06996726989746094, 0.07287311553955078, 0.07577896118164062, 0.07868480682373047, 0.08159065246582031, 0.08449649810791016, 0.08740234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 12.0, 27.0, 64.0, 159.0, 303.0, 250.0, 129.0, 38.0, 19.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0023831615690141916, -0.0022629122249782085, -0.002142663113772869, -0.0020224140025675297, -0.0019021646585315466, -0.0017819154309108853, -0.001661666203290224, -0.0015414169756695628, -0.0014211677480489016, -0.0013009185204282403, -0.001180669292807579, -0.0010604200651869178, -0.0009401708375662565, -0.0008199216099455953, -0.000699672382324934, -0.0005794231547042727, -0.0004591739270836115, -0.00033892469946295023, -0.00021867547184228897, -9.842624422162771e-05, 2.1822983399033546e-05, 0.0001420722110196948, 0.00026232143864035606, 0.0003825706662610173, 0.0005028198938816786, 0.0006230691215023398, 0.0007433183491230011, 0.0008635675767436624, 0.0009838168043643236, 0.0011040660319849849, 0.0012243152596056461, 0.0013445644872263074, 0.001464813482016325, 0.0015850627096369863, 0.0017053119372576475, 0.0018255611648783088, 0.00194581039249897, 0.0020660595037043095, 0.0021863088477402925, 0.0023065581917762756, 0.002426807302981615, 0.0025470564141869545, 0.0026673057582229376, 0.0027875551022589207, 0.00290780421346426, 0.0030280533246695995, 0.0031483026687055826, 0.0032685520127415657, 0.003388801123946905, 0.0035090502351522446, 0.0036292995791882277, 0.0037495489232242107, 0.00386979803442955, 0.00399004714563489, 0.004110296256840229, 0.004230545833706856, 0.004350794944912195, 0.004471044056117535, 0.004591293632984161, 0.004711542744189501, 0.00483179185539484, 0.00495204096660018, 0.005072290077805519, 0.005192539654672146, 0.005312788765877485]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 3.0, 2.0, 11.0, 9.0, 10.0, 13.0, 14.0, 19.0, 22.0, 24.0, 33.0, 36.0, 36.0, 39.0, 43.0, 42.0, 56.0, 38.0, 37.0, 35.0, 49.0, 51.0, 44.0, 37.0, 39.0, 37.0, 34.0, 29.0, 22.0, 23.0, 21.0, 13.0, 14.0, 18.0, 11.0, 8.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0024521350860595703, -0.002376510761678219, -0.0023008864372968674, -0.002225262112915516, -0.0021496377885341644, -0.002074013464152813, -0.0019983891397714615, -0.00192276481539011, -0.0018471404910087585, -0.001771516166627407, -0.0016958918422460556, -0.0016202675178647041, -0.0015446431934833527, -0.0014690188691020012, -0.0013933945447206497, -0.0013177702203392982, -0.0012421458959579468, -0.0011665215715765953, -0.0010908972471952438, -0.0010152729228138924, -0.0009396485984325409, -0.0008640242740511894, -0.000788399949669838, -0.0007127756252884865, -0.000637151300907135, -0.0005615269765257835, -0.00048590265214443207, -0.0004102783277630806, -0.0003346540033817291, -0.00025902967900037766, -0.00018340535461902618, -0.00010778103023767471, -3.215670585632324e-05, 4.346761852502823e-05, 0.0001190919429063797, 0.00019471626728773117, 0.00027034059166908264, 0.0003459649160504341, 0.0004215892404317856, 0.0004972135648131371, 0.0005728378891944885, 0.00064846221357584, 0.0007240865379571915, 0.0007997108623385429, 0.0008753351867198944, 0.0009509595111012459, 0.0010265838354825974, 0.0011022081598639488, 0.0011778324842453003, 0.0012534568086266518, 0.0013290811330080032, 0.0014047054573893547, 0.0014803297817707062, 0.0015559541061520576, 0.0016315784305334091, 0.0017072027549147606, 0.001782827079296112, 0.0018584514036774635, 0.001934075728058815, 0.0020097000524401665, 0.002085324376821518, 0.0021609487012028694, 0.002236573025584221, 0.0023121973499655724, 0.002387821674346924]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 3.0, 9.0, 9.0, 8.0, 16.0, 14.0, 13.0, 13.0, 26.0, 13.0, 11.0, 25.0, 30.0, 36.0, 31.0, 20.0, 34.0, 40.0, 41.0, 40.0, 52.0, 51.0, 42.0, 47.0, 40.0, 38.0, 45.0, 22.0, 33.0, 32.0, 22.0, 25.0, 17.0, 16.0, 16.0, 16.0, 18.0, 5.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.3671875, -14.8199462890625, -14.272705078125, -13.7254638671875, -13.17822265625, -12.6309814453125, -12.083740234375, -11.5364990234375, -10.9892578125, -10.4420166015625, -9.894775390625, -9.3475341796875, -8.80029296875, -8.2530517578125, -7.705810546875, -7.1585693359375, -6.611328125, -6.0640869140625, -5.516845703125, -4.9696044921875, -4.42236328125, -3.8751220703125, -3.327880859375, -2.7806396484375, -2.2333984375, -1.6861572265625, -1.138916015625, -0.5916748046875, -0.04443359375, 0.5028076171875, 1.050048828125, 1.5972900390625, 2.14453125, 2.6917724609375, 3.239013671875, 3.7862548828125, 4.33349609375, 4.8807373046875, 5.427978515625, 5.9752197265625, 6.5224609375, 7.0697021484375, 7.616943359375, 8.1641845703125, 8.71142578125, 9.2586669921875, 9.805908203125, 10.3531494140625, 10.900390625, 11.4476318359375, 11.994873046875, 12.5421142578125, 13.08935546875, 13.6365966796875, 14.183837890625, 14.7310791015625, 15.2783203125, 15.8255615234375, 16.372802734375, 16.9200439453125, 17.46728515625, 18.0145263671875, 18.561767578125, 19.1090087890625, 19.65625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 9.0, 3.0, 10.0, 26.0, 27.0, 35.0, 49.0, 66.0, 91.0, 147.0, 185.0, 208.0, 294.0, 416.0, 521.0, 692.0, 886.0, 1257.0, 2200.0, 6319.0, 34176.0, 239808.0, 598574.0, 132994.0, 19023.0, 4206.0, 1818.0, 1081.0, 844.0, 663.0, 487.0, 393.0, 282.0, 221.0, 136.0, 121.0, 96.0, 49.0, 44.0, 32.0, 16.0, 10.0, 11.0, 14.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.1875, -28.25634765625, -27.3251953125, -26.39404296875, -25.462890625, -24.53173828125, -23.6005859375, -22.66943359375, -21.73828125, -20.80712890625, -19.8759765625, -18.94482421875, -18.013671875, -17.08251953125, -16.1513671875, -15.22021484375, -14.2890625, -13.35791015625, -12.4267578125, -11.49560546875, -10.564453125, -9.63330078125, -8.7021484375, -7.77099609375, -6.83984375, -5.90869140625, -4.9775390625, -4.04638671875, -3.115234375, -2.18408203125, -1.2529296875, -0.32177734375, 0.609375, 1.54052734375, 2.4716796875, 3.40283203125, 4.333984375, 5.26513671875, 6.1962890625, 7.12744140625, 8.05859375, 8.98974609375, 9.9208984375, 10.85205078125, 11.783203125, 12.71435546875, 13.6455078125, 14.57666015625, 15.5078125, 16.43896484375, 17.3701171875, 18.30126953125, 19.232421875, 20.16357421875, 21.0947265625, 22.02587890625, 22.95703125, 23.88818359375, 24.8193359375, 25.75048828125, 26.681640625, 27.61279296875, 28.5439453125, 29.47509765625, 30.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 4.0, 12.0, 8.0, 10.0, 7.0, 12.0, 15.0, 18.0, 9.0, 36.0, 25.0, 34.0, 33.0, 31.0, 42.0, 36.0, 54.0, 76.0, 189.0, 1556.0, 280.0, 104.0, 67.0, 53.0, 46.0, 33.0, 32.0, 32.0, 29.0, 17.0, 20.0, 16.0, 18.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 6.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-42.03125, -40.61865234375, -39.2060546875, -37.79345703125, -36.380859375, -34.96826171875, -33.5556640625, -32.14306640625, -30.73046875, -29.31787109375, -27.9052734375, -26.49267578125, -25.080078125, -23.66748046875, -22.2548828125, -20.84228515625, -19.4296875, -18.01708984375, -16.6044921875, -15.19189453125, -13.779296875, -12.36669921875, -10.9541015625, -9.54150390625, -8.12890625, -6.71630859375, -5.3037109375, -3.89111328125, -2.478515625, -1.06591796875, 0.3466796875, 1.75927734375, 3.171875, 4.58447265625, 5.9970703125, 7.40966796875, 8.822265625, 10.23486328125, 11.6474609375, 13.06005859375, 14.47265625, 15.88525390625, 17.2978515625, 18.71044921875, 20.123046875, 21.53564453125, 22.9482421875, 24.36083984375, 25.7734375, 27.18603515625, 28.5986328125, 30.01123046875, 31.423828125, 32.83642578125, 34.2490234375, 35.66162109375, 37.07421875, 38.48681640625, 39.8994140625, 41.31201171875, 42.724609375, 44.13720703125, 45.5498046875, 46.96240234375, 48.375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 8.0, 7.0, 5.0, 15.0, 15.0, 12.0, 17.0, 17.0, 18.0, 30.0, 29.0, 44.0, 75.0, 83.0, 152.0, 222.0, 397.0, 865.0, 3850.0, 3118596.0, 18645.0, 1191.0, 503.0, 269.0, 162.0, 118.0, 89.0, 63.0, 53.0, 27.0, 27.0, 16.0, 18.0, 15.0, 9.0, 10.0, 8.0, 6.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-153.375, -148.81640625, -144.2578125, -139.69921875, -135.140625, -130.58203125, -126.0234375, -121.46484375, -116.90625, -112.34765625, -107.7890625, -103.23046875, -98.671875, -94.11328125, -89.5546875, -84.99609375, -80.4375, -75.87890625, -71.3203125, -66.76171875, -62.203125, -57.64453125, -53.0859375, -48.52734375, -43.96875, -39.41015625, -34.8515625, -30.29296875, -25.734375, -21.17578125, -16.6171875, -12.05859375, -7.5, -2.94140625, 1.6171875, 6.17578125, 10.734375, 15.29296875, 19.8515625, 24.41015625, 28.96875, 33.52734375, 38.0859375, 42.64453125, 47.203125, 51.76171875, 56.3203125, 60.87890625, 65.4375, 69.99609375, 74.5546875, 79.11328125, 83.671875, 88.23046875, 92.7890625, 97.34765625, 101.90625, 106.46484375, 111.0234375, 115.58203125, 120.140625, 124.69921875, 129.2578125, 133.81640625, 138.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 15.0, 670.0, 331.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.5048828125, -81.67568969726562, -64.84650421142578, -48.01731491088867, -31.188125610351562, -14.358932495117188, 2.4702529907226562, 19.2994384765625, 36.128631591796875, 52.957820892333984, 69.7870101928711, 86.61619567871094, 103.44538879394531, 120.27458190917969, 137.103759765625, 153.93295288085938, 170.76214599609375, 187.59133911132812, 204.4205322265625, 221.2497100830078, 238.0789031982422, 254.90809631347656, 271.7372741699219, 288.56646728515625, 305.3956604003906, 322.224853515625, 339.0540466308594, 355.88323974609375, 372.71240234375, 389.5416259765625, 406.37078857421875, 423.1999816894531, 440.0291748046875, 456.8583679199219, 473.68756103515625, 490.5167541503906, 507.345947265625, 524.1751098632812, 541.0043334960938, 557.83349609375, 574.6627197265625, 591.4918823242188, 608.3211059570312, 625.1502685546875, 641.9794921875, 658.8086547851562, 675.6378784179688, 692.467041015625, 709.2962036132812, 726.1253662109375, 742.95458984375, 759.7837524414062, 776.6129760742188, 793.442138671875, 810.2713623046875, 827.1005249023438, 843.9296875, 860.7588500976562, 877.5880737304688, 894.417236328125, 911.2464599609375, 928.0756225585938, 944.9048461914062, 961.7340087890625, 978.563232421875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 10.0, 16.0, 9.0, 12.0, 17.0, 11.0, 21.0, 29.0, 25.0, 17.0, 31.0, 38.0, 30.0, 40.0, 37.0, 47.0, 52.0, 43.0, 38.0, 48.0, 36.0, 50.0, 35.0, 34.0, 31.0, 31.0, 30.0, 17.0, 23.0, 17.0, 21.0, 13.0, 12.0, 13.0, 19.0, 7.0, 5.0, 9.0, 4.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.76602172851562, -122.73422241210938, -118.70243072509766, -114.6706314086914, -110.63883209228516, -106.60704040527344, -102.57524108886719, -98.54344177246094, -94.51164245605469, -90.47984313964844, -86.44805145263672, -82.41625213623047, -78.38445281982422, -74.3526611328125, -70.32086181640625, -66.2890625, -62.25727081298828, -58.2254753112793, -54.19367599487305, -50.16188049316406, -46.13008117675781, -42.09828567504883, -38.066490173339844, -34.034690856933594, -30.00289535522461, -25.971097946166992, -21.939300537109375, -17.90750503540039, -13.875707626342773, -9.843910217285156, -5.812114715576172, -1.7803173065185547, 2.2514801025390625, 6.2832770347595215, 10.31507396697998, 14.346870422363281, 18.3786678314209, 22.410465240478516, 26.4422607421875, 30.474058151245117, 34.505855560302734, 38.53765106201172, 42.56945037841797, 46.60124588012695, 50.63304138183594, 54.66484069824219, 58.69663619995117, 62.728431701660156, 66.7602310180664, 70.79203033447266, 74.82382202148438, 78.85562133789062, 82.88742065429688, 86.91921997070312, 90.95101165771484, 94.9828109741211, 99.01460266113281, 103.04640197753906, 107.07819366455078, 111.10999298095703, 115.14179229736328, 119.173583984375, 123.20538330078125, 127.2371826171875, 131.26898193359375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 12.0, 6.0, 7.0, 9.0, 12.0, 12.0, 17.0, 23.0, 22.0, 21.0, 32.0, 26.0, 19.0, 34.0, 23.0, 35.0, 34.0, 43.0, 58.0, 48.0, 39.0, 37.0, 45.0, 45.0, 35.0, 42.0, 40.0, 29.0, 25.0, 31.0, 22.0, 23.0, 16.0, 20.0, 12.0, 12.0, 11.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.125, -14.567626953125, -14.01025390625, -13.452880859375, -12.8955078125, -12.338134765625, -11.78076171875, -11.223388671875, -10.666015625, -10.108642578125, -9.55126953125, -8.993896484375, -8.4365234375, -7.879150390625, -7.32177734375, -6.764404296875, -6.20703125, -5.649658203125, -5.09228515625, -4.534912109375, -3.9775390625, -3.420166015625, -2.86279296875, -2.305419921875, -1.748046875, -1.190673828125, -0.63330078125, -0.075927734375, 0.4814453125, 1.038818359375, 1.59619140625, 2.153564453125, 2.7109375, 3.268310546875, 3.82568359375, 4.383056640625, 4.9404296875, 5.497802734375, 6.05517578125, 6.612548828125, 7.169921875, 7.727294921875, 8.28466796875, 8.842041015625, 9.3994140625, 9.956787109375, 10.51416015625, 11.071533203125, 11.62890625, 12.186279296875, 12.74365234375, 13.301025390625, 13.8583984375, 14.415771484375, 14.97314453125, 15.530517578125, 16.087890625, 16.645263671875, 17.20263671875, 17.760009765625, 18.3173828125, 18.874755859375, 19.43212890625, 19.989501953125, 20.546875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 3.0, 13.0, 17.0, 14.0, 17.0, 23.0, 29.0, 39.0, 37.0, 58.0, 67.0, 85.0, 103.0, 133.0, 191.0, 334.0, 708.0, 1916.0, 6766.0, 59868.0, 1325606.0, 2618113.0, 163197.0, 11827.0, 2769.0, 933.0, 436.0, 231.0, 175.0, 110.0, 98.0, 64.0, 75.0, 45.0, 42.0, 34.0, 18.0, 19.0, 15.0, 15.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.46875, -41.978515625, -40.48828125, -38.998046875, -37.5078125, -36.017578125, -34.52734375, -33.037109375, -31.546875, -30.056640625, -28.56640625, -27.076171875, -25.5859375, -24.095703125, -22.60546875, -21.115234375, -19.625, -18.134765625, -16.64453125, -15.154296875, -13.6640625, -12.173828125, -10.68359375, -9.193359375, -7.703125, -6.212890625, -4.72265625, -3.232421875, -1.7421875, -0.251953125, 1.23828125, 2.728515625, 4.21875, 5.708984375, 7.19921875, 8.689453125, 10.1796875, 11.669921875, 13.16015625, 14.650390625, 16.140625, 17.630859375, 19.12109375, 20.611328125, 22.1015625, 23.591796875, 25.08203125, 26.572265625, 28.0625, 29.552734375, 31.04296875, 32.533203125, 34.0234375, 35.513671875, 37.00390625, 38.494140625, 39.984375, 41.474609375, 42.96484375, 44.455078125, 45.9453125, 47.435546875, 48.92578125, 50.416015625, 51.90625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 8.0, 16.0, 13.0, 31.0, 40.0, 49.0, 82.0, 83.0, 102.0, 147.0, 239.0, 283.0, 422.0, 525.0, 536.0, 418.0, 277.0, 182.0, 146.0, 100.0, 81.0, 65.0, 55.0, 42.0, 26.0, 22.0, 17.0, 13.0, 10.0, 9.0, 4.0, 6.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.53125, -29.5732421875, -28.615234375, -27.6572265625, -26.69921875, -25.7412109375, -24.783203125, -23.8251953125, -22.8671875, -21.9091796875, -20.951171875, -19.9931640625, -19.03515625, -18.0771484375, -17.119140625, -16.1611328125, -15.203125, -14.2451171875, -13.287109375, -12.3291015625, -11.37109375, -10.4130859375, -9.455078125, -8.4970703125, -7.5390625, -6.5810546875, -5.623046875, -4.6650390625, -3.70703125, -2.7490234375, -1.791015625, -0.8330078125, 0.125, 1.0830078125, 2.041015625, 2.9990234375, 3.95703125, 4.9150390625, 5.873046875, 6.8310546875, 7.7890625, 8.7470703125, 9.705078125, 10.6630859375, 11.62109375, 12.5791015625, 13.537109375, 14.4951171875, 15.453125, 16.4111328125, 17.369140625, 18.3271484375, 19.28515625, 20.2431640625, 21.201171875, 22.1591796875, 23.1171875, 24.0751953125, 25.033203125, 25.9912109375, 26.94921875, 27.9072265625, 28.865234375, 29.8232421875, 30.78125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 3.0, 3.0, 16.0, 16.0, 25.0, 33.0, 56.0, 80.0, 101.0, 196.0, 346.0, 724.0, 2134.0, 15826.0, 2744705.0, 1414876.0, 11788.0, 1921.0, 666.0, 290.0, 162.0, 94.0, 69.0, 37.0, 26.0, 17.0, 20.0, 10.0, 8.0, 11.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.7197265625, -100.751953125, -97.7841796875, -94.81640625, -91.8486328125, -88.880859375, -85.9130859375, -82.9453125, -79.9775390625, -77.009765625, -74.0419921875, -71.07421875, -68.1064453125, -65.138671875, -62.1708984375, -59.203125, -56.2353515625, -53.267578125, -50.2998046875, -47.33203125, -44.3642578125, -41.396484375, -38.4287109375, -35.4609375, -32.4931640625, -29.525390625, -26.5576171875, -23.58984375, -20.6220703125, -17.654296875, -14.6865234375, -11.71875, -8.7509765625, -5.783203125, -2.8154296875, 0.15234375, 3.1201171875, 6.087890625, 9.0556640625, 12.0234375, 14.9912109375, 17.958984375, 20.9267578125, 23.89453125, 26.8623046875, 29.830078125, 32.7978515625, 35.765625, 38.7333984375, 41.701171875, 44.6689453125, 47.63671875, 50.6044921875, 53.572265625, 56.5400390625, 59.5078125, 62.4755859375, 65.443359375, 68.4111328125, 71.37890625, 74.3466796875, 77.314453125, 80.2822265625, 83.25]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 66.0, 936.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1059.983642578125, -1016.536376953125, -973.089111328125, -929.641845703125, -886.194580078125, -842.747314453125, -799.2999877929688, -755.8527221679688, -712.4054565429688, -668.9581909179688, -625.5109252929688, -582.0635986328125, -538.6163330078125, -495.1690979003906, -451.7218017578125, -408.2745361328125, -364.8272705078125, -321.3800048828125, -277.9327392578125, -234.48544311523438, -191.03817749023438, -147.59091186523438, -104.14361572265625, -60.69635009765625, -17.24908447265625, 26.19818878173828, 69.64546203613281, 113.09274291992188, 156.54000854492188, 199.98727416992188, 243.4345703125, 286.8818359375, 330.3289794921875, 373.7762451171875, 417.2235107421875, 460.6708068847656, 504.1180725097656, 547.5653076171875, 591.0126342773438, 634.4598999023438, 677.9071655273438, 721.3544311523438, 764.8016967773438, 808.2490234375, 851.6962890625, 895.1435546875, 938.5908203125, 982.0380859375, 1025.4853515625, 1068.9326171875, 1112.3798828125, 1155.8271484375, 1199.2744140625, 1242.7216796875, 1286.1689453125, 1329.6162109375, 1373.0634765625, 1416.5107421875, 1459.9580078125, 1503.4052734375, 1546.8525390625, 1590.2998046875, 1633.7470703125, 1677.1943359375, 1720.6417236328125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 8.0, 7.0, 17.0, 19.0, 13.0, 15.0, 16.0, 23.0, 35.0, 31.0, 22.0, 27.0, 32.0, 34.0, 47.0, 37.0, 57.0, 38.0, 39.0, 40.0, 34.0, 42.0, 27.0, 46.0, 42.0, 21.0, 34.0, 28.0, 26.0, 22.0, 22.0, 20.0, 12.0, 12.0, 11.0, 9.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-115.52212524414062, -111.89141082763672, -108.26069641113281, -104.6299819946289, -100.999267578125, -97.3685531616211, -93.73783874511719, -90.10713195800781, -86.47640991210938, -82.84569549560547, -79.21498107910156, -75.58426666259766, -71.95355224609375, -68.32283782958984, -64.69212341308594, -61.0614128112793, -57.430702209472656, -53.79998779296875, -50.169273376464844, -46.53855895996094, -42.90784454345703, -39.277130126953125, -35.646419525146484, -32.01570510864258, -28.384990692138672, -24.754276275634766, -21.12356185913086, -17.492849349975586, -13.86213493347168, -10.231420516967773, -6.6007080078125, -2.9699935913085938, 0.6607208251953125, 4.2914347648620605, 7.922148704528809, 11.552862167358398, 15.183576583862305, 18.81429100036621, 22.445003509521484, 26.07571792602539, 29.706432342529297, 33.3371467590332, 36.96786117553711, 40.59857177734375, 44.229286193847656, 47.86000061035156, 51.49071502685547, 55.121429443359375, 58.75214385986328, 62.38285827636719, 66.0135726928711, 69.644287109375, 73.2750015258789, 76.90571594238281, 80.53642272949219, 84.16714477539062, 87.7978515625, 91.4285659790039, 95.05928039550781, 98.68999481201172, 102.32070922851562, 105.95142364501953, 109.58213806152344, 113.21284484863281, 116.84356689453125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 5.0, 12.0, 20.0, 12.0, 16.0, 26.0, 26.0, 32.0, 32.0, 36.0, 27.0, 35.0, 35.0, 39.0, 39.0, 36.0, 43.0, 47.0, 55.0, 34.0, 43.0, 36.0, 33.0, 28.0, 30.0, 30.0, 18.0, 28.0, 17.0, 20.0, 17.0, 12.0, 14.0, 10.0, 10.0, 8.0, 4.0, 2.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-15.046875, -14.5791015625, -14.111328125, -13.6435546875, -13.17578125, -12.7080078125, -12.240234375, -11.7724609375, -11.3046875, -10.8369140625, -10.369140625, -9.9013671875, -9.43359375, -8.9658203125, -8.498046875, -8.0302734375, -7.5625, -7.0947265625, -6.626953125, -6.1591796875, -5.69140625, -5.2236328125, -4.755859375, -4.2880859375, -3.8203125, -3.3525390625, -2.884765625, -2.4169921875, -1.94921875, -1.4814453125, -1.013671875, -0.5458984375, -0.078125, 0.3896484375, 0.857421875, 1.3251953125, 1.79296875, 2.2607421875, 2.728515625, 3.1962890625, 3.6640625, 4.1318359375, 4.599609375, 5.0673828125, 5.53515625, 6.0029296875, 6.470703125, 6.9384765625, 7.40625, 7.8740234375, 8.341796875, 8.8095703125, 9.27734375, 9.7451171875, 10.212890625, 10.6806640625, 11.1484375, 11.6162109375, 12.083984375, 12.5517578125, 13.01953125, 13.4873046875, 13.955078125, 14.4228515625, 14.890625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 13.0, 10.0, 6.0, 12.0, 14.0, 40.0, 51.0, 77.0, 94.0, 164.0, 235.0, 371.0, 549.0, 860.0, 1448.0, 2141.0, 3235.0, 5136.0, 7978.0, 12549.0, 19479.0, 30640.0, 49134.0, 79749.0, 132205.0, 212423.0, 189780.0, 113598.0, 69255.0, 42839.0, 26797.0, 16986.0, 10969.0, 6960.0, 4416.0, 2906.0, 1844.0, 1143.0, 799.0, 548.0, 350.0, 247.0, 170.0, 108.0, 73.0, 50.0, 36.0, 27.0, 13.0, 14.0, 6.0, 4.0, 4.0, 3.0, 3.0, 6.0, 1.0], "bins": [-1.65234375, -1.60205078125, -1.5517578125, -1.50146484375, -1.451171875, -1.40087890625, -1.3505859375, -1.30029296875, -1.25, -1.19970703125, -1.1494140625, -1.09912109375, -1.048828125, -0.99853515625, -0.9482421875, -0.89794921875, -0.84765625, -0.79736328125, -0.7470703125, -0.69677734375, -0.646484375, -0.59619140625, -0.5458984375, -0.49560546875, -0.4453125, -0.39501953125, -0.3447265625, -0.29443359375, -0.244140625, -0.19384765625, -0.1435546875, -0.09326171875, -0.04296875, 0.00732421875, 0.0576171875, 0.10791015625, 0.158203125, 0.20849609375, 0.2587890625, 0.30908203125, 0.359375, 0.40966796875, 0.4599609375, 0.51025390625, 0.560546875, 0.61083984375, 0.6611328125, 0.71142578125, 0.76171875, 0.81201171875, 0.8623046875, 0.91259765625, 0.962890625, 1.01318359375, 1.0634765625, 1.11376953125, 1.1640625, 1.21435546875, 1.2646484375, 1.31494140625, 1.365234375, 1.41552734375, 1.4658203125, 1.51611328125, 1.56640625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 12.0, 10.0, 10.0, 16.0, 22.0, 22.0, 28.0, 17.0, 31.0, 28.0, 30.0, 39.0, 39.0, 38.0, 39.0, 45.0, 45.0, 1070.0, 36.0, 39.0, 32.0, 43.0, 25.0, 37.0, 27.0, 33.0, 26.0, 24.0, 19.0, 23.0, 20.0, 13.0, 12.0, 13.0, 11.0, 9.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.7109375, -8.415771484375, -8.12060546875, -7.825439453125, -7.5302734375, -7.235107421875, -6.93994140625, -6.644775390625, -6.349609375, -6.054443359375, -5.75927734375, -5.464111328125, -5.1689453125, -4.873779296875, -4.57861328125, -4.283447265625, -3.98828125, -3.693115234375, -3.39794921875, -3.102783203125, -2.8076171875, -2.512451171875, -2.21728515625, -1.922119140625, -1.626953125, -1.331787109375, -1.03662109375, -0.741455078125, -0.4462890625, -0.151123046875, 0.14404296875, 0.439208984375, 0.734375, 1.029541015625, 1.32470703125, 1.619873046875, 1.9150390625, 2.210205078125, 2.50537109375, 2.800537109375, 3.095703125, 3.390869140625, 3.68603515625, 3.981201171875, 4.2763671875, 4.571533203125, 4.86669921875, 5.161865234375, 5.45703125, 5.752197265625, 6.04736328125, 6.342529296875, 6.6376953125, 6.932861328125, 7.22802734375, 7.523193359375, 7.818359375, 8.113525390625, 8.40869140625, 8.703857421875, 8.9990234375, 9.294189453125, 9.58935546875, 9.884521484375, 10.1796875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 8.0, 13.0, 23.0, 26.0, 51.0, 64.0, 74.0, 102.0, 170.0, 296.0, 387.0, 583.0, 897.0, 1398.0, 2134.0, 3092.0, 4906.0, 7882.0, 12403.0, 19653.0, 31679.0, 51712.0, 84439.0, 140826.0, 1267912.0, 182339.0, 108909.0, 66259.0, 40785.0, 24958.0, 15495.0, 9874.0, 6188.0, 4020.0, 2507.0, 1691.0, 1145.0, 722.0, 488.0, 324.0, 214.0, 177.0, 98.0, 64.0, 48.0, 26.0, 23.0, 22.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5029296875, -1.4540557861328125, -1.405181884765625, -1.3563079833984375, -1.30743408203125, -1.2585601806640625, -1.209686279296875, -1.1608123779296875, -1.1119384765625, -1.0630645751953125, -1.014190673828125, -0.9653167724609375, -0.91644287109375, -0.8675689697265625, -0.818695068359375, -0.7698211669921875, -0.720947265625, -0.6720733642578125, -0.623199462890625, -0.5743255615234375, -0.52545166015625, -0.4765777587890625, -0.427703857421875, -0.3788299560546875, -0.3299560546875, -0.2810821533203125, -0.232208251953125, -0.1833343505859375, -0.13446044921875, -0.0855865478515625, -0.036712646484375, 0.0121612548828125, 0.06103515625, 0.1099090576171875, 0.158782958984375, 0.2076568603515625, 0.25653076171875, 0.3054046630859375, 0.354278564453125, 0.4031524658203125, 0.4520263671875, 0.5009002685546875, 0.549774169921875, 0.5986480712890625, 0.64752197265625, 0.6963958740234375, 0.745269775390625, 0.7941436767578125, 0.843017578125, 0.8918914794921875, 0.940765380859375, 0.9896392822265625, 1.03851318359375, 1.0873870849609375, 1.136260986328125, 1.1851348876953125, 1.2340087890625, 1.2828826904296875, 1.331756591796875, 1.3806304931640625, 1.42950439453125, 1.4783782958984375, 1.527252197265625, 1.5761260986328125, 1.625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 7.0, 5.0, 11.0, 6.0, 17.0, 8.0, 15.0, 17.0, 29.0, 36.0, 37.0, 41.0, 49.0, 76.0, 69.0, 86.0, 79.0, 69.0, 62.0, 53.0, 50.0, 36.0, 27.0, 19.0, 17.0, 17.0, 11.0, 9.0, 11.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0047149658203125, -0.004561722278594971, -0.004408478736877441, -0.004255235195159912, -0.004101991653442383, -0.0039487481117248535, -0.0037955045700073242, -0.003642261028289795, -0.0034890174865722656, -0.0033357739448547363, -0.003182530403137207, -0.0030292868614196777, -0.0028760433197021484, -0.002722799777984619, -0.00256955623626709, -0.0024163126945495605, -0.0022630691528320312, -0.002109825611114502, -0.0019565820693969727, -0.0018033385276794434, -0.001650094985961914, -0.0014968514442443848, -0.0013436079025268555, -0.0011903643608093262, -0.0010371208190917969, -0.0008838772773742676, -0.0007306337356567383, -0.000577390193939209, -0.0004241466522216797, -0.0002709031105041504, -0.0001176595687866211, 3.55839729309082e-05, 0.0001888275146484375, 0.0003420710563659668, 0.0004953145980834961, 0.0006485581398010254, 0.0008018016815185547, 0.000955045223236084, 0.0011082887649536133, 0.0012615323066711426, 0.0014147758483886719, 0.0015680193901062012, 0.0017212629318237305, 0.0018745064735412598, 0.002027750015258789, 0.0021809935569763184, 0.0023342370986938477, 0.002487480640411377, 0.0026407241821289062, 0.0027939677238464355, 0.002947211265563965, 0.003100454807281494, 0.0032536983489990234, 0.0034069418907165527, 0.003560185432434082, 0.0037134289741516113, 0.0038666725158691406, 0.00401991605758667, 0.004173159599304199, 0.0043264031410217285, 0.004479646682739258, 0.004632890224456787, 0.004786133766174316, 0.004939377307891846, 0.005092620849609375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 8.0, 16.0, 14.0, 31.0, 16.0, 32.0, 47.0, 61.0, 75.0, 115.0, 175.0, 233.0, 474.0, 895.0, 21519.0, 1021111.0, 1974.0, 643.0, 336.0, 209.0, 146.0, 93.0, 73.0, 64.0, 36.0, 21.0, 25.0, 16.0, 15.0, 12.0, 10.0, 12.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09234619140625, -0.0895700454711914, -0.08679389953613281, -0.08401775360107422, -0.08124160766601562, -0.07846546173095703, -0.07568931579589844, -0.07291316986083984, -0.07013702392578125, -0.06736087799072266, -0.06458473205566406, -0.06180858612060547, -0.059032440185546875, -0.05625629425048828, -0.05348014831542969, -0.050704002380371094, -0.0479278564453125, -0.045151710510253906, -0.04237556457519531, -0.03959941864013672, -0.036823272705078125, -0.03404712677001953, -0.03127098083496094, -0.028494834899902344, -0.02571868896484375, -0.022942543029785156, -0.020166397094726562, -0.01739025115966797, -0.014614105224609375, -0.011837959289550781, -0.009061813354492188, -0.006285667419433594, -0.003509521484375, -0.0007333755493164062, 0.0020427703857421875, 0.004818916320800781, 0.007595062255859375, 0.010371208190917969, 0.013147354125976562, 0.015923500061035156, 0.01869964599609375, 0.021475791931152344, 0.024251937866210938, 0.02702808380126953, 0.029804229736328125, 0.03258037567138672, 0.03535652160644531, 0.038132667541503906, 0.0409088134765625, 0.043684959411621094, 0.04646110534667969, 0.04923725128173828, 0.052013397216796875, 0.05478954315185547, 0.05756568908691406, 0.060341835021972656, 0.06311798095703125, 0.06589412689208984, 0.06867027282714844, 0.07144641876220703, 0.07422256469726562, 0.07699871063232422, 0.07977485656738281, 0.0825510025024414, 0.0853271484375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 11.0, 710.0, 288.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006648569367825985, -0.006035926286131144, -0.005423282738775015, -0.0048106396570801735, -0.004197996109724045, -0.0035853530280292034, -0.002972709946334362, -0.0023600663989782333, -0.001747423317283392, -0.001134780002757907, -0.0005221368046477437, 9.050639346241951e-05, 0.0007031497079879045, 0.0013157930225133896, 0.001928436104208231, 0.0025410796515643597, 0.003153722733259201, 0.003766366047784686, 0.004379009362310171, 0.0049916524440050125, 0.005604295991361141, 0.006216939073055983, 0.006829582154750824, 0.007442225702106953, 0.008054869249463081, 0.00866751279681921, 0.009280155412852764, 0.009892798960208893, 0.010505442507565022, 0.01111808605492115, 0.011730728670954704, 0.012343372218310833, 0.012956013903021812, 0.013568657450377941, 0.014181300066411495, 0.014793943613767624, 0.015406587161123753, 0.01601923070847988, 0.016631873324513435, 0.01724451780319214, 0.017857160419225693, 0.018469803035259247, 0.01908244751393795, 0.019695090129971504, 0.02030773274600506, 0.02092037722468376, 0.021533019840717316, 0.02214566245675087, 0.022758305072784424, 0.023370947688817978, 0.02398359216749668, 0.024596234783530235, 0.02520887739956379, 0.025821521878242493, 0.026434164494276047, 0.0270468071103096, 0.027659451588988304, 0.028272094205021858, 0.02888473868370056, 0.029497381299734116, 0.03011002391576767, 0.030722668394446373, 0.03133530914783478, 0.03194795548915863, 0.032560598105192184]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 7.0, 10.0, 16.0, 11.0, 11.0, 23.0, 19.0, 23.0, 17.0, 19.0, 27.0, 29.0, 27.0, 41.0, 35.0, 38.0, 44.0, 45.0, 49.0, 46.0, 50.0, 43.0, 32.0, 35.0, 37.0, 45.0, 30.0, 21.0, 29.0, 13.0, 12.0, 13.0, 19.0, 18.0, 17.0, 7.0, 14.0, 3.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021241307258605957, -0.0020545776933431625, -0.0019850246608257294, -0.0019154716283082962, -0.001845918595790863, -0.0017763655632734299, -0.0017068125307559967, -0.0016372594982385635, -0.0015677064657211304, -0.0014981534332036972, -0.001428600400686264, -0.0013590473681688309, -0.0012894943356513977, -0.0012199413031339645, -0.0011503882706165314, -0.0010808352380990982, -0.001011282205581665, -0.0009417291730642319, -0.0008721761405467987, -0.0008026231080293655, -0.0007330700755119324, -0.0006635170429944992, -0.000593964010477066, -0.0005244109779596329, -0.0004548579454421997, -0.00038530491292476654, -0.0003157518804073334, -0.0002461988478899002, -0.00017664581537246704, -0.00010709278285503387, -3.753975033760071e-05, 3.201328217983246e-05, 0.00010156631469726562, 0.0001711193472146988, 0.00024067237973213196, 0.0003102254122495651, 0.0003797784447669983, 0.00044933147728443146, 0.0005188845098018646, 0.0005884375423192978, 0.000657990574836731, 0.0007275436073541641, 0.0007970966398715973, 0.0008666496723890305, 0.0009362027049064636, 0.0010057557374238968, 0.00107530876994133, 0.0011448618024587631, 0.0012144148349761963, 0.0012839678674936295, 0.0013535209000110626, 0.0014230739325284958, 0.001492626965045929, 0.0015621799975633621, 0.0016317330300807953, 0.0017012860625982285, 0.0017708390951156616, 0.0018403921276330948, 0.001909945160150528, 0.001979498192667961, 0.0020490512251853943, 0.0021186042577028275, 0.0021881572902202606, 0.002257710322737694, 0.002327263355255127]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 5.0, 5.0, 12.0, 20.0, 12.0, 16.0, 26.0, 26.0, 32.0, 32.0, 36.0, 27.0, 35.0, 35.0, 39.0, 39.0, 36.0, 43.0, 47.0, 55.0, 34.0, 43.0, 36.0, 33.0, 28.0, 30.0, 30.0, 18.0, 28.0, 17.0, 20.0, 17.0, 12.0, 14.0, 10.0, 10.0, 8.0, 4.0, 2.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-15.046875, -14.5791015625, -14.111328125, -13.6435546875, -13.17578125, -12.7080078125, -12.240234375, -11.7724609375, -11.3046875, -10.8369140625, -10.369140625, -9.9013671875, -9.43359375, -8.9658203125, -8.498046875, -8.0302734375, -7.5625, -7.0947265625, -6.626953125, -6.1591796875, -5.69140625, -5.2236328125, -4.755859375, -4.2880859375, -3.8203125, -3.3525390625, -2.884765625, -2.4169921875, -1.94921875, -1.4814453125, -1.013671875, -0.5458984375, -0.078125, 0.3896484375, 0.857421875, 1.3251953125, 1.79296875, 2.2607421875, 2.728515625, 3.1962890625, 3.6640625, 4.1318359375, 4.599609375, 5.0673828125, 5.53515625, 6.0029296875, 6.470703125, 6.9384765625, 7.40625, 7.8740234375, 8.341796875, 8.8095703125, 9.27734375, 9.7451171875, 10.212890625, 10.6806640625, 11.1484375, 11.6162109375, 12.083984375, 12.5517578125, 13.01953125, 13.4873046875, 13.955078125, 14.4228515625, 14.890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 12.0, 3.0, 10.0, 11.0, 12.0, 23.0, 28.0, 32.0, 40.0, 82.0, 114.0, 147.0, 183.0, 271.0, 420.0, 575.0, 890.0, 1348.0, 2151.0, 3860.0, 10560.0, 76334.0, 744086.0, 178192.0, 16976.0, 4882.0, 2518.0, 1541.0, 1002.0, 715.0, 463.0, 325.0, 217.0, 161.0, 101.0, 83.0, 52.0, 35.0, 27.0, 21.0, 20.0, 17.0, 9.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-41.375, -40.10791015625, -38.8408203125, -37.57373046875, -36.306640625, -35.03955078125, -33.7724609375, -32.50537109375, -31.23828125, -29.97119140625, -28.7041015625, -27.43701171875, -26.169921875, -24.90283203125, -23.6357421875, -22.36865234375, -21.1015625, -19.83447265625, -18.5673828125, -17.30029296875, -16.033203125, -14.76611328125, -13.4990234375, -12.23193359375, -10.96484375, -9.69775390625, -8.4306640625, -7.16357421875, -5.896484375, -4.62939453125, -3.3623046875, -2.09521484375, -0.828125, 0.43896484375, 1.7060546875, 2.97314453125, 4.240234375, 5.50732421875, 6.7744140625, 8.04150390625, 9.30859375, 10.57568359375, 11.8427734375, 13.10986328125, 14.376953125, 15.64404296875, 16.9111328125, 18.17822265625, 19.4453125, 20.71240234375, 21.9794921875, 23.24658203125, 24.513671875, 25.78076171875, 27.0478515625, 28.31494140625, 29.58203125, 30.84912109375, 32.1162109375, 33.38330078125, 34.650390625, 35.91748046875, 37.1845703125, 38.45166015625, 39.71875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 20.0, 25.0, 24.0, 21.0, 29.0, 52.0, 57.0, 53.0, 77.0, 91.0, 1581.0, 514.0, 78.0, 71.0, 54.0, 45.0, 45.0, 31.0, 27.0, 24.0, 23.0, 17.0, 9.0, 11.0, 8.0, 8.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-59.03125, -57.34375, -55.65625, -53.96875, -52.28125, -50.59375, -48.90625, -47.21875, -45.53125, -43.84375, -42.15625, -40.46875, -38.78125, -37.09375, -35.40625, -33.71875, -32.03125, -30.34375, -28.65625, -26.96875, -25.28125, -23.59375, -21.90625, -20.21875, -18.53125, -16.84375, -15.15625, -13.46875, -11.78125, -10.09375, -8.40625, -6.71875, -5.03125, -3.34375, -1.65625, 0.03125, 1.71875, 3.40625, 5.09375, 6.78125, 8.46875, 10.15625, 11.84375, 13.53125, 15.21875, 16.90625, 18.59375, 20.28125, 21.96875, 23.65625, 25.34375, 27.03125, 28.71875, 30.40625, 32.09375, 33.78125, 35.46875, 37.15625, 38.84375, 40.53125, 42.21875, 43.90625, 45.59375, 47.28125, 48.96875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 8.0, 12.0, 18.0, 19.0, 22.0, 39.0, 72.0, 68.0, 115.0, 159.0, 260.0, 607.0, 2609.0, 3132676.0, 7250.0, 859.0, 320.0, 185.0, 126.0, 85.0, 62.0, 34.0, 27.0, 23.0, 14.0, 9.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-167.5, -162.033203125, -156.56640625, -151.099609375, -145.6328125, -140.166015625, -134.69921875, -129.232421875, -123.765625, -118.298828125, -112.83203125, -107.365234375, -101.8984375, -96.431640625, -90.96484375, -85.498046875, -80.03125, -74.564453125, -69.09765625, -63.630859375, -58.1640625, -52.697265625, -47.23046875, -41.763671875, -36.296875, -30.830078125, -25.36328125, -19.896484375, -14.4296875, -8.962890625, -3.49609375, 1.970703125, 7.4375, 12.904296875, 18.37109375, 23.837890625, 29.3046875, 34.771484375, 40.23828125, 45.705078125, 51.171875, 56.638671875, 62.10546875, 67.572265625, 73.0390625, 78.505859375, 83.97265625, 89.439453125, 94.90625, 100.373046875, 105.83984375, 111.306640625, 116.7734375, 122.240234375, 127.70703125, 133.173828125, 138.640625, 144.107421875, 149.57421875, 155.041015625, 160.5078125, 165.974609375, 171.44140625, 176.908203125, 182.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 12.0, 61.0, 303.0, 456.0, 150.0, 21.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.38963317871094, -213.33377075195312, -206.2779083251953, -199.2220458984375, -192.16616821289062, -185.11032104492188, -178.054443359375, -170.9985809326172, -163.94271850585938, -156.88685607910156, -149.83099365234375, -142.77513122558594, -135.71926879882812, -128.66339111328125, -121.60752868652344, -114.55166625976562, -107.49580383300781, -100.43994140625, -93.38407897949219, -86.32820892333984, -79.27234649658203, -72.21648406982422, -65.16061401367188, -58.10475158691406, -51.04888916015625, -43.99302673339844, -36.93716049194336, -29.881296157836914, -22.82543182373047, -15.769569396972656, -8.713703155517578, -1.6578369140625, 5.398040771484375, 12.45390510559082, 19.509769439697266, 26.56563377380371, 33.621498107910156, 40.67736053466797, 47.73322677612305, 54.789093017578125, 61.84495544433594, 68.90081787109375, 75.95668029785156, 83.0125503540039, 90.06841278076172, 97.12427520751953, 104.18014526367188, 111.23600769042969, 118.2918701171875, 125.34773254394531, 132.40359497070312, 139.45945739746094, 146.51531982421875, 153.57119750976562, 160.62705993652344, 167.68292236328125, 174.73878479003906, 181.79464721679688, 188.8505096435547, 195.9063720703125, 202.96224975585938, 210.01809692382812, 217.073974609375, 224.1298370361328, 231.18569946289062]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 9.0, 6.0, 7.0, 13.0, 12.0, 26.0, 24.0, 21.0, 29.0, 28.0, 35.0, 37.0, 35.0, 56.0, 56.0, 57.0, 63.0, 50.0, 49.0, 42.0, 47.0, 45.0, 42.0, 44.0, 26.0, 20.0, 23.0, 14.0, 12.0, 13.0, 8.0, 13.0, 10.0, 5.0, 2.0, 6.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.30824279785156, -156.46434020996094, -151.62045288085938, -146.77655029296875, -141.93264770507812, -137.08876037597656, -132.24485778808594, -127.40096282958984, -122.55706787109375, -117.71317291259766, -112.86927795410156, -108.02537536621094, -103.18148040771484, -98.33758544921875, -93.49368286132812, -88.64978790283203, -83.80589294433594, -78.96199798583984, -74.11810302734375, -69.27420043945312, -64.43030548095703, -59.58641052246094, -54.74251174926758, -49.89861297607422, -45.054718017578125, -40.21082305908203, -35.36692428588867, -30.523027420043945, -25.67913055419922, -20.835233688354492, -15.991336822509766, -11.147438049316406, -6.303558349609375, -1.4596614837646484, 3.384235382080078, 8.228132247924805, 13.072029113769531, 17.915925979614258, 22.759822845458984, 27.603721618652344, 32.44761657714844, 37.29151153564453, 42.13541030883789, 46.97930908203125, 51.823204040527344, 56.66709899902344, 61.5109977722168, 66.35489654541016, 71.19879150390625, 76.04268646240234, 80.88658142089844, 85.73048400878906, 90.57437896728516, 95.41827392578125, 100.26217651367188, 105.10607147216797, 109.94996643066406, 114.79386138916016, 119.63775634765625, 124.48165893554688, 129.3255615234375, 134.16944885253906, 139.0133514404297, 143.85723876953125, 148.70114135742188]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 7.0, 3.0, 12.0, 16.0, 9.0, 14.0, 24.0, 19.0, 22.0, 20.0, 29.0, 36.0, 45.0, 40.0, 33.0, 41.0, 46.0, 42.0, 46.0, 43.0, 37.0, 47.0, 37.0, 45.0, 35.0, 28.0, 29.0, 25.0, 28.0, 22.0, 22.0, 19.0, 13.0, 9.0, 12.0, 10.0, 8.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.3125, -14.79833984375, -14.2841796875, -13.77001953125, -13.255859375, -12.74169921875, -12.2275390625, -11.71337890625, -11.19921875, -10.68505859375, -10.1708984375, -9.65673828125, -9.142578125, -8.62841796875, -8.1142578125, -7.60009765625, -7.0859375, -6.57177734375, -6.0576171875, -5.54345703125, -5.029296875, -4.51513671875, -4.0009765625, -3.48681640625, -2.97265625, -2.45849609375, -1.9443359375, -1.43017578125, -0.916015625, -0.40185546875, 0.1123046875, 0.62646484375, 1.140625, 1.65478515625, 2.1689453125, 2.68310546875, 3.197265625, 3.71142578125, 4.2255859375, 4.73974609375, 5.25390625, 5.76806640625, 6.2822265625, 6.79638671875, 7.310546875, 7.82470703125, 8.3388671875, 8.85302734375, 9.3671875, 9.88134765625, 10.3955078125, 10.90966796875, 11.423828125, 11.93798828125, 12.4521484375, 12.96630859375, 13.48046875, 13.99462890625, 14.5087890625, 15.02294921875, 15.537109375, 16.05126953125, 16.5654296875, 17.07958984375, 17.59375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 12.0, 18.0, 14.0, 24.0, 43.0, 54.0, 64.0, 121.0, 135.0, 210.0, 346.0, 531.0, 959.0, 1880.0, 4789.0, 16119.0, 96358.0, 898240.0, 2497501.0, 596902.0, 60462.0, 11735.0, 3879.0, 1608.0, 829.0, 487.0, 316.0, 200.0, 122.0, 104.0, 53.0, 41.0, 33.0, 25.0, 21.0, 12.0, 7.0, 13.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.859375, -28.908447265625, -27.95751953125, -27.006591796875, -26.0556640625, -25.104736328125, -24.15380859375, -23.202880859375, -22.251953125, -21.301025390625, -20.35009765625, -19.399169921875, -18.4482421875, -17.497314453125, -16.54638671875, -15.595458984375, -14.64453125, -13.693603515625, -12.74267578125, -11.791748046875, -10.8408203125, -9.889892578125, -8.93896484375, -7.988037109375, -7.037109375, -6.086181640625, -5.13525390625, -4.184326171875, -3.2333984375, -2.282470703125, -1.33154296875, -0.380615234375, 0.5703125, 1.521240234375, 2.47216796875, 3.423095703125, 4.3740234375, 5.324951171875, 6.27587890625, 7.226806640625, 8.177734375, 9.128662109375, 10.07958984375, 11.030517578125, 11.9814453125, 12.932373046875, 13.88330078125, 14.834228515625, 15.78515625, 16.736083984375, 17.68701171875, 18.637939453125, 19.5888671875, 20.539794921875, 21.49072265625, 22.441650390625, 23.392578125, 24.343505859375, 25.29443359375, 26.245361328125, 27.1962890625, 28.147216796875, 29.09814453125, 30.049072265625, 31.0]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 4.0, 14.0, 28.0, 40.0, 56.0, 87.0, 141.0, 236.0, 316.0, 472.0, 659.0, 657.0, 454.0, 265.0, 224.0, 156.0, 86.0, 51.0, 40.0, 19.0, 22.0, 15.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-47.21875, -46.03955078125, -44.8603515625, -43.68115234375, -42.501953125, -41.32275390625, -40.1435546875, -38.96435546875, -37.78515625, -36.60595703125, -35.4267578125, -34.24755859375, -33.068359375, -31.88916015625, -30.7099609375, -29.53076171875, -28.3515625, -27.17236328125, -25.9931640625, -24.81396484375, -23.634765625, -22.45556640625, -21.2763671875, -20.09716796875, -18.91796875, -17.73876953125, -16.5595703125, -15.38037109375, -14.201171875, -13.02197265625, -11.8427734375, -10.66357421875, -9.484375, -8.30517578125, -7.1259765625, -5.94677734375, -4.767578125, -3.58837890625, -2.4091796875, -1.22998046875, -0.05078125, 1.12841796875, 2.3076171875, 3.48681640625, 4.666015625, 5.84521484375, 7.0244140625, 8.20361328125, 9.3828125, 10.56201171875, 11.7412109375, 12.92041015625, 14.099609375, 15.27880859375, 16.4580078125, 17.63720703125, 18.81640625, 19.99560546875, 21.1748046875, 22.35400390625, 23.533203125, 24.71240234375, 25.8916015625, 27.07080078125, 28.25]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 8.0, 16.0, 30.0, 40.0, 67.0, 137.0, 233.0, 518.0, 1378.0, 5332.0, 3771802.0, 409143.0, 3573.0, 1062.0, 444.0, 210.0, 109.0, 42.0, 33.0, 25.0, 21.0, 11.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-110.625, -106.79296875, -102.9609375, -99.12890625, -95.296875, -91.46484375, -87.6328125, -83.80078125, -79.96875, -76.13671875, -72.3046875, -68.47265625, -64.640625, -60.80859375, -56.9765625, -53.14453125, -49.3125, -45.48046875, -41.6484375, -37.81640625, -33.984375, -30.15234375, -26.3203125, -22.48828125, -18.65625, -14.82421875, -10.9921875, -7.16015625, -3.328125, 0.50390625, 4.3359375, 8.16796875, 12.0, 15.83203125, 19.6640625, 23.49609375, 27.328125, 31.16015625, 34.9921875, 38.82421875, 42.65625, 46.48828125, 50.3203125, 54.15234375, 57.984375, 61.81640625, 65.6484375, 69.48046875, 73.3125, 77.14453125, 80.9765625, 84.80859375, 88.640625, 92.47265625, 96.3046875, 100.13671875, 103.96875, 107.80078125, 111.6328125, 115.46484375, 119.296875, 123.12890625, 126.9609375, 130.79296875, 134.625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 10.0, 105.0, 517.0, 336.0, 43.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-546.1066284179688, -533.6357421875, -521.164794921875, -508.69390869140625, -496.2229919433594, -483.7521057128906, -471.28118896484375, -458.810302734375, -446.3393859863281, -433.86846923828125, -421.3975830078125, -408.9266662597656, -396.45574951171875, -383.98486328125, -371.5139465332031, -359.04302978515625, -346.5721435546875, -334.1012268066406, -321.6303405761719, -309.159423828125, -296.6885070800781, -284.2176208496094, -271.7467041015625, -259.27581787109375, -246.80487060546875, -234.33396911621094, -221.86305236816406, -209.39215087890625, -196.92124938964844, -184.45034790039062, -171.97943115234375, -159.50852966308594, -147.03762817382812, -134.5667266845703, -122.09581756591797, -109.62490844726562, -97.15400695800781, -84.68309783935547, -72.21218872070312, -59.74128723144531, -47.27037811279297, -34.79947280883789, -22.32856559753418, -9.857658386230469, 2.6132469177246094, 15.084152221679688, 27.55506134033203, 40.025962829589844, 52.49687194824219, 64.96778106689453, 77.43868255615234, 89.90959167480469, 102.3804931640625, 114.85140228271484, 127.32231140136719, 139.793212890625, 152.26412963867188, 164.7350311279297, 177.20594787597656, 189.67684936523438, 202.1477508544922, 214.61865234375, 227.08956909179688, 239.5604705810547, 252.0313720703125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 7.0, 4.0, 10.0, 10.0, 11.0, 10.0, 19.0, 12.0, 26.0, 23.0, 24.0, 36.0, 23.0, 22.0, 31.0, 28.0, 34.0, 37.0, 34.0, 32.0, 41.0, 25.0, 40.0, 44.0, 27.0, 28.0, 24.0, 34.0, 37.0, 21.0, 27.0, 26.0, 25.0, 26.0, 18.0, 11.0, 13.0, 18.0, 12.0, 9.0, 9.0, 8.0, 12.0, 7.0, 3.0, 7.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.83758544921875, -87.79442596435547, -84.75126647949219, -81.70811462402344, -78.66495513916016, -75.62179565429688, -72.5786361694336, -69.53547668457031, -66.49231719970703, -63.44915771484375, -60.406002044677734, -57.36284255981445, -54.31968307495117, -51.276527404785156, -48.233367919921875, -45.190208435058594, -42.14705276489258, -39.1038932800293, -36.06073760986328, -33.017578125, -29.97441864013672, -26.93126106262207, -23.888103485107422, -20.84494400024414, -17.801786422729492, -14.758627891540527, -11.715469360351562, -8.672311782836914, -5.629153251647949, -2.5859947204589844, 0.45716285705566406, 3.5003223419189453, 6.543479919433594, 9.586638450622559, 12.629796981811523, 15.672954559326172, 18.716114044189453, 21.7592716217041, 24.80242919921875, 27.84558868408203, 30.88874626159668, 33.93190383911133, 36.97506332397461, 40.018218994140625, 43.061378479003906, 46.10453796386719, 49.14769744873047, 52.19085693359375, 55.234012603759766, 58.27717208862305, 61.32032775878906, 64.36348724365234, 67.40664672851562, 70.4498062133789, 73.49296569824219, 76.53611755371094, 79.57927703857422, 82.6224365234375, 85.66559600830078, 88.70875549316406, 91.75190734863281, 94.7950668334961, 97.83822631835938, 100.88138580322266, 103.92454528808594]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 8.0, 8.0, 8.0, 13.0, 4.0, 14.0, 6.0, 18.0, 8.0, 22.0, 36.0, 27.0, 14.0, 36.0, 21.0, 40.0, 32.0, 30.0, 39.0, 48.0, 30.0, 32.0, 40.0, 42.0, 42.0, 39.0, 27.0, 34.0, 30.0, 32.0, 19.0, 24.0, 22.0, 16.0, 15.0, 9.0, 25.0, 18.0, 13.0, 9.0, 8.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-10.734375, -10.39599609375, -10.0576171875, -9.71923828125, -9.380859375, -9.04248046875, -8.7041015625, -8.36572265625, -8.02734375, -7.68896484375, -7.3505859375, -7.01220703125, -6.673828125, -6.33544921875, -5.9970703125, -5.65869140625, -5.3203125, -4.98193359375, -4.6435546875, -4.30517578125, -3.966796875, -3.62841796875, -3.2900390625, -2.95166015625, -2.61328125, -2.27490234375, -1.9365234375, -1.59814453125, -1.259765625, -0.92138671875, -0.5830078125, -0.24462890625, 0.09375, 0.43212890625, 0.7705078125, 1.10888671875, 1.447265625, 1.78564453125, 2.1240234375, 2.46240234375, 2.80078125, 3.13916015625, 3.4775390625, 3.81591796875, 4.154296875, 4.49267578125, 4.8310546875, 5.16943359375, 5.5078125, 5.84619140625, 6.1845703125, 6.52294921875, 6.861328125, 7.19970703125, 7.5380859375, 7.87646484375, 8.21484375, 8.55322265625, 8.8916015625, 9.22998046875, 9.568359375, 9.90673828125, 10.2451171875, 10.58349609375, 10.921875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 15.0, 22.0, 32.0, 53.0, 51.0, 128.0, 160.0, 250.0, 385.0, 560.0, 792.0, 1167.0, 1773.0, 2739.0, 3824.0, 5678.0, 8509.0, 12702.0, 18318.0, 27327.0, 41680.0, 61798.0, 91752.0, 135780.0, 185990.0, 146699.0, 98430.0, 66519.0, 44133.0, 29700.0, 19942.0, 13629.0, 9079.0, 6059.0, 4232.0, 2787.0, 1907.0, 1308.0, 872.0, 579.0, 405.0, 284.0, 180.0, 104.0, 82.0, 42.0, 26.0, 33.0, 14.0, 9.0, 8.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.1962890625, -1.160675048828125, -1.12506103515625, -1.089447021484375, -1.0538330078125, -1.018218994140625, -0.98260498046875, -0.946990966796875, -0.911376953125, -0.875762939453125, -0.84014892578125, -0.804534912109375, -0.7689208984375, -0.733306884765625, -0.69769287109375, -0.662078857421875, -0.62646484375, -0.590850830078125, -0.55523681640625, -0.519622802734375, -0.4840087890625, -0.448394775390625, -0.41278076171875, -0.377166748046875, -0.341552734375, -0.305938720703125, -0.27032470703125, -0.234710693359375, -0.1990966796875, -0.163482666015625, -0.12786865234375, -0.092254638671875, -0.056640625, -0.021026611328125, 0.01458740234375, 0.050201416015625, 0.0858154296875, 0.121429443359375, 0.15704345703125, 0.192657470703125, 0.228271484375, 0.263885498046875, 0.29949951171875, 0.335113525390625, 0.3707275390625, 0.406341552734375, 0.44195556640625, 0.477569580078125, 0.51318359375, 0.548797607421875, 0.58441162109375, 0.620025634765625, 0.6556396484375, 0.691253662109375, 0.72686767578125, 0.762481689453125, 0.798095703125, 0.833709716796875, 0.86932373046875, 0.904937744140625, 0.9405517578125, 0.976165771484375, 1.01177978515625, 1.047393798828125, 1.0830078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 10.0, 10.0, 8.0, 14.0, 12.0, 15.0, 17.0, 17.0, 14.0, 20.0, 18.0, 28.0, 26.0, 24.0, 37.0, 32.0, 27.0, 38.0, 50.0, 27.0, 1063.0, 42.0, 42.0, 39.0, 40.0, 28.0, 31.0, 25.0, 30.0, 34.0, 29.0, 29.0, 21.0, 15.0, 10.0, 16.0, 7.0, 15.0, 10.0, 11.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-7.48828125, -7.26727294921875, -7.0462646484375, -6.82525634765625, -6.604248046875, -6.38323974609375, -6.1622314453125, -5.94122314453125, -5.72021484375, -5.49920654296875, -5.2781982421875, -5.05718994140625, -4.836181640625, -4.61517333984375, -4.3941650390625, -4.17315673828125, -3.9521484375, -3.73114013671875, -3.5101318359375, -3.28912353515625, -3.068115234375, -2.84710693359375, -2.6260986328125, -2.40509033203125, -2.18408203125, -1.96307373046875, -1.7420654296875, -1.52105712890625, -1.300048828125, -1.07904052734375, -0.8580322265625, -0.63702392578125, -0.416015625, -0.19500732421875, 0.0260009765625, 0.24700927734375, 0.468017578125, 0.68902587890625, 0.9100341796875, 1.13104248046875, 1.35205078125, 1.57305908203125, 1.7940673828125, 2.01507568359375, 2.236083984375, 2.45709228515625, 2.6781005859375, 2.89910888671875, 3.1201171875, 3.34112548828125, 3.5621337890625, 3.78314208984375, 4.004150390625, 4.22515869140625, 4.4461669921875, 4.66717529296875, 4.88818359375, 5.10919189453125, 5.3302001953125, 5.55120849609375, 5.772216796875, 5.99322509765625, 6.2142333984375, 6.43524169921875, 6.65625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 6.0, 16.0, 9.0, 23.0, 34.0, 42.0, 56.0, 95.0, 96.0, 184.0, 295.0, 451.0, 635.0, 888.0, 1307.0, 1844.0, 2758.0, 4046.0, 6047.0, 8815.0, 13287.0, 20032.0, 30825.0, 46464.0, 71766.0, 111284.0, 175402.0, 1239328.0, 125875.0, 80472.0, 52343.0, 34263.0, 22273.0, 14947.0, 9922.0, 6746.0, 4617.0, 3027.0, 2082.0, 1352.0, 934.0, 720.0, 482.0, 302.0, 239.0, 180.0, 101.0, 84.0, 48.0, 48.0, 15.0, 7.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0], "bins": [-1.12109375, -1.0850830078125, -1.049072265625, -1.0130615234375, -0.97705078125, -0.9410400390625, -0.905029296875, -0.8690185546875, -0.8330078125, -0.7969970703125, -0.760986328125, -0.7249755859375, -0.68896484375, -0.6529541015625, -0.616943359375, -0.5809326171875, -0.544921875, -0.5089111328125, -0.472900390625, -0.4368896484375, -0.40087890625, -0.3648681640625, -0.328857421875, -0.2928466796875, -0.2568359375, -0.2208251953125, -0.184814453125, -0.1488037109375, -0.11279296875, -0.0767822265625, -0.040771484375, -0.0047607421875, 0.03125, 0.0672607421875, 0.103271484375, 0.1392822265625, 0.17529296875, 0.2113037109375, 0.247314453125, 0.2833251953125, 0.3193359375, 0.3553466796875, 0.391357421875, 0.4273681640625, 0.46337890625, 0.4993896484375, 0.535400390625, 0.5714111328125, 0.607421875, 0.6434326171875, 0.679443359375, 0.7154541015625, 0.75146484375, 0.7874755859375, 0.823486328125, 0.8594970703125, 0.8955078125, 0.9315185546875, 0.967529296875, 1.0035400390625, 1.03955078125, 1.0755615234375, 1.111572265625, 1.1475830078125, 1.18359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 9.0, 13.0, 18.0, 22.0, 24.0, 42.0, 50.0, 69.0, 95.0, 115.0, 96.0, 83.0, 85.0, 60.0, 58.0, 43.0, 30.0, 17.0, 16.0, 7.0, 9.0, 7.0, 3.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004001617431640625, -0.0038559436798095703, -0.0037102699279785156, -0.003564596176147461, -0.0034189224243164062, -0.0032732486724853516, -0.003127574920654297, -0.002981901168823242, -0.0028362274169921875, -0.002690553665161133, -0.002544879913330078, -0.0023992061614990234, -0.0022535324096679688, -0.002107858657836914, -0.0019621849060058594, -0.0018165111541748047, -0.00167083740234375, -0.0015251636505126953, -0.0013794898986816406, -0.001233816146850586, -0.0010881423950195312, -0.0009424686431884766, -0.0007967948913574219, -0.0006511211395263672, -0.0005054473876953125, -0.0003597736358642578, -0.00021409988403320312, -6.842613220214844e-05, 7.724761962890625e-05, 0.00022292137145996094, 0.0003685951232910156, 0.0005142688751220703, 0.000659942626953125, 0.0008056163787841797, 0.0009512901306152344, 0.001096963882446289, 0.0012426376342773438, 0.0013883113861083984, 0.0015339851379394531, 0.0016796588897705078, 0.0018253326416015625, 0.001971006393432617, 0.002116680145263672, 0.0022623538970947266, 0.0024080276489257812, 0.002553701400756836, 0.0026993751525878906, 0.0028450489044189453, 0.00299072265625, 0.0031363964080810547, 0.0032820701599121094, 0.003427743911743164, 0.0035734176635742188, 0.0037190914154052734, 0.003864765167236328, 0.004010438919067383, 0.0041561126708984375, 0.004301786422729492, 0.004447460174560547, 0.0045931339263916016, 0.004738807678222656, 0.004884481430053711, 0.005030155181884766, 0.00517582893371582, 0.005321502685546875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 16.0, 9.0, 18.0, 23.0, 40.0, 47.0, 96.0, 116.0, 165.0, 340.0, 580.0, 1283.0, 1033782.0, 10017.0, 875.0, 417.0, 233.0, 142.0, 105.0, 74.0, 49.0, 38.0, 22.0, 16.0, 10.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0943603515625, -0.09192609786987305, -0.0894918441772461, -0.08705759048461914, -0.08462333679199219, -0.08218908309936523, -0.07975482940673828, -0.07732057571411133, -0.07488632202148438, -0.07245206832885742, -0.07001781463623047, -0.06758356094360352, -0.06514930725097656, -0.06271505355834961, -0.060280799865722656, -0.0578465461730957, -0.05541229248046875, -0.0529780387878418, -0.050543785095214844, -0.04810953140258789, -0.04567527770996094, -0.043241024017333984, -0.04080677032470703, -0.03837251663208008, -0.035938262939453125, -0.03350400924682617, -0.03106975555419922, -0.028635501861572266, -0.026201248168945312, -0.02376699447631836, -0.021332740783691406, -0.018898487091064453, -0.0164642333984375, -0.014029979705810547, -0.011595726013183594, -0.00916147232055664, -0.0067272186279296875, -0.004292964935302734, -0.0018587112426757812, 0.0005755424499511719, 0.003009796142578125, 0.005444049835205078, 0.007878303527832031, 0.010312557220458984, 0.012746810913085938, 0.01518106460571289, 0.017615318298339844, 0.020049571990966797, 0.02248382568359375, 0.024918079376220703, 0.027352333068847656, 0.02978658676147461, 0.03222084045410156, 0.034655094146728516, 0.03708934783935547, 0.03952360153198242, 0.041957855224609375, 0.04439210891723633, 0.04682636260986328, 0.049260616302490234, 0.05169486999511719, 0.05412912368774414, 0.056563377380371094, 0.05899763107299805, 0.061431884765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 300.0, 678.0, 27.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005797862075269222, -0.0055241514928638935, -0.005250440910458565, -0.004976730793714523, -0.0047030202113091946, -0.004429309628903866, -0.004155599046498537, -0.0038818884640932083, -0.003608178114518523, -0.0033344675321131945, -0.0030607571825385094, -0.0027870466001331806, -0.002513336017727852, -0.0022396256681531668, -0.001965915085747838, -0.001692204619757831, -0.0014184941537678242, -0.0011447836877778172, -0.0008710731635801494, -0.0005973626393824816, -0.00032365217339247465, -4.994170740246773e-05, 0.00022376887500286102, 0.000497479340992868, 0.0007711898069828749, 0.0010449002729728818, 0.0013186107389628887, 0.0015923213213682175, 0.0018660317873582244, 0.0021397422533482313, 0.00241345283575356, 0.002687163185328245, 0.002960873767733574, 0.0032345843501389027, 0.0035082946997135878, 0.0037820052821189165, 0.004055715631693602, 0.00432942621409893, 0.004603136796504259, 0.004876847378909588, 0.005150557495653629, 0.005424268078058958, 0.005697978660464287, 0.005971688777208328, 0.006245399359613657, 0.006519109942018986, 0.0067928205244243145, 0.007066531106829643, 0.007340241689234972, 0.007613952271640301, 0.007887662388384342, 0.008161373436450958, 0.008435083553195, 0.008708793669939041, 0.008982504718005657, 0.009256214834749699, 0.009529925882816315, 0.009803635999560356, 0.010077347047626972, 0.010351057164371014, 0.01062476821243763, 0.010898478329181671, 0.011172188445925713, 0.011445899493992329, 0.01171960961073637]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 11.0, 7.0, 7.0, 7.0, 6.0, 9.0, 12.0, 21.0, 19.0, 30.0, 26.0, 39.0, 28.0, 33.0, 23.0, 29.0, 38.0, 40.0, 55.0, 37.0, 45.0, 36.0, 32.0, 41.0, 36.0, 42.0, 29.0, 34.0, 35.0, 27.0, 21.0, 22.0, 13.0, 22.0, 22.0, 14.0, 13.0, 9.0, 6.0, 7.0, 6.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00160294771194458, -0.0015491126105189323, -0.0014952775090932846, -0.0014414424076676369, -0.0013876073062419891, -0.0013337722048163414, -0.0012799371033906937, -0.001226102001965046, -0.0011722669005393982, -0.0011184317991137505, -0.0010645966976881027, -0.001010761596262455, -0.0009569264948368073, -0.0009030913934111595, -0.0008492562919855118, -0.000795421190559864, -0.0007415860891342163, -0.0006877509877085686, -0.0006339158862829208, -0.0005800807848572731, -0.0005262456834316254, -0.00047241058200597763, -0.0004185754805803299, -0.00036474037915468216, -0.0003109052777290344, -0.0002570701763033867, -0.00020323507487773895, -0.00014939997345209122, -9.556487202644348e-05, -4.1729770600795746e-05, 1.210533082485199e-05, 6.594043225049973e-05, 0.00011977553367614746, 0.0001736106351017952, 0.00022744573652744293, 0.00028128083795309067, 0.0003351159393787384, 0.00038895104080438614, 0.0004427861422300339, 0.0004966212436556816, 0.0005504563450813293, 0.0006042914465069771, 0.0006581265479326248, 0.0007119616493582726, 0.0007657967507839203, 0.000819631852209568, 0.0008734669536352158, 0.0009273020550608635, 0.0009811371564865112, 0.001034972257912159, 0.0010888073593378067, 0.0011426424607634544, 0.0011964775621891022, 0.00125031266361475, 0.0013041477650403976, 0.0013579828664660454, 0.0014118179678916931, 0.0014656530693173409, 0.0015194881707429886, 0.0015733232721686363, 0.001627158373594284, 0.0016809934750199318, 0.0017348285764455795, 0.0017886636778712273, 0.001842498779296875]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 8.0, 8.0, 8.0, 13.0, 4.0, 14.0, 6.0, 18.0, 8.0, 22.0, 36.0, 27.0, 14.0, 36.0, 21.0, 40.0, 32.0, 30.0, 40.0, 47.0, 30.0, 32.0, 40.0, 41.0, 43.0, 39.0, 27.0, 34.0, 30.0, 32.0, 19.0, 24.0, 22.0, 16.0, 15.0, 9.0, 25.0, 18.0, 13.0, 9.0, 8.0, 9.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-10.734375, -10.39599609375, -10.0576171875, -9.71923828125, -9.380859375, -9.04248046875, -8.7041015625, -8.36572265625, -8.02734375, -7.68896484375, -7.3505859375, -7.01220703125, -6.673828125, -6.33544921875, -5.9970703125, -5.65869140625, -5.3203125, -4.98193359375, -4.6435546875, -4.30517578125, -3.966796875, -3.62841796875, -3.2900390625, -2.95166015625, -2.61328125, -2.27490234375, -1.9365234375, -1.59814453125, -1.259765625, -0.92138671875, -0.5830078125, -0.24462890625, 0.09375, 0.43212890625, 0.7705078125, 1.10888671875, 1.447265625, 1.78564453125, 2.1240234375, 2.46240234375, 2.80078125, 3.13916015625, 3.4775390625, 3.81591796875, 4.154296875, 4.49267578125, 4.8310546875, 5.16943359375, 5.5078125, 5.84619140625, 6.1845703125, 6.52294921875, 6.861328125, 7.19970703125, 7.5380859375, 7.87646484375, 8.21484375, 8.55322265625, 8.8916015625, 9.22998046875, 9.568359375, 9.90673828125, 10.2451171875, 10.58349609375, 10.921875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 7.0, 12.0, 11.0, 9.0, 21.0, 20.0, 34.0, 34.0, 41.0, 67.0, 81.0, 103.0, 150.0, 241.0, 327.0, 470.0, 715.0, 1142.0, 2129.0, 4439.0, 10828.0, 32401.0, 130003.0, 590026.0, 204592.0, 44410.0, 14303.0, 5481.0, 2482.0, 1411.0, 834.0, 496.0, 319.0, 256.0, 166.0, 107.0, 90.0, 89.0, 49.0, 42.0, 27.0, 16.0, 15.0, 14.0, 13.0, 10.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.5888671875, -18.927734375, -18.2666015625, -17.60546875, -16.9443359375, -16.283203125, -15.6220703125, -14.9609375, -14.2998046875, -13.638671875, -12.9775390625, -12.31640625, -11.6552734375, -10.994140625, -10.3330078125, -9.671875, -9.0107421875, -8.349609375, -7.6884765625, -7.02734375, -6.3662109375, -5.705078125, -5.0439453125, -4.3828125, -3.7216796875, -3.060546875, -2.3994140625, -1.73828125, -1.0771484375, -0.416015625, 0.2451171875, 0.90625, 1.5673828125, 2.228515625, 2.8896484375, 3.55078125, 4.2119140625, 4.873046875, 5.5341796875, 6.1953125, 6.8564453125, 7.517578125, 8.1787109375, 8.83984375, 9.5009765625, 10.162109375, 10.8232421875, 11.484375, 12.1455078125, 12.806640625, 13.4677734375, 14.12890625, 14.7900390625, 15.451171875, 16.1123046875, 16.7734375, 17.4345703125, 18.095703125, 18.7568359375, 19.41796875, 20.0791015625, 20.740234375, 21.4013671875, 22.0625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 9.0, 11.0, 14.0, 12.0, 21.0, 16.0, 20.0, 17.0, 41.0, 24.0, 41.0, 41.0, 56.0, 80.0, 94.0, 258.0, 1680.0, 153.0, 75.0, 65.0, 59.0, 41.0, 25.0, 35.0, 30.0, 20.0, 20.0, 11.0, 15.0, 9.0, 13.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-37.5, -36.375, -35.25, -34.125, -33.0, -31.875, -30.75, -29.625, -28.5, -27.375, -26.25, -25.125, -24.0, -22.875, -21.75, -20.625, -19.5, -18.375, -17.25, -16.125, -15.0, -13.875, -12.75, -11.625, -10.5, -9.375, -8.25, -7.125, -6.0, -4.875, -3.75, -2.625, -1.5, -0.375, 0.75, 1.875, 3.0, 4.125, 5.25, 6.375, 7.5, 8.625, 9.75, 10.875, 12.0, 13.125, 14.25, 15.375, 16.5, 17.625, 18.75, 19.875, 21.0, 22.125, 23.25, 24.375, 25.5, 26.625, 27.75, 28.875, 30.0, 31.125, 32.25, 33.375, 34.5]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 8.0, 9.0, 12.0, 13.0, 12.0, 29.0, 32.0, 42.0, 38.0, 68.0, 144.0, 257.0, 529.0, 1158.0, 76885.0, 3062774.0, 2128.0, 656.0, 337.0, 183.0, 107.0, 53.0, 50.0, 31.0, 28.0, 18.0, 13.0, 17.0, 13.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-108.375, -105.0048828125, -101.634765625, -98.2646484375, -94.89453125, -91.5244140625, -88.154296875, -84.7841796875, -81.4140625, -78.0439453125, -74.673828125, -71.3037109375, -67.93359375, -64.5634765625, -61.193359375, -57.8232421875, -54.453125, -51.0830078125, -47.712890625, -44.3427734375, -40.97265625, -37.6025390625, -34.232421875, -30.8623046875, -27.4921875, -24.1220703125, -20.751953125, -17.3818359375, -14.01171875, -10.6416015625, -7.271484375, -3.9013671875, -0.53125, 2.8388671875, 6.208984375, 9.5791015625, 12.94921875, 16.3193359375, 19.689453125, 23.0595703125, 26.4296875, 29.7998046875, 33.169921875, 36.5400390625, 39.91015625, 43.2802734375, 46.650390625, 50.0205078125, 53.390625, 56.7607421875, 60.130859375, 63.5009765625, 66.87109375, 70.2412109375, 73.611328125, 76.9814453125, 80.3515625, 83.7216796875, 87.091796875, 90.4619140625, 93.83203125, 97.2021484375, 100.572265625, 103.9423828125, 107.3125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 121.0, 878.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-455.6017761230469, -444.0265808105469, -432.45135498046875, -420.87615966796875, -409.30096435546875, -397.72576904296875, -386.15057373046875, -374.5753479003906, -363.0001525878906, -351.4249572753906, -339.8497314453125, -328.2745361328125, -316.6993408203125, -305.1241455078125, -293.5489501953125, -281.9737243652344, -270.3985290527344, -258.8233337402344, -247.2481231689453, -235.67291259765625, -224.09771728515625, -212.52252197265625, -200.9473114013672, -189.37210083007812, -177.79690551757812, -166.22171020507812, -154.64649963378906, -143.0712890625, -131.49609375, -119.92089080810547, -108.34568786621094, -96.7704849243164, -85.19525146484375, -73.62004852294922, -62.04484558105469, -50.469642639160156, -38.894439697265625, -27.319236755371094, -15.744033813476562, -4.168830871582031, 7.4063720703125, 18.98157501220703, 30.556777954101562, 42.131980895996094, 53.707183837890625, 65.28238677978516, 76.85758972167969, 88.43279266357422, 100.00799560546875, 111.58319854736328, 123.15840148925781, 134.73361206054688, 146.30880737304688, 157.88400268554688, 169.45921325683594, 181.034423828125, 192.609619140625, 204.184814453125, 215.76002502441406, 227.33523559570312, 238.91043090820312, 250.48562622070312, 262.06085205078125, 273.63604736328125, 285.21124267578125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 7.0, 5.0, 5.0, 7.0, 8.0, 22.0, 13.0, 25.0, 22.0, 18.0, 21.0, 24.0, 33.0, 33.0, 30.0, 36.0, 40.0, 35.0, 46.0, 43.0, 43.0, 45.0, 35.0, 31.0, 41.0, 40.0, 31.0, 44.0, 29.0, 39.0, 19.0, 20.0, 17.0, 15.0, 18.0, 15.0, 7.0, 10.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-88.51687622070312, -85.93806457519531, -83.3592529296875, -80.78043365478516, -78.20162200927734, -75.62281036376953, -73.04399871826172, -70.46517944335938, -67.88636779785156, -65.30755615234375, -62.72874069213867, -60.14992904663086, -57.57111358642578, -54.99230194091797, -52.413490295410156, -49.83467483520508, -47.255863189697266, -44.67705154418945, -42.098236083984375, -39.51942443847656, -36.940608978271484, -34.36179733276367, -31.782983779907227, -29.20417022705078, -26.625356674194336, -24.04654312133789, -21.467729568481445, -18.888916015625, -16.310104370117188, -13.731289863586426, -11.152477264404297, -8.573663711547852, -5.994850158691406, -3.41603684425354, -0.8372235298156738, 1.7415895462036133, 4.320403099060059, 6.899216651916504, 9.478029251098633, 12.056842803955078, 14.635656356811523, 17.21446990966797, 19.793283462524414, 22.37209701538086, 24.950908660888672, 27.52972412109375, 30.108535766601562, 32.687347412109375, 35.26616287231445, 37.844974517822266, 40.423789978027344, 43.002601623535156, 45.581417083740234, 48.16022872924805, 50.739044189453125, 53.31785583496094, 55.89666748046875, 58.47547912597656, 61.05429458618164, 63.63310623168945, 66.21192169189453, 68.79073333740234, 71.36954498291016, 73.9483642578125, 76.52717590332031]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 11.0, 10.0, 7.0, 17.0, 12.0, 17.0, 22.0, 17.0, 26.0, 26.0, 35.0, 29.0, 34.0, 44.0, 41.0, 40.0, 50.0, 34.0, 43.0, 48.0, 37.0, 42.0, 35.0, 34.0, 37.0, 26.0, 22.0, 28.0, 23.0, 26.0, 14.0, 14.0, 11.0, 16.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.7032470703125, -11.258056640625, -10.8128662109375, -10.36767578125, -9.9224853515625, -9.477294921875, -9.0321044921875, -8.5869140625, -8.1417236328125, -7.696533203125, -7.2513427734375, -6.80615234375, -6.3609619140625, -5.915771484375, -5.4705810546875, -5.025390625, -4.5802001953125, -4.135009765625, -3.6898193359375, -3.24462890625, -2.7994384765625, -2.354248046875, -1.9090576171875, -1.4638671875, -1.0186767578125, -0.573486328125, -0.1282958984375, 0.31689453125, 0.7620849609375, 1.207275390625, 1.6524658203125, 2.09765625, 2.5428466796875, 2.988037109375, 3.4332275390625, 3.87841796875, 4.3236083984375, 4.768798828125, 5.2139892578125, 5.6591796875, 6.1043701171875, 6.549560546875, 6.9947509765625, 7.43994140625, 7.8851318359375, 8.330322265625, 8.7755126953125, 9.220703125, 9.6658935546875, 10.111083984375, 10.5562744140625, 11.00146484375, 11.4466552734375, 11.891845703125, 12.3370361328125, 12.7822265625, 13.2274169921875, 13.672607421875, 14.1177978515625, 14.56298828125, 15.0081787109375, 15.453369140625, 15.8985595703125, 16.34375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 12.0, 11.0, 17.0, 23.0, 40.0, 34.0, 46.0, 59.0, 61.0, 85.0, 116.0, 176.0, 225.0, 318.0, 469.0, 880.0, 2177.0, 15473.0, 3759030.0, 407319.0, 4312.0, 1344.0, 606.0, 381.0, 250.0, 200.0, 126.0, 90.0, 73.0, 65.0, 55.0, 48.0, 29.0, 30.0, 21.0, 12.0, 20.0, 10.0, 7.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.6875, -91.3935546875, -88.099609375, -84.8056640625, -81.51171875, -78.2177734375, -74.923828125, -71.6298828125, -68.3359375, -65.0419921875, -61.748046875, -58.4541015625, -55.16015625, -51.8662109375, -48.572265625, -45.2783203125, -41.984375, -38.6904296875, -35.396484375, -32.1025390625, -28.80859375, -25.5146484375, -22.220703125, -18.9267578125, -15.6328125, -12.3388671875, -9.044921875, -5.7509765625, -2.45703125, 0.8369140625, 4.130859375, 7.4248046875, 10.71875, 14.0126953125, 17.306640625, 20.6005859375, 23.89453125, 27.1884765625, 30.482421875, 33.7763671875, 37.0703125, 40.3642578125, 43.658203125, 46.9521484375, 50.24609375, 53.5400390625, 56.833984375, 60.1279296875, 63.421875, 66.7158203125, 70.009765625, 73.3037109375, 76.59765625, 79.8916015625, 83.185546875, 86.4794921875, 89.7734375, 93.0673828125, 96.361328125, 99.6552734375, 102.94921875, 106.2431640625, 109.537109375, 112.8310546875, 116.125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 6.0, 6.0, 12.0, 29.0, 52.0, 84.0, 173.0, 409.0, 817.0, 1036.0, 739.0, 365.0, 168.0, 69.0, 40.0, 23.0, 13.0, 8.0, 8.0, 5.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.625, -42.31982421875, -41.0146484375, -39.70947265625, -38.404296875, -37.09912109375, -35.7939453125, -34.48876953125, -33.18359375, -31.87841796875, -30.5732421875, -29.26806640625, -27.962890625, -26.65771484375, -25.3525390625, -24.04736328125, -22.7421875, -21.43701171875, -20.1318359375, -18.82666015625, -17.521484375, -16.21630859375, -14.9111328125, -13.60595703125, -12.30078125, -10.99560546875, -9.6904296875, -8.38525390625, -7.080078125, -5.77490234375, -4.4697265625, -3.16455078125, -1.859375, -0.55419921875, 0.7509765625, 2.05615234375, 3.361328125, 4.66650390625, 5.9716796875, 7.27685546875, 8.58203125, 9.88720703125, 11.1923828125, 12.49755859375, 13.802734375, 15.10791015625, 16.4130859375, 17.71826171875, 19.0234375, 20.32861328125, 21.6337890625, 22.93896484375, 24.244140625, 25.54931640625, 26.8544921875, 28.15966796875, 29.46484375, 30.77001953125, 32.0751953125, 33.38037109375, 34.685546875, 35.99072265625, 37.2958984375, 38.60107421875, 39.90625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 10.0, 15.0, 18.0, 42.0, 78.0, 121.0, 302.0, 699.0, 2094.0, 10026.0, 189680.0, 3810705.0, 167694.0, 9514.0, 2002.0, 659.0, 288.0, 148.0, 65.0, 34.0, 21.0, 14.0, 9.0, 6.0, 4.0, 7.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.5, -41.05859375, -39.6171875, -38.17578125, -36.734375, -35.29296875, -33.8515625, -32.41015625, -30.96875, -29.52734375, -28.0859375, -26.64453125, -25.203125, -23.76171875, -22.3203125, -20.87890625, -19.4375, -17.99609375, -16.5546875, -15.11328125, -13.671875, -12.23046875, -10.7890625, -9.34765625, -7.90625, -6.46484375, -5.0234375, -3.58203125, -2.140625, -0.69921875, 0.7421875, 2.18359375, 3.625, 5.06640625, 6.5078125, 7.94921875, 9.390625, 10.83203125, 12.2734375, 13.71484375, 15.15625, 16.59765625, 18.0390625, 19.48046875, 20.921875, 22.36328125, 23.8046875, 25.24609375, 26.6875, 28.12890625, 29.5703125, 31.01171875, 32.453125, 33.89453125, 35.3359375, 36.77734375, 38.21875, 39.66015625, 41.1015625, 42.54296875, 43.984375, 45.42578125, 46.8671875, 48.30859375, 49.75]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 15.0, 14.0, 48.0, 85.0, 160.0, 191.0, 173.0, 139.0, 105.0, 40.0, 19.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.97997283935547, -60.34026336669922, -52.70055389404297, -45.06084060668945, -37.4211311340332, -29.781421661376953, -22.141708374023438, -14.501998901367188, -6.8622894287109375, 0.7774209976196289, 8.417131423950195, 16.056842803955078, 23.696552276611328, 31.336261749267578, 38.975975036621094, 46.615684509277344, 54.255393981933594, 61.895103454589844, 69.5348129272461, 77.17453002929688, 84.81423950195312, 92.45394897460938, 100.09365844726562, 107.73336791992188, 115.37307739257812, 123.01278686523438, 130.65249633789062, 138.29220581054688, 145.93191528320312, 153.57162475585938, 161.21133422851562, 168.85104370117188, 176.49075317382812, 184.13046264648438, 191.77017211914062, 199.40988159179688, 207.04959106445312, 214.68930053710938, 222.32901000976562, 229.96871948242188, 237.60842895507812, 245.24813842773438, 252.88784790039062, 260.5275573730469, 268.1672668457031, 275.8069763183594, 283.4466857910156, 291.0863952636719, 298.72613525390625, 306.3658447265625, 314.00555419921875, 321.645263671875, 329.28497314453125, 336.9246826171875, 344.56439208984375, 352.2041015625, 359.84381103515625, 367.4835205078125, 375.12322998046875, 382.762939453125, 390.40264892578125, 398.0423583984375, 405.68206787109375, 413.32177734375, 420.96148681640625]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 6.0, 11.0, 14.0, 6.0, 13.0, 17.0, 21.0, 21.0, 36.0, 28.0, 42.0, 35.0, 38.0, 42.0, 47.0, 42.0, 36.0, 44.0, 43.0, 39.0, 49.0, 33.0, 41.0, 47.0, 38.0, 21.0, 33.0, 26.0, 17.0, 16.0, 19.0, 16.0, 8.0, 16.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.54390716552734, -73.96456909179688, -71.38522338867188, -68.80587768554688, -66.2265396118164, -63.64719772338867, -61.06785583496094, -58.4885139465332, -55.90917205810547, -53.329830169677734, -50.75048828125, -48.171146392822266, -45.59180450439453, -43.0124626159668, -40.43312072753906, -37.85377883911133, -35.274436950683594, -32.69509506225586, -30.115753173828125, -27.53641128540039, -24.957069396972656, -22.377727508544922, -19.798385620117188, -17.219043731689453, -14.639701843261719, -12.060359954833984, -9.48101806640625, -6.901676177978516, -4.322334289550781, -1.7429924011230469, 0.8363494873046875, 3.415691375732422, 5.995025634765625, 8.57436752319336, 11.153709411621094, 13.733051300048828, 16.312393188476562, 18.891735076904297, 21.47107696533203, 24.050418853759766, 26.6297607421875, 29.209102630615234, 31.78844451904297, 34.3677864074707, 36.94712829589844, 39.52647018432617, 42.105812072753906, 44.68515396118164, 47.264495849609375, 49.84383773803711, 52.423179626464844, 55.00252151489258, 57.58186340332031, 60.16120529174805, 62.74054718017578, 65.31988525390625, 67.89923095703125, 70.47857666015625, 73.05791473388672, 75.63725280761719, 78.21659851074219, 80.79594421386719, 83.37528228759766, 85.95462036132812, 88.53396606445312]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 8.0, 12.0, 6.0, 11.0, 13.0, 13.0, 11.0, 17.0, 21.0, 27.0, 35.0, 45.0, 26.0, 43.0, 51.0, 55.0, 35.0, 51.0, 42.0, 40.0, 43.0, 52.0, 40.0, 45.0, 33.0, 32.0, 29.0, 19.0, 28.0, 21.0, 24.0, 9.0, 15.0, 13.0, 8.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.625, -121.380859375, -117.13671875, -112.892578125, -108.6484375, -104.404296875, -100.16015625, -95.916015625, -91.671875, -87.427734375, -83.18359375, -78.939453125, -74.6953125, -70.451171875, -66.20703125, -61.962890625, -57.71875, -53.474609375, -49.23046875, -44.986328125, -40.7421875, -36.498046875, -32.25390625, -28.009765625, -23.765625, -19.521484375, -15.27734375, -11.033203125, -6.7890625, -2.544921875, 1.69921875, 5.943359375, 10.1875, 14.431640625, 18.67578125, 22.919921875, 27.1640625, 31.408203125, 35.65234375, 39.896484375, 44.140625, 48.384765625, 52.62890625, 56.873046875, 61.1171875, 65.361328125, 69.60546875, 73.849609375, 78.09375, 82.337890625, 86.58203125, 90.826171875, 95.0703125, 99.314453125, 103.55859375, 107.802734375, 112.046875, 116.291015625, 120.53515625, 124.779296875, 129.0234375, 133.267578125, 137.51171875, 141.755859375, 146.0]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 11.0, 17.0, 17.0, 41.0, 44.0, 78.0, 123.0, 199.0, 344.0, 573.0, 824.0, 1356.0, 2245.0, 3641.0, 5944.0, 9996.0, 16073.0, 27057.0, 45498.0, 78062.0, 134245.0, 224577.0, 205247.0, 119846.0, 69856.0, 41082.0, 24129.0, 14488.0, 8839.0, 5400.0, 3308.0, 2066.0, 1215.0, 783.0, 488.0, 317.0, 199.0, 113.0, 66.0, 52.0, 35.0, 18.0, 16.0, 6.0, 3.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.513427734375, -16.96435546875, -16.415283203125, -15.8662109375, -15.317138671875, -14.76806640625, -14.218994140625, -13.669921875, -13.120849609375, -12.57177734375, -12.022705078125, -11.4736328125, -10.924560546875, -10.37548828125, -9.826416015625, -9.27734375, -8.728271484375, -8.17919921875, -7.630126953125, -7.0810546875, -6.531982421875, -5.98291015625, -5.433837890625, -4.884765625, -4.335693359375, -3.78662109375, -3.237548828125, -2.6884765625, -2.139404296875, -1.59033203125, -1.041259765625, -0.4921875, 0.056884765625, 0.60595703125, 1.155029296875, 1.7041015625, 2.253173828125, 2.80224609375, 3.351318359375, 3.900390625, 4.449462890625, 4.99853515625, 5.547607421875, 6.0966796875, 6.645751953125, 7.19482421875, 7.743896484375, 8.29296875, 8.842041015625, 9.39111328125, 9.940185546875, 10.4892578125, 11.038330078125, 11.58740234375, 12.136474609375, 12.685546875, 13.234619140625, 13.78369140625, 14.332763671875, 14.8818359375, 15.430908203125, 15.97998046875, 16.529052734375, 17.078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 2.0, 6.0, 9.0, 12.0, 13.0, 14.0, 21.0, 22.0, 22.0, 24.0, 35.0, 29.0, 35.0, 32.0, 36.0, 45.0, 43.0, 27.0, 37.0, 1070.0, 37.0, 42.0, 38.0, 39.0, 36.0, 34.0, 34.0, 31.0, 20.0, 31.0, 16.0, 18.0, 14.0, 19.0, 18.0, 12.0, 7.0, 15.0, 2.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-75.125, -72.7548828125, -70.384765625, -68.0146484375, -65.64453125, -63.2744140625, -60.904296875, -58.5341796875, -56.1640625, -53.7939453125, -51.423828125, -49.0537109375, -46.68359375, -44.3134765625, -41.943359375, -39.5732421875, -37.203125, -34.8330078125, -32.462890625, -30.0927734375, -27.72265625, -25.3525390625, -22.982421875, -20.6123046875, -18.2421875, -15.8720703125, -13.501953125, -11.1318359375, -8.76171875, -6.3916015625, -4.021484375, -1.6513671875, 0.71875, 3.0888671875, 5.458984375, 7.8291015625, 10.19921875, 12.5693359375, 14.939453125, 17.3095703125, 19.6796875, 22.0498046875, 24.419921875, 26.7900390625, 29.16015625, 31.5302734375, 33.900390625, 36.2705078125, 38.640625, 41.0107421875, 43.380859375, 45.7509765625, 48.12109375, 50.4912109375, 52.861328125, 55.2314453125, 57.6015625, 59.9716796875, 62.341796875, 64.7119140625, 67.08203125, 69.4521484375, 71.822265625, 74.1923828125, 76.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 17.0, 30.0, 35.0, 53.0, 90.0, 151.0, 183.0, 311.0, 469.0, 549.0, 898.0, 1287.0, 1900.0, 2835.0, 4134.0, 6415.0, 9610.0, 14561.0, 21894.0, 33684.0, 51765.0, 81799.0, 130350.0, 1246862.0, 175825.0, 111310.0, 69969.0, 44599.0, 28595.0, 19052.0, 12756.0, 8246.0, 5420.0, 3725.0, 2505.0, 1725.0, 1119.0, 805.0, 533.0, 333.0, 215.0, 170.0, 119.0, 73.0, 56.0, 26.0, 20.0, 19.0, 13.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-12.8515625, -12.44775390625, -12.0439453125, -11.64013671875, -11.236328125, -10.83251953125, -10.4287109375, -10.02490234375, -9.62109375, -9.21728515625, -8.8134765625, -8.40966796875, -8.005859375, -7.60205078125, -7.1982421875, -6.79443359375, -6.390625, -5.98681640625, -5.5830078125, -5.17919921875, -4.775390625, -4.37158203125, -3.9677734375, -3.56396484375, -3.16015625, -2.75634765625, -2.3525390625, -1.94873046875, -1.544921875, -1.14111328125, -0.7373046875, -0.33349609375, 0.0703125, 0.47412109375, 0.8779296875, 1.28173828125, 1.685546875, 2.08935546875, 2.4931640625, 2.89697265625, 3.30078125, 3.70458984375, 4.1083984375, 4.51220703125, 4.916015625, 5.31982421875, 5.7236328125, 6.12744140625, 6.53125, 6.93505859375, 7.3388671875, 7.74267578125, 8.146484375, 8.55029296875, 8.9541015625, 9.35791015625, 9.76171875, 10.16552734375, 10.5693359375, 10.97314453125, 11.376953125, 11.78076171875, 12.1845703125, 12.58837890625, 12.9921875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 6.0, 8.0, 8.0, 17.0, 17.0, 30.0, 42.0, 54.0, 62.0, 61.0, 83.0, 87.0, 86.0, 81.0, 69.0, 63.0, 53.0, 42.0, 34.0, 24.0, 15.0, 8.0, 9.0, 9.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035980224609375, -0.03482484817504883, -0.033669471740722656, -0.032514095306396484, -0.03135871887207031, -0.03020334243774414, -0.02904796600341797, -0.027892589569091797, -0.026737213134765625, -0.025581836700439453, -0.02442646026611328, -0.02327108383178711, -0.022115707397460938, -0.020960330963134766, -0.019804954528808594, -0.018649578094482422, -0.01749420166015625, -0.016338825225830078, -0.015183448791503906, -0.014028072357177734, -0.012872695922851562, -0.01171731948852539, -0.010561943054199219, -0.009406566619873047, -0.008251190185546875, -0.007095813751220703, -0.005940437316894531, -0.004785060882568359, -0.0036296844482421875, -0.0024743080139160156, -0.0013189315795898438, -0.00016355514526367188, 0.0009918212890625, 0.002147197723388672, 0.0033025741577148438, 0.004457950592041016, 0.0056133270263671875, 0.006768703460693359, 0.007924079895019531, 0.009079456329345703, 0.010234832763671875, 0.011390209197998047, 0.012545585632324219, 0.01370096206665039, 0.014856338500976562, 0.016011714935302734, 0.017167091369628906, 0.018322467803955078, 0.01947784423828125, 0.020633220672607422, 0.021788597106933594, 0.022943973541259766, 0.024099349975585938, 0.02525472640991211, 0.02641010284423828, 0.027565479278564453, 0.028720855712890625, 0.029876232147216797, 0.03103160858154297, 0.03218698501586914, 0.03334236145019531, 0.034497737884521484, 0.035653114318847656, 0.03680849075317383, 0.0379638671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 7.0, 14.0, 23.0, 21.0, 27.0, 44.0, 66.0, 86.0, 147.0, 255.0, 476.0, 870.0, 1908.0, 4954.0, 22237.0, 294574.0, 655178.0, 54127.0, 8208.0, 2661.0, 1214.0, 549.0, 326.0, 198.0, 108.0, 67.0, 45.0, 32.0, 33.0, 25.0, 13.0, 12.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.298095703125, -0.28911590576171875, -0.2801361083984375, -0.27115631103515625, -0.262176513671875, -0.25319671630859375, -0.2442169189453125, -0.23523712158203125, -0.22625732421875, -0.21727752685546875, -0.2082977294921875, -0.19931793212890625, -0.190338134765625, -0.18135833740234375, -0.1723785400390625, -0.16339874267578125, -0.1544189453125, -0.14543914794921875, -0.1364593505859375, -0.12747955322265625, -0.118499755859375, -0.10951995849609375, -0.1005401611328125, -0.09156036376953125, -0.08258056640625, -0.07360076904296875, -0.0646209716796875, -0.05564117431640625, -0.046661376953125, -0.03768157958984375, -0.0287017822265625, -0.01972198486328125, -0.0107421875, -0.00176239013671875, 0.0072174072265625, 0.01619720458984375, 0.025177001953125, 0.03415679931640625, 0.0431365966796875, 0.05211639404296875, 0.06109619140625, 0.07007598876953125, 0.0790557861328125, 0.08803558349609375, 0.097015380859375, 0.10599517822265625, 0.1149749755859375, 0.12395477294921875, 0.1329345703125, 0.14191436767578125, 0.1508941650390625, 0.15987396240234375, 0.168853759765625, 0.17783355712890625, 0.1868133544921875, 0.19579315185546875, 0.20477294921875, 0.21375274658203125, 0.2227325439453125, 0.23171234130859375, 0.240692138671875, 0.24967193603515625, 0.2586517333984375, 0.26763153076171875, 0.276611328125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 10.0, 13.0, 40.0, 99.0, 135.0, 232.0, 195.0, 120.0, 72.0, 37.0, 20.0, 14.0, 9.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025282271206378937, -0.023666420951485634, -0.02205057069659233, -0.020434722304344177, -0.018818870186805725, -0.01720302179455757, -0.015587171539664268, -0.013971321284770966, -0.012355471029877663, -0.01073962077498436, -0.009123770520091057, -0.0075079211965203285, -0.005892070941627026, -0.004276220686733723, -0.0026603713631629944, -0.0010445211082696915, 0.0005713291466236115, 0.0021871791686862707, 0.00380302919074893, 0.005418878979980946, 0.0070347292348742485, 0.008650579489767551, 0.01026642881333828, 0.011882279068231583, 0.013498129323124886, 0.015113979578018188, 0.01672982983291149, 0.018345680087804794, 0.019961528480052948, 0.0215773805975914, 0.023193228989839554, 0.024809079244732857, 0.02642492949962616, 0.028040779754519463, 0.029656630009412766, 0.03127247840166092, 0.03288833051919937, 0.034504178911447525, 0.03612002730369568, 0.03773587942123413, 0.03935173153877258, 0.04096757993102074, 0.04258343204855919, 0.04419928044080734, 0.045815132558345795, 0.04743098095059395, 0.0490468293428421, 0.050662681460380554, 0.05227852985262871, 0.05389437824487686, 0.055510230362415314, 0.05712607875466347, 0.05874193087220192, 0.06035777926445007, 0.061973631381988525, 0.06358948349952698, 0.06520532816648483, 0.06682118028402328, 0.06843702495098114, 0.07005287706851959, 0.07166872918605804, 0.0732845813035965, 0.07490042597055435, 0.0765162780880928, 0.07813213020563126]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 9.0, 8.0, 5.0, 7.0, 8.0, 11.0, 9.0, 24.0, 17.0, 18.0, 25.0, 32.0, 34.0, 32.0, 41.0, 30.0, 44.0, 41.0, 44.0, 43.0, 37.0, 44.0, 29.0, 39.0, 37.0, 41.0, 37.0, 34.0, 27.0, 37.0, 22.0, 21.0, 18.0, 19.0, 17.0, 13.0, 9.0, 7.0, 6.0, 2.0, 6.0, 2.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.015754342079162598, -0.01525197084993124, -0.014749599620699883, -0.014247228391468525, -0.013744857162237167, -0.01324248593300581, -0.012740114703774452, -0.012237743474543095, -0.011735372245311737, -0.01123300101608038, -0.010730629786849022, -0.010228258557617664, -0.009725887328386307, -0.00922351609915495, -0.008721144869923592, -0.008218773640692234, -0.0077164024114608765, -0.007214031182229519, -0.006711659952998161, -0.006209288723766804, -0.005706917494535446, -0.005204546265304089, -0.004702175036072731, -0.0041998038068413734, -0.003697432577610016, -0.0031950613483786583, -0.0026926901191473007, -0.002190318889915943, -0.0016879476606845856, -0.001185576431453228, -0.0006832052022218704, -0.00018083397299051285, 0.0003215372562408447, 0.0008239084854722023, 0.0013262797147035599, 0.0018286509439349174, 0.002331022173166275, 0.0028333934023976326, 0.00333576463162899, 0.0038381358608603477, 0.004340507090091705, 0.004842878319323063, 0.0053452495485544205, 0.005847620777785778, 0.006349992007017136, 0.006852363236248493, 0.007354734465479851, 0.007857105694711208, 0.008359476923942566, 0.008861848153173923, 0.009364219382405281, 0.009866590611636639, 0.010368961840867996, 0.010871333070099354, 0.011373704299330711, 0.011876075528562069, 0.012378446757793427, 0.012880817987024784, 0.013383189216256142, 0.0138855604454875, 0.014387931674718857, 0.014890302903950214, 0.015392674133181572, 0.015895046293735504, 0.016397416591644287]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 9.0, 10.0, 6.0, 12.0, 13.0, 13.0, 11.0, 17.0, 21.0, 29.0, 33.0, 45.0, 26.0, 43.0, 51.0, 54.0, 36.0, 52.0, 41.0, 40.0, 43.0, 50.0, 42.0, 45.0, 32.0, 33.0, 29.0, 19.0, 28.0, 21.0, 24.0, 9.0, 15.0, 13.0, 8.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.6875, -121.4423828125, -117.197265625, -112.9521484375, -108.70703125, -104.4619140625, -100.216796875, -95.9716796875, -91.7265625, -87.4814453125, -83.236328125, -78.9912109375, -74.74609375, -70.5009765625, -66.255859375, -62.0107421875, -57.765625, -53.5205078125, -49.275390625, -45.0302734375, -40.78515625, -36.5400390625, -32.294921875, -28.0498046875, -23.8046875, -19.5595703125, -15.314453125, -11.0693359375, -6.82421875, -2.5791015625, 1.666015625, 5.9111328125, 10.15625, 14.4013671875, 18.646484375, 22.8916015625, 27.13671875, 31.3818359375, 35.626953125, 39.8720703125, 44.1171875, 48.3623046875, 52.607421875, 56.8525390625, 61.09765625, 65.3427734375, 69.587890625, 73.8330078125, 78.078125, 82.3232421875, 86.568359375, 90.8134765625, 95.05859375, 99.3037109375, 103.548828125, 107.7939453125, 112.0390625, 116.2841796875, 120.529296875, 124.7744140625, 129.01953125, 133.2646484375, 137.509765625, 141.7548828125, 146.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 8.0, 12.0, 14.0, 16.0, 20.0, 41.0, 45.0, 60.0, 115.0, 159.0, 257.0, 514.0, 910.0, 1521.0, 3244.0, 7414.0, 21610.0, 101059.0, 591186.0, 256729.0, 42256.0, 11784.0, 4543.0, 2235.0, 1166.0, 616.0, 341.0, 216.0, 141.0, 85.0, 58.0, 52.0, 24.0, 20.0, 19.0, 12.0, 16.0, 8.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.0, -34.86572265625, -33.7314453125, -32.59716796875, -31.462890625, -30.32861328125, -29.1943359375, -28.06005859375, -26.92578125, -25.79150390625, -24.6572265625, -23.52294921875, -22.388671875, -21.25439453125, -20.1201171875, -18.98583984375, -17.8515625, -16.71728515625, -15.5830078125, -14.44873046875, -13.314453125, -12.18017578125, -11.0458984375, -9.91162109375, -8.77734375, -7.64306640625, -6.5087890625, -5.37451171875, -4.240234375, -3.10595703125, -1.9716796875, -0.83740234375, 0.296875, 1.43115234375, 2.5654296875, 3.69970703125, 4.833984375, 5.96826171875, 7.1025390625, 8.23681640625, 9.37109375, 10.50537109375, 11.6396484375, 12.77392578125, 13.908203125, 15.04248046875, 16.1767578125, 17.31103515625, 18.4453125, 19.57958984375, 20.7138671875, 21.84814453125, 22.982421875, 24.11669921875, 25.2509765625, 26.38525390625, 27.51953125, 28.65380859375, 29.7880859375, 30.92236328125, 32.056640625, 33.19091796875, 34.3251953125, 35.45947265625, 36.59375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 7.0, 12.0, 15.0, 19.0, 30.0, 37.0, 56.0, 68.0, 81.0, 91.0, 2133.0, 119.0, 76.0, 80.0, 61.0, 51.0, 27.0, 27.0, 29.0, 10.0, 4.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-451.75, -439.46484375, -427.1796875, -414.89453125, -402.609375, -390.32421875, -378.0390625, -365.75390625, -353.46875, -341.18359375, -328.8984375, -316.61328125, -304.328125, -292.04296875, -279.7578125, -267.47265625, -255.1875, -242.90234375, -230.6171875, -218.33203125, -206.046875, -193.76171875, -181.4765625, -169.19140625, -156.90625, -144.62109375, -132.3359375, -120.05078125, -107.765625, -95.48046875, -83.1953125, -70.91015625, -58.625, -46.33984375, -34.0546875, -21.76953125, -9.484375, 2.80078125, 15.0859375, 27.37109375, 39.65625, 51.94140625, 64.2265625, 76.51171875, 88.796875, 101.08203125, 113.3671875, 125.65234375, 137.9375, 150.22265625, 162.5078125, 174.79296875, 187.078125, 199.36328125, 211.6484375, 223.93359375, 236.21875, 248.50390625, 260.7890625, 273.07421875, 285.359375, 297.64453125, 309.9296875, 322.21484375, 334.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 8.0, 21.0, 37.0, 101.0, 221.0, 413.0, 1165.0, 5408.0, 2800223.0, 332367.0, 4076.0, 933.0, 359.0, 198.0, 75.0, 43.0, 23.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-135.375, -131.3857421875, -127.396484375, -123.4072265625, -119.41796875, -115.4287109375, -111.439453125, -107.4501953125, -103.4609375, -99.4716796875, -95.482421875, -91.4931640625, -87.50390625, -83.5146484375, -79.525390625, -75.5361328125, -71.546875, -67.5576171875, -63.568359375, -59.5791015625, -55.58984375, -51.6005859375, -47.611328125, -43.6220703125, -39.6328125, -35.6435546875, -31.654296875, -27.6650390625, -23.67578125, -19.6865234375, -15.697265625, -11.7080078125, -7.71875, -3.7294921875, 0.259765625, 4.2490234375, 8.23828125, 12.2275390625, 16.216796875, 20.2060546875, 24.1953125, 28.1845703125, 32.173828125, 36.1630859375, 40.15234375, 44.1416015625, 48.130859375, 52.1201171875, 56.109375, 60.0986328125, 64.087890625, 68.0771484375, 72.06640625, 76.0556640625, 80.044921875, 84.0341796875, 88.0234375, 92.0126953125, 96.001953125, 99.9912109375, 103.98046875, 107.9697265625, 111.958984375, 115.9482421875, 119.9375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 8.0, 23.0, 48.0, 105.0, 198.0, 232.0, 177.0, 83.0, 46.0, 27.0, 13.0, 8.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-252.2066650390625, -237.6568603515625, -223.1070556640625, -208.55726623535156, -194.00746154785156, -179.45765686035156, -164.90786743164062, -150.35806274414062, -135.80825805664062, -121.25845336914062, -106.70865631103516, -92.15885925292969, -77.60905456542969, -63.05924987792969, -48.50945281982422, -33.95965576171875, -19.40985107421875, -4.860050201416016, 9.689750671386719, 24.239551544189453, 38.78935241699219, 53.33915710449219, 67.88895416259766, 82.43875122070312, 96.98855590820312, 111.53836059570312, 126.0881576538086, 140.63795471191406, 155.18775939941406, 169.73756408691406, 184.287353515625, 198.837158203125, 213.386962890625, 227.936767578125, 242.486572265625, 257.036376953125, 271.586181640625, 286.135986328125, 300.6857604980469, 315.2355651855469, 329.7853698730469, 344.3351745605469, 358.8849792480469, 373.4347839355469, 387.98455810546875, 402.53436279296875, 417.08416748046875, 431.63397216796875, 446.18377685546875, 460.73358154296875, 475.28338623046875, 489.83319091796875, 504.38299560546875, 518.9328002929688, 533.4826049804688, 548.0323486328125, 562.5821533203125, 577.1319580078125, 591.6817626953125, 606.2315673828125, 620.7813720703125, 635.3311767578125, 649.8809814453125, 664.4307861328125, 678.9805908203125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 10.0, 5.0, 9.0, 13.0, 8.0, 15.0, 16.0, 14.0, 17.0, 26.0, 32.0, 29.0, 40.0, 37.0, 50.0, 41.0, 47.0, 47.0, 49.0, 53.0, 44.0, 42.0, 41.0, 37.0, 40.0, 29.0, 26.0, 20.0, 19.0, 20.0, 18.0, 20.0, 14.0, 6.0, 7.0, 10.0, 11.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-336.05377197265625, -327.0004577636719, -317.9471435546875, -308.893798828125, -299.8404846191406, -290.78717041015625, -281.73382568359375, -272.6805114746094, -263.627197265625, -254.57388305664062, -245.5205535888672, -236.46722412109375, -227.41390991210938, -218.360595703125, -209.30726623535156, -200.25393676757812, -191.20062255859375, -182.14730834960938, -173.09397888183594, -164.0406494140625, -154.98733520507812, -145.93402099609375, -136.8806915283203, -127.8273696899414, -118.7740478515625, -109.7207260131836, -100.66740417480469, -91.61408233642578, -82.56076049804688, -73.50743865966797, -64.45411682128906, -55.400794982910156, -46.34747314453125, -37.294151306152344, -28.240829467773438, -19.18750762939453, -10.134185791015625, -1.0808639526367188, 7.9724578857421875, 17.025779724121094, 26.0791015625, 35.132423400878906, 44.18574523925781, 53.23906707763672, 62.292388916015625, 71.34571075439453, 80.39903259277344, 89.45235443115234, 98.50567626953125, 107.55899810791016, 116.61231994628906, 125.66564178466797, 134.71896362304688, 143.77227783203125, 152.8256072998047, 161.87893676757812, 170.9322509765625, 179.98556518554688, 189.0388946533203, 198.09222412109375, 207.14553833007812, 216.1988525390625, 225.25218200683594, 234.30551147460938, 243.35882568359375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 6.0, 5.0, 12.0, 10.0, 10.0, 19.0, 28.0, 32.0, 34.0, 52.0, 40.0, 61.0, 86.0, 115.0, 141.0, 167.0, 187.0, 219.0, 280.0, 318.0, 387.0, 509.0, 697.0, 1040771.0, 1127.0, 611.0, 485.0, 389.0, 338.0, 246.0, 212.0, 165.0, 133.0, 123.0, 108.0, 79.0, 68.0, 59.0, 42.0, 49.0, 20.0, 21.0, 19.0, 10.0, 12.0, 11.0, 9.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 4.0], "bins": [-71.16878509521484, -69.06757354736328, -66.96636199951172, -64.86515045166016, -62.76394271850586, -60.6627311706543, -58.561519622802734, -56.46030807495117, -54.359100341796875, -52.25788879394531, -50.15667724609375, -48.05546569824219, -45.95425796508789, -43.85304641723633, -41.751834869384766, -39.6506233215332, -37.54941177368164, -35.44820022583008, -33.346988677978516, -31.245779037475586, -29.144569396972656, -27.043357849121094, -24.94214630126953, -22.84093475341797, -20.73972511291504, -18.638513565063477, -16.537303924560547, -14.436092376708984, -12.334881782531738, -10.233671188354492, -8.13245964050293, -6.031249046325684, -3.930034637451172, -1.8288238048553467, 0.2723870277404785, 2.373598098754883, 4.474808692932129, 6.576019287109375, 8.677230834960938, 10.778441429138184, 12.87965202331543, 14.980862617492676, 17.082073211669922, 19.183284759521484, 21.284496307373047, 23.385705947875977, 25.48691749572754, 27.58812713623047, 29.68933868408203, 31.790550231933594, 33.891761779785156, 35.99297332763672, 38.094181060791016, 40.19539260864258, 42.29660415649414, 44.3978157043457, 46.4990234375, 48.60023498535156, 50.701446533203125, 52.80265808105469, 54.903865814208984, 57.00507736206055, 59.10628890991211, 61.20750045776367, 63.308712005615234]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 9.0, 2.0, 3.0, 6.0, 5.0, 14.0, 24.0, 44.0, 106.0, 2091.0, 51460616.0, 116.0, 50.0, 22.0, 11.0, 17.0, 7.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 2.0, 4.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9416.0, -9009.373046875, -8602.74609375, -8196.119140625, -7789.4921875, -7382.865234375, -6976.23876953125, -6569.61181640625, -6162.98486328125, -5756.35791015625, -5349.73095703125, -4943.1044921875, -4536.4775390625, -4129.8505859375, -3723.2236328125, -3316.5966796875, -2909.9697265625, -2503.3427734375, -2096.7158203125, -1690.089111328125, -1283.462158203125, -876.835205078125, -470.20849609375, -63.58154296875, 343.04541015625, 749.6723022460938, 1156.2991943359375, 1562.926025390625, 1969.552978515625, 2376.179931640625, 2782.806640625, 3189.43359375, 3596.060546875, 4002.6875, 4409.314453125, 4815.94140625, 5222.568359375, 5629.1953125, 6035.82177734375, 6442.44873046875, 6849.07568359375, 7255.70263671875, 7662.32958984375, 8068.9560546875, 8475.5830078125, 8882.2099609375, 9288.8369140625, 9695.4638671875, 10102.0908203125, 10508.7177734375, 10915.3447265625, 11321.9716796875, 11728.5986328125, 12135.2255859375, 12541.8515625, 12948.478515625, 13355.10546875, 13761.732421875, 14168.359375, 14574.986328125, 14981.61328125, 15388.240234375, 15794.8671875, 16201.494140625, 16608.12109375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 14.0, 18.0, 39.0, 55.0, 66.0, 107.0, 170.0, 225.0, 357.0, 541.0, 792.0, 1218.0, 2009.0, 3039.0, 4664.0, 7516.0, 11551.0, 18736.0, 30368.0, 49329.0, 80966.0, 136573.0, 235494.0, 436492.0, 3765087.0, 737497.0, 317174.0, 178811.0, 105802.0, 63129.0, 38739.0, 23930.0, 14989.0, 9205.0, 6019.0, 3718.0, 2438.0, 1599.0, 932.0, 700.0, 462.0, 284.0, 185.0, 132.0, 105.0, 55.0, 37.0, 28.0, 12.0, 8.0, 11.0, 2.0, 2.0, 2.0, 2.0], "bins": [-8.6953125, -8.43768310546875, -8.1800537109375, -7.92242431640625, -7.664794921875, -7.40716552734375, -7.1495361328125, -6.89190673828125, -6.63427734375, -6.37664794921875, -6.1190185546875, -5.86138916015625, -5.603759765625, -5.34613037109375, -5.0885009765625, -4.83087158203125, -4.5732421875, -4.31561279296875, -4.0579833984375, -3.80035400390625, -3.542724609375, -3.28509521484375, -3.0274658203125, -2.76983642578125, -2.51220703125, -2.25457763671875, -1.9969482421875, -1.73931884765625, -1.481689453125, -1.22406005859375, -0.9664306640625, -0.70880126953125, -0.451171875, -0.19354248046875, 0.0640869140625, 0.32171630859375, 0.579345703125, 0.83697509765625, 1.0946044921875, 1.35223388671875, 1.60986328125, 1.86749267578125, 2.1251220703125, 2.38275146484375, 2.640380859375, 2.89801025390625, 3.1556396484375, 3.41326904296875, 3.6708984375, 3.92852783203125, 4.1861572265625, 4.44378662109375, 4.701416015625, 4.95904541015625, 5.2166748046875, 5.47430419921875, 5.73193359375, 5.98956298828125, 6.2471923828125, 6.50482177734375, 6.762451171875, 7.02008056640625, 7.2777099609375, 7.53533935546875, 7.79296875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 9.0, 9.0, 14.0, 8.0, 15.0, 19.0, 16.0, 22.0, 19.0, 30.0, 37.0, 30.0, 36.0, 34.0, 39.0, 34.0, 42.0, 48.0, 173.0, 782.0, 167.0, 48.0, 26.0, 30.0, 32.0, 37.0, 27.0, 25.0, 29.0, 29.0, 20.0, 25.0, 15.0, 18.0, 13.0, 10.0, 13.0, 10.0, 11.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.8125, -25.96240234375, -25.1123046875, -24.26220703125, -23.412109375, -22.56201171875, -21.7119140625, -20.86181640625, -20.01171875, -19.16162109375, -18.3115234375, -17.46142578125, -16.611328125, -15.76123046875, -14.9111328125, -14.06103515625, -13.2109375, -12.36083984375, -11.5107421875, -10.66064453125, -9.810546875, -8.96044921875, -8.1103515625, -7.26025390625, -6.41015625, -5.56005859375, -4.7099609375, -3.85986328125, -3.009765625, -2.15966796875, -1.3095703125, -0.45947265625, 0.390625, 1.24072265625, 2.0908203125, 2.94091796875, 3.791015625, 4.64111328125, 5.4912109375, 6.34130859375, 7.19140625, 8.04150390625, 8.8916015625, 9.74169921875, 10.591796875, 11.44189453125, 12.2919921875, 13.14208984375, 13.9921875, 14.84228515625, 15.6923828125, 16.54248046875, 17.392578125, 18.24267578125, 19.0927734375, 19.94287109375, 20.79296875, 21.64306640625, 22.4931640625, 23.34326171875, 24.193359375, 25.04345703125, 25.8935546875, 26.74365234375, 27.59375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 6.0, 4.0, 15.0, 16.0, 23.0, 35.0, 70.0, 82.0, 128.0, 199.0, 285.0, 402.0, 609.0, 989.0, 1502.0, 2251.0, 3626.0, 5521.0, 9114.0, 14801.0, 24229.0, 41236.0, 72733.0, 137289.0, 285355.0, 892716.0, 3962053.0, 420631.0, 186384.0, 96383.0, 53539.0, 30770.0, 17919.0, 11265.0, 6885.0, 4264.0, 2748.0, 1897.0, 1188.0, 766.0, 495.0, 342.0, 207.0, 140.0, 89.0, 81.0, 49.0, 48.0, 25.0, 14.0, 6.0, 3.0, 4.0, 5.0, 3.0, 0.0, 3.0], "bins": [-14.1328125, -13.7073974609375, -13.281982421875, -12.8565673828125, -12.43115234375, -12.0057373046875, -11.580322265625, -11.1549072265625, -10.7294921875, -10.3040771484375, -9.878662109375, -9.4532470703125, -9.02783203125, -8.6024169921875, -8.177001953125, -7.7515869140625, -7.326171875, -6.9007568359375, -6.475341796875, -6.0499267578125, -5.62451171875, -5.1990966796875, -4.773681640625, -4.3482666015625, -3.9228515625, -3.4974365234375, -3.072021484375, -2.6466064453125, -2.22119140625, -1.7957763671875, -1.370361328125, -0.9449462890625, -0.51953125, -0.0941162109375, 0.331298828125, 0.7567138671875, 1.18212890625, 1.6075439453125, 2.032958984375, 2.4583740234375, 2.8837890625, 3.3092041015625, 3.734619140625, 4.1600341796875, 4.58544921875, 5.0108642578125, 5.436279296875, 5.8616943359375, 6.287109375, 6.7125244140625, 7.137939453125, 7.5633544921875, 7.98876953125, 8.4141845703125, 8.839599609375, 9.2650146484375, 9.6904296875, 10.1158447265625, 10.541259765625, 10.9666748046875, 11.39208984375, 11.8175048828125, 12.242919921875, 12.6683349609375, 13.09375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 8.0, 5.0, 10.0, 13.0, 9.0, 12.0, 22.0, 14.0, 25.0, 32.0, 28.0, 36.0, 39.0, 44.0, 43.0, 85.0, 297.0, 697.0, 138.0, 71.0, 52.0, 49.0, 33.0, 29.0, 42.0, 35.0, 24.0, 24.0, 20.0, 17.0, 16.0, 13.0, 5.0, 8.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -24.028076171875, -23.30615234375, -22.584228515625, -21.8623046875, -21.140380859375, -20.41845703125, -19.696533203125, -18.974609375, -18.252685546875, -17.53076171875, -16.808837890625, -16.0869140625, -15.364990234375, -14.64306640625, -13.921142578125, -13.19921875, -12.477294921875, -11.75537109375, -11.033447265625, -10.3115234375, -9.589599609375, -8.86767578125, -8.145751953125, -7.423828125, -6.701904296875, -5.97998046875, -5.258056640625, -4.5361328125, -3.814208984375, -3.09228515625, -2.370361328125, -1.6484375, -0.926513671875, -0.20458984375, 0.517333984375, 1.2392578125, 1.961181640625, 2.68310546875, 3.405029296875, 4.126953125, 4.848876953125, 5.57080078125, 6.292724609375, 7.0146484375, 7.736572265625, 8.45849609375, 9.180419921875, 9.90234375, 10.624267578125, 11.34619140625, 12.068115234375, 12.7900390625, 13.511962890625, 14.23388671875, 14.955810546875, 15.677734375, 16.399658203125, 17.12158203125, 17.843505859375, 18.5654296875, 19.287353515625, 20.00927734375, 20.731201171875, 21.453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 10.0, 8.0, 2.0, 15.0, 19.0, 41.0, 25.0, 59.0, 71.0, 89.0, 172.0, 248.0, 359.0, 439.0, 793.0, 1410.0, 2301.0, 4399.0, 9550.0, 28217.0, 162152.0, 5983911.0, 64973.0, 17090.0, 6908.0, 3226.0, 1832.0, 1059.0, 640.0, 434.0, 319.0, 249.0, 142.0, 69.0, 35.0, 47.0, 37.0, 26.0, 25.0, 17.0, 6.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-60.125, -58.1396484375, -56.154296875, -54.1689453125, -52.18359375, -50.1982421875, -48.212890625, -46.2275390625, -44.2421875, -42.2568359375, -40.271484375, -38.2861328125, -36.30078125, -34.3154296875, -32.330078125, -30.3447265625, -28.359375, -26.3740234375, -24.388671875, -22.4033203125, -20.41796875, -18.4326171875, -16.447265625, -14.4619140625, -12.4765625, -10.4912109375, -8.505859375, -6.5205078125, -4.53515625, -2.5498046875, -0.564453125, 1.4208984375, 3.40625, 5.3916015625, 7.376953125, 9.3623046875, 11.34765625, 13.3330078125, 15.318359375, 17.3037109375, 19.2890625, 21.2744140625, 23.259765625, 25.2451171875, 27.23046875, 29.2158203125, 31.201171875, 33.1865234375, 35.171875, 37.1572265625, 39.142578125, 41.1279296875, 43.11328125, 45.0986328125, 47.083984375, 49.0693359375, 51.0546875, 53.0400390625, 55.025390625, 57.0107421875, 58.99609375, 60.9814453125, 62.966796875, 64.9521484375, 66.9375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 18.0, 23.0, 17.0, 21.0, 26.0, 34.0, 38.0, 47.0, 68.0, 68.0, 133.0, 357.0, 567.0, 153.0, 90.0, 68.0, 51.0, 36.0, 39.0, 42.0, 24.0, 26.0, 17.0, 13.0, 9.0, 6.0, 8.0, 3.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.59814453125, -19.8681640625, -19.13818359375, -18.408203125, -17.67822265625, -16.9482421875, -16.21826171875, -15.48828125, -14.75830078125, -14.0283203125, -13.29833984375, -12.568359375, -11.83837890625, -11.1083984375, -10.37841796875, -9.6484375, -8.91845703125, -8.1884765625, -7.45849609375, -6.728515625, -5.99853515625, -5.2685546875, -4.53857421875, -3.80859375, -3.07861328125, -2.3486328125, -1.61865234375, -0.888671875, -0.15869140625, 0.5712890625, 1.30126953125, 2.03125, 2.76123046875, 3.4912109375, 4.22119140625, 4.951171875, 5.68115234375, 6.4111328125, 7.14111328125, 7.87109375, 8.60107421875, 9.3310546875, 10.06103515625, 10.791015625, 11.52099609375, 12.2509765625, 12.98095703125, 13.7109375, 14.44091796875, 15.1708984375, 15.90087890625, 16.630859375, 17.36083984375, 18.0908203125, 18.82080078125, 19.55078125, 20.28076171875, 21.0107421875, 21.74072265625, 22.470703125, 23.20068359375, 23.9306640625, 24.66064453125, 25.390625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 17.0, 24.0, 50.0, 136.0, 490.0, 190.0, 56.0, 21.0, 11.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.84056854248047, -83.31663513183594, -79.79270935058594, -76.26878356933594, -72.7448501586914, -69.22091674804688, -65.69699096679688, -62.17306137084961, -58.649131774902344, -55.12520217895508, -51.60127258300781, -48.07734298706055, -44.55341339111328, -41.029483795166016, -37.50555419921875, -33.981624603271484, -30.45769500732422, -26.933765411376953, -23.409835815429688, -19.885906219482422, -16.361976623535156, -12.83804702758789, -9.314117431640625, -5.790187835693359, -2.2662582397460938, 1.2576713562011719, 4.7816009521484375, 8.305530548095703, 11.829460144042969, 15.353389739990234, 18.8773193359375, 22.401248931884766, 25.9251708984375, 29.449100494384766, 32.97303009033203, 36.4969596862793, 40.02088928222656, 43.54481887817383, 47.068748474121094, 50.59267807006836, 54.116607666015625, 57.64053726196289, 61.164466857910156, 64.68840026855469, 68.21232604980469, 71.73625183105469, 75.26018524169922, 78.78411865234375, 82.30804443359375, 85.83197021484375, 89.35590362548828, 92.87983703613281, 96.40376281738281, 99.92768859863281, 103.45162200927734, 106.97555541992188, 110.49948120117188, 114.02340698242188, 117.5473403930664, 121.07127380371094, 124.59519958496094, 128.11912536621094, 131.64306640625, 135.1669921875, 138.69091796875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 13.0, 25.0, 31.0, 45.0, 62.0, 65.0, 81.0, 91.0, 99.0, 94.0, 74.0, 75.0, 72.0, 51.0, 48.0, 30.0, 16.0, 13.0, 6.0, 5.0, 1.0, 2.0], "bins": [-86.64862060546875, -84.94123840332031, -83.2338638305664, -81.52648162841797, -79.81910705566406, -78.11172485351562, -76.40434265136719, -74.69696807861328, -72.98958587646484, -71.2822036743164, -69.5748291015625, -67.86744689941406, -66.16007232666016, -64.45269012451172, -62.74531173706055, -61.037933349609375, -59.3305549621582, -57.62317657470703, -55.91579818725586, -54.20841979980469, -52.50103759765625, -50.79365921020508, -49.086280822753906, -47.378902435302734, -45.67152404785156, -43.96414566040039, -42.25676727294922, -40.54938507080078, -38.84200668334961, -37.13462829589844, -35.427249908447266, -33.719871520996094, -32.012489318847656, -30.305110931396484, -28.59773063659668, -26.890352249145508, -25.182971954345703, -23.47559356689453, -21.76821517944336, -20.060836791992188, -18.35345458984375, -16.646076202392578, -14.938695907592773, -13.231317520141602, -11.523938179016113, -9.816558837890625, -8.109180450439453, -6.401801109313965, -4.694421768188477, -2.9870426654815674, -1.2796635627746582, 0.4277153015136719, 2.13509464263916, 3.8424739837646484, 5.54985237121582, 7.257231712341309, 8.964611053466797, 10.671990394592285, 12.379369735717773, 14.086748123168945, 15.794127464294434, 17.501506805419922, 19.208885192871094, 20.916263580322266, 22.62364387512207]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 2.0, 8.0, 8.0, 10.0, 8.0, 9.0, 12.0, 26.0, 26.0, 51.0, 67.0, 90.0, 133.0, 284.0, 451.0, 836.0, 1662.0, 3409.0, 7225.0, 17039.0, 48186.0, 236670.0, 3775263.0, 64561.0, 21015.0, 8858.0, 4071.0, 2075.0, 1045.0, 558.0, 286.0, 157.0, 83.0, 37.0, 20.0, 11.0, 8.0, 3.0, 2.0], "bins": [-0.2493896484375, -0.24410247802734375, -0.2388153076171875, -0.23352813720703125, -0.228240966796875, -0.22295379638671875, -0.2176666259765625, -0.21237945556640625, -0.20709228515625, -0.20180511474609375, -0.1965179443359375, -0.19123077392578125, -0.185943603515625, -0.18065643310546875, -0.1753692626953125, -0.17008209228515625, -0.164794921875, -0.15950775146484375, -0.1542205810546875, -0.14893341064453125, -0.143646240234375, -0.13835906982421875, -0.1330718994140625, -0.12778472900390625, -0.12249755859375, -0.11721038818359375, -0.1119232177734375, -0.10663604736328125, -0.101348876953125, -0.09606170654296875, -0.0907745361328125, -0.08548736572265625, -0.0802001953125, -0.07491302490234375, -0.0696258544921875, -0.06433868408203125, -0.059051513671875, -0.05376434326171875, -0.0484771728515625, -0.04319000244140625, -0.03790283203125, -0.03261566162109375, -0.0273284912109375, -0.02204132080078125, -0.016754150390625, -0.01146697998046875, -0.0061798095703125, -0.00089263916015625, 0.00439453125, 0.00968170166015625, 0.0149688720703125, 0.02025604248046875, 0.025543212890625, 0.03083038330078125, 0.0361175537109375, 0.04140472412109375, 0.04669189453125, 0.05197906494140625, 0.0572662353515625, 0.06255340576171875, 0.067840576171875, 0.07312774658203125, 0.0784149169921875, 0.08370208740234375, 0.0889892578125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 4.0, 5.0, 10.0, 6.0, 6.0, 14.0, 7.0, 11.0, 15.0, 22.0, 262.0, 541.0, 15.0, 14.0, 10.0, 7.0, 10.0, 7.0, 7.0, 6.0, 7.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.026611328125, -0.025960803031921387, -0.025310277938842773, -0.02465975284576416, -0.024009227752685547, -0.023358702659606934, -0.02270817756652832, -0.022057652473449707, -0.021407127380371094, -0.02075660228729248, -0.020106077194213867, -0.019455552101135254, -0.01880502700805664, -0.018154501914978027, -0.017503976821899414, -0.0168534517288208, -0.016202926635742188, -0.015552401542663574, -0.014901876449584961, -0.014251351356506348, -0.013600826263427734, -0.012950301170349121, -0.012299776077270508, -0.011649250984191895, -0.010998725891113281, -0.010348200798034668, -0.009697675704956055, -0.009047150611877441, -0.008396625518798828, -0.007746100425720215, -0.0070955753326416016, -0.006445050239562988, -0.005794525146484375, -0.005144000053405762, -0.0044934749603271484, -0.003842949867248535, -0.003192424774169922, -0.0025418996810913086, -0.0018913745880126953, -0.001240849494934082, -0.0005903244018554688, 6.020069122314453e-05, 0.0007107257843017578, 0.001361250877380371, 0.0020117759704589844, 0.0026623010635375977, 0.003312826156616211, 0.003963351249694824, 0.0046138763427734375, 0.005264401435852051, 0.005914926528930664, 0.006565451622009277, 0.007215976715087891, 0.007866501808166504, 0.008517026901245117, 0.00916755199432373, 0.009818077087402344, 0.010468602180480957, 0.01111912727355957, 0.011769652366638184, 0.012420177459716797, 0.01307070255279541, 0.013721227645874023, 0.014371752738952637, 0.01502227783203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 9.0, 9.0, 14.0, 18.0, 30.0, 52.0, 65.0, 101.0, 137.0, 237.0, 459.0, 916.0, 2090.0, 6167.0, 22902.0, 111523.0, 845616.0, 2820121.0, 313083.0, 52060.0, 12178.0, 3617.0, 1346.0, 655.0, 341.0, 179.0, 115.0, 77.0, 46.0, 40.0, 27.0, 16.0, 13.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1529541015625, -0.14806365966796875, -0.1431732177734375, -0.13828277587890625, -0.133392333984375, -0.12850189208984375, -0.1236114501953125, -0.11872100830078125, -0.11383056640625, -0.10894012451171875, -0.1040496826171875, -0.09915924072265625, -0.094268798828125, -0.08937835693359375, -0.0844879150390625, -0.07959747314453125, -0.07470703125, -0.06981658935546875, -0.0649261474609375, -0.06003570556640625, -0.055145263671875, -0.05025482177734375, -0.0453643798828125, -0.04047393798828125, -0.03558349609375, -0.03069305419921875, -0.0258026123046875, -0.02091217041015625, -0.016021728515625, -0.01113128662109375, -0.0062408447265625, -0.00135040283203125, 0.0035400390625, 0.00843048095703125, 0.0133209228515625, 0.01821136474609375, 0.023101806640625, 0.02799224853515625, 0.0328826904296875, 0.03777313232421875, 0.04266357421875, 0.04755401611328125, 0.0524444580078125, 0.05733489990234375, 0.062225341796875, 0.06711578369140625, 0.0720062255859375, 0.07689666748046875, 0.081787109375, 0.08667755126953125, 0.0915679931640625, 0.09645843505859375, 0.101348876953125, 0.10623931884765625, 0.1111297607421875, 0.11602020263671875, 0.12091064453125, 0.12580108642578125, 0.1306915283203125, 0.13558197021484375, 0.140472412109375, 0.14536285400390625, 0.1502532958984375, 0.15514373779296875, 0.1600341796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 3.0, 7.0, 1.0, 10.0, 6.0, 15.0, 15.0, 23.0, 25.0, 37.0, 33.0, 55.0, 60.0, 72.0, 84.0, 113.0, 109.0, 159.0, 179.0, 218.0, 287.0, 362.0, 499.0, 304.0, 289.0, 194.0, 167.0, 108.0, 104.0, 99.0, 81.0, 68.0, 56.0, 48.0, 36.0, 35.0, 14.0, 22.0, 21.0, 14.0, 11.0, 6.0, 3.0, 4.0, 2.0, 5.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0224151611328125, -0.02170085906982422, -0.020986557006835938, -0.020272254943847656, -0.019557952880859375, -0.018843650817871094, -0.018129348754882812, -0.01741504669189453, -0.01670074462890625, -0.01598644256591797, -0.015272140502929688, -0.014557838439941406, -0.013843536376953125, -0.013129234313964844, -0.012414932250976562, -0.011700630187988281, -0.010986328125, -0.010272026062011719, -0.009557723999023438, -0.008843421936035156, -0.008129119873046875, -0.007414817810058594, -0.0067005157470703125, -0.005986213684082031, -0.00527191162109375, -0.004557609558105469, -0.0038433074951171875, -0.0031290054321289062, -0.002414703369140625, -0.0017004013061523438, -0.0009860992431640625, -0.00027179718017578125, 0.0004425048828125, 0.0011568069458007812, 0.0018711090087890625, 0.0025854110717773438, 0.003299713134765625, 0.004014015197753906, 0.0047283172607421875, 0.005442619323730469, 0.00615692138671875, 0.006871223449707031, 0.0075855255126953125, 0.008299827575683594, 0.009014129638671875, 0.009728431701660156, 0.010442733764648438, 0.011157035827636719, 0.011871337890625, 0.012585639953613281, 0.013299942016601562, 0.014014244079589844, 0.014728546142578125, 0.015442848205566406, 0.016157150268554688, 0.01687145233154297, 0.01758575439453125, 0.01830005645751953, 0.019014358520507812, 0.019728660583496094, 0.020442962646484375, 0.021157264709472656, 0.021871566772460938, 0.02258586883544922, 0.0233001708984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 10.0, 25.0, 28.0, 44.0, 69.0, 115.0, 161.0, 185.0, 111.0, 105.0, 59.0, 44.0, 16.0, 12.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44241875410079956, -0.4314727485179901, -0.42052674293518066, -0.4095807373523712, -0.39863473176956177, -0.3876887559890747, -0.37674272060394287, -0.3657967448234558, -0.35485073924064636, -0.3439047336578369, -0.33295872807502747, -0.322012722492218, -0.31106671690940857, -0.3001207113265991, -0.28917473554611206, -0.2782287299633026, -0.26728272438049316, -0.2563367187976837, -0.24539071321487427, -0.23444470763206482, -0.22349871695041656, -0.21255271136760712, -0.20160670578479767, -0.19066071510314941, -0.17971467971801758, -0.16876867413520813, -0.15782266855239868, -0.14687666296958923, -0.13593067228794098, -0.12498466670513153, -0.11403866112232208, -0.10309266299009323, -0.09214666485786438, -0.08120065927505493, -0.07025466114282608, -0.05930865556001663, -0.04836265370249748, -0.03741665184497833, -0.026470646262168884, -0.015524648129940033, -0.004578642547130585, 0.00636736024171114, 0.017313363030552864, 0.028259366750717163, 0.03920536860823631, 0.05015137046575546, 0.06109737604856491, 0.07204337418079376, 0.08298937976360321, 0.09393538534641266, 0.10488138347864151, 0.11582738906145096, 0.1267733871936798, 0.13771939277648926, 0.1486653983592987, 0.15961140394210815, 0.1705574095249176, 0.18150341510772705, 0.1924494206905365, 0.20339542627334595, 0.2143414169549942, 0.22528742253780365, 0.2362334281206131, 0.24717941880226135, 0.2581254243850708]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 8.0, 9.0, 9.0, 11.0, 11.0, 13.0, 17.0, 31.0, 31.0, 37.0, 34.0, 38.0, 51.0, 43.0, 40.0, 65.0, 46.0, 46.0, 54.0, 46.0, 52.0, 31.0, 37.0, 35.0, 30.0, 28.0, 22.0, 28.0, 13.0, 15.0, 19.0, 14.0, 5.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12418943643569946, -0.11976609379053116, -0.11534275859594345, -0.11091941595077515, -0.10649608075618744, -0.10207273811101913, -0.09764939546585083, -0.09322606027126312, -0.08880271762609482, -0.08437937498092651, -0.0799560397863388, -0.0755326971411705, -0.0711093544960022, -0.06668601930141449, -0.062262676656246185, -0.05783933773636818, -0.05341599881649017, -0.04899265989661217, -0.04456932097673416, -0.04014597833156586, -0.03572263941168785, -0.031299300491809845, -0.02687595970928669, -0.022452618926763535, -0.01802928000688553, -0.013605940155684948, -0.009182600304484367, -0.004759260453283787, -0.0003359206020832062, 0.0040874183177948, 0.008510759100317955, 0.01293409988284111, 0.017357438802719116, 0.021780777722597122, 0.026204118505120277, 0.030627459287643433, 0.03505079820752144, 0.039474137127399445, 0.04389747977256775, 0.048320818692445755, 0.05274415761232376, 0.05716749653220177, 0.06159083545207977, 0.06601417809724808, 0.07043752074241638, 0.07486085593700409, 0.0792841985821724, 0.0837075412273407, 0.0881308764219284, 0.09255421906709671, 0.09697755426168442, 0.10140089690685272, 0.10582423210144043, 0.11024757474660873, 0.11467091739177704, 0.11909425258636475, 0.12351759523153305, 0.12794093787670135, 0.13236427307128906, 0.13678760826587677, 0.14121095836162567, 0.14563429355621338, 0.1500576287508011, 0.15448097884655, 0.1589043140411377]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 0.0, 7.0, 13.0, 9.0, 20.0, 28.0, 31.0, 48.0, 67.0, 95.0, 202.0, 365.0, 727.0, 1535.0, 3980.0, 11664.0, 61092.0, 914371.0, 39034.0, 9368.0, 3246.0, 1286.0, 586.0, 305.0, 162.0, 104.0, 59.0, 45.0, 29.0, 19.0, 12.0, 13.0, 8.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.257568359375, -0.2496185302734375, -0.241668701171875, -0.2337188720703125, -0.22576904296875, -0.2178192138671875, -0.209869384765625, -0.2019195556640625, -0.1939697265625, -0.1860198974609375, -0.178070068359375, -0.1701202392578125, -0.16217041015625, -0.1542205810546875, -0.146270751953125, -0.1383209228515625, -0.13037109375, -0.1224212646484375, -0.114471435546875, -0.1065216064453125, -0.09857177734375, -0.0906219482421875, -0.082672119140625, -0.0747222900390625, -0.0667724609375, -0.0588226318359375, -0.050872802734375, -0.0429229736328125, -0.03497314453125, -0.0270233154296875, -0.019073486328125, -0.0111236572265625, -0.003173828125, 0.0047760009765625, 0.012725830078125, 0.0206756591796875, 0.02862548828125, 0.0365753173828125, 0.044525146484375, 0.0524749755859375, 0.0604248046875, 0.0683746337890625, 0.076324462890625, 0.0842742919921875, 0.09222412109375, 0.1001739501953125, 0.108123779296875, 0.1160736083984375, 0.1240234375, 0.1319732666015625, 0.139923095703125, 0.1478729248046875, 0.15582275390625, 0.1637725830078125, 0.171722412109375, 0.1796722412109375, 0.1876220703125, 0.1955718994140625, 0.203521728515625, 0.2114715576171875, 0.21942138671875, 0.2273712158203125, 0.235321044921875, 0.2432708740234375, 0.251220703125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 6.0, 5.0, 7.0, 11.0, 11.0, 16.0, 19.0, 58.0, 160.0, 320.0, 200.0, 83.0, 34.0, 8.0, 13.0, 6.0, 13.0, 3.0, 7.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0243072509765625, -0.023676156997680664, -0.023045063018798828, -0.022413969039916992, -0.021782875061035156, -0.02115178108215332, -0.020520687103271484, -0.01988959312438965, -0.019258499145507812, -0.018627405166625977, -0.01799631118774414, -0.017365217208862305, -0.01673412322998047, -0.016103029251098633, -0.015471935272216797, -0.014840841293334961, -0.014209747314453125, -0.013578653335571289, -0.012947559356689453, -0.012316465377807617, -0.011685371398925781, -0.011054277420043945, -0.01042318344116211, -0.009792089462280273, -0.009160995483398438, -0.008529901504516602, -0.007898807525634766, -0.00726771354675293, -0.006636619567871094, -0.006005525588989258, -0.005374431610107422, -0.004743337631225586, -0.00411224365234375, -0.003481149673461914, -0.002850055694580078, -0.002218961715698242, -0.0015878677368164062, -0.0009567737579345703, -0.0003256797790527344, 0.00030541419982910156, 0.0009365081787109375, 0.0015676021575927734, 0.0021986961364746094, 0.0028297901153564453, 0.0034608840942382812, 0.004091978073120117, 0.004723072052001953, 0.005354166030883789, 0.005985260009765625, 0.006616353988647461, 0.007247447967529297, 0.007878541946411133, 0.008509635925292969, 0.009140729904174805, 0.00977182388305664, 0.010402917861938477, 0.011034011840820312, 0.011665105819702148, 0.012296199798583984, 0.01292729377746582, 0.013558387756347656, 0.014189481735229492, 0.014820575714111328, 0.015451669692993164, 0.016082763671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 9.0, 6.0, 13.0, 14.0, 27.0, 34.0, 55.0, 70.0, 102.0, 138.0, 233.0, 479.0, 793.0, 1443.0, 3257.0, 10335.0, 79332.0, 837200.0, 96593.0, 11329.0, 3538.0, 1527.0, 794.0, 434.0, 242.0, 189.0, 119.0, 83.0, 49.0, 35.0, 23.0, 14.0, 11.0, 9.0, 4.0, 7.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23779296875, -0.229156494140625, -0.22052001953125, -0.211883544921875, -0.2032470703125, -0.194610595703125, -0.18597412109375, -0.177337646484375, -0.168701171875, -0.160064697265625, -0.15142822265625, -0.142791748046875, -0.1341552734375, -0.125518798828125, -0.11688232421875, -0.108245849609375, -0.099609375, -0.090972900390625, -0.08233642578125, -0.073699951171875, -0.0650634765625, -0.056427001953125, -0.04779052734375, -0.039154052734375, -0.030517578125, -0.021881103515625, -0.01324462890625, -0.004608154296875, 0.0040283203125, 0.012664794921875, 0.02130126953125, 0.029937744140625, 0.03857421875, 0.047210693359375, 0.05584716796875, 0.064483642578125, 0.0731201171875, 0.081756591796875, 0.09039306640625, 0.099029541015625, 0.107666015625, 0.116302490234375, 0.12493896484375, 0.133575439453125, 0.1422119140625, 0.150848388671875, 0.15948486328125, 0.168121337890625, 0.1767578125, 0.185394287109375, 0.19403076171875, 0.202667236328125, 0.2113037109375, 0.219940185546875, 0.22857666015625, 0.237213134765625, 0.245849609375, 0.254486083984375, 0.26312255859375, 0.271759033203125, 0.2803955078125, 0.289031982421875, 0.29766845703125, 0.306304931640625, 0.31494140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 7.0, 7.0, 9.0, 5.0, 14.0, 14.0, 14.0, 22.0, 16.0, 17.0, 26.0, 34.0, 23.0, 31.0, 26.0, 32.0, 30.0, 41.0, 34.0, 42.0, 29.0, 44.0, 48.0, 45.0, 45.0, 22.0, 35.0, 31.0, 40.0, 29.0, 22.0, 18.0, 26.0, 18.0, 14.0, 18.0, 14.0, 12.0, 11.0, 6.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0640869140625, -0.062012672424316406, -0.05993843078613281, -0.05786418914794922, -0.055789947509765625, -0.05371570587158203, -0.05164146423339844, -0.049567222595214844, -0.04749298095703125, -0.045418739318847656, -0.04334449768066406, -0.04127025604248047, -0.039196014404296875, -0.03712177276611328, -0.03504753112792969, -0.032973289489746094, -0.0308990478515625, -0.028824806213378906, -0.026750564575195312, -0.02467632293701172, -0.022602081298828125, -0.02052783966064453, -0.018453598022460938, -0.016379356384277344, -0.01430511474609375, -0.012230873107910156, -0.010156631469726562, -0.008082389831542969, -0.006008148193359375, -0.003933906555175781, -0.0018596649169921875, 0.00021457672119140625, 0.002288818359375, 0.004363059997558594, 0.0064373016357421875, 0.008511543273925781, 0.010585784912109375, 0.012660026550292969, 0.014734268188476562, 0.016808509826660156, 0.01888275146484375, 0.020956993103027344, 0.023031234741210938, 0.02510547637939453, 0.027179718017578125, 0.02925395965576172, 0.03132820129394531, 0.033402442932128906, 0.0354766845703125, 0.037550926208496094, 0.03962516784667969, 0.04169940948486328, 0.043773651123046875, 0.04584789276123047, 0.04792213439941406, 0.049996376037597656, 0.05207061767578125, 0.054144859313964844, 0.05621910095214844, 0.05829334259033203, 0.060367584228515625, 0.06244182586669922, 0.06451606750488281, 0.0665903091430664, 0.06866455078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 11.0, 13.0, 30.0, 46.0, 68.0, 130.0, 291.0, 567.0, 1780.0, 8300.0, 198659.0, 819255.0, 15406.0, 2537.0, 769.0, 305.0, 145.0, 78.0, 63.0, 32.0, 19.0, 11.0, 7.0, 11.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3955078125, -0.3861236572265625, -0.376739501953125, -0.3673553466796875, -0.35797119140625, -0.3485870361328125, -0.339202880859375, -0.3298187255859375, -0.3204345703125, -0.3110504150390625, -0.301666259765625, -0.2922821044921875, -0.28289794921875, -0.2735137939453125, -0.264129638671875, -0.2547454833984375, -0.245361328125, -0.2359771728515625, -0.226593017578125, -0.2172088623046875, -0.20782470703125, -0.1984405517578125, -0.189056396484375, -0.1796722412109375, -0.1702880859375, -0.1609039306640625, -0.151519775390625, -0.1421356201171875, -0.13275146484375, -0.1233673095703125, -0.113983154296875, -0.1045989990234375, -0.09521484375, -0.0858306884765625, -0.076446533203125, -0.0670623779296875, -0.05767822265625, -0.0482940673828125, -0.038909912109375, -0.0295257568359375, -0.0201416015625, -0.0107574462890625, -0.001373291015625, 0.0080108642578125, 0.01739501953125, 0.0267791748046875, 0.036163330078125, 0.0455474853515625, 0.054931640625, 0.0643157958984375, 0.073699951171875, 0.0830841064453125, 0.09246826171875, 0.1018524169921875, 0.111236572265625, 0.1206207275390625, 0.1300048828125, 0.1393890380859375, 0.148773193359375, 0.1581573486328125, 0.16754150390625, 0.1769256591796875, 0.186309814453125, 0.1956939697265625, 0.205078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 1.0, 8.0, 20.0, 11.0, 16.0, 16.0, 30.0, 40.0, 56.0, 78.0, 80.0, 120.0, 75.0, 103.0, 68.0, 74.0, 55.0, 41.0, 30.0, 24.0, 10.0, 14.0, 10.0, 9.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4662742614746094e-05, -1.4225021004676819e-05, -1.3787299394607544e-05, -1.3349577784538269e-05, -1.2911856174468994e-05, -1.247413456439972e-05, -1.2036412954330444e-05, -1.159869134426117e-05, -1.1160969734191895e-05, -1.072324812412262e-05, -1.0285526514053345e-05, -9.84780490398407e-06, -9.410083293914795e-06, -8.97236168384552e-06, -8.534640073776245e-06, -8.09691846370697e-06, -7.659196853637695e-06, -7.22147524356842e-06, -6.7837536334991455e-06, -6.346032023429871e-06, -5.908310413360596e-06, -5.470588803291321e-06, -5.032867193222046e-06, -4.595145583152771e-06, -4.157423973083496e-06, -3.719702363014221e-06, -3.2819807529449463e-06, -2.8442591428756714e-06, -2.4065375328063965e-06, -1.9688159227371216e-06, -1.5310943126678467e-06, -1.0933727025985718e-06, -6.556510925292969e-07, -2.1792948246002197e-07, 2.1979212760925293e-07, 6.575137376785278e-07, 1.0952353477478027e-06, 1.5329569578170776e-06, 1.9706785678863525e-06, 2.4084001779556274e-06, 2.8461217880249023e-06, 3.2838433980941772e-06, 3.721565008163452e-06, 4.159286618232727e-06, 4.597008228302002e-06, 5.034729838371277e-06, 5.472451448440552e-06, 5.910173058509827e-06, 6.3478946685791016e-06, 6.7856162786483765e-06, 7.223337888717651e-06, 7.661059498786926e-06, 8.098781108856201e-06, 8.536502718925476e-06, 8.974224328994751e-06, 9.411945939064026e-06, 9.8496675491333e-06, 1.0287389159202576e-05, 1.072511076927185e-05, 1.1162832379341125e-05, 1.16005539894104e-05, 1.2038275599479675e-05, 1.247599720954895e-05, 1.2913718819618225e-05, 1.33514404296875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 8.0, 23.0, 22.0, 59.0, 77.0, 156.0, 234.0, 427.0, 830.0, 1797.0, 5329.0, 32105.0, 819716.0, 169549.0, 12343.0, 3216.0, 1277.0, 554.0, 330.0, 164.0, 99.0, 61.0, 42.0, 47.0, 20.0, 19.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.23455047607421875, -0.2254486083984375, -0.21634674072265625, -0.207244873046875, -0.19814300537109375, -0.1890411376953125, -0.17993927001953125, -0.17083740234375, -0.16173553466796875, -0.1526336669921875, -0.14353179931640625, -0.134429931640625, -0.12532806396484375, -0.1162261962890625, -0.10712432861328125, -0.0980224609375, -0.08892059326171875, -0.0798187255859375, -0.07071685791015625, -0.061614990234375, -0.05251312255859375, -0.0434112548828125, -0.03430938720703125, -0.02520751953125, -0.01610565185546875, -0.0070037841796875, 0.00209808349609375, 0.011199951171875, 0.02030181884765625, 0.0294036865234375, 0.03850555419921875, 0.047607421875, 0.05670928955078125, 0.0658111572265625, 0.07491302490234375, 0.084014892578125, 0.09311676025390625, 0.1022186279296875, 0.11132049560546875, 0.12042236328125, 0.12952423095703125, 0.1386260986328125, 0.14772796630859375, 0.156829833984375, 0.16593170166015625, 0.1750335693359375, 0.18413543701171875, 0.1932373046875, 0.20233917236328125, 0.2114410400390625, 0.22054290771484375, 0.229644775390625, 0.23874664306640625, 0.2478485107421875, 0.25695037841796875, 0.26605224609375, 0.27515411376953125, 0.2842559814453125, 0.29335784912109375, 0.302459716796875, 0.31156158447265625, 0.3206634521484375, 0.32976531982421875, 0.3388671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 11.0, 8.0, 9.0, 18.0, 24.0, 27.0, 50.0, 73.0, 96.0, 124.0, 162.0, 111.0, 67.0, 45.0, 37.0, 20.0, 24.0, 21.0, 17.0, 10.0, 5.0, 8.0, 9.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1119384765625, -0.1082305908203125, -0.104522705078125, -0.1008148193359375, -0.09710693359375, -0.0933990478515625, -0.089691162109375, -0.0859832763671875, -0.082275390625, -0.0785675048828125, -0.074859619140625, -0.0711517333984375, -0.06744384765625, -0.0637359619140625, -0.060028076171875, -0.0563201904296875, -0.0526123046875, -0.0489044189453125, -0.045196533203125, -0.0414886474609375, -0.03778076171875, -0.0340728759765625, -0.030364990234375, -0.0266571044921875, -0.02294921875, -0.0192413330078125, -0.015533447265625, -0.0118255615234375, -0.00811767578125, -0.0044097900390625, -0.000701904296875, 0.0030059814453125, 0.0067138671875, 0.0104217529296875, 0.014129638671875, 0.0178375244140625, 0.02154541015625, 0.0252532958984375, 0.028961181640625, 0.0326690673828125, 0.036376953125, 0.0400848388671875, 0.043792724609375, 0.0475006103515625, 0.05120849609375, 0.0549163818359375, 0.058624267578125, 0.0623321533203125, 0.0660400390625, 0.0697479248046875, 0.073455810546875, 0.0771636962890625, 0.08087158203125, 0.0845794677734375, 0.088287353515625, 0.0919952392578125, 0.095703125, 0.0994110107421875, 0.103118896484375, 0.1068267822265625, 0.11053466796875, 0.1142425537109375, 0.117950439453125, 0.1216583251953125, 0.1253662109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 18.0, 38.0, 175.0, 478.0, 172.0, 48.0, 19.0, 16.0, 13.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4274253845214844, -3.3486196994781494, -3.2698142528533936, -3.1910085678100586, -3.1122031211853027, -3.0333974361419678, -2.954591751098633, -2.875786304473877, -2.796980619430542, -2.718174934387207, -2.639369487762451, -2.560563802719116, -2.4817583560943604, -2.4029526710510254, -2.3241472244262695, -2.2453415393829346, -2.1665358543395996, -2.0877301692962646, -2.008924722671509, -1.9301190376281738, -1.8513134717941284, -1.772507905960083, -1.6937023401260376, -1.6148967742919922, -1.5360913276672363, -1.457285761833191, -1.3784801959991455, -1.2996745109558105, -1.2208689451217651, -1.1420633792877197, -1.0632578134536743, -0.9844521880149841, -0.9056466817855835, -0.8268411159515381, -0.7480354905128479, -0.6692299246788025, -0.5904242992401123, -0.5116187334060669, -0.4328131675720215, -0.3540075421333313, -0.2752019762992859, -0.1963963806629181, -0.11759079992771149, -0.03878521919250488, 0.040020376443862915, 0.11882597208023071, 0.19763153791427612, 0.2764371633529663, 0.3552427291870117, 0.4340483248233795, 0.5128539204597473, 0.5916594862937927, 0.6704651117324829, 0.7492706775665283, 0.8280762434005737, 0.9068818688392639, 0.9856874346733093, 1.0644930601119995, 1.143298625946045, 1.2221041917800903, 1.3009097576141357, 1.3797154426574707, 1.4585208892822266, 1.5373265743255615, 1.616132140159607]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 10.0, 15.0, 12.0, 31.0, 59.0, 78.0, 133.0, 137.0, 127.0, 103.0, 67.0, 59.0, 35.0, 23.0, 18.0, 12.0, 8.0, 4.0, 4.0, 4.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4160118103027344, -1.3756730556488037, -1.335334300994873, -1.2949955463409424, -1.2546567916870117, -1.214318037033081, -1.1739792823791504, -1.1336405277252197, -1.093301773071289, -1.0529630184173584, -1.0126242637634277, -0.9722855091094971, -0.9319467544555664, -0.8916079998016357, -0.8512692451477051, -0.8109304904937744, -0.7705917358398438, -0.7302529811859131, -0.6899142265319824, -0.6495754718780518, -0.6092367172241211, -0.5688979625701904, -0.5285592079162598, -0.4882204532623291, -0.44788169860839844, -0.4075429439544678, -0.3672041893005371, -0.32686543464660645, -0.2865266799926758, -0.24618792533874512, -0.20584917068481445, -0.1655104160308838, -0.12517166137695312, -0.08483290672302246, -0.0444941520690918, -0.004155397415161133, 0.03618335723876953, 0.0765221118927002, 0.11686086654663086, 0.15719962120056152, 0.1975383758544922, 0.23787713050842285, 0.2782158851623535, 0.3185546398162842, 0.35889339447021484, 0.3992321491241455, 0.43957090377807617, 0.47990965843200684, 0.5202484130859375, 0.5605871677398682, 0.6009259223937988, 0.6412646770477295, 0.6816034317016602, 0.7219421863555908, 0.7622809410095215, 0.8026196956634521, 0.8429584503173828, 0.8832972049713135, 0.9236359596252441, 0.9639747142791748, 1.0043134689331055, 1.0446522235870361, 1.0849909782409668, 1.1253297328948975, 1.1656684875488281]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 13.0, 19.0, 21.0, 74.0, 224.0, 933.0, 4184023.0, 8764.0, 102.0, 44.0, 27.0, 11.0, 12.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-28.546875, -27.9732666015625, -27.399658203125, -26.8260498046875, -26.25244140625, -25.6788330078125, -25.105224609375, -24.5316162109375, -23.9580078125, -23.3843994140625, -22.810791015625, -22.2371826171875, -21.66357421875, -21.0899658203125, -20.516357421875, -19.9427490234375, -19.369140625, -18.7955322265625, -18.221923828125, -17.6483154296875, -17.07470703125, -16.5010986328125, -15.927490234375, -15.3538818359375, -14.7802734375, -14.2066650390625, -13.633056640625, -13.0594482421875, -12.48583984375, -11.9122314453125, -11.338623046875, -10.7650146484375, -10.19140625, -9.6177978515625, -9.044189453125, -8.4705810546875, -7.89697265625, -7.3233642578125, -6.749755859375, -6.1761474609375, -5.6025390625, -5.0289306640625, -4.455322265625, -3.8817138671875, -3.30810546875, -2.7344970703125, -2.160888671875, -1.5872802734375, -1.013671875, -0.4400634765625, 0.133544921875, 0.7071533203125, 1.28076171875, 1.8543701171875, 2.427978515625, 3.0015869140625, 3.5751953125, 4.1488037109375, 4.722412109375, 5.2960205078125, 5.86962890625, 6.4432373046875, 7.016845703125, 7.5904541015625, 8.1640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 7.0, 7.0, 12.0, 8.0, 22.0, 16.0, 20.0, 35.0, 93.0, 186.0, 234.0, 148.0, 87.0, 44.0, 24.0, 22.0, 7.0, 10.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02313232421875, -0.022584915161132812, -0.022037506103515625, -0.021490097045898438, -0.02094268798828125, -0.020395278930664062, -0.019847869873046875, -0.019300460815429688, -0.0187530517578125, -0.018205642700195312, -0.017658233642578125, -0.017110824584960938, -0.01656341552734375, -0.016016006469726562, -0.015468597412109375, -0.014921188354492188, -0.014373779296875, -0.013826370239257812, -0.013278961181640625, -0.012731552124023438, -0.01218414306640625, -0.011636734008789062, -0.011089324951171875, -0.010541915893554688, -0.0099945068359375, -0.009447097778320312, -0.008899688720703125, -0.008352279663085938, -0.00780487060546875, -0.0072574615478515625, -0.006710052490234375, -0.0061626434326171875, -0.005615234375, -0.0050678253173828125, -0.004520416259765625, -0.0039730072021484375, -0.00342559814453125, -0.0028781890869140625, -0.002330780029296875, -0.0017833709716796875, -0.0012359619140625, -0.0006885528564453125, -0.000141143798828125, 0.0004062652587890625, 0.00095367431640625, 0.0015010833740234375, 0.002048492431640625, 0.0025959014892578125, 0.003143310546875, 0.0036907196044921875, 0.004238128662109375, 0.0047855377197265625, 0.00533294677734375, 0.0058803558349609375, 0.006427764892578125, 0.0069751739501953125, 0.0075225830078125, 0.008069992065429688, 0.008617401123046875, 0.009164810180664062, 0.00971221923828125, 0.010259628295898438, 0.010807037353515625, 0.011354446411132812, 0.01190185546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 11.0, 26.0, 66.0, 143.0, 383.0, 3570998.0, 621271.0, 512.0, 311.0, 198.0, 133.0, 97.0, 57.0, 40.0, 24.0, 7.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.2819976806640625, -1.139190673828125, -0.9963836669921875, -0.85357666015625, -0.7107696533203125, -0.567962646484375, -0.4251556396484375, -0.2823486328125, -0.1395416259765625, 0.003265380859375, 0.1460723876953125, 0.28887939453125, 0.4316864013671875, 0.574493408203125, 0.7173004150390625, 0.860107421875, 1.0029144287109375, 1.145721435546875, 1.2885284423828125, 1.43133544921875, 1.5741424560546875, 1.716949462890625, 1.8597564697265625, 2.0025634765625, 2.1453704833984375, 2.288177490234375, 2.4309844970703125, 2.57379150390625, 2.7165985107421875, 2.859405517578125, 3.0022125244140625, 3.14501953125, 3.2878265380859375, 3.430633544921875, 3.5734405517578125, 3.71624755859375, 3.8590545654296875, 4.001861572265625, 4.1446685791015625, 4.2874755859375, 4.4302825927734375, 4.573089599609375, 4.7158966064453125, 4.85870361328125, 5.0015106201171875, 5.144317626953125, 5.2871246337890625, 5.429931640625, 5.5727386474609375, 5.715545654296875, 5.8583526611328125, 6.00115966796875, 6.1439666748046875, 6.286773681640625, 6.4295806884765625, 6.5723876953125, 6.7151947021484375, 6.858001708984375, 7.0008087158203125, 7.14361572265625, 7.2864227294921875, 7.429229736328125, 7.5720367431640625, 7.71484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 13.0, 20.0, 45.0, 71.0, 160.0, 260.0, 581.0, 1242.0, 545.0, 407.0, 267.0, 173.0, 125.0, 70.0, 48.0, 21.0, 17.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026275634765625, -0.024927616119384766, -0.02357959747314453, -0.022231578826904297, -0.020883560180664062, -0.019535541534423828, -0.018187522888183594, -0.01683950424194336, -0.015491485595703125, -0.01414346694946289, -0.012795448303222656, -0.011447429656982422, -0.010099411010742188, -0.008751392364501953, -0.007403373718261719, -0.006055355072021484, -0.00470733642578125, -0.0033593177795410156, -0.0020112991333007812, -0.0006632804870605469, 0.0006847381591796875, 0.002032756805419922, 0.0033807754516601562, 0.004728794097900391, 0.006076812744140625, 0.007424831390380859, 0.008772850036621094, 0.010120868682861328, 0.011468887329101562, 0.012816905975341797, 0.014164924621582031, 0.015512943267822266, 0.0168609619140625, 0.018208980560302734, 0.01955699920654297, 0.020905017852783203, 0.022253036499023438, 0.023601055145263672, 0.024949073791503906, 0.02629709243774414, 0.027645111083984375, 0.02899312973022461, 0.030341148376464844, 0.03168916702270508, 0.03303718566894531, 0.03438520431518555, 0.03573322296142578, 0.037081241607666016, 0.03842926025390625, 0.039777278900146484, 0.04112529754638672, 0.04247331619262695, 0.04382133483886719, 0.04516935348510742, 0.046517372131347656, 0.04786539077758789, 0.049213409423828125, 0.05056142807006836, 0.051909446716308594, 0.05325746536254883, 0.05460548400878906, 0.0559535026550293, 0.05730152130126953, 0.058649539947509766, 0.05999755859375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [18.0, 982.0, 18.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.676487922668457, -0.08301091194152832, 0.5104660987854004, 1.103943109512329, 1.6974201202392578, 2.2908971309661865, 2.8843741416931152, 3.477850914001465, 4.071328163146973, 4.6648054122924805, 5.25828218460083, 5.85175895690918, 6.4452362060546875, 7.038713455200195, 7.632190227508545, 8.225666999816895, 8.819144248962402, 9.41262149810791, 10.006097793579102, 10.59957504272461, 11.193052291870117, 11.786529541015625, 12.380006790161133, 12.973483085632324, 13.566960334777832, 14.16043758392334, 14.753913879394531, 15.347391128540039, 15.940868377685547, 16.534345626831055, 17.127822875976562, 17.721298217773438, 18.314777374267578, 18.908254623413086, 19.501731872558594, 20.0952091217041, 20.68868637084961, 21.282161712646484, 21.875638961791992, 22.4691162109375, 23.062593460083008, 23.656070709228516, 24.249547958374023, 24.84302520751953, 25.436500549316406, 26.029977798461914, 26.623455047607422, 27.21693229675293, 27.810409545898438, 28.403886795043945, 28.997364044189453, 29.59084129333496, 30.18431854248047, 30.777793884277344, 31.37127113342285, 31.96474838256836, 32.5582275390625, 33.151702880859375, 33.745182037353516, 34.33865737915039, 34.93213653564453, 35.525611877441406, 36.11909103393555, 36.71256637573242, 37.3060417175293]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 8.0, 19.0, 24.0, 65.0, 74.0, 146.0, 189.0, 169.0, 140.0, 91.0, 38.0, 26.0, 12.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5328328013420105, -0.4855237305164337, -0.43821465969085693, -0.39090561866760254, -0.34359651803970337, -0.296287477016449, -0.2489784061908722, -0.2016693353652954, -0.15436026453971863, -0.10705119371414185, -0.05974213033914566, -0.012433066964149475, 0.03487600386142731, 0.08218507468700409, 0.12949413061141968, 0.17680320143699646, 0.22411227226257324, 0.27142134308815, 0.3187304139137268, 0.3660394549369812, 0.41334855556488037, 0.46065759658813477, 0.5079666376113892, 0.5552757382392883, 0.6025848388671875, 0.6498938798904419, 0.6972029805183411, 0.7445120215415955, 0.7918211221694946, 0.839130163192749, 0.8864392042160034, 0.9337483048439026, 0.9810572862625122, 1.0283663272857666, 1.075675368309021, 1.122984528541565, 1.1702935695648193, 1.2176026105880737, 1.2649116516113281, 1.312220811843872, 1.3595298528671265, 1.4068388938903809, 1.4541479349136353, 1.5014570951461792, 1.5487661361694336, 1.596075177192688, 1.6433842182159424, 1.6906933784484863, 1.7380023002624512, 1.7853113412857056, 1.83262038230896, 1.879929542541504, 1.9272385835647583, 1.9745476245880127, 2.0218567848205566, 2.0691657066345215, 2.1164748668670654, 2.1637840270996094, 2.211092948913574, 2.258402109146118, 2.305711030960083, 2.353020191192627, 2.400329351425171, 2.4476382732391357, 2.4949474334716797]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 2.0, 1.0, 7.0, 2.0, 5.0, 3.0, 11.0, 23.0, 43.0, 44.0, 52.0, 115.0, 165.0, 306.0, 498.0, 842.0, 1413.0, 2563.0, 4591.0, 8547.0, 17937.0, 52617.0, 317689.0, 514145.0, 80543.0, 23123.0, 10474.0, 5686.0, 3007.0, 1606.0, 959.0, 613.0, 338.0, 215.0, 138.0, 75.0, 51.0, 30.0, 15.0, 15.0, 12.0, 11.0, 4.0, 5.0, 7.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1463623046875, -0.14166259765625, -0.136962890625, -0.13226318359375, -0.1275634765625, -0.12286376953125, -0.1181640625, -0.11346435546875, -0.1087646484375, -0.10406494140625, -0.099365234375, -0.09466552734375, -0.0899658203125, -0.08526611328125, -0.08056640625, -0.07586669921875, -0.0711669921875, -0.06646728515625, -0.061767578125, -0.05706787109375, -0.0523681640625, -0.04766845703125, -0.04296875, -0.03826904296875, -0.0335693359375, -0.02886962890625, -0.024169921875, -0.01947021484375, -0.0147705078125, -0.01007080078125, -0.00537109375, -0.00067138671875, 0.0040283203125, 0.00872802734375, 0.013427734375, 0.01812744140625, 0.0228271484375, 0.02752685546875, 0.0322265625, 0.03692626953125, 0.0416259765625, 0.04632568359375, 0.051025390625, 0.05572509765625, 0.0604248046875, 0.06512451171875, 0.06982421875, 0.07452392578125, 0.0792236328125, 0.08392333984375, 0.088623046875, 0.09332275390625, 0.0980224609375, 0.10272216796875, 0.107421875, 0.11212158203125, 0.1168212890625, 0.12152099609375, 0.126220703125, 0.13092041015625, 0.1356201171875, 0.14031982421875, 0.14501953125, 0.14971923828125, 0.1544189453125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 12.0, 6.0, 5.0, 7.0, 12.0, 11.0, 26.0, 21.0, 27.0, 45.0, 71.0, 103.0, 100.0, 126.0, 107.0, 76.0, 66.0, 37.0, 34.0, 17.0, 20.0, 10.0, 7.0, 7.0, 12.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008148193359375, -0.007812857627868652, -0.007477521896362305, -0.007142186164855957, -0.006806850433349609, -0.006471514701843262, -0.006136178970336914, -0.005800843238830566, -0.005465507507324219, -0.005130171775817871, -0.0047948360443115234, -0.004459500312805176, -0.004124164581298828, -0.0037888288497924805, -0.003453493118286133, -0.003118157386779785, -0.0027828216552734375, -0.00244748592376709, -0.002112150192260742, -0.0017768144607543945, -0.0014414787292480469, -0.0011061429977416992, -0.0007708072662353516, -0.0004354715347290039, -0.00010013580322265625, 0.0002351999282836914, 0.0005705356597900391, 0.0009058713912963867, 0.0012412071228027344, 0.001576542854309082, 0.0019118785858154297, 0.0022472143173217773, 0.002582550048828125, 0.0029178857803344727, 0.0032532215118408203, 0.003588557243347168, 0.003923892974853516, 0.004259228706359863, 0.004594564437866211, 0.004929900169372559, 0.005265235900878906, 0.005600571632385254, 0.0059359073638916016, 0.006271243095397949, 0.006606578826904297, 0.0069419145584106445, 0.007277250289916992, 0.00761258602142334, 0.007947921752929688, 0.008283257484436035, 0.008618593215942383, 0.00895392894744873, 0.009289264678955078, 0.009624600410461426, 0.009959936141967773, 0.010295271873474121, 0.010630607604980469, 0.010965943336486816, 0.011301279067993164, 0.011636614799499512, 0.01197195053100586, 0.012307286262512207, 0.012642621994018555, 0.012977957725524902, 0.01331329345703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 1.0, 10.0, 9.0, 6.0, 5.0, 18.0, 16.0, 28.0, 26.0, 26.0, 29.0, 38.0, 42.0, 55.0, 83.0, 303.0, 3673.0, 353625.0, 684262.0, 5509.0, 394.0, 97.0, 49.0, 45.0, 35.0, 28.0, 29.0, 25.0, 12.0, 20.0, 10.0, 8.0, 12.0, 4.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482666015625, -0.4676170349121094, -0.45256805419921875, -0.4375190734863281, -0.4224700927734375, -0.4074211120605469, -0.39237213134765625, -0.3773231506347656, -0.362274169921875, -0.3472251892089844, -0.33217620849609375, -0.3171272277832031, -0.3020782470703125, -0.2870292663574219, -0.27198028564453125, -0.2569313049316406, -0.24188232421875, -0.22683334350585938, -0.21178436279296875, -0.19673538208007812, -0.1816864013671875, -0.16663742065429688, -0.15158843994140625, -0.13653945922851562, -0.121490478515625, -0.10644149780273438, -0.09139251708984375, -0.07634353637695312, -0.0612945556640625, -0.046245574951171875, -0.03119659423828125, -0.016147613525390625, -0.0010986328125, 0.013950347900390625, 0.02899932861328125, 0.044048309326171875, 0.0590972900390625, 0.07414627075195312, 0.08919525146484375, 0.10424423217773438, 0.119293212890625, 0.13434219360351562, 0.14939117431640625, 0.16444015502929688, 0.1794891357421875, 0.19453811645507812, 0.20958709716796875, 0.22463607788085938, 0.23968505859375, 0.2547340393066406, 0.26978302001953125, 0.2848320007324219, 0.2998809814453125, 0.3149299621582031, 0.32997894287109375, 0.3450279235839844, 0.360076904296875, 0.3751258850097656, 0.39017486572265625, 0.4052238464355469, 0.4202728271484375, 0.4353218078613281, 0.45037078857421875, 0.4654197692871094, 0.48046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 6.0, 3.0, 7.0, 10.0, 12.0, 8.0, 14.0, 12.0, 16.0, 14.0, 17.0, 20.0, 34.0, 34.0, 29.0, 30.0, 38.0, 29.0, 40.0, 30.0, 39.0, 44.0, 43.0, 37.0, 42.0, 36.0, 45.0, 33.0, 41.0, 32.0, 30.0, 34.0, 23.0, 26.0, 11.0, 16.0, 15.0, 12.0, 12.0, 3.0, 4.0, 5.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.043853759765625, -0.04261302947998047, -0.04137229919433594, -0.040131568908691406, -0.038890838623046875, -0.037650108337402344, -0.03640937805175781, -0.03516864776611328, -0.03392791748046875, -0.03268718719482422, -0.03144645690917969, -0.030205726623535156, -0.028964996337890625, -0.027724266052246094, -0.026483535766601562, -0.02524280548095703, -0.0240020751953125, -0.02276134490966797, -0.021520614624023438, -0.020279884338378906, -0.019039154052734375, -0.017798423767089844, -0.016557693481445312, -0.015316963195800781, -0.01407623291015625, -0.012835502624511719, -0.011594772338867188, -0.010354042053222656, -0.009113311767578125, -0.007872581481933594, -0.0066318511962890625, -0.005391120910644531, -0.004150390625, -0.0029096603393554688, -0.0016689300537109375, -0.00042819976806640625, 0.000812530517578125, 0.0020532608032226562, 0.0032939910888671875, 0.004534721374511719, 0.00577545166015625, 0.007016181945800781, 0.008256912231445312, 0.009497642517089844, 0.010738372802734375, 0.011979103088378906, 0.013219833374023438, 0.014460563659667969, 0.0157012939453125, 0.01694202423095703, 0.018182754516601562, 0.019423484802246094, 0.020664215087890625, 0.021904945373535156, 0.023145675659179688, 0.02438640594482422, 0.02562713623046875, 0.02686786651611328, 0.028108596801757812, 0.029349327087402344, 0.030590057373046875, 0.031830787658691406, 0.03307151794433594, 0.03431224822998047, 0.035552978515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 4.0, 7.0, 8.0, 23.0, 70.0, 269.0, 3488.0, 1041157.0, 3147.0, 238.0, 60.0, 29.0, 14.0, 2.0, 4.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.48095703125, -1.4228515625, -1.36474609375, -1.306640625, -1.24853515625, -1.1904296875, -1.13232421875, -1.07421875, -1.01611328125, -0.9580078125, -0.89990234375, -0.841796875, -0.78369140625, -0.7255859375, -0.66748046875, -0.609375, -0.55126953125, -0.4931640625, -0.43505859375, -0.376953125, -0.31884765625, -0.2607421875, -0.20263671875, -0.14453125, -0.08642578125, -0.0283203125, 0.02978515625, 0.087890625, 0.14599609375, 0.2041015625, 0.26220703125, 0.3203125, 0.37841796875, 0.4365234375, 0.49462890625, 0.552734375, 0.61083984375, 0.6689453125, 0.72705078125, 0.78515625, 0.84326171875, 0.9013671875, 0.95947265625, 1.017578125, 1.07568359375, 1.1337890625, 1.19189453125, 1.25, 1.30810546875, 1.3662109375, 1.42431640625, 1.482421875, 1.54052734375, 1.5986328125, 1.65673828125, 1.71484375, 1.77294921875, 1.8310546875, 1.88916015625, 1.947265625, 2.00537109375, 2.0634765625, 2.12158203125, 2.1796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 16.0, 29.0, 39.0, 153.0, 341.0, 231.0, 81.0, 23.0, 25.0, 10.0, 6.0, 8.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011467933654785156, -0.00011094287037849426, -0.00010720640420913696, -0.00010346993803977966, -9.973347187042236e-05, -9.599700570106506e-05, -9.226053953170776e-05, -8.852407336235046e-05, -8.478760719299316e-05, -8.105114102363586e-05, -7.731467485427856e-05, -7.357820868492126e-05, -6.984174251556396e-05, -6.610527634620667e-05, -6.236881017684937e-05, -5.8632344007492065e-05, -5.4895877838134766e-05, -5.1159411668777466e-05, -4.7422945499420166e-05, -4.3686479330062866e-05, -3.9950013160705566e-05, -3.6213546991348267e-05, -3.247708082199097e-05, -2.8740614652633667e-05, -2.5004148483276367e-05, -2.1267682313919067e-05, -1.7531216144561768e-05, -1.3794749975204468e-05, -1.0058283805847168e-05, -6.321817636489868e-06, -2.5853514671325684e-06, 1.1511147022247314e-06, 4.887580871582031e-06, 8.624047040939331e-06, 1.2360513210296631e-05, 1.609697937965393e-05, 1.983344554901123e-05, 2.356991171836853e-05, 2.730637788772583e-05, 3.104284405708313e-05, 3.477931022644043e-05, 3.851577639579773e-05, 4.225224256515503e-05, 4.598870873451233e-05, 4.972517490386963e-05, 5.346164107322693e-05, 5.719810724258423e-05, 6.093457341194153e-05, 6.467103958129883e-05, 6.840750575065613e-05, 7.214397192001343e-05, 7.588043808937073e-05, 7.961690425872803e-05, 8.335337042808533e-05, 8.708983659744263e-05, 9.082630276679993e-05, 9.456276893615723e-05, 9.829923510551453e-05, 0.00010203570127487183, 0.00010577216744422913, 0.00010950863361358643, 0.00011324509978294373, 0.00011698156595230103, 0.00012071803212165833, 0.00012445449829101562]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 8.0, 27.0, 55.0, 137.0, 371.0, 1263.0, 9100.0, 871133.0, 160478.0, 4669.0, 821.0, 295.0, 105.0, 42.0, 20.0, 4.0, 4.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7923202514648438, -0.7657928466796875, -0.7392654418945312, -0.712738037109375, -0.6862106323242188, -0.6596832275390625, -0.6331558227539062, -0.60662841796875, -0.5801010131835938, -0.5535736083984375, -0.5270462036132812, -0.500518798828125, -0.47399139404296875, -0.4474639892578125, -0.42093658447265625, -0.3944091796875, -0.36788177490234375, -0.3413543701171875, -0.31482696533203125, -0.288299560546875, -0.26177215576171875, -0.2352447509765625, -0.20871734619140625, -0.18218994140625, -0.15566253662109375, -0.1291351318359375, -0.10260772705078125, -0.076080322265625, -0.04955291748046875, -0.0230255126953125, 0.00350189208984375, 0.030029296875, 0.05655670166015625, 0.0830841064453125, 0.10961151123046875, 0.136138916015625, 0.16266632080078125, 0.1891937255859375, 0.21572113037109375, 0.24224853515625, 0.26877593994140625, 0.2953033447265625, 0.32183074951171875, 0.348358154296875, 0.37488555908203125, 0.4014129638671875, 0.42794036865234375, 0.4544677734375, 0.48099517822265625, 0.5075225830078125, 0.5340499877929688, 0.560577392578125, 0.5871047973632812, 0.6136322021484375, 0.6401596069335938, 0.66668701171875, 0.6932144165039062, 0.7197418212890625, 0.7462692260742188, 0.772796630859375, 0.7993240356445312, 0.8258514404296875, 0.8523788452148438, 0.87890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 9.0, 7.0, 12.0, 14.0, 44.0, 54.0, 147.0, 219.0, 217.0, 121.0, 55.0, 28.0, 21.0, 14.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1956787109375, -0.1903705596923828, -0.18506240844726562, -0.17975425720214844, -0.17444610595703125, -0.16913795471191406, -0.16382980346679688, -0.1585216522216797, -0.1532135009765625, -0.1479053497314453, -0.14259719848632812, -0.13728904724121094, -0.13198089599609375, -0.12667274475097656, -0.12136459350585938, -0.11605644226074219, -0.110748291015625, -0.10544013977050781, -0.10013198852539062, -0.09482383728027344, -0.08951568603515625, -0.08420753479003906, -0.07889938354492188, -0.07359123229980469, -0.0682830810546875, -0.06297492980957031, -0.057666778564453125, -0.05235862731933594, -0.04705047607421875, -0.04174232482910156, -0.036434173583984375, -0.031126022338867188, -0.02581787109375, -0.020509719848632812, -0.015201568603515625, -0.009893417358398438, -0.00458526611328125, 0.0007228851318359375, 0.006031036376953125, 0.011339187622070312, 0.0166473388671875, 0.021955490112304688, 0.027263641357421875, 0.03257179260253906, 0.03787994384765625, 0.04318809509277344, 0.048496246337890625, 0.05380439758300781, 0.059112548828125, 0.06442070007324219, 0.06972885131835938, 0.07503700256347656, 0.08034515380859375, 0.08565330505371094, 0.09096145629882812, 0.09626960754394531, 0.1015777587890625, 0.10688591003417969, 0.11219406127929688, 0.11750221252441406, 0.12281036376953125, 0.12811851501464844, 0.13342666625976562, 0.1387348175048828, 0.14404296875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 11.0, 23.0, 61.0, 131.0, 214.0, 249.0, 150.0, 77.0, 35.0, 23.0, 8.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1968357563018799, -1.1637367010116577, -1.130637764930725, -1.097538709640503, -1.0644397735595703, -1.0313407182693481, -0.9982417821884155, -0.9651427268981934, -0.9320437908172607, -0.8989447951316833, -0.865845799446106, -0.8327468037605286, -0.7996478080749512, -0.7665488123893738, -0.7334498167037964, -0.7003507614135742, -0.6672517657279968, -0.6341527700424194, -0.601053774356842, -0.5679547786712646, -0.5348557829856873, -0.5017567873001099, -0.4686577618122101, -0.4355587661266327, -0.4024597704410553, -0.3693607747554779, -0.3362617790699005, -0.30316275358200073, -0.27006375789642334, -0.23696477711200714, -0.20386576652526855, -0.17076677083969116, -0.13766777515411377, -0.10456877946853638, -0.07146977633237839, -0.0383707731962204, -0.005271777510643005, 0.027827218174934387, 0.060926228761672974, 0.09402522444725037, 0.12712422013282776, 0.16022321581840515, 0.19332221150398254, 0.22642122209072113, 0.2595202326774597, 0.2926192283630371, 0.3257182240486145, 0.3588172197341919, 0.3919162154197693, 0.4250152111053467, 0.4581142067909241, 0.49121320247650146, 0.5243121981620789, 0.5574111938476562, 0.5905102491378784, 0.623609185218811, 0.6567082405090332, 0.6898072361946106, 0.722906231880188, 0.7560052275657654, 0.7891042232513428, 0.8222032189369202, 0.8553022146224976, 0.8884012699127197, 0.9215002059936523]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 2.0, 11.0, 10.0, 16.0, 8.0, 30.0, 37.0, 60.0, 59.0, 79.0, 69.0, 102.0, 90.0, 88.0, 66.0, 64.0, 62.0, 34.0, 22.0, 18.0, 15.0, 10.0, 6.0, 10.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5755372047424316, -0.5581703186035156, -0.5408034324645996, -0.5234366059303284, -0.5060697197914124, -0.48870283365249634, -0.4713359475135803, -0.4539690613746643, -0.4366022050380707, -0.41923531889915466, -0.40186846256256104, -0.384501576423645, -0.367134690284729, -0.3497678339481354, -0.33240094780921936, -0.31503409147262573, -0.2976672053337097, -0.2803003191947937, -0.2629334628582001, -0.24556657671928406, -0.22819970548152924, -0.21083283424377441, -0.1934659481048584, -0.17609907686710358, -0.15873220562934875, -0.14136533439159393, -0.12399845570325851, -0.1066315770149231, -0.08926470577716827, -0.07189783453941345, -0.05453095585107803, -0.037164077162742615, -0.019797146320343018, -0.0024302713572978973, 0.014936603605747223, 0.03230347856879234, 0.04967035353183746, 0.06703722476959229, 0.0844041034579277, 0.10177098214626312, 0.11913785338401794, 0.13650472462177277, 0.1538715958595276, 0.1712384819984436, 0.18860535323619843, 0.20597222447395325, 0.22333911061286926, 0.24070598185062408, 0.2580728530883789, 0.2754397392272949, 0.29280659556388855, 0.31017348170280457, 0.3275403380393982, 0.3449072241783142, 0.3622741103172302, 0.37964099645614624, 0.39700785279273987, 0.4143747389316559, 0.4317415952682495, 0.4491084814071655, 0.46647536754608154, 0.48384222388267517, 0.5012090802192688, 0.5185759663581848, 0.5359428524971008]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 10.0, 6.0, 2.0, 6.0, 2.0, 8.0, 8.0, 8.0, 8.0, 6.0, 20.0, 10.0, 18.0, 10.0, 22.0, 16.0, 24.0, 82.0, 276.0, 4188237.0, 4958.0, 297.0, 76.0, 34.0, 22.0, 18.0, 20.0, 10.0, 6.0, 12.0, 2.0, 12.0, 6.0, 12.0, 2.0, 4.0, 0.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-5.953125, -5.77166748046875, -5.5902099609375, -5.40875244140625, -5.227294921875, -5.04583740234375, -4.8643798828125, -4.68292236328125, -4.50146484375, -4.32000732421875, -4.1385498046875, -3.95709228515625, -3.775634765625, -3.59417724609375, -3.4127197265625, -3.23126220703125, -3.0498046875, -2.86834716796875, -2.6868896484375, -2.50543212890625, -2.323974609375, -2.14251708984375, -1.9610595703125, -1.77960205078125, -1.59814453125, -1.41668701171875, -1.2352294921875, -1.05377197265625, -0.872314453125, -0.69085693359375, -0.5093994140625, -0.32794189453125, -0.146484375, 0.03497314453125, 0.2164306640625, 0.39788818359375, 0.579345703125, 0.76080322265625, 0.9422607421875, 1.12371826171875, 1.30517578125, 1.48663330078125, 1.6680908203125, 1.84954833984375, 2.031005859375, 2.21246337890625, 2.3939208984375, 2.57537841796875, 2.7568359375, 2.93829345703125, 3.1197509765625, 3.30120849609375, 3.482666015625, 3.66412353515625, 3.8455810546875, 4.02703857421875, 4.20849609375, 4.38995361328125, 4.5714111328125, 4.75286865234375, 4.934326171875, 5.11578369140625, 5.2972412109375, 5.47869873046875, 5.66015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 13.0, 13.0, 16.0, 20.0, 43.0, 88.0, 127.0, 178.0, 153.0, 114.0, 112.0, 48.0, 21.0, 16.0, 12.0, 12.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01171875, -0.011137008666992188, -0.010555267333984375, -0.009973526000976562, -0.00939178466796875, -0.008810043334960938, -0.008228302001953125, -0.0076465606689453125, -0.0070648193359375, -0.0064830780029296875, -0.005901336669921875, -0.0053195953369140625, -0.00473785400390625, -0.0041561126708984375, -0.003574371337890625, -0.0029926300048828125, -0.002410888671875, -0.0018291473388671875, -0.001247406005859375, -0.0006656646728515625, -8.392333984375e-05, 0.0004978179931640625, 0.001079559326171875, 0.0016613006591796875, 0.0022430419921875, 0.0028247833251953125, 0.003406524658203125, 0.0039882659912109375, 0.00457000732421875, 0.0051517486572265625, 0.005733489990234375, 0.0063152313232421875, 0.00689697265625, 0.0074787139892578125, 0.008060455322265625, 0.008642196655273438, 0.00922393798828125, 0.009805679321289062, 0.010387420654296875, 0.010969161987304688, 0.0115509033203125, 0.012132644653320312, 0.012714385986328125, 0.013296127319335938, 0.01387786865234375, 0.014459609985351562, 0.015041351318359375, 0.015623092651367188, 0.016204833984375, 0.016786575317382812, 0.017368316650390625, 0.017950057983398438, 0.01853179931640625, 0.019113540649414062, 0.019695281982421875, 0.020277023315429688, 0.0208587646484375, 0.021440505981445312, 0.022022247314453125, 0.022603988647460938, 0.02318572998046875, 0.023767471313476562, 0.024349212646484375, 0.024930953979492188, 0.0255126953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 26.0, 333.0, 4193482.0, 435.0, 17.0, 3.0], "bins": [-22.09375, -21.7288818359375, -21.364013671875, -20.9991455078125, -20.63427734375, -20.2694091796875, -19.904541015625, -19.5396728515625, -19.1748046875, -18.8099365234375, -18.445068359375, -18.0802001953125, -17.71533203125, -17.3504638671875, -16.985595703125, -16.6207275390625, -16.255859375, -15.8909912109375, -15.526123046875, -15.1612548828125, -14.79638671875, -14.4315185546875, -14.066650390625, -13.7017822265625, -13.3369140625, -12.9720458984375, -12.607177734375, -12.2423095703125, -11.87744140625, -11.5125732421875, -11.147705078125, -10.7828369140625, -10.41796875, -10.0531005859375, -9.688232421875, -9.3233642578125, -8.95849609375, -8.5936279296875, -8.228759765625, -7.8638916015625, -7.4990234375, -7.1341552734375, -6.769287109375, -6.4044189453125, -6.03955078125, -5.6746826171875, -5.309814453125, -4.9449462890625, -4.580078125, -4.2152099609375, -3.850341796875, -3.4854736328125, -3.12060546875, -2.7557373046875, -2.390869140625, -2.0260009765625, -1.6611328125, -1.2962646484375, -0.931396484375, -0.5665283203125, -0.20166015625, 0.1632080078125, 0.528076171875, 0.8929443359375, 1.2578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 9.0, 16.0, 64.0, 228.0, 1068.0, 2296.0, 282.0, 71.0, 28.0, 10.0, 5.0, 4.0, 3.0, 2.0], "bins": [-0.1671142578125, -0.16408300399780273, -0.16105175018310547, -0.1580204963684082, -0.15498924255371094, -0.15195798873901367, -0.1489267349243164, -0.14589548110961914, -0.14286422729492188, -0.1398329734802246, -0.13680171966552734, -0.13377046585083008, -0.1307392120361328, -0.12770795822143555, -0.12467670440673828, -0.12164545059204102, -0.11861419677734375, -0.11558294296264648, -0.11255168914794922, -0.10952043533325195, -0.10648918151855469, -0.10345792770385742, -0.10042667388916016, -0.09739542007446289, -0.09436416625976562, -0.09133291244506836, -0.0883016586303711, -0.08527040481567383, -0.08223915100097656, -0.0792078971862793, -0.07617664337158203, -0.07314538955688477, -0.0701141357421875, -0.06708288192749023, -0.06405162811279297, -0.0610203742980957, -0.05798912048339844, -0.05495786666870117, -0.051926612854003906, -0.04889535903930664, -0.045864105224609375, -0.04283285140991211, -0.039801597595214844, -0.03677034378051758, -0.03373908996582031, -0.030707836151123047, -0.02767658233642578, -0.024645328521728516, -0.02161407470703125, -0.018582820892333984, -0.015551567077636719, -0.012520313262939453, -0.009489059448242188, -0.006457805633544922, -0.0034265518188476562, -0.0003952980041503906, 0.002635955810546875, 0.005667209625244141, 0.008698463439941406, 0.011729717254638672, 0.014760971069335938, 0.017792224884033203, 0.02082347869873047, 0.023854732513427734, 0.026885986328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 943.0, 78.0], "bins": [-53.487030029296875, -52.636539459228516, -51.786048889160156, -50.9355583190918, -50.08506774902344, -49.23457717895508, -48.38408660888672, -47.53359603881836, -46.68310546875, -45.83261489868164, -44.98212432861328, -44.13163375854492, -43.28114318847656, -42.4306526184082, -41.580162048339844, -40.729671478271484, -39.879180908203125, -39.028690338134766, -38.178199768066406, -37.32770919799805, -36.47721862792969, -35.62672805786133, -34.77623748779297, -33.92574691772461, -33.075260162353516, -32.224769592285156, -31.374279022216797, -30.523788452148438, -29.673297882080078, -28.82280731201172, -27.97231674194336, -27.121826171875, -26.27133560180664, -25.42084503173828, -24.570354461669922, -23.719863891601562, -22.869373321533203, -22.018882751464844, -21.168392181396484, -20.317901611328125, -19.4674129486084, -18.61692237854004, -17.76643180847168, -16.91594123840332, -16.06545066833496, -15.214960098266602, -14.364470481872559, -13.5139799118042, -12.66348934173584, -11.81299877166748, -10.962508201599121, -10.112018585205078, -9.261528015136719, -8.41103744506836, -7.560546875, -6.710056304931641, -5.859565734863281, -5.009075164794922, -4.1585845947265625, -3.3080945014953613, -2.457603931427002, -1.6071133613586426, -0.7566232681274414, 0.09386730194091797, 0.9443579912185669]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 25.0, 77.0, 174.0, 277.0, 226.0, 124.0, 60.0, 25.0, 10.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.495227336883545, -3.42746901512146, -3.359710693359375, -3.291952133178711, -3.224193811416626, -3.156435489654541, -3.088677167892456, -3.020918846130371, -2.953160285949707, -2.885401964187622, -2.817643642425537, -2.749885082244873, -2.682126760482788, -2.614368438720703, -2.546610116958618, -2.478851795196533, -2.4110934734344482, -2.3433351516723633, -2.2755768299102783, -2.2078182697296143, -2.1400599479675293, -2.0723016262054443, -2.0045433044433594, -1.9367849826812744, -1.8690265417099, -1.801268219947815, -1.7335097789764404, -1.6657514572143555, -1.5979931354522705, -1.530234694480896, -1.462476372718811, -1.3947179317474365, -1.3269596099853516, -1.2592012882232666, -1.191442847251892, -1.1236845254898071, -1.0559260845184326, -0.9881677627563477, -0.9204094409942627, -0.852651059627533, -0.7848926782608032, -0.7171342968940735, -0.6493759155273438, -0.5816175937652588, -0.513859212398529, -0.4461008310317993, -0.37834247946739197, -0.3105841279029846, -0.24282574653625488, -0.17506738007068634, -0.1073090136051178, -0.039550647139549255, 0.028207719326019287, 0.09596610069274902, 0.16372445225715637, 0.23148280382156372, 0.29924118518829346, 0.3669995665550232, 0.43475791811943054, 0.5025162696838379, 0.5702746510505676, 0.6380330324172974, 0.7057913541793823, 0.7735497355461121, 0.8413081169128418]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 3.0, 4.0, 3.0, 12.0, 14.0, 16.0, 12.0, 23.0, 17.0, 25.0, 33.0, 23.0, 25.0, 38.0, 30.0, 41.0, 41.0, 43.0, 55.0, 1049.0, 1045394.0, 1218.0, 50.0, 39.0, 40.0, 40.0, 33.0, 34.0, 25.0, 34.0, 22.0, 17.0, 14.0, 12.0, 16.0, 9.0, 11.0, 4.0, 10.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.01702880859375, -3.8895263671875, -3.76202392578125, -3.634521484375, -3.50701904296875, -3.3795166015625, -3.25201416015625, -3.12451171875, -2.99700927734375, -2.8695068359375, -2.74200439453125, -2.614501953125, -2.48699951171875, -2.3594970703125, -2.23199462890625, -2.1044921875, -1.97698974609375, -1.8494873046875, -1.72198486328125, -1.594482421875, -1.46697998046875, -1.3394775390625, -1.21197509765625, -1.08447265625, -0.95697021484375, -0.8294677734375, -0.70196533203125, -0.574462890625, -0.44696044921875, -0.3194580078125, -0.19195556640625, -0.064453125, 0.06304931640625, 0.1905517578125, 0.31805419921875, 0.445556640625, 0.57305908203125, 0.7005615234375, 0.82806396484375, 0.95556640625, 1.08306884765625, 1.2105712890625, 1.33807373046875, 1.465576171875, 1.59307861328125, 1.7205810546875, 1.84808349609375, 1.9755859375, 2.10308837890625, 2.2305908203125, 2.35809326171875, 2.485595703125, 2.61309814453125, 2.7406005859375, 2.86810302734375, 2.99560546875, 3.12310791015625, 3.2506103515625, 3.37811279296875, 3.505615234375, 3.63311767578125, 3.7606201171875, 3.88812255859375, 4.015625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 114.0, 576.0, 289.0, 26.0, 1.0, 1.0, 1.0], "bins": [-0.77685546875, -0.763606071472168, -0.7503566741943359, -0.7371072769165039, -0.7238578796386719, -0.7106084823608398, -0.6973590850830078, -0.6841096878051758, -0.6708602905273438, -0.6576108932495117, -0.6443614959716797, -0.6311120986938477, -0.6178627014160156, -0.6046133041381836, -0.5913639068603516, -0.5781145095825195, -0.5648651123046875, -0.5516157150268555, -0.5383663177490234, -0.5251169204711914, -0.5118675231933594, -0.49861812591552734, -0.4853687286376953, -0.4721193313598633, -0.45886993408203125, -0.4456205368041992, -0.4323711395263672, -0.41912174224853516, -0.4058723449707031, -0.3926229476928711, -0.37937355041503906, -0.36612415313720703, -0.352874755859375, -0.33962535858154297, -0.32637596130371094, -0.3131265640258789, -0.2998771667480469, -0.28662776947021484, -0.2733783721923828, -0.2601289749145508, -0.24687957763671875, -0.23363018035888672, -0.2203807830810547, -0.20713138580322266, -0.19388198852539062, -0.1806325912475586, -0.16738319396972656, -0.15413379669189453, -0.1408843994140625, -0.12763500213623047, -0.11438560485839844, -0.1011362075805664, -0.08788681030273438, -0.07463741302490234, -0.06138801574707031, -0.04813861846923828, -0.03488922119140625, -0.02163982391357422, -0.008390426635742188, 0.004858970642089844, 0.018108367919921875, 0.031357765197753906, 0.04460716247558594, 0.05785655975341797, 0.07110595703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 1.0, 7.0, 12.0, 5.0, 8.0, 12.0, 23.0, 27.0, 36.0, 64.0, 103.0, 215.0, 480.0, 1236.0, 3944.0, 18119.0, 136785.0, 783718.0, 85659.0, 13193.0, 3076.0, 965.0, 390.0, 164.0, 106.0, 53.0, 48.0, 26.0, 17.0, 15.0, 10.0, 7.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.2389678955078125, -1.193756103515625, -1.1485443115234375, -1.10333251953125, -1.0581207275390625, -1.012908935546875, -0.9676971435546875, -0.9224853515625, -0.8772735595703125, -0.832061767578125, -0.7868499755859375, -0.74163818359375, -0.6964263916015625, -0.651214599609375, -0.6060028076171875, -0.560791015625, -0.5155792236328125, -0.470367431640625, -0.4251556396484375, -0.37994384765625, -0.3347320556640625, -0.289520263671875, -0.2443084716796875, -0.1990966796875, -0.1538848876953125, -0.108673095703125, -0.0634613037109375, -0.01824951171875, 0.0269622802734375, 0.072174072265625, 0.1173858642578125, 0.16259765625, 0.2078094482421875, 0.253021240234375, 0.2982330322265625, 0.34344482421875, 0.3886566162109375, 0.433868408203125, 0.4790802001953125, 0.5242919921875, 0.5695037841796875, 0.614715576171875, 0.6599273681640625, 0.70513916015625, 0.7503509521484375, 0.795562744140625, 0.8407745361328125, 0.885986328125, 0.9311981201171875, 0.976409912109375, 1.0216217041015625, 1.06683349609375, 1.1120452880859375, 1.157257080078125, 1.2024688720703125, 1.2476806640625, 1.2928924560546875, 1.338104248046875, 1.3833160400390625, 1.42852783203125, 1.4737396240234375, 1.518951416015625, 1.5641632080078125, 1.609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 8.0, 18.0, 12.0, 10.0, 24.0, 25.0, 36.0, 51.0, 46.0, 68.0, 65.0, 66.0, 79.0, 69.0, 66.0, 65.0, 55.0, 49.0, 46.0, 29.0, 27.0, 12.0, 20.0, 12.0, 7.0, 9.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5859375, -0.5654525756835938, -0.5449676513671875, -0.5244827270507812, -0.503997802734375, -0.48351287841796875, -0.4630279541015625, -0.44254302978515625, -0.42205810546875, -0.40157318115234375, -0.3810882568359375, -0.36060333251953125, -0.340118408203125, -0.31963348388671875, -0.2991485595703125, -0.27866363525390625, -0.2581787109375, -0.23769378662109375, -0.2172088623046875, -0.19672393798828125, -0.176239013671875, -0.15575408935546875, -0.1352691650390625, -0.11478424072265625, -0.09429931640625, -0.07381439208984375, -0.0533294677734375, -0.03284454345703125, -0.012359619140625, 0.00812530517578125, 0.0286102294921875, 0.04909515380859375, 0.069580078125, 0.09006500244140625, 0.1105499267578125, 0.13103485107421875, 0.151519775390625, 0.17200469970703125, 0.1924896240234375, 0.21297454833984375, 0.23345947265625, 0.25394439697265625, 0.2744293212890625, 0.29491424560546875, 0.315399169921875, 0.33588409423828125, 0.3563690185546875, 0.37685394287109375, 0.3973388671875, 0.41782379150390625, 0.4383087158203125, 0.45879364013671875, 0.479278564453125, 0.49976348876953125, 0.5202484130859375, 0.5407333374023438, 0.56121826171875, 0.5817031860351562, 0.6021881103515625, 0.6226730346679688, 0.643157958984375, 0.6636428833007812, 0.6841278076171875, 0.7046127319335938, 0.72509765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 9.0, 2.0, 6.0, 5.0, 14.0, 10.0, 7.0, 15.0, 25.0, 30.0, 53.0, 71.0, 151.0, 388.0, 1095.0, 4833.0, 45314.0, 900062.0, 87285.0, 6769.0, 1506.0, 466.0, 169.0, 81.0, 46.0, 37.0, 21.0, 16.0, 13.0, 13.0, 7.0, 6.0, 5.0, 6.0, 4.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.6719970703125, -1.613525390625, -1.5550537109375, -1.49658203125, -1.4381103515625, -1.379638671875, -1.3211669921875, -1.2626953125, -1.2042236328125, -1.145751953125, -1.0872802734375, -1.02880859375, -0.9703369140625, -0.911865234375, -0.8533935546875, -0.794921875, -0.7364501953125, -0.677978515625, -0.6195068359375, -0.56103515625, -0.5025634765625, -0.444091796875, -0.3856201171875, -0.3271484375, -0.2686767578125, -0.210205078125, -0.1517333984375, -0.09326171875, -0.0347900390625, 0.023681640625, 0.0821533203125, 0.140625, 0.1990966796875, 0.257568359375, 0.3160400390625, 0.37451171875, 0.4329833984375, 0.491455078125, 0.5499267578125, 0.6083984375, 0.6668701171875, 0.725341796875, 0.7838134765625, 0.84228515625, 0.9007568359375, 0.959228515625, 1.0177001953125, 1.076171875, 1.1346435546875, 1.193115234375, 1.2515869140625, 1.31005859375, 1.3685302734375, 1.427001953125, 1.4854736328125, 1.5439453125, 1.6024169921875, 1.660888671875, 1.7193603515625, 1.77783203125, 1.8363037109375, 1.894775390625, 1.9532470703125, 2.01171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 0.0, 0.0, 7.0, 5.0, 6.0, 16.0, 19.0, 22.0, 37.0, 39.0, 51.0, 64.0, 115.0, 115.0, 121.0, 99.0, 82.0, 72.0, 41.0, 24.0, 19.0, 13.0, 13.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.636713027954102e-05, -8.303392678499222e-05, -7.970072329044342e-05, -7.636751979589462e-05, -7.303431630134583e-05, -6.970111280679703e-05, -6.636790931224823e-05, -6.303470581769943e-05, -5.9701502323150635e-05, -5.636829882860184e-05, -5.303509533405304e-05, -4.970189183950424e-05, -4.6368688344955444e-05, -4.303548485040665e-05, -3.970228135585785e-05, -3.636907786130905e-05, -3.3035874366760254e-05, -2.9702670872211456e-05, -2.636946737766266e-05, -2.303626388311386e-05, -1.9703060388565063e-05, -1.6369856894016266e-05, -1.3036653399467468e-05, -9.70344990491867e-06, -6.370246410369873e-06, -3.0370429158210754e-06, 2.9616057872772217e-07, 3.6293640732765198e-06, 6.962567567825317e-06, 1.0295771062374115e-05, 1.3628974556922913e-05, 1.696217805147171e-05, 2.0295381546020508e-05, 2.3628585040569305e-05, 2.6961788535118103e-05, 3.02949920296669e-05, 3.36281955242157e-05, 3.6961399018764496e-05, 4.0294602513313293e-05, 4.362780600786209e-05, 4.696100950241089e-05, 5.0294212996959686e-05, 5.3627416491508484e-05, 5.696061998605728e-05, 6.029382348060608e-05, 6.362702697515488e-05, 6.696023046970367e-05, 7.029343396425247e-05, 7.362663745880127e-05, 7.695984095335007e-05, 8.029304444789886e-05, 8.362624794244766e-05, 8.695945143699646e-05, 9.029265493154526e-05, 9.362585842609406e-05, 9.695906192064285e-05, 0.00010029226541519165, 0.00010362546890974045, 0.00010695867240428925, 0.00011029187589883804, 0.00011362507939338684, 0.00011695828288793564, 0.00012029148638248444, 0.00012362468987703323, 0.00012695789337158203]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 4.0, 8.0, 6.0, 8.0, 12.0, 23.0, 19.0, 56.0, 96.0, 292.0, 799.0, 3221.0, 18739.0, 495501.0, 505544.0, 19326.0, 3435.0, 903.0, 304.0, 108.0, 52.0, 26.0, 16.0, 16.0, 3.0, 2.0, 6.0, 4.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.75189208984375, -1.6893310546875, -1.62677001953125, -1.564208984375, -1.50164794921875, -1.4390869140625, -1.37652587890625, -1.31396484375, -1.25140380859375, -1.1888427734375, -1.12628173828125, -1.063720703125, -1.00115966796875, -0.9385986328125, -0.87603759765625, -0.8134765625, -0.75091552734375, -0.6883544921875, -0.62579345703125, -0.563232421875, -0.50067138671875, -0.4381103515625, -0.37554931640625, -0.31298828125, -0.25042724609375, -0.1878662109375, -0.12530517578125, -0.062744140625, -0.00018310546875, 0.0623779296875, 0.12493896484375, 0.1875, 0.25006103515625, 0.3126220703125, 0.37518310546875, 0.437744140625, 0.50030517578125, 0.5628662109375, 0.62542724609375, 0.68798828125, 0.75054931640625, 0.8131103515625, 0.87567138671875, 0.938232421875, 1.00079345703125, 1.0633544921875, 1.12591552734375, 1.1884765625, 1.25103759765625, 1.3135986328125, 1.37615966796875, 1.438720703125, 1.50128173828125, 1.5638427734375, 1.62640380859375, 1.68896484375, 1.75152587890625, 1.8140869140625, 1.87664794921875, 1.939208984375, 2.00177001953125, 2.0643310546875, 2.12689208984375, 2.189453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 6.0, 6.0, 12.0, 10.0, 16.0, 24.0, 32.0, 49.0, 79.0, 127.0, 162.0, 152.0, 108.0, 70.0, 38.0, 25.0, 16.0, 11.0, 7.0, 5.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6005859375, -0.5773391723632812, -0.5540924072265625, -0.5308456420898438, -0.507598876953125, -0.48435211181640625, -0.4611053466796875, -0.43785858154296875, -0.41461181640625, -0.39136505126953125, -0.3681182861328125, -0.34487152099609375, -0.321624755859375, -0.29837799072265625, -0.2751312255859375, -0.25188446044921875, -0.2286376953125, -0.20539093017578125, -0.1821441650390625, -0.15889739990234375, -0.135650634765625, -0.11240386962890625, -0.0891571044921875, -0.06591033935546875, -0.04266357421875, -0.01941680908203125, 0.0038299560546875, 0.02707672119140625, 0.050323486328125, 0.07357025146484375, 0.0968170166015625, 0.12006378173828125, 0.143310546875, 0.16655731201171875, 0.1898040771484375, 0.21305084228515625, 0.236297607421875, 0.25954437255859375, 0.2827911376953125, 0.30603790283203125, 0.32928466796875, 0.35253143310546875, 0.3757781982421875, 0.39902496337890625, 0.422271728515625, 0.44551849365234375, 0.4687652587890625, 0.49201202392578125, 0.5152587890625, 0.5385055541992188, 0.5617523193359375, 0.5849990844726562, 0.608245849609375, 0.6314926147460938, 0.6547393798828125, 0.6779861450195312, 0.70123291015625, 0.7244796752929688, 0.7477264404296875, 0.7709732055664062, 0.794219970703125, 0.8174667358398438, 0.8407135009765625, 0.8639602661132812, 0.88720703125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 524.0, 481.0, 9.0, 2.0, 1.0, 1.0], "bins": [-175.54312133789062, -172.56423950195312, -169.58535766601562, -166.60647583007812, -163.62759399414062, -160.64871215820312, -157.66983032226562, -154.69094848632812, -151.71206665039062, -148.73318481445312, -145.75430297851562, -142.77542114257812, -139.79653930664062, -136.81765747070312, -133.83877563476562, -130.85989379882812, -127.88101959228516, -124.90213775634766, -121.92325592041016, -118.94437408447266, -115.96549224853516, -112.98661041259766, -110.00773620605469, -107.02885437011719, -104.04997253417969, -101.07109069824219, -98.09220886230469, -95.11332702636719, -92.13444519042969, -89.15556335449219, -86.17668151855469, -83.19779968261719, -80.21891784667969, -77.24003601074219, -74.26115417480469, -71.28227233886719, -68.30339050292969, -65.32450866699219, -62.34563064575195, -59.36674880981445, -56.38787078857422, -53.40898895263672, -50.43010711669922, -47.45122528076172, -44.47234344482422, -41.49346160888672, -38.514583587646484, -35.535701751708984, -32.556819915771484, -29.577938079833984, -26.599056243896484, -23.620176315307617, -20.641294479370117, -17.662412643432617, -14.68353271484375, -11.70465087890625, -8.72576904296875, -5.746887683868408, -2.7680063247680664, 0.2108745574951172, 3.189756393432617, 6.168638229370117, 9.147518157958984, 12.126399993896484, 15.105281829833984]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 15.0, 31.0, 42.0, 56.0, 88.0, 94.0, 126.0, 119.0, 116.0, 99.0, 79.0, 45.0, 22.0, 34.0, 19.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.14976692199707, -11.889132499694824, -11.628498077392578, -11.367863655090332, -11.107229232788086, -10.84659481048584, -10.585960388183594, -10.325325965881348, -10.064691543579102, -9.804057121276855, -9.54342269897461, -9.282788276672363, -9.022153854370117, -8.761519432067871, -8.500885009765625, -8.240250587463379, -7.979615688323975, -7.7189812660217285, -7.458346843719482, -7.197712421417236, -6.93707799911499, -6.676443576812744, -6.41580867767334, -6.155174255371094, -5.894539833068848, -5.633905410766602, -5.3732709884643555, -5.112636566162109, -4.852002143859863, -4.591367721557617, -4.330733299255371, -4.070098876953125, -3.809464454650879, -3.548830032348633, -3.2881956100463867, -3.0275611877441406, -2.7669267654418945, -2.5062923431396484, -2.2456576824188232, -1.9850232601165771, -1.724388837814331, -1.463754415512085, -1.2031199932098389, -0.9424854516983032, -0.6818510293960571, -0.42121660709381104, -0.1605820655822754, 0.1000523567199707, 0.3606867790222168, 0.6213212013244629, 0.8819556832313538, 1.1425901651382446, 1.4032245874404907, 1.6638590097427368, 1.9244935512542725, 2.1851279735565186, 2.4457623958587646, 2.7063968181610107, 2.967031240463257, 3.227665901184082, 3.488300323486328, 3.748934745788574, 4.00956916809082, 4.270203590393066, 4.5308380126953125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 16.0, 19.0, 32.0, 51.0, 78.0, 165.0, 428.0, 319793.0, 3873320.0, 259.0, 66.0, 27.0, 16.0, 8.0, 6.0, 1.0, 2.0], "bins": [-33.96875, -33.35137939453125, -32.7340087890625, -32.11663818359375, -31.499267578125, -30.88189697265625, -30.2645263671875, -29.64715576171875, -29.02978515625, -28.41241455078125, -27.7950439453125, -27.17767333984375, -26.560302734375, -25.94293212890625, -25.3255615234375, -24.70819091796875, -24.0908203125, -23.47344970703125, -22.8560791015625, -22.23870849609375, -21.621337890625, -21.00396728515625, -20.3865966796875, -19.76922607421875, -19.15185546875, -18.53448486328125, -17.9171142578125, -17.29974365234375, -16.682373046875, -16.06500244140625, -15.4476318359375, -14.83026123046875, -14.212890625, -13.59552001953125, -12.9781494140625, -12.36077880859375, -11.743408203125, -11.12603759765625, -10.5086669921875, -9.89129638671875, -9.27392578125, -8.65655517578125, -8.0391845703125, -7.42181396484375, -6.804443359375, -6.18707275390625, -5.5697021484375, -4.95233154296875, -4.3349609375, -3.71759033203125, -3.1002197265625, -2.48284912109375, -1.865478515625, -1.24810791015625, -0.6307373046875, -0.01336669921875, 0.60400390625, 1.22137451171875, 1.8387451171875, 2.45611572265625, 3.073486328125, 3.69085693359375, 4.3082275390625, 4.92559814453125, 5.54296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 19.0, 80.0, 269.0, 382.0, 177.0, 76.0, 12.0, 4.0], "bins": [-0.9345703125, -0.918818473815918, -0.9030666351318359, -0.8873147964477539, -0.8715629577636719, -0.8558111190795898, -0.8400592803955078, -0.8243074417114258, -0.8085556030273438, -0.7928037643432617, -0.7770519256591797, -0.7613000869750977, -0.7455482482910156, -0.7297964096069336, -0.7140445709228516, -0.6982927322387695, -0.6825408935546875, -0.6667890548706055, -0.6510372161865234, -0.6352853775024414, -0.6195335388183594, -0.6037817001342773, -0.5880298614501953, -0.5722780227661133, -0.5565261840820312, -0.5407743453979492, -0.5250225067138672, -0.5092706680297852, -0.4935188293457031, -0.4777669906616211, -0.46201515197753906, -0.44626331329345703, -0.430511474609375, -0.41475963592529297, -0.39900779724121094, -0.3832559585571289, -0.3675041198730469, -0.35175228118896484, -0.3360004425048828, -0.3202486038208008, -0.30449676513671875, -0.2887449264526367, -0.2729930877685547, -0.25724124908447266, -0.24148941040039062, -0.2257375717163086, -0.20998573303222656, -0.19423389434814453, -0.1784820556640625, -0.16273021697998047, -0.14697837829589844, -0.1312265396118164, -0.11547470092773438, -0.09972286224365234, -0.08397102355957031, -0.06821918487548828, -0.05246734619140625, -0.03671550750732422, -0.020963668823242188, -0.005211830139160156, 0.010540008544921875, 0.026291847229003906, 0.04204368591308594, 0.05779552459716797, 0.07354736328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 11.0, 35.0, 108.0, 235.0, 445.0, 474826.0, 3717958.0, 472.0, 140.0, 44.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-52.34375, -51.297119140625, -50.25048828125, -49.203857421875, -48.1572265625, -47.110595703125, -46.06396484375, -45.017333984375, -43.970703125, -42.924072265625, -41.87744140625, -40.830810546875, -39.7841796875, -38.737548828125, -37.69091796875, -36.644287109375, -35.59765625, -34.551025390625, -33.50439453125, -32.457763671875, -31.4111328125, -30.364501953125, -29.31787109375, -28.271240234375, -27.224609375, -26.177978515625, -25.13134765625, -24.084716796875, -23.0380859375, -21.991455078125, -20.94482421875, -19.898193359375, -18.8515625, -17.804931640625, -16.75830078125, -15.711669921875, -14.6650390625, -13.618408203125, -12.57177734375, -11.525146484375, -10.478515625, -9.431884765625, -8.38525390625, -7.338623046875, -6.2919921875, -5.245361328125, -4.19873046875, -3.152099609375, -2.10546875, -1.058837890625, -0.01220703125, 1.034423828125, 2.0810546875, 3.127685546875, 4.17431640625, 5.220947265625, 6.267578125, 7.314208984375, 8.36083984375, 9.407470703125, 10.4541015625, 11.500732421875, 12.54736328125, 13.593994140625, 14.640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 326.0, 3659.0, 79.0, 15.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.359375, -4.2670440673828125, -4.174713134765625, -4.0823822021484375, -3.99005126953125, -3.8977203369140625, -3.805389404296875, -3.7130584716796875, -3.6207275390625, -3.5283966064453125, -3.436065673828125, -3.3437347412109375, -3.25140380859375, -3.1590728759765625, -3.066741943359375, -2.9744110107421875, -2.882080078125, -2.7897491455078125, -2.697418212890625, -2.6050872802734375, -2.51275634765625, -2.4204254150390625, -2.328094482421875, -2.2357635498046875, -2.1434326171875, -2.0511016845703125, -1.958770751953125, -1.8664398193359375, -1.77410888671875, -1.6817779541015625, -1.589447021484375, -1.4971160888671875, -1.40478515625, -1.3124542236328125, -1.220123291015625, -1.1277923583984375, -1.03546142578125, -0.9431304931640625, -0.850799560546875, -0.7584686279296875, -0.6661376953125, -0.5738067626953125, -0.481475830078125, -0.3891448974609375, -0.29681396484375, -0.2044830322265625, -0.112152099609375, -0.0198211669921875, 0.072509765625, 0.1648406982421875, 0.257171630859375, 0.3495025634765625, 0.44183349609375, 0.5341644287109375, 0.626495361328125, 0.7188262939453125, 0.8111572265625, 0.9034881591796875, 0.995819091796875, 1.0881500244140625, 1.18048095703125, 1.2728118896484375, 1.365142822265625, 1.4574737548828125, 1.5498046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 257.0, 715.0, 27.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.99972534179688, -63.67671203613281, -62.35369873046875, -61.03068542480469, -59.707672119140625, -58.38465881347656, -57.0616455078125, -55.73863220214844, -54.415618896484375, -53.09260559082031, -51.76959228515625, -50.44657897949219, -49.123565673828125, -47.80055236816406, -46.4775390625, -45.15452575683594, -43.83150863647461, -42.50849533081055, -41.185482025146484, -39.86246871948242, -38.53945541381836, -37.2164421081543, -35.893428802490234, -34.570411682128906, -33.247398376464844, -31.92438507080078, -30.60137176513672, -29.278358459472656, -27.955345153808594, -26.63233184814453, -25.309316635131836, -23.986303329467773, -22.663288116455078, -21.340274810791016, -20.017261505126953, -18.69424819946289, -17.371234893798828, -16.048221588134766, -14.72520637512207, -13.402193069458008, -12.079179763793945, -10.756166458129883, -9.43315315246582, -8.110138893127441, -6.787125587463379, -5.464112281799316, -4.141098499298096, -2.818084716796875, -1.4950714111328125, -0.1720578670501709, 1.1509556770324707, 2.4739692211151123, 3.796982765197754, 5.119996070861816, 6.443009853363037, 7.766023635864258, 9.08903694152832, 10.412050247192383, 11.735063552856445, 13.058077812194824, 14.381091117858887, 15.70410442352295, 17.027118682861328, 18.35013198852539, 19.673145294189453]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 19.0, 31.0, 51.0, 86.0, 141.0, 150.0, 158.0, 133.0, 95.0, 70.0, 34.0, 17.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.002391815185547, -14.516193389892578, -14.029995918273926, -13.543798446655273, -13.057600021362305, -12.571401596069336, -12.085204124450684, -11.599006652832031, -11.112808227539062, -10.626609802246094, -10.140412330627441, -9.654214859008789, -9.16801643371582, -8.681818008422852, -8.1956205368042, -7.709422588348389, -7.223224639892578, -6.737026691436768, -6.250828742980957, -5.7646307945251465, -5.278432846069336, -4.792234897613525, -4.306036949157715, -3.8198390007019043, -3.3336410522460938, -2.847443103790283, -2.3612451553344727, -1.875047206878662, -1.3888492584228516, -0.902651309967041, -0.41645336151123047, 0.06974458694458008, 0.5559425354003906, 1.0421404838562012, 1.5283384323120117, 2.0145363807678223, 2.500734329223633, 2.9869322776794434, 3.473130226135254, 3.9593281745910645, 4.445526123046875, 4.9317240715026855, 5.417922019958496, 5.904119968414307, 6.390317916870117, 6.876515865325928, 7.362713813781738, 7.848911762237549, 8.33510971069336, 8.821308135986328, 9.30750560760498, 9.793703079223633, 10.279901504516602, 10.76609992980957, 11.252297401428223, 11.738494873046875, 12.224693298339844, 12.710891723632812, 13.197089195251465, 13.683286666870117, 14.169485092163086, 14.655683517456055, 15.141880989074707, 15.62807846069336, 16.114276885986328]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 14.0, 15.0, 16.0, 22.0, 38.0, 53.0, 73.0, 94.0, 190.0, 662.0, 3291.0, 92251.0, 937413.0, 12052.0, 1584.0, 376.0, 144.0, 78.0, 59.0, 38.0, 28.0, 18.0, 10.0, 12.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.63763427734375, -7.4080810546875, -7.17852783203125, -6.948974609375, -6.71942138671875, -6.4898681640625, -6.26031494140625, -6.03076171875, -5.80120849609375, -5.5716552734375, -5.34210205078125, -5.112548828125, -4.88299560546875, -4.6534423828125, -4.42388916015625, -4.1943359375, -3.96478271484375, -3.7352294921875, -3.50567626953125, -3.276123046875, -3.04656982421875, -2.8170166015625, -2.58746337890625, -2.35791015625, -2.12835693359375, -1.8988037109375, -1.66925048828125, -1.439697265625, -1.21014404296875, -0.9805908203125, -0.75103759765625, -0.521484375, -0.29193115234375, -0.0623779296875, 0.16717529296875, 0.396728515625, 0.62628173828125, 0.8558349609375, 1.08538818359375, 1.31494140625, 1.54449462890625, 1.7740478515625, 2.00360107421875, 2.233154296875, 2.46270751953125, 2.6922607421875, 2.92181396484375, 3.1513671875, 3.38092041015625, 3.6104736328125, 3.84002685546875, 4.069580078125, 4.29913330078125, 4.5286865234375, 4.75823974609375, 4.98779296875, 5.21734619140625, 5.4468994140625, 5.67645263671875, 5.906005859375, 6.13555908203125, 6.3651123046875, 6.59466552734375, 6.82421875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 32.0, 39.0, 82.0, 122.0, 171.0, 184.0, 155.0, 82.0, 79.0, 27.0, 15.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3194122314453125, -1.290191650390625, -1.2609710693359375, -1.23175048828125, -1.2025299072265625, -1.173309326171875, -1.1440887451171875, -1.1148681640625, -1.0856475830078125, -1.056427001953125, -1.0272064208984375, -0.99798583984375, -0.9687652587890625, -0.939544677734375, -0.9103240966796875, -0.881103515625, -0.8518829345703125, -0.822662353515625, -0.7934417724609375, -0.76422119140625, -0.7350006103515625, -0.705780029296875, -0.6765594482421875, -0.6473388671875, -0.6181182861328125, -0.588897705078125, -0.5596771240234375, -0.53045654296875, -0.5012359619140625, -0.472015380859375, -0.4427947998046875, -0.41357421875, -0.3843536376953125, -0.355133056640625, -0.3259124755859375, -0.29669189453125, -0.2674713134765625, -0.238250732421875, -0.2090301513671875, -0.1798095703125, -0.1505889892578125, -0.121368408203125, -0.0921478271484375, -0.06292724609375, -0.0337066650390625, -0.004486083984375, 0.0247344970703125, 0.053955078125, 0.0831756591796875, 0.112396240234375, 0.1416168212890625, 0.17083740234375, 0.2000579833984375, 0.229278564453125, 0.2584991455078125, 0.2877197265625, 0.3169403076171875, 0.346160888671875, 0.3753814697265625, 0.40460205078125, 0.4338226318359375, 0.463043212890625, 0.4922637939453125, 0.521484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 4.0, 13.0, 11.0, 8.0, 9.0, 22.0, 18.0, 34.0, 51.0, 71.0, 130.0, 369.0, 1454.0, 28794.0, 980652.0, 34574.0, 1605.0, 348.0, 125.0, 69.0, 43.0, 31.0, 22.0, 20.0, 26.0, 9.0, 5.0, 9.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.84246826171875, -4.6888427734375, -4.53521728515625, -4.381591796875, -4.22796630859375, -4.0743408203125, -3.92071533203125, -3.76708984375, -3.61346435546875, -3.4598388671875, -3.30621337890625, -3.152587890625, -2.99896240234375, -2.8453369140625, -2.69171142578125, -2.5380859375, -2.38446044921875, -2.2308349609375, -2.07720947265625, -1.923583984375, -1.76995849609375, -1.6163330078125, -1.46270751953125, -1.30908203125, -1.15545654296875, -1.0018310546875, -0.84820556640625, -0.694580078125, -0.54095458984375, -0.3873291015625, -0.23370361328125, -0.080078125, 0.07354736328125, 0.2271728515625, 0.38079833984375, 0.534423828125, 0.68804931640625, 0.8416748046875, 0.99530029296875, 1.14892578125, 1.30255126953125, 1.4561767578125, 1.60980224609375, 1.763427734375, 1.91705322265625, 2.0706787109375, 2.22430419921875, 2.3779296875, 2.53155517578125, 2.6851806640625, 2.83880615234375, 2.992431640625, 3.14605712890625, 3.2996826171875, 3.45330810546875, 3.60693359375, 3.76055908203125, 3.9141845703125, 4.06781005859375, 4.221435546875, 4.37506103515625, 4.5286865234375, 4.68231201171875, 4.8359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 8.0, 11.0, 10.0, 15.0, 21.0, 26.0, 36.0, 44.0, 36.0, 52.0, 67.0, 55.0, 49.0, 59.0, 67.0, 55.0, 56.0, 50.0, 42.0, 34.0, 38.0, 26.0, 24.0, 23.0, 18.0, 12.0, 12.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.505615234375, -1.45654296875, -1.407470703125, -1.3583984375, -1.309326171875, -1.26025390625, -1.211181640625, -1.162109375, -1.113037109375, -1.06396484375, -1.014892578125, -0.9658203125, -0.916748046875, -0.86767578125, -0.818603515625, -0.76953125, -0.720458984375, -0.67138671875, -0.622314453125, -0.5732421875, -0.524169921875, -0.47509765625, -0.426025390625, -0.376953125, -0.327880859375, -0.27880859375, -0.229736328125, -0.1806640625, -0.131591796875, -0.08251953125, -0.033447265625, 0.015625, 0.064697265625, 0.11376953125, 0.162841796875, 0.2119140625, 0.260986328125, 0.31005859375, 0.359130859375, 0.408203125, 0.457275390625, 0.50634765625, 0.555419921875, 0.6044921875, 0.653564453125, 0.70263671875, 0.751708984375, 0.80078125, 0.849853515625, 0.89892578125, 0.947998046875, 0.9970703125, 1.046142578125, 1.09521484375, 1.144287109375, 1.193359375, 1.242431640625, 1.29150390625, 1.340576171875, 1.3896484375, 1.438720703125, 1.48779296875, 1.536865234375, 1.5859375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 6.0, 10.0, 11.0, 41.0, 60.0, 170.0, 634.0, 6002.0, 1005879.0, 33976.0, 1243.0, 304.0, 104.0, 45.0, 27.0, 9.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.76885986328125, -5.6197509765625, -5.47064208984375, -5.321533203125, -5.17242431640625, -5.0233154296875, -4.87420654296875, -4.72509765625, -4.57598876953125, -4.4268798828125, -4.27777099609375, -4.128662109375, -3.97955322265625, -3.8304443359375, -3.68133544921875, -3.5322265625, -3.38311767578125, -3.2340087890625, -3.08489990234375, -2.935791015625, -2.78668212890625, -2.6375732421875, -2.48846435546875, -2.33935546875, -2.19024658203125, -2.0411376953125, -1.89202880859375, -1.742919921875, -1.59381103515625, -1.4447021484375, -1.29559326171875, -1.146484375, -0.99737548828125, -0.8482666015625, -0.69915771484375, -0.550048828125, -0.40093994140625, -0.2518310546875, -0.10272216796875, 0.04638671875, 0.19549560546875, 0.3446044921875, 0.49371337890625, 0.642822265625, 0.79193115234375, 0.9410400390625, 1.09014892578125, 1.2392578125, 1.38836669921875, 1.5374755859375, 1.68658447265625, 1.835693359375, 1.98480224609375, 2.1339111328125, 2.28302001953125, 2.43212890625, 2.58123779296875, 2.7303466796875, 2.87945556640625, 3.028564453125, 3.17767333984375, 3.3267822265625, 3.47589111328125, 3.625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 16.0, 14.0, 35.0, 40.0, 71.0, 76.0, 147.0, 163.0, 145.0, 79.0, 67.0, 46.0, 32.0, 20.0, 11.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021076202392578125, -0.00020498409867286682, -0.0001992061734199524, -0.00019342824816703796, -0.00018765032291412354, -0.0001818723976612091, -0.00017609447240829468, -0.00017031654715538025, -0.00016453862190246582, -0.0001587606966495514, -0.00015298277139663696, -0.00014720484614372253, -0.0001414269208908081, -0.00013564899563789368, -0.00012987107038497925, -0.00012409314513206482, -0.00011831521987915039, -0.00011253729462623596, -0.00010675936937332153, -0.0001009814441204071, -9.520351886749268e-05, -8.942559361457825e-05, -8.364766836166382e-05, -7.786974310874939e-05, -7.209181785583496e-05, -6.631389260292053e-05, -6.0535967350006104e-05, -5.4758042097091675e-05, -4.8980116844177246e-05, -4.320219159126282e-05, -3.742426633834839e-05, -3.164634108543396e-05, -2.586841583251953e-05, -2.0090490579605103e-05, -1.4312565326690674e-05, -8.534640073776245e-06, -2.7567148208618164e-06, 3.0212104320526123e-06, 8.799135684967041e-06, 1.457706093788147e-05, 2.03549861907959e-05, 2.6132911443710327e-05, 3.1910836696624756e-05, 3.7688761949539185e-05, 4.346668720245361e-05, 4.924461245536804e-05, 5.502253770828247e-05, 6.08004629611969e-05, 6.657838821411133e-05, 7.235631346702576e-05, 7.813423871994019e-05, 8.391216397285461e-05, 8.969008922576904e-05, 9.546801447868347e-05, 0.0001012459397315979, 0.00010702386498451233, 0.00011280179023742676, 0.00011857971549034119, 0.00012435764074325562, 0.00013013556599617004, 0.00013591349124908447, 0.0001416914165019989, 0.00014746934175491333, 0.00015324726700782776, 0.0001590251922607422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 12.0, 13.0, 18.0, 36.0, 42.0, 95.0, 237.0, 883.0, 6724.0, 766624.0, 268551.0, 4182.0, 737.0, 201.0, 81.0, 36.0, 24.0, 12.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.381622314453125, -3.27886962890625, -3.176116943359375, -3.0733642578125, -2.970611572265625, -2.86785888671875, -2.765106201171875, -2.662353515625, -2.559600830078125, -2.45684814453125, -2.354095458984375, -2.2513427734375, -2.148590087890625, -2.04583740234375, -1.943084716796875, -1.84033203125, -1.737579345703125, -1.63482666015625, -1.532073974609375, -1.4293212890625, -1.326568603515625, -1.22381591796875, -1.121063232421875, -1.018310546875, -0.915557861328125, -0.81280517578125, -0.710052490234375, -0.6072998046875, -0.504547119140625, -0.40179443359375, -0.299041748046875, -0.1962890625, -0.093536376953125, 0.00921630859375, 0.111968994140625, 0.2147216796875, 0.317474365234375, 0.42022705078125, 0.522979736328125, 0.625732421875, 0.728485107421875, 0.83123779296875, 0.933990478515625, 1.0367431640625, 1.139495849609375, 1.24224853515625, 1.345001220703125, 1.44775390625, 1.550506591796875, 1.65325927734375, 1.756011962890625, 1.8587646484375, 1.961517333984375, 2.06427001953125, 2.167022705078125, 2.269775390625, 2.372528076171875, 2.47528076171875, 2.578033447265625, 2.6807861328125, 2.783538818359375, 2.88629150390625, 2.989044189453125, 3.091796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 14.0, 7.0, 22.0, 37.0, 84.0, 122.0, 209.0, 218.0, 112.0, 67.0, 35.0, 17.0, 12.0, 11.0, 5.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.150390625, -1.11322021484375, -1.0760498046875, -1.03887939453125, -1.001708984375, -0.96453857421875, -0.9273681640625, -0.89019775390625, -0.85302734375, -0.81585693359375, -0.7786865234375, -0.74151611328125, -0.704345703125, -0.66717529296875, -0.6300048828125, -0.59283447265625, -0.5556640625, -0.51849365234375, -0.4813232421875, -0.44415283203125, -0.406982421875, -0.36981201171875, -0.3326416015625, -0.29547119140625, -0.25830078125, -0.22113037109375, -0.1839599609375, -0.14678955078125, -0.109619140625, -0.07244873046875, -0.0352783203125, 0.00189208984375, 0.0390625, 0.07623291015625, 0.1134033203125, 0.15057373046875, 0.187744140625, 0.22491455078125, 0.2620849609375, 0.29925537109375, 0.33642578125, 0.37359619140625, 0.4107666015625, 0.44793701171875, 0.485107421875, 0.52227783203125, 0.5594482421875, 0.59661865234375, 0.6337890625, 0.67095947265625, 0.7081298828125, 0.74530029296875, 0.782470703125, 0.81964111328125, 0.8568115234375, 0.89398193359375, 0.93115234375, 0.96832275390625, 1.0054931640625, 1.04266357421875, 1.079833984375, 1.11700439453125, 1.1541748046875, 1.19134521484375, 1.228515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 53.0, 419.0, 413.0, 89.0, 14.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.389394760131836, -25.473508834838867, -24.5576229095459, -23.64173698425293, -22.72585105895996, -21.809965133666992, -20.89407730102539, -19.978191375732422, -19.062305450439453, -18.146419525146484, -17.230533599853516, -16.314647674560547, -15.398761749267578, -14.48287582397461, -13.566988945007324, -12.651103019714355, -11.735218048095703, -10.819332122802734, -9.903446197509766, -8.987560272216797, -8.071674346923828, -7.155787944793701, -6.239901542663574, -5.3240156173706055, -4.408129692077637, -3.492243766784668, -2.57635760307312, -1.6604714393615723, -0.7445855140686035, 0.17130041122436523, 1.0871868133544922, 2.003072738647461, 2.9189605712890625, 3.8348464965820312, 4.750732421875, 5.666618824005127, 6.582504749298096, 7.4983906745910645, 8.414277076721191, 9.33016300201416, 10.246048927307129, 11.161934852600098, 12.077820777893066, 12.993707656860352, 13.90959358215332, 14.825479507446289, 15.741365432739258, 16.657251358032227, 17.573137283325195, 18.489023208618164, 19.404909133911133, 20.3207950592041, 21.23668098449707, 22.15256690979004, 23.06845474243164, 23.98434066772461, 24.900226593017578, 25.816112518310547, 26.731998443603516, 27.647884368896484, 28.563770294189453, 29.479656219482422, 30.39554214477539, 31.31142807006836, 32.22731399536133]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 8.0, 7.0, 10.0, 17.0, 15.0, 19.0, 20.0, 37.0, 39.0, 45.0, 48.0, 47.0, 75.0, 56.0, 56.0, 71.0, 49.0, 49.0, 57.0, 46.0, 37.0, 35.0, 27.0, 27.0, 20.0, 21.0, 11.0, 9.0, 12.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.838167190551758, -9.514019966125488, -9.189872741699219, -8.86572551727295, -8.54157829284668, -8.217430114746094, -7.893282890319824, -7.569135665893555, -7.244988441467285, -6.920841217041016, -6.596693992614746, -6.272546291351318, -5.948399066925049, -5.624251842498779, -5.300104141235352, -4.975956916809082, -4.6518096923828125, -4.327662467956543, -4.003515243530273, -3.6793675422668457, -3.355220317840576, -3.0310730934143066, -2.706925630569458, -2.3827781677246094, -2.05863094329834, -1.7344835996627808, -1.4103362560272217, -1.0861889123916626, -0.7620415687561035, -0.43789422512054443, -0.11374688148498535, 0.21040058135986328, 0.5345468521118164, 0.8586941957473755, 1.1828415393829346, 1.5069888830184937, 1.8311362266540527, 2.1552834510803223, 2.479430913925171, 2.8035783767700195, 3.127725601196289, 3.4518728256225586, 3.7760202884674072, 4.100167751312256, 4.424314975738525, 4.748462200164795, 5.072609901428223, 5.396757125854492, 5.720904350280762, 6.045051574707031, 6.369198799133301, 6.6933465003967285, 7.017493724822998, 7.341640949249268, 7.665788650512695, 7.989935874938965, 8.314083099365234, 8.638230323791504, 8.962377548217773, 9.286524772644043, 9.610671997070312, 9.934820175170898, 10.258967399597168, 10.583114624023438, 10.907261848449707]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 4.0, 6.0, 14.0, 15.0, 21.0, 20.0, 32.0, 48.0, 68.0, 70.0, 129.0, 212.0, 518.0, 1811.0, 17013.0, 4011289.0, 157567.0, 4485.0, 679.0, 164.0, 56.0, 29.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.125, -12.8502197265625, -12.575439453125, -12.3006591796875, -12.02587890625, -11.7510986328125, -11.476318359375, -11.2015380859375, -10.9267578125, -10.6519775390625, -10.377197265625, -10.1024169921875, -9.82763671875, -9.5528564453125, -9.278076171875, -9.0032958984375, -8.728515625, -8.4537353515625, -8.178955078125, -7.9041748046875, -7.62939453125, -7.3546142578125, -7.079833984375, -6.8050537109375, -6.5302734375, -6.2554931640625, -5.980712890625, -5.7059326171875, -5.43115234375, -5.1563720703125, -4.881591796875, -4.6068115234375, -4.33203125, -4.0572509765625, -3.782470703125, -3.5076904296875, -3.23291015625, -2.9581298828125, -2.683349609375, -2.4085693359375, -2.1337890625, -1.8590087890625, -1.584228515625, -1.3094482421875, -1.03466796875, -0.7598876953125, -0.485107421875, -0.2103271484375, 0.064453125, 0.3392333984375, 0.614013671875, 0.8887939453125, 1.16357421875, 1.4383544921875, 1.713134765625, 1.9879150390625, 2.2626953125, 2.5374755859375, 2.812255859375, 3.0870361328125, 3.36181640625, 3.6365966796875, 3.911376953125, 4.1861572265625, 4.4609375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 10.0, 17.0, 40.0, 64.0, 99.0, 125.0, 171.0, 160.0, 113.0, 84.0, 51.0, 34.0, 20.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.435546875, -1.407806396484375, -1.38006591796875, -1.352325439453125, -1.3245849609375, -1.296844482421875, -1.26910400390625, -1.241363525390625, -1.213623046875, -1.185882568359375, -1.15814208984375, -1.130401611328125, -1.1026611328125, -1.074920654296875, -1.04718017578125, -1.019439697265625, -0.99169921875, -0.963958740234375, -0.93621826171875, -0.908477783203125, -0.8807373046875, -0.852996826171875, -0.82525634765625, -0.797515869140625, -0.769775390625, -0.742034912109375, -0.71429443359375, -0.686553955078125, -0.6588134765625, -0.631072998046875, -0.60333251953125, -0.575592041015625, -0.5478515625, -0.520111083984375, -0.49237060546875, -0.464630126953125, -0.4368896484375, -0.409149169921875, -0.38140869140625, -0.353668212890625, -0.325927734375, -0.298187255859375, -0.27044677734375, -0.242706298828125, -0.2149658203125, -0.187225341796875, -0.15948486328125, -0.131744384765625, -0.10400390625, -0.076263427734375, -0.04852294921875, -0.020782470703125, 0.0069580078125, 0.034698486328125, 0.06243896484375, 0.090179443359375, 0.117919921875, 0.145660400390625, 0.17340087890625, 0.201141357421875, 0.2288818359375, 0.256622314453125, 0.28436279296875, 0.312103271484375, 0.33984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 33.0, 70.0, 210.0, 1081.0, 4188066.0, 4516.0, 206.0, 66.0, 20.0, 8.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -63.167724609375, -61.89794921875, -60.628173828125, -59.3583984375, -58.088623046875, -56.81884765625, -55.549072265625, -54.279296875, -53.009521484375, -51.73974609375, -50.469970703125, -49.2001953125, -47.930419921875, -46.66064453125, -45.390869140625, -44.12109375, -42.851318359375, -41.58154296875, -40.311767578125, -39.0419921875, -37.772216796875, -36.50244140625, -35.232666015625, -33.962890625, -32.693115234375, -31.42333984375, -30.153564453125, -28.8837890625, -27.614013671875, -26.34423828125, -25.074462890625, -23.8046875, -22.534912109375, -21.26513671875, -19.995361328125, -18.7255859375, -17.455810546875, -16.18603515625, -14.916259765625, -13.646484375, -12.376708984375, -11.10693359375, -9.837158203125, -8.5673828125, -7.297607421875, -6.02783203125, -4.758056640625, -3.48828125, -2.218505859375, -0.94873046875, 0.321044921875, 1.5908203125, 2.860595703125, 4.13037109375, 5.400146484375, 6.669921875, 7.939697265625, 9.20947265625, 10.479248046875, 11.7490234375, 13.018798828125, 14.28857421875, 15.558349609375, 16.828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 17.0, 50.0, 458.0, 3389.0, 109.0, 32.0, 18.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.02734375, -5.918327331542969, -5.8093109130859375, -5.700294494628906, -5.591278076171875, -5.482261657714844, -5.3732452392578125, -5.264228820800781, -5.15521240234375, -5.046195983886719, -4.9371795654296875, -4.828163146972656, -4.719146728515625, -4.610130310058594, -4.5011138916015625, -4.392097473144531, -4.2830810546875, -4.174064636230469, -4.0650482177734375, -3.9560317993164062, -3.847015380859375, -3.7379989624023438, -3.6289825439453125, -3.5199661254882812, -3.41094970703125, -3.3019332885742188, -3.1929168701171875, -3.0839004516601562, -2.974884033203125, -2.8658676147460938, -2.7568511962890625, -2.6478347778320312, -2.538818359375, -2.4298019409179688, -2.3207855224609375, -2.2117691040039062, -2.102752685546875, -1.9937362670898438, -1.8847198486328125, -1.7757034301757812, -1.66668701171875, -1.5576705932617188, -1.4486541748046875, -1.3396377563476562, -1.230621337890625, -1.1216049194335938, -1.0125885009765625, -0.9035720825195312, -0.7945556640625, -0.6855392456054688, -0.5765228271484375, -0.46750640869140625, -0.358489990234375, -0.24947357177734375, -0.1404571533203125, -0.03144073486328125, 0.07757568359375, 0.18659210205078125, 0.2956085205078125, 0.40462493896484375, 0.513641357421875, 0.6226577758789062, 0.7316741943359375, 0.8406906127929688, 0.94970703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 13.0, 95.0, 846.0, 42.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.04470443725586, -29.828142166137695, -28.61157989501953, -27.395017623901367, -26.178455352783203, -24.96189308166504, -23.745330810546875, -22.52876853942871, -21.312206268310547, -20.095643997192383, -18.87908172607422, -17.662519454956055, -16.44595718383789, -15.229394912719727, -14.012832641601562, -12.796270370483398, -11.579708099365234, -10.36314582824707, -9.146583557128906, -7.930021286010742, -6.713459014892578, -5.496896743774414, -4.28033447265625, -3.063772201538086, -1.8472099304199219, -0.6306476593017578, 0.5859146118164062, 1.8024768829345703, 3.0190391540527344, 4.235601425170898, 5.4521636962890625, 6.668725967407227, 7.885284423828125, 9.101846694946289, 10.318408966064453, 11.534971237182617, 12.751533508300781, 13.968095779418945, 15.18465805053711, 16.401220321655273, 17.617782592773438, 18.8343448638916, 20.050907135009766, 21.26746940612793, 22.484031677246094, 23.700593948364258, 24.917156219482422, 26.133718490600586, 27.35028076171875, 28.566843032836914, 29.783405303955078, 30.999967575073242, 32.216529846191406, 33.43309020996094, 34.649654388427734, 35.86621856689453, 37.08277893066406, 38.299339294433594, 39.51590347290039, 40.73246765136719, 41.94902801513672, 43.16558837890625, 44.38215255737305, 45.598716735839844, 46.815277099609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 27.0, 40.0, 60.0, 76.0, 93.0, 117.0, 127.0, 100.0, 98.0, 88.0, 59.0, 45.0, 20.0, 18.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.386377334594727, -13.97288990020752, -13.559402465820312, -13.145914077758789, -12.732426643371582, -12.318939208984375, -11.905450820922852, -11.491963386535645, -11.078475952148438, -10.66498851776123, -10.251501083374023, -9.8380126953125, -9.424525260925293, -9.011037826538086, -8.597549438476562, -8.184062004089355, -7.770574569702148, -7.357087135314941, -6.943599224090576, -6.530111312866211, -6.116623878479004, -5.703136444091797, -5.289648532867432, -4.876160621643066, -4.462673187255859, -4.049185752868652, -3.635697841644287, -3.222210168838501, -2.808722496032715, -2.3952348232269287, -1.9817471504211426, -1.5682594776153564, -1.1547718048095703, -0.7412841320037842, -0.32779645919799805, 0.08569121360778809, 0.4991788864135742, 0.9126665592193604, 1.3261542320251465, 1.7396419048309326, 2.1531295776367188, 2.566617250442505, 2.980104923248291, 3.393592596054077, 3.8070802688598633, 4.22056770324707, 4.6340556144714355, 5.047543525695801, 5.461030960083008, 5.874518394470215, 6.28800630569458, 6.701494216918945, 7.114981651306152, 7.528469085693359, 7.941956996917725, 8.35544490814209, 8.768932342529297, 9.182419776916504, 9.595907211303711, 10.009395599365234, 10.422883033752441, 10.836370468139648, 11.249858856201172, 11.663346290588379, 12.076833724975586]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 11.0, 9.0, 15.0, 19.0, 27.0, 43.0, 50.0, 79.0, 123.0, 186.0, 324.0, 634.0, 1592.0, 6850.0, 55422.0, 745943.0, 214990.0, 16898.0, 3124.0, 1015.0, 469.0, 267.0, 148.0, 94.0, 68.0, 48.0, 28.0, 19.0, 14.0, 14.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.73809814453125, -4.5933837890625, -4.44866943359375, -4.303955078125, -4.15924072265625, -4.0145263671875, -3.86981201171875, -3.72509765625, -3.58038330078125, -3.4356689453125, -3.29095458984375, -3.146240234375, -3.00152587890625, -2.8568115234375, -2.71209716796875, -2.5673828125, -2.42266845703125, -2.2779541015625, -2.13323974609375, -1.988525390625, -1.84381103515625, -1.6990966796875, -1.55438232421875, -1.40966796875, -1.26495361328125, -1.1202392578125, -0.97552490234375, -0.830810546875, -0.68609619140625, -0.5413818359375, -0.39666748046875, -0.251953125, -0.10723876953125, 0.0374755859375, 0.18218994140625, 0.326904296875, 0.47161865234375, 0.6163330078125, 0.76104736328125, 0.90576171875, 1.05047607421875, 1.1951904296875, 1.33990478515625, 1.484619140625, 1.62933349609375, 1.7740478515625, 1.91876220703125, 2.0634765625, 2.20819091796875, 2.3529052734375, 2.49761962890625, 2.642333984375, 2.78704833984375, 2.9317626953125, 3.07647705078125, 3.22119140625, 3.36590576171875, 3.5106201171875, 3.65533447265625, 3.800048828125, 3.94476318359375, 4.0894775390625, 4.23419189453125, 4.37890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 22.0, 33.0, 34.0, 60.0, 87.0, 99.0, 96.0, 115.0, 99.0, 92.0, 89.0, 51.0, 38.0, 36.0, 14.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.369140625, -1.3360214233398438, -1.3029022216796875, -1.2697830200195312, -1.236663818359375, -1.2035446166992188, -1.1704254150390625, -1.1373062133789062, -1.10418701171875, -1.0710678100585938, -1.0379486083984375, -1.0048294067382812, -0.971710205078125, -0.9385910034179688, -0.9054718017578125, -0.8723526000976562, -0.8392333984375, -0.8061141967773438, -0.7729949951171875, -0.7398757934570312, -0.706756591796875, -0.6736373901367188, -0.6405181884765625, -0.6073989868164062, -0.57427978515625, -0.5411605834960938, -0.5080413818359375, -0.47492218017578125, -0.441802978515625, -0.40868377685546875, -0.3755645751953125, -0.34244537353515625, -0.309326171875, -0.27620697021484375, -0.2430877685546875, -0.20996856689453125, -0.176849365234375, -0.14373016357421875, -0.1106109619140625, -0.07749176025390625, -0.04437255859375, -0.01125335693359375, 0.0218658447265625, 0.05498504638671875, 0.088104248046875, 0.12122344970703125, 0.1543426513671875, 0.18746185302734375, 0.2205810546875, 0.25370025634765625, 0.2868194580078125, 0.31993865966796875, 0.353057861328125, 0.38617706298828125, 0.4192962646484375, 0.45241546630859375, 0.48553466796875, 0.5186538696289062, 0.5517730712890625, 0.5848922729492188, 0.618011474609375, 0.6511306762695312, 0.6842498779296875, 0.7173690795898438, 0.75048828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 18.0, 16.0, 20.0, 41.0, 46.0, 74.0, 119.0, 241.0, 657.0, 2597.0, 28157.0, 832524.0, 174766.0, 7215.0, 1180.0, 379.0, 163.0, 83.0, 64.0, 42.0, 36.0, 22.0, 27.0, 9.0, 9.0, 5.0, 5.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.203125, -4.06182861328125, -3.9205322265625, -3.77923583984375, -3.637939453125, -3.49664306640625, -3.3553466796875, -3.21405029296875, -3.07275390625, -2.93145751953125, -2.7901611328125, -2.64886474609375, -2.507568359375, -2.36627197265625, -2.2249755859375, -2.08367919921875, -1.9423828125, -1.80108642578125, -1.6597900390625, -1.51849365234375, -1.377197265625, -1.23590087890625, -1.0946044921875, -0.95330810546875, -0.81201171875, -0.67071533203125, -0.5294189453125, -0.38812255859375, -0.246826171875, -0.10552978515625, 0.0357666015625, 0.17706298828125, 0.318359375, 0.45965576171875, 0.6009521484375, 0.74224853515625, 0.883544921875, 1.02484130859375, 1.1661376953125, 1.30743408203125, 1.44873046875, 1.59002685546875, 1.7313232421875, 1.87261962890625, 2.013916015625, 2.15521240234375, 2.2965087890625, 2.43780517578125, 2.5791015625, 2.72039794921875, 2.8616943359375, 3.00299072265625, 3.144287109375, 3.28558349609375, 3.4268798828125, 3.56817626953125, 3.70947265625, 3.85076904296875, 3.9920654296875, 4.13336181640625, 4.274658203125, 4.41595458984375, 4.5572509765625, 4.69854736328125, 4.83984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 4.0, 7.0, 5.0, 10.0, 16.0, 23.0, 25.0, 33.0, 38.0, 41.0, 56.0, 55.0, 46.0, 59.0, 67.0, 68.0, 62.0, 65.0, 50.0, 52.0, 46.0, 39.0, 25.0, 26.0, 18.0, 20.0, 10.0, 9.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.626953125, -2.539031982421875, -2.45111083984375, -2.363189697265625, -2.2752685546875, -2.187347412109375, -2.09942626953125, -2.011505126953125, -1.923583984375, -1.835662841796875, -1.74774169921875, -1.659820556640625, -1.5718994140625, -1.483978271484375, -1.39605712890625, -1.308135986328125, -1.22021484375, -1.132293701171875, -1.04437255859375, -0.956451416015625, -0.8685302734375, -0.780609130859375, -0.69268798828125, -0.604766845703125, -0.516845703125, -0.428924560546875, -0.34100341796875, -0.253082275390625, -0.1651611328125, -0.077239990234375, 0.01068115234375, 0.098602294921875, 0.1865234375, 0.274444580078125, 0.36236572265625, 0.450286865234375, 0.5382080078125, 0.626129150390625, 0.71405029296875, 0.801971435546875, 0.889892578125, 0.977813720703125, 1.06573486328125, 1.153656005859375, 1.2415771484375, 1.329498291015625, 1.41741943359375, 1.505340576171875, 1.59326171875, 1.681182861328125, 1.76910400390625, 1.857025146484375, 1.9449462890625, 2.032867431640625, 2.12078857421875, 2.208709716796875, 2.296630859375, 2.384552001953125, 2.47247314453125, 2.560394287109375, 2.6483154296875, 2.736236572265625, 2.82415771484375, 2.912078857421875, 3.0]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 10.0, 12.0, 11.0, 14.0, 18.0, 18.0, 49.0, 63.0, 77.0, 137.0, 206.0, 336.0, 593.0, 1032.0, 1967.0, 4228.0, 10341.0, 35416.0, 203334.0, 621505.0, 127609.0, 25477.0, 8418.0, 3585.0, 1750.0, 926.0, 516.0, 320.0, 170.0, 111.0, 76.0, 62.0, 38.0, 30.0, 16.0, 20.0, 6.0, 10.0, 4.0, 4.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.80224609375, -0.7789154052734375, -0.755584716796875, -0.7322540283203125, -0.70892333984375, -0.6855926513671875, -0.662261962890625, -0.6389312744140625, -0.6156005859375, -0.5922698974609375, -0.568939208984375, -0.5456085205078125, -0.52227783203125, -0.4989471435546875, -0.475616455078125, -0.4522857666015625, -0.428955078125, -0.4056243896484375, -0.382293701171875, -0.3589630126953125, -0.33563232421875, -0.3123016357421875, -0.288970947265625, -0.2656402587890625, -0.2423095703125, -0.2189788818359375, -0.195648193359375, -0.1723175048828125, -0.14898681640625, -0.1256561279296875, -0.102325439453125, -0.0789947509765625, -0.0556640625, -0.0323333740234375, -0.009002685546875, 0.0143280029296875, 0.03765869140625, 0.0609893798828125, 0.084320068359375, 0.1076507568359375, 0.1309814453125, 0.1543121337890625, 0.177642822265625, 0.2009735107421875, 0.22430419921875, 0.2476348876953125, 0.270965576171875, 0.2942962646484375, 0.317626953125, 0.3409576416015625, 0.364288330078125, 0.3876190185546875, 0.41094970703125, 0.4342803955078125, 0.457611083984375, 0.4809417724609375, 0.5042724609375, 0.5276031494140625, 0.550933837890625, 0.5742645263671875, 0.59759521484375, 0.6209259033203125, 0.644256591796875, 0.6675872802734375, 0.69091796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 8.0, 11.0, 23.0, 25.0, 26.0, 48.0, 72.0, 111.0, 129.0, 174.0, 124.0, 78.0, 51.0, 31.0, 12.0, 19.0, 15.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001704692840576172, -0.00016530044376850128, -0.00016013160347938538, -0.00015496276319026947, -0.00014979392290115356, -0.00014462508261203766, -0.00013945624232292175, -0.00013428740203380585, -0.00012911856174468994, -0.00012394972145557404, -0.00011878088116645813, -0.00011361204087734222, -0.00010844320058822632, -0.00010327436029911041, -9.810552000999451e-05, -9.29366797208786e-05, -8.77678394317627e-05, -8.259899914264679e-05, -7.743015885353088e-05, -7.226131856441498e-05, -6.709247827529907e-05, -6.192363798618317e-05, -5.675479769706726e-05, -5.1585957407951355e-05, -4.641711711883545e-05, -4.1248276829719543e-05, -3.607943654060364e-05, -3.091059625148773e-05, -2.5741755962371826e-05, -2.057291567325592e-05, -1.5404075384140015e-05, -1.0235235095024109e-05, -5.066394805908203e-06, 1.0244548320770264e-07, 5.271285772323608e-06, 1.0440126061439514e-05, 1.560896635055542e-05, 2.0777806639671326e-05, 2.594664692878723e-05, 3.111548721790314e-05, 3.628432750701904e-05, 4.145316779613495e-05, 4.6622008085250854e-05, 5.179084837436676e-05, 5.6959688663482666e-05, 6.212852895259857e-05, 6.729736924171448e-05, 7.246620953083038e-05, 7.763504981994629e-05, 8.28038901090622e-05, 8.79727303981781e-05, 9.3141570687294e-05, 9.831041097640991e-05, 0.00010347925126552582, 0.00010864809155464172, 0.00011381693184375763, 0.00011898577213287354, 0.00012415461242198944, 0.00012932345271110535, 0.00013449229300022125, 0.00013966113328933716, 0.00014482997357845306, 0.00014999881386756897, 0.00015516765415668488, 0.00016033649444580078]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 13.0, 16.0, 31.0, 28.0, 43.0, 63.0, 100.0, 152.0, 305.0, 496.0, 1011.0, 2012.0, 4510.0, 11595.0, 50170.0, 519574.0, 400299.0, 40123.0, 10050.0, 3991.0, 1793.0, 929.0, 526.0, 283.0, 138.0, 94.0, 74.0, 32.0, 38.0, 16.0, 8.0, 9.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8876953125, -0.8590011596679688, -0.8303070068359375, -0.8016128540039062, -0.772918701171875, -0.7442245483398438, -0.7155303955078125, -0.6868362426757812, -0.65814208984375, -0.6294479370117188, -0.6007537841796875, -0.5720596313476562, -0.543365478515625, -0.5146713256835938, -0.4859771728515625, -0.45728302001953125, -0.4285888671875, -0.39989471435546875, -0.3712005615234375, -0.34250640869140625, -0.313812255859375, -0.28511810302734375, -0.2564239501953125, -0.22772979736328125, -0.19903564453125, -0.17034149169921875, -0.1416473388671875, -0.11295318603515625, -0.084259033203125, -0.05556488037109375, -0.0268707275390625, 0.00182342529296875, 0.030517578125, 0.05921173095703125, 0.0879058837890625, 0.11660003662109375, 0.145294189453125, 0.17398834228515625, 0.2026824951171875, 0.23137664794921875, 0.26007080078125, 0.28876495361328125, 0.3174591064453125, 0.34615325927734375, 0.374847412109375, 0.40354156494140625, 0.4322357177734375, 0.46092987060546875, 0.4896240234375, 0.5183181762695312, 0.5470123291015625, 0.5757064819335938, 0.604400634765625, 0.6330947875976562, 0.6617889404296875, 0.6904830932617188, 0.71917724609375, 0.7478713989257812, 0.7765655517578125, 0.8052597045898438, 0.833953857421875, 0.8626480102539062, 0.8913421630859375, 0.9200363159179688, 0.94873046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 7.0, 12.0, 17.0, 24.0, 32.0, 35.0, 57.0, 69.0, 85.0, 126.0, 115.0, 87.0, 95.0, 69.0, 50.0, 35.0, 20.0, 17.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.646484375, -0.62579345703125, -0.6051025390625, -0.58441162109375, -0.563720703125, -0.54302978515625, -0.5223388671875, -0.50164794921875, -0.48095703125, -0.46026611328125, -0.4395751953125, -0.41888427734375, -0.398193359375, -0.37750244140625, -0.3568115234375, -0.33612060546875, -0.3154296875, -0.29473876953125, -0.2740478515625, -0.25335693359375, -0.232666015625, -0.21197509765625, -0.1912841796875, -0.17059326171875, -0.14990234375, -0.12921142578125, -0.1085205078125, -0.08782958984375, -0.067138671875, -0.04644775390625, -0.0257568359375, -0.00506591796875, 0.015625, 0.03631591796875, 0.0570068359375, 0.07769775390625, 0.098388671875, 0.11907958984375, 0.1397705078125, 0.16046142578125, 0.18115234375, 0.20184326171875, 0.2225341796875, 0.24322509765625, 0.263916015625, 0.28460693359375, 0.3052978515625, 0.32598876953125, 0.3466796875, 0.36737060546875, 0.3880615234375, 0.40875244140625, 0.429443359375, 0.45013427734375, 0.4708251953125, 0.49151611328125, 0.51220703125, 0.53289794921875, 0.5535888671875, 0.57427978515625, 0.594970703125, 0.61566162109375, 0.6363525390625, 0.65704345703125, 0.677734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 48.0, 419.0, 447.0, 66.0, 14.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.79530715942383, -42.38101577758789, -40.96672821044922, -39.55243682861328, -38.138145446777344, -36.723854064941406, -35.309566497802734, -33.8952751159668, -32.480987548828125, -31.06669807434082, -29.652406692504883, -28.238117218017578, -26.82382583618164, -25.409536361694336, -23.99524688720703, -22.580955505371094, -21.166664123535156, -19.75237464904785, -18.338083267211914, -16.92379379272461, -15.509503364562988, -14.095212936401367, -12.680923461914062, -11.266633033752441, -9.85234260559082, -8.4380521774292, -7.023762226104736, -5.609472274780273, -4.195181846618652, -2.7808914184570312, -1.3666019439697266, 0.04768848419189453, 1.46197509765625, 2.876265287399292, 4.290555477142334, 5.704845428466797, 7.119135856628418, 8.533426284790039, 9.947715759277344, 11.362006187438965, 12.776296615600586, 14.190587043762207, 15.604877471923828, 17.019166946411133, 18.433456420898438, 19.847747802734375, 21.26203727722168, 22.676326751708984, 24.090618133544922, 25.504907608032227, 26.919198989868164, 28.33348846435547, 29.747779846191406, 31.16206932067871, 32.576358795166016, 33.99065017700195, 35.404937744140625, 36.81922912597656, 38.233516693115234, 39.64780807495117, 41.06209945678711, 42.47638702392578, 43.89067840576172, 45.304969787597656, 46.719261169433594]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 11.0, 10.0, 16.0, 15.0, 28.0, 29.0, 24.0, 40.0, 41.0, 33.0, 38.0, 40.0, 63.0, 43.0, 62.0, 54.0, 61.0, 44.0, 47.0, 47.0, 41.0, 36.0, 29.0, 27.0, 17.0, 16.0, 15.0, 12.0, 8.0, 8.0, 0.0, 2.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.20128345489502, -12.788833618164062, -12.376384735107422, -11.963934898376465, -11.551485061645508, -11.13903522491455, -10.726585388183594, -10.314136505126953, -9.901686668395996, -9.489236831665039, -9.076787948608398, -8.664338111877441, -8.251888275146484, -7.839438438415527, -7.4269890785217285, -7.01453971862793, -6.602089881896973, -6.189640045166016, -5.777190685272217, -5.364741325378418, -4.952291488647461, -4.539841651916504, -4.127392292022705, -3.714942693710327, -3.302493095397949, -2.8900434970855713, -2.4775938987731934, -2.0651443004608154, -1.6526947021484375, -1.2402451038360596, -0.8277955055236816, -0.4153459072113037, -0.0028972625732421875, 0.40955233573913574, 0.8220019340515137, 1.2344515323638916, 1.6469011306762695, 2.0593507289886475, 2.4718003273010254, 2.8842499256134033, 3.2966995239257812, 3.709149122238159, 4.121598720550537, 4.534048080444336, 4.946497917175293, 5.35894775390625, 5.771397113800049, 6.183846473693848, 6.596296310424805, 7.008746147155762, 7.4211955070495605, 7.833644866943359, 8.246094703674316, 8.658544540405273, 9.070993423461914, 9.483443260192871, 9.895893096923828, 10.308342933654785, 10.720792770385742, 11.133241653442383, 11.54569149017334, 11.958141326904297, 12.370590209960938, 12.783040046691895, 13.195489883422852]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 11.0, 11.0, 8.0, 20.0, 28.0, 54.0, 63.0, 132.0, 181.0, 342.0, 647.0, 1552.0, 6168.0, 56015.0, 4030286.0, 88696.0, 7306.0, 1631.0, 596.0, 246.0, 117.0, 44.0, 34.0, 23.0, 8.0, 13.0, 7.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.15399169921875, -5.9759521484375, -5.79791259765625, -5.619873046875, -5.44183349609375, -5.2637939453125, -5.08575439453125, -4.90771484375, -4.72967529296875, -4.5516357421875, -4.37359619140625, -4.195556640625, -4.01751708984375, -3.8394775390625, -3.66143798828125, -3.4833984375, -3.30535888671875, -3.1273193359375, -2.94927978515625, -2.771240234375, -2.59320068359375, -2.4151611328125, -2.23712158203125, -2.05908203125, -1.88104248046875, -1.7030029296875, -1.52496337890625, -1.346923828125, -1.16888427734375, -0.9908447265625, -0.81280517578125, -0.634765625, -0.45672607421875, -0.2786865234375, -0.10064697265625, 0.077392578125, 0.25543212890625, 0.4334716796875, 0.61151123046875, 0.78955078125, 0.96759033203125, 1.1456298828125, 1.32366943359375, 1.501708984375, 1.67974853515625, 1.8577880859375, 2.03582763671875, 2.2138671875, 2.39190673828125, 2.5699462890625, 2.74798583984375, 2.926025390625, 3.10406494140625, 3.2821044921875, 3.46014404296875, 3.63818359375, 3.81622314453125, 3.9942626953125, 4.17230224609375, 4.350341796875, 4.52838134765625, 4.7064208984375, 4.88446044921875, 5.0625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 12.0, 16.0, 32.0, 52.0, 40.0, 87.0, 107.0, 89.0, 90.0, 105.0, 85.0, 76.0, 69.0, 48.0, 32.0, 25.0, 13.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.3955078125, -1.3634490966796875, -1.331390380859375, -1.2993316650390625, -1.26727294921875, -1.2352142333984375, -1.203155517578125, -1.1710968017578125, -1.1390380859375, -1.1069793701171875, -1.074920654296875, -1.0428619384765625, -1.01080322265625, -0.9787445068359375, -0.946685791015625, -0.9146270751953125, -0.882568359375, -0.8505096435546875, -0.818450927734375, -0.7863922119140625, -0.75433349609375, -0.7222747802734375, -0.690216064453125, -0.6581573486328125, -0.6260986328125, -0.5940399169921875, -0.561981201171875, -0.5299224853515625, -0.49786376953125, -0.4658050537109375, -0.433746337890625, -0.4016876220703125, -0.36962890625, -0.3375701904296875, -0.305511474609375, -0.2734527587890625, -0.24139404296875, -0.2093353271484375, -0.177276611328125, -0.1452178955078125, -0.1131591796875, -0.0811004638671875, -0.049041748046875, -0.0169830322265625, 0.01507568359375, 0.0471343994140625, 0.079193115234375, 0.1112518310546875, 0.143310546875, 0.1753692626953125, 0.207427978515625, 0.2394866943359375, 0.27154541015625, 0.3036041259765625, 0.335662841796875, 0.3677215576171875, 0.3997802734375, 0.4318389892578125, 0.463897705078125, 0.4959564208984375, 0.52801513671875, 0.5600738525390625, 0.592132568359375, 0.6241912841796875, 0.65625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 15.0, 53.0, 125.0, 478.0, 6900.0, 4183738.0, 2437.0, 351.0, 133.0, 38.0, 13.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.651611328125, -18.03759765625, -17.423583984375, -16.8095703125, -16.195556640625, -15.58154296875, -14.967529296875, -14.353515625, -13.739501953125, -13.12548828125, -12.511474609375, -11.8974609375, -11.283447265625, -10.66943359375, -10.055419921875, -9.44140625, -8.827392578125, -8.21337890625, -7.599365234375, -6.9853515625, -6.371337890625, -5.75732421875, -5.143310546875, -4.529296875, -3.915283203125, -3.30126953125, -2.687255859375, -2.0732421875, -1.459228515625, -0.84521484375, -0.231201171875, 0.3828125, 0.996826171875, 1.61083984375, 2.224853515625, 2.8388671875, 3.452880859375, 4.06689453125, 4.680908203125, 5.294921875, 5.908935546875, 6.52294921875, 7.136962890625, 7.7509765625, 8.364990234375, 8.97900390625, 9.593017578125, 10.20703125, 10.821044921875, 11.43505859375, 12.049072265625, 12.6630859375, 13.277099609375, 13.89111328125, 14.505126953125, 15.119140625, 15.733154296875, 16.34716796875, 16.961181640625, 17.5751953125, 18.189208984375, 18.80322265625, 19.417236328125, 20.03125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 46.0, 214.0, 3263.0, 464.0, 53.0, 20.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.08203125, -2.99322509765625, -2.9044189453125, -2.81561279296875, -2.726806640625, -2.63800048828125, -2.5491943359375, -2.46038818359375, -2.37158203125, -2.28277587890625, -2.1939697265625, -2.10516357421875, -2.016357421875, -1.92755126953125, -1.8387451171875, -1.74993896484375, -1.6611328125, -1.57232666015625, -1.4835205078125, -1.39471435546875, -1.305908203125, -1.21710205078125, -1.1282958984375, -1.03948974609375, -0.95068359375, -0.86187744140625, -0.7730712890625, -0.68426513671875, -0.595458984375, -0.50665283203125, -0.4178466796875, -0.32904052734375, -0.240234375, -0.15142822265625, -0.0626220703125, 0.02618408203125, 0.114990234375, 0.20379638671875, 0.2926025390625, 0.38140869140625, 0.47021484375, 0.55902099609375, 0.6478271484375, 0.73663330078125, 0.825439453125, 0.91424560546875, 1.0030517578125, 1.09185791015625, 1.1806640625, 1.26947021484375, 1.3582763671875, 1.44708251953125, 1.535888671875, 1.62469482421875, 1.7135009765625, 1.80230712890625, 1.89111328125, 1.97991943359375, 2.0687255859375, 2.15753173828125, 2.246337890625, 2.33514404296875, 2.4239501953125, 2.51275634765625, 2.6015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 40.0, 948.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.586273193359375, -58.275943756103516, -56.965614318847656, -55.6552848815918, -54.34495544433594, -53.03462600708008, -51.72429656982422, -50.413970947265625, -49.1036376953125, -47.79330825805664, -46.48297882080078, -45.17264938354492, -43.86231994628906, -42.5519905090332, -41.241661071777344, -39.93133544921875, -38.62100601196289, -37.31067657470703, -36.00034713745117, -34.69001770019531, -33.37968826293945, -32.069358825683594, -30.759031295776367, -29.448701858520508, -28.13837242126465, -26.82804298400879, -25.51771354675293, -24.20738410949707, -22.897056579589844, -21.586727142333984, -20.276397705078125, -18.966068267822266, -17.655742645263672, -16.345413208007812, -15.035083770751953, -13.72475528717041, -12.41442584991455, -11.104096412658691, -9.793767929077148, -8.483438491821289, -7.17310905456543, -5.86277961730957, -4.552450656890869, -3.242121458053589, -1.9317922592163086, -0.6214628219604492, 0.688866138458252, 1.9991950988769531, 3.3095245361328125, 4.619853973388672, 5.930182933807373, 7.240511894226074, 8.550841331481934, 9.861170768737793, 11.171499252319336, 12.481828689575195, 13.792158126831055, 15.102487564086914, 16.412817001342773, 17.723146438598633, 19.03347396850586, 20.34380340576172, 21.654132843017578, 22.964462280273438, 24.274791717529297]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 14.0, 24.0, 18.0, 36.0, 30.0, 58.0, 43.0, 71.0, 75.0, 75.0, 81.0, 63.0, 77.0, 71.0, 54.0, 58.0, 41.0, 31.0, 23.0, 15.0, 5.0, 4.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.693879127502441, -4.563742637634277, -4.433605670928955, -4.303469181060791, -4.173332214355469, -4.043195724487305, -3.9130592346191406, -3.7829225063323975, -3.6527857780456543, -3.522649049758911, -3.392512321472168, -3.262375831604004, -3.1322391033172607, -3.0021023750305176, -2.8719658851623535, -2.7418291568756104, -2.611692428588867, -2.481555700302124, -2.351418972015381, -2.221282482147217, -2.0911457538604736, -1.9610090255737305, -1.8308724164962769, -1.7007358074188232, -1.57059907913208, -1.440462350845337, -1.3103257417678833, -1.1801891326904297, -1.0500524044036865, -0.9199157357215881, -0.7897790670394897, -0.6596423983573914, -0.5295052528381348, -0.3993685841560364, -0.269231915473938, -0.1390952467918396, -0.008958578109741211, 0.12117809057235718, 0.25131475925445557, 0.38145142793655396, 0.5115880966186523, 0.6417247653007507, 0.7718614339828491, 0.9019981026649475, 1.032134771347046, 1.162271499633789, 1.2924081087112427, 1.4225447177886963, 1.5526814460754395, 1.6828181743621826, 1.8129547834396362, 1.9430913925170898, 2.073228120803833, 2.203364849090576, 2.3335013389587402, 2.4636380672454834, 2.5937747955322266, 2.7239115238189697, 2.854048252105713, 2.984184741973877, 3.11432147026062, 3.2444581985473633, 3.3745946884155273, 3.5047314167022705, 3.6348681449890137]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 16.0, 14.0, 23.0, 43.0, 50.0, 72.0, 118.0, 179.0, 355.0, 659.0, 1521.0, 4683.0, 26590.0, 297056.0, 643384.0, 61152.0, 8432.0, 2241.0, 897.0, 420.0, 201.0, 151.0, 91.0, 52.0, 34.0, 31.0, 19.0, 16.0, 9.0, 5.0, 7.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.13671875, -4.025482177734375, -3.91424560546875, -3.803009033203125, -3.6917724609375, -3.580535888671875, -3.46929931640625, -3.358062744140625, -3.246826171875, -3.135589599609375, -3.02435302734375, -2.913116455078125, -2.8018798828125, -2.690643310546875, -2.57940673828125, -2.468170166015625, -2.35693359375, -2.245697021484375, -2.13446044921875, -2.023223876953125, -1.9119873046875, -1.800750732421875, -1.68951416015625, -1.578277587890625, -1.467041015625, -1.355804443359375, -1.24456787109375, -1.133331298828125, -1.0220947265625, -0.910858154296875, -0.79962158203125, -0.688385009765625, -0.5771484375, -0.465911865234375, -0.35467529296875, -0.243438720703125, -0.1322021484375, -0.020965576171875, 0.09027099609375, 0.201507568359375, 0.312744140625, 0.423980712890625, 0.53521728515625, 0.646453857421875, 0.7576904296875, 0.868927001953125, 0.98016357421875, 1.091400146484375, 1.20263671875, 1.313873291015625, 1.42510986328125, 1.536346435546875, 1.6475830078125, 1.758819580078125, 1.87005615234375, 1.981292724609375, 2.092529296875, 2.203765869140625, 2.31500244140625, 2.426239013671875, 2.5374755859375, 2.648712158203125, 2.75994873046875, 2.871185302734375, 2.982421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 23.0, 17.0, 46.0, 51.0, 67.0, 55.0, 84.0, 95.0, 105.0, 87.0, 76.0, 83.0, 48.0, 42.0, 41.0, 25.0, 19.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.224609375, -1.1949844360351562, -1.1653594970703125, -1.1357345581054688, -1.106109619140625, -1.0764846801757812, -1.0468597412109375, -1.0172348022460938, -0.98760986328125, -0.9579849243164062, -0.9283599853515625, -0.8987350463867188, -0.869110107421875, -0.8394851684570312, -0.8098602294921875, -0.7802352905273438, -0.7506103515625, -0.7209854125976562, -0.6913604736328125, -0.6617355346679688, -0.632110595703125, -0.6024856567382812, -0.5728607177734375, -0.5432357788085938, -0.51361083984375, -0.48398590087890625, -0.4543609619140625, -0.42473602294921875, -0.395111083984375, -0.36548614501953125, -0.3358612060546875, -0.30623626708984375, -0.276611328125, -0.24698638916015625, -0.2173614501953125, -0.18773651123046875, -0.158111572265625, -0.12848663330078125, -0.0988616943359375, -0.06923675537109375, -0.03961181640625, -0.00998687744140625, 0.0196380615234375, 0.04926300048828125, 0.078887939453125, 0.10851287841796875, 0.1381378173828125, 0.16776275634765625, 0.1973876953125, 0.22701263427734375, 0.2566375732421875, 0.28626251220703125, 0.315887451171875, 0.34551239013671875, 0.3751373291015625, 0.40476226806640625, 0.43438720703125, 0.46401214599609375, 0.4936370849609375, 0.5232620239257812, 0.552886962890625, 0.5825119018554688, 0.6121368408203125, 0.6417617797851562, 0.67138671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 10.0, 16.0, 25.0, 51.0, 65.0, 122.0, 241.0, 783.0, 3119.0, 35558.0, 894609.0, 106496.0, 5637.0, 1089.0, 364.0, 134.0, 71.0, 51.0, 26.0, 18.0, 18.0, 9.0, 6.0, 6.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.4375, -6.27093505859375, -6.1043701171875, -5.93780517578125, -5.771240234375, -5.60467529296875, -5.4381103515625, -5.27154541015625, -5.10498046875, -4.93841552734375, -4.7718505859375, -4.60528564453125, -4.438720703125, -4.27215576171875, -4.1055908203125, -3.93902587890625, -3.7724609375, -3.60589599609375, -3.4393310546875, -3.27276611328125, -3.106201171875, -2.93963623046875, -2.7730712890625, -2.60650634765625, -2.43994140625, -2.27337646484375, -2.1068115234375, -1.94024658203125, -1.773681640625, -1.60711669921875, -1.4405517578125, -1.27398681640625, -1.107421875, -0.94085693359375, -0.7742919921875, -0.60772705078125, -0.441162109375, -0.27459716796875, -0.1080322265625, 0.05853271484375, 0.22509765625, 0.39166259765625, 0.5582275390625, 0.72479248046875, 0.891357421875, 1.05792236328125, 1.2244873046875, 1.39105224609375, 1.5576171875, 1.72418212890625, 1.8907470703125, 2.05731201171875, 2.223876953125, 2.39044189453125, 2.5570068359375, 2.72357177734375, 2.89013671875, 3.05670166015625, 3.2232666015625, 3.38983154296875, 3.556396484375, 3.72296142578125, 3.8895263671875, 4.05609130859375, 4.22265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 10.0, 3.0, 7.0, 7.0, 11.0, 18.0, 31.0, 39.0, 46.0, 44.0, 63.0, 90.0, 96.0, 81.0, 69.0, 83.0, 86.0, 51.0, 49.0, 27.0, 24.0, 15.0, 19.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.85546875, -4.72930908203125, -4.6031494140625, -4.47698974609375, -4.350830078125, -4.22467041015625, -4.0985107421875, -3.97235107421875, -3.84619140625, -3.72003173828125, -3.5938720703125, -3.46771240234375, -3.341552734375, -3.21539306640625, -3.0892333984375, -2.96307373046875, -2.8369140625, -2.71075439453125, -2.5845947265625, -2.45843505859375, -2.332275390625, -2.20611572265625, -2.0799560546875, -1.95379638671875, -1.82763671875, -1.70147705078125, -1.5753173828125, -1.44915771484375, -1.322998046875, -1.19683837890625, -1.0706787109375, -0.94451904296875, -0.818359375, -0.69219970703125, -0.5660400390625, -0.43988037109375, -0.313720703125, -0.18756103515625, -0.0614013671875, 0.06475830078125, 0.19091796875, 0.31707763671875, 0.4432373046875, 0.56939697265625, 0.695556640625, 0.82171630859375, 0.9478759765625, 1.07403564453125, 1.2001953125, 1.32635498046875, 1.4525146484375, 1.57867431640625, 1.704833984375, 1.83099365234375, 1.9571533203125, 2.08331298828125, 2.20947265625, 2.33563232421875, 2.4617919921875, 2.58795166015625, 2.714111328125, 2.84027099609375, 2.9664306640625, 3.09259033203125, 3.21875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 6.0, 15.0, 17.0, 34.0, 46.0, 67.0, 129.0, 222.0, 374.0, 808.0, 1716.0, 4650.0, 17660.0, 113284.0, 688008.0, 186710.0, 24740.0, 6069.0, 2089.0, 867.0, 443.0, 223.0, 136.0, 76.0, 46.0, 40.0, 16.0, 16.0, 8.0, 8.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7789230346679688, -0.7516937255859375, -0.7244644165039062, -0.697235107421875, -0.6700057983398438, -0.6427764892578125, -0.6155471801757812, -0.58831787109375, -0.5610885620117188, -0.5338592529296875, -0.5066299438476562, -0.479400634765625, -0.45217132568359375, -0.4249420166015625, -0.39771270751953125, -0.3704833984375, -0.34325408935546875, -0.3160247802734375, -0.28879547119140625, -0.261566162109375, -0.23433685302734375, -0.2071075439453125, -0.17987823486328125, -0.15264892578125, -0.12541961669921875, -0.0981903076171875, -0.07096099853515625, -0.043731689453125, -0.01650238037109375, 0.0107269287109375, 0.03795623779296875, 0.065185546875, 0.09241485595703125, 0.1196441650390625, 0.14687347412109375, 0.174102783203125, 0.20133209228515625, 0.2285614013671875, 0.25579071044921875, 0.28302001953125, 0.31024932861328125, 0.3374786376953125, 0.36470794677734375, 0.391937255859375, 0.41916656494140625, 0.4463958740234375, 0.47362518310546875, 0.5008544921875, 0.5280838012695312, 0.5553131103515625, 0.5825424194335938, 0.609771728515625, 0.6370010375976562, 0.6642303466796875, 0.6914596557617188, 0.71868896484375, 0.7459182739257812, 0.7731475830078125, 0.8003768920898438, 0.827606201171875, 0.8548355102539062, 0.8820648193359375, 0.9092941284179688, 0.9365234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 14.0, 10.0, 13.0, 29.0, 49.0, 51.0, 100.0, 121.0, 142.0, 135.0, 102.0, 65.0, 54.0, 35.0, 17.0, 7.0, 9.0, 5.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0002319812774658203, -0.00022643059492111206, -0.0002208799123764038, -0.00021532922983169556, -0.0002097785472869873, -0.00020422786474227905, -0.0001986771821975708, -0.00019312649965286255, -0.0001875758171081543, -0.00018202513456344604, -0.0001764744520187378, -0.00017092376947402954, -0.0001653730869293213, -0.00015982240438461304, -0.00015427172183990479, -0.00014872103929519653, -0.00014317035675048828, -0.00013761967420578003, -0.00013206899166107178, -0.00012651830911636353, -0.00012096762657165527, -0.00011541694402694702, -0.00010986626148223877, -0.00010431557893753052, -9.876489639282227e-05, -9.321421384811401e-05, -8.766353130340576e-05, -8.211284875869751e-05, -7.656216621398926e-05, -7.1011483669281e-05, -6.546080112457275e-05, -5.99101185798645e-05, -5.435943603515625e-05, -4.8808753490448e-05, -4.3258070945739746e-05, -3.7707388401031494e-05, -3.215670585632324e-05, -2.660602331161499e-05, -2.1055340766906738e-05, -1.5504658222198486e-05, -9.953975677490234e-06, -4.403293132781982e-06, 1.1473894119262695e-06, 6.6980719566345215e-06, 1.2248754501342773e-05, 1.7799437046051025e-05, 2.3350119590759277e-05, 2.890080213546753e-05, 3.445148468017578e-05, 4.000216722488403e-05, 4.5552849769592285e-05, 5.110353231430054e-05, 5.665421485900879e-05, 6.220489740371704e-05, 6.775557994842529e-05, 7.330626249313354e-05, 7.88569450378418e-05, 8.440762758255005e-05, 8.99583101272583e-05, 9.550899267196655e-05, 0.0001010596752166748, 0.00010661035776138306, 0.00011216104030609131, 0.00011771172285079956, 0.0001232624053955078]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 11.0, 9.0, 14.0, 16.0, 31.0, 44.0, 89.0, 178.0, 408.0, 941.0, 2321.0, 8719.0, 48029.0, 480228.0, 450407.0, 44653.0, 8417.0, 2345.0, 855.0, 370.0, 185.0, 97.0, 54.0, 35.0, 22.0, 15.0, 3.0, 10.0, 7.0, 7.0, 1.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.94287109375, -0.91339111328125, -0.8839111328125, -0.85443115234375, -0.824951171875, -0.79547119140625, -0.7659912109375, -0.73651123046875, -0.70703125, -0.67755126953125, -0.6480712890625, -0.61859130859375, -0.589111328125, -0.55963134765625, -0.5301513671875, -0.50067138671875, -0.47119140625, -0.44171142578125, -0.4122314453125, -0.38275146484375, -0.353271484375, -0.32379150390625, -0.2943115234375, -0.26483154296875, -0.2353515625, -0.20587158203125, -0.1763916015625, -0.14691162109375, -0.117431640625, -0.08795166015625, -0.0584716796875, -0.02899169921875, 0.00048828125, 0.02996826171875, 0.0594482421875, 0.08892822265625, 0.118408203125, 0.14788818359375, 0.1773681640625, 0.20684814453125, 0.236328125, 0.26580810546875, 0.2952880859375, 0.32476806640625, 0.354248046875, 0.38372802734375, 0.4132080078125, 0.44268798828125, 0.47216796875, 0.50164794921875, 0.5311279296875, 0.56060791015625, 0.590087890625, 0.61956787109375, 0.6490478515625, 0.67852783203125, 0.7080078125, 0.73748779296875, 0.7669677734375, 0.79644775390625, 0.825927734375, 0.85540771484375, 0.8848876953125, 0.91436767578125, 0.94384765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 10.0, 13.0, 23.0, 29.0, 41.0, 61.0, 88.0, 110.0, 129.0, 151.0, 87.0, 70.0, 63.0, 35.0, 22.0, 21.0, 10.0, 9.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78662109375, -0.7618637084960938, -0.7371063232421875, -0.7123489379882812, -0.687591552734375, -0.6628341674804688, -0.6380767822265625, -0.6133193969726562, -0.58856201171875, -0.5638046264648438, -0.5390472412109375, -0.5142898559570312, -0.489532470703125, -0.46477508544921875, -0.4400177001953125, -0.41526031494140625, -0.3905029296875, -0.36574554443359375, -0.3409881591796875, -0.31623077392578125, -0.291473388671875, -0.26671600341796875, -0.2419586181640625, -0.21720123291015625, -0.19244384765625, -0.16768646240234375, -0.1429290771484375, -0.11817169189453125, -0.093414306640625, -0.06865692138671875, -0.0438995361328125, -0.01914215087890625, 0.005615234375, 0.03037261962890625, 0.0551300048828125, 0.07988739013671875, 0.104644775390625, 0.12940216064453125, 0.1541595458984375, 0.17891693115234375, 0.20367431640625, 0.22843170166015625, 0.2531890869140625, 0.27794647216796875, 0.302703857421875, 0.32746124267578125, 0.3522186279296875, 0.37697601318359375, 0.4017333984375, 0.42649078369140625, 0.4512481689453125, 0.47600555419921875, 0.500762939453125, 0.5255203247070312, 0.5502777099609375, 0.5750350952148438, 0.59979248046875, 0.6245498657226562, 0.6493072509765625, 0.6740646362304688, 0.698822021484375, 0.7235794067382812, 0.7483367919921875, 0.7730941772460938, 0.7978515625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 26.0, 205.0, 619.0, 128.0, 24.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.25709533691406, -90.52912902832031, -88.80116271972656, -87.07319641113281, -85.34523010253906, -83.61726379394531, -81.88929748535156, -80.16133880615234, -78.4333724975586, -76.70540618896484, -74.9774398803711, -73.24947357177734, -71.5215072631836, -69.79354858398438, -68.06558227539062, -66.33761596679688, -64.60964965820312, -62.881683349609375, -61.153717041015625, -59.425750732421875, -57.69778823852539, -55.96982192993164, -54.24185562133789, -52.51388931274414, -50.785919189453125, -49.057952880859375, -47.329986572265625, -45.602020263671875, -43.87405776977539, -42.14609146118164, -40.41812515258789, -38.69015884399414, -36.96219253540039, -35.23422622680664, -33.50625991821289, -31.778295516967773, -30.050331115722656, -28.322364807128906, -26.594398498535156, -24.866432189941406, -23.13846778869629, -21.41050148010254, -19.682537078857422, -17.954570770263672, -16.226604461669922, -14.498640060424805, -12.770673751831055, -11.042708396911621, -9.314743041992188, -7.586777687072754, -5.858811855316162, -4.13084602355957, -2.4028806686401367, -0.6749153137207031, 1.0530509948730469, 2.7810163497924805, 4.508981704711914, 6.236947059631348, 7.9649128913879395, 9.692878723144531, 11.420844078063965, 13.148809432983398, 14.876775741577148, 16.604740142822266, 18.332706451416016]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 1.0, 10.0, 10.0, 16.0, 26.0, 25.0, 24.0, 27.0, 31.0, 36.0, 46.0, 59.0, 44.0, 47.0, 50.0, 49.0, 52.0, 45.0, 37.0, 45.0, 34.0, 36.0, 33.0, 40.0, 30.0, 29.0, 22.0, 19.0, 14.0, 8.0, 8.0, 10.0, 5.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.424535751342773, -15.943592071533203, -15.462648391723633, -14.981704711914062, -14.500761032104492, -14.019817352294922, -13.538874626159668, -13.057930946350098, -12.576987266540527, -12.096043586730957, -11.615099906921387, -11.134156227111816, -10.653213500976562, -10.172269821166992, -9.691326141357422, -9.210382461547852, -8.729438781738281, -8.248495101928711, -7.767551422119141, -7.2866082191467285, -6.805664539337158, -6.324720859527588, -5.843777656555176, -5.3628339767456055, -4.881890296936035, -4.400946617126465, -3.9200031757354736, -3.4390597343444824, -2.958116054534912, -2.477172374725342, -1.9962289333343506, -1.5152854919433594, -1.0343427658081055, -0.5533992052078247, -0.07245564460754395, 0.4084879159927368, 0.8894314765930176, 1.370375156402588, 1.851318597793579, 2.3322620391845703, 2.8132057189941406, 3.294149398803711, 3.775092840194702, 4.256036281585693, 4.736979961395264, 5.217923641204834, 5.698866844177246, 6.179810523986816, 6.660754203796387, 7.141697883605957, 7.622641563415527, 8.103585243225098, 8.584527969360352, 9.065471649169922, 9.546415328979492, 10.027359008789062, 10.508302688598633, 10.989246368408203, 11.470190048217773, 11.951133728027344, 12.432077407836914, 12.913021087646484, 13.393963813781738, 13.874907493591309, 14.355851173400879]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 16.0, 7.0, 14.0, 8.0, 13.0, 28.0, 46.0, 53.0, 60.0, 125.0, 204.0, 312.0, 674.0, 1212.0, 3293.0, 10912.0, 70392.0, 3836395.0, 240988.0, 21253.0, 4988.0, 1650.0, 749.0, 356.0, 215.0, 95.0, 77.0, 49.0, 34.0, 13.0, 10.0, 12.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.19140625, -6.03546142578125, -5.8795166015625, -5.72357177734375, -5.567626953125, -5.41168212890625, -5.2557373046875, -5.09979248046875, -4.94384765625, -4.78790283203125, -4.6319580078125, -4.47601318359375, -4.320068359375, -4.16412353515625, -4.0081787109375, -3.85223388671875, -3.6962890625, -3.54034423828125, -3.3843994140625, -3.22845458984375, -3.072509765625, -2.91656494140625, -2.7606201171875, -2.60467529296875, -2.44873046875, -2.29278564453125, -2.1368408203125, -1.98089599609375, -1.824951171875, -1.66900634765625, -1.5130615234375, -1.35711669921875, -1.201171875, -1.04522705078125, -0.8892822265625, -0.73333740234375, -0.577392578125, -0.42144775390625, -0.2655029296875, -0.10955810546875, 0.04638671875, 0.20233154296875, 0.3582763671875, 0.51422119140625, 0.670166015625, 0.82611083984375, 0.9820556640625, 1.13800048828125, 1.2939453125, 1.44989013671875, 1.6058349609375, 1.76177978515625, 1.917724609375, 2.07366943359375, 2.2296142578125, 2.38555908203125, 2.54150390625, 2.69744873046875, 2.8533935546875, 3.00933837890625, 3.165283203125, 3.32122802734375, 3.4771728515625, 3.63311767578125, 3.7890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 6.0, 10.0, 26.0, 32.0, 39.0, 43.0, 52.0, 89.0, 80.0, 85.0, 81.0, 82.0, 88.0, 65.0, 60.0, 43.0, 35.0, 20.0, 18.0, 12.0, 12.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2265625, -1.1968536376953125, -1.167144775390625, -1.1374359130859375, -1.10772705078125, -1.0780181884765625, -1.048309326171875, -1.0186004638671875, -0.9888916015625, -0.9591827392578125, -0.929473876953125, -0.8997650146484375, -0.87005615234375, -0.8403472900390625, -0.810638427734375, -0.7809295654296875, -0.751220703125, -0.7215118408203125, -0.691802978515625, -0.6620941162109375, -0.63238525390625, -0.6026763916015625, -0.572967529296875, -0.5432586669921875, -0.5135498046875, -0.4838409423828125, -0.454132080078125, -0.4244232177734375, -0.39471435546875, -0.3650054931640625, -0.335296630859375, -0.3055877685546875, -0.27587890625, -0.2461700439453125, -0.216461181640625, -0.1867523193359375, -0.15704345703125, -0.1273345947265625, -0.097625732421875, -0.0679168701171875, -0.0382080078125, -0.0084991455078125, 0.021209716796875, 0.0509185791015625, 0.08062744140625, 0.1103363037109375, 0.140045166015625, 0.1697540283203125, 0.199462890625, 0.2291717529296875, 0.258880615234375, 0.2885894775390625, 0.31829833984375, 0.3480072021484375, 0.377716064453125, 0.4074249267578125, 0.4371337890625, 0.4668426513671875, 0.496551513671875, 0.5262603759765625, 0.55596923828125, 0.5856781005859375, 0.615386962890625, 0.6450958251953125, 0.6748046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 14.0, 18.0, 32.0, 60.0, 107.0, 233.0, 677.0, 2732.0, 27643.0, 4137535.0, 22249.0, 2191.0, 471.0, 137.0, 74.0, 41.0, 28.0, 11.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.546875, -12.2120361328125, -11.877197265625, -11.5423583984375, -11.20751953125, -10.8726806640625, -10.537841796875, -10.2030029296875, -9.8681640625, -9.5333251953125, -9.198486328125, -8.8636474609375, -8.52880859375, -8.1939697265625, -7.859130859375, -7.5242919921875, -7.189453125, -6.8546142578125, -6.519775390625, -6.1849365234375, -5.85009765625, -5.5152587890625, -5.180419921875, -4.8455810546875, -4.5107421875, -4.1759033203125, -3.841064453125, -3.5062255859375, -3.17138671875, -2.8365478515625, -2.501708984375, -2.1668701171875, -1.83203125, -1.4971923828125, -1.162353515625, -0.8275146484375, -0.49267578125, -0.1578369140625, 0.177001953125, 0.5118408203125, 0.8466796875, 1.1815185546875, 1.516357421875, 1.8511962890625, 2.18603515625, 2.5208740234375, 2.855712890625, 3.1905517578125, 3.525390625, 3.8602294921875, 4.195068359375, 4.5299072265625, 4.86474609375, 5.1995849609375, 5.534423828125, 5.8692626953125, 6.2041015625, 6.5389404296875, 6.873779296875, 7.2086181640625, 7.54345703125, 7.8782958984375, 8.213134765625, 8.5479736328125, 8.8828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 6.0, 2.0, 6.0, 5.0, 8.0, 16.0, 39.0, 93.0, 303.0, 2730.0, 614.0, 149.0, 53.0, 14.0, 14.0, 9.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.0652618408203125, -3.974273681640625, -3.8832855224609375, -3.79229736328125, -3.7013092041015625, -3.610321044921875, -3.5193328857421875, -3.4283447265625, -3.3373565673828125, -3.246368408203125, -3.1553802490234375, -3.06439208984375, -2.9734039306640625, -2.882415771484375, -2.7914276123046875, -2.700439453125, -2.6094512939453125, -2.518463134765625, -2.4274749755859375, -2.33648681640625, -2.2454986572265625, -2.154510498046875, -2.0635223388671875, -1.9725341796875, -1.8815460205078125, -1.790557861328125, -1.6995697021484375, -1.60858154296875, -1.5175933837890625, -1.426605224609375, -1.3356170654296875, -1.24462890625, -1.1536407470703125, -1.062652587890625, -0.9716644287109375, -0.88067626953125, -0.7896881103515625, -0.698699951171875, -0.6077117919921875, -0.5167236328125, -0.4257354736328125, -0.334747314453125, -0.2437591552734375, -0.15277099609375, -0.0617828369140625, 0.029205322265625, 0.1201934814453125, 0.211181640625, 0.3021697998046875, 0.393157958984375, 0.4841461181640625, 0.57513427734375, 0.6661224365234375, 0.757110595703125, 0.8480987548828125, 0.9390869140625, 1.0300750732421875, 1.121063232421875, 1.2120513916015625, 1.30303955078125, 1.3940277099609375, 1.485015869140625, 1.5760040283203125, 1.6669921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 64.0, 327.0, 476.0, 99.0, 24.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.391414642333984, -30.68013572692871, -29.968856811523438, -29.257577896118164, -28.54629898071289, -27.835020065307617, -27.123741149902344, -26.41246223449707, -25.701183319091797, -24.989904403686523, -24.27862548828125, -23.567346572875977, -22.856067657470703, -22.14478874206543, -21.433509826660156, -20.722230911254883, -20.01095199584961, -19.299673080444336, -18.588394165039062, -17.87711524963379, -17.165836334228516, -16.454557418823242, -15.743278503417969, -15.031999588012695, -14.320720672607422, -13.609441757202148, -12.898162841796875, -12.186883926391602, -11.475605010986328, -10.764326095581055, -10.053047180175781, -9.341768264770508, -8.63049030303955, -7.919211387634277, -7.207932472229004, -6.4966535568237305, -5.785374641418457, -5.074095726013184, -4.36281681060791, -3.6515378952026367, -2.9402589797973633, -2.22898006439209, -1.5177011489868164, -0.806422233581543, -0.09514331817626953, 0.6161355972290039, 1.3274145126342773, 2.038693428039551, 2.749972343444824, 3.4612512588500977, 4.172530174255371, 4.8838090896606445, 5.595088005065918, 6.306366920471191, 7.017645835876465, 7.728924751281738, 8.440203666687012, 9.151482582092285, 9.862761497497559, 10.574040412902832, 11.285319328308105, 11.996598243713379, 12.707877159118652, 13.419156074523926, 14.1304349899292]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 23.0, 28.0, 62.0, 80.0, 116.0, 109.0, 112.0, 130.0, 112.0, 80.0, 52.0, 29.0, 30.0, 10.0, 7.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.645078659057617, -11.257071495056152, -10.869063377380371, -10.481056213378906, -10.093048095703125, -9.70504093170166, -9.317033767700195, -8.929025650024414, -8.541017532348633, -8.153010368347168, -7.765002250671387, -7.376995086669922, -6.988986968994141, -6.600979804992676, -6.212972164154053, -5.82496452331543, -5.436957359313965, -5.048949718475342, -4.660942077636719, -4.272934913635254, -3.8849270343780518, -3.4969193935394287, -3.1089119911193848, -2.7209043502807617, -2.3328967094421387, -1.9448890686035156, -1.5568815469741821, -1.1688740253448486, -0.7808663845062256, -0.39285874366760254, -0.004851341247558594, 0.38315629959106445, 0.7711639404296875, 1.1591715812683105, 1.547179102897644, 1.9351866245269775, 2.3231942653656006, 2.7112019062042236, 3.0992093086242676, 3.4872169494628906, 3.8752245903015137, 4.263232231140137, 4.65123987197876, 5.039247512817383, 5.427254676818848, 5.815262794494629, 6.203269958496094, 6.591277599334717, 6.97928524017334, 7.367292881011963, 7.755300521850586, 8.14330768585205, 8.531315803527832, 8.919322967529297, 9.307331085205078, 9.695338249206543, 10.083345413208008, 10.471352577209473, 10.859360694885254, 11.247367858886719, 11.6353759765625, 12.023383140563965, 12.41139030456543, 12.799398422241211, 13.187406539916992]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 15.0, 20.0, 17.0, 20.0, 46.0, 59.0, 91.0, 130.0, 222.0, 383.0, 744.0, 1806.0, 6341.0, 42496.0, 434925.0, 500157.0, 50044.0, 7157.0, 2010.0, 789.0, 391.0, 239.0, 138.0, 108.0, 55.0, 38.0, 26.0, 16.0, 21.0, 6.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.35546875, -4.243896484375, -4.13232421875, -4.020751953125, -3.9091796875, -3.797607421875, -3.68603515625, -3.574462890625, -3.462890625, -3.351318359375, -3.23974609375, -3.128173828125, -3.0166015625, -2.905029296875, -2.79345703125, -2.681884765625, -2.5703125, -2.458740234375, -2.34716796875, -2.235595703125, -2.1240234375, -2.012451171875, -1.90087890625, -1.789306640625, -1.677734375, -1.566162109375, -1.45458984375, -1.343017578125, -1.2314453125, -1.119873046875, -1.00830078125, -0.896728515625, -0.78515625, -0.673583984375, -0.56201171875, -0.450439453125, -0.3388671875, -0.227294921875, -0.11572265625, -0.004150390625, 0.107421875, 0.218994140625, 0.33056640625, 0.442138671875, 0.5537109375, 0.665283203125, 0.77685546875, 0.888427734375, 1.0, 1.111572265625, 1.22314453125, 1.334716796875, 1.4462890625, 1.557861328125, 1.66943359375, 1.781005859375, 1.892578125, 2.004150390625, 2.11572265625, 2.227294921875, 2.3388671875, 2.450439453125, 2.56201171875, 2.673583984375, 2.78515625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 14.0, 26.0, 54.0, 94.0, 94.0, 134.0, 133.0, 127.0, 117.0, 81.0, 44.0, 34.0, 17.0, 11.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.8662567138671875, -1.822357177734375, -1.7784576416015625, -1.73455810546875, -1.6906585693359375, -1.646759033203125, -1.6028594970703125, -1.5589599609375, -1.5150604248046875, -1.471160888671875, -1.4272613525390625, -1.38336181640625, -1.3394622802734375, -1.295562744140625, -1.2516632080078125, -1.207763671875, -1.1638641357421875, -1.119964599609375, -1.0760650634765625, -1.03216552734375, -0.9882659912109375, -0.944366455078125, -0.9004669189453125, -0.8565673828125, -0.8126678466796875, -0.768768310546875, -0.7248687744140625, -0.68096923828125, -0.6370697021484375, -0.593170166015625, -0.5492706298828125, -0.50537109375, -0.4614715576171875, -0.417572021484375, -0.3736724853515625, -0.32977294921875, -0.2858734130859375, -0.241973876953125, -0.1980743408203125, -0.1541748046875, -0.1102752685546875, -0.066375732421875, -0.0224761962890625, 0.02142333984375, 0.0653228759765625, 0.109222412109375, 0.1531219482421875, 0.197021484375, 0.2409210205078125, 0.284820556640625, 0.3287200927734375, 0.37261962890625, 0.4165191650390625, 0.460418701171875, 0.5043182373046875, 0.5482177734375, 0.5921173095703125, 0.636016845703125, 0.6799163818359375, 0.72381591796875, 0.7677154541015625, 0.811614990234375, 0.8555145263671875, 0.8994140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 5.0, 7.0, 13.0, 25.0, 20.0, 43.0, 58.0, 107.0, 129.0, 190.0, 320.0, 602.0, 1357.0, 3897.0, 13943.0, 59027.0, 274863.0, 507997.0, 142187.0, 31472.0, 7882.0, 2353.0, 881.0, 456.0, 229.0, 133.0, 99.0, 78.0, 60.0, 34.0, 32.0, 18.0, 10.0, 8.0, 8.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9228515625, -1.8667755126953125, -1.810699462890625, -1.7546234130859375, -1.69854736328125, -1.6424713134765625, -1.586395263671875, -1.5303192138671875, -1.4742431640625, -1.4181671142578125, -1.362091064453125, -1.3060150146484375, -1.24993896484375, -1.1938629150390625, -1.137786865234375, -1.0817108154296875, -1.025634765625, -0.9695587158203125, -0.913482666015625, -0.8574066162109375, -0.80133056640625, -0.7452545166015625, -0.689178466796875, -0.6331024169921875, -0.5770263671875, -0.5209503173828125, -0.464874267578125, -0.4087982177734375, -0.35272216796875, -0.2966461181640625, -0.240570068359375, -0.1844940185546875, -0.12841796875, -0.0723419189453125, -0.016265869140625, 0.0398101806640625, 0.09588623046875, 0.1519622802734375, 0.208038330078125, 0.2641143798828125, 0.3201904296875, 0.3762664794921875, 0.432342529296875, 0.4884185791015625, 0.54449462890625, 0.6005706787109375, 0.656646728515625, 0.7127227783203125, 0.768798828125, 0.8248748779296875, 0.880950927734375, 0.9370269775390625, 0.99310302734375, 1.0491790771484375, 1.105255126953125, 1.1613311767578125, 1.2174072265625, 1.2734832763671875, 1.329559326171875, 1.3856353759765625, 1.44171142578125, 1.4977874755859375, 1.553863525390625, 1.6099395751953125, 1.666015625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 15.0, 4.0, 8.0, 12.0, 17.0, 20.0, 27.0, 27.0, 30.0, 47.0, 46.0, 38.0, 66.0, 67.0, 53.0, 64.0, 68.0, 46.0, 60.0, 54.0, 43.0, 30.0, 44.0, 28.0, 21.0, 21.0, 13.0, 12.0, 12.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16796875, -2.077850341796875, -1.98773193359375, -1.897613525390625, -1.8074951171875, -1.717376708984375, -1.62725830078125, -1.537139892578125, -1.447021484375, -1.356903076171875, -1.26678466796875, -1.176666259765625, -1.0865478515625, -0.996429443359375, -0.90631103515625, -0.816192626953125, -0.72607421875, -0.635955810546875, -0.54583740234375, -0.455718994140625, -0.3656005859375, -0.275482177734375, -0.18536376953125, -0.095245361328125, -0.005126953125, 0.084991455078125, 0.17510986328125, 0.265228271484375, 0.3553466796875, 0.445465087890625, 0.53558349609375, 0.625701904296875, 0.7158203125, 0.805938720703125, 0.89605712890625, 0.986175537109375, 1.0762939453125, 1.166412353515625, 1.25653076171875, 1.346649169921875, 1.436767578125, 1.526885986328125, 1.61700439453125, 1.707122802734375, 1.7972412109375, 1.887359619140625, 1.97747802734375, 2.067596435546875, 2.15771484375, 2.247833251953125, 2.33795166015625, 2.428070068359375, 2.5181884765625, 2.608306884765625, 2.69842529296875, 2.788543701171875, 2.878662109375, 2.968780517578125, 3.05889892578125, 3.149017333984375, 3.2391357421875, 3.329254150390625, 3.41937255859375, 3.509490966796875, 3.599609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 14.0, 17.0, 34.0, 38.0, 60.0, 133.0, 225.0, 407.0, 947.0, 2389.0, 7407.0, 29683.0, 187791.0, 590449.0, 187432.0, 29974.0, 7220.0, 2414.0, 987.0, 419.0, 228.0, 116.0, 59.0, 41.0, 23.0, 16.0, 12.0, 1.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6533203125, -0.6295623779296875, -0.605804443359375, -0.5820465087890625, -0.55828857421875, -0.5345306396484375, -0.510772705078125, -0.4870147705078125, -0.4632568359375, -0.4394989013671875, -0.415740966796875, -0.3919830322265625, -0.36822509765625, -0.3444671630859375, -0.320709228515625, -0.2969512939453125, -0.273193359375, -0.2494354248046875, -0.225677490234375, -0.2019195556640625, -0.17816162109375, -0.1544036865234375, -0.130645751953125, -0.1068878173828125, -0.0831298828125, -0.0593719482421875, -0.035614013671875, -0.0118560791015625, 0.01190185546875, 0.0356597900390625, 0.059417724609375, 0.0831756591796875, 0.10693359375, 0.1306915283203125, 0.154449462890625, 0.1782073974609375, 0.20196533203125, 0.2257232666015625, 0.249481201171875, 0.2732391357421875, 0.2969970703125, 0.3207550048828125, 0.344512939453125, 0.3682708740234375, 0.39202880859375, 0.4157867431640625, 0.439544677734375, 0.4633026123046875, 0.487060546875, 0.5108184814453125, 0.534576416015625, 0.5583343505859375, 0.58209228515625, 0.6058502197265625, 0.629608154296875, 0.6533660888671875, 0.6771240234375, 0.7008819580078125, 0.724639892578125, 0.7483978271484375, 0.77215576171875, 0.7959136962890625, 0.819671630859375, 0.8434295654296875, 0.8671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 12.0, 14.0, 27.0, 31.0, 46.0, 63.0, 75.0, 99.0, 110.0, 104.0, 73.0, 82.0, 70.0, 43.0, 32.0, 25.0, 19.0, 13.0, 7.0, 13.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011485815048217773, -0.00011061038821935654, -0.00010636262595653534, -0.00010211486369371414, -9.786710143089294e-05, -9.361933916807175e-05, -8.937157690525055e-05, -8.512381464242935e-05, -8.087605237960815e-05, -7.662829011678696e-05, -7.238052785396576e-05, -6.813276559114456e-05, -6.388500332832336e-05, -5.963724106550217e-05, -5.538947880268097e-05, -5.114171653985977e-05, -4.6893954277038574e-05, -4.264619201421738e-05, -3.839842975139618e-05, -3.415066748857498e-05, -2.9902905225753784e-05, -2.5655142962932587e-05, -2.140738070011139e-05, -1.715961843729019e-05, -1.2911856174468994e-05, -8.664093911647797e-06, -4.416331648826599e-06, -1.685693860054016e-07, 4.079192876815796e-06, 8.326955139636993e-06, 1.2574717402458191e-05, 1.682247966527939e-05, 2.1070241928100586e-05, 2.5318004190921783e-05, 2.956576645374298e-05, 3.381352871656418e-05, 3.8061290979385376e-05, 4.2309053242206573e-05, 4.655681550502777e-05, 5.080457776784897e-05, 5.5052340030670166e-05, 5.9300102293491364e-05, 6.354786455631256e-05, 6.779562681913376e-05, 7.204338908195496e-05, 7.629115134477615e-05, 8.053891360759735e-05, 8.478667587041855e-05, 8.903443813323975e-05, 9.328220039606094e-05, 9.752996265888214e-05, 0.00010177772492170334, 0.00010602548718452454, 0.00011027324944734573, 0.00011452101171016693, 0.00011876877397298813, 0.00012301653623580933, 0.00012726429849863052, 0.00013151206076145172, 0.00013575982302427292, 0.00014000758528709412, 0.00014425534754991531, 0.0001485031098127365, 0.0001527508720755577, 0.0001569986343383789]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 3.0, 5.0, 17.0, 17.0, 38.0, 46.0, 114.0, 208.0, 515.0, 1702.0, 7608.0, 47275.0, 403242.0, 508845.0, 65697.0, 9887.0, 2184.0, 628.0, 237.0, 112.0, 77.0, 31.0, 25.0, 11.0, 11.0, 3.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99658203125, -0.968170166015625, -0.93975830078125, -0.911346435546875, -0.8829345703125, -0.854522705078125, -0.82611083984375, -0.797698974609375, -0.769287109375, -0.740875244140625, -0.71246337890625, -0.684051513671875, -0.6556396484375, -0.627227783203125, -0.59881591796875, -0.570404052734375, -0.5419921875, -0.513580322265625, -0.48516845703125, -0.456756591796875, -0.4283447265625, -0.399932861328125, -0.37152099609375, -0.343109130859375, -0.314697265625, -0.286285400390625, -0.25787353515625, -0.229461669921875, -0.2010498046875, -0.172637939453125, -0.14422607421875, -0.115814208984375, -0.08740234375, -0.058990478515625, -0.03057861328125, -0.002166748046875, 0.0262451171875, 0.054656982421875, 0.08306884765625, 0.111480712890625, 0.139892578125, 0.168304443359375, 0.19671630859375, 0.225128173828125, 0.2535400390625, 0.281951904296875, 0.31036376953125, 0.338775634765625, 0.3671875, 0.395599365234375, 0.42401123046875, 0.452423095703125, 0.4808349609375, 0.509246826171875, 0.53765869140625, 0.566070556640625, 0.594482421875, 0.622894287109375, 0.65130615234375, 0.679718017578125, 0.7081298828125, 0.736541748046875, 0.76495361328125, 0.793365478515625, 0.82177734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 9.0, 10.0, 16.0, 19.0, 40.0, 47.0, 61.0, 83.0, 71.0, 84.0, 111.0, 96.0, 90.0, 58.0, 56.0, 40.0, 30.0, 24.0, 15.0, 11.0, 8.0, 3.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.83203125, -0.8114700317382812, -0.7909088134765625, -0.7703475952148438, -0.749786376953125, -0.7292251586914062, -0.7086639404296875, -0.6881027221679688, -0.66754150390625, -0.6469802856445312, -0.6264190673828125, -0.6058578491210938, -0.585296630859375, -0.5647354125976562, -0.5441741943359375, -0.5236129760742188, -0.5030517578125, -0.48249053955078125, -0.4619293212890625, -0.44136810302734375, -0.420806884765625, -0.40024566650390625, -0.3796844482421875, -0.35912322998046875, -0.33856201171875, -0.31800079345703125, -0.2974395751953125, -0.27687835693359375, -0.256317138671875, -0.23575592041015625, -0.2151947021484375, -0.19463348388671875, -0.174072265625, -0.15351104736328125, -0.1329498291015625, -0.11238861083984375, -0.091827392578125, -0.07126617431640625, -0.0507049560546875, -0.03014373779296875, -0.00958251953125, 0.01097869873046875, 0.0315399169921875, 0.05210113525390625, 0.072662353515625, 0.09322357177734375, 0.1137847900390625, 0.13434600830078125, 0.1549072265625, 0.17546844482421875, 0.1960296630859375, 0.21659088134765625, 0.237152099609375, 0.25771331787109375, 0.2782745361328125, 0.29883575439453125, 0.31939697265625, 0.33995819091796875, 0.3605194091796875, 0.38108062744140625, 0.401641845703125, 0.42220306396484375, 0.4427642822265625, 0.46332550048828125, 0.48388671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 23.0, 86.0, 280.0, 413.0, 152.0, 39.0, 12.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.636882781982422, -19.616531372070312, -18.596179962158203, -17.57582664489746, -16.55547523498535, -15.535123825073242, -14.514771461486816, -13.49441909790039, -12.474067687988281, -11.453716278076172, -10.433363914489746, -9.41301155090332, -8.392660140991211, -7.372308254241943, -6.351956367492676, -5.331604480743408, -4.311252593994141, -3.290900707244873, -2.2705488204956055, -1.250196933746338, -0.2298450469970703, 0.7905068397521973, 1.8108587265014648, 2.8312106132507324, 3.8515625, 4.871914386749268, 5.892266273498535, 6.912618160247803, 7.93297004699707, 8.95332145690918, 9.973673820495605, 10.994026184082031, 12.014381408691406, 13.034732818603516, 14.055085182189941, 15.075437545776367, 16.095788955688477, 17.116140365600586, 18.136493682861328, 19.156845092773438, 20.177196502685547, 21.197547912597656, 22.217899322509766, 23.238252639770508, 24.258604049682617, 25.278955459594727, 26.29930877685547, 27.319660186767578, 28.340011596679688, 29.360363006591797, 30.380714416503906, 31.40106773376465, 32.421417236328125, 33.4417724609375, 34.46212387084961, 35.48247528076172, 36.50282669067383, 37.52317810058594, 38.54352951049805, 39.563880920410156, 40.58423614501953, 41.60458755493164, 42.62493896484375, 43.64529037475586, 44.66564178466797]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 11.0, 18.0, 23.0, 20.0, 25.0, 37.0, 35.0, 41.0, 50.0, 50.0, 52.0, 56.0, 73.0, 51.0, 55.0, 59.0, 44.0, 48.0, 38.0, 34.0, 31.0, 27.0, 37.0, 17.0, 10.0, 5.0, 6.0, 7.0, 8.0, 8.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.901290893554688, -19.38831329345703, -18.875337600708008, -18.36236000061035, -17.849384307861328, -17.336406707763672, -16.82343101501465, -16.310453414916992, -15.797476768493652, -15.284500122070312, -14.771523475646973, -14.258546829223633, -13.745569229125977, -13.232593536376953, -12.719615936279297, -12.206639289855957, -11.693662643432617, -11.180685997009277, -10.667709350585938, -10.154732704162598, -9.641756057739258, -9.128778457641602, -8.615801811218262, -8.102825164794922, -7.589848518371582, -7.076871871948242, -6.563895225524902, -6.050918102264404, -5.5379414558410645, -5.024964809417725, -4.511987686157227, -3.9990110397338867, -3.486034393310547, -2.973057746887207, -2.460080862045288, -1.9471040964126587, -1.4341273307800293, -0.9211506843566895, -0.4081737995147705, 0.10480308532714844, 0.6177797317504883, 1.1307564973831177, 1.643733263015747, 2.156710147857666, 2.669686794281006, 3.1826634407043457, 3.6956403255462646, 4.208617210388184, 4.721593856811523, 5.234570503234863, 5.747547149658203, 6.260524272918701, 6.773500919342041, 7.286477565765381, 7.799454689025879, 8.312431335449219, 8.825407981872559, 9.338384628295898, 9.851361274719238, 10.364337921142578, 10.877315521240234, 11.390291213989258, 11.903268814086914, 12.416245460510254, 12.929222106933594]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 5.0, 2.0, 6.0, 0.0, 7.0, 13.0, 6.0, 16.0, 20.0, 25.0, 28.0, 39.0, 77.0, 104.0, 209.0, 359.0, 785.0, 2275.0, 9637.0, 100682.0, 4004320.0, 65089.0, 7537.0, 1867.0, 580.0, 270.0, 129.0, 74.0, 48.0, 26.0, 14.0, 14.0, 6.0, 10.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.2110595703125, -3.093994140625, -2.9769287109375, -2.85986328125, -2.7427978515625, -2.625732421875, -2.5086669921875, -2.3916015625, -2.2745361328125, -2.157470703125, -2.0404052734375, -1.92333984375, -1.8062744140625, -1.689208984375, -1.5721435546875, -1.455078125, -1.3380126953125, -1.220947265625, -1.1038818359375, -0.98681640625, -0.8697509765625, -0.752685546875, -0.6356201171875, -0.5185546875, -0.4014892578125, -0.284423828125, -0.1673583984375, -0.05029296875, 0.0667724609375, 0.183837890625, 0.3009033203125, 0.41796875, 0.5350341796875, 0.652099609375, 0.7691650390625, 0.88623046875, 1.0032958984375, 1.120361328125, 1.2374267578125, 1.3544921875, 1.4715576171875, 1.588623046875, 1.7056884765625, 1.82275390625, 1.9398193359375, 2.056884765625, 2.1739501953125, 2.291015625, 2.4080810546875, 2.525146484375, 2.6422119140625, 2.75927734375, 2.8763427734375, 2.993408203125, 3.1104736328125, 3.2275390625, 3.3446044921875, 3.461669921875, 3.5787353515625, 3.69580078125, 3.8128662109375, 3.929931640625, 4.0469970703125, 4.1640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 5.0, 17.0, 18.0, 34.0, 52.0, 91.0, 95.0, 87.0, 113.0, 116.0, 105.0, 89.0, 64.0, 45.0, 23.0, 20.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.7243270874023438, -1.6830291748046875, -1.6417312622070312, -1.600433349609375, -1.5591354370117188, -1.5178375244140625, -1.4765396118164062, -1.43524169921875, -1.3939437866210938, -1.3526458740234375, -1.3113479614257812, -1.270050048828125, -1.2287521362304688, -1.1874542236328125, -1.1461563110351562, -1.1048583984375, -1.0635604858398438, -1.0222625732421875, -0.9809646606445312, -0.939666748046875, -0.8983688354492188, -0.8570709228515625, -0.8157730102539062, -0.77447509765625, -0.7331771850585938, -0.6918792724609375, -0.6505813598632812, -0.609283447265625, -0.5679855346679688, -0.5266876220703125, -0.48538970947265625, -0.444091796875, -0.40279388427734375, -0.3614959716796875, -0.32019805908203125, -0.278900146484375, -0.23760223388671875, -0.1963043212890625, -0.15500640869140625, -0.11370849609375, -0.07241058349609375, -0.0311126708984375, 0.01018524169921875, 0.051483154296875, 0.09278106689453125, 0.1340789794921875, 0.17537689208984375, 0.2166748046875, 0.25797271728515625, 0.2992706298828125, 0.34056854248046875, 0.381866455078125, 0.42316436767578125, 0.4644622802734375, 0.5057601928710938, 0.54705810546875, 0.5883560180664062, 0.6296539306640625, 0.6709518432617188, 0.712249755859375, 0.7535476684570312, 0.7948455810546875, 0.8361434936523438, 0.87744140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 11.0, 8.0, 14.0, 25.0, 25.0, 55.0, 159.0, 446.0, 1577.0, 7731.0, 82462.0, 4018249.0, 74430.0, 6957.0, 1413.0, 425.0, 154.0, 71.0, 31.0, 11.0, 7.0, 4.0, 5.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7265625, -4.60980224609375, -4.4930419921875, -4.37628173828125, -4.259521484375, -4.14276123046875, -4.0260009765625, -3.90924072265625, -3.79248046875, -3.67572021484375, -3.5589599609375, -3.44219970703125, -3.325439453125, -3.20867919921875, -3.0919189453125, -2.97515869140625, -2.8583984375, -2.74163818359375, -2.6248779296875, -2.50811767578125, -2.391357421875, -2.27459716796875, -2.1578369140625, -2.04107666015625, -1.92431640625, -1.80755615234375, -1.6907958984375, -1.57403564453125, -1.457275390625, -1.34051513671875, -1.2237548828125, -1.10699462890625, -0.990234375, -0.87347412109375, -0.7567138671875, -0.63995361328125, -0.523193359375, -0.40643310546875, -0.2896728515625, -0.17291259765625, -0.05615234375, 0.06060791015625, 0.1773681640625, 0.29412841796875, 0.410888671875, 0.52764892578125, 0.6444091796875, 0.76116943359375, 0.8779296875, 0.99468994140625, 1.1114501953125, 1.22821044921875, 1.344970703125, 1.46173095703125, 1.5784912109375, 1.69525146484375, 1.81201171875, 1.92877197265625, 2.0455322265625, 2.16229248046875, 2.279052734375, 2.39581298828125, 2.5125732421875, 2.62933349609375, 2.74609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 4.0, 10.0, 10.0, 21.0, 20.0, 36.0, 62.0, 136.0, 274.0, 1508.0, 1332.0, 296.0, 130.0, 79.0, 50.0, 25.0, 17.0, 12.0, 14.0, 6.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76171875, -0.7354202270507812, -0.7091217041015625, -0.6828231811523438, -0.656524658203125, -0.6302261352539062, -0.6039276123046875, -0.5776290893554688, -0.55133056640625, -0.5250320434570312, -0.4987335205078125, -0.47243499755859375, -0.446136474609375, -0.41983795166015625, -0.3935394287109375, -0.36724090576171875, -0.3409423828125, -0.31464385986328125, -0.2883453369140625, -0.26204681396484375, -0.235748291015625, -0.20944976806640625, -0.1831512451171875, -0.15685272216796875, -0.13055419921875, -0.10425567626953125, -0.0779571533203125, -0.05165863037109375, -0.025360107421875, 0.00093841552734375, 0.0272369384765625, 0.05353546142578125, 0.079833984375, 0.10613250732421875, 0.1324310302734375, 0.15872955322265625, 0.185028076171875, 0.21132659912109375, 0.2376251220703125, 0.26392364501953125, 0.29022216796875, 0.31652069091796875, 0.3428192138671875, 0.36911773681640625, 0.395416259765625, 0.42171478271484375, 0.4480133056640625, 0.47431182861328125, 0.5006103515625, 0.5269088745117188, 0.5532073974609375, 0.5795059204101562, 0.605804443359375, 0.6321029663085938, 0.6584014892578125, 0.6847000122070312, 0.71099853515625, 0.7372970581054688, 0.7635955810546875, 0.7898941040039062, 0.816192626953125, 0.8424911499023438, 0.8687896728515625, 0.8950881958007812, 0.92138671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 23.0, 122.0, 429.0, 339.0, 72.0, 12.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01996374130249, -5.636176586151123, -5.252388954162598, -4.8686017990112305, -4.484814643859863, -4.101027488708496, -3.7172398567199707, -3.3334527015686035, -2.9496653079986572, -2.565877914428711, -2.1820907592773438, -1.7983033657073975, -1.4145160913467407, -1.030728816986084, -0.6469414234161377, -0.2631542682647705, 0.12063312530517578, 0.5044203996658325, 0.888207733631134, 1.2719950675964355, 1.6557823419570923, 2.039569616317749, 2.4233570098876953, 2.8071441650390625, 3.190931558609009, 3.574718952178955, 3.9585061073303223, 4.342293739318848, 4.726080894470215, 5.109868049621582, 5.493655204772949, 5.877442359924316, 6.261229515075684, 6.645016670227051, 7.028804302215576, 7.412591457366943, 7.7963786125183105, 8.180166244506836, 8.563953399658203, 8.94774055480957, 9.331527709960938, 9.715314865112305, 10.099102020263672, 10.482889175415039, 10.866677284240723, 11.25046443939209, 11.634251594543457, 12.018038749694824, 12.401826858520508, 12.785614013671875, 13.169401168823242, 13.55318832397461, 13.936976432800293, 14.32076358795166, 14.704550743103027, 15.088337898254395, 15.472125053405762, 15.855912208557129, 16.239700317382812, 16.62348747253418, 17.007274627685547, 17.391061782836914, 17.77484893798828, 18.15863609313965, 18.542423248291016]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 9.0, 16.0, 31.0, 34.0, 27.0, 48.0, 41.0, 65.0, 57.0, 78.0, 67.0, 65.0, 69.0, 81.0, 59.0, 47.0, 47.0, 35.0, 27.0, 24.0, 20.0, 19.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-5.130592346191406, -5.011147975921631, -4.891704082489014, -4.772259712219238, -4.652815818786621, -4.533371448516846, -4.41392707824707, -4.294483184814453, -4.175038814544678, -4.055594444274902, -3.936150550842285, -3.8167061805725098, -3.6972620487213135, -3.577817916870117, -3.458373785018921, -3.3389296531677246, -3.219485282897949, -3.100041151046753, -2.9805970191955566, -2.8611526489257812, -2.741708517074585, -2.6222643852233887, -2.5028202533721924, -2.383376121520996, -2.2639319896698, -2.1444878578186035, -2.0250437259674072, -1.9055994749069214, -1.7861552238464355, -1.6667110919952393, -1.547266960144043, -1.4278227090835571, -1.3083784580230713, -1.188934326171875, -1.0694900751113892, -0.9500459432601929, -0.830601692199707, -0.7111575603485107, -0.5917133688926697, -0.4722691774368286, -0.35282498598098755, -0.23338079452514648, -0.11393661797046661, 0.005507558584213257, 0.12495175004005432, 0.244395911693573, 0.36384010314941406, 0.4832842946052551, 0.6027284860610962, 0.7221726775169373, 0.8416168689727783, 0.9610610008239746, 1.0805052518844604, 1.1999493837356567, 1.3193936347961426, 1.4388377666473389, 1.5582818984985352, 1.6777260303497314, 1.7971702814102173, 1.9166144132614136, 2.0360586643218994, 2.1555027961730957, 2.274946928024292, 2.3943910598754883, 2.5138354301452637]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 11.0, 9.0, 25.0, 15.0, 28.0, 47.0, 79.0, 93.0, 191.0, 324.0, 600.0, 1533.0, 4626.0, 21424.0, 152296.0, 647990.0, 185257.0, 25635.0, 5225.0, 1645.0, 623.0, 367.0, 175.0, 103.0, 61.0, 39.0, 28.0, 27.0, 19.0, 14.0, 7.0, 7.0, 6.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.311370849609375, -2.22430419921875, -2.137237548828125, -2.0501708984375, -1.963104248046875, -1.87603759765625, -1.788970947265625, -1.701904296875, -1.614837646484375, -1.52777099609375, -1.440704345703125, -1.3536376953125, -1.266571044921875, -1.17950439453125, -1.092437744140625, -1.00537109375, -0.918304443359375, -0.83123779296875, -0.744171142578125, -0.6571044921875, -0.570037841796875, -0.48297119140625, -0.395904541015625, -0.308837890625, -0.221771240234375, -0.13470458984375, -0.047637939453125, 0.0394287109375, 0.126495361328125, 0.21356201171875, 0.300628662109375, 0.3876953125, 0.474761962890625, 0.56182861328125, 0.648895263671875, 0.7359619140625, 0.823028564453125, 0.91009521484375, 0.997161865234375, 1.084228515625, 1.171295166015625, 1.25836181640625, 1.345428466796875, 1.4324951171875, 1.519561767578125, 1.60662841796875, 1.693695068359375, 1.78076171875, 1.867828369140625, 1.95489501953125, 2.041961669921875, 2.1290283203125, 2.216094970703125, 2.30316162109375, 2.390228271484375, 2.477294921875, 2.564361572265625, 2.65142822265625, 2.738494873046875, 2.8255615234375, 2.912628173828125, 2.99969482421875, 3.086761474609375, 3.173828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 12.0, 33.0, 46.0, 59.0, 89.0, 111.0, 114.0, 107.0, 104.0, 96.0, 86.0, 62.0, 33.0, 14.0, 13.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7744140625, -1.7313995361328125, -1.688385009765625, -1.6453704833984375, -1.60235595703125, -1.5593414306640625, -1.516326904296875, -1.4733123779296875, -1.4302978515625, -1.3872833251953125, -1.344268798828125, -1.3012542724609375, -1.25823974609375, -1.2152252197265625, -1.172210693359375, -1.1291961669921875, -1.086181640625, -1.0431671142578125, -1.000152587890625, -0.9571380615234375, -0.91412353515625, -0.8711090087890625, -0.828094482421875, -0.7850799560546875, -0.7420654296875, -0.6990509033203125, -0.656036376953125, -0.6130218505859375, -0.57000732421875, -0.5269927978515625, -0.483978271484375, -0.4409637451171875, -0.39794921875, -0.3549346923828125, -0.311920166015625, -0.2689056396484375, -0.22589111328125, -0.1828765869140625, -0.139862060546875, -0.0968475341796875, -0.0538330078125, -0.0108184814453125, 0.032196044921875, 0.0752105712890625, 0.11822509765625, 0.1612396240234375, 0.204254150390625, 0.2472686767578125, 0.290283203125, 0.3332977294921875, 0.376312255859375, 0.4193267822265625, 0.46234130859375, 0.5053558349609375, 0.548370361328125, 0.5913848876953125, 0.6343994140625, 0.6774139404296875, 0.720428466796875, 0.7634429931640625, 0.80645751953125, 0.8494720458984375, 0.892486572265625, 0.9355010986328125, 0.978515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 2.0, 6.0, 12.0, 19.0, 32.0, 23.0, 35.0, 77.0, 91.0, 151.0, 174.0, 314.0, 539.0, 1066.0, 2489.0, 6939.0, 22554.0, 81943.0, 334064.0, 434992.0, 116576.0, 30536.0, 9500.0, 3261.0, 1376.0, 657.0, 353.0, 225.0, 170.0, 118.0, 81.0, 52.0, 30.0, 21.0, 15.0, 17.0, 12.0, 10.0, 12.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.75, -1.7001800537109375, -1.650360107421875, -1.6005401611328125, -1.55072021484375, -1.5009002685546875, -1.451080322265625, -1.4012603759765625, -1.3514404296875, -1.3016204833984375, -1.251800537109375, -1.2019805908203125, -1.15216064453125, -1.1023406982421875, -1.052520751953125, -1.0027008056640625, -0.952880859375, -0.9030609130859375, -0.853240966796875, -0.8034210205078125, -0.75360107421875, -0.7037811279296875, -0.653961181640625, -0.6041412353515625, -0.5543212890625, -0.5045013427734375, -0.454681396484375, -0.4048614501953125, -0.35504150390625, -0.3052215576171875, -0.255401611328125, -0.2055816650390625, -0.15576171875, -0.1059417724609375, -0.056121826171875, -0.0063018798828125, 0.04351806640625, 0.0933380126953125, 0.143157958984375, 0.1929779052734375, 0.2427978515625, 0.2926177978515625, 0.342437744140625, 0.3922576904296875, 0.44207763671875, 0.4918975830078125, 0.541717529296875, 0.5915374755859375, 0.641357421875, 0.6911773681640625, 0.740997314453125, 0.7908172607421875, 0.84063720703125, 0.8904571533203125, 0.940277099609375, 0.9900970458984375, 1.0399169921875, 1.0897369384765625, 1.139556884765625, 1.1893768310546875, 1.23919677734375, 1.2890167236328125, 1.338836669921875, 1.3886566162109375, 1.4384765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 6.0, 15.0, 4.0, 11.0, 12.0, 14.0, 14.0, 20.0, 10.0, 14.0, 23.0, 15.0, 40.0, 31.0, 54.0, 44.0, 37.0, 42.0, 37.0, 48.0, 39.0, 39.0, 50.0, 44.0, 39.0, 37.0, 36.0, 29.0, 31.0, 23.0, 22.0, 17.0, 19.0, 12.0, 15.0, 10.0, 15.0, 3.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1640625, -2.093475341796875, -2.02288818359375, -1.952301025390625, -1.8817138671875, -1.811126708984375, -1.74053955078125, -1.669952392578125, -1.599365234375, -1.528778076171875, -1.45819091796875, -1.387603759765625, -1.3170166015625, -1.246429443359375, -1.17584228515625, -1.105255126953125, -1.03466796875, -0.964080810546875, -0.89349365234375, -0.822906494140625, -0.7523193359375, -0.681732177734375, -0.61114501953125, -0.540557861328125, -0.469970703125, -0.399383544921875, -0.32879638671875, -0.258209228515625, -0.1876220703125, -0.117034912109375, -0.04644775390625, 0.024139404296875, 0.0947265625, 0.165313720703125, 0.23590087890625, 0.306488037109375, 0.3770751953125, 0.447662353515625, 0.51824951171875, 0.588836669921875, 0.659423828125, 0.730010986328125, 0.80059814453125, 0.871185302734375, 0.9417724609375, 1.012359619140625, 1.08294677734375, 1.153533935546875, 1.22412109375, 1.294708251953125, 1.36529541015625, 1.435882568359375, 1.5064697265625, 1.577056884765625, 1.64764404296875, 1.718231201171875, 1.788818359375, 1.859405517578125, 1.92999267578125, 2.000579833984375, 2.0711669921875, 2.141754150390625, 2.21234130859375, 2.282928466796875, 2.353515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 9.0, 9.0, 26.0, 38.0, 61.0, 87.0, 175.0, 371.0, 775.0, 2197.0, 8097.0, 52628.0, 435551.0, 475769.0, 59971.0, 8769.0, 2337.0, 809.0, 390.0, 201.0, 103.0, 59.0, 37.0, 28.0, 17.0, 12.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.664886474609375, -0.63934326171875, -0.613800048828125, -0.5882568359375, -0.562713623046875, -0.53717041015625, -0.511627197265625, -0.486083984375, -0.460540771484375, -0.43499755859375, -0.409454345703125, -0.3839111328125, -0.358367919921875, -0.33282470703125, -0.307281494140625, -0.28173828125, -0.256195068359375, -0.23065185546875, -0.205108642578125, -0.1795654296875, -0.154022216796875, -0.12847900390625, -0.102935791015625, -0.077392578125, -0.051849365234375, -0.02630615234375, -0.000762939453125, 0.0247802734375, 0.050323486328125, 0.07586669921875, 0.101409912109375, 0.126953125, 0.152496337890625, 0.17803955078125, 0.203582763671875, 0.2291259765625, 0.254669189453125, 0.28021240234375, 0.305755615234375, 0.331298828125, 0.356842041015625, 0.38238525390625, 0.407928466796875, 0.4334716796875, 0.459014892578125, 0.48455810546875, 0.510101318359375, 0.53564453125, 0.561187744140625, 0.58673095703125, 0.612274169921875, 0.6378173828125, 0.663360595703125, 0.68890380859375, 0.714447021484375, 0.739990234375, 0.765533447265625, 0.79107666015625, 0.816619873046875, 0.8421630859375, 0.867706298828125, 0.89324951171875, 0.918792724609375, 0.9443359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 7.0, 8.0, 12.0, 12.0, 17.0, 21.0, 43.0, 49.0, 72.0, 73.0, 99.0, 86.0, 106.0, 72.0, 87.0, 55.0, 36.0, 35.0, 32.0, 13.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.00014194101095199585, -0.00013796985149383545, -0.00013399869203567505, -0.00013002753257751465, -0.00012605637311935425, -0.00012208521366119385, -0.00011811405420303345, -0.00011414289474487305, -0.00011017173528671265, -0.00010620057582855225, -0.00010222941637039185, -9.825825691223145e-05, -9.428709745407104e-05, -9.031593799591064e-05, -8.634477853775024e-05, -8.237361907958984e-05, -7.840245962142944e-05, -7.443130016326904e-05, -7.046014070510864e-05, -6.648898124694824e-05, -6.251782178878784e-05, -5.854666233062744e-05, -5.457550287246704e-05, -5.060434341430664e-05, -4.663318395614624e-05, -4.266202449798584e-05, -3.869086503982544e-05, -3.471970558166504e-05, -3.074854612350464e-05, -2.6777386665344238e-05, -2.2806227207183838e-05, -1.8835067749023438e-05, -1.4863908290863037e-05, -1.0892748832702637e-05, -6.921589374542236e-06, -2.950429916381836e-06, 1.0207295417785645e-06, 4.991888999938965e-06, 8.963048458099365e-06, 1.2934207916259766e-05, 1.6905367374420166e-05, 2.0876526832580566e-05, 2.4847686290740967e-05, 2.8818845748901367e-05, 3.279000520706177e-05, 3.676116466522217e-05, 4.073232412338257e-05, 4.470348358154297e-05, 4.867464303970337e-05, 5.264580249786377e-05, 5.661696195602417e-05, 6.058812141418457e-05, 6.455928087234497e-05, 6.853044033050537e-05, 7.250159978866577e-05, 7.647275924682617e-05, 8.044391870498657e-05, 8.441507816314697e-05, 8.838623762130737e-05, 9.235739707946777e-05, 9.632855653762817e-05, 0.00010029971599578857, 0.00010427087545394897, 0.00010824203491210938]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 5.0, 7.0, 9.0, 11.0, 6.0, 19.0, 16.0, 23.0, 58.0, 77.0, 147.0, 254.0, 530.0, 1372.0, 3986.0, 14725.0, 67266.0, 330356.0, 472593.0, 123111.0, 24297.0, 6198.0, 1923.0, 786.0, 345.0, 155.0, 91.0, 41.0, 47.0, 25.0, 18.0, 13.0, 13.0, 9.0, 6.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7080078125, -0.6878814697265625, -0.667755126953125, -0.6476287841796875, -0.62750244140625, -0.6073760986328125, -0.587249755859375, -0.5671234130859375, -0.5469970703125, -0.5268707275390625, -0.506744384765625, -0.4866180419921875, -0.46649169921875, -0.4463653564453125, -0.426239013671875, -0.4061126708984375, -0.385986328125, -0.3658599853515625, -0.345733642578125, -0.3256072998046875, -0.30548095703125, -0.2853546142578125, -0.265228271484375, -0.2451019287109375, -0.2249755859375, -0.2048492431640625, -0.184722900390625, -0.1645965576171875, -0.14447021484375, -0.1243438720703125, -0.104217529296875, -0.0840911865234375, -0.06396484375, -0.0438385009765625, -0.023712158203125, -0.0035858154296875, 0.01654052734375, 0.0366668701171875, 0.056793212890625, 0.0769195556640625, 0.0970458984375, 0.1171722412109375, 0.137298583984375, 0.1574249267578125, 0.17755126953125, 0.1976776123046875, 0.217803955078125, 0.2379302978515625, 0.258056640625, 0.2781829833984375, 0.298309326171875, 0.3184356689453125, 0.33856201171875, 0.3586883544921875, 0.378814697265625, 0.3989410400390625, 0.4190673828125, 0.4391937255859375, 0.459320068359375, 0.4794464111328125, 0.49957275390625, 0.5196990966796875, 0.539825439453125, 0.5599517822265625, 0.580078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 9.0, 8.0, 8.0, 9.0, 10.0, 21.0, 26.0, 35.0, 36.0, 33.0, 65.0, 64.0, 82.0, 80.0, 74.0, 69.0, 62.0, 50.0, 58.0, 41.0, 31.0, 33.0, 23.0, 19.0, 16.0, 8.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47265625, -0.45670318603515625, -0.4407501220703125, -0.42479705810546875, -0.408843994140625, -0.39289093017578125, -0.3769378662109375, -0.36098480224609375, -0.34503173828125, -0.32907867431640625, -0.3131256103515625, -0.29717254638671875, -0.281219482421875, -0.26526641845703125, -0.2493133544921875, -0.23336029052734375, -0.2174072265625, -0.20145416259765625, -0.1855010986328125, -0.16954803466796875, -0.153594970703125, -0.13764190673828125, -0.1216888427734375, -0.10573577880859375, -0.08978271484375, -0.07382965087890625, -0.0578765869140625, -0.04192352294921875, -0.025970458984375, -0.01001739501953125, 0.0059356689453125, 0.02188873291015625, 0.037841796875, 0.05379486083984375, 0.0697479248046875, 0.08570098876953125, 0.101654052734375, 0.11760711669921875, 0.1335601806640625, 0.14951324462890625, 0.16546630859375, 0.18141937255859375, 0.1973724365234375, 0.21332550048828125, 0.229278564453125, 0.24523162841796875, 0.2611846923828125, 0.27713775634765625, 0.2930908203125, 0.30904388427734375, 0.3249969482421875, 0.34095001220703125, 0.356903076171875, 0.37285614013671875, 0.3888092041015625, 0.40476226806640625, 0.42071533203125, 0.43666839599609375, 0.4526214599609375, 0.46857452392578125, 0.484527587890625, 0.5004806518554688, 0.5164337158203125, 0.5323867797851562, 0.54833984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 57.0, 517.0, 376.0, 50.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.84335327148438, -89.02262878417969, -87.20189666748047, -85.38116455078125, -83.56044006347656, -81.73971557617188, -79.91898345947266, -78.09825134277344, -76.27752685546875, -74.45680236816406, -72.63607025146484, -70.81533813476562, -68.99461364746094, -67.17388916015625, -65.35315704345703, -63.53242874145508, -61.711700439453125, -59.89097213745117, -58.07024383544922, -56.249515533447266, -54.42878723144531, -52.60805892944336, -50.787330627441406, -48.96660232543945, -47.1458740234375, -45.32514572143555, -43.504417419433594, -41.68368911743164, -39.86296081542969, -38.042232513427734, -36.22150421142578, -34.40077590942383, -32.580047607421875, -30.759319305419922, -28.93859100341797, -27.117862701416016, -25.297134399414062, -23.47640609741211, -21.655677795410156, -19.834949493408203, -18.01422119140625, -16.193492889404297, -14.372764587402344, -12.55203628540039, -10.731307983398438, -8.910579681396484, -7.089851379394531, -5.269123077392578, -3.448394775390625, -1.6276664733886719, 0.19306182861328125, 2.0137901306152344, 3.8345184326171875, 5.655246734619141, 7.475975036621094, 9.296703338623047, 11.117431640625, 12.938159942626953, 14.758888244628906, 16.57961654663086, 18.400344848632812, 20.221073150634766, 22.04180145263672, 23.862529754638672, 25.683258056640625]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 18.0, 15.0, 16.0, 14.0, 19.0, 25.0, 29.0, 41.0, 34.0, 36.0, 40.0, 46.0, 42.0, 49.0, 66.0, 46.0, 47.0, 47.0, 32.0, 41.0, 39.0, 27.0, 29.0, 34.0, 19.0, 26.0, 25.0, 13.0, 19.0, 11.0, 7.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.620672225952148, -11.15491771697998, -10.689164161682129, -10.223409652709961, -9.75765609741211, -9.291901588439941, -8.82614803314209, -8.360393524169922, -7.89463996887207, -7.4288859367370605, -6.963131904602051, -6.497377872467041, -6.031623840332031, -5.565869331359863, -5.100115776062012, -4.634361267089844, -4.168607234954834, -3.702853202819824, -3.2370991706848145, -2.7713451385498047, -2.305591106414795, -1.839836835861206, -1.3740828037261963, -0.9083287715911865, -0.44257473945617676, 0.023179322481155396, 0.48893338441848755, 0.9546874761581421, 1.4204415082931519, 1.8861956596374512, 2.351949691772461, 2.8177037239074707, 3.2834577560424805, 3.7492117881774902, 4.2149658203125, 4.68071985244751, 5.1464738845825195, 5.6122283935546875, 6.077981948852539, 6.543736457824707, 7.009490013122559, 7.475244045257568, 7.940998077392578, 8.406752586364746, 8.872506141662598, 9.338260650634766, 9.804014205932617, 10.269768714904785, 10.735523223876953, 11.201277732849121, 11.667031288146973, 12.13278579711914, 12.598539352416992, 13.06429386138916, 13.530047416687012, 13.99580192565918, 14.461555480957031, 14.9273099899292, 15.39306354522705, 15.858818054199219, 16.32457160949707, 16.790325164794922, 17.256080627441406, 17.721834182739258, 18.18758773803711]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 13.0, 22.0, 16.0, 24.0, 34.0, 64.0, 101.0, 178.0, 301.0, 522.0, 1142.0, 2905.0, 10190.0, 64388.0, 3906256.0, 182890.0, 18038.0, 4243.0, 1452.0, 661.0, 361.0, 183.0, 131.0, 53.0, 34.0, 21.0, 18.0, 11.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.248382568359375, -4.14129638671875, -4.034210205078125, -3.9271240234375, -3.820037841796875, -3.71295166015625, -3.605865478515625, -3.498779296875, -3.391693115234375, -3.28460693359375, -3.177520751953125, -3.0704345703125, -2.963348388671875, -2.85626220703125, -2.749176025390625, -2.64208984375, -2.535003662109375, -2.42791748046875, -2.320831298828125, -2.2137451171875, -2.106658935546875, -1.99957275390625, -1.892486572265625, -1.785400390625, -1.678314208984375, -1.57122802734375, -1.464141845703125, -1.3570556640625, -1.249969482421875, -1.14288330078125, -1.035797119140625, -0.9287109375, -0.821624755859375, -0.71453857421875, -0.607452392578125, -0.5003662109375, -0.393280029296875, -0.28619384765625, -0.179107666015625, -0.072021484375, 0.035064697265625, 0.14215087890625, 0.249237060546875, 0.3563232421875, 0.463409423828125, 0.57049560546875, 0.677581787109375, 0.78466796875, 0.891754150390625, 0.99884033203125, 1.105926513671875, 1.2130126953125, 1.320098876953125, 1.42718505859375, 1.534271240234375, 1.641357421875, 1.748443603515625, 1.85552978515625, 1.962615966796875, 2.0697021484375, 2.176788330078125, 2.28387451171875, 2.390960693359375, 2.498046875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 17.0, 20.0, 29.0, 45.0, 55.0, 66.0, 90.0, 85.0, 99.0, 100.0, 90.0, 72.0, 69.0, 43.0, 36.0, 27.0, 22.0, 12.0, 9.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6528472900390625, -1.611358642578125, -1.5698699951171875, -1.52838134765625, -1.4868927001953125, -1.445404052734375, -1.4039154052734375, -1.3624267578125, -1.3209381103515625, -1.279449462890625, -1.2379608154296875, -1.19647216796875, -1.1549835205078125, -1.113494873046875, -1.0720062255859375, -1.030517578125, -0.9890289306640625, -0.947540283203125, -0.9060516357421875, -0.86456298828125, -0.8230743408203125, -0.781585693359375, -0.7400970458984375, -0.6986083984375, -0.6571197509765625, -0.615631103515625, -0.5741424560546875, -0.53265380859375, -0.4911651611328125, -0.449676513671875, -0.4081878662109375, -0.36669921875, -0.3252105712890625, -0.283721923828125, -0.2422332763671875, -0.20074462890625, -0.1592559814453125, -0.117767333984375, -0.0762786865234375, -0.0347900390625, 0.0066986083984375, 0.048187255859375, 0.0896759033203125, 0.13116455078125, 0.1726531982421875, 0.214141845703125, 0.2556304931640625, 0.297119140625, 0.3386077880859375, 0.380096435546875, 0.4215850830078125, 0.46307373046875, 0.5045623779296875, 0.546051025390625, 0.5875396728515625, 0.6290283203125, 0.6705169677734375, 0.712005615234375, 0.7534942626953125, 0.79498291015625, 0.8364715576171875, 0.877960205078125, 0.9194488525390625, 0.9609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 6.0, 4.0, 11.0, 13.0, 41.0, 65.0, 132.0, 264.0, 665.0, 1912.0, 7499.0, 51917.0, 3682370.0, 420005.0, 22698.0, 4413.0, 1273.0, 531.0, 235.0, 90.0, 67.0, 17.0, 14.0, 11.0, 10.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.862945556640625, -2.76690673828125, -2.670867919921875, -2.5748291015625, -2.478790283203125, -2.38275146484375, -2.286712646484375, -2.190673828125, -2.094635009765625, -1.99859619140625, -1.902557373046875, -1.8065185546875, -1.710479736328125, -1.61444091796875, -1.518402099609375, -1.42236328125, -1.326324462890625, -1.23028564453125, -1.134246826171875, -1.0382080078125, -0.942169189453125, -0.84613037109375, -0.750091552734375, -0.654052734375, -0.558013916015625, -0.46197509765625, -0.365936279296875, -0.2698974609375, -0.173858642578125, -0.07781982421875, 0.018218994140625, 0.1142578125, 0.210296630859375, 0.30633544921875, 0.402374267578125, 0.4984130859375, 0.594451904296875, 0.69049072265625, 0.786529541015625, 0.882568359375, 0.978607177734375, 1.07464599609375, 1.170684814453125, 1.2667236328125, 1.362762451171875, 1.45880126953125, 1.554840087890625, 1.65087890625, 1.746917724609375, 1.84295654296875, 1.938995361328125, 2.0350341796875, 2.131072998046875, 2.22711181640625, 2.323150634765625, 2.419189453125, 2.515228271484375, 2.61126708984375, 2.707305908203125, 2.8033447265625, 2.899383544921875, 2.99542236328125, 3.091461181640625, 3.1875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 6.0, 9.0, 7.0, 10.0, 11.0, 14.0, 20.0, 26.0, 68.0, 107.0, 180.0, 552.0, 2064.0, 553.0, 178.0, 92.0, 55.0, 35.0, 22.0, 14.0, 12.0, 8.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8885116577148438, -0.8536834716796875, -0.8188552856445312, -0.784027099609375, -0.7491989135742188, -0.7143707275390625, -0.6795425415039062, -0.64471435546875, -0.6098861694335938, -0.5750579833984375, -0.5402297973632812, -0.505401611328125, -0.47057342529296875, -0.4357452392578125, -0.40091705322265625, -0.3660888671875, -0.33126068115234375, -0.2964324951171875, -0.26160430908203125, -0.226776123046875, -0.19194793701171875, -0.1571197509765625, -0.12229156494140625, -0.08746337890625, -0.05263519287109375, -0.0178070068359375, 0.01702117919921875, 0.051849365234375, 0.08667755126953125, 0.1215057373046875, 0.15633392333984375, 0.191162109375, 0.22599029541015625, 0.2608184814453125, 0.29564666748046875, 0.330474853515625, 0.36530303955078125, 0.4001312255859375, 0.43495941162109375, 0.46978759765625, 0.5046157836914062, 0.5394439697265625, 0.5742721557617188, 0.609100341796875, 0.6439285278320312, 0.6787567138671875, 0.7135848999023438, 0.7484130859375, 0.7832412719726562, 0.8180694580078125, 0.8528976440429688, 0.887725830078125, 0.9225540161132812, 0.9573822021484375, 0.9922103881835938, 1.02703857421875, 1.0618667602539062, 1.0966949462890625, 1.1315231323242188, 1.166351318359375, 1.2011795043945312, 1.2360076904296875, 1.2708358764648438, 1.3056640625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 13.0, 276.0, 557.0, 132.0, 20.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.66816520690918, -12.995689392089844, -12.323213577270508, -11.650738716125488, -10.978262901306152, -10.305787086486816, -9.633312225341797, -8.960836410522461, -8.288360595703125, -7.615884780883789, -6.943409442901611, -6.270934104919434, -5.598458290100098, -4.925982475280762, -4.253507137298584, -3.5810317993164062, -2.9085559844970703, -2.2360804080963135, -1.5636048316955566, -0.8911292552947998, -0.21865367889404297, 0.45382189750671387, 1.1262974739074707, 1.7987728118896484, 2.4712486267089844, 3.143724203109741, 3.816199779510498, 4.488675117492676, 5.161150932312012, 5.833626747131348, 6.506102085113525, 7.178577423095703, 7.851051330566406, 8.523527145385742, 9.196002960205078, 9.868477821350098, 10.540953636169434, 11.21342945098877, 11.885904312133789, 12.558380126953125, 13.230855941772461, 13.903331756591797, 14.575807571411133, 15.248282432556152, 15.920758247375488, 16.593233108520508, 17.265708923339844, 17.93818473815918, 18.610660552978516, 19.28313636779785, 19.955612182617188, 20.628087997436523, 21.30056381225586, 21.973037719726562, 22.6455135345459, 23.317989349365234, 23.99046516418457, 24.662940979003906, 25.335416793823242, 26.007892608642578, 26.68036651611328, 27.352842330932617, 28.025318145751953, 28.69779396057129, 29.370269775390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 5.0, 5.0, 9.0, 17.0, 16.0, 14.0, 16.0, 25.0, 29.0, 43.0, 18.0, 26.0, 39.0, 36.0, 43.0, 42.0, 53.0, 34.0, 35.0, 50.0, 43.0, 32.0, 41.0, 29.0, 32.0, 32.0, 29.0, 29.0, 27.0, 27.0, 17.0, 16.0, 18.0, 15.0, 10.0, 5.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2756569385528564, -3.176650285720825, -3.077643871307373, -2.978637218475342, -2.8796305656433105, -2.7806239128112793, -2.681617498397827, -2.582610845565796, -2.4836041927337646, -2.3845975399017334, -2.2855911254882812, -2.18658447265625, -2.0875778198242188, -1.988571286201477, -1.8895647525787354, -1.790558099746704, -1.6915515661239624, -1.5925450325012207, -1.4935383796691895, -1.3945318460464478, -1.2955251932144165, -1.1965186595916748, -1.0975120067596436, -0.9985054731369019, -0.8994988799095154, -0.8004922866821289, -0.7014856934547424, -0.602479100227356, -0.5034725666046143, -0.4044659435749054, -0.3054593801498413, -0.20645278692245483, -0.10744619369506836, -0.008439607918262482, 0.0905669778585434, 0.18957355618476868, 0.28858014941215515, 0.3875867426395416, 0.4865933060646057, 0.5855998992919922, 0.6846064925193787, 0.7836130857467651, 0.8826196789741516, 0.9816262722015381, 1.0806328058242798, 1.179639458656311, 1.2786459922790527, 1.377652645111084, 1.4766591787338257, 1.5756657123565674, 1.6746723651885986, 1.7736788988113403, 1.8726855516433716, 1.9716920852661133, 2.0706987380981445, 2.169705390930176, 2.268711805343628, 2.367718458175659, 2.4667248725891113, 2.5657315254211426, 2.664738178253174, 2.763744831085205, 2.8627512454986572, 2.9617578983306885, 3.0607645511627197]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 5.0, 7.0, 11.0, 9.0, 19.0, 19.0, 44.0, 63.0, 101.0, 206.0, 398.0, 844.0, 1935.0, 5964.0, 25234.0, 176246.0, 688874.0, 121134.0, 19410.0, 4768.0, 1688.0, 740.0, 393.0, 182.0, 98.0, 49.0, 40.0, 18.0, 12.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1015625, -3.002838134765625, -2.90411376953125, -2.805389404296875, -2.7066650390625, -2.607940673828125, -2.50921630859375, -2.410491943359375, -2.311767578125, -2.213043212890625, -2.11431884765625, -2.015594482421875, -1.9168701171875, -1.818145751953125, -1.71942138671875, -1.620697021484375, -1.52197265625, -1.423248291015625, -1.32452392578125, -1.225799560546875, -1.1270751953125, -1.028350830078125, -0.92962646484375, -0.830902099609375, -0.732177734375, -0.633453369140625, -0.53472900390625, -0.436004638671875, -0.3372802734375, -0.238555908203125, -0.13983154296875, -0.041107177734375, 0.0576171875, 0.156341552734375, 0.25506591796875, 0.353790283203125, 0.4525146484375, 0.551239013671875, 0.64996337890625, 0.748687744140625, 0.847412109375, 0.946136474609375, 1.04486083984375, 1.143585205078125, 1.2423095703125, 1.341033935546875, 1.43975830078125, 1.538482666015625, 1.63720703125, 1.735931396484375, 1.83465576171875, 1.933380126953125, 2.0321044921875, 2.130828857421875, 2.22955322265625, 2.328277587890625, 2.427001953125, 2.525726318359375, 2.62445068359375, 2.723175048828125, 2.8218994140625, 2.920623779296875, 3.01934814453125, 3.118072509765625, 3.216796875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 13.0, 14.0, 31.0, 38.0, 46.0, 66.0, 80.0, 97.0, 76.0, 83.0, 100.0, 85.0, 58.0, 56.0, 42.0, 28.0, 30.0, 18.0, 9.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5810546875, -1.541748046875, -1.50244140625, -1.463134765625, -1.423828125, -1.384521484375, -1.34521484375, -1.305908203125, -1.2666015625, -1.227294921875, -1.18798828125, -1.148681640625, -1.109375, -1.070068359375, -1.03076171875, -0.991455078125, -0.9521484375, -0.912841796875, -0.87353515625, -0.834228515625, -0.794921875, -0.755615234375, -0.71630859375, -0.677001953125, -0.6376953125, -0.598388671875, -0.55908203125, -0.519775390625, -0.48046875, -0.441162109375, -0.40185546875, -0.362548828125, -0.3232421875, -0.283935546875, -0.24462890625, -0.205322265625, -0.166015625, -0.126708984375, -0.08740234375, -0.048095703125, -0.0087890625, 0.030517578125, 0.06982421875, 0.109130859375, 0.1484375, 0.187744140625, 0.22705078125, 0.266357421875, 0.3056640625, 0.344970703125, 0.38427734375, 0.423583984375, 0.462890625, 0.502197265625, 0.54150390625, 0.580810546875, 0.6201171875, 0.659423828125, 0.69873046875, 0.738037109375, 0.77734375, 0.816650390625, 0.85595703125, 0.895263671875, 0.9345703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 7.0, 7.0, 11.0, 8.0, 10.0, 20.0, 18.0, 32.0, 35.0, 41.0, 48.0, 98.0, 152.0, 244.0, 481.0, 1162.0, 3170.0, 10658.0, 45010.0, 265970.0, 577225.0, 112243.0, 22416.0, 5815.0, 1899.0, 745.0, 363.0, 210.0, 120.0, 81.0, 70.0, 36.0, 33.0, 31.0, 27.0, 11.0, 11.0, 13.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.16796875, -2.093902587890625, -2.01983642578125, -1.945770263671875, -1.8717041015625, -1.797637939453125, -1.72357177734375, -1.649505615234375, -1.575439453125, -1.501373291015625, -1.42730712890625, -1.353240966796875, -1.2791748046875, -1.205108642578125, -1.13104248046875, -1.056976318359375, -0.98291015625, -0.908843994140625, -0.83477783203125, -0.760711669921875, -0.6866455078125, -0.612579345703125, -0.53851318359375, -0.464447021484375, -0.390380859375, -0.316314697265625, -0.24224853515625, -0.168182373046875, -0.0941162109375, -0.020050048828125, 0.05401611328125, 0.128082275390625, 0.2021484375, 0.276214599609375, 0.35028076171875, 0.424346923828125, 0.4984130859375, 0.572479248046875, 0.64654541015625, 0.720611572265625, 0.794677734375, 0.868743896484375, 0.94281005859375, 1.016876220703125, 1.0909423828125, 1.165008544921875, 1.23907470703125, 1.313140869140625, 1.38720703125, 1.461273193359375, 1.53533935546875, 1.609405517578125, 1.6834716796875, 1.757537841796875, 1.83160400390625, 1.905670166015625, 1.979736328125, 2.053802490234375, 2.12786865234375, 2.201934814453125, 2.2760009765625, 2.350067138671875, 2.42413330078125, 2.498199462890625, 2.572265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 6.0, 7.0, 11.0, 11.0, 21.0, 21.0, 27.0, 29.0, 29.0, 31.0, 36.0, 44.0, 45.0, 48.0, 54.0, 55.0, 55.0, 64.0, 64.0, 42.0, 31.0, 34.0, 36.0, 32.0, 39.0, 15.0, 21.0, 19.0, 13.0, 4.0, 12.0, 8.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.365142822265625, -3.25958251953125, -3.154022216796875, -3.0484619140625, -2.942901611328125, -2.83734130859375, -2.731781005859375, -2.626220703125, -2.520660400390625, -2.41510009765625, -2.309539794921875, -2.2039794921875, -2.098419189453125, -1.99285888671875, -1.887298583984375, -1.78173828125, -1.676177978515625, -1.57061767578125, -1.465057373046875, -1.3594970703125, -1.253936767578125, -1.14837646484375, -1.042816162109375, -0.937255859375, -0.831695556640625, -0.72613525390625, -0.620574951171875, -0.5150146484375, -0.409454345703125, -0.30389404296875, -0.198333740234375, -0.0927734375, 0.012786865234375, 0.11834716796875, 0.223907470703125, 0.3294677734375, 0.435028076171875, 0.54058837890625, 0.646148681640625, 0.751708984375, 0.857269287109375, 0.96282958984375, 1.068389892578125, 1.1739501953125, 1.279510498046875, 1.38507080078125, 1.490631103515625, 1.59619140625, 1.701751708984375, 1.80731201171875, 1.912872314453125, 2.0184326171875, 2.123992919921875, 2.22955322265625, 2.335113525390625, 2.440673828125, 2.546234130859375, 2.65179443359375, 2.757354736328125, 2.8629150390625, 2.968475341796875, 3.07403564453125, 3.179595947265625, 3.28515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 18.0, 15.0, 51.0, 284.0, 2601.0, 1024844.0, 19982.0, 570.0, 129.0, 36.0, 11.0, 5.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.52996826171875, -5.3372802734375, -5.14459228515625, -4.951904296875, -4.75921630859375, -4.5665283203125, -4.37384033203125, -4.18115234375, -3.98846435546875, -3.7957763671875, -3.60308837890625, -3.410400390625, -3.21771240234375, -3.0250244140625, -2.83233642578125, -2.6396484375, -2.44696044921875, -2.2542724609375, -2.06158447265625, -1.868896484375, -1.67620849609375, -1.4835205078125, -1.29083251953125, -1.09814453125, -0.90545654296875, -0.7127685546875, -0.52008056640625, -0.327392578125, -0.13470458984375, 0.0579833984375, 0.25067138671875, 0.443359375, 0.63604736328125, 0.8287353515625, 1.02142333984375, 1.214111328125, 1.40679931640625, 1.5994873046875, 1.79217529296875, 1.98486328125, 2.17755126953125, 2.3702392578125, 2.56292724609375, 2.755615234375, 2.94830322265625, 3.1409912109375, 3.33367919921875, 3.5263671875, 3.71905517578125, 3.9117431640625, 4.10443115234375, 4.297119140625, 4.48980712890625, 4.6824951171875, 4.87518310546875, 5.06787109375, 5.26055908203125, 5.4532470703125, 5.64593505859375, 5.838623046875, 6.03131103515625, 6.2239990234375, 6.41668701171875, 6.609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 13.0, 34.0, 88.0, 286.0, 371.0, 141.0, 45.0, 13.0, 9.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006246566772460938, -0.0006078332662582397, -0.0005910098552703857, -0.0005741864442825317, -0.0005573630332946777, -0.0005405396223068237, -0.0005237162113189697, -0.0005068928003311157, -0.0004900693893432617, -0.0004732459783554077, -0.0004564225673675537, -0.0004395991563796997, -0.0004227757453918457, -0.0004059523344039917, -0.0003891289234161377, -0.0003723055124282837, -0.0003554821014404297, -0.0003386586904525757, -0.0003218352794647217, -0.0003050118684768677, -0.00028818845748901367, -0.00027136504650115967, -0.00025454163551330566, -0.00023771822452545166, -0.00022089481353759766, -0.00020407140254974365, -0.00018724799156188965, -0.00017042458057403564, -0.00015360116958618164, -0.00013677775859832764, -0.00011995434761047363, -0.00010313093662261963, -8.630752563476562e-05, -6.948411464691162e-05, -5.266070365905762e-05, -3.583729267120361e-05, -1.901388168334961e-05, -2.1904706954956055e-06, 1.4632940292358398e-05, 3.14563512802124e-05, 4.8279762268066406e-05, 6.510317325592041e-05, 8.192658424377441e-05, 9.874999523162842e-05, 0.00011557340621948242, 0.00013239681720733643, 0.00014922022819519043, 0.00016604363918304443, 0.00018286705017089844, 0.00019969046115875244, 0.00021651387214660645, 0.00023333728313446045, 0.00025016069412231445, 0.00026698410511016846, 0.00028380751609802246, 0.00030063092708587646, 0.00031745433807373047, 0.00033427774906158447, 0.0003511011600494385, 0.0003679245710372925, 0.0003847479820251465, 0.0004015713930130005, 0.0004183948040008545, 0.0004352182149887085, 0.0004520416259765625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 14.0, 29.0, 53.0, 125.0, 373.0, 4012.0, 1038109.0, 5250.0, 353.0, 148.0, 53.0, 23.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.496826171875, -7.30224609375, -7.107666015625, -6.9130859375, -6.718505859375, -6.52392578125, -6.329345703125, -6.134765625, -5.940185546875, -5.74560546875, -5.551025390625, -5.3564453125, -5.161865234375, -4.96728515625, -4.772705078125, -4.578125, -4.383544921875, -4.18896484375, -3.994384765625, -3.7998046875, -3.605224609375, -3.41064453125, -3.216064453125, -3.021484375, -2.826904296875, -2.63232421875, -2.437744140625, -2.2431640625, -2.048583984375, -1.85400390625, -1.659423828125, -1.46484375, -1.270263671875, -1.07568359375, -0.881103515625, -0.6865234375, -0.491943359375, -0.29736328125, -0.102783203125, 0.091796875, 0.286376953125, 0.48095703125, 0.675537109375, 0.8701171875, 1.064697265625, 1.25927734375, 1.453857421875, 1.6484375, 1.843017578125, 2.03759765625, 2.232177734375, 2.4267578125, 2.621337890625, 2.81591796875, 3.010498046875, 3.205078125, 3.399658203125, 3.59423828125, 3.788818359375, 3.9833984375, 4.177978515625, 4.37255859375, 4.567138671875, 4.76171875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 30.0, 123.0, 529.0, 263.0, 51.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0, -6.832244873046875, -6.66448974609375, -6.496734619140625, -6.3289794921875, -6.161224365234375, -5.99346923828125, -5.825714111328125, -5.657958984375, -5.490203857421875, -5.32244873046875, -5.154693603515625, -4.9869384765625, -4.819183349609375, -4.65142822265625, -4.483673095703125, -4.31591796875, -4.148162841796875, -3.98040771484375, -3.812652587890625, -3.6448974609375, -3.477142333984375, -3.30938720703125, -3.141632080078125, -2.973876953125, -2.806121826171875, -2.63836669921875, -2.470611572265625, -2.3028564453125, -2.135101318359375, -1.96734619140625, -1.799591064453125, -1.6318359375, -1.464080810546875, -1.29632568359375, -1.128570556640625, -0.9608154296875, -0.793060302734375, -0.62530517578125, -0.457550048828125, -0.289794921875, -0.122039794921875, 0.04571533203125, 0.213470458984375, 0.3812255859375, 0.548980712890625, 0.71673583984375, 0.884490966796875, 1.05224609375, 1.220001220703125, 1.38775634765625, 1.555511474609375, 1.7232666015625, 1.891021728515625, 2.05877685546875, 2.226531982421875, 2.394287109375, 2.562042236328125, 2.72979736328125, 2.897552490234375, 3.0653076171875, 3.233062744140625, 3.40081787109375, 3.568572998046875, 3.736328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 32.0, 88.0, 240.0, 316.0, 191.0, 74.0, 31.0, 19.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.45402526855469, -45.52759552001953, -44.60116195678711, -43.67472839355469, -42.74829864501953, -41.821868896484375, -40.89543533325195, -39.96900177001953, -39.042572021484375, -38.11614227294922, -37.1897087097168, -36.263275146484375, -35.33684539794922, -34.41041564941406, -33.48398208618164, -32.55754852294922, -31.631118774414062, -30.704687118530273, -29.778255462646484, -28.851823806762695, -27.925392150878906, -26.998960494995117, -26.072528839111328, -25.14609718322754, -24.21966552734375, -23.29323387145996, -22.366802215576172, -21.440370559692383, -20.513938903808594, -19.587507247924805, -18.661075592041016, -17.734643936157227, -16.80821418762207, -15.881782531738281, -14.955350875854492, -14.028919219970703, -13.102487564086914, -12.176055908203125, -11.249624252319336, -10.323192596435547, -9.396760940551758, -8.470329284667969, -7.54389762878418, -6.617465972900391, -5.691034317016602, -4.7646026611328125, -3.8381710052490234, -2.9117393493652344, -1.9853076934814453, -1.0588760375976562, -0.1324443817138672, 0.7939872741699219, 1.720418930053711, 2.6468505859375, 3.573282241821289, 4.499713897705078, 5.426145553588867, 6.352577209472656, 7.279008865356445, 8.205440521240234, 9.131872177124023, 10.058303833007812, 10.984735488891602, 11.91116714477539, 12.83759880065918]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 8.0, 5.0, 10.0, 18.0, 14.0, 16.0, 16.0, 20.0, 19.0, 31.0, 31.0, 38.0, 37.0, 32.0, 41.0, 33.0, 59.0, 32.0, 49.0, 42.0, 41.0, 31.0, 42.0, 32.0, 33.0, 35.0, 28.0, 31.0, 25.0, 18.0, 19.0, 15.0, 12.0, 21.0, 20.0, 7.0, 6.0, 4.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.201499938964844, -14.745380401611328, -14.289259910583496, -13.83314037322998, -13.377019882202148, -12.920900344848633, -12.464780807495117, -12.008660316467285, -11.55254077911377, -11.096421241760254, -10.640300750732422, -10.184181213378906, -9.728060722351074, -9.271941184997559, -8.815820693969727, -8.359701156616211, -7.903581142425537, -7.447461128234863, -6.9913411140441895, -6.535221099853516, -6.0791015625, -5.622981548309326, -5.166861534118652, -4.710741996765137, -4.254621505737305, -3.798501491546631, -3.342381715774536, -2.8862617015838623, -2.4301419258117676, -1.9740219116210938, -1.51790189743042, -1.0617821216583252, -0.6056623458862305, -0.1495424211025238, 0.30657750368118286, 0.7626974582672119, 1.2188173532485962, 1.6749372482299805, 2.1310572624206543, 2.587177038192749, 3.043297052383423, 3.4994170665740967, 3.9555368423461914, 4.411656856536865, 4.867776870727539, 5.323896408081055, 5.780016899108887, 6.236136436462402, 6.692256450653076, 7.14837646484375, 7.604496479034424, 8.060616493225098, 8.516736030578613, 8.972856521606445, 9.428976058959961, 9.885095596313477, 10.341216087341309, 10.797335624694824, 11.253456115722656, 11.709575653076172, 12.165696144104004, 12.62181568145752, 13.077936172485352, 13.534055709838867, 13.990175247192383]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 13.0, 16.0, 22.0, 36.0, 57.0, 111.0, 162.0, 263.0, 617.0, 1376.0, 3948.0, 15147.0, 138809.0, 3927065.0, 88471.0, 12233.0, 3449.0, 1252.0, 526.0, 296.0, 155.0, 100.0, 57.0, 30.0, 21.0, 13.0, 7.0, 8.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.971282958984375, -2.87030029296875, -2.769317626953125, -2.6683349609375, -2.567352294921875, -2.46636962890625, -2.365386962890625, -2.264404296875, -2.163421630859375, -2.06243896484375, -1.961456298828125, -1.8604736328125, -1.759490966796875, -1.65850830078125, -1.557525634765625, -1.45654296875, -1.355560302734375, -1.25457763671875, -1.153594970703125, -1.0526123046875, -0.951629638671875, -0.85064697265625, -0.749664306640625, -0.648681640625, -0.547698974609375, -0.44671630859375, -0.345733642578125, -0.2447509765625, -0.143768310546875, -0.04278564453125, 0.058197021484375, 0.1591796875, 0.260162353515625, 0.36114501953125, 0.462127685546875, 0.5631103515625, 0.664093017578125, 0.76507568359375, 0.866058349609375, 0.967041015625, 1.068023681640625, 1.16900634765625, 1.269989013671875, 1.3709716796875, 1.471954345703125, 1.57293701171875, 1.673919677734375, 1.77490234375, 1.875885009765625, 1.97686767578125, 2.077850341796875, 2.1788330078125, 2.279815673828125, 2.38079833984375, 2.481781005859375, 2.582763671875, 2.683746337890625, 2.78472900390625, 2.885711669921875, 2.9866943359375, 3.087677001953125, 3.18865966796875, 3.289642333984375, 3.390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 12.0, 2.0, 15.0, 12.0, 23.0, 19.0, 40.0, 60.0, 54.0, 53.0, 73.0, 85.0, 79.0, 88.0, 84.0, 66.0, 59.0, 41.0, 39.0, 27.0, 25.0, 20.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6806640625, -1.6392974853515625, -1.597930908203125, -1.5565643310546875, -1.51519775390625, -1.4738311767578125, -1.432464599609375, -1.3910980224609375, -1.3497314453125, -1.3083648681640625, -1.266998291015625, -1.2256317138671875, -1.18426513671875, -1.1428985595703125, -1.101531982421875, -1.0601654052734375, -1.018798828125, -0.9774322509765625, -0.936065673828125, -0.8946990966796875, -0.85333251953125, -0.8119659423828125, -0.770599365234375, -0.7292327880859375, -0.6878662109375, -0.6464996337890625, -0.605133056640625, -0.5637664794921875, -0.52239990234375, -0.4810333251953125, -0.439666748046875, -0.3983001708984375, -0.35693359375, -0.3155670166015625, -0.274200439453125, -0.2328338623046875, -0.19146728515625, -0.1501007080078125, -0.108734130859375, -0.0673675537109375, -0.0260009765625, 0.0153656005859375, 0.056732177734375, 0.0980987548828125, 0.13946533203125, 0.1808319091796875, 0.222198486328125, 0.2635650634765625, 0.304931640625, 0.3462982177734375, 0.387664794921875, 0.4290313720703125, 0.47039794921875, 0.5117645263671875, 0.553131103515625, 0.5944976806640625, 0.6358642578125, 0.6772308349609375, 0.718597412109375, 0.7599639892578125, 0.80133056640625, 0.8426971435546875, 0.884063720703125, 0.9254302978515625, 0.966796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 14.0, 22.0, 35.0, 52.0, 96.0, 201.0, 849.0, 7386.0, 1248328.0, 2927702.0, 8266.0, 912.0, 219.0, 87.0, 40.0, 31.0, 18.0, 8.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.53167724609375, -10.2977294921875, -10.06378173828125, -9.829833984375, -9.59588623046875, -9.3619384765625, -9.12799072265625, -8.89404296875, -8.66009521484375, -8.4261474609375, -8.19219970703125, -7.958251953125, -7.72430419921875, -7.4903564453125, -7.25640869140625, -7.0224609375, -6.78851318359375, -6.5545654296875, -6.32061767578125, -6.086669921875, -5.85272216796875, -5.6187744140625, -5.38482666015625, -5.15087890625, -4.91693115234375, -4.6829833984375, -4.44903564453125, -4.215087890625, -3.98114013671875, -3.7471923828125, -3.51324462890625, -3.279296875, -3.04534912109375, -2.8114013671875, -2.57745361328125, -2.343505859375, -2.10955810546875, -1.8756103515625, -1.64166259765625, -1.40771484375, -1.17376708984375, -0.9398193359375, -0.70587158203125, -0.471923828125, -0.23797607421875, -0.0040283203125, 0.22991943359375, 0.4638671875, 0.69781494140625, 0.9317626953125, 1.16571044921875, 1.399658203125, 1.63360595703125, 1.8675537109375, 2.10150146484375, 2.33544921875, 2.56939697265625, 2.8033447265625, 3.03729248046875, 3.271240234375, 3.50518798828125, 3.7391357421875, 3.97308349609375, 4.20703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 12.0, 14.0, 12.0, 27.0, 55.0, 104.0, 307.0, 2166.0, 966.0, 197.0, 94.0, 43.0, 24.0, 20.0, 16.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.02276611328125, -1.9732666015625, -1.92376708984375, -1.874267578125, -1.82476806640625, -1.7752685546875, -1.72576904296875, -1.67626953125, -1.62677001953125, -1.5772705078125, -1.52777099609375, -1.478271484375, -1.42877197265625, -1.3792724609375, -1.32977294921875, -1.2802734375, -1.23077392578125, -1.1812744140625, -1.13177490234375, -1.082275390625, -1.03277587890625, -0.9832763671875, -0.93377685546875, -0.88427734375, -0.83477783203125, -0.7852783203125, -0.73577880859375, -0.686279296875, -0.63677978515625, -0.5872802734375, -0.53778076171875, -0.48828125, -0.43878173828125, -0.3892822265625, -0.33978271484375, -0.290283203125, -0.24078369140625, -0.1912841796875, -0.14178466796875, -0.09228515625, -0.04278564453125, 0.0067138671875, 0.05621337890625, 0.105712890625, 0.15521240234375, 0.2047119140625, 0.25421142578125, 0.3037109375, 0.35321044921875, 0.4027099609375, 0.45220947265625, 0.501708984375, 0.55120849609375, 0.6007080078125, 0.65020751953125, 0.69970703125, 0.74920654296875, 0.7987060546875, 0.84820556640625, 0.897705078125, 0.94720458984375, 0.9967041015625, 1.04620361328125, 1.095703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 16.0, 38.0, 77.0, 112.0, 168.0, 175.0, 143.0, 116.0, 74.0, 27.0, 18.0, 13.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.530097007751465, -9.312538146972656, -9.094979286193848, -8.877421379089355, -8.659862518310547, -8.442303657531738, -8.22474479675293, -8.007186889648438, -7.789628028869629, -7.57206916809082, -7.35451078414917, -7.136951923370361, -6.919393539428711, -6.701834678649902, -6.484275817871094, -6.266717433929443, -6.049158573150635, -5.831599712371826, -5.614041328430176, -5.396482467651367, -5.178924083709717, -4.961365222930908, -4.743806838989258, -4.526247978210449, -4.308689117431641, -4.091130256652832, -3.8735718727111816, -3.656013011932373, -3.4384546279907227, -3.220895767211914, -3.0033371448516846, -2.785778522491455, -2.5682196617126465, -2.350661039352417, -2.1331024169921875, -1.9155436754226685, -1.697985053062439, -1.4804264307022095, -1.2628676891326904, -1.045309066772461, -0.8277504444122314, -0.610191822052002, -0.3926331400871277, -0.17507445812225342, 0.042484164237976074, 0.26004278659820557, 0.4776015281677246, 0.6951601505279541, 0.9127187728881836, 1.130277395248413, 1.3478360176086426, 1.5653947591781616, 1.7829533815383911, 2.00051212310791, 2.2180707454681396, 2.435629367828369, 2.6531879901885986, 2.870746612548828, 3.0883052349090576, 3.305863857269287, 3.5234227180480957, 3.740981101989746, 3.9585399627685547, 4.176098823547363, 4.393657207489014]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 8.0, 9.0, 9.0, 10.0, 16.0, 14.0, 15.0, 20.0, 36.0, 32.0, 26.0, 37.0, 26.0, 40.0, 52.0, 47.0, 34.0, 57.0, 61.0, 43.0, 47.0, 29.0, 35.0, 48.0, 29.0, 34.0, 25.0, 22.0, 17.0, 21.0, 9.0, 15.0, 11.0, 8.0, 7.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1181986331939697, -3.0216519832611084, -2.925105333328247, -2.8285584449768066, -2.7320117950439453, -2.635465145111084, -2.5389184951782227, -2.4423718452453613, -2.3458251953125, -2.2492785453796387, -2.1527318954467773, -2.056185245513916, -1.9596383571624756, -1.8630917072296143, -1.766545057296753, -1.6699984073638916, -1.5734515190124512, -1.4769048690795898, -1.380358099937439, -1.2838114500045776, -1.1872646808624268, -1.0907180309295654, -0.9941713809967041, -0.897624671459198, -0.8010779619216919, -0.7045312523841858, -0.6079845428466797, -0.5114378929138184, -0.41489118337631226, -0.31834447383880615, -0.22179782390594482, -0.12525111436843872, -0.028704166412353516, 0.0678425282239914, 0.1643892228603363, 0.26093590259552, 0.3574826121330261, 0.4540293216705322, 0.5505759716033936, 0.6471226811408997, 0.7436693906784058, 0.8402161002159119, 0.936762809753418, 1.0333094596862793, 1.1298561096191406, 1.2264028787612915, 1.3229495286941528, 1.4194962978363037, 1.516042947769165, 1.6125895977020264, 1.7091363668441772, 1.8056830167770386, 1.9022297859191895, 1.9987764358520508, 2.095323085784912, 2.1918697357177734, 2.2884163856506348, 2.384963035583496, 2.4815096855163574, 2.5780563354492188, 2.674603223800659, 2.7711498737335205, 2.867696523666382, 2.964243173599243, 3.0607900619506836]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 21.0, 31.0, 50.0, 75.0, 133.0, 281.0, 676.0, 1893.0, 7155.0, 35741.0, 240616.0, 608548.0, 126079.0, 20531.0, 4427.0, 1273.0, 468.0, 214.0, 123.0, 73.0, 45.0, 28.0, 20.0, 11.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.609375, -3.507232666015625, -3.40509033203125, -3.302947998046875, -3.2008056640625, -3.098663330078125, -2.99652099609375, -2.894378662109375, -2.792236328125, -2.690093994140625, -2.58795166015625, -2.485809326171875, -2.3836669921875, -2.281524658203125, -2.17938232421875, -2.077239990234375, -1.97509765625, -1.872955322265625, -1.77081298828125, -1.668670654296875, -1.5665283203125, -1.464385986328125, -1.36224365234375, -1.260101318359375, -1.157958984375, -1.055816650390625, -0.95367431640625, -0.851531982421875, -0.7493896484375, -0.647247314453125, -0.54510498046875, -0.442962646484375, -0.3408203125, -0.238677978515625, -0.13653564453125, -0.034393310546875, 0.0677490234375, 0.169891357421875, 0.27203369140625, 0.374176025390625, 0.476318359375, 0.578460693359375, 0.68060302734375, 0.782745361328125, 0.8848876953125, 0.987030029296875, 1.08917236328125, 1.191314697265625, 1.29345703125, 1.395599365234375, 1.49774169921875, 1.599884033203125, 1.7020263671875, 1.804168701171875, 1.90631103515625, 2.008453369140625, 2.110595703125, 2.212738037109375, 2.31488037109375, 2.417022705078125, 2.5191650390625, 2.621307373046875, 2.72344970703125, 2.825592041015625, 2.927734375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 12.0, 8.0, 19.0, 21.0, 21.0, 32.0, 47.0, 44.0, 52.0, 69.0, 77.0, 68.0, 94.0, 68.0, 56.0, 62.0, 56.0, 54.0, 25.0, 32.0, 27.0, 19.0, 13.0, 4.0, 10.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.564453125, -1.525604248046875, -1.48675537109375, -1.447906494140625, -1.4090576171875, -1.370208740234375, -1.33135986328125, -1.292510986328125, -1.253662109375, -1.214813232421875, -1.17596435546875, -1.137115478515625, -1.0982666015625, -1.059417724609375, -1.02056884765625, -0.981719970703125, -0.94287109375, -0.904022216796875, -0.86517333984375, -0.826324462890625, -0.7874755859375, -0.748626708984375, -0.70977783203125, -0.670928955078125, -0.632080078125, -0.593231201171875, -0.55438232421875, -0.515533447265625, -0.4766845703125, -0.437835693359375, -0.39898681640625, -0.360137939453125, -0.3212890625, -0.282440185546875, -0.24359130859375, -0.204742431640625, -0.1658935546875, -0.127044677734375, -0.08819580078125, -0.049346923828125, -0.010498046875, 0.028350830078125, 0.06719970703125, 0.106048583984375, 0.1448974609375, 0.183746337890625, 0.22259521484375, 0.261444091796875, 0.30029296875, 0.339141845703125, 0.37799072265625, 0.416839599609375, 0.4556884765625, 0.494537353515625, 0.53338623046875, 0.572235107421875, 0.611083984375, 0.649932861328125, 0.68878173828125, 0.727630615234375, 0.7664794921875, 0.805328369140625, 0.84417724609375, 0.883026123046875, 0.921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 4.0, 13.0, 18.0, 21.0, 20.0, 24.0, 32.0, 63.0, 70.0, 102.0, 201.0, 360.0, 977.0, 3139.0, 12620.0, 62144.0, 350555.0, 492253.0, 99796.0, 19112.0, 4507.0, 1328.0, 475.0, 226.0, 134.0, 99.0, 67.0, 37.0, 33.0, 26.0, 22.0, 14.0, 9.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.7734375, -2.6871337890625, -2.600830078125, -2.5145263671875, -2.42822265625, -2.3419189453125, -2.255615234375, -2.1693115234375, -2.0830078125, -1.9967041015625, -1.910400390625, -1.8240966796875, -1.73779296875, -1.6514892578125, -1.565185546875, -1.4788818359375, -1.392578125, -1.3062744140625, -1.219970703125, -1.1336669921875, -1.04736328125, -0.9610595703125, -0.874755859375, -0.7884521484375, -0.7021484375, -0.6158447265625, -0.529541015625, -0.4432373046875, -0.35693359375, -0.2706298828125, -0.184326171875, -0.0980224609375, -0.01171875, 0.0745849609375, 0.160888671875, 0.2471923828125, 0.33349609375, 0.4197998046875, 0.506103515625, 0.5924072265625, 0.6787109375, 0.7650146484375, 0.851318359375, 0.9376220703125, 1.02392578125, 1.1102294921875, 1.196533203125, 1.2828369140625, 1.369140625, 1.4554443359375, 1.541748046875, 1.6280517578125, 1.71435546875, 1.8006591796875, 1.886962890625, 1.9732666015625, 2.0595703125, 2.1458740234375, 2.232177734375, 2.3184814453125, 2.40478515625, 2.4910888671875, 2.577392578125, 2.6636962890625, 2.75]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 8.0, 18.0, 19.0, 15.0, 22.0, 22.0, 21.0, 34.0, 27.0, 34.0, 39.0, 38.0, 42.0, 46.0, 53.0, 50.0, 41.0, 39.0, 38.0, 38.0, 52.0, 38.0, 28.0, 26.0, 31.0, 30.0, 17.0, 28.0, 17.0, 16.0, 12.0, 9.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0], "bins": [-3.91796875, -3.813995361328125, -3.71002197265625, -3.606048583984375, -3.5020751953125, -3.398101806640625, -3.29412841796875, -3.190155029296875, -3.086181640625, -2.982208251953125, -2.87823486328125, -2.774261474609375, -2.6702880859375, -2.566314697265625, -2.46234130859375, -2.358367919921875, -2.25439453125, -2.150421142578125, -2.04644775390625, -1.942474365234375, -1.8385009765625, -1.734527587890625, -1.63055419921875, -1.526580810546875, -1.422607421875, -1.318634033203125, -1.21466064453125, -1.110687255859375, -1.0067138671875, -0.902740478515625, -0.79876708984375, -0.694793701171875, -0.5908203125, -0.486846923828125, -0.38287353515625, -0.278900146484375, -0.1749267578125, -0.070953369140625, 0.03302001953125, 0.136993408203125, 0.240966796875, 0.344940185546875, 0.44891357421875, 0.552886962890625, 0.6568603515625, 0.760833740234375, 0.86480712890625, 0.968780517578125, 1.07275390625, 1.176727294921875, 1.28070068359375, 1.384674072265625, 1.4886474609375, 1.592620849609375, 1.69659423828125, 1.800567626953125, 1.904541015625, 2.008514404296875, 2.11248779296875, 2.216461181640625, 2.3204345703125, 2.424407958984375, 2.52838134765625, 2.632354736328125, 2.736328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 1.0, 5.0, 9.0, 6.0, 14.0, 25.0, 41.0, 47.0, 109.0, 186.0, 398.0, 1044.0, 2998.0, 9495.0, 37295.0, 273794.0, 618971.0, 79240.0, 17240.0, 4840.0, 1593.0, 600.0, 272.0, 132.0, 82.0, 40.0, 30.0, 17.0, 9.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.2211151123046875, -1.172698974609375, -1.1242828369140625, -1.07586669921875, -1.0274505615234375, -0.979034423828125, -0.9306182861328125, -0.8822021484375, -0.8337860107421875, -0.785369873046875, -0.7369537353515625, -0.68853759765625, -0.6401214599609375, -0.591705322265625, -0.5432891845703125, -0.494873046875, -0.4464569091796875, -0.398040771484375, -0.3496246337890625, -0.30120849609375, -0.2527923583984375, -0.204376220703125, -0.1559600830078125, -0.1075439453125, -0.0591278076171875, -0.010711669921875, 0.0377044677734375, 0.08612060546875, 0.1345367431640625, 0.182952880859375, 0.2313690185546875, 0.27978515625, 0.3282012939453125, 0.376617431640625, 0.4250335693359375, 0.47344970703125, 0.5218658447265625, 0.570281982421875, 0.6186981201171875, 0.6671142578125, 0.7155303955078125, 0.763946533203125, 0.8123626708984375, 0.86077880859375, 0.9091949462890625, 0.957611083984375, 1.0060272216796875, 1.054443359375, 1.1028594970703125, 1.151275634765625, 1.1996917724609375, 1.24810791015625, 1.2965240478515625, 1.344940185546875, 1.3933563232421875, 1.4417724609375, 1.4901885986328125, 1.538604736328125, 1.5870208740234375, 1.63543701171875, 1.6838531494140625, 1.732269287109375, 1.7806854248046875, 1.8291015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 7.0, 15.0, 14.0, 13.0, 24.0, 43.0, 57.0, 72.0, 116.0, 151.0, 130.0, 105.0, 69.0, 57.0, 36.0, 22.0, 16.0, 14.0, 8.0, 7.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019478797912597656, -0.00018617138266563416, -0.00017755478620529175, -0.00016893818974494934, -0.00016032159328460693, -0.00015170499682426453, -0.00014308840036392212, -0.0001344718039035797, -0.0001258552074432373, -0.0001172386109828949, -0.00010862201452255249, -0.00010000541806221008, -9.138882160186768e-05, -8.277222514152527e-05, -7.415562868118286e-05, -6.553903222084045e-05, -5.692243576049805e-05, -4.830583930015564e-05, -3.968924283981323e-05, -3.1072646379470825e-05, -2.2456049919128418e-05, -1.383945345878601e-05, -5.2228569984436035e-06, 3.3937394618988037e-06, 1.2010335922241211e-05, 2.0626932382583618e-05, 2.9243528842926025e-05, 3.786012530326843e-05, 4.647672176361084e-05, 5.509331822395325e-05, 6.370991468429565e-05, 7.232651114463806e-05, 8.094310760498047e-05, 8.955970406532288e-05, 9.817630052566528e-05, 0.00010679289698600769, 0.0001154094934463501, 0.0001240260899066925, 0.0001326426863670349, 0.00014125928282737732, 0.00014987587928771973, 0.00015849247574806213, 0.00016710907220840454, 0.00017572566866874695, 0.00018434226512908936, 0.00019295886158943176, 0.00020157545804977417, 0.00021019205451011658, 0.00021880865097045898, 0.0002274252474308014, 0.0002360418438911438, 0.0002446584403514862, 0.0002532750368118286, 0.000261891633272171, 0.00027050822973251343, 0.00027912482619285583, 0.00028774142265319824, 0.00029635801911354065, 0.00030497461557388306, 0.00031359121203422546, 0.00032220780849456787, 0.0003308244049549103, 0.0003394410014152527, 0.0003480575978755951, 0.0003566741943359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 8.0, 20.0, 33.0, 68.0, 153.0, 472.0, 1857.0, 11599.0, 159379.0, 811223.0, 56059.0, 5985.0, 1122.0, 326.0, 130.0, 48.0, 20.0, 19.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.560546875, -2.4900665283203125, -2.419586181640625, -2.3491058349609375, -2.27862548828125, -2.2081451416015625, -2.137664794921875, -2.0671844482421875, -1.9967041015625, -1.9262237548828125, -1.855743408203125, -1.7852630615234375, -1.71478271484375, -1.6443023681640625, -1.573822021484375, -1.5033416748046875, -1.432861328125, -1.3623809814453125, -1.291900634765625, -1.2214202880859375, -1.15093994140625, -1.0804595947265625, -1.009979248046875, -0.9394989013671875, -0.8690185546875, -0.7985382080078125, -0.728057861328125, -0.6575775146484375, -0.58709716796875, -0.5166168212890625, -0.446136474609375, -0.3756561279296875, -0.30517578125, -0.2346954345703125, -0.164215087890625, -0.0937347412109375, -0.02325439453125, 0.0472259521484375, 0.117706298828125, 0.1881866455078125, 0.2586669921875, 0.3291473388671875, 0.399627685546875, 0.4701080322265625, 0.54058837890625, 0.6110687255859375, 0.681549072265625, 0.7520294189453125, 0.822509765625, 0.8929901123046875, 0.963470458984375, 1.0339508056640625, 1.10443115234375, 1.1749114990234375, 1.245391845703125, 1.3158721923828125, 1.3863525390625, 1.4568328857421875, 1.527313232421875, 1.5977935791015625, 1.66827392578125, 1.7387542724609375, 1.809234619140625, 1.8797149658203125, 1.9501953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 15.0, 15.0, 23.0, 29.0, 34.0, 57.0, 62.0, 80.0, 91.0, 90.0, 87.0, 81.0, 79.0, 59.0, 42.0, 33.0, 30.0, 20.0, 12.0, 8.0, 7.0, 7.0, 8.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0193023681640625, -0.984893798828125, -0.9504852294921875, -0.91607666015625, -0.8816680908203125, -0.847259521484375, -0.8128509521484375, -0.7784423828125, -0.7440338134765625, -0.709625244140625, -0.6752166748046875, -0.64080810546875, -0.6063995361328125, -0.571990966796875, -0.5375823974609375, -0.503173828125, -0.4687652587890625, -0.434356689453125, -0.3999481201171875, -0.36553955078125, -0.3311309814453125, -0.296722412109375, -0.2623138427734375, -0.2279052734375, -0.1934967041015625, -0.159088134765625, -0.1246795654296875, -0.09027099609375, -0.0558624267578125, -0.021453857421875, 0.0129547119140625, 0.04736328125, 0.0817718505859375, 0.116180419921875, 0.1505889892578125, 0.18499755859375, 0.2194061279296875, 0.253814697265625, 0.2882232666015625, 0.3226318359375, 0.3570404052734375, 0.391448974609375, 0.4258575439453125, 0.46026611328125, 0.4946746826171875, 0.529083251953125, 0.5634918212890625, 0.597900390625, 0.6323089599609375, 0.666717529296875, 0.7011260986328125, 0.73553466796875, 0.7699432373046875, 0.804351806640625, 0.8387603759765625, 0.8731689453125, 0.9075775146484375, 0.941986083984375, 0.9763946533203125, 1.01080322265625, 1.0452117919921875, 1.079620361328125, 1.1140289306640625, 1.1484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 22.0, 47.0, 139.0, 277.0, 279.0, 145.0, 54.0, 26.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.60749816894531, -35.50053787231445, -34.393577575683594, -33.286617279052734, -32.179656982421875, -31.072696685791016, -29.96573829650879, -28.85877799987793, -27.75181770324707, -26.64485740661621, -25.53789710998535, -24.430936813354492, -23.323978424072266, -22.217018127441406, -21.110057830810547, -20.003097534179688, -18.896137237548828, -17.78917694091797, -16.68221664428711, -15.575257301330566, -14.468297004699707, -13.361336708068848, -12.254377365112305, -11.147417068481445, -10.040456771850586, -8.933496475219727, -7.826536655426025, -6.719576835632324, -5.612616539001465, -4.5056562423706055, -3.3986964225769043, -2.291736602783203, -1.1847801208496094, -0.0778200626373291, 1.0291399955749512, 2.1361000537872314, 3.2430601119995117, 4.350020408630371, 5.456980228424072, 6.563940048217773, 7.670900344848633, 8.777860641479492, 9.884820938110352, 10.991780281066895, 12.098740577697754, 13.205700874328613, 14.312660217285156, 15.419620513916016, 16.526580810546875, 17.633541107177734, 18.740501403808594, 19.847461700439453, 20.954421997070312, 22.061382293701172, 23.1683406829834, 24.275300979614258, 25.382261276245117, 26.489221572875977, 27.596181869506836, 28.703142166137695, 29.810100555419922, 30.91706085205078, 32.02402114868164, 33.1309814453125, 34.23794174194336]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 8.0, 18.0, 12.0, 27.0, 15.0, 31.0, 28.0, 35.0, 31.0, 36.0, 39.0, 48.0, 47.0, 50.0, 52.0, 40.0, 36.0, 50.0, 35.0, 39.0, 37.0, 38.0, 34.0, 37.0, 30.0, 25.0, 13.0, 12.0, 17.0, 17.0, 8.0, 9.0, 2.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.035300254821777, -13.497518539428711, -12.959736824035645, -12.421955108642578, -11.884174346923828, -11.346391677856445, -10.808610916137695, -10.270829200744629, -9.733047485351562, -9.195265769958496, -8.65748405456543, -8.119702339172363, -7.581921100616455, -7.044139385223389, -6.5063581466674805, -5.968576431274414, -5.430794715881348, -4.893013000488281, -4.355231285095215, -3.8174500465393066, -3.2796683311462402, -2.741886615753174, -2.2041051387786865, -1.6663236618041992, -1.1285419464111328, -0.590760350227356, -0.0529787540435791, 0.48480284214019775, 1.0225844383239746, 1.560366153717041, 2.0981476306915283, 2.6359291076660156, 3.1737098693847656, 3.711491584777832, 4.249273300170898, 4.787054538726807, 5.324836254119873, 5.8626179695129395, 6.400399208068848, 6.938180923461914, 7.4759626388549805, 8.013744354248047, 8.551526069641113, 9.08930778503418, 9.62708854675293, 10.164871215820312, 10.702651977539062, 11.240433692932129, 11.778215408325195, 12.315997123718262, 12.853778839111328, 13.391560554504395, 13.929342269897461, 14.467123031616211, 15.004904747009277, 15.542686462402344, 16.080467224121094, 16.618247985839844, 17.156030654907227, 17.693811416625977, 18.23159408569336, 18.76937484741211, 19.307157516479492, 19.844938278198242, 20.382720947265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 1.0, 8.0, 6.0, 12.0, 12.0, 21.0, 37.0, 46.0, 67.0, 109.0, 209.0, 304.0, 573.0, 1100.0, 2269.0, 4986.0, 12638.0, 38794.0, 393207.0, 3648285.0, 61849.0, 16868.0, 6689.0, 2943.0, 1390.0, 756.0, 438.0, 253.0, 157.0, 88.0, 51.0, 37.0, 23.0, 16.0, 18.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.28125, -3.19293212890625, -3.1046142578125, -3.01629638671875, -2.927978515625, -2.83966064453125, -2.7513427734375, -2.66302490234375, -2.57470703125, -2.48638916015625, -2.3980712890625, -2.30975341796875, -2.221435546875, -2.13311767578125, -2.0447998046875, -1.95648193359375, -1.8681640625, -1.77984619140625, -1.6915283203125, -1.60321044921875, -1.514892578125, -1.42657470703125, -1.3382568359375, -1.24993896484375, -1.16162109375, -1.07330322265625, -0.9849853515625, -0.89666748046875, -0.808349609375, -0.72003173828125, -0.6317138671875, -0.54339599609375, -0.455078125, -0.36676025390625, -0.2784423828125, -0.19012451171875, -0.101806640625, -0.01348876953125, 0.0748291015625, 0.16314697265625, 0.25146484375, 0.33978271484375, 0.4281005859375, 0.51641845703125, 0.604736328125, 0.69305419921875, 0.7813720703125, 0.86968994140625, 0.9580078125, 1.04632568359375, 1.1346435546875, 1.22296142578125, 1.311279296875, 1.39959716796875, 1.4879150390625, 1.57623291015625, 1.66455078125, 1.75286865234375, 1.8411865234375, 1.92950439453125, 2.017822265625, 2.10614013671875, 2.1944580078125, 2.28277587890625, 2.37109375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 3.0, 3.0, 7.0, 11.0, 15.0, 17.0, 19.0, 26.0, 35.0, 42.0, 42.0, 52.0, 60.0, 60.0, 70.0, 51.0, 57.0, 53.0, 66.0, 42.0, 38.0, 46.0, 42.0, 27.0, 27.0, 18.0, 25.0, 15.0, 12.0, 3.0, 2.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.4013671875, -1.3653335571289062, -1.3292999267578125, -1.2932662963867188, -1.257232666015625, -1.2211990356445312, -1.1851654052734375, -1.1491317749023438, -1.11309814453125, -1.0770645141601562, -1.0410308837890625, -1.0049972534179688, -0.968963623046875, -0.9329299926757812, -0.8968963623046875, -0.8608627319335938, -0.8248291015625, -0.7887954711914062, -0.7527618408203125, -0.7167282104492188, -0.680694580078125, -0.6446609497070312, -0.6086273193359375, -0.5725936889648438, -0.53656005859375, -0.5005264282226562, -0.4644927978515625, -0.42845916748046875, -0.392425537109375, -0.35639190673828125, -0.3203582763671875, -0.28432464599609375, -0.248291015625, -0.21225738525390625, -0.1762237548828125, -0.14019012451171875, -0.104156494140625, -0.06812286376953125, -0.0320892333984375, 0.00394439697265625, 0.03997802734375, 0.07601165771484375, 0.1120452880859375, 0.14807891845703125, 0.184112548828125, 0.22014617919921875, 0.2561798095703125, 0.29221343994140625, 0.3282470703125, 0.36428070068359375, 0.4003143310546875, 0.43634796142578125, 0.472381591796875, 0.5084152221679688, 0.5444488525390625, 0.5804824829101562, 0.61651611328125, 0.6525497436523438, 0.6885833740234375, 0.7246170043945312, 0.760650634765625, 0.7966842651367188, 0.8327178955078125, 0.8687515258789062, 0.90478515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 10.0, 6.0, 16.0, 27.0, 31.0, 62.0, 115.0, 276.0, 903.0, 4485.0, 47570.0, 4093092.0, 42043.0, 4149.0, 890.0, 299.0, 131.0, 66.0, 48.0, 29.0, 17.0, 10.0, 11.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.779296875, -3.53515625, -3.291015625, -3.046875, -2.802734375, -2.55859375, -2.314453125, -2.0703125, -1.826171875, -1.58203125, -1.337890625, -1.09375, -0.849609375, -0.60546875, -0.361328125, -0.1171875, 0.126953125, 0.37109375, 0.615234375, 0.859375, 1.103515625, 1.34765625, 1.591796875, 1.8359375, 2.080078125, 2.32421875, 2.568359375, 2.8125, 3.056640625, 3.30078125, 3.544921875, 3.7890625, 4.033203125, 4.27734375, 4.521484375, 4.765625, 5.009765625, 5.25390625, 5.498046875, 5.7421875, 5.986328125, 6.23046875, 6.474609375, 6.71875, 6.962890625, 7.20703125, 7.451171875, 7.6953125, 7.939453125, 8.18359375, 8.427734375, 8.671875, 8.916015625, 9.16015625, 9.404296875, 9.6484375, 9.892578125, 10.13671875, 10.380859375, 10.625, 10.869140625, 11.11328125, 11.357421875, 11.6015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 12.0, 11.0, 18.0, 18.0, 44.0, 85.0, 254.0, 2818.0, 508.0, 121.0, 61.0, 29.0, 19.0, 14.0, 13.0, 7.0, 10.0, 3.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.07061767578125, -1.0162353515625, -0.96185302734375, -0.907470703125, -0.85308837890625, -0.7987060546875, -0.74432373046875, -0.68994140625, -0.63555908203125, -0.5811767578125, -0.52679443359375, -0.472412109375, -0.41802978515625, -0.3636474609375, -0.30926513671875, -0.2548828125, -0.20050048828125, -0.1461181640625, -0.09173583984375, -0.037353515625, 0.01702880859375, 0.0714111328125, 0.12579345703125, 0.18017578125, 0.23455810546875, 0.2889404296875, 0.34332275390625, 0.397705078125, 0.45208740234375, 0.5064697265625, 0.56085205078125, 0.615234375, 0.66961669921875, 0.7239990234375, 0.77838134765625, 0.832763671875, 0.88714599609375, 0.9415283203125, 0.99591064453125, 1.05029296875, 1.10467529296875, 1.1590576171875, 1.21343994140625, 1.267822265625, 1.32220458984375, 1.3765869140625, 1.43096923828125, 1.4853515625, 1.53973388671875, 1.5941162109375, 1.64849853515625, 1.702880859375, 1.75726318359375, 1.8116455078125, 1.86602783203125, 1.92041015625, 1.97479248046875, 2.0291748046875, 2.08355712890625, 2.137939453125, 2.19232177734375, 2.2467041015625, 2.30108642578125, 2.35546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 31.0, 38.0, 73.0, 139.0, 208.0, 202.0, 123.0, 72.0, 46.0, 29.0, 14.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.981631755828857, -6.719402313232422, -6.457172870635986, -6.194943428039551, -5.932713985443115, -5.67048454284668, -5.408255100250244, -5.146025657653809, -4.883796215057373, -4.6215667724609375, -4.359337329864502, -4.097107887268066, -3.834878444671631, -3.5726490020751953, -3.3104195594787598, -3.048190116882324, -2.7859606742858887, -2.523731231689453, -2.2615017890930176, -1.999272346496582, -1.7370429039001465, -1.474813461303711, -1.2125840187072754, -0.9503545761108398, -0.6881251335144043, -0.42589569091796875, -0.1636662483215332, 0.09856319427490234, 0.3607926368713379, 0.6230220794677734, 0.885251522064209, 1.1474809646606445, 1.4097099304199219, 1.6719393730163574, 1.934168815612793, 2.1963982582092285, 2.458627700805664, 2.7208571434020996, 2.983086585998535, 3.2453160285949707, 3.5075454711914062, 3.769774913787842, 4.032004356384277, 4.294233798980713, 4.556463241577148, 4.818692684173584, 5.0809221267700195, 5.343151569366455, 5.605381011962891, 5.867610454559326, 6.129839897155762, 6.392069339752197, 6.654298782348633, 6.916528224945068, 7.178757667541504, 7.4409871101379395, 7.703216552734375, 7.9654459953308105, 8.227675437927246, 8.489904403686523, 8.752134323120117, 9.014364242553711, 9.276593208312988, 9.538822174072266, 9.80105209350586]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 7.0, 8.0, 8.0, 10.0, 11.0, 14.0, 14.0, 14.0, 31.0, 33.0, 22.0, 26.0, 33.0, 54.0, 36.0, 49.0, 56.0, 47.0, 50.0, 47.0, 34.0, 37.0, 36.0, 42.0, 33.0, 26.0, 30.0, 26.0, 25.0, 18.0, 17.0, 25.0, 20.0, 12.0, 11.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6212024688720703, -3.505706310272217, -3.3902103900909424, -3.274714231491089, -3.1592180728912354, -3.043722152709961, -2.9282259941101074, -2.812729835510254, -2.6972339153289795, -2.581737756729126, -2.4662418365478516, -2.350745677947998, -2.2352495193481445, -2.11975359916687, -2.0042574405670166, -1.8887614011764526, -1.7732652425765991, -1.6577692031860352, -1.5422730445861816, -1.4267770051956177, -1.3112809658050537, -1.1957848072052002, -1.0802887678146362, -0.9647927284240723, -0.8492966294288635, -0.7338005304336548, -0.6183044910430908, -0.5028083920478821, -0.3873123228549957, -0.2718162536621094, -0.15632015466690063, -0.04082411527633667, 0.07467198371887207, 0.19016805291175842, 0.3056641221046448, 0.4211602210998535, 0.5366562604904175, 0.6521523594856262, 0.767648458480835, 0.8831444978713989, 0.9986405968666077, 1.1141366958618164, 1.2296327352523804, 1.3451287746429443, 1.4606249332427979, 1.5761209726333618, 1.6916170120239258, 1.8071131706237793, 1.9226092100143433, 2.0381052494049072, 2.1536014080047607, 2.269097328186035, 2.3845934867858887, 2.500089645385742, 2.6155858039855957, 2.73108172416687, 2.8465778827667236, 2.962074041366577, 3.0775699615478516, 3.193066120147705, 3.3085622787475586, 3.424058198928833, 3.5395543575286865, 3.655050277709961, 3.7705464363098145]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 4.0, 10.0, 6.0, 14.0, 13.0, 22.0, 26.0, 57.0, 85.0, 124.0, 197.0, 387.0, 682.0, 1289.0, 2468.0, 5205.0, 11719.0, 28256.0, 71076.0, 173117.0, 321624.0, 248211.0, 108391.0, 43269.0, 17448.0, 7600.0, 3504.0, 1651.0, 861.0, 475.0, 266.0, 158.0, 118.0, 68.0, 54.0, 28.0, 12.0, 19.0, 6.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.69140625, -1.6363677978515625, -1.581329345703125, -1.5262908935546875, -1.47125244140625, -1.4162139892578125, -1.361175537109375, -1.3061370849609375, -1.2510986328125, -1.1960601806640625, -1.141021728515625, -1.0859832763671875, -1.03094482421875, -0.9759063720703125, -0.920867919921875, -0.8658294677734375, -0.810791015625, -0.7557525634765625, -0.700714111328125, -0.6456756591796875, -0.59063720703125, -0.5355987548828125, -0.480560302734375, -0.4255218505859375, -0.3704833984375, -0.3154449462890625, -0.260406494140625, -0.2053680419921875, -0.15032958984375, -0.0952911376953125, -0.040252685546875, 0.0147857666015625, 0.06982421875, 0.1248626708984375, 0.179901123046875, 0.2349395751953125, 0.28997802734375, 0.3450164794921875, 0.400054931640625, 0.4550933837890625, 0.5101318359375, 0.5651702880859375, 0.620208740234375, 0.6752471923828125, 0.73028564453125, 0.7853240966796875, 0.840362548828125, 0.8954010009765625, 0.950439453125, 1.0054779052734375, 1.060516357421875, 1.1155548095703125, 1.17059326171875, 1.2256317138671875, 1.280670166015625, 1.3357086181640625, 1.3907470703125, 1.4457855224609375, 1.500823974609375, 1.5558624267578125, 1.61090087890625, 1.6659393310546875, 1.720977783203125, 1.7760162353515625, 1.8310546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 9.0, 10.0, 11.0, 26.0, 31.0, 25.0, 32.0, 44.0, 39.0, 62.0, 55.0, 51.0, 54.0, 64.0, 66.0, 49.0, 54.0, 54.0, 49.0, 39.0, 33.0, 26.0, 30.0, 23.0, 16.0, 13.0, 14.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.352691650390625, -1.31475830078125, -1.276824951171875, -1.2388916015625, -1.200958251953125, -1.16302490234375, -1.125091552734375, -1.087158203125, -1.049224853515625, -1.01129150390625, -0.973358154296875, -0.9354248046875, -0.897491455078125, -0.85955810546875, -0.821624755859375, -0.78369140625, -0.745758056640625, -0.70782470703125, -0.669891357421875, -0.6319580078125, -0.594024658203125, -0.55609130859375, -0.518157958984375, -0.480224609375, -0.442291259765625, -0.40435791015625, -0.366424560546875, -0.3284912109375, -0.290557861328125, -0.25262451171875, -0.214691162109375, -0.1767578125, -0.138824462890625, -0.10089111328125, -0.062957763671875, -0.0250244140625, 0.012908935546875, 0.05084228515625, 0.088775634765625, 0.126708984375, 0.164642333984375, 0.20257568359375, 0.240509033203125, 0.2784423828125, 0.316375732421875, 0.35430908203125, 0.392242431640625, 0.43017578125, 0.468109130859375, 0.50604248046875, 0.543975830078125, 0.5819091796875, 0.619842529296875, 0.65777587890625, 0.695709228515625, 0.733642578125, 0.771575927734375, 0.80950927734375, 0.847442626953125, 0.8853759765625, 0.923309326171875, 0.96124267578125, 0.999176025390625, 1.037109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 9.0, 11.0, 6.0, 11.0, 15.0, 17.0, 23.0, 33.0, 37.0, 54.0, 74.0, 92.0, 137.0, 212.0, 339.0, 568.0, 1193.0, 2660.0, 6667.0, 18746.0, 59692.0, 206073.0, 439029.0, 217723.0, 62744.0, 19549.0, 6973.0, 2883.0, 1217.0, 654.0, 348.0, 216.0, 132.0, 100.0, 71.0, 53.0, 45.0, 26.0, 25.0, 25.0, 11.0, 12.0, 12.0, 7.0, 5.0, 9.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-2.185546875, -2.11834716796875, -2.0511474609375, -1.98394775390625, -1.916748046875, -1.84954833984375, -1.7823486328125, -1.71514892578125, -1.64794921875, -1.58074951171875, -1.5135498046875, -1.44635009765625, -1.379150390625, -1.31195068359375, -1.2447509765625, -1.17755126953125, -1.1103515625, -1.04315185546875, -0.9759521484375, -0.90875244140625, -0.841552734375, -0.77435302734375, -0.7071533203125, -0.63995361328125, -0.57275390625, -0.50555419921875, -0.4383544921875, -0.37115478515625, -0.303955078125, -0.23675537109375, -0.1695556640625, -0.10235595703125, -0.03515625, 0.03204345703125, 0.0992431640625, 0.16644287109375, 0.233642578125, 0.30084228515625, 0.3680419921875, 0.43524169921875, 0.50244140625, 0.56964111328125, 0.6368408203125, 0.70404052734375, 0.771240234375, 0.83843994140625, 0.9056396484375, 0.97283935546875, 1.0400390625, 1.10723876953125, 1.1744384765625, 1.24163818359375, 1.308837890625, 1.37603759765625, 1.4432373046875, 1.51043701171875, 1.57763671875, 1.64483642578125, 1.7120361328125, 1.77923583984375, 1.846435546875, 1.91363525390625, 1.9808349609375, 2.04803466796875, 2.115234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 8.0, 6.0, 10.0, 11.0, 22.0, 22.0, 23.0, 22.0, 23.0, 36.0, 27.0, 37.0, 33.0, 40.0, 41.0, 34.0, 36.0, 40.0, 41.0, 45.0, 47.0, 48.0, 33.0, 34.0, 29.0, 41.0, 22.0, 18.0, 28.0, 18.0, 21.0, 11.0, 22.0, 9.0, 9.0, 11.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.69647216796875, -3.5745849609375, -3.45269775390625, -3.330810546875, -3.20892333984375, -3.0870361328125, -2.96514892578125, -2.84326171875, -2.72137451171875, -2.5994873046875, -2.47760009765625, -2.355712890625, -2.23382568359375, -2.1119384765625, -1.99005126953125, -1.8681640625, -1.74627685546875, -1.6243896484375, -1.50250244140625, -1.380615234375, -1.25872802734375, -1.1368408203125, -1.01495361328125, -0.89306640625, -0.77117919921875, -0.6492919921875, -0.52740478515625, -0.405517578125, -0.28363037109375, -0.1617431640625, -0.03985595703125, 0.08203125, 0.20391845703125, 0.3258056640625, 0.44769287109375, 0.569580078125, 0.69146728515625, 0.8133544921875, 0.93524169921875, 1.05712890625, 1.17901611328125, 1.3009033203125, 1.42279052734375, 1.544677734375, 1.66656494140625, 1.7884521484375, 1.91033935546875, 2.0322265625, 2.15411376953125, 2.2760009765625, 2.39788818359375, 2.519775390625, 2.64166259765625, 2.7635498046875, 2.88543701171875, 3.00732421875, 3.12921142578125, 3.2510986328125, 3.37298583984375, 3.494873046875, 3.61676025390625, 3.7386474609375, 3.86053466796875, 3.982421875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 10.0, 18.0, 26.0, 63.0, 170.0, 378.0, 1198.0, 5168.0, 62979.0, 895080.0, 75787.0, 5715.0, 1261.0, 389.0, 181.0, 73.0, 35.0, 19.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.534210205078125, -2.44537353515625, -2.356536865234375, -2.2677001953125, -2.178863525390625, -2.09002685546875, -2.001190185546875, -1.912353515625, -1.823516845703125, -1.73468017578125, -1.645843505859375, -1.5570068359375, -1.468170166015625, -1.37933349609375, -1.290496826171875, -1.20166015625, -1.112823486328125, -1.02398681640625, -0.935150146484375, -0.8463134765625, -0.757476806640625, -0.66864013671875, -0.579803466796875, -0.490966796875, -0.402130126953125, -0.31329345703125, -0.224456787109375, -0.1356201171875, -0.046783447265625, 0.04205322265625, 0.130889892578125, 0.2197265625, 0.308563232421875, 0.39739990234375, 0.486236572265625, 0.5750732421875, 0.663909912109375, 0.75274658203125, 0.841583251953125, 0.930419921875, 1.019256591796875, 1.10809326171875, 1.196929931640625, 1.2857666015625, 1.374603271484375, 1.46343994140625, 1.552276611328125, 1.64111328125, 1.729949951171875, 1.81878662109375, 1.907623291015625, 1.9964599609375, 2.085296630859375, 2.17413330078125, 2.262969970703125, 2.351806640625, 2.440643310546875, 2.52947998046875, 2.618316650390625, 2.7071533203125, 2.795989990234375, 2.88482666015625, 2.973663330078125, 3.0625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 11.0, 17.0, 27.0, 60.0, 117.0, 176.0, 218.0, 166.0, 89.0, 53.0, 25.0, 14.0, 9.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004024505615234375, -0.0003882572054862976, -0.0003740638494491577, -0.0003598704934120178, -0.00034567713737487793, -0.00033148378133773804, -0.00031729042530059814, -0.00030309706926345825, -0.00028890371322631836, -0.00027471035718917847, -0.0002605170011520386, -0.0002463236451148987, -0.0002321302890777588, -0.0002179369330406189, -0.000203743577003479, -0.0001895502209663391, -0.00017535686492919922, -0.00016116350889205933, -0.00014697015285491943, -0.00013277679681777954, -0.00011858344078063965, -0.00010439008474349976, -9.019672870635986e-05, -7.600337266921997e-05, -6.181001663208008e-05, -4.7616660594940186e-05, -3.342330455780029e-05, -1.92299485206604e-05, -5.036592483520508e-06, 9.156763553619385e-06, 2.3350119590759277e-05, 3.754347562789917e-05, 5.173683166503906e-05, 6.593018770217896e-05, 8.012354373931885e-05, 9.431689977645874e-05, 0.00010851025581359863, 0.00012270361185073853, 0.00013689696788787842, 0.0001510903239250183, 0.0001652836799621582, 0.0001794770359992981, 0.000193670392036438, 0.00020786374807357788, 0.00022205710411071777, 0.00023625046014785767, 0.00025044381618499756, 0.00026463717222213745, 0.00027883052825927734, 0.00029302388429641724, 0.00030721724033355713, 0.000321410596370697, 0.0003356039524078369, 0.0003497973084449768, 0.0003639906644821167, 0.0003781840205192566, 0.0003923773765563965, 0.0004065707325935364, 0.00042076408863067627, 0.00043495744466781616, 0.00044915080070495605, 0.00046334415674209595, 0.00047753751277923584, 0.0004917308688163757, 0.0005059242248535156]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 0.0, 5.0, 1.0, 4.0, 13.0, 15.0, 21.0, 37.0, 65.0, 157.0, 405.0, 1046.0, 3320.0, 14266.0, 116808.0, 709378.0, 177593.0, 19212.0, 4092.0, 1291.0, 438.0, 179.0, 70.0, 45.0, 28.0, 12.0, 9.0, 5.0, 8.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7490234375, -1.69183349609375, -1.6346435546875, -1.57745361328125, -1.520263671875, -1.46307373046875, -1.4058837890625, -1.34869384765625, -1.29150390625, -1.23431396484375, -1.1771240234375, -1.11993408203125, -1.062744140625, -1.00555419921875, -0.9483642578125, -0.89117431640625, -0.833984375, -0.77679443359375, -0.7196044921875, -0.66241455078125, -0.605224609375, -0.54803466796875, -0.4908447265625, -0.43365478515625, -0.37646484375, -0.31927490234375, -0.2620849609375, -0.20489501953125, -0.147705078125, -0.09051513671875, -0.0333251953125, 0.02386474609375, 0.0810546875, 0.13824462890625, 0.1954345703125, 0.25262451171875, 0.309814453125, 0.36700439453125, 0.4241943359375, 0.48138427734375, 0.53857421875, 0.59576416015625, 0.6529541015625, 0.71014404296875, 0.767333984375, 0.82452392578125, 0.8817138671875, 0.93890380859375, 0.99609375, 1.05328369140625, 1.1104736328125, 1.16766357421875, 1.224853515625, 1.28204345703125, 1.3392333984375, 1.39642333984375, 1.45361328125, 1.51080322265625, 1.5679931640625, 1.62518310546875, 1.682373046875, 1.73956298828125, 1.7967529296875, 1.85394287109375, 1.9111328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 5.0, 10.0, 27.0, 8.0, 29.0, 28.0, 22.0, 32.0, 32.0, 54.0, 62.0, 65.0, 72.0, 66.0, 73.0, 56.0, 55.0, 54.0, 36.0, 37.0, 30.0, 26.0, 14.0, 22.0, 8.0, 7.0, 8.0, 8.0, 8.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89990234375, -0.8688430786132812, -0.8377838134765625, -0.8067245483398438, -0.775665283203125, -0.7446060180664062, -0.7135467529296875, -0.6824874877929688, -0.65142822265625, -0.6203689575195312, -0.5893096923828125, -0.5582504272460938, -0.527191162109375, -0.49613189697265625, -0.4650726318359375, -0.43401336669921875, -0.4029541015625, -0.37189483642578125, -0.3408355712890625, -0.30977630615234375, -0.278717041015625, -0.24765777587890625, -0.2165985107421875, -0.18553924560546875, -0.15447998046875, -0.12342071533203125, -0.0923614501953125, -0.06130218505859375, -0.030242919921875, 0.00081634521484375, 0.0318756103515625, 0.06293487548828125, 0.093994140625, 0.12505340576171875, 0.1561126708984375, 0.18717193603515625, 0.218231201171875, 0.24929046630859375, 0.2803497314453125, 0.31140899658203125, 0.34246826171875, 0.37352752685546875, 0.4045867919921875, 0.43564605712890625, 0.466705322265625, 0.49776458740234375, 0.5288238525390625, 0.5598831176757812, 0.5909423828125, 0.6220016479492188, 0.6530609130859375, 0.6841201782226562, 0.715179443359375, 0.7462387084960938, 0.7772979736328125, 0.8083572387695312, 0.83941650390625, 0.8704757690429688, 0.9015350341796875, 0.9325942993164062, 0.963653564453125, 0.9947128295898438, 1.0257720947265625, 1.0568313598632812, 1.087890625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 12.0, 31.0, 94.0, 180.0, 344.0, 231.0, 73.0, 32.0, 11.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.13302612304688, -73.62413024902344, -72.115234375, -70.60633850097656, -69.09744262695312, -67.58853912353516, -66.07964324951172, -64.57074737548828, -63.061851501464844, -61.552955627441406, -60.04405975341797, -58.535160064697266, -57.02626419067383, -55.51736831665039, -54.00846862792969, -52.49957275390625, -50.99067687988281, -49.481781005859375, -47.97288513183594, -46.463985443115234, -44.9550895690918, -43.44619369506836, -41.937294006347656, -40.42839813232422, -38.91950225830078, -37.410606384277344, -35.901710510253906, -34.3928108215332, -32.883914947509766, -31.375019073486328, -29.866121292114258, -28.357223510742188, -26.848325729370117, -25.339427947998047, -23.83053207397461, -22.321636199951172, -20.8127384185791, -19.30384063720703, -17.794944763183594, -16.286048889160156, -14.777151107788086, -13.268254280090332, -11.759357452392578, -10.250460624694824, -8.74156379699707, -7.232666969299316, -5.7237701416015625, -4.214873313903809, -2.7059764862060547, -1.1970796585083008, 0.3118171691894531, 1.820713996887207, 3.329610824584961, 4.838507652282715, 6.347404479980469, 7.856301307678223, 9.365198135375977, 10.87409496307373, 12.382991790771484, 13.891888618469238, 15.400785446166992, 16.909683227539062, 18.4185791015625, 19.927474975585938, 21.436372756958008]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 12.0, 12.0, 21.0, 15.0, 32.0, 11.0, 28.0, 32.0, 27.0, 35.0, 44.0, 43.0, 54.0, 51.0, 41.0, 37.0, 44.0, 37.0, 51.0, 47.0, 33.0, 29.0, 24.0, 41.0, 23.0, 22.0, 22.0, 19.0, 23.0, 15.0, 12.0, 9.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.000274658203125, -18.28957748413086, -17.57887840270996, -16.868181228637695, -16.15748405456543, -15.446785926818848, -14.736087799072266, -14.025390625, -13.314692497253418, -12.603994369506836, -11.89329719543457, -11.182599067687988, -10.471900939941406, -9.76120376586914, -9.050505638122559, -8.339807510375977, -7.629110336303711, -6.918412685394287, -6.207715034484863, -5.497016906738281, -4.786319255828857, -4.075621604919434, -3.3649234771728516, -2.6542258262634277, -1.943528175354004, -1.2328304052352905, -0.5221326351165771, 0.18856525421142578, 0.8992629051208496, 1.6099605560302734, 2.3206586837768555, 3.0313563346862793, 3.742053985595703, 4.452751636505127, 5.163449287414551, 5.874147415161133, 6.584845066070557, 7.2955427169799805, 8.006240844726562, 8.716938018798828, 9.42763614654541, 10.138334274291992, 10.849031448364258, 11.55972957611084, 12.270427703857422, 12.981124877929688, 13.69182300567627, 14.402521133422852, 15.113218307495117, 15.8239164352417, 16.53461456298828, 17.245311737060547, 17.956008911132812, 18.666706085205078, 19.377405166625977, 20.088102340698242, 20.79880142211914, 21.509498596191406, 22.220197677612305, 22.93089485168457, 23.641592025756836, 24.352291107177734, 25.06298828125, 25.773685455322266, 26.48438262939453]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 7.0, 12.0, 16.0, 22.0, 27.0, 66.0, 71.0, 141.0, 219.0, 374.0, 669.0, 1189.0, 2191.0, 4621.0, 11013.0, 34278.0, 323318.0, 3723202.0, 63950.0, 16153.0, 6253.0, 2908.0, 1450.0, 871.0, 469.0, 260.0, 188.0, 108.0, 78.0, 51.0, 35.0, 23.0, 16.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.736328125, -3.6358642578125, -3.535400390625, -3.4349365234375, -3.33447265625, -3.2340087890625, -3.133544921875, -3.0330810546875, -2.9326171875, -2.8321533203125, -2.731689453125, -2.6312255859375, -2.53076171875, -2.4302978515625, -2.329833984375, -2.2293701171875, -2.12890625, -2.0284423828125, -1.927978515625, -1.8275146484375, -1.72705078125, -1.6265869140625, -1.526123046875, -1.4256591796875, -1.3251953125, -1.2247314453125, -1.124267578125, -1.0238037109375, -0.92333984375, -0.8228759765625, -0.722412109375, -0.6219482421875, -0.521484375, -0.4210205078125, -0.320556640625, -0.2200927734375, -0.11962890625, -0.0191650390625, 0.081298828125, 0.1817626953125, 0.2822265625, 0.3826904296875, 0.483154296875, 0.5836181640625, 0.68408203125, 0.7845458984375, 0.885009765625, 0.9854736328125, 1.0859375, 1.1864013671875, 1.286865234375, 1.3873291015625, 1.48779296875, 1.5882568359375, 1.688720703125, 1.7891845703125, 1.8896484375, 1.9901123046875, 2.090576171875, 2.1910400390625, 2.29150390625, 2.3919677734375, 2.492431640625, 2.5928955078125, 2.693359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 10.0, 15.0, 20.0, 25.0, 21.0, 30.0, 38.0, 45.0, 42.0, 46.0, 64.0, 50.0, 50.0, 58.0, 41.0, 59.0, 52.0, 55.0, 53.0, 43.0, 26.0, 32.0, 31.0, 14.0, 18.0, 12.0, 13.0, 10.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.3866119384765625, -1.345489501953125, -1.3043670654296875, -1.26324462890625, -1.2221221923828125, -1.180999755859375, -1.1398773193359375, -1.0987548828125, -1.0576324462890625, -1.016510009765625, -0.9753875732421875, -0.93426513671875, -0.8931427001953125, -0.852020263671875, -0.8108978271484375, -0.769775390625, -0.7286529541015625, -0.687530517578125, -0.6464080810546875, -0.60528564453125, -0.5641632080078125, -0.523040771484375, -0.4819183349609375, -0.4407958984375, -0.3996734619140625, -0.358551025390625, -0.3174285888671875, -0.27630615234375, -0.2351837158203125, -0.194061279296875, -0.1529388427734375, -0.11181640625, -0.0706939697265625, -0.029571533203125, 0.0115509033203125, 0.05267333984375, 0.0937957763671875, 0.134918212890625, 0.1760406494140625, 0.2171630859375, 0.2582855224609375, 0.299407958984375, 0.3405303955078125, 0.38165283203125, 0.4227752685546875, 0.463897705078125, 0.5050201416015625, 0.546142578125, 0.5872650146484375, 0.628387451171875, 0.6695098876953125, 0.71063232421875, 0.7517547607421875, 0.792877197265625, 0.8339996337890625, 0.8751220703125, 0.9162445068359375, 0.957366943359375, 0.9984893798828125, 1.03961181640625, 1.0807342529296875, 1.121856689453125, 1.1629791259765625, 1.2041015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 14.0, 19.0, 19.0, 43.0, 53.0, 80.0, 128.0, 170.0, 218.0, 357.0, 705.0, 1369.0, 3111.0, 9167.0, 37717.0, 425138.0, 3623473.0, 69730.0, 14411.0, 4361.0, 1770.0, 788.0, 516.0, 323.0, 189.0, 125.0, 71.0, 57.0, 47.0, 29.0, 23.0, 19.0, 8.0, 15.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.794921875, -2.69207763671875, -2.5892333984375, -2.48638916015625, -2.383544921875, -2.28070068359375, -2.1778564453125, -2.07501220703125, -1.97216796875, -1.86932373046875, -1.7664794921875, -1.66363525390625, -1.560791015625, -1.45794677734375, -1.3551025390625, -1.25225830078125, -1.1494140625, -1.04656982421875, -0.9437255859375, -0.84088134765625, -0.738037109375, -0.63519287109375, -0.5323486328125, -0.42950439453125, -0.32666015625, -0.22381591796875, -0.1209716796875, -0.01812744140625, 0.084716796875, 0.18756103515625, 0.2904052734375, 0.39324951171875, 0.49609375, 0.59893798828125, 0.7017822265625, 0.80462646484375, 0.907470703125, 1.01031494140625, 1.1131591796875, 1.21600341796875, 1.31884765625, 1.42169189453125, 1.5245361328125, 1.62738037109375, 1.730224609375, 1.83306884765625, 1.9359130859375, 2.03875732421875, 2.1416015625, 2.24444580078125, 2.3472900390625, 2.45013427734375, 2.552978515625, 2.65582275390625, 2.7586669921875, 2.86151123046875, 2.96435546875, 3.06719970703125, 3.1700439453125, 3.27288818359375, 3.375732421875, 3.47857666015625, 3.5814208984375, 3.68426513671875, 3.787109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 4.0, 11.0, 11.0, 25.0, 33.0, 78.0, 196.0, 2557.0, 831.0, 150.0, 50.0, 43.0, 30.0, 15.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9560546875, -1.8803558349609375, -1.804656982421875, -1.7289581298828125, -1.65325927734375, -1.5775604248046875, -1.501861572265625, -1.4261627197265625, -1.3504638671875, -1.2747650146484375, -1.199066162109375, -1.1233673095703125, -1.04766845703125, -0.9719696044921875, -0.896270751953125, -0.8205718994140625, -0.744873046875, -0.6691741943359375, -0.593475341796875, -0.5177764892578125, -0.44207763671875, -0.3663787841796875, -0.290679931640625, -0.2149810791015625, -0.1392822265625, -0.0635833740234375, 0.012115478515625, 0.0878143310546875, 0.16351318359375, 0.2392120361328125, 0.314910888671875, 0.3906097412109375, 0.46630859375, 0.5420074462890625, 0.617706298828125, 0.6934051513671875, 0.76910400390625, 0.8448028564453125, 0.920501708984375, 0.9962005615234375, 1.0718994140625, 1.1475982666015625, 1.223297119140625, 1.2989959716796875, 1.37469482421875, 1.4503936767578125, 1.526092529296875, 1.6017913818359375, 1.677490234375, 1.7531890869140625, 1.828887939453125, 1.9045867919921875, 1.98028564453125, 2.0559844970703125, 2.131683349609375, 2.2073822021484375, 2.2830810546875, 2.3587799072265625, 2.434478759765625, 2.5101776123046875, 2.58587646484375, 2.6615753173828125, 2.737274169921875, 2.8129730224609375, 2.888671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 44.0, 172.0, 366.0, 291.0, 92.0, 23.0, 11.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.947605133056641, -7.31705904006958, -6.686513423919678, -6.055967330932617, -5.425421714782715, -4.794875621795654, -4.164329528808594, -3.5337839126586914, -2.903237819671631, -2.2726919651031494, -1.6421459913253784, -1.0116000175476074, -0.381054162979126, 0.24949169158935547, 0.880037784576416, 1.5105834007263184, 2.141129493713379, 2.7716753482818604, 3.402221202850342, 4.032767295837402, 4.663312911987305, 5.293859004974365, 5.924405097961426, 6.554950714111328, 7.185496807098389, 7.816042900085449, 8.446588516235352, 9.07713508605957, 9.707680702209473, 10.338226318359375, 10.968772888183594, 11.59931755065918, 12.229864120483398, 12.8604097366333, 13.49095630645752, 14.121501922607422, 14.752047538757324, 15.382593154907227, 16.013139724731445, 16.64368438720703, 17.27423095703125, 17.90477752685547, 18.535322189331055, 19.165868759155273, 19.796415328979492, 20.426959991455078, 21.057506561279297, 21.688053131103516, 22.318599700927734, 22.949146270751953, 23.57969093322754, 24.210237503051758, 24.840784072875977, 25.471328735351562, 26.10187530517578, 26.732421875, 27.362966537475586, 27.993513107299805, 28.62405776977539, 29.25460433959961, 29.885150909423828, 30.515695571899414, 31.146242141723633, 31.77678680419922, 32.40733337402344]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 17.0, 19.0, 21.0, 23.0, 14.0, 20.0, 29.0, 32.0, 24.0, 34.0, 32.0, 52.0, 39.0, 31.0, 38.0, 45.0, 36.0, 42.0, 56.0, 37.0, 39.0, 34.0, 37.0, 32.0, 19.0, 31.0, 20.0, 21.0, 15.0, 13.0, 8.0, 10.0, 13.0, 5.0, 2.0, 7.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.228907585144043, -4.102432727813721, -3.9759578704833984, -3.849482774734497, -3.723007917404175, -3.5965330600738525, -3.470057964324951, -3.343583106994629, -3.2171082496643066, -3.0906333923339844, -2.964158535003662, -2.8376834392547607, -2.7112085819244385, -2.584733724594116, -2.458258628845215, -2.3317837715148926, -2.2053089141845703, -2.078834056854248, -1.9523590803146362, -1.8258841037750244, -1.6994092464447021, -1.5729343891143799, -1.446459412574768, -1.3199844360351562, -1.193509578704834, -1.0670347213745117, -0.9405597448348999, -0.8140848278999329, -0.6876099109649658, -0.5611349940299988, -0.43466007709503174, -0.3081851601600647, -0.18171072006225586, -0.05523580312728882, 0.07123911380767822, 0.19771403074264526, 0.3241889476776123, 0.45066386461257935, 0.5771387815475464, 0.7036136984825134, 0.8300886154174805, 0.9565635323524475, 1.0830384492874146, 1.2095134258270264, 1.3359882831573486, 1.462463140487671, 1.5889381170272827, 1.7154130935668945, 1.8418879508972168, 1.968362808227539, 2.0948376655578613, 2.2213127613067627, 2.347787618637085, 2.4742624759674072, 2.6007375717163086, 2.727212429046631, 2.853687286376953, 2.9801621437072754, 3.1066370010375977, 3.233112096786499, 3.3595869541168213, 3.4860618114471436, 3.612536907196045, 3.739011764526367, 3.8654866218566895]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 4.0, 9.0, 13.0, 18.0, 27.0, 39.0, 92.0, 116.0, 247.0, 442.0, 1034.0, 2541.0, 6634.0, 19694.0, 59457.0, 193888.0, 432443.0, 226469.0, 70049.0, 22398.0, 7763.0, 2869.0, 1219.0, 478.0, 257.0, 132.0, 72.0, 48.0, 23.0, 21.0, 20.0, 13.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.853515625, -2.770965576171875, -2.68841552734375, -2.605865478515625, -2.5233154296875, -2.440765380859375, -2.35821533203125, -2.275665283203125, -2.193115234375, -2.110565185546875, -2.02801513671875, -1.945465087890625, -1.8629150390625, -1.780364990234375, -1.69781494140625, -1.615264892578125, -1.53271484375, -1.450164794921875, -1.36761474609375, -1.285064697265625, -1.2025146484375, -1.119964599609375, -1.03741455078125, -0.954864501953125, -0.872314453125, -0.789764404296875, -0.70721435546875, -0.624664306640625, -0.5421142578125, -0.459564208984375, -0.37701416015625, -0.294464111328125, -0.2119140625, -0.129364013671875, -0.04681396484375, 0.035736083984375, 0.1182861328125, 0.200836181640625, 0.28338623046875, 0.365936279296875, 0.448486328125, 0.531036376953125, 0.61358642578125, 0.696136474609375, 0.7786865234375, 0.861236572265625, 0.94378662109375, 1.026336669921875, 1.10888671875, 1.191436767578125, 1.27398681640625, 1.356536865234375, 1.4390869140625, 1.521636962890625, 1.60418701171875, 1.686737060546875, 1.769287109375, 1.851837158203125, 1.93438720703125, 2.016937255859375, 2.0994873046875, 2.182037353515625, 2.26458740234375, 2.347137451171875, 2.4296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 10.0, 14.0, 14.0, 24.0, 18.0, 35.0, 31.0, 40.0, 45.0, 49.0, 61.0, 41.0, 52.0, 70.0, 59.0, 49.0, 59.0, 55.0, 47.0, 41.0, 33.0, 27.0, 21.0, 24.0, 16.0, 14.0, 11.0, 14.0, 8.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.38525390625, -1.341796875, -1.29833984375, -1.2548828125, -1.21142578125, -1.16796875, -1.12451171875, -1.0810546875, -1.03759765625, -0.994140625, -0.95068359375, -0.9072265625, -0.86376953125, -0.8203125, -0.77685546875, -0.7333984375, -0.68994140625, -0.646484375, -0.60302734375, -0.5595703125, -0.51611328125, -0.47265625, -0.42919921875, -0.3857421875, -0.34228515625, -0.298828125, -0.25537109375, -0.2119140625, -0.16845703125, -0.125, -0.08154296875, -0.0380859375, 0.00537109375, 0.048828125, 0.09228515625, 0.1357421875, 0.17919921875, 0.22265625, 0.26611328125, 0.3095703125, 0.35302734375, 0.396484375, 0.43994140625, 0.4833984375, 0.52685546875, 0.5703125, 0.61376953125, 0.6572265625, 0.70068359375, 0.744140625, 0.78759765625, 0.8310546875, 0.87451171875, 0.91796875, 0.96142578125, 1.0048828125, 1.04833984375, 1.091796875, 1.13525390625, 1.1787109375, 1.22216796875, 1.265625, 1.30908203125, 1.3525390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 13.0, 9.0, 16.0, 36.0, 55.0, 100.0, 137.0, 319.0, 695.0, 2226.0, 8169.0, 48740.0, 456057.0, 469934.0, 49883.0, 8534.0, 2190.0, 757.0, 317.0, 135.0, 61.0, 59.0, 45.0, 25.0, 19.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.49658203125, -4.3603515625, -4.22412109375, -4.087890625, -3.95166015625, -3.8154296875, -3.67919921875, -3.54296875, -3.40673828125, -3.2705078125, -3.13427734375, -2.998046875, -2.86181640625, -2.7255859375, -2.58935546875, -2.453125, -2.31689453125, -2.1806640625, -2.04443359375, -1.908203125, -1.77197265625, -1.6357421875, -1.49951171875, -1.36328125, -1.22705078125, -1.0908203125, -0.95458984375, -0.818359375, -0.68212890625, -0.5458984375, -0.40966796875, -0.2734375, -0.13720703125, -0.0009765625, 0.13525390625, 0.271484375, 0.40771484375, 0.5439453125, 0.68017578125, 0.81640625, 0.95263671875, 1.0888671875, 1.22509765625, 1.361328125, 1.49755859375, 1.6337890625, 1.77001953125, 1.90625, 2.04248046875, 2.1787109375, 2.31494140625, 2.451171875, 2.58740234375, 2.7236328125, 2.85986328125, 2.99609375, 3.13232421875, 3.2685546875, 3.40478515625, 3.541015625, 3.67724609375, 3.8134765625, 3.94970703125, 4.0859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 9.0, 4.0, 8.0, 13.0, 17.0, 16.0, 20.0, 21.0, 45.0, 33.0, 41.0, 37.0, 42.0, 59.0, 65.0, 50.0, 53.0, 38.0, 52.0, 45.0, 45.0, 54.0, 32.0, 29.0, 24.0, 35.0, 20.0, 18.0, 8.0, 17.0, 13.0, 6.0, 2.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.39129638671875, -5.2122802734375, -5.03326416015625, -4.854248046875, -4.67523193359375, -4.4962158203125, -4.31719970703125, -4.13818359375, -3.95916748046875, -3.7801513671875, -3.60113525390625, -3.422119140625, -3.24310302734375, -3.0640869140625, -2.88507080078125, -2.7060546875, -2.52703857421875, -2.3480224609375, -2.16900634765625, -1.989990234375, -1.81097412109375, -1.6319580078125, -1.45294189453125, -1.27392578125, -1.09490966796875, -0.9158935546875, -0.73687744140625, -0.557861328125, -0.37884521484375, -0.1998291015625, -0.02081298828125, 0.158203125, 0.33721923828125, 0.5162353515625, 0.69525146484375, 0.874267578125, 1.05328369140625, 1.2322998046875, 1.41131591796875, 1.59033203125, 1.76934814453125, 1.9483642578125, 2.12738037109375, 2.306396484375, 2.48541259765625, 2.6644287109375, 2.84344482421875, 3.0224609375, 3.20147705078125, 3.3804931640625, 3.55950927734375, 3.738525390625, 3.91754150390625, 4.0965576171875, 4.27557373046875, 4.45458984375, 4.63360595703125, 4.8126220703125, 4.99163818359375, 5.170654296875, 5.34967041015625, 5.5286865234375, 5.70770263671875, 5.88671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 6.0, 9.0, 10.0, 15.0, 14.0, 34.0, 42.0, 70.0, 98.0, 164.0, 310.0, 486.0, 697.0, 1184.0, 1986.0, 3733.0, 8238.0, 23471.0, 127525.0, 727740.0, 114146.0, 22056.0, 7798.0, 3633.0, 1958.0, 1175.0, 721.0, 436.0, 275.0, 167.0, 116.0, 57.0, 64.0, 32.0, 23.0, 16.0, 12.0, 11.0, 5.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.904296875, -1.8437957763671875, -1.783294677734375, -1.7227935791015625, -1.66229248046875, -1.6017913818359375, -1.541290283203125, -1.4807891845703125, -1.4202880859375, -1.3597869873046875, -1.299285888671875, -1.2387847900390625, -1.17828369140625, -1.1177825927734375, -1.057281494140625, -0.9967803955078125, -0.936279296875, -0.8757781982421875, -0.815277099609375, -0.7547760009765625, -0.69427490234375, -0.6337738037109375, -0.573272705078125, -0.5127716064453125, -0.4522705078125, -0.3917694091796875, -0.331268310546875, -0.2707672119140625, -0.21026611328125, -0.1497650146484375, -0.089263916015625, -0.0287628173828125, 0.03173828125, 0.0922393798828125, 0.152740478515625, 0.2132415771484375, 0.27374267578125, 0.3342437744140625, 0.394744873046875, 0.4552459716796875, 0.5157470703125, 0.5762481689453125, 0.636749267578125, 0.6972503662109375, 0.75775146484375, 0.8182525634765625, 0.878753662109375, 0.9392547607421875, 0.999755859375, 1.0602569580078125, 1.120758056640625, 1.1812591552734375, 1.24176025390625, 1.3022613525390625, 1.362762451171875, 1.4232635498046875, 1.4837646484375, 1.5442657470703125, 1.604766845703125, 1.6652679443359375, 1.72576904296875, 1.7862701416015625, 1.846771240234375, 1.9072723388671875, 1.9677734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 10.0, 1.0, 8.0, 21.0, 34.0, 54.0, 94.0, 152.0, 198.0, 171.0, 94.0, 48.0, 27.0, 35.0, 15.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00035643577575683594, -0.00034194812178611755, -0.00032746046781539917, -0.0003129728138446808, -0.0002984851598739624, -0.000283997505903244, -0.00026950985193252563, -0.00025502219796180725, -0.00024053454399108887, -0.00022604689002037048, -0.0002115592360496521, -0.00019707158207893372, -0.00018258392810821533, -0.00016809627413749695, -0.00015360862016677856, -0.00013912096619606018, -0.0001246333122253418, -0.00011014565825462341, -9.565800428390503e-05, -8.117035031318665e-05, -6.668269634246826e-05, -5.219504237174988e-05, -3.7707388401031494e-05, -2.321973443031311e-05, -8.732080459594727e-06, 5.755573511123657e-06, 2.024322748184204e-05, 3.4730881452560425e-05, 4.921853542327881e-05, 6.370618939399719e-05, 7.819384336471558e-05, 9.268149733543396e-05, 0.00010716915130615234, 0.00012165680527687073, 0.0001361444592475891, 0.0001506321132183075, 0.00016511976718902588, 0.00017960742115974426, 0.00019409507513046265, 0.00020858272910118103, 0.00022307038307189941, 0.0002375580370426178, 0.0002520456910133362, 0.00026653334498405457, 0.00028102099895477295, 0.00029550865292549133, 0.0003099963068962097, 0.0003244839608669281, 0.0003389716148376465, 0.00035345926880836487, 0.00036794692277908325, 0.00038243457674980164, 0.00039692223072052, 0.0004114098846912384, 0.0004258975386619568, 0.00044038519263267517, 0.00045487284660339355, 0.00046936050057411194, 0.0004838481545448303, 0.0004983358085155487, 0.0005128234624862671, 0.0005273111164569855, 0.0005417987704277039, 0.0005562864243984222, 0.0005707740783691406]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 9.0, 23.0, 23.0, 24.0, 52.0, 56.0, 90.0, 150.0, 229.0, 388.0, 627.0, 1039.0, 2043.0, 4161.0, 10212.0, 36862.0, 280605.0, 604710.0, 78591.0, 16537.0, 6003.0, 2684.0, 1385.0, 792.0, 430.0, 281.0, 175.0, 133.0, 71.0, 54.0, 38.0, 21.0, 17.0, 10.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.037109375, -1.9792633056640625, -1.921417236328125, -1.8635711669921875, -1.80572509765625, -1.7478790283203125, -1.690032958984375, -1.6321868896484375, -1.5743408203125, -1.5164947509765625, -1.458648681640625, -1.4008026123046875, -1.34295654296875, -1.2851104736328125, -1.227264404296875, -1.1694183349609375, -1.111572265625, -1.0537261962890625, -0.995880126953125, -0.9380340576171875, -0.88018798828125, -0.8223419189453125, -0.764495849609375, -0.7066497802734375, -0.6488037109375, -0.5909576416015625, -0.533111572265625, -0.4752655029296875, -0.41741943359375, -0.3595733642578125, -0.301727294921875, -0.2438812255859375, -0.18603515625, -0.1281890869140625, -0.070343017578125, -0.0124969482421875, 0.04534912109375, 0.1031951904296875, 0.161041259765625, 0.2188873291015625, 0.2767333984375, 0.3345794677734375, 0.392425537109375, 0.4502716064453125, 0.50811767578125, 0.5659637451171875, 0.623809814453125, 0.6816558837890625, 0.739501953125, 0.7973480224609375, 0.855194091796875, 0.9130401611328125, 0.97088623046875, 1.0287322998046875, 1.086578369140625, 1.1444244384765625, 1.2022705078125, 1.2601165771484375, 1.317962646484375, 1.3758087158203125, 1.43365478515625, 1.4915008544921875, 1.549346923828125, 1.6071929931640625, 1.6650390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 12.0, 11.0, 11.0, 20.0, 22.0, 46.0, 63.0, 104.0, 116.0, 145.0, 148.0, 90.0, 66.0, 43.0, 23.0, 21.0, 17.0, 13.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.1796875, -3.10321044921875, -3.0267333984375, -2.95025634765625, -2.873779296875, -2.79730224609375, -2.7208251953125, -2.64434814453125, -2.56787109375, -2.49139404296875, -2.4149169921875, -2.33843994140625, -2.261962890625, -2.18548583984375, -2.1090087890625, -2.03253173828125, -1.9560546875, -1.87957763671875, -1.8031005859375, -1.72662353515625, -1.650146484375, -1.57366943359375, -1.4971923828125, -1.42071533203125, -1.34423828125, -1.26776123046875, -1.1912841796875, -1.11480712890625, -1.038330078125, -0.96185302734375, -0.8853759765625, -0.80889892578125, -0.732421875, -0.65594482421875, -0.5794677734375, -0.50299072265625, -0.426513671875, -0.35003662109375, -0.2735595703125, -0.19708251953125, -0.12060546875, -0.04412841796875, 0.0323486328125, 0.10882568359375, 0.185302734375, 0.26177978515625, 0.3382568359375, 0.41473388671875, 0.4912109375, 0.56768798828125, 0.6441650390625, 0.72064208984375, 0.797119140625, 0.87359619140625, 0.9500732421875, 1.02655029296875, 1.10302734375, 1.17950439453125, 1.2559814453125, 1.33245849609375, 1.408935546875, 1.48541259765625, 1.5618896484375, 1.63836669921875, 1.71484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 6.0, 11.0, 11.0, 28.0, 38.0, 50.0, 77.0, 104.0, 95.0, 121.0, 109.0, 92.0, 64.0, 55.0, 38.0, 25.0, 23.0, 14.0, 13.0, 8.0, 7.0, 2.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.11834144592285, -21.469161987304688, -20.819982528686523, -20.170801162719727, -19.521621704101562, -18.8724422454834, -18.223262786865234, -17.57408332824707, -16.924903869628906, -16.275724411010742, -15.626543998718262, -14.977364540100098, -14.328184127807617, -13.679004669189453, -13.029825210571289, -12.380645751953125, -11.731464385986328, -11.082284927368164, -10.433104515075684, -9.78392505645752, -9.134744644165039, -8.485565185546875, -7.836385726928711, -7.187205791473389, -6.538025856018066, -5.888845920562744, -5.239665985107422, -4.590486526489258, -3.9413065910339355, -3.2921266555786133, -2.64294695854187, -1.993767261505127, -1.3445873260498047, -0.695407509803772, -0.04622769355773926, 0.6029521226882935, 1.2521319389343262, 1.9013118743896484, 2.5504915714263916, 3.1996712684631348, 3.848851203918457, 4.498031139373779, 5.147211074829102, 5.796390533447266, 6.445570468902588, 7.09475040435791, 7.743929862976074, 8.393110275268555, 9.042289733886719, 9.691469192504883, 10.340649604797363, 10.989829063415527, 11.639009475708008, 12.288188934326172, 12.937368392944336, 13.5865478515625, 14.23572826385498, 14.884907722473145, 15.534088134765625, 16.18326759338379, 16.832447052001953, 17.48162841796875, 18.130807876586914, 18.779987335205078, 19.429166793823242]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 2.0, 9.0, 15.0, 9.0, 13.0, 16.0, 23.0, 19.0, 27.0, 27.0, 32.0, 30.0, 36.0, 34.0, 37.0, 39.0, 42.0, 61.0, 52.0, 54.0, 43.0, 39.0, 48.0, 33.0, 33.0, 39.0, 27.0, 26.0, 21.0, 20.0, 14.0, 14.0, 12.0, 8.0, 7.0, 10.0, 6.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.519367218017578, -29.607492446899414, -28.695619583129883, -27.78374481201172, -26.871871948242188, -25.959997177124023, -25.04812240600586, -24.136249542236328, -23.224374771118164, -22.3125, -21.40062713623047, -20.488752365112305, -19.57687759399414, -18.66500473022461, -17.753129959106445, -16.84125518798828, -15.92938232421875, -15.017508506774902, -14.105634689331055, -13.19375991821289, -12.281886100769043, -11.370012283325195, -10.458137512207031, -9.546263694763184, -8.634389877319336, -7.722516059875488, -6.810641765594482, -5.898767471313477, -4.986893653869629, -4.075019836425781, -3.1631455421447754, -2.2512712478637695, -1.3393974304199219, -0.4275233745574951, 0.48435068130493164, 1.3962247371673584, 2.308098793029785, 3.219972610473633, 4.131846904754639, 5.0437211990356445, 5.955595016479492, 6.86746883392334, 7.779343128204346, 8.691217422485352, 9.6030912399292, 10.514965057373047, 11.426839828491211, 12.338713645935059, 13.250587463378906, 14.162461280822754, 15.074335098266602, 15.986209869384766, 16.898082733154297, 17.80995750427246, 18.721832275390625, 19.633705139160156, 20.54557991027832, 21.457454681396484, 22.369327545166016, 23.28120231628418, 24.193077087402344, 25.104949951171875, 26.01682472229004, 26.928699493408203, 27.840572357177734]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 7.0, 7.0, 10.0, 8.0, 23.0, 29.0, 30.0, 43.0, 68.0, 111.0, 186.0, 341.0, 684.0, 1269.0, 2869.0, 7775.0, 41204.0, 4097025.0, 30619.0, 6601.0, 2629.0, 1269.0, 585.0, 336.0, 207.0, 119.0, 73.0, 46.0, 44.0, 22.0, 8.0, 10.0, 5.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.96875, -3.850067138671875, -3.73138427734375, -3.612701416015625, -3.4940185546875, -3.375335693359375, -3.25665283203125, -3.137969970703125, -3.019287109375, -2.900604248046875, -2.78192138671875, -2.663238525390625, -2.5445556640625, -2.425872802734375, -2.30718994140625, -2.188507080078125, -2.06982421875, -1.951141357421875, -1.83245849609375, -1.713775634765625, -1.5950927734375, -1.476409912109375, -1.35772705078125, -1.239044189453125, -1.120361328125, -1.001678466796875, -0.88299560546875, -0.764312744140625, -0.6456298828125, -0.526947021484375, -0.40826416015625, -0.289581298828125, -0.1708984375, -0.052215576171875, 0.06646728515625, 0.185150146484375, 0.3038330078125, 0.422515869140625, 0.54119873046875, 0.659881591796875, 0.778564453125, 0.897247314453125, 1.01593017578125, 1.134613037109375, 1.2532958984375, 1.371978759765625, 1.49066162109375, 1.609344482421875, 1.72802734375, 1.846710205078125, 1.96539306640625, 2.084075927734375, 2.2027587890625, 2.321441650390625, 2.44012451171875, 2.558807373046875, 2.677490234375, 2.796173095703125, 2.91485595703125, 3.033538818359375, 3.1522216796875, 3.270904541015625, 3.38958740234375, 3.508270263671875, 3.626953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 11.0, 13.0, 15.0, 13.0, 20.0, 27.0, 24.0, 37.0, 32.0, 31.0, 34.0, 49.0, 42.0, 45.0, 59.0, 58.0, 38.0, 37.0, 53.0, 39.0, 34.0, 38.0, 39.0, 31.0, 23.0, 20.0, 24.0, 22.0, 10.0, 9.0, 12.0, 9.0, 8.0, 6.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.4091796875, -1.3635406494140625, -1.317901611328125, -1.2722625732421875, -1.22662353515625, -1.1809844970703125, -1.135345458984375, -1.0897064208984375, -1.0440673828125, -0.9984283447265625, -0.952789306640625, -0.9071502685546875, -0.86151123046875, -0.8158721923828125, -0.770233154296875, -0.7245941162109375, -0.678955078125, -0.6333160400390625, -0.587677001953125, -0.5420379638671875, -0.49639892578125, -0.4507598876953125, -0.405120849609375, -0.3594818115234375, -0.3138427734375, -0.2682037353515625, -0.222564697265625, -0.1769256591796875, -0.13128662109375, -0.0856475830078125, -0.040008544921875, 0.0056304931640625, 0.05126953125, 0.0969085693359375, 0.142547607421875, 0.1881866455078125, 0.23382568359375, 0.2794647216796875, 0.325103759765625, 0.3707427978515625, 0.4163818359375, 0.4620208740234375, 0.507659912109375, 0.5532989501953125, 0.59893798828125, 0.6445770263671875, 0.690216064453125, 0.7358551025390625, 0.781494140625, 0.8271331787109375, 0.872772216796875, 0.9184112548828125, 0.96405029296875, 1.0096893310546875, 1.055328369140625, 1.1009674072265625, 1.1466064453125, 1.1922454833984375, 1.237884521484375, 1.2835235595703125, 1.32916259765625, 1.3748016357421875, 1.420440673828125, 1.4660797119140625, 1.51171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 22.0, 32.0, 26.0, 37.0, 48.0, 86.0, 128.0, 212.0, 294.0, 577.0, 892.0, 1639.0, 3117.0, 6928.0, 21678.0, 228040.0, 3883949.0, 29829.0, 8563.0, 3646.0, 1855.0, 1005.0, 564.0, 381.0, 240.0, 154.0, 82.0, 70.0, 44.0, 27.0, 19.0, 10.0, 8.0, 9.0, 9.0, 4.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.638671875, -2.551025390625, -2.46337890625, -2.375732421875, -2.2880859375, -2.200439453125, -2.11279296875, -2.025146484375, -1.9375, -1.849853515625, -1.76220703125, -1.674560546875, -1.5869140625, -1.499267578125, -1.41162109375, -1.323974609375, -1.236328125, -1.148681640625, -1.06103515625, -0.973388671875, -0.8857421875, -0.798095703125, -0.71044921875, -0.622802734375, -0.53515625, -0.447509765625, -0.35986328125, -0.272216796875, -0.1845703125, -0.096923828125, -0.00927734375, 0.078369140625, 0.166015625, 0.253662109375, 0.34130859375, 0.428955078125, 0.5166015625, 0.604248046875, 0.69189453125, 0.779541015625, 0.8671875, 0.954833984375, 1.04248046875, 1.130126953125, 1.2177734375, 1.305419921875, 1.39306640625, 1.480712890625, 1.568359375, 1.656005859375, 1.74365234375, 1.831298828125, 1.9189453125, 2.006591796875, 2.09423828125, 2.181884765625, 2.26953125, 2.357177734375, 2.44482421875, 2.532470703125, 2.6201171875, 2.707763671875, 2.79541015625, 2.883056640625, 2.970703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 4.0, 11.0, 19.0, 28.0, 60.0, 258.0, 3468.0, 100.0, 31.0, 23.0, 15.0, 11.0, 6.0, 6.0, 0.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7099609375, -0.689208984375, -0.66845703125, -0.647705078125, -0.626953125, -0.606201171875, -0.58544921875, -0.564697265625, -0.5439453125, -0.523193359375, -0.50244140625, -0.481689453125, -0.4609375, -0.440185546875, -0.41943359375, -0.398681640625, -0.3779296875, -0.357177734375, -0.33642578125, -0.315673828125, -0.294921875, -0.274169921875, -0.25341796875, -0.232666015625, -0.2119140625, -0.191162109375, -0.17041015625, -0.149658203125, -0.12890625, -0.108154296875, -0.08740234375, -0.066650390625, -0.0458984375, -0.025146484375, -0.00439453125, 0.016357421875, 0.037109375, 0.057861328125, 0.07861328125, 0.099365234375, 0.1201171875, 0.140869140625, 0.16162109375, 0.182373046875, 0.203125, 0.223876953125, 0.24462890625, 0.265380859375, 0.2861328125, 0.306884765625, 0.32763671875, 0.348388671875, 0.369140625, 0.389892578125, 0.41064453125, 0.431396484375, 0.4521484375, 0.472900390625, 0.49365234375, 0.514404296875, 0.53515625, 0.555908203125, 0.57666015625, 0.597412109375, 0.6181640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 8.0, 11.0, 20.0, 27.0, 57.0, 86.0, 100.0, 141.0, 111.0, 134.0, 118.0, 73.0, 45.0, 27.0, 17.0, 9.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.56059193611145, -3.487452745437622, -3.414313554763794, -3.341174602508545, -3.268035411834717, -3.1948962211608887, -3.1217570304870605, -3.0486178398132324, -2.9754786491394043, -2.902339458465576, -2.829200267791748, -2.75606107711792, -2.682922124862671, -2.6097829341888428, -2.5366437435150146, -2.4635045528411865, -2.3903656005859375, -2.3172264099121094, -2.2440872192382812, -2.170948028564453, -2.097809076309204, -2.024669885635376, -1.9515306949615479, -1.8783915042877197, -1.8052523136138916, -1.7321131229400635, -1.658974051475525, -1.5858348608016968, -1.5126956701278687, -1.43955659866333, -1.366417407989502, -1.2932782173156738, -1.2201390266418457, -1.1469998359680176, -1.073860764503479, -1.0007215738296509, -0.9275823831558228, -0.8544432520866394, -0.781304121017456, -0.7081649303436279, -0.6350257992744446, -0.5618866682052612, -0.4887474775314331, -0.41560834646224976, -0.342469185590744, -0.2693300247192383, -0.19619089365005493, -0.1230517029762268, -0.04991257190704346, 0.023226581513881683, 0.09636573493480682, 0.16950488090515137, 0.2426440417766571, 0.31578320264816284, 0.3889223337173462, 0.4620615243911743, 0.5352006554603577, 0.608339786529541, 0.6814789772033691, 0.7546181082725525, 0.8277572393417358, 0.900896430015564, 0.9740355610847473, 1.0471746921539307, 1.1203138828277588]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 5.0, 5.0, 15.0, 15.0, 10.0, 16.0, 16.0, 19.0, 25.0, 17.0, 36.0, 27.0, 39.0, 49.0, 49.0, 49.0, 42.0, 39.0, 46.0, 43.0, 46.0, 46.0, 31.0, 48.0, 37.0, 29.0, 17.0, 25.0, 25.0, 27.0, 19.0, 10.0, 11.0, 6.0, 13.0, 5.0, 6.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0735180377960205, -1.0398602485656738, -1.0062024593353271, -0.9725446105003357, -0.9388867616653442, -0.9052289724349976, -0.8715711832046509, -0.8379133343696594, -0.804255485534668, -0.7705976963043213, -0.7369398474693298, -0.7032820582389832, -0.6696242094039917, -0.635966420173645, -0.6023086309432983, -0.5686507821083069, -0.5349929928779602, -0.5013352036476135, -0.46767735481262207, -0.4340195655822754, -0.40036171674728394, -0.36670392751693726, -0.3330461084842682, -0.2993882894515991, -0.26573047041893005, -0.232072651386261, -0.19841483235359192, -0.16475702822208405, -0.13109920918941498, -0.09744139015674591, -0.06378358602523804, -0.03012576699256897, 0.0035320520401000977, 0.03718986734747887, 0.07084768265485764, 0.1045054942369461, 0.13816331326961517, 0.17182113230228424, 0.20547893643379211, 0.23913675546646118, 0.27279457449913025, 0.3064523935317993, 0.3401102125644684, 0.37376803159713745, 0.40742582082748413, 0.4410836696624756, 0.47474145889282227, 0.508399248123169, 0.5420570969581604, 0.5757148861885071, 0.6093727350234985, 0.6430305242538452, 0.6766883730888367, 0.7103461623191833, 0.7440040111541748, 0.7776618003845215, 0.8113195896148682, 0.8449773788452148, 0.8786352276802063, 0.912293016910553, 0.9459508657455444, 0.9796086549758911, 1.0132664442062378, 1.046924352645874, 1.0805821418762207]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 7.0, 16.0, 22.0, 38.0, 51.0, 80.0, 134.0, 202.0, 347.0, 731.0, 1364.0, 3135.0, 6939.0, 16819.0, 44847.0, 127386.0, 325241.0, 322762.0, 124641.0, 44183.0, 16683.0, 6814.0, 3125.0, 1385.0, 633.0, 408.0, 185.0, 141.0, 91.0, 44.0, 34.0, 16.0, 15.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.353179931640625, -2.27471923828125, -2.196258544921875, -2.1177978515625, -2.039337158203125, -1.96087646484375, -1.882415771484375, -1.803955078125, -1.725494384765625, -1.64703369140625, -1.568572998046875, -1.4901123046875, -1.411651611328125, -1.33319091796875, -1.254730224609375, -1.17626953125, -1.097808837890625, -1.01934814453125, -0.940887451171875, -0.8624267578125, -0.783966064453125, -0.70550537109375, -0.627044677734375, -0.548583984375, -0.470123291015625, -0.39166259765625, -0.313201904296875, -0.2347412109375, -0.156280517578125, -0.07781982421875, 0.000640869140625, 0.0791015625, 0.157562255859375, 0.23602294921875, 0.314483642578125, 0.3929443359375, 0.471405029296875, 0.54986572265625, 0.628326416015625, 0.706787109375, 0.785247802734375, 0.86370849609375, 0.942169189453125, 1.0206298828125, 1.099090576171875, 1.17755126953125, 1.256011962890625, 1.33447265625, 1.412933349609375, 1.49139404296875, 1.569854736328125, 1.6483154296875, 1.726776123046875, 1.80523681640625, 1.883697509765625, 1.962158203125, 2.040618896484375, 2.11907958984375, 2.197540283203125, 2.2760009765625, 2.354461669921875, 2.43292236328125, 2.511383056640625, 2.58984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 18.0, 15.0, 15.0, 25.0, 27.0, 31.0, 34.0, 33.0, 35.0, 42.0, 40.0, 45.0, 45.0, 44.0, 53.0, 56.0, 50.0, 44.0, 33.0, 35.0, 44.0, 35.0, 23.0, 18.0, 18.0, 30.0, 15.0, 9.0, 12.0, 9.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.4501953125, -1.40374755859375, -1.3572998046875, -1.31085205078125, -1.264404296875, -1.21795654296875, -1.1715087890625, -1.12506103515625, -1.07861328125, -1.03216552734375, -0.9857177734375, -0.93927001953125, -0.892822265625, -0.84637451171875, -0.7999267578125, -0.75347900390625, -0.70703125, -0.66058349609375, -0.6141357421875, -0.56768798828125, -0.521240234375, -0.47479248046875, -0.4283447265625, -0.38189697265625, -0.33544921875, -0.28900146484375, -0.2425537109375, -0.19610595703125, -0.149658203125, -0.10321044921875, -0.0567626953125, -0.01031494140625, 0.0361328125, 0.08258056640625, 0.1290283203125, 0.17547607421875, 0.221923828125, 0.26837158203125, 0.3148193359375, 0.36126708984375, 0.40771484375, 0.45416259765625, 0.5006103515625, 0.54705810546875, 0.593505859375, 0.63995361328125, 0.6864013671875, 0.73284912109375, 0.779296875, 0.82574462890625, 0.8721923828125, 0.91864013671875, 0.965087890625, 1.01153564453125, 1.0579833984375, 1.10443115234375, 1.15087890625, 1.19732666015625, 1.2437744140625, 1.29022216796875, 1.336669921875, 1.38311767578125, 1.4295654296875, 1.47601318359375, 1.5224609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 18.0, 20.0, 14.0, 37.0, 46.0, 61.0, 87.0, 157.0, 236.0, 452.0, 1172.0, 3520.0, 15782.0, 114107.0, 725454.0, 160040.0, 20469.0, 4313.0, 1374.0, 480.0, 247.0, 142.0, 102.0, 51.0, 52.0, 34.0, 27.0, 23.0, 8.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.72698974609375, -4.5555419921875, -4.38409423828125, -4.212646484375, -4.04119873046875, -3.8697509765625, -3.69830322265625, -3.52685546875, -3.35540771484375, -3.1839599609375, -3.01251220703125, -2.841064453125, -2.66961669921875, -2.4981689453125, -2.32672119140625, -2.1552734375, -1.98382568359375, -1.8123779296875, -1.64093017578125, -1.469482421875, -1.29803466796875, -1.1265869140625, -0.95513916015625, -0.78369140625, -0.61224365234375, -0.4407958984375, -0.26934814453125, -0.097900390625, 0.07354736328125, 0.2449951171875, 0.41644287109375, 0.587890625, 0.75933837890625, 0.9307861328125, 1.10223388671875, 1.273681640625, 1.44512939453125, 1.6165771484375, 1.78802490234375, 1.95947265625, 2.13092041015625, 2.3023681640625, 2.47381591796875, 2.645263671875, 2.81671142578125, 2.9881591796875, 3.15960693359375, 3.3310546875, 3.50250244140625, 3.6739501953125, 3.84539794921875, 4.016845703125, 4.18829345703125, 4.3597412109375, 4.53118896484375, 4.70263671875, 4.87408447265625, 5.0455322265625, 5.21697998046875, 5.388427734375, 5.55987548828125, 5.7313232421875, 5.90277099609375, 6.07421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 8.0, 10.0, 20.0, 28.0, 35.0, 41.0, 60.0, 76.0, 91.0, 80.0, 89.0, 110.0, 71.0, 64.0, 48.0, 44.0, 38.0, 29.0, 25.0, 14.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.550048828125, -18.11572265625, -17.681396484375, -17.2470703125, -16.812744140625, -16.37841796875, -15.944091796875, -15.509765625, -15.075439453125, -14.64111328125, -14.206787109375, -13.7724609375, -13.338134765625, -12.90380859375, -12.469482421875, -12.03515625, -11.600830078125, -11.16650390625, -10.732177734375, -10.2978515625, -9.863525390625, -9.42919921875, -8.994873046875, -8.560546875, -8.126220703125, -7.69189453125, -7.257568359375, -6.8232421875, -6.388916015625, -5.95458984375, -5.520263671875, -5.0859375, -4.651611328125, -4.21728515625, -3.782958984375, -3.3486328125, -2.914306640625, -2.47998046875, -2.045654296875, -1.611328125, -1.177001953125, -0.74267578125, -0.308349609375, 0.1259765625, 0.560302734375, 0.99462890625, 1.428955078125, 1.86328125, 2.297607421875, 2.73193359375, 3.166259765625, 3.6005859375, 4.034912109375, 4.46923828125, 4.903564453125, 5.337890625, 5.772216796875, 6.20654296875, 6.640869140625, 7.0751953125, 7.509521484375, 7.94384765625, 8.378173828125, 8.8125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 14.0, 16.0, 24.0, 78.0, 244.0, 785.0, 12452.0, 1031163.0, 3061.0, 440.0, 166.0, 67.0, 20.0, 11.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.140625, -11.67919921875, -11.2177734375, -10.75634765625, -10.294921875, -9.83349609375, -9.3720703125, -8.91064453125, -8.44921875, -7.98779296875, -7.5263671875, -7.06494140625, -6.603515625, -6.14208984375, -5.6806640625, -5.21923828125, -4.7578125, -4.29638671875, -3.8349609375, -3.37353515625, -2.912109375, -2.45068359375, -1.9892578125, -1.52783203125, -1.06640625, -0.60498046875, -0.1435546875, 0.31787109375, 0.779296875, 1.24072265625, 1.7021484375, 2.16357421875, 2.625, 3.08642578125, 3.5478515625, 4.00927734375, 4.470703125, 4.93212890625, 5.3935546875, 5.85498046875, 6.31640625, 6.77783203125, 7.2392578125, 7.70068359375, 8.162109375, 8.62353515625, 9.0849609375, 9.54638671875, 10.0078125, 10.46923828125, 10.9306640625, 11.39208984375, 11.853515625, 12.31494140625, 12.7763671875, 13.23779296875, 13.69921875, 14.16064453125, 14.6220703125, 15.08349609375, 15.544921875, 16.00634765625, 16.4677734375, 16.92919921875, 17.390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 14.0, 9.0, 18.0, 22.0, 21.0, 23.0, 53.0, 69.0, 70.0, 99.0, 135.0, 111.0, 79.0, 66.0, 48.0, 38.0, 42.0, 23.0, 11.0, 14.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.000293731689453125, -0.0002834908664226532, -0.0002732500433921814, -0.0002630092203617096, -0.0002527683973312378, -0.000242527574300766, -0.0002322867512702942, -0.0002220459282398224, -0.00021180510520935059, -0.00020156428217887878, -0.00019132345914840698, -0.00018108263611793518, -0.00017084181308746338, -0.00016060099005699158, -0.00015036016702651978, -0.00014011934399604797, -0.00012987852096557617, -0.00011963769793510437, -0.00010939687490463257, -9.915605187416077e-05, -8.891522884368896e-05, -7.867440581321716e-05, -6.843358278274536e-05, -5.819275975227356e-05, -4.795193672180176e-05, -3.7711113691329956e-05, -2.7470290660858154e-05, -1.7229467630386353e-05, -6.988644599914551e-06, 3.252178430557251e-06, 1.3493001461029053e-05, 2.3733824491500854e-05, 3.3974647521972656e-05, 4.421547055244446e-05, 5.445629358291626e-05, 6.469711661338806e-05, 7.493793964385986e-05, 8.517876267433167e-05, 9.541958570480347e-05, 0.00010566040873527527, 0.00011590123176574707, 0.00012614205479621887, 0.00013638287782669067, 0.00014662370085716248, 0.00015686452388763428, 0.00016710534691810608, 0.00017734616994857788, 0.00018758699297904968, 0.00019782781600952148, 0.00020806863903999329, 0.0002183094620704651, 0.0002285502851009369, 0.0002387911081314087, 0.0002490319311618805, 0.0002592727541923523, 0.0002695135772228241, 0.0002797544002532959, 0.0002899952232837677, 0.0003002360463142395, 0.0003104768693447113, 0.0003207176923751831, 0.0003309585154056549, 0.0003411993384361267, 0.0003514401614665985, 0.0003616809844970703]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 1.0, 3.0, 9.0, 5.0, 12.0, 17.0, 24.0, 30.0, 44.0, 71.0, 115.0, 192.0, 379.0, 800.0, 2133.0, 7218.0, 43392.0, 686797.0, 279576.0, 20339.0, 4554.0, 1445.0, 624.0, 316.0, 179.0, 91.0, 60.0, 30.0, 19.0, 27.0, 8.0, 9.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.828125, -2.749176025390625, -2.67022705078125, -2.591278076171875, -2.5123291015625, -2.433380126953125, -2.35443115234375, -2.275482177734375, -2.196533203125, -2.117584228515625, -2.03863525390625, -1.959686279296875, -1.8807373046875, -1.801788330078125, -1.72283935546875, -1.643890380859375, -1.56494140625, -1.485992431640625, -1.40704345703125, -1.328094482421875, -1.2491455078125, -1.170196533203125, -1.09124755859375, -1.012298583984375, -0.933349609375, -0.854400634765625, -0.77545166015625, -0.696502685546875, -0.6175537109375, -0.538604736328125, -0.45965576171875, -0.380706787109375, -0.3017578125, -0.222808837890625, -0.14385986328125, -0.064910888671875, 0.0140380859375, 0.092987060546875, 0.17193603515625, 0.250885009765625, 0.329833984375, 0.408782958984375, 0.48773193359375, 0.566680908203125, 0.6456298828125, 0.724578857421875, 0.80352783203125, 0.882476806640625, 0.96142578125, 1.040374755859375, 1.11932373046875, 1.198272705078125, 1.2772216796875, 1.356170654296875, 1.43511962890625, 1.514068603515625, 1.593017578125, 1.671966552734375, 1.75091552734375, 1.829864501953125, 1.9088134765625, 1.987762451171875, 2.06671142578125, 2.145660400390625, 2.224609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 26.0, 97.0, 319.0, 383.0, 89.0, 31.0, 17.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.460693359375, -5.23388671875, -5.007080078125, -4.7802734375, -4.553466796875, -4.32666015625, -4.099853515625, -3.873046875, -3.646240234375, -3.41943359375, -3.192626953125, -2.9658203125, -2.739013671875, -2.51220703125, -2.285400390625, -2.05859375, -1.831787109375, -1.60498046875, -1.378173828125, -1.1513671875, -0.924560546875, -0.69775390625, -0.470947265625, -0.244140625, -0.017333984375, 0.20947265625, 0.436279296875, 0.6630859375, 0.889892578125, 1.11669921875, 1.343505859375, 1.5703125, 1.797119140625, 2.02392578125, 2.250732421875, 2.4775390625, 2.704345703125, 2.93115234375, 3.157958984375, 3.384765625, 3.611572265625, 3.83837890625, 4.065185546875, 4.2919921875, 4.518798828125, 4.74560546875, 4.972412109375, 5.19921875, 5.426025390625, 5.65283203125, 5.879638671875, 6.1064453125, 6.333251953125, 6.56005859375, 6.786865234375, 7.013671875, 7.240478515625, 7.46728515625, 7.694091796875, 7.9208984375, 8.147705078125, 8.37451171875, 8.601318359375, 8.828125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 14.0, 36.0, 85.0, 153.0, 254.0, 260.0, 120.0, 48.0, 23.0, 12.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.01998901367188, -103.90133666992188, -101.7826919555664, -99.6640396118164, -97.54539489746094, -95.42674255371094, -93.30809783935547, -91.18944549560547, -89.07080078125, -86.9521484375, -84.83350372314453, -82.71485137939453, -80.59620666503906, -78.47755432128906, -76.3589096069336, -74.2402572631836, -72.12161254882812, -70.00296020507812, -67.88431549072266, -65.76566314697266, -63.64701843261719, -61.52836990356445, -59.40972137451172, -57.29106903076172, -55.17241668701172, -53.053768157958984, -50.93511962890625, -48.816471099853516, -46.69782257080078, -44.57917404174805, -42.46052551269531, -40.34187316894531, -38.223228454589844, -36.10457992553711, -33.985931396484375, -31.86728286743164, -29.748634338378906, -27.629985809326172, -25.511335372924805, -23.39268684387207, -21.27404022216797, -19.155391693115234, -17.0367431640625, -14.91809368133545, -12.799445152282715, -10.68079662322998, -8.56214714050293, -6.443498611450195, -4.324850082397461, -2.2062013149261475, -0.08755254745483398, 2.0310964584350586, 4.149744987487793, 6.268393516540527, 8.387042999267578, 10.505691528320312, 12.624340057373047, 14.742988586425781, 16.861637115478516, 18.98028564453125, 21.098934173583984, 23.21758270263672, 25.336233139038086, 27.45488166809082, 29.573530197143555]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 10.0, 2.0, 4.0, 12.0, 8.0, 18.0, 10.0, 34.0, 29.0, 33.0, 35.0, 37.0, 42.0, 43.0, 33.0, 58.0, 56.0, 60.0, 44.0, 47.0, 48.0, 54.0, 26.0, 39.0, 45.0, 29.0, 16.0, 20.0, 14.0, 22.0, 6.0, 13.0, 7.0, 10.0, 7.0, 6.0, 3.0, 9.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.69606018066406, -34.529457092285156, -33.36285400390625, -32.196250915527344, -31.02964973449707, -29.863046646118164, -28.69644546508789, -27.529842376708984, -26.363239288330078, -25.196636199951172, -24.030033111572266, -22.863431930541992, -21.696828842163086, -20.53022575378418, -19.363624572753906, -18.197021484375, -17.030418395996094, -15.863815307617188, -14.697213172912598, -13.530611038208008, -12.364007949829102, -11.197404861450195, -10.030802726745605, -8.864200592041016, -7.697597503662109, -6.530994892120361, -5.364392280578613, -4.197789669036865, -3.031187057495117, -1.8645844459533691, -0.6979818344116211, 0.46862030029296875, 1.635223388671875, 2.801826000213623, 3.968428611755371, 5.135031223297119, 6.301633834838867, 7.468236446380615, 8.634839057922363, 9.801441192626953, 10.96804428100586, 12.134647369384766, 13.301249504089355, 14.467851638793945, 15.634454727172852, 16.801057815551758, 17.96765899658203, 19.134262084960938, 20.300865173339844, 21.46746826171875, 22.634071350097656, 23.80067253112793, 24.967275619506836, 26.133878707885742, 27.300479888916016, 28.467082977294922, 29.633686065673828, 30.800289154052734, 31.96689224243164, 33.13349533081055, 34.30009460449219, 35.466697692871094, 36.63330078125, 37.799903869628906, 38.96650695800781]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 7.0, 10.0, 15.0, 37.0, 48.0, 49.0, 96.0, 160.0, 302.0, 570.0, 1101.0, 2427.0, 5820.0, 18978.0, 224306.0, 3904396.0, 23193.0, 6922.0, 2766.0, 1276.0, 729.0, 365.0, 245.0, 156.0, 93.0, 48.0, 51.0, 29.0, 21.0, 14.0, 13.0, 8.0, 6.0, 1.0, 4.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701171875, -2.589019775390625, -2.47686767578125, -2.364715576171875, -2.2525634765625, -2.140411376953125, -2.02825927734375, -1.916107177734375, -1.803955078125, -1.691802978515625, -1.57965087890625, -1.467498779296875, -1.3553466796875, -1.243194580078125, -1.13104248046875, -1.018890380859375, -0.90673828125, -0.794586181640625, -0.68243408203125, -0.570281982421875, -0.4581298828125, -0.345977783203125, -0.23382568359375, -0.121673583984375, -0.009521484375, 0.102630615234375, 0.21478271484375, 0.326934814453125, 0.4390869140625, 0.551239013671875, 0.66339111328125, 0.775543212890625, 0.8876953125, 0.999847412109375, 1.11199951171875, 1.224151611328125, 1.3363037109375, 1.448455810546875, 1.56060791015625, 1.672760009765625, 1.784912109375, 1.897064208984375, 2.00921630859375, 2.121368408203125, 2.2335205078125, 2.345672607421875, 2.45782470703125, 2.569976806640625, 2.68212890625, 2.794281005859375, 2.90643310546875, 3.018585205078125, 3.1307373046875, 3.242889404296875, 3.35504150390625, 3.467193603515625, 3.579345703125, 3.691497802734375, 3.80364990234375, 3.915802001953125, 4.0279541015625, 4.140106201171875, 4.25225830078125, 4.364410400390625, 4.4765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 10.0, 8.0, 9.0, 10.0, 16.0, 23.0, 29.0, 30.0, 32.0, 35.0, 49.0, 49.0, 74.0, 66.0, 62.0, 53.0, 56.0, 64.0, 49.0, 49.0, 36.0, 31.0, 28.0, 27.0, 22.0, 17.0, 12.0, 9.0, 10.0, 6.0, 8.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6298828125, -1.5654449462890625, -1.501007080078125, -1.4365692138671875, -1.37213134765625, -1.3076934814453125, -1.243255615234375, -1.1788177490234375, -1.1143798828125, -1.0499420166015625, -0.985504150390625, -0.9210662841796875, -0.85662841796875, -0.7921905517578125, -0.727752685546875, -0.6633148193359375, -0.598876953125, -0.5344390869140625, -0.470001220703125, -0.4055633544921875, -0.34112548828125, -0.2766876220703125, -0.212249755859375, -0.1478118896484375, -0.0833740234375, -0.0189361572265625, 0.045501708984375, 0.1099395751953125, 0.17437744140625, 0.2388153076171875, 0.303253173828125, 0.3676910400390625, 0.43212890625, 0.4965667724609375, 0.561004638671875, 0.6254425048828125, 0.68988037109375, 0.7543182373046875, 0.818756103515625, 0.8831939697265625, 0.9476318359375, 1.0120697021484375, 1.076507568359375, 1.1409454345703125, 1.20538330078125, 1.2698211669921875, 1.334259033203125, 1.3986968994140625, 1.463134765625, 1.5275726318359375, 1.592010498046875, 1.6564483642578125, 1.72088623046875, 1.7853240966796875, 1.849761962890625, 1.9141998291015625, 1.9786376953125, 2.0430755615234375, 2.107513427734375, 2.1719512939453125, 2.23638916015625, 2.3008270263671875, 2.365264892578125, 2.4297027587890625, 2.494140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 14.0, 9.0, 13.0, 23.0, 22.0, 30.0, 35.0, 69.0, 96.0, 93.0, 170.0, 344.0, 1022.0, 3260.0, 14706.0, 395902.0, 3756271.0, 16464.0, 3594.0, 1099.0, 384.0, 189.0, 119.0, 82.0, 64.0, 53.0, 32.0, 31.0, 15.0, 23.0, 17.0, 9.0, 5.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.390625, -7.159912109375, -6.92919921875, -6.698486328125, -6.4677734375, -6.237060546875, -6.00634765625, -5.775634765625, -5.544921875, -5.314208984375, -5.08349609375, -4.852783203125, -4.6220703125, -4.391357421875, -4.16064453125, -3.929931640625, -3.69921875, -3.468505859375, -3.23779296875, -3.007080078125, -2.7763671875, -2.545654296875, -2.31494140625, -2.084228515625, -1.853515625, -1.622802734375, -1.39208984375, -1.161376953125, -0.9306640625, -0.699951171875, -0.46923828125, -0.238525390625, -0.0078125, 0.222900390625, 0.45361328125, 0.684326171875, 0.9150390625, 1.145751953125, 1.37646484375, 1.607177734375, 1.837890625, 2.068603515625, 2.29931640625, 2.530029296875, 2.7607421875, 2.991455078125, 3.22216796875, 3.452880859375, 3.68359375, 3.914306640625, 4.14501953125, 4.375732421875, 4.6064453125, 4.837158203125, 5.06787109375, 5.298583984375, 5.529296875, 5.760009765625, 5.99072265625, 6.221435546875, 6.4521484375, 6.682861328125, 6.91357421875, 7.144287109375, 7.375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 7.0, 5.0, 12.0, 17.0, 27.0, 41.0, 125.0, 3467.0, 240.0, 53.0, 28.0, 15.0, 10.0, 5.0, 4.0, 8.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.077178955078125, -2.02740478515625, -1.977630615234375, -1.9278564453125, -1.878082275390625, -1.82830810546875, -1.778533935546875, -1.728759765625, -1.678985595703125, -1.62921142578125, -1.579437255859375, -1.5296630859375, -1.479888916015625, -1.43011474609375, -1.380340576171875, -1.33056640625, -1.280792236328125, -1.23101806640625, -1.181243896484375, -1.1314697265625, -1.081695556640625, -1.03192138671875, -0.982147216796875, -0.932373046875, -0.882598876953125, -0.83282470703125, -0.783050537109375, -0.7332763671875, -0.683502197265625, -0.63372802734375, -0.583953857421875, -0.5341796875, -0.484405517578125, -0.43463134765625, -0.384857177734375, -0.3350830078125, -0.285308837890625, -0.23553466796875, -0.185760498046875, -0.135986328125, -0.086212158203125, -0.03643798828125, 0.013336181640625, 0.0631103515625, 0.112884521484375, 0.16265869140625, 0.212432861328125, 0.26220703125, 0.311981201171875, 0.36175537109375, 0.411529541015625, 0.4613037109375, 0.511077880859375, 0.56085205078125, 0.610626220703125, 0.660400390625, 0.710174560546875, 0.75994873046875, 0.809722900390625, 0.8594970703125, 0.909271240234375, 0.95904541015625, 1.008819580078125, 1.05859375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 7.0, 9.0, 18.0, 17.0, 33.0, 38.0, 46.0, 85.0, 123.0, 121.0, 134.0, 122.0, 96.0, 56.0, 41.0, 28.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.407549858093262, -7.2488627433776855, -7.090176105499268, -6.931488990783691, -6.772802352905273, -6.614115238189697, -6.455428600311279, -6.296741485595703, -6.138054847717285, -5.979367733001709, -5.820681095123291, -5.661993980407715, -5.503307342529297, -5.344620227813721, -5.185933589935303, -5.027246475219727, -4.86855936050415, -4.709872245788574, -4.551185607910156, -4.39249849319458, -4.233811855316162, -4.075124740600586, -3.916437864303589, -3.757750988006592, -3.5990641117095947, -3.4403772354125977, -3.2816903591156006, -3.1230034828186035, -2.9643163681030273, -2.8056297302246094, -2.646942615509033, -2.488255739212036, -2.329569101333618, -2.170882225036621, -2.012195348739624, -1.8535083532333374, -1.6948214769363403, -1.5361346006393433, -1.3774476051330566, -1.2187607288360596, -1.0600738525390625, -0.9013869762420654, -0.7427000403404236, -0.5840131044387817, -0.42532622814178467, -0.2666393518447876, -0.10795241594314575, 0.050734519958496094, 0.20942139625549316, 0.3681083023548126, 0.5267952084541321, 0.6854821443557739, 0.844169020652771, 1.002855896949768, 1.1615428924560547, 1.3202297687530518, 1.4789166450500488, 1.637603521347046, 1.796290397644043, 1.9549773931503296, 2.113664150238037, 2.2723512649536133, 2.4310381412506104, 2.5897250175476074, 2.7484118938446045]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 10.0, 8.0, 9.0, 9.0, 10.0, 27.0, 18.0, 29.0, 27.0, 30.0, 26.0, 35.0, 37.0, 35.0, 35.0, 51.0, 44.0, 46.0, 51.0, 43.0, 42.0, 39.0, 44.0, 36.0, 32.0, 36.0, 25.0, 29.0, 22.0, 25.0, 15.0, 17.0, 16.0, 10.0, 8.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.207650661468506, -3.11444354057312, -3.0212364196777344, -2.9280292987823486, -2.834822177886963, -2.741614818572998, -2.6484079360961914, -2.5552005767822266, -2.461993455886841, -2.368786334991455, -2.2755792140960693, -2.1823720932006836, -2.089164972305298, -1.9959577322006226, -1.9027506113052368, -1.8095433712005615, -1.7163363695144653, -1.6231292486190796, -1.5299221277236938, -1.4367148876190186, -1.3435077667236328, -1.250300645828247, -1.1570935249328613, -1.0638864040374756, -0.9706792235374451, -0.8774721026420593, -0.7842649221420288, -0.6910578012466431, -0.5978506803512573, -0.5046434998512268, -0.41143637895584106, -0.31822919845581055, -0.2250220775604248, -0.13181492686271667, -0.03860779106616974, 0.0545993447303772, 0.14780649542808533, 0.24101364612579346, 0.3342207670211792, 0.4274279475212097, 0.5206350684165955, 0.6138421893119812, 0.7070493698120117, 0.8002564907073975, 0.8934636116027832, 0.9866707921028137, 1.0798778533935547, 1.17308509349823, 1.2662922143936157, 1.3594993352890015, 1.4527064561843872, 1.5459136962890625, 1.6391208171844482, 1.732327938079834, 1.8255350589752197, 1.9187421798706055, 2.011949300765991, 2.105156421661377, 2.1983635425567627, 2.2915706634521484, 2.384777784347534, 2.47798490524292, 2.5711922645568848, 2.6643993854522705, 2.7576065063476562]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 9.0, 18.0, 29.0, 26.0, 51.0, 59.0, 71.0, 147.0, 196.0, 312.0, 495.0, 862.0, 1681.0, 3088.0, 6301.0, 13869.0, 34086.0, 88135.0, 229113.0, 353618.0, 191827.0, 72131.0, 28462.0, 12015.0, 5509.0, 2785.0, 1508.0, 799.0, 459.0, 285.0, 191.0, 121.0, 79.0, 68.0, 48.0, 28.0, 17.0, 12.0, 11.0, 7.0, 7.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 1.0], "bins": [-2.75390625, -2.676116943359375, -2.59832763671875, -2.520538330078125, -2.4427490234375, -2.364959716796875, -2.28717041015625, -2.209381103515625, -2.131591796875, -2.053802490234375, -1.97601318359375, -1.898223876953125, -1.8204345703125, -1.742645263671875, -1.66485595703125, -1.587066650390625, -1.50927734375, -1.431488037109375, -1.35369873046875, -1.275909423828125, -1.1981201171875, -1.120330810546875, -1.04254150390625, -0.964752197265625, -0.886962890625, -0.809173583984375, -0.73138427734375, -0.653594970703125, -0.5758056640625, -0.498016357421875, -0.42022705078125, -0.342437744140625, -0.2646484375, -0.186859130859375, -0.10906982421875, -0.031280517578125, 0.0465087890625, 0.124298095703125, 0.20208740234375, 0.279876708984375, 0.357666015625, 0.435455322265625, 0.51324462890625, 0.591033935546875, 0.6688232421875, 0.746612548828125, 0.82440185546875, 0.902191162109375, 0.97998046875, 1.057769775390625, 1.13555908203125, 1.213348388671875, 1.2911376953125, 1.368927001953125, 1.44671630859375, 1.524505615234375, 1.602294921875, 1.680084228515625, 1.75787353515625, 1.835662841796875, 1.9134521484375, 1.991241455078125, 2.06903076171875, 2.146820068359375, 2.224609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 4.0, 7.0, 9.0, 11.0, 18.0, 20.0, 26.0, 31.0, 43.0, 38.0, 69.0, 44.0, 52.0, 58.0, 62.0, 63.0, 45.0, 64.0, 41.0, 49.0, 42.0, 40.0, 26.0, 31.0, 18.0, 25.0, 11.0, 8.0, 9.0, 8.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7587890625, -1.6917877197265625, -1.624786376953125, -1.5577850341796875, -1.49078369140625, -1.4237823486328125, -1.356781005859375, -1.2897796630859375, -1.2227783203125, -1.1557769775390625, -1.088775634765625, -1.0217742919921875, -0.95477294921875, -0.8877716064453125, -0.820770263671875, -0.7537689208984375, -0.686767578125, -0.6197662353515625, -0.552764892578125, -0.4857635498046875, -0.41876220703125, -0.3517608642578125, -0.284759521484375, -0.2177581787109375, -0.1507568359375, -0.0837554931640625, -0.016754150390625, 0.0502471923828125, 0.11724853515625, 0.1842498779296875, 0.251251220703125, 0.3182525634765625, 0.38525390625, 0.4522552490234375, 0.519256591796875, 0.5862579345703125, 0.65325927734375, 0.7202606201171875, 0.787261962890625, 0.8542633056640625, 0.9212646484375, 0.9882659912109375, 1.055267333984375, 1.1222686767578125, 1.18927001953125, 1.2562713623046875, 1.323272705078125, 1.3902740478515625, 1.457275390625, 1.5242767333984375, 1.591278076171875, 1.6582794189453125, 1.72528076171875, 1.7922821044921875, 1.859283447265625, 1.9262847900390625, 1.9932861328125, 2.0602874755859375, 2.127288818359375, 2.1942901611328125, 2.26129150390625, 2.3282928466796875, 2.395294189453125, 2.4622955322265625, 2.529296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 9.0, 7.0, 12.0, 15.0, 20.0, 32.0, 44.0, 88.0, 132.0, 254.0, 455.0, 1112.0, 3500.0, 16362.0, 160339.0, 767535.0, 83326.0, 10944.0, 2598.0, 869.0, 386.0, 184.0, 113.0, 62.0, 42.0, 28.0, 24.0, 14.0, 9.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.24456787109375, -6.0164794921875, -5.78839111328125, -5.560302734375, -5.33221435546875, -5.1041259765625, -4.87603759765625, -4.64794921875, -4.41986083984375, -4.1917724609375, -3.96368408203125, -3.735595703125, -3.50750732421875, -3.2794189453125, -3.05133056640625, -2.8232421875, -2.59515380859375, -2.3670654296875, -2.13897705078125, -1.910888671875, -1.68280029296875, -1.4547119140625, -1.22662353515625, -0.99853515625, -0.77044677734375, -0.5423583984375, -0.31427001953125, -0.086181640625, 0.14190673828125, 0.3699951171875, 0.59808349609375, 0.826171875, 1.05426025390625, 1.2823486328125, 1.51043701171875, 1.738525390625, 1.96661376953125, 2.1947021484375, 2.42279052734375, 2.65087890625, 2.87896728515625, 3.1070556640625, 3.33514404296875, 3.563232421875, 3.79132080078125, 4.0194091796875, 4.24749755859375, 4.4755859375, 4.70367431640625, 4.9317626953125, 5.15985107421875, 5.387939453125, 5.61602783203125, 5.8441162109375, 6.07220458984375, 6.30029296875, 6.52838134765625, 6.7564697265625, 6.98455810546875, 7.212646484375, 7.44073486328125, 7.6688232421875, 7.89691162109375, 8.125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 5.0, 6.0, 6.0, 12.0, 17.0, 17.0, 27.0, 31.0, 30.0, 32.0, 45.0, 44.0, 54.0, 57.0, 45.0, 54.0, 60.0, 54.0, 44.0, 52.0, 36.0, 41.0, 37.0, 43.0, 33.0, 18.0, 18.0, 8.0, 13.0, 11.0, 5.0, 8.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.3955078125, -8.119140625, -7.8427734375, -7.56640625, -7.2900390625, -7.013671875, -6.7373046875, -6.4609375, -6.1845703125, -5.908203125, -5.6318359375, -5.35546875, -5.0791015625, -4.802734375, -4.5263671875, -4.25, -3.9736328125, -3.697265625, -3.4208984375, -3.14453125, -2.8681640625, -2.591796875, -2.3154296875, -2.0390625, -1.7626953125, -1.486328125, -1.2099609375, -0.93359375, -0.6572265625, -0.380859375, -0.1044921875, 0.171875, 0.4482421875, 0.724609375, 1.0009765625, 1.27734375, 1.5537109375, 1.830078125, 2.1064453125, 2.3828125, 2.6591796875, 2.935546875, 3.2119140625, 3.48828125, 3.7646484375, 4.041015625, 4.3173828125, 4.59375, 4.8701171875, 5.146484375, 5.4228515625, 5.69921875, 5.9755859375, 6.251953125, 6.5283203125, 6.8046875, 7.0810546875, 7.357421875, 7.6337890625, 7.91015625, 8.1865234375, 8.462890625, 8.7392578125, 9.015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 8.0, 8.0, 12.0, 25.0, 43.0, 49.0, 61.0, 88.0, 113.0, 220.0, 304.0, 534.0, 845.0, 1705.0, 4563.0, 21731.0, 428764.0, 555043.0, 25214.0, 4945.0, 1905.0, 874.0, 501.0, 322.0, 227.0, 142.0, 87.0, 70.0, 47.0, 25.0, 12.0, 20.0, 21.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.603515625, -3.50067138671875, -3.3978271484375, -3.29498291015625, -3.192138671875, -3.08929443359375, -2.9864501953125, -2.88360595703125, -2.78076171875, -2.67791748046875, -2.5750732421875, -2.47222900390625, -2.369384765625, -2.26654052734375, -2.1636962890625, -2.06085205078125, -1.9580078125, -1.85516357421875, -1.7523193359375, -1.64947509765625, -1.546630859375, -1.44378662109375, -1.3409423828125, -1.23809814453125, -1.13525390625, -1.03240966796875, -0.9295654296875, -0.82672119140625, -0.723876953125, -0.62103271484375, -0.5181884765625, -0.41534423828125, -0.3125, -0.20965576171875, -0.1068115234375, -0.00396728515625, 0.098876953125, 0.20172119140625, 0.3045654296875, 0.40740966796875, 0.51025390625, 0.61309814453125, 0.7159423828125, 0.81878662109375, 0.921630859375, 1.02447509765625, 1.1273193359375, 1.23016357421875, 1.3330078125, 1.43585205078125, 1.5386962890625, 1.64154052734375, 1.744384765625, 1.84722900390625, 1.9500732421875, 2.05291748046875, 2.15576171875, 2.25860595703125, 2.3614501953125, 2.46429443359375, 2.567138671875, 2.66998291015625, 2.7728271484375, 2.87567138671875, 2.978515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 7.0, 18.0, 37.0, 41.0, 64.0, 131.0, 201.0, 189.0, 137.0, 71.0, 37.0, 23.0, 14.0, 7.0, 4.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007686614990234375, -0.0007478520274162292, -0.000727042555809021, -0.0007062330842018127, -0.0006854236125946045, -0.0006646141409873962, -0.000643804669380188, -0.0006229951977729797, -0.0006021857261657715, -0.0005813762545585632, -0.000560566782951355, -0.0005397573113441467, -0.0005189478397369385, -0.0004981383681297302, -0.00047732889652252197, -0.0004565194249153137, -0.00043570995330810547, -0.0004149004817008972, -0.00039409101009368896, -0.0003732815384864807, -0.00035247206687927246, -0.0003316625952720642, -0.00031085312366485596, -0.0002900436520576477, -0.00026923418045043945, -0.0002484247088432312, -0.00022761523723602295, -0.0002068057656288147, -0.00018599629402160645, -0.0001651868224143982, -0.00014437735080718994, -0.0001235678791999817, -0.00010275840759277344, -8.194893598556519e-05, -6.113946437835693e-05, -4.032999277114868e-05, -1.952052116394043e-05, 1.2889504432678223e-06, 2.2098422050476074e-05, 4.2907893657684326e-05, 6.371736526489258e-05, 8.452683687210083e-05, 0.00010533630847930908, 0.00012614578008651733, 0.00014695525169372559, 0.00016776472330093384, 0.0001885741949081421, 0.00020938366651535034, 0.0002301931381225586, 0.00025100260972976685, 0.0002718120813369751, 0.00029262155294418335, 0.0003134310245513916, 0.00033424049615859985, 0.0003550499677658081, 0.00037585943937301636, 0.0003966689109802246, 0.00041747838258743286, 0.0004382878541946411, 0.00045909732580184937, 0.0004799067974090576, 0.0005007162690162659, 0.0005215257406234741, 0.0005423352122306824, 0.0005631446838378906]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 12.0, 17.0, 30.0, 38.0, 80.0, 150.0, 294.0, 819.0, 2875.0, 26963.0, 872447.0, 136262.0, 6339.0, 1292.0, 470.0, 201.0, 108.0, 53.0, 28.0, 22.0, 10.0, 4.0, 8.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806640625, -3.669281005859375, -3.53192138671875, -3.394561767578125, -3.2572021484375, -3.119842529296875, -2.98248291015625, -2.845123291015625, -2.707763671875, -2.570404052734375, -2.43304443359375, -2.295684814453125, -2.1583251953125, -2.020965576171875, -1.88360595703125, -1.746246337890625, -1.60888671875, -1.471527099609375, -1.33416748046875, -1.196807861328125, -1.0594482421875, -0.922088623046875, -0.78472900390625, -0.647369384765625, -0.510009765625, -0.372650146484375, -0.23529052734375, -0.097930908203125, 0.0394287109375, 0.176788330078125, 0.31414794921875, 0.451507568359375, 0.5888671875, 0.726226806640625, 0.86358642578125, 1.000946044921875, 1.1383056640625, 1.275665283203125, 1.41302490234375, 1.550384521484375, 1.687744140625, 1.825103759765625, 1.96246337890625, 2.099822998046875, 2.2371826171875, 2.374542236328125, 2.51190185546875, 2.649261474609375, 2.78662109375, 2.923980712890625, 3.06134033203125, 3.198699951171875, 3.3360595703125, 3.473419189453125, 3.61077880859375, 3.748138427734375, 3.885498046875, 4.022857666015625, 4.16021728515625, 4.297576904296875, 4.4349365234375, 4.572296142578125, 4.70965576171875, 4.847015380859375, 4.984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 13.0, 21.0, 36.0, 68.0, 132.0, 182.0, 191.0, 151.0, 97.0, 50.0, 22.0, 15.0, 7.0, 7.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.302947998046875, -3.14691162109375, -2.990875244140625, -2.8348388671875, -2.678802490234375, -2.52276611328125, -2.366729736328125, -2.210693359375, -2.054656982421875, -1.89862060546875, -1.742584228515625, -1.5865478515625, -1.430511474609375, -1.27447509765625, -1.118438720703125, -0.96240234375, -0.806365966796875, -0.65032958984375, -0.494293212890625, -0.3382568359375, -0.182220458984375, -0.02618408203125, 0.129852294921875, 0.285888671875, 0.441925048828125, 0.59796142578125, 0.753997802734375, 0.9100341796875, 1.066070556640625, 1.22210693359375, 1.378143310546875, 1.5341796875, 1.690216064453125, 1.84625244140625, 2.002288818359375, 2.1583251953125, 2.314361572265625, 2.47039794921875, 2.626434326171875, 2.782470703125, 2.938507080078125, 3.09454345703125, 3.250579833984375, 3.4066162109375, 3.562652587890625, 3.71868896484375, 3.874725341796875, 4.03076171875, 4.186798095703125, 4.34283447265625, 4.498870849609375, 4.6549072265625, 4.810943603515625, 4.96697998046875, 5.123016357421875, 5.279052734375, 5.435089111328125, 5.59112548828125, 5.747161865234375, 5.9031982421875, 6.059234619140625, 6.21527099609375, 6.371307373046875, 6.52734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 14.0, 30.0, 57.0, 98.0, 132.0, 197.0, 167.0, 113.0, 78.0, 46.0, 27.0, 17.0, 8.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.37742614746094, -56.696720123291016, -55.01601028442383, -53.335304260253906, -51.65459442138672, -49.9738883972168, -48.293182373046875, -46.61247253417969, -44.931766510009766, -43.251060485839844, -41.570350646972656, -39.889644622802734, -38.20893859863281, -36.528228759765625, -34.8475227355957, -33.16681671142578, -31.486106872558594, -29.80539894104004, -28.124691009521484, -26.443984985351562, -24.763277053833008, -23.082569122314453, -21.40186309814453, -19.721155166625977, -18.040447235107422, -16.359739303588867, -14.679032325744629, -12.99832534790039, -11.317617416381836, -9.636909484863281, -7.956202507019043, -6.275495529174805, -4.59478759765625, -2.9140801429748535, -1.233372688293457, 0.44733476638793945, 2.128042221069336, 3.8087501525878906, 5.489457130432129, 7.170164108276367, 8.850872039794922, 10.531579971313477, 12.212286949157715, 13.892993927001953, 15.573701858520508, 17.254409790039062, 18.935115814208984, 20.61582374572754, 22.296531677246094, 23.97723960876465, 25.657947540283203, 27.338653564453125, 29.01936149597168, 30.700069427490234, 32.380775451660156, 34.061485290527344, 35.742191314697266, 37.42289733886719, 39.103607177734375, 40.7843132019043, 42.46501922607422, 44.145729064941406, 45.82643508911133, 47.50714111328125, 49.18785095214844]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 10.0, 14.0, 16.0, 18.0, 22.0, 25.0, 19.0, 33.0, 34.0, 36.0, 44.0, 49.0, 37.0, 65.0, 41.0, 55.0, 41.0, 53.0, 48.0, 28.0, 40.0, 38.0, 29.0, 21.0, 27.0, 21.0, 23.0, 14.0, 12.0, 10.0, 8.0, 9.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.93851089477539, -33.84404754638672, -32.74958801269531, -31.65512466430664, -30.56066131591797, -29.46619987487793, -28.37173843383789, -27.27727508544922, -26.18281364440918, -25.08835220336914, -23.99388885498047, -22.89942741394043, -21.80496597290039, -20.71050262451172, -19.61604118347168, -18.52157974243164, -17.42711639404297, -16.33265495300293, -15.238191604614258, -14.143730163574219, -13.049267768859863, -11.954805374145508, -10.860343933105469, -9.765881538391113, -8.671419143676758, -7.576956748962402, -6.482494831085205, -5.388032913208008, -4.293570518493652, -3.199108123779297, -2.1046462059020996, -1.0101842880249023, 0.0842742919921875, 1.1787364482879639, 2.2731986045837402, 3.3676607608795166, 4.462122917175293, 5.556585311889648, 6.651047229766846, 7.745509147644043, 8.839971542358398, 9.934433937072754, 11.02889633178711, 12.123357772827148, 13.217820167541504, 14.31228256225586, 15.406744003295898, 16.501205444335938, 17.59566879272461, 18.69013023376465, 19.78459358215332, 20.87905502319336, 21.97351837158203, 23.06797981262207, 24.16244125366211, 25.25690460205078, 26.35136604309082, 27.44582748413086, 28.54029083251953, 29.63475227355957, 30.72921371459961, 31.82367706298828, 32.91814041137695, 34.01259994506836, 35.10706329345703]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 11.0, 5.0, 11.0, 27.0, 29.0, 36.0, 51.0, 94.0, 164.0, 303.0, 518.0, 1171.0, 3511.0, 33861.0, 4142718.0, 8240.0, 1811.0, 745.0, 406.0, 187.0, 110.0, 79.0, 56.0, 39.0, 16.0, 19.0, 18.0, 11.0, 10.0, 8.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.3359375, -8.030029296875, -7.72412109375, -7.418212890625, -7.1123046875, -6.806396484375, -6.50048828125, -6.194580078125, -5.888671875, -5.582763671875, -5.27685546875, -4.970947265625, -4.6650390625, -4.359130859375, -4.05322265625, -3.747314453125, -3.44140625, -3.135498046875, -2.82958984375, -2.523681640625, -2.2177734375, -1.911865234375, -1.60595703125, -1.300048828125, -0.994140625, -0.688232421875, -0.38232421875, -0.076416015625, 0.2294921875, 0.535400390625, 0.84130859375, 1.147216796875, 1.453125, 1.759033203125, 2.06494140625, 2.370849609375, 2.6767578125, 2.982666015625, 3.28857421875, 3.594482421875, 3.900390625, 4.206298828125, 4.51220703125, 4.818115234375, 5.1240234375, 5.429931640625, 5.73583984375, 6.041748046875, 6.34765625, 6.653564453125, 6.95947265625, 7.265380859375, 7.5712890625, 7.877197265625, 8.18310546875, 8.489013671875, 8.794921875, 9.100830078125, 9.40673828125, 9.712646484375, 10.0185546875, 10.324462890625, 10.63037109375, 10.936279296875, 11.2421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 8.0, 11.0, 9.0, 25.0, 26.0, 24.0, 42.0, 52.0, 63.0, 67.0, 57.0, 62.0, 62.0, 78.0, 56.0, 51.0, 57.0, 48.0, 41.0, 29.0, 37.0, 15.0, 14.0, 13.0, 6.0, 7.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158203125, -2.079681396484375, -2.00115966796875, -1.922637939453125, -1.8441162109375, -1.765594482421875, -1.68707275390625, -1.608551025390625, -1.530029296875, -1.451507568359375, -1.37298583984375, -1.294464111328125, -1.2159423828125, -1.137420654296875, -1.05889892578125, -0.980377197265625, -0.90185546875, -0.823333740234375, -0.74481201171875, -0.666290283203125, -0.5877685546875, -0.509246826171875, -0.43072509765625, -0.352203369140625, -0.273681640625, -0.195159912109375, -0.11663818359375, -0.038116455078125, 0.0404052734375, 0.118927001953125, 0.19744873046875, 0.275970458984375, 0.3544921875, 0.433013916015625, 0.51153564453125, 0.590057373046875, 0.6685791015625, 0.747100830078125, 0.82562255859375, 0.904144287109375, 0.982666015625, 1.061187744140625, 1.13970947265625, 1.218231201171875, 1.2967529296875, 1.375274658203125, 1.45379638671875, 1.532318115234375, 1.61083984375, 1.689361572265625, 1.76788330078125, 1.846405029296875, 1.9249267578125, 2.003448486328125, 2.08197021484375, 2.160491943359375, 2.239013671875, 2.317535400390625, 2.39605712890625, 2.474578857421875, 2.5531005859375, 2.631622314453125, 2.71014404296875, 2.788665771484375, 2.8671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 15.0, 11.0, 13.0, 16.0, 19.0, 45.0, 40.0, 62.0, 76.0, 103.0, 227.0, 277.0, 479.0, 780.0, 1456.0, 3065.0, 11898.0, 4099370.0, 65833.0, 5497.0, 2075.0, 1098.0, 672.0, 377.0, 234.0, 159.0, 106.0, 73.0, 48.0, 32.0, 31.0, 22.0, 19.0, 10.0, 8.0, 10.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7646484375, -9.466796875, -9.1689453125, -8.87109375, -8.5732421875, -8.275390625, -7.9775390625, -7.6796875, -7.3818359375, -7.083984375, -6.7861328125, -6.48828125, -6.1904296875, -5.892578125, -5.5947265625, -5.296875, -4.9990234375, -4.701171875, -4.4033203125, -4.10546875, -3.8076171875, -3.509765625, -3.2119140625, -2.9140625, -2.6162109375, -2.318359375, -2.0205078125, -1.72265625, -1.4248046875, -1.126953125, -0.8291015625, -0.53125, -0.2333984375, 0.064453125, 0.3623046875, 0.66015625, 0.9580078125, 1.255859375, 1.5537109375, 1.8515625, 2.1494140625, 2.447265625, 2.7451171875, 3.04296875, 3.3408203125, 3.638671875, 3.9365234375, 4.234375, 4.5322265625, 4.830078125, 5.1279296875, 5.42578125, 5.7236328125, 6.021484375, 6.3193359375, 6.6171875, 6.9150390625, 7.212890625, 7.5107421875, 7.80859375, 8.1064453125, 8.404296875, 8.7021484375, 9.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 21.0, 65.0, 3681.0, 216.0, 42.0, 16.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.734375, -2.6658172607421875, -2.597259521484375, -2.5287017822265625, -2.46014404296875, -2.3915863037109375, -2.323028564453125, -2.2544708251953125, -2.1859130859375, -2.1173553466796875, -2.048797607421875, -1.9802398681640625, -1.91168212890625, -1.8431243896484375, -1.774566650390625, -1.7060089111328125, -1.637451171875, -1.5688934326171875, -1.500335693359375, -1.4317779541015625, -1.36322021484375, -1.2946624755859375, -1.226104736328125, -1.1575469970703125, -1.0889892578125, -1.0204315185546875, -0.951873779296875, -0.8833160400390625, -0.81475830078125, -0.7462005615234375, -0.677642822265625, -0.6090850830078125, -0.54052734375, -0.4719696044921875, -0.403411865234375, -0.3348541259765625, -0.26629638671875, -0.1977386474609375, -0.129180908203125, -0.0606231689453125, 0.0079345703125, 0.0764923095703125, 0.145050048828125, 0.2136077880859375, 0.28216552734375, 0.3507232666015625, 0.419281005859375, 0.4878387451171875, 0.556396484375, 0.6249542236328125, 0.693511962890625, 0.7620697021484375, 0.83062744140625, 0.8991851806640625, 0.967742919921875, 1.0363006591796875, 1.1048583984375, 1.1734161376953125, 1.241973876953125, 1.3105316162109375, 1.37908935546875, 1.4476470947265625, 1.516204833984375, 1.5847625732421875, 1.6533203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 16.0, 26.0, 34.0, 57.0, 77.0, 107.0, 131.0, 126.0, 140.0, 95.0, 76.0, 28.0, 28.0, 17.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.026236057281494, -4.837462902069092, -4.648690223693848, -4.459917068481445, -4.271143913269043, -4.082370758056641, -3.8935978412628174, -3.704824924468994, -3.516051769256592, -3.3272786140441895, -3.138505697250366, -2.949732780456543, -2.7609596252441406, -2.5721864700317383, -2.383413553237915, -2.194640636444092, -2.0058674812316895, -1.8170944452285767, -1.6283214092254639, -1.439548373222351, -1.2507753372192383, -1.0620023012161255, -0.8732292652130127, -0.6844562292098999, -0.4956831932067871, -0.3069101572036743, -0.11813712120056152, 0.07063591480255127, 0.25940895080566406, 0.44818198680877686, 0.6369550228118896, 0.8257280588150024, 1.014500617980957, 1.2032736539840698, 1.3920466899871826, 1.5808197259902954, 1.7695927619934082, 1.958365797996521, 2.147138833999634, 2.335911750793457, 2.5246849060058594, 2.7134580612182617, 2.902230978012085, 3.091003894805908, 3.2797770500183105, 3.468550205230713, 3.657323122024536, 3.8460960388183594, 4.034869194030762, 4.223642349243164, 4.412415504455566, 4.6011881828308105, 4.789961338043213, 4.978734493255615, 5.167507171630859, 5.356280326843262, 5.545053482055664, 5.733826637268066, 5.922599792480469, 6.111372470855713, 6.300145626068115, 6.488918781280518, 6.677691459655762, 6.866464614868164, 7.055237770080566]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 6.0, 5.0, 4.0, 5.0, 7.0, 19.0, 8.0, 16.0, 20.0, 19.0, 15.0, 21.0, 16.0, 24.0, 23.0, 30.0, 23.0, 26.0, 36.0, 34.0, 30.0, 38.0, 39.0, 38.0, 30.0, 37.0, 40.0, 41.0, 40.0, 41.0, 40.0, 17.0, 30.0, 29.0, 17.0, 16.0, 17.0, 10.0, 7.0, 16.0, 11.0, 9.0, 4.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-2.538992166519165, -2.4599132537841797, -2.3808345794677734, -2.301755666732788, -2.222676992416382, -2.1435980796813965, -2.0645194053649902, -1.9854404926300049, -1.906361699104309, -1.8272829055786133, -1.7482041120529175, -1.6691253185272217, -1.5900464057922363, -1.51096773147583, -1.4318888187408447, -1.352810025215149, -1.2737312316894531, -1.1946524381637573, -1.1155736446380615, -1.0364948511123657, -0.9574159979820251, -0.8783372044563293, -0.7992583513259888, -0.720179557800293, -0.6411007642745972, -0.5620219707489014, -0.4829431474208832, -0.403864324092865, -0.3247855305671692, -0.2457067370414734, -0.1666279137134552, -0.08754909038543701, -0.008470296859741211, 0.07060851156711578, 0.14968731999397278, 0.22876612842082977, 0.30784493684768677, 0.38692373037338257, 0.46600255370140076, 0.545081377029419, 0.6241601705551147, 0.7032389640808105, 0.7823177576065063, 0.8613966107368469, 0.9404754042625427, 1.0195541381835938, 1.098633050918579, 1.177711844444275, 1.2567906379699707, 1.3358694314956665, 1.4149482250213623, 1.494027018547058, 1.573105812072754, 1.6521847248077393, 1.731263518333435, 1.8103423118591309, 1.8894211053848267, 1.9684998989105225, 2.047578811645508, 2.126657485961914, 2.2057363986968994, 2.2848150730133057, 2.363893985748291, 2.4429726600646973, 2.5220515727996826]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 4.0, 7.0, 17.0, 34.0, 46.0, 60.0, 99.0, 159.0, 314.0, 595.0, 1102.0, 2672.0, 6498.0, 19411.0, 68790.0, 290040.0, 474231.0, 132495.0, 34029.0, 10489.0, 3945.0, 1688.0, 791.0, 421.0, 218.0, 123.0, 100.0, 61.0, 25.0, 30.0, 11.0, 10.0, 12.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.712005615234375, -3.57049560546875, -3.428985595703125, -3.2874755859375, -3.145965576171875, -3.00445556640625, -2.862945556640625, -2.721435546875, -2.579925537109375, -2.43841552734375, -2.296905517578125, -2.1553955078125, -2.013885498046875, -1.87237548828125, -1.730865478515625, -1.58935546875, -1.447845458984375, -1.30633544921875, -1.164825439453125, -1.0233154296875, -0.881805419921875, -0.74029541015625, -0.598785400390625, -0.457275390625, -0.315765380859375, -0.17425537109375, -0.032745361328125, 0.1087646484375, 0.250274658203125, 0.39178466796875, 0.533294677734375, 0.6748046875, 0.816314697265625, 0.95782470703125, 1.099334716796875, 1.2408447265625, 1.382354736328125, 1.52386474609375, 1.665374755859375, 1.806884765625, 1.948394775390625, 2.08990478515625, 2.231414794921875, 2.3729248046875, 2.514434814453125, 2.65594482421875, 2.797454833984375, 2.93896484375, 3.080474853515625, 3.22198486328125, 3.363494873046875, 3.5050048828125, 3.646514892578125, 3.78802490234375, 3.929534912109375, 4.071044921875, 4.212554931640625, 4.35406494140625, 4.495574951171875, 4.6370849609375, 4.778594970703125, 4.92010498046875, 5.061614990234375, 5.203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 9.0, 11.0, 20.0, 24.0, 26.0, 24.0, 46.0, 45.0, 50.0, 50.0, 45.0, 53.0, 72.0, 57.0, 62.0, 49.0, 64.0, 55.0, 45.0, 46.0, 21.0, 27.0, 20.0, 14.0, 12.0, 10.0, 4.0, 5.0, 7.0, 5.0, 0.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9345703125, -1.8573455810546875, -1.780120849609375, -1.7028961181640625, -1.62567138671875, -1.5484466552734375, -1.471221923828125, -1.3939971923828125, -1.3167724609375, -1.2395477294921875, -1.162322998046875, -1.0850982666015625, -1.00787353515625, -0.9306488037109375, -0.853424072265625, -0.7761993408203125, -0.698974609375, -0.6217498779296875, -0.544525146484375, -0.4673004150390625, -0.39007568359375, -0.3128509521484375, -0.235626220703125, -0.1584014892578125, -0.0811767578125, -0.0039520263671875, 0.073272705078125, 0.1504974365234375, 0.22772216796875, 0.3049468994140625, 0.382171630859375, 0.4593963623046875, 0.53662109375, 0.6138458251953125, 0.691070556640625, 0.7682952880859375, 0.84552001953125, 0.9227447509765625, 0.999969482421875, 1.0771942138671875, 1.1544189453125, 1.2316436767578125, 1.308868408203125, 1.3860931396484375, 1.46331787109375, 1.5405426025390625, 1.617767333984375, 1.6949920654296875, 1.772216796875, 1.8494415283203125, 1.926666259765625, 2.0038909912109375, 2.08111572265625, 2.1583404541015625, 2.235565185546875, 2.3127899169921875, 2.3900146484375, 2.4672393798828125, 2.544464111328125, 2.6216888427734375, 2.69891357421875, 2.7761383056640625, 2.853363037109375, 2.9305877685546875, 3.0078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 5.0, 1.0, 7.0, 9.0, 7.0, 15.0, 16.0, 20.0, 24.0, 38.0, 45.0, 73.0, 79.0, 135.0, 224.0, 319.0, 652.0, 1442.0, 4415.0, 17510.0, 114926.0, 701696.0, 174001.0, 23632.0, 5616.0, 1765.0, 777.0, 376.0, 216.0, 163.0, 96.0, 61.0, 37.0, 38.0, 28.0, 21.0, 18.0, 16.0, 6.0, 5.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.76953125, -5.5809326171875, -5.392333984375, -5.2037353515625, -5.01513671875, -4.8265380859375, -4.637939453125, -4.4493408203125, -4.2607421875, -4.0721435546875, -3.883544921875, -3.6949462890625, -3.50634765625, -3.3177490234375, -3.129150390625, -2.9405517578125, -2.751953125, -2.5633544921875, -2.374755859375, -2.1861572265625, -1.99755859375, -1.8089599609375, -1.620361328125, -1.4317626953125, -1.2431640625, -1.0545654296875, -0.865966796875, -0.6773681640625, -0.48876953125, -0.3001708984375, -0.111572265625, 0.0770263671875, 0.265625, 0.4542236328125, 0.642822265625, 0.8314208984375, 1.02001953125, 1.2086181640625, 1.397216796875, 1.5858154296875, 1.7744140625, 1.9630126953125, 2.151611328125, 2.3402099609375, 2.52880859375, 2.7174072265625, 2.906005859375, 3.0946044921875, 3.283203125, 3.4718017578125, 3.660400390625, 3.8489990234375, 4.03759765625, 4.2261962890625, 4.414794921875, 4.6033935546875, 4.7919921875, 4.9805908203125, 5.169189453125, 5.3577880859375, 5.54638671875, 5.7349853515625, 5.923583984375, 6.1121826171875, 6.30078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 20.0, 6.0, 12.0, 21.0, 23.0, 22.0, 33.0, 47.0, 74.0, 55.0, 59.0, 66.0, 59.0, 72.0, 65.0, 76.0, 60.0, 51.0, 39.0, 28.0, 27.0, 26.0, 17.0, 13.0, 15.0, 4.0, 5.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.030517578125, -8.62353515625, -8.216552734375, -7.8095703125, -7.402587890625, -6.99560546875, -6.588623046875, -6.181640625, -5.774658203125, -5.36767578125, -4.960693359375, -4.5537109375, -4.146728515625, -3.73974609375, -3.332763671875, -2.92578125, -2.518798828125, -2.11181640625, -1.704833984375, -1.2978515625, -0.890869140625, -0.48388671875, -0.076904296875, 0.330078125, 0.737060546875, 1.14404296875, 1.551025390625, 1.9580078125, 2.364990234375, 2.77197265625, 3.178955078125, 3.5859375, 3.992919921875, 4.39990234375, 4.806884765625, 5.2138671875, 5.620849609375, 6.02783203125, 6.434814453125, 6.841796875, 7.248779296875, 7.65576171875, 8.062744140625, 8.4697265625, 8.876708984375, 9.28369140625, 9.690673828125, 10.09765625, 10.504638671875, 10.91162109375, 11.318603515625, 11.7255859375, 12.132568359375, 12.53955078125, 12.946533203125, 13.353515625, 13.760498046875, 14.16748046875, 14.574462890625, 14.9814453125, 15.388427734375, 15.79541015625, 16.202392578125, 16.609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 16.0, 9.0, 18.0, 22.0, 34.0, 50.0, 101.0, 253.0, 667.0, 2947.0, 24846.0, 802121.0, 205356.0, 9723.0, 1574.0, 442.0, 172.0, 75.0, 43.0, 18.0, 21.0, 12.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.675933837890625, -3.53350830078125, -3.391082763671875, -3.2486572265625, -3.106231689453125, -2.96380615234375, -2.821380615234375, -2.678955078125, -2.536529541015625, -2.39410400390625, -2.251678466796875, -2.1092529296875, -1.966827392578125, -1.82440185546875, -1.681976318359375, -1.53955078125, -1.397125244140625, -1.25469970703125, -1.112274169921875, -0.9698486328125, -0.827423095703125, -0.68499755859375, -0.542572021484375, -0.400146484375, -0.257720947265625, -0.11529541015625, 0.027130126953125, 0.1695556640625, 0.311981201171875, 0.45440673828125, 0.596832275390625, 0.7392578125, 0.881683349609375, 1.02410888671875, 1.166534423828125, 1.3089599609375, 1.451385498046875, 1.59381103515625, 1.736236572265625, 1.878662109375, 2.021087646484375, 2.16351318359375, 2.305938720703125, 2.4483642578125, 2.590789794921875, 2.73321533203125, 2.875640869140625, 3.01806640625, 3.160491943359375, 3.30291748046875, 3.445343017578125, 3.5877685546875, 3.730194091796875, 3.87261962890625, 4.015045166015625, 4.157470703125, 4.299896240234375, 4.44232177734375, 4.584747314453125, 4.7271728515625, 4.869598388671875, 5.01202392578125, 5.154449462890625, 5.296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 6.0, 5.0, 9.0, 11.0, 19.0, 29.0, 41.0, 56.0, 100.0, 124.0, 163.0, 127.0, 101.0, 68.0, 42.0, 44.0, 24.0, 7.0, 7.0, 4.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006742477416992188, -0.0006572604179382324, -0.0006402730941772461, -0.0006232857704162598, -0.0006062984466552734, -0.0005893111228942871, -0.0005723237991333008, -0.0005553364753723145, -0.0005383491516113281, -0.0005213618278503418, -0.0005043745040893555, -0.00048738718032836914, -0.0004703998565673828, -0.0004534125328063965, -0.00043642520904541016, -0.00041943788528442383, -0.0004024505615234375, -0.00038546323776245117, -0.00036847591400146484, -0.0003514885902404785, -0.0003345012664794922, -0.00031751394271850586, -0.00030052661895751953, -0.0002835392951965332, -0.0002665519714355469, -0.00024956464767456055, -0.00023257732391357422, -0.0002155900001525879, -0.00019860267639160156, -0.00018161535263061523, -0.0001646280288696289, -0.00014764070510864258, -0.00013065338134765625, -0.00011366605758666992, -9.66787338256836e-05, -7.969141006469727e-05, -6.270408630371094e-05, -4.571676254272461e-05, -2.872943878173828e-05, -1.1742115020751953e-05, 5.245208740234375e-06, 2.2232532501220703e-05, 3.921985626220703e-05, 5.620718002319336e-05, 7.319450378417969e-05, 9.018182754516602e-05, 0.00010716915130615234, 0.00012415647506713867, 0.000141143798828125, 0.00015813112258911133, 0.00017511844635009766, 0.00019210577011108398, 0.0002090930938720703, 0.00022608041763305664, 0.00024306774139404297, 0.0002600550651550293, 0.0002770423889160156, 0.00029402971267700195, 0.0003110170364379883, 0.0003280043601989746, 0.00034499168395996094, 0.00036197900772094727, 0.0003789663314819336, 0.0003959536552429199, 0.00041294097900390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 2.0, 4.0, 6.0, 9.0, 18.0, 29.0, 26.0, 69.0, 125.0, 217.0, 454.0, 1206.0, 4797.0, 31024.0, 614313.0, 368529.0, 21971.0, 3851.0, 1053.0, 368.0, 215.0, 101.0, 60.0, 45.0, 22.0, 19.0, 12.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.410186767578125, -2.29498291015625, -2.179779052734375, -2.0645751953125, -1.949371337890625, -1.83416748046875, -1.718963623046875, -1.603759765625, -1.488555908203125, -1.37335205078125, -1.258148193359375, -1.1429443359375, -1.027740478515625, -0.91253662109375, -0.797332763671875, -0.68212890625, -0.566925048828125, -0.45172119140625, -0.336517333984375, -0.2213134765625, -0.106109619140625, 0.00909423828125, 0.124298095703125, 0.239501953125, 0.354705810546875, 0.46990966796875, 0.585113525390625, 0.7003173828125, 0.815521240234375, 0.93072509765625, 1.045928955078125, 1.1611328125, 1.276336669921875, 1.39154052734375, 1.506744384765625, 1.6219482421875, 1.737152099609375, 1.85235595703125, 1.967559814453125, 2.082763671875, 2.197967529296875, 2.31317138671875, 2.428375244140625, 2.5435791015625, 2.658782958984375, 2.77398681640625, 2.889190673828125, 3.00439453125, 3.119598388671875, 3.23480224609375, 3.350006103515625, 3.4652099609375, 3.580413818359375, 3.69561767578125, 3.810821533203125, 3.926025390625, 4.041229248046875, 4.15643310546875, 4.271636962890625, 4.3868408203125, 4.502044677734375, 4.61724853515625, 4.732452392578125, 4.84765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 7.0, 12.0, 17.0, 22.0, 25.0, 39.0, 51.0, 66.0, 117.0, 143.0, 141.0, 101.0, 74.0, 52.0, 37.0, 26.0, 20.0, 12.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.8984375, -4.778839111328125, -4.65924072265625, -4.539642333984375, -4.4200439453125, -4.300445556640625, -4.18084716796875, -4.061248779296875, -3.941650390625, -3.822052001953125, -3.70245361328125, -3.582855224609375, -3.4632568359375, -3.343658447265625, -3.22406005859375, -3.104461669921875, -2.98486328125, -2.865264892578125, -2.74566650390625, -2.626068115234375, -2.5064697265625, -2.386871337890625, -2.26727294921875, -2.147674560546875, -2.028076171875, -1.908477783203125, -1.78887939453125, -1.669281005859375, -1.5496826171875, -1.430084228515625, -1.31048583984375, -1.190887451171875, -1.0712890625, -0.951690673828125, -0.83209228515625, -0.712493896484375, -0.5928955078125, -0.473297119140625, -0.35369873046875, -0.234100341796875, -0.114501953125, 0.005096435546875, 0.12469482421875, 0.244293212890625, 0.3638916015625, 0.483489990234375, 0.60308837890625, 0.722686767578125, 0.84228515625, 0.961883544921875, 1.08148193359375, 1.201080322265625, 1.3206787109375, 1.440277099609375, 1.55987548828125, 1.679473876953125, 1.799072265625, 1.918670654296875, 2.03826904296875, 2.157867431640625, 2.2774658203125, 2.397064208984375, 2.51666259765625, 2.636260986328125, 2.755859375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 11.0, 21.0, 38.0, 85.0, 151.0, 164.0, 199.0, 146.0, 88.0, 50.0, 29.0, 13.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.5912094116211, -80.71609497070312, -78.84097290039062, -76.96585845947266, -75.09074401855469, -73.21562957763672, -71.34051513671875, -69.46539306640625, -67.59027862548828, -65.71516418457031, -63.84004592895508, -61.964927673339844, -60.089813232421875, -58.214698791503906, -56.33958053588867, -54.46446228027344, -52.58934783935547, -50.7142333984375, -48.839115142822266, -46.96399688720703, -45.08888244628906, -43.213768005371094, -41.33864974975586, -39.463531494140625, -37.588417053222656, -35.71330261230469, -33.83818435668945, -31.96306800842285, -30.08795166015625, -28.21283531188965, -26.337718963623047, -24.462602615356445, -22.587486267089844, -20.712369918823242, -18.83725357055664, -16.96213722229004, -15.087020874023438, -13.211904525756836, -11.336788177490234, -9.461671829223633, -7.586555480957031, -5.71143913269043, -3.836322784423828, -1.9612064361572266, -0.086090087890625, 1.7890262603759766, 3.664142608642578, 5.53925895690918, 7.414375305175781, 9.289491653442383, 11.164608001708984, 13.039724349975586, 14.914840698242188, 16.78995704650879, 18.66507339477539, 20.540189743041992, 22.415306091308594, 24.290422439575195, 26.165538787841797, 28.0406551361084, 29.915771484375, 31.7908878326416, 33.6660041809082, 35.54112243652344, 37.416236877441406]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 10.0, 22.0, 15.0, 26.0, 19.0, 24.0, 34.0, 37.0, 48.0, 55.0, 66.0, 57.0, 63.0, 60.0, 78.0, 51.0, 58.0, 39.0, 36.0, 34.0, 33.0, 27.0, 22.0, 9.0, 20.0, 9.0, 10.0, 3.0, 5.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.1971435546875, -45.620635986328125, -44.044124603271484, -42.46761703491211, -40.89110565185547, -39.314598083496094, -37.73809051513672, -36.16157913208008, -34.58506774902344, -33.00856018066406, -31.432048797607422, -29.855541229248047, -28.279029846191406, -26.70252227783203, -25.126012802124023, -23.549503326416016, -21.97299575805664, -20.396486282348633, -18.819976806640625, -17.24346923828125, -15.666958808898926, -14.090449333190918, -12.513940811157227, -10.937431335449219, -9.360921859741211, -7.784412384033203, -6.2079033851623535, -4.631394386291504, -3.054884910583496, -1.4783754348754883, 0.09813308715820312, 1.674642562866211, 3.2511558532714844, 4.827665328979492, 6.404174327850342, 7.980683326721191, 9.5571928024292, 11.133702278137207, 12.710210800170898, 14.286720275878906, 15.863229751586914, 17.439739227294922, 19.01624870300293, 20.592758178710938, 22.169265747070312, 23.745777130126953, 25.322284698486328, 26.898794174194336, 28.475303649902344, 30.05181312561035, 31.62832260131836, 33.204830169677734, 34.781341552734375, 36.35784912109375, 37.934356689453125, 39.510868072509766, 41.087379455566406, 42.66388702392578, 44.24039840698242, 45.8169059753418, 47.39341735839844, 48.96992492675781, 50.54643249511719, 52.12294387817383, 53.6994514465332]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 11.0, 6.0, 10.0, 10.0, 15.0, 23.0, 35.0, 62.0, 85.0, 132.0, 260.0, 428.0, 800.0, 1927.0, 5794.0, 40614.0, 4111647.0, 24615.0, 4439.0, 1568.0, 760.0, 389.0, 213.0, 141.0, 100.0, 50.0, 41.0, 31.0, 20.0, 21.0, 7.0, 6.0, 9.0, 2.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.77734375, -5.573974609375, -5.37060546875, -5.167236328125, -4.9638671875, -4.760498046875, -4.55712890625, -4.353759765625, -4.150390625, -3.947021484375, -3.74365234375, -3.540283203125, -3.3369140625, -3.133544921875, -2.93017578125, -2.726806640625, -2.5234375, -2.320068359375, -2.11669921875, -1.913330078125, -1.7099609375, -1.506591796875, -1.30322265625, -1.099853515625, -0.896484375, -0.693115234375, -0.48974609375, -0.286376953125, -0.0830078125, 0.120361328125, 0.32373046875, 0.527099609375, 0.73046875, 0.933837890625, 1.13720703125, 1.340576171875, 1.5439453125, 1.747314453125, 1.95068359375, 2.154052734375, 2.357421875, 2.560791015625, 2.76416015625, 2.967529296875, 3.1708984375, 3.374267578125, 3.57763671875, 3.781005859375, 3.984375, 4.187744140625, 4.39111328125, 4.594482421875, 4.7978515625, 5.001220703125, 5.20458984375, 5.407958984375, 5.611328125, 5.814697265625, 6.01806640625, 6.221435546875, 6.4248046875, 6.628173828125, 6.83154296875, 7.034912109375, 7.23828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 14.0, 12.0, 17.0, 24.0, 36.0, 47.0, 65.0, 72.0, 71.0, 96.0, 101.0, 89.0, 75.0, 76.0, 63.0, 36.0, 35.0, 20.0, 19.0, 12.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.944488525390625, -2.82843017578125, -2.712371826171875, -2.5963134765625, -2.480255126953125, -2.36419677734375, -2.248138427734375, -2.132080078125, -2.016021728515625, -1.89996337890625, -1.783905029296875, -1.6678466796875, -1.551788330078125, -1.43572998046875, -1.319671630859375, -1.20361328125, -1.087554931640625, -0.97149658203125, -0.855438232421875, -0.7393798828125, -0.623321533203125, -0.50726318359375, -0.391204833984375, -0.275146484375, -0.159088134765625, -0.04302978515625, 0.073028564453125, 0.1890869140625, 0.305145263671875, 0.42120361328125, 0.537261962890625, 0.6533203125, 0.769378662109375, 0.88543701171875, 1.001495361328125, 1.1175537109375, 1.233612060546875, 1.34967041015625, 1.465728759765625, 1.581787109375, 1.697845458984375, 1.81390380859375, 1.929962158203125, 2.0460205078125, 2.162078857421875, 2.27813720703125, 2.394195556640625, 2.51025390625, 2.626312255859375, 2.74237060546875, 2.858428955078125, 2.9744873046875, 3.090545654296875, 3.20660400390625, 3.322662353515625, 3.438720703125, 3.554779052734375, 3.67083740234375, 3.786895751953125, 3.9029541015625, 4.019012451171875, 4.13507080078125, 4.251129150390625, 4.3671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 10.0, 17.0, 24.0, 19.0, 30.0, 41.0, 49.0, 66.0, 82.0, 85.0, 126.0, 165.0, 205.0, 315.0, 463.0, 766.0, 1464.0, 3235.0, 10254.0, 80873.0, 4042592.0, 40109.0, 7159.0, 2632.0, 1196.0, 668.0, 423.0, 286.0, 227.0, 155.0, 111.0, 97.0, 64.0, 53.0, 52.0, 33.0, 34.0, 21.0, 16.0, 15.0, 13.0, 9.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 4.0], "bins": [-6.09375, -5.9111328125, -5.728515625, -5.5458984375, -5.36328125, -5.1806640625, -4.998046875, -4.8154296875, -4.6328125, -4.4501953125, -4.267578125, -4.0849609375, -3.90234375, -3.7197265625, -3.537109375, -3.3544921875, -3.171875, -2.9892578125, -2.806640625, -2.6240234375, -2.44140625, -2.2587890625, -2.076171875, -1.8935546875, -1.7109375, -1.5283203125, -1.345703125, -1.1630859375, -0.98046875, -0.7978515625, -0.615234375, -0.4326171875, -0.25, -0.0673828125, 0.115234375, 0.2978515625, 0.48046875, 0.6630859375, 0.845703125, 1.0283203125, 1.2109375, 1.3935546875, 1.576171875, 1.7587890625, 1.94140625, 2.1240234375, 2.306640625, 2.4892578125, 2.671875, 2.8544921875, 3.037109375, 3.2197265625, 3.40234375, 3.5849609375, 3.767578125, 3.9501953125, 4.1328125, 4.3154296875, 4.498046875, 4.6806640625, 4.86328125, 5.0458984375, 5.228515625, 5.4111328125, 5.59375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 9.0, 4.0, 7.0, 13.0, 52.0, 246.0, 3575.0, 106.0, 37.0, 19.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.354888916015625, -3.20391845703125, -3.052947998046875, -2.9019775390625, -2.751007080078125, -2.60003662109375, -2.449066162109375, -2.298095703125, -2.147125244140625, -1.99615478515625, -1.845184326171875, -1.6942138671875, -1.543243408203125, -1.39227294921875, -1.241302490234375, -1.09033203125, -0.939361572265625, -0.78839111328125, -0.637420654296875, -0.4864501953125, -0.335479736328125, -0.18450927734375, -0.033538818359375, 0.117431640625, 0.268402099609375, 0.41937255859375, 0.570343017578125, 0.7213134765625, 0.872283935546875, 1.02325439453125, 1.174224853515625, 1.3251953125, 1.476165771484375, 1.62713623046875, 1.778106689453125, 1.9290771484375, 2.080047607421875, 2.23101806640625, 2.381988525390625, 2.532958984375, 2.683929443359375, 2.83489990234375, 2.985870361328125, 3.1368408203125, 3.287811279296875, 3.43878173828125, 3.589752197265625, 3.74072265625, 3.891693115234375, 4.04266357421875, 4.193634033203125, 4.3446044921875, 4.495574951171875, 4.64654541015625, 4.797515869140625, 4.948486328125, 5.099456787109375, 5.25042724609375, 5.401397705078125, 5.5523681640625, 5.703338623046875, 5.85430908203125, 6.005279541015625, 6.15625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 13.0, 36.0, 73.0, 121.0, 215.0, 215.0, 156.0, 74.0, 37.0, 16.0, 17.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.207664489746094, -11.758191108703613, -11.308717727661133, -10.859244346618652, -10.409770965576172, -9.960297584533691, -9.510824203491211, -9.06135082244873, -8.61187744140625, -8.16240406036377, -7.712930679321289, -7.263457298278809, -6.813983917236328, -6.364510536193848, -5.915037155151367, -5.465563774108887, -5.0160908699035645, -4.566617488861084, -4.1171441078186035, -3.667670726776123, -3.2181973457336426, -2.768724203109741, -2.3192508220672607, -1.8697774410247803, -1.4203040599822998, -0.9708306789398193, -0.5213573575019836, -0.07188403606414795, 0.3775893449783325, 0.8270626068115234, 1.276535987854004, 1.7260093688964844, 2.175482749938965, 2.6249561309814453, 3.074429512023926, 3.5239028930664062, 3.9733762741088867, 4.422849655151367, 4.872323036193848, 5.321796417236328, 5.771269798278809, 6.220743179321289, 6.6702165603637695, 7.11968994140625, 7.5691633224487305, 8.018636703491211, 8.468110084533691, 8.917583465576172, 9.367055892944336, 9.816529273986816, 10.266002655029297, 10.715476036071777, 11.164949417114258, 11.614422798156738, 12.063896179199219, 12.5133695602417, 12.96284294128418, 13.41231632232666, 13.86178970336914, 14.311263084411621, 14.760736465454102, 15.210209846496582, 15.659683227539062, 16.109155654907227, 16.558629989624023]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 9.0, 8.0, 11.0, 8.0, 15.0, 19.0, 20.0, 27.0, 30.0, 31.0, 35.0, 44.0, 48.0, 39.0, 52.0, 43.0, 63.0, 45.0, 48.0, 53.0, 39.0, 47.0, 39.0, 34.0, 30.0, 25.0, 29.0, 21.0, 12.0, 20.0, 12.0, 7.0, 12.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.155193328857422, -5.9484992027282715, -5.741805076599121, -5.535111427307129, -5.3284173011779785, -5.121723175048828, -4.915029048919678, -4.708334922790527, -4.501641273498535, -4.294947147369385, -4.088253021240234, -3.881559133529663, -3.674865245819092, -3.4681711196899414, -3.261476993560791, -3.0547828674316406, -2.8480887413024902, -2.64139461517334, -2.4347007274627686, -2.228006601333618, -2.021312713623047, -1.8146185874938965, -1.607924461364746, -1.4012304544448853, -1.1945364475250244, -0.9878424406051636, -0.781148374080658, -0.5744543075561523, -0.3677603006362915, -0.16106629371643066, 0.04562783241271973, 0.25232183933258057, 0.4590153694152832, 0.665709376335144, 0.8724034428596497, 1.0790975093841553, 1.2857915163040161, 1.492485523223877, 1.6991796493530273, 1.9058736562728882, 2.112567663192749, 2.3192617893218994, 2.5259556770324707, 2.732649803161621, 2.9393439292907715, 3.1460378170013428, 3.352731943130493, 3.5594258308410645, 3.766119956970215, 3.9728140830993652, 4.179508209228516, 4.386201858520508, 4.592895984649658, 4.799590110778809, 5.006284236907959, 5.212978363037109, 5.419672012329102, 5.626366138458252, 5.833060264587402, 6.0397539138793945, 6.246448040008545, 6.453142166137695, 6.659836292266846, 6.866530418395996, 7.0732245445251465]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 7.0, 8.0, 21.0, 30.0, 48.0, 79.0, 134.0, 252.0, 529.0, 1181.0, 3134.0, 10047.0, 41534.0, 242574.0, 581003.0, 131979.0, 25164.0, 6825.0, 2220.0, 889.0, 382.0, 204.0, 125.0, 61.0, 38.0, 24.0, 17.0, 11.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.65234375, -5.4827880859375, -5.313232421875, -5.1436767578125, -4.97412109375, -4.8045654296875, -4.635009765625, -4.4654541015625, -4.2958984375, -4.1263427734375, -3.956787109375, -3.7872314453125, -3.61767578125, -3.4481201171875, -3.278564453125, -3.1090087890625, -2.939453125, -2.7698974609375, -2.600341796875, -2.4307861328125, -2.26123046875, -2.0916748046875, -1.922119140625, -1.7525634765625, -1.5830078125, -1.4134521484375, -1.243896484375, -1.0743408203125, -0.90478515625, -0.7352294921875, -0.565673828125, -0.3961181640625, -0.2265625, -0.0570068359375, 0.112548828125, 0.2821044921875, 0.45166015625, 0.6212158203125, 0.790771484375, 0.9603271484375, 1.1298828125, 1.2994384765625, 1.468994140625, 1.6385498046875, 1.80810546875, 1.9776611328125, 2.147216796875, 2.3167724609375, 2.486328125, 2.6558837890625, 2.825439453125, 2.9949951171875, 3.16455078125, 3.3341064453125, 3.503662109375, 3.6732177734375, 3.8427734375, 4.0123291015625, 4.181884765625, 4.3514404296875, 4.52099609375, 4.6905517578125, 4.860107421875, 5.0296630859375, 5.19921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 7.0, 9.0, 8.0, 18.0, 16.0, 32.0, 31.0, 36.0, 43.0, 51.0, 68.0, 65.0, 84.0, 86.0, 85.0, 69.0, 64.0, 60.0, 43.0, 35.0, 24.0, 17.0, 11.0, 12.0, 10.0, 6.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.076171875, -2.974395751953125, -2.87261962890625, -2.770843505859375, -2.6690673828125, -2.567291259765625, -2.46551513671875, -2.363739013671875, -2.261962890625, -2.160186767578125, -2.05841064453125, -1.956634521484375, -1.8548583984375, -1.753082275390625, -1.65130615234375, -1.549530029296875, -1.44775390625, -1.345977783203125, -1.24420166015625, -1.142425537109375, -1.0406494140625, -0.938873291015625, -0.83709716796875, -0.735321044921875, -0.633544921875, -0.531768798828125, -0.42999267578125, -0.328216552734375, -0.2264404296875, -0.124664306640625, -0.02288818359375, 0.078887939453125, 0.1806640625, 0.282440185546875, 0.38421630859375, 0.485992431640625, 0.5877685546875, 0.689544677734375, 0.79132080078125, 0.893096923828125, 0.994873046875, 1.096649169921875, 1.19842529296875, 1.300201416015625, 1.4019775390625, 1.503753662109375, 1.60552978515625, 1.707305908203125, 1.80908203125, 1.910858154296875, 2.01263427734375, 2.114410400390625, 2.2161865234375, 2.317962646484375, 2.41973876953125, 2.521514892578125, 2.623291015625, 2.725067138671875, 2.82684326171875, 2.928619384765625, 3.0303955078125, 3.132171630859375, 3.23394775390625, 3.335723876953125, 3.4375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 16.0, 19.0, 36.0, 50.0, 111.0, 203.0, 389.0, 1108.0, 4702.0, 41341.0, 817499.0, 169235.0, 10569.0, 2062.0, 612.0, 259.0, 137.0, 76.0, 44.0, 29.0, 15.0, 16.0, 3.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.5078125, -13.19158935546875, -12.8753662109375, -12.55914306640625, -12.242919921875, -11.92669677734375, -11.6104736328125, -11.29425048828125, -10.97802734375, -10.66180419921875, -10.3455810546875, -10.02935791015625, -9.713134765625, -9.39691162109375, -9.0806884765625, -8.76446533203125, -8.4482421875, -8.13201904296875, -7.8157958984375, -7.49957275390625, -7.183349609375, -6.86712646484375, -6.5509033203125, -6.23468017578125, -5.91845703125, -5.60223388671875, -5.2860107421875, -4.96978759765625, -4.653564453125, -4.33734130859375, -4.0211181640625, -3.70489501953125, -3.388671875, -3.07244873046875, -2.7562255859375, -2.44000244140625, -2.123779296875, -1.80755615234375, -1.4913330078125, -1.17510986328125, -0.85888671875, -0.54266357421875, -0.2264404296875, 0.08978271484375, 0.406005859375, 0.72222900390625, 1.0384521484375, 1.35467529296875, 1.6708984375, 1.98712158203125, 2.3033447265625, 2.61956787109375, 2.935791015625, 3.25201416015625, 3.5682373046875, 3.88446044921875, 4.20068359375, 4.51690673828125, 4.8331298828125, 5.14935302734375, 5.465576171875, 5.78179931640625, 6.0980224609375, 6.41424560546875, 6.73046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 14.0, 12.0, 14.0, 22.0, 25.0, 35.0, 35.0, 29.0, 64.0, 54.0, 68.0, 59.0, 62.0, 72.0, 55.0, 66.0, 60.0, 33.0, 34.0, 36.0, 34.0, 33.0, 19.0, 28.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.56396484375, -11.1826171875, -10.80126953125, -10.419921875, -10.03857421875, -9.6572265625, -9.27587890625, -8.89453125, -8.51318359375, -8.1318359375, -7.75048828125, -7.369140625, -6.98779296875, -6.6064453125, -6.22509765625, -5.84375, -5.46240234375, -5.0810546875, -4.69970703125, -4.318359375, -3.93701171875, -3.5556640625, -3.17431640625, -2.79296875, -2.41162109375, -2.0302734375, -1.64892578125, -1.267578125, -0.88623046875, -0.5048828125, -0.12353515625, 0.2578125, 0.63916015625, 1.0205078125, 1.40185546875, 1.783203125, 2.16455078125, 2.5458984375, 2.92724609375, 3.30859375, 3.68994140625, 4.0712890625, 4.45263671875, 4.833984375, 5.21533203125, 5.5966796875, 5.97802734375, 6.359375, 6.74072265625, 7.1220703125, 7.50341796875, 7.884765625, 8.26611328125, 8.6474609375, 9.02880859375, 9.41015625, 9.79150390625, 10.1728515625, 10.55419921875, 10.935546875, 11.31689453125, 11.6982421875, 12.07958984375, 12.4609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 11.0, 24.0, 37.0, 60.0, 129.0, 232.0, 532.0, 1266.0, 5040.0, 39378.0, 772653.0, 211647.0, 13464.0, 2537.0, 788.0, 365.0, 160.0, 81.0, 51.0, 27.0, 17.0, 13.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.849609375, -2.765228271484375, -2.68084716796875, -2.596466064453125, -2.5120849609375, -2.427703857421875, -2.34332275390625, -2.258941650390625, -2.174560546875, -2.090179443359375, -2.00579833984375, -1.921417236328125, -1.8370361328125, -1.752655029296875, -1.66827392578125, -1.583892822265625, -1.49951171875, -1.415130615234375, -1.33074951171875, -1.246368408203125, -1.1619873046875, -1.077606201171875, -0.99322509765625, -0.908843994140625, -0.824462890625, -0.740081787109375, -0.65570068359375, -0.571319580078125, -0.4869384765625, -0.402557373046875, -0.31817626953125, -0.233795166015625, -0.1494140625, -0.065032958984375, 0.01934814453125, 0.103729248046875, 0.1881103515625, 0.272491455078125, 0.35687255859375, 0.441253662109375, 0.525634765625, 0.610015869140625, 0.69439697265625, 0.778778076171875, 0.8631591796875, 0.947540283203125, 1.03192138671875, 1.116302490234375, 1.20068359375, 1.285064697265625, 1.36944580078125, 1.453826904296875, 1.5382080078125, 1.622589111328125, 1.70697021484375, 1.791351318359375, 1.875732421875, 1.960113525390625, 2.04449462890625, 2.128875732421875, 2.2132568359375, 2.297637939453125, 2.38201904296875, 2.466400146484375, 2.55078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 4.0, 9.0, 10.0, 9.0, 22.0, 28.0, 39.0, 71.0, 73.0, 121.0, 124.0, 118.0, 112.0, 78.0, 44.0, 35.0, 32.0, 18.0, 12.0, 12.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003428459167480469, -0.00033054500818252563, -0.0003182440996170044, -0.00030594319105148315, -0.0002936422824859619, -0.0002813413739204407, -0.00026904046535491943, -0.0002567395567893982, -0.00024443864822387695, -0.0002321377396583557, -0.00021983683109283447, -0.00020753592252731323, -0.000195235013961792, -0.00018293410539627075, -0.0001706331968307495, -0.00015833228826522827, -0.00014603137969970703, -0.0001337304711341858, -0.00012142956256866455, -0.00010912865400314331, -9.682774543762207e-05, -8.452683687210083e-05, -7.222592830657959e-05, -5.992501974105835e-05, -4.762411117553711e-05, -3.532320261001587e-05, -2.302229404449463e-05, -1.0721385478973389e-05, 1.5795230865478516e-06, 1.3880431652069092e-05, 2.6181340217590332e-05, 3.848224878311157e-05, 5.078315734863281e-05, 6.308406591415405e-05, 7.538497447967529e-05, 8.768588304519653e-05, 9.998679161071777e-05, 0.00011228770017623901, 0.00012458860874176025, 0.0001368895173072815, 0.00014919042587280273, 0.00016149133443832397, 0.00017379224300384521, 0.00018609315156936646, 0.0001983940601348877, 0.00021069496870040894, 0.00022299587726593018, 0.00023529678583145142, 0.00024759769439697266, 0.0002598986029624939, 0.00027219951152801514, 0.0002845004200935364, 0.0002968013286590576, 0.00030910223722457886, 0.0003214031457901001, 0.00033370405435562134, 0.0003460049629211426, 0.0003583058714866638, 0.00037060678005218506, 0.0003829076886177063, 0.00039520859718322754, 0.0004075095057487488, 0.00041981041431427, 0.00043211132287979126, 0.0004444122314453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 11.0, 21.0, 31.0, 72.0, 120.0, 354.0, 1260.0, 6783.0, 115415.0, 880431.0, 38894.0, 3872.0, 816.0, 249.0, 104.0, 47.0, 20.0, 19.0, 18.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.12109375, -5.015167236328125, -4.90924072265625, -4.803314208984375, -4.6973876953125, -4.591461181640625, -4.48553466796875, -4.379608154296875, -4.273681640625, -4.167755126953125, -4.06182861328125, -3.955902099609375, -3.8499755859375, -3.744049072265625, -3.63812255859375, -3.532196044921875, -3.42626953125, -3.320343017578125, -3.21441650390625, -3.108489990234375, -3.0025634765625, -2.896636962890625, -2.79071044921875, -2.684783935546875, -2.578857421875, -2.472930908203125, -2.36700439453125, -2.261077880859375, -2.1551513671875, -2.049224853515625, -1.94329833984375, -1.837371826171875, -1.7314453125, -1.625518798828125, -1.51959228515625, -1.413665771484375, -1.3077392578125, -1.201812744140625, -1.09588623046875, -0.989959716796875, -0.884033203125, -0.778106689453125, -0.67218017578125, -0.566253662109375, -0.4603271484375, -0.354400634765625, -0.24847412109375, -0.142547607421875, -0.03662109375, 0.069305419921875, 0.17523193359375, 0.281158447265625, 0.3870849609375, 0.493011474609375, 0.59893798828125, 0.704864501953125, 0.810791015625, 0.916717529296875, 1.02264404296875, 1.128570556640625, 1.2344970703125, 1.340423583984375, 1.44635009765625, 1.552276611328125, 1.658203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 8.0, 5.0, 9.0, 8.0, 13.0, 24.0, 26.0, 33.0, 38.0, 60.0, 67.0, 84.0, 88.0, 87.0, 92.0, 73.0, 69.0, 56.0, 41.0, 37.0, 22.0, 17.0, 15.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59375, -1.530914306640625, -1.46807861328125, -1.405242919921875, -1.3424072265625, -1.279571533203125, -1.21673583984375, -1.153900146484375, -1.091064453125, -1.028228759765625, -0.96539306640625, -0.902557373046875, -0.8397216796875, -0.776885986328125, -0.71405029296875, -0.651214599609375, -0.58837890625, -0.525543212890625, -0.46270751953125, -0.399871826171875, -0.3370361328125, -0.274200439453125, -0.21136474609375, -0.148529052734375, -0.085693359375, -0.022857666015625, 0.03997802734375, 0.102813720703125, 0.1656494140625, 0.228485107421875, 0.29132080078125, 0.354156494140625, 0.4169921875, 0.479827880859375, 0.54266357421875, 0.605499267578125, 0.6683349609375, 0.731170654296875, 0.79400634765625, 0.856842041015625, 0.919677734375, 0.982513427734375, 1.04534912109375, 1.108184814453125, 1.1710205078125, 1.233856201171875, 1.29669189453125, 1.359527587890625, 1.42236328125, 1.485198974609375, 1.54803466796875, 1.610870361328125, 1.6737060546875, 1.736541748046875, 1.79937744140625, 1.862213134765625, 1.925048828125, 1.987884521484375, 2.05072021484375, 2.113555908203125, 2.1763916015625, 2.239227294921875, 2.30206298828125, 2.364898681640625, 2.427734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 12.0, 33.0, 79.0, 143.0, 236.0, 235.0, 152.0, 75.0, 26.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.13565063476562, -69.8863525390625, -67.63704681396484, -65.38774108886719, -63.13844299316406, -60.88914108276367, -58.63983917236328, -56.39053726196289, -54.1412353515625, -51.89193344116211, -49.64263153076172, -47.39332962036133, -45.14402770996094, -42.89472579956055, -40.645423889160156, -38.396121978759766, -36.146820068359375, -33.897518157958984, -31.648216247558594, -29.398914337158203, -27.149612426757812, -24.900310516357422, -22.65100860595703, -20.40170669555664, -18.15240478515625, -15.90310287475586, -13.653800964355469, -11.404499053955078, -9.155197143554688, -6.905895233154297, -4.656593322753906, -2.4072914123535156, -0.157989501953125, 2.0913124084472656, 4.340614318847656, 6.589916229248047, 8.839218139648438, 11.088520050048828, 13.337821960449219, 15.58712387084961, 17.83642578125, 20.08572769165039, 22.33502960205078, 24.584331512451172, 26.833633422851562, 29.082935333251953, 31.332237243652344, 33.581539154052734, 35.830841064453125, 38.080142974853516, 40.329444885253906, 42.5787467956543, 44.82804870605469, 47.07735061645508, 49.32665252685547, 51.57595443725586, 53.82525634765625, 56.07455825805664, 58.32386016845703, 60.57316207885742, 62.82246398925781, 65.07176208496094, 67.3210678100586, 69.57037353515625, 71.81967163085938]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 11.0, 4.0, 8.0, 4.0, 14.0, 17.0, 16.0, 37.0, 29.0, 39.0, 59.0, 49.0, 71.0, 75.0, 73.0, 74.0, 74.0, 54.0, 74.0, 63.0, 45.0, 40.0, 19.0, 14.0, 16.0, 11.0, 11.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.77688598632812, -74.897216796875, -73.01754760742188, -71.13787078857422, -69.2582015991211, -67.37853240966797, -65.49886322021484, -63.61919021606445, -61.73952102661133, -59.8598518371582, -57.98017883300781, -56.10050964355469, -54.2208366394043, -52.34116744995117, -50.46149444580078, -48.581825256347656, -46.70215606689453, -44.822486877441406, -42.942813873291016, -41.06314468383789, -39.1834716796875, -37.303802490234375, -35.42413330078125, -33.54446029663086, -31.66478729248047, -29.78511619567871, -27.905445098876953, -26.025775909423828, -24.14610481262207, -22.266433715820312, -20.386762619018555, -18.507091522216797, -16.627422332763672, -14.747751235961914, -12.868081092834473, -10.988409996032715, -9.108739852905273, -7.229068756103516, -5.349397659301758, -3.4697275161743164, -1.5900564193725586, 0.28961431980133057, 2.1692850589752197, 4.048955917358398, 5.928626537322998, 7.808297157287598, 9.687968254089355, 11.567638397216797, 13.447309494018555, 15.326980590820312, 17.20665168762207, 19.086322784423828, 20.965991973876953, 22.84566307067871, 24.72533416748047, 26.605003356933594, 28.484676361083984, 30.364347457885742, 32.2440185546875, 34.123687744140625, 36.003360748291016, 37.88302993774414, 39.76270294189453, 41.642372131347656, 43.52204132080078]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 12.0, 18.0, 29.0, 30.0, 48.0, 69.0, 103.0, 162.0, 363.0, 812.0, 1973.0, 7133.0, 39583.0, 3259317.0, 848168.0, 27825.0, 5828.0, 1605.0, 568.0, 271.0, 151.0, 109.0, 38.0, 24.0, 14.0, 9.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.953125, -7.7677001953125, -7.582275390625, -7.3968505859375, -7.21142578125, -7.0260009765625, -6.840576171875, -6.6551513671875, -6.4697265625, -6.2843017578125, -6.098876953125, -5.9134521484375, -5.72802734375, -5.5426025390625, -5.357177734375, -5.1717529296875, -4.986328125, -4.8009033203125, -4.615478515625, -4.4300537109375, -4.24462890625, -4.0592041015625, -3.873779296875, -3.6883544921875, -3.5029296875, -3.3175048828125, -3.132080078125, -2.9466552734375, -2.76123046875, -2.5758056640625, -2.390380859375, -2.2049560546875, -2.01953125, -1.8341064453125, -1.648681640625, -1.4632568359375, -1.27783203125, -1.0924072265625, -0.906982421875, -0.7215576171875, -0.5361328125, -0.3507080078125, -0.165283203125, 0.0201416015625, 0.20556640625, 0.3909912109375, 0.576416015625, 0.7618408203125, 0.947265625, 1.1326904296875, 1.318115234375, 1.5035400390625, 1.68896484375, 1.8743896484375, 2.059814453125, 2.2452392578125, 2.4306640625, 2.6160888671875, 2.801513671875, 2.9869384765625, 3.17236328125, 3.3577880859375, 3.543212890625, 3.7286376953125, 3.9140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 21.0, 21.0, 30.0, 57.0, 69.0, 83.0, 86.0, 127.0, 112.0, 108.0, 76.0, 71.0, 50.0, 31.0, 19.0, 18.0, 11.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.911163330078125, -5.77935791015625, -5.647552490234375, -5.5157470703125, -5.383941650390625, -5.25213623046875, -5.120330810546875, -4.988525390625, -4.856719970703125, -4.72491455078125, -4.593109130859375, -4.4613037109375, -4.329498291015625, -4.19769287109375, -4.065887451171875, -3.93408203125, -3.802276611328125, -3.67047119140625, -3.538665771484375, -3.4068603515625, -3.275054931640625, -3.14324951171875, -3.011444091796875, -2.879638671875, -2.747833251953125, -2.61602783203125, -2.484222412109375, -2.3524169921875, -2.220611572265625, -2.08880615234375, -1.957000732421875, -1.8251953125, -1.693389892578125, -1.56158447265625, -1.429779052734375, -1.2979736328125, -1.166168212890625, -1.03436279296875, -0.902557373046875, -0.770751953125, -0.638946533203125, -0.50714111328125, -0.375335693359375, -0.2435302734375, -0.111724853515625, 0.02008056640625, 0.151885986328125, 0.28369140625, 0.415496826171875, 0.54730224609375, 0.679107666015625, 0.8109130859375, 0.942718505859375, 1.07452392578125, 1.206329345703125, 1.338134765625, 1.469940185546875, 1.60174560546875, 1.733551025390625, 1.8653564453125, 1.997161865234375, 2.12896728515625, 2.260772705078125, 2.392578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 19.0, 21.0, 53.0, 105.0, 210.0, 579.0, 4741.0, 3933995.0, 251482.0, 2419.0, 362.0, 154.0, 82.0, 26.0, 19.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.23046875, -14.6640625, -14.09765625, -13.53125, -12.96484375, -12.3984375, -11.83203125, -11.265625, -10.69921875, -10.1328125, -9.56640625, -9.0, -8.43359375, -7.8671875, -7.30078125, -6.734375, -6.16796875, -5.6015625, -5.03515625, -4.46875, -3.90234375, -3.3359375, -2.76953125, -2.203125, -1.63671875, -1.0703125, -0.50390625, 0.0625, 0.62890625, 1.1953125, 1.76171875, 2.328125, 2.89453125, 3.4609375, 4.02734375, 4.59375, 5.16015625, 5.7265625, 6.29296875, 6.859375, 7.42578125, 7.9921875, 8.55859375, 9.125, 9.69140625, 10.2578125, 10.82421875, 11.390625, 11.95703125, 12.5234375, 13.08984375, 13.65625, 14.22265625, 14.7890625, 15.35546875, 15.921875, 16.48828125, 17.0546875, 17.62109375, 18.1875, 18.75390625, 19.3203125, 19.88671875, 20.453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 19.0, 30.0, 57.0, 206.0, 2012.0, 1442.0, 154.0, 84.0, 29.0, 15.0, 9.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-20.96875, -20.56494140625, -20.1611328125, -19.75732421875, -19.353515625, -18.94970703125, -18.5458984375, -18.14208984375, -17.73828125, -17.33447265625, -16.9306640625, -16.52685546875, -16.123046875, -15.71923828125, -15.3154296875, -14.91162109375, -14.5078125, -14.10400390625, -13.7001953125, -13.29638671875, -12.892578125, -12.48876953125, -12.0849609375, -11.68115234375, -11.27734375, -10.87353515625, -10.4697265625, -10.06591796875, -9.662109375, -9.25830078125, -8.8544921875, -8.45068359375, -8.046875, -7.64306640625, -7.2392578125, -6.83544921875, -6.431640625, -6.02783203125, -5.6240234375, -5.22021484375, -4.81640625, -4.41259765625, -4.0087890625, -3.60498046875, -3.201171875, -2.79736328125, -2.3935546875, -1.98974609375, -1.5859375, -1.18212890625, -0.7783203125, -0.37451171875, 0.029296875, 0.43310546875, 0.8369140625, 1.24072265625, 1.64453125, 2.04833984375, 2.4521484375, 2.85595703125, 3.259765625, 3.66357421875, 4.0673828125, 4.47119140625, 4.875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 14.0, 27.0, 88.0, 224.0, 344.0, 190.0, 76.0, 24.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.2035140991211, -63.05573272705078, -60.90795135498047, -58.760169982910156, -56.612388610839844, -54.46460723876953, -52.31682205200195, -50.16904067993164, -48.02125930786133, -45.873477935791016, -43.7256965637207, -41.57791519165039, -39.43013000488281, -37.2823486328125, -35.13456726074219, -32.986785888671875, -30.839004516601562, -28.69122314453125, -26.543441772460938, -24.395658493041992, -22.24787712097168, -20.100095748901367, -17.952312469482422, -15.80453109741211, -13.656749725341797, -11.508968353271484, -9.361186027526855, -7.213404178619385, -5.065622329711914, -2.9178409576416016, -0.7700586318969727, 1.3777236938476562, 3.5254974365234375, 5.673279285430908, 7.821061134338379, 9.968843460083008, 12.11662483215332, 14.264406204223633, 16.412189483642578, 18.55997085571289, 20.707752227783203, 22.855533599853516, 25.003314971923828, 27.151098251342773, 29.298879623413086, 31.4466609954834, 33.594444274902344, 35.742225646972656, 37.89000701904297, 40.03778839111328, 42.185569763183594, 44.333351135253906, 46.48113250732422, 48.62891387939453, 50.77669906616211, 52.92448043823242, 55.072261810302734, 57.22004318237305, 59.36782455444336, 61.51560592651367, 63.66339111328125, 65.81117248535156, 67.95895385742188, 70.10673522949219, 72.2545166015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 11.0, 8.0, 13.0, 21.0, 25.0, 27.0, 41.0, 39.0, 63.0, 71.0, 71.0, 89.0, 78.0, 78.0, 66.0, 62.0, 48.0, 39.0, 37.0, 37.0, 19.0, 19.0, 17.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.344871520996094, -36.14968490600586, -34.954498291015625, -33.759315490722656, -32.56412887573242, -31.368942260742188, -30.173757553100586, -28.978572845458984, -27.78338623046875, -26.588199615478516, -25.393014907836914, -24.197830200195312, -23.002643585205078, -21.807456970214844, -20.612272262573242, -19.41708755493164, -18.221900939941406, -17.026714324951172, -15.83152961730957, -14.636343955993652, -13.441158294677734, -12.245972633361816, -11.050786972045898, -9.85560131072998, -8.660415649414062, -7.4652299880981445, -6.270044326782227, -5.074858665466309, -3.8796730041503906, -2.6844873428344727, -1.4893016815185547, -0.2941160202026367, 0.9010658264160156, 2.0962514877319336, 3.2914371490478516, 4.4866228103637695, 5.6818084716796875, 6.8769941329956055, 8.072179794311523, 9.267365455627441, 10.46255111694336, 11.657736778259277, 12.852922439575195, 14.048108100891113, 15.243293762207031, 16.438480377197266, 17.633665084838867, 18.82884979248047, 20.024036407470703, 21.219223022460938, 22.41440773010254, 23.60959243774414, 24.804779052734375, 25.99996566772461, 27.19515037536621, 28.390335083007812, 29.585521697998047, 30.78070831298828, 31.975893020629883, 33.171077728271484, 34.36626434326172, 35.56145095825195, 36.75663757324219, 37.951820373535156, 39.14700698852539]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0, 11.0, 8.0, 23.0, 21.0, 32.0, 73.0, 102.0, 186.0, 309.0, 524.0, 1001.0, 1782.0, 3392.0, 6631.0, 13536.0, 28651.0, 61283.0, 134051.0, 254950.0, 268080.0, 145440.0, 67500.0, 30945.0, 14721.0, 7216.0, 3635.0, 1962.0, 1025.0, 605.0, 317.0, 198.0, 124.0, 64.0, 43.0, 32.0, 20.0, 9.0, 12.0, 8.0, 6.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9267578125, -1.8626556396484375, -1.798553466796875, -1.7344512939453125, -1.67034912109375, -1.6062469482421875, -1.542144775390625, -1.4780426025390625, -1.4139404296875, -1.3498382568359375, -1.285736083984375, -1.2216339111328125, -1.15753173828125, -1.0934295654296875, -1.029327392578125, -0.9652252197265625, -0.901123046875, -0.8370208740234375, -0.772918701171875, -0.7088165283203125, -0.64471435546875, -0.5806121826171875, -0.516510009765625, -0.4524078369140625, -0.3883056640625, -0.3242034912109375, -0.260101318359375, -0.1959991455078125, -0.13189697265625, -0.0677947998046875, -0.003692626953125, 0.0604095458984375, 0.12451171875, 0.1886138916015625, 0.252716064453125, 0.3168182373046875, 0.38092041015625, 0.4450225830078125, 0.509124755859375, 0.5732269287109375, 0.6373291015625, 0.7014312744140625, 0.765533447265625, 0.8296356201171875, 0.89373779296875, 0.9578399658203125, 1.021942138671875, 1.0860443115234375, 1.150146484375, 1.2142486572265625, 1.278350830078125, 1.3424530029296875, 1.40655517578125, 1.4706573486328125, 1.534759521484375, 1.5988616943359375, 1.6629638671875, 1.7270660400390625, 1.791168212890625, 1.8552703857421875, 1.91937255859375, 1.9834747314453125, 2.047576904296875, 2.1116790771484375, 2.17578125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 9.0, 17.0, 19.0, 19.0, 31.0, 44.0, 39.0, 54.0, 58.0, 55.0, 66.0, 58.0, 70.0, 77.0, 61.0, 58.0, 56.0, 43.0, 35.0, 25.0, 25.0, 20.0, 11.0, 15.0, 8.0, 2.0, 3.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.248046875, -3.1705780029296875, -3.093109130859375, -3.0156402587890625, -2.93817138671875, -2.8607025146484375, -2.783233642578125, -2.7057647705078125, -2.6282958984375, -2.5508270263671875, -2.473358154296875, -2.3958892822265625, -2.31842041015625, -2.2409515380859375, -2.163482666015625, -2.0860137939453125, -2.008544921875, -1.9310760498046875, -1.853607177734375, -1.7761383056640625, -1.69866943359375, -1.6212005615234375, -1.543731689453125, -1.4662628173828125, -1.3887939453125, -1.3113250732421875, -1.233856201171875, -1.1563873291015625, -1.07891845703125, -1.0014495849609375, -0.923980712890625, -0.8465118408203125, -0.76904296875, -0.6915740966796875, -0.614105224609375, -0.5366363525390625, -0.45916748046875, -0.3816986083984375, -0.304229736328125, -0.2267608642578125, -0.1492919921875, -0.0718231201171875, 0.005645751953125, 0.0831146240234375, 0.16058349609375, 0.2380523681640625, 0.315521240234375, 0.3929901123046875, 0.470458984375, 0.5479278564453125, 0.625396728515625, 0.7028656005859375, 0.78033447265625, 0.8578033447265625, 0.935272216796875, 1.0127410888671875, 1.0902099609375, 1.1676788330078125, 1.245147705078125, 1.3226165771484375, 1.40008544921875, 1.4775543212890625, 1.555023193359375, 1.6324920654296875, 1.7099609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 5.0, 6.0, 12.0, 23.0, 24.0, 44.0, 70.0, 96.0, 170.0, 305.0, 573.0, 1146.0, 3287.0, 16758.0, 253511.0, 717816.0, 45390.0, 5781.0, 1767.0, 775.0, 396.0, 227.0, 125.0, 85.0, 52.0, 28.0, 25.0, 21.0, 15.0, 5.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.07550048828125, -4.8658447265625, -4.65618896484375, -4.446533203125, -4.23687744140625, -4.0272216796875, -3.81756591796875, -3.60791015625, -3.39825439453125, -3.1885986328125, -2.97894287109375, -2.769287109375, -2.55963134765625, -2.3499755859375, -2.14031982421875, -1.9306640625, -1.72100830078125, -1.5113525390625, -1.30169677734375, -1.092041015625, -0.88238525390625, -0.6727294921875, -0.46307373046875, -0.25341796875, -0.04376220703125, 0.1658935546875, 0.37554931640625, 0.585205078125, 0.79486083984375, 1.0045166015625, 1.21417236328125, 1.423828125, 1.63348388671875, 1.8431396484375, 2.05279541015625, 2.262451171875, 2.47210693359375, 2.6817626953125, 2.89141845703125, 3.10107421875, 3.31072998046875, 3.5203857421875, 3.73004150390625, 3.939697265625, 4.14935302734375, 4.3590087890625, 4.56866455078125, 4.7783203125, 4.98797607421875, 5.1976318359375, 5.40728759765625, 5.616943359375, 5.82659912109375, 6.0362548828125, 6.24591064453125, 6.45556640625, 6.66522216796875, 6.8748779296875, 7.08453369140625, 7.294189453125, 7.50384521484375, 7.7135009765625, 7.92315673828125, 8.1328125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 3.0, 8.0, 6.0, 16.0, 14.0, 21.0, 18.0, 20.0, 30.0, 34.0, 35.0, 32.0, 43.0, 44.0, 55.0, 36.0, 51.0, 49.0, 37.0, 48.0, 53.0, 46.0, 32.0, 33.0, 42.0, 28.0, 31.0, 13.0, 29.0, 15.0, 17.0, 16.0, 13.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.55572509765625, -6.3184814453125, -6.08123779296875, -5.843994140625, -5.60675048828125, -5.3695068359375, -5.13226318359375, -4.89501953125, -4.65777587890625, -4.4205322265625, -4.18328857421875, -3.946044921875, -3.70880126953125, -3.4715576171875, -3.23431396484375, -2.9970703125, -2.75982666015625, -2.5225830078125, -2.28533935546875, -2.048095703125, -1.81085205078125, -1.5736083984375, -1.33636474609375, -1.09912109375, -0.86187744140625, -0.6246337890625, -0.38739013671875, -0.150146484375, 0.08709716796875, 0.3243408203125, 0.56158447265625, 0.798828125, 1.03607177734375, 1.2733154296875, 1.51055908203125, 1.747802734375, 1.98504638671875, 2.2222900390625, 2.45953369140625, 2.69677734375, 2.93402099609375, 3.1712646484375, 3.40850830078125, 3.645751953125, 3.88299560546875, 4.1202392578125, 4.35748291015625, 4.5947265625, 4.83197021484375, 5.0692138671875, 5.30645751953125, 5.543701171875, 5.78094482421875, 6.0181884765625, 6.25543212890625, 6.49267578125, 6.72991943359375, 6.9671630859375, 7.20440673828125, 7.441650390625, 7.67889404296875, 7.9161376953125, 8.15338134765625, 8.390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 20.0, 26.0, 34.0, 54.0, 96.0, 154.0, 341.0, 766.0, 2251.0, 9889.0, 126852.0, 848709.0, 50477.0, 6042.0, 1592.0, 614.0, 272.0, 106.0, 70.0, 52.0, 33.0, 25.0, 16.0, 10.0, 7.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.982421875, -2.89300537109375, -2.8035888671875, -2.71417236328125, -2.624755859375, -2.53533935546875, -2.4459228515625, -2.35650634765625, -2.26708984375, -2.17767333984375, -2.0882568359375, -1.99884033203125, -1.909423828125, -1.82000732421875, -1.7305908203125, -1.64117431640625, -1.5517578125, -1.46234130859375, -1.3729248046875, -1.28350830078125, -1.194091796875, -1.10467529296875, -1.0152587890625, -0.92584228515625, -0.83642578125, -0.74700927734375, -0.6575927734375, -0.56817626953125, -0.478759765625, -0.38934326171875, -0.2999267578125, -0.21051025390625, -0.12109375, -0.03167724609375, 0.0577392578125, 0.14715576171875, 0.236572265625, 0.32598876953125, 0.4154052734375, 0.50482177734375, 0.59423828125, 0.68365478515625, 0.7730712890625, 0.86248779296875, 0.951904296875, 1.04132080078125, 1.1307373046875, 1.22015380859375, 1.3095703125, 1.39898681640625, 1.4884033203125, 1.57781982421875, 1.667236328125, 1.75665283203125, 1.8460693359375, 1.93548583984375, 2.02490234375, 2.11431884765625, 2.2037353515625, 2.29315185546875, 2.382568359375, 2.47198486328125, 2.5614013671875, 2.65081787109375, 2.740234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 7.0, 16.0, 10.0, 9.0, 21.0, 16.0, 41.0, 43.0, 52.0, 71.0, 90.0, 85.0, 95.0, 70.0, 78.0, 55.0, 53.0, 49.0, 27.0, 18.0, 23.0, 21.0, 10.0, 6.0, 10.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.0004315376281738281, -0.0004210490733385086, -0.0004105605185031891, -0.00040007196366786957, -0.00038958340883255005, -0.00037909485399723053, -0.000368606299161911, -0.0003581177443265915, -0.00034762918949127197, -0.00033714063465595245, -0.00032665207982063293, -0.0003161635249853134, -0.0003056749701499939, -0.0002951864153146744, -0.00028469786047935486, -0.00027420930564403534, -0.0002637207508087158, -0.0002532321959733963, -0.00024274364113807678, -0.00023225508630275726, -0.00022176653146743774, -0.00021127797663211823, -0.0002007894217967987, -0.0001903008669614792, -0.00017981231212615967, -0.00016932375729084015, -0.00015883520245552063, -0.0001483466476202011, -0.0001378580927848816, -0.00012736953794956207, -0.00011688098311424255, -0.00010639242827892303, -9.590387344360352e-05, -8.5415318608284e-05, -7.492676377296448e-05, -6.443820893764496e-05, -5.394965410232544e-05, -4.346109926700592e-05, -3.29725444316864e-05, -2.2483989596366882e-05, -1.1995434761047363e-05, -1.5068799257278442e-06, 8.981674909591675e-06, 1.9470229744911194e-05, 2.9958784580230713e-05, 4.044733941555023e-05, 5.093589425086975e-05, 6.142444908618927e-05, 7.191300392150879e-05, 8.240155875682831e-05, 9.289011359214783e-05, 0.00010337866842746735, 0.00011386722326278687, 0.00012435577809810638, 0.0001348443329334259, 0.00014533288776874542, 0.00015582144260406494, 0.00016630999743938446, 0.00017679855227470398, 0.0001872871071100235, 0.00019777566194534302, 0.00020826421678066254, 0.00021875277161598206, 0.00022924132645130157, 0.0002397298812866211]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 3.0, 5.0, 4.0, 11.0, 19.0, 22.0, 42.0, 57.0, 111.0, 205.0, 451.0, 1202.0, 3660.0, 21785.0, 328120.0, 648157.0, 36762.0, 5405.0, 1410.0, 521.0, 246.0, 130.0, 75.0, 58.0, 28.0, 20.0, 8.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5859375, -2.512298583984375, -2.43865966796875, -2.365020751953125, -2.2913818359375, -2.217742919921875, -2.14410400390625, -2.070465087890625, -1.996826171875, -1.923187255859375, -1.84954833984375, -1.775909423828125, -1.7022705078125, -1.628631591796875, -1.55499267578125, -1.481353759765625, -1.40771484375, -1.334075927734375, -1.26043701171875, -1.186798095703125, -1.1131591796875, -1.039520263671875, -0.96588134765625, -0.892242431640625, -0.818603515625, -0.744964599609375, -0.67132568359375, -0.597686767578125, -0.5240478515625, -0.450408935546875, -0.37677001953125, -0.303131103515625, -0.2294921875, -0.155853271484375, -0.08221435546875, -0.008575439453125, 0.0650634765625, 0.138702392578125, 0.21234130859375, 0.285980224609375, 0.359619140625, 0.433258056640625, 0.50689697265625, 0.580535888671875, 0.6541748046875, 0.727813720703125, 0.80145263671875, 0.875091552734375, 0.94873046875, 1.022369384765625, 1.09600830078125, 1.169647216796875, 1.2432861328125, 1.316925048828125, 1.39056396484375, 1.464202880859375, 1.537841796875, 1.611480712890625, 1.68511962890625, 1.758758544921875, 1.8323974609375, 1.906036376953125, 1.97967529296875, 2.053314208984375, 2.126953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 3.0, 12.0, 2.0, 18.0, 12.0, 17.0, 18.0, 25.0, 41.0, 36.0, 53.0, 56.0, 52.0, 71.0, 76.0, 79.0, 74.0, 60.0, 51.0, 50.0, 33.0, 32.0, 27.0, 16.0, 20.0, 15.0, 6.0, 3.0, 7.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5478515625, -1.4976654052734375, -1.447479248046875, -1.3972930908203125, -1.34710693359375, -1.2969207763671875, -1.246734619140625, -1.1965484619140625, -1.1463623046875, -1.0961761474609375, -1.045989990234375, -0.9958038330078125, -0.94561767578125, -0.8954315185546875, -0.845245361328125, -0.7950592041015625, -0.744873046875, -0.6946868896484375, -0.644500732421875, -0.5943145751953125, -0.54412841796875, -0.4939422607421875, -0.443756103515625, -0.3935699462890625, -0.3433837890625, -0.2931976318359375, -0.243011474609375, -0.1928253173828125, -0.14263916015625, -0.0924530029296875, -0.042266845703125, 0.0079193115234375, 0.05810546875, 0.1082916259765625, 0.158477783203125, 0.2086639404296875, 0.25885009765625, 0.3090362548828125, 0.359222412109375, 0.4094085693359375, 0.4595947265625, 0.5097808837890625, 0.559967041015625, 0.6101531982421875, 0.66033935546875, 0.7105255126953125, 0.760711669921875, 0.8108978271484375, 0.861083984375, 0.9112701416015625, 0.961456298828125, 1.0116424560546875, 1.06182861328125, 1.1120147705078125, 1.162200927734375, 1.2123870849609375, 1.2625732421875, 1.3127593994140625, 1.362945556640625, 1.4131317138671875, 1.46331787109375, 1.5135040283203125, 1.563690185546875, 1.6138763427734375, 1.6640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 15.0, 59.0, 194.0, 420.0, 239.0, 53.0, 14.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.158538818359375, -41.318721771240234, -38.478904724121094, -35.63909149169922, -32.79927062988281, -29.959455490112305, -27.119640350341797, -24.279823303222656, -21.440006256103516, -18.600189208984375, -15.76037311553955, -12.920557022094727, -10.080739974975586, -7.240922927856445, -4.4011077880859375, -1.5612907409667969, 1.2785263061523438, 4.118342876434326, 6.958159446716309, 9.797975540161133, 12.637792587280273, 15.477609634399414, 18.317424774169922, 21.157241821289062, 23.997058868408203, 26.836875915527344, 29.676692962646484, 32.516510009765625, 35.3563232421875, 38.196144104003906, 41.03595733642578, 43.87577438354492, 46.71559143066406, 49.5554084777832, 52.395225524902344, 55.23503875732422, 58.074859619140625, 60.9146728515625, 63.75448989868164, 66.59430694580078, 69.43412780761719, 72.27394104003906, 75.11376190185547, 77.95357513427734, 80.79339599609375, 83.63320922851562, 86.4730224609375, 89.3128433227539, 92.15265655517578, 94.99246978759766, 97.83229064941406, 100.67210388183594, 103.51192474365234, 106.35173797607422, 109.19155883789062, 112.0313720703125, 114.87118530273438, 117.71099853515625, 120.55081939697266, 123.39063262939453, 126.23045349121094, 129.0702667236328, 131.9100799560547, 134.74990844726562, 137.5897216796875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 5.0, 10.0, 12.0, 22.0, 20.0, 30.0, 32.0, 28.0, 24.0, 30.0, 38.0, 39.0, 44.0, 71.0, 71.0, 73.0, 56.0, 58.0, 59.0, 43.0, 30.0, 47.0, 33.0, 22.0, 25.0, 14.0, 11.0, 10.0, 3.0, 5.0, 4.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.795791625976562, -23.709667205810547, -22.6235408782959, -21.537416458129883, -20.451292037963867, -19.36516571044922, -18.279041290283203, -17.192916870117188, -16.106792449951172, -15.02066707611084, -13.934542655944824, -12.848417282104492, -11.762292861938477, -10.676167488098145, -9.590042114257812, -8.503917694091797, -7.417791366577148, -6.331666469573975, -5.245541572570801, -4.159416198730469, -3.073291301727295, -1.987166404724121, -0.9010410308837891, 0.18508386611938477, 1.2712087631225586, 2.3573336601257324, 3.4434587955474854, 4.529583930969238, 5.615708827972412, 6.701833724975586, 7.787959098815918, 8.87408447265625, 9.960208892822266, 11.046334266662598, 12.132458686828613, 13.218584060668945, 14.304708480834961, 15.390833854675293, 16.476959228515625, 17.56308364868164, 18.649208068847656, 19.735332489013672, 20.82145881652832, 21.907583236694336, 22.99370765686035, 24.079833984375, 25.165958404541016, 26.25208282470703, 27.33820915222168, 28.424333572387695, 29.510459899902344, 30.59658432006836, 31.682708740234375, 32.76883316040039, 33.854957580566406, 34.94108581542969, 36.0272102355957, 37.11333465576172, 38.199459075927734, 39.28558349609375, 40.37171173095703, 41.45783615112305, 42.54396057128906, 43.63008499145508, 44.716209411621094]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 5.0, 11.0, 9.0, 13.0, 19.0, 34.0, 36.0, 54.0, 83.0, 102.0, 165.0, 420.0, 3144.0, 185158.0, 3992208.0, 11128.0, 893.0, 298.0, 143.0, 102.0, 59.0, 55.0, 40.0, 19.0, 15.0, 16.0, 11.0, 7.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.2939453125, -8.986328125, -8.6787109375, -8.37109375, -8.0634765625, -7.755859375, -7.4482421875, -7.140625, -6.8330078125, -6.525390625, -6.2177734375, -5.91015625, -5.6025390625, -5.294921875, -4.9873046875, -4.6796875, -4.3720703125, -4.064453125, -3.7568359375, -3.44921875, -3.1416015625, -2.833984375, -2.5263671875, -2.21875, -1.9111328125, -1.603515625, -1.2958984375, -0.98828125, -0.6806640625, -0.373046875, -0.0654296875, 0.2421875, 0.5498046875, 0.857421875, 1.1650390625, 1.47265625, 1.7802734375, 2.087890625, 2.3955078125, 2.703125, 3.0107421875, 3.318359375, 3.6259765625, 3.93359375, 4.2412109375, 4.548828125, 4.8564453125, 5.1640625, 5.4716796875, 5.779296875, 6.0869140625, 6.39453125, 6.7021484375, 7.009765625, 7.3173828125, 7.625, 7.9326171875, 8.240234375, 8.5478515625, 8.85546875, 9.1630859375, 9.470703125, 9.7783203125, 10.0859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 10.0, 17.0, 21.0, 28.0, 43.0, 43.0, 49.0, 53.0, 66.0, 59.0, 75.0, 73.0, 79.0, 60.0, 47.0, 47.0, 54.0, 42.0, 29.0, 29.0, 16.0, 15.0, 15.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.880859375, -1.80718994140625, -1.7335205078125, -1.65985107421875, -1.586181640625, -1.51251220703125, -1.4388427734375, -1.36517333984375, -1.29150390625, -1.21783447265625, -1.1441650390625, -1.07049560546875, -0.996826171875, -0.92315673828125, -0.8494873046875, -0.77581787109375, -0.7021484375, -0.62847900390625, -0.5548095703125, -0.48114013671875, -0.407470703125, -0.33380126953125, -0.2601318359375, -0.18646240234375, -0.11279296875, -0.03912353515625, 0.0345458984375, 0.10821533203125, 0.181884765625, 0.25555419921875, 0.3292236328125, 0.40289306640625, 0.4765625, 0.55023193359375, 0.6239013671875, 0.69757080078125, 0.771240234375, 0.84490966796875, 0.9185791015625, 0.99224853515625, 1.06591796875, 1.13958740234375, 1.2132568359375, 1.28692626953125, 1.360595703125, 1.43426513671875, 1.5079345703125, 1.58160400390625, 1.6552734375, 1.72894287109375, 1.8026123046875, 1.87628173828125, 1.949951171875, 2.02362060546875, 2.0972900390625, 2.17095947265625, 2.24462890625, 2.31829833984375, 2.3919677734375, 2.46563720703125, 2.539306640625, 2.61297607421875, 2.6866455078125, 2.76031494140625, 2.833984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 17.0, 19.0, 21.0, 40.0, 96.0, 214.0, 538.0, 1380.0, 4035.0, 14269.0, 80299.0, 3568207.0, 480897.0, 33094.0, 7496.0, 2333.0, 801.0, 279.0, 121.0, 50.0, 23.0, 16.0, 12.0, 6.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55859375, -4.410400390625, -4.26220703125, -4.114013671875, -3.9658203125, -3.817626953125, -3.66943359375, -3.521240234375, -3.373046875, -3.224853515625, -3.07666015625, -2.928466796875, -2.7802734375, -2.632080078125, -2.48388671875, -2.335693359375, -2.1875, -2.039306640625, -1.89111328125, -1.742919921875, -1.5947265625, -1.446533203125, -1.29833984375, -1.150146484375, -1.001953125, -0.853759765625, -0.70556640625, -0.557373046875, -0.4091796875, -0.260986328125, -0.11279296875, 0.035400390625, 0.18359375, 0.331787109375, 0.47998046875, 0.628173828125, 0.7763671875, 0.924560546875, 1.07275390625, 1.220947265625, 1.369140625, 1.517333984375, 1.66552734375, 1.813720703125, 1.9619140625, 2.110107421875, 2.25830078125, 2.406494140625, 2.5546875, 2.702880859375, 2.85107421875, 2.999267578125, 3.1474609375, 3.295654296875, 3.44384765625, 3.592041015625, 3.740234375, 3.888427734375, 4.03662109375, 4.184814453125, 4.3330078125, 4.481201171875, 4.62939453125, 4.777587890625, 4.92578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 5.0, 7.0, 12.0, 10.0, 20.0, 38.0, 43.0, 101.0, 220.0, 508.0, 1112.0, 1046.0, 457.0, 193.0, 85.0, 59.0, 35.0, 29.0, 14.0, 17.0, 8.0, 9.0, 12.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.27239990234375, -4.1463623046875, -4.02032470703125, -3.894287109375, -3.76824951171875, -3.6422119140625, -3.51617431640625, -3.39013671875, -3.26409912109375, -3.1380615234375, -3.01202392578125, -2.885986328125, -2.75994873046875, -2.6339111328125, -2.50787353515625, -2.3818359375, -2.25579833984375, -2.1297607421875, -2.00372314453125, -1.877685546875, -1.75164794921875, -1.6256103515625, -1.49957275390625, -1.37353515625, -1.24749755859375, -1.1214599609375, -0.99542236328125, -0.869384765625, -0.74334716796875, -0.6173095703125, -0.49127197265625, -0.365234375, -0.23919677734375, -0.1131591796875, 0.01287841796875, 0.138916015625, 0.26495361328125, 0.3909912109375, 0.51702880859375, 0.64306640625, 0.76910400390625, 0.8951416015625, 1.02117919921875, 1.147216796875, 1.27325439453125, 1.3992919921875, 1.52532958984375, 1.6513671875, 1.77740478515625, 1.9034423828125, 2.02947998046875, 2.155517578125, 2.28155517578125, 2.4075927734375, 2.53363037109375, 2.65966796875, 2.78570556640625, 2.9117431640625, 3.03778076171875, 3.163818359375, 3.28985595703125, 3.4158935546875, 3.54193115234375, 3.66796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 23.0, 59.0, 176.0, 307.0, 266.0, 106.0, 31.0, 14.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.08795928955078, -45.64741897583008, -44.20687484741211, -42.766334533691406, -41.32579040527344, -39.885250091552734, -38.444705963134766, -37.00416564941406, -35.563621520996094, -34.12308120727539, -32.68253707885742, -31.241994857788086, -29.80145263671875, -28.360910415649414, -26.920368194580078, -25.479827880859375, -24.03928565979004, -22.598743438720703, -21.158201217651367, -19.71765899658203, -18.277116775512695, -16.83657455444336, -15.39603328704834, -13.955491065979004, -12.514948844909668, -11.074406623840332, -9.633864402770996, -8.193323135375977, -6.752780437469482, -5.3122382164001465, -3.8716964721679688, -2.431154251098633, -0.9906120300292969, 0.4499300718307495, 1.890472173690796, 3.3310141563415527, 4.771556377410889, 6.212098598480225, 7.652640342712402, 9.093182563781738, 10.533724784851074, 11.97426700592041, 13.414809226989746, 14.855350494384766, 16.2958927154541, 17.736434936523438, 19.176977157592773, 20.61751937866211, 22.058061599731445, 23.49860382080078, 24.939146041870117, 26.379688262939453, 27.82023048400879, 29.260772705078125, 30.701313018798828, 32.1418571472168, 33.5823974609375, 35.0229377746582, 36.46348190307617, 37.904022216796875, 39.344566345214844, 40.78510665893555, 42.225650787353516, 43.66619110107422, 45.10673522949219]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 21.0, 19.0, 17.0, 22.0, 27.0, 29.0, 33.0, 39.0, 55.0, 50.0, 62.0, 61.0, 71.0, 58.0, 56.0, 58.0, 44.0, 42.0, 44.0, 29.0, 32.0, 19.0, 26.0, 13.0, 12.0, 10.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.723228454589844, -21.146329879760742, -20.56943130493164, -19.992534637451172, -19.41563606262207, -18.83873748779297, -18.261838912963867, -17.684940338134766, -17.108043670654297, -16.531145095825195, -15.95424747467041, -15.377348899841309, -14.800451278686523, -14.223552703857422, -13.64665412902832, -13.069756507873535, -12.492857933044434, -11.915959358215332, -11.339061737060547, -10.762163162231445, -10.18526554107666, -9.608366966247559, -9.031469345092773, -8.454570770263672, -7.8776726722717285, -7.300774574279785, -6.723876476287842, -6.146978378295898, -5.570079803466797, -4.993182182312012, -4.41628360748291, -3.839385509490967, -3.26248836517334, -2.6855902671813965, -2.108692169189453, -1.5317938327789307, -0.9548957347869873, -0.37799763679504395, 0.19890069961547852, 0.7757987976074219, 1.3526968955993652, 1.9295949935913086, 2.506493091583252, 3.0833914279937744, 3.6602895259857178, 4.237187385559082, 4.814085960388184, 5.390984058380127, 5.96788215637207, 6.544780254364014, 7.121678352355957, 7.698576927185059, 8.275474548339844, 8.852373123168945, 9.429271697998047, 10.006169319152832, 10.583066940307617, 11.159965515136719, 11.736863136291504, 12.313761711120605, 12.89065933227539, 13.467557907104492, 14.044456481933594, 14.621354103088379, 15.19825267791748]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 15.0, 20.0, 26.0, 36.0, 54.0, 74.0, 119.0, 175.0, 288.0, 498.0, 816.0, 1508.0, 2830.0, 5489.0, 11196.0, 24232.0, 54002.0, 120125.0, 242235.0, 284824.0, 162487.0, 74040.0, 32986.0, 15161.0, 7189.0, 3588.0, 1851.0, 1074.0, 582.0, 390.0, 209.0, 131.0, 94.0, 48.0, 43.0, 29.0, 19.0, 16.0, 10.0, 11.0, 5.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.08203125, -2.015289306640625, -1.94854736328125, -1.881805419921875, -1.8150634765625, -1.748321533203125, -1.68157958984375, -1.614837646484375, -1.548095703125, -1.481353759765625, -1.41461181640625, -1.347869873046875, -1.2811279296875, -1.214385986328125, -1.14764404296875, -1.080902099609375, -1.01416015625, -0.947418212890625, -0.88067626953125, -0.813934326171875, -0.7471923828125, -0.680450439453125, -0.61370849609375, -0.546966552734375, -0.480224609375, -0.413482666015625, -0.34674072265625, -0.279998779296875, -0.2132568359375, -0.146514892578125, -0.07977294921875, -0.013031005859375, 0.0537109375, 0.120452880859375, 0.18719482421875, 0.253936767578125, 0.3206787109375, 0.387420654296875, 0.45416259765625, 0.520904541015625, 0.587646484375, 0.654388427734375, 0.72113037109375, 0.787872314453125, 0.8546142578125, 0.921356201171875, 0.98809814453125, 1.054840087890625, 1.12158203125, 1.188323974609375, 1.25506591796875, 1.321807861328125, 1.3885498046875, 1.455291748046875, 1.52203369140625, 1.588775634765625, 1.655517578125, 1.722259521484375, 1.78900146484375, 1.855743408203125, 1.9224853515625, 1.989227294921875, 2.05596923828125, 2.122711181640625, 2.189453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 8.0, 12.0, 18.0, 15.0, 29.0, 35.0, 22.0, 38.0, 36.0, 51.0, 51.0, 39.0, 42.0, 61.0, 45.0, 52.0, 54.0, 47.0, 52.0, 28.0, 35.0, 37.0, 35.0, 28.0, 23.0, 16.0, 15.0, 13.0, 10.0, 7.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.861328125, -1.8057861328125, -1.750244140625, -1.6947021484375, -1.63916015625, -1.5836181640625, -1.528076171875, -1.4725341796875, -1.4169921875, -1.3614501953125, -1.305908203125, -1.2503662109375, -1.19482421875, -1.1392822265625, -1.083740234375, -1.0281982421875, -0.97265625, -0.9171142578125, -0.861572265625, -0.8060302734375, -0.75048828125, -0.6949462890625, -0.639404296875, -0.5838623046875, -0.5283203125, -0.4727783203125, -0.417236328125, -0.3616943359375, -0.30615234375, -0.2506103515625, -0.195068359375, -0.1395263671875, -0.083984375, -0.0284423828125, 0.027099609375, 0.0826416015625, 0.13818359375, 0.1937255859375, 0.249267578125, 0.3048095703125, 0.3603515625, 0.4158935546875, 0.471435546875, 0.5269775390625, 0.58251953125, 0.6380615234375, 0.693603515625, 0.7491455078125, 0.8046875, 0.8602294921875, 0.915771484375, 0.9713134765625, 1.02685546875, 1.0823974609375, 1.137939453125, 1.1934814453125, 1.2490234375, 1.3045654296875, 1.360107421875, 1.4156494140625, 1.47119140625, 1.5267333984375, 1.582275390625, 1.6378173828125, 1.693359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 7.0, 13.0, 9.0, 22.0, 35.0, 60.0, 104.0, 197.0, 518.0, 1223.0, 4666.0, 43619.0, 741767.0, 238578.0, 13977.0, 2317.0, 759.0, 305.0, 145.0, 77.0, 57.0, 32.0, 20.0, 13.0, 6.0, 6.0, 3.0, 7.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4296875, -6.1895751953125, -5.949462890625, -5.7093505859375, -5.46923828125, -5.2291259765625, -4.989013671875, -4.7489013671875, -4.5087890625, -4.2686767578125, -4.028564453125, -3.7884521484375, -3.54833984375, -3.3082275390625, -3.068115234375, -2.8280029296875, -2.587890625, -2.3477783203125, -2.107666015625, -1.8675537109375, -1.62744140625, -1.3873291015625, -1.147216796875, -0.9071044921875, -0.6669921875, -0.4268798828125, -0.186767578125, 0.0533447265625, 0.29345703125, 0.5335693359375, 0.773681640625, 1.0137939453125, 1.25390625, 1.4940185546875, 1.734130859375, 1.9742431640625, 2.21435546875, 2.4544677734375, 2.694580078125, 2.9346923828125, 3.1748046875, 3.4149169921875, 3.655029296875, 3.8951416015625, 4.13525390625, 4.3753662109375, 4.615478515625, 4.8555908203125, 5.095703125, 5.3358154296875, 5.575927734375, 5.8160400390625, 6.05615234375, 6.2962646484375, 6.536376953125, 6.7764892578125, 7.0166015625, 7.2567138671875, 7.496826171875, 7.7369384765625, 7.97705078125, 8.2171630859375, 8.457275390625, 8.6973876953125, 8.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 6.0, 4.0, 11.0, 10.0, 18.0, 15.0, 16.0, 29.0, 18.0, 29.0, 38.0, 38.0, 43.0, 41.0, 35.0, 46.0, 50.0, 51.0, 37.0, 54.0, 45.0, 41.0, 40.0, 42.0, 35.0, 27.0, 28.0, 24.0, 25.0, 15.0, 14.0, 12.0, 11.0, 9.0, 11.0, 7.0, 6.0, 2.0, 7.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.94921875, -5.770263671875, -5.59130859375, -5.412353515625, -5.2333984375, -5.054443359375, -4.87548828125, -4.696533203125, -4.517578125, -4.338623046875, -4.15966796875, -3.980712890625, -3.8017578125, -3.622802734375, -3.44384765625, -3.264892578125, -3.0859375, -2.906982421875, -2.72802734375, -2.549072265625, -2.3701171875, -2.191162109375, -2.01220703125, -1.833251953125, -1.654296875, -1.475341796875, -1.29638671875, -1.117431640625, -0.9384765625, -0.759521484375, -0.58056640625, -0.401611328125, -0.22265625, -0.043701171875, 0.13525390625, 0.314208984375, 0.4931640625, 0.672119140625, 0.85107421875, 1.030029296875, 1.208984375, 1.387939453125, 1.56689453125, 1.745849609375, 1.9248046875, 2.103759765625, 2.28271484375, 2.461669921875, 2.640625, 2.819580078125, 2.99853515625, 3.177490234375, 3.3564453125, 3.535400390625, 3.71435546875, 3.893310546875, 4.072265625, 4.251220703125, 4.43017578125, 4.609130859375, 4.7880859375, 4.967041015625, 5.14599609375, 5.324951171875, 5.50390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 8.0, 10.0, 11.0, 9.0, 24.0, 25.0, 25.0, 51.0, 82.0, 150.0, 263.0, 540.0, 1204.0, 3503.0, 15985.0, 196425.0, 770780.0, 48499.0, 7254.0, 2035.0, 777.0, 397.0, 180.0, 121.0, 70.0, 33.0, 31.0, 11.0, 15.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.3128662109375, -2.217529296875, -2.1221923828125, -2.02685546875, -1.9315185546875, -1.836181640625, -1.7408447265625, -1.6455078125, -1.5501708984375, -1.454833984375, -1.3594970703125, -1.26416015625, -1.1688232421875, -1.073486328125, -0.9781494140625, -0.8828125, -0.7874755859375, -0.692138671875, -0.5968017578125, -0.50146484375, -0.4061279296875, -0.310791015625, -0.2154541015625, -0.1201171875, -0.0247802734375, 0.070556640625, 0.1658935546875, 0.26123046875, 0.3565673828125, 0.451904296875, 0.5472412109375, 0.642578125, 0.7379150390625, 0.833251953125, 0.9285888671875, 1.02392578125, 1.1192626953125, 1.214599609375, 1.3099365234375, 1.4052734375, 1.5006103515625, 1.595947265625, 1.6912841796875, 1.78662109375, 1.8819580078125, 1.977294921875, 2.0726318359375, 2.16796875, 2.2633056640625, 2.358642578125, 2.4539794921875, 2.54931640625, 2.6446533203125, 2.739990234375, 2.8353271484375, 2.9306640625, 3.0260009765625, 3.121337890625, 3.2166748046875, 3.31201171875, 3.4073486328125, 3.502685546875, 3.5980224609375, 3.693359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 5.0, 19.0, 29.0, 38.0, 56.0, 79.0, 119.0, 122.0, 157.0, 122.0, 86.0, 72.0, 29.0, 24.0, 8.0, 9.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005316734313964844, -0.0005120113492012024, -0.0004923492670059204, -0.00047268718481063843, -0.00045302510261535645, -0.00043336302042007446, -0.0004137009382247925, -0.0003940388560295105, -0.0003743767738342285, -0.00035471469163894653, -0.00033505260944366455, -0.00031539052724838257, -0.0002957284450531006, -0.0002760663628578186, -0.0002564042806625366, -0.00023674219846725464, -0.00021708011627197266, -0.00019741803407669067, -0.0001777559518814087, -0.0001580938696861267, -0.00013843178749084473, -0.00011876970529556274, -9.910762310028076e-05, -7.944554090499878e-05, -5.97834587097168e-05, -4.0121376514434814e-05, -2.0459294319152832e-05, -7.972121238708496e-07, 1.8864870071411133e-05, 3.8526952266693115e-05, 5.81890344619751e-05, 7.785111665725708e-05, 9.751319885253906e-05, 0.00011717528104782104, 0.00013683736324310303, 0.000156499445438385, 0.000176161527633667, 0.00019582360982894897, 0.00021548569202423096, 0.00023514777421951294, 0.0002548098564147949, 0.0002744719386100769, 0.0002941340208053589, 0.00031379610300064087, 0.00033345818519592285, 0.00035312026739120483, 0.0003727823495864868, 0.0003924444317817688, 0.0004121065139770508, 0.00043176859617233276, 0.00045143067836761475, 0.00047109276056289673, 0.0004907548427581787, 0.0005104169249534607, 0.0005300790071487427, 0.0005497410893440247, 0.0005694031715393066, 0.0005890652537345886, 0.0006087273359298706, 0.0006283894181251526, 0.0006480515003204346, 0.0006677135825157166, 0.0006873756647109985, 0.0007070377469062805, 0.0007266998291015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 4.0, 6.0, 6.0, 16.0, 13.0, 20.0, 31.0, 53.0, 95.0, 115.0, 203.0, 396.0, 749.0, 1720.0, 5231.0, 23326.0, 193250.0, 698654.0, 103256.0, 14877.0, 3726.0, 1394.0, 625.0, 325.0, 167.0, 81.0, 68.0, 41.0, 26.0, 27.0, 12.0, 6.0, 8.0, 4.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.76953125, -1.704864501953125, -1.64019775390625, -1.575531005859375, -1.5108642578125, -1.446197509765625, -1.38153076171875, -1.316864013671875, -1.252197265625, -1.187530517578125, -1.12286376953125, -1.058197021484375, -0.9935302734375, -0.928863525390625, -0.86419677734375, -0.799530029296875, -0.73486328125, -0.670196533203125, -0.60552978515625, -0.540863037109375, -0.4761962890625, -0.411529541015625, -0.34686279296875, -0.282196044921875, -0.217529296875, -0.152862548828125, -0.08819580078125, -0.023529052734375, 0.0411376953125, 0.105804443359375, 0.17047119140625, 0.235137939453125, 0.2998046875, 0.364471435546875, 0.42913818359375, 0.493804931640625, 0.5584716796875, 0.623138427734375, 0.68780517578125, 0.752471923828125, 0.817138671875, 0.881805419921875, 0.94647216796875, 1.011138916015625, 1.0758056640625, 1.140472412109375, 1.20513916015625, 1.269805908203125, 1.33447265625, 1.399139404296875, 1.46380615234375, 1.528472900390625, 1.5931396484375, 1.657806396484375, 1.72247314453125, 1.787139892578125, 1.851806640625, 1.916473388671875, 1.98114013671875, 2.045806884765625, 2.1104736328125, 2.175140380859375, 2.23980712890625, 2.304473876953125, 2.369140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 8.0, 4.0, 8.0, 10.0, 26.0, 34.0, 33.0, 52.0, 69.0, 73.0, 86.0, 113.0, 77.0, 83.0, 75.0, 56.0, 53.0, 42.0, 28.0, 23.0, 17.0, 9.0, 6.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.795562744140625, -1.72589111328125, -1.656219482421875, -1.5865478515625, -1.516876220703125, -1.44720458984375, -1.377532958984375, -1.307861328125, -1.238189697265625, -1.16851806640625, -1.098846435546875, -1.0291748046875, -0.959503173828125, -0.88983154296875, -0.820159912109375, -0.75048828125, -0.680816650390625, -0.61114501953125, -0.541473388671875, -0.4718017578125, -0.402130126953125, -0.33245849609375, -0.262786865234375, -0.193115234375, -0.123443603515625, -0.05377197265625, 0.015899658203125, 0.0855712890625, 0.155242919921875, 0.22491455078125, 0.294586181640625, 0.3642578125, 0.433929443359375, 0.50360107421875, 0.573272705078125, 0.6429443359375, 0.712615966796875, 0.78228759765625, 0.851959228515625, 0.921630859375, 0.991302490234375, 1.06097412109375, 1.130645751953125, 1.2003173828125, 1.269989013671875, 1.33966064453125, 1.409332275390625, 1.47900390625, 1.548675537109375, 1.61834716796875, 1.688018798828125, 1.7576904296875, 1.827362060546875, 1.89703369140625, 1.966705322265625, 2.036376953125, 2.106048583984375, 2.17572021484375, 2.245391845703125, 2.3150634765625, 2.384735107421875, 2.45440673828125, 2.524078369140625, 2.59375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 11.0, 16.0, 38.0, 103.0, 169.0, 242.0, 177.0, 108.0, 54.0, 27.0, 18.0, 9.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.14666748046875, -34.72544479370117, -33.30422592163086, -31.88300323486328, -30.46178436279297, -29.04056167602539, -27.619340896606445, -26.1981201171875, -24.776899337768555, -23.35567855834961, -21.934457778930664, -20.51323699951172, -19.09201431274414, -17.670795440673828, -16.24957275390625, -14.828351974487305, -13.40713119506836, -11.985910415649414, -10.564689636230469, -9.143467903137207, -7.722247123718262, -6.301026344299316, -4.879804611206055, -3.4585838317871094, -2.037363052368164, -0.6161420345306396, 0.8050789833068848, 2.2263002395629883, 3.6475210189819336, 5.068741798400879, 6.489963531494141, 7.911184310913086, 9.332405090332031, 10.753625869750977, 12.174846649169922, 13.596068382263184, 15.017289161682129, 16.43851089477539, 17.859731674194336, 19.28095245361328, 20.702173233032227, 22.123394012451172, 23.544614791870117, 24.965835571289062, 26.38705825805664, 27.808277130126953, 29.22949981689453, 30.650720596313477, 32.07194137573242, 33.4931640625, 34.91438293457031, 36.33560562133789, 37.7568244934082, 39.17804718017578, 40.599266052246094, 42.02048873901367, 43.44171142578125, 44.86293411254883, 46.28415298461914, 47.70537567138672, 49.12659454345703, 50.54781723022461, 51.96903991699219, 53.3902587890625, 54.81147766113281]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 3.0, 4.0, 3.0, 10.0, 9.0, 10.0, 18.0, 10.0, 18.0, 19.0, 19.0, 19.0, 20.0, 24.0, 30.0, 32.0, 32.0, 30.0, 30.0, 36.0, 36.0, 56.0, 40.0, 60.0, 36.0, 49.0, 39.0, 30.0, 24.0, 36.0, 23.0, 25.0, 21.0, 18.0, 16.0, 18.0, 13.0, 12.0, 9.0, 5.0, 6.0, 10.0, 12.0, 4.0, 4.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0], "bins": [-19.994556427001953, -19.353740692138672, -18.71292495727539, -18.072107315063477, -17.431291580200195, -16.790475845336914, -16.149660110473633, -15.508844375610352, -14.868027687072754, -14.227211952209473, -13.586395263671875, -12.945579528808594, -12.304763793945312, -11.663947105407715, -11.023131370544434, -10.382314682006836, -9.741498947143555, -9.100683212280273, -8.459866523742676, -7.8190507888793945, -7.178234577178955, -6.537418365478516, -5.896602630615234, -5.255786418914795, -4.6149702072143555, -3.974153995513916, -3.3333380222320557, -2.6925220489501953, -2.051705837249756, -1.4108896255493164, -0.770073652267456, -0.1292576789855957, 0.5115604400634766, 1.1523765325546265, 1.7931926250457764, 2.4340085983276367, 3.074824810028076, 3.7156410217285156, 4.356456756591797, 4.997272968292236, 5.638089179992676, 6.278905391693115, 6.919721603393555, 7.560537338256836, 8.201353073120117, 8.842169761657715, 9.482985496520996, 10.123802185058594, 10.764617919921875, 11.405433654785156, 12.046250343322754, 12.687066078186035, 13.327882766723633, 13.968698501586914, 14.609514236450195, 15.250329971313477, 15.891146659851074, 16.531963348388672, 17.172779083251953, 17.813594818115234, 18.454410552978516, 19.095226287841797, 19.73604393005371, 20.376859664916992, 21.017675399780273]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 11.0, 26.0, 41.0, 97.0, 143.0, 313.0, 704.0, 1814.0, 5505.0, 21207.0, 155406.0, 2981273.0, 955736.0, 56028.0, 10794.0, 3044.0, 1098.0, 504.0, 210.0, 126.0, 68.0, 33.0, 30.0, 15.0, 12.0, 12.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.3414306640625, -3.239501953125, -3.1375732421875, -3.03564453125, -2.9337158203125, -2.831787109375, -2.7298583984375, -2.6279296875, -2.5260009765625, -2.424072265625, -2.3221435546875, -2.22021484375, -2.1182861328125, -2.016357421875, -1.9144287109375, -1.8125, -1.7105712890625, -1.608642578125, -1.5067138671875, -1.40478515625, -1.3028564453125, -1.200927734375, -1.0989990234375, -0.9970703125, -0.8951416015625, -0.793212890625, -0.6912841796875, -0.58935546875, -0.4874267578125, -0.385498046875, -0.2835693359375, -0.181640625, -0.0797119140625, 0.022216796875, 0.1241455078125, 0.22607421875, 0.3280029296875, 0.429931640625, 0.5318603515625, 0.6337890625, 0.7357177734375, 0.837646484375, 0.9395751953125, 1.04150390625, 1.1434326171875, 1.245361328125, 1.3472900390625, 1.44921875, 1.5511474609375, 1.653076171875, 1.7550048828125, 1.85693359375, 1.9588623046875, 2.060791015625, 2.1627197265625, 2.2646484375, 2.3665771484375, 2.468505859375, 2.5704345703125, 2.67236328125, 2.7742919921875, 2.876220703125, 2.9781494140625, 3.080078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 10.0, 18.0, 25.0, 33.0, 41.0, 64.0, 79.0, 73.0, 73.0, 94.0, 82.0, 81.0, 70.0, 62.0, 56.0, 49.0, 20.0, 21.0, 19.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.7736968994140625, -1.688995361328125, -1.6042938232421875, -1.51959228515625, -1.4348907470703125, -1.350189208984375, -1.2654876708984375, -1.1807861328125, -1.0960845947265625, -1.011383056640625, -0.9266815185546875, -0.84197998046875, -0.7572784423828125, -0.672576904296875, -0.5878753662109375, -0.503173828125, -0.4184722900390625, -0.333770751953125, -0.2490692138671875, -0.16436767578125, -0.0796661376953125, 0.005035400390625, 0.0897369384765625, 0.1744384765625, 0.2591400146484375, 0.343841552734375, 0.4285430908203125, 0.51324462890625, 0.5979461669921875, 0.682647705078125, 0.7673492431640625, 0.85205078125, 0.9367523193359375, 1.021453857421875, 1.1061553955078125, 1.19085693359375, 1.2755584716796875, 1.360260009765625, 1.4449615478515625, 1.5296630859375, 1.6143646240234375, 1.699066162109375, 1.7837677001953125, 1.86846923828125, 1.9531707763671875, 2.037872314453125, 2.1225738525390625, 2.207275390625, 2.2919769287109375, 2.376678466796875, 2.4613800048828125, 2.54608154296875, 2.6307830810546875, 2.715484619140625, 2.8001861572265625, 2.8848876953125, 2.9695892333984375, 3.054290771484375, 3.1389923095703125, 3.22369384765625, 3.3083953857421875, 3.393096923828125, 3.4777984619140625, 3.5625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 7.0, 5.0, 2.0, 2.0, 14.0, 21.0, 40.0, 46.0, 61.0, 84.0, 152.0, 354.0, 702.0, 1668.0, 5037.0, 18781.0, 97384.0, 2401785.0, 1568599.0, 77848.0, 15071.0, 4152.0, 1312.0, 558.0, 237.0, 132.0, 54.0, 56.0, 43.0, 21.0, 15.0, 10.0, 8.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.17578125, -4.049041748046875, -3.92230224609375, -3.795562744140625, -3.6688232421875, -3.542083740234375, -3.41534423828125, -3.288604736328125, -3.161865234375, -3.035125732421875, -2.90838623046875, -2.781646728515625, -2.6549072265625, -2.528167724609375, -2.40142822265625, -2.274688720703125, -2.14794921875, -2.021209716796875, -1.89447021484375, -1.767730712890625, -1.6409912109375, -1.514251708984375, -1.38751220703125, -1.260772705078125, -1.134033203125, -1.007293701171875, -0.88055419921875, -0.753814697265625, -0.6270751953125, -0.500335693359375, -0.37359619140625, -0.246856689453125, -0.1201171875, 0.006622314453125, 0.13336181640625, 0.260101318359375, 0.3868408203125, 0.513580322265625, 0.64031982421875, 0.767059326171875, 0.893798828125, 1.020538330078125, 1.14727783203125, 1.274017333984375, 1.4007568359375, 1.527496337890625, 1.65423583984375, 1.780975341796875, 1.90771484375, 2.034454345703125, 2.16119384765625, 2.287933349609375, 2.4146728515625, 2.541412353515625, 2.66815185546875, 2.794891357421875, 2.921630859375, 3.048370361328125, 3.17510986328125, 3.301849365234375, 3.4285888671875, 3.555328369140625, 3.68206787109375, 3.808807373046875, 3.935546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 7.0, 8.0, 17.0, 15.0, 24.0, 27.0, 35.0, 29.0, 57.0, 71.0, 122.0, 193.0, 383.0, 747.0, 884.0, 604.0, 296.0, 181.0, 105.0, 74.0, 46.0, 34.0, 21.0, 11.0, 14.0, 9.0, 10.0, 8.0, 10.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80078125, -3.67926025390625, -3.5577392578125, -3.43621826171875, -3.314697265625, -3.19317626953125, -3.0716552734375, -2.95013427734375, -2.82861328125, -2.70709228515625, -2.5855712890625, -2.46405029296875, -2.342529296875, -2.22100830078125, -2.0994873046875, -1.97796630859375, -1.8564453125, -1.73492431640625, -1.6134033203125, -1.49188232421875, -1.370361328125, -1.24884033203125, -1.1273193359375, -1.00579833984375, -0.88427734375, -0.76275634765625, -0.6412353515625, -0.51971435546875, -0.398193359375, -0.27667236328125, -0.1551513671875, -0.03363037109375, 0.087890625, 0.20941162109375, 0.3309326171875, 0.45245361328125, 0.573974609375, 0.69549560546875, 0.8170166015625, 0.93853759765625, 1.06005859375, 1.18157958984375, 1.3031005859375, 1.42462158203125, 1.546142578125, 1.66766357421875, 1.7891845703125, 1.91070556640625, 2.0322265625, 2.15374755859375, 2.2752685546875, 2.39678955078125, 2.518310546875, 2.63983154296875, 2.7613525390625, 2.88287353515625, 3.00439453125, 3.12591552734375, 3.2474365234375, 3.36895751953125, 3.490478515625, 3.61199951171875, 3.7335205078125, 3.85504150390625, 3.9765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 16.0, 10.0, 83.0, 210.0, 421.0, 193.0, 45.0, 10.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.47093963623047, -62.90272903442383, -60.33451843261719, -57.76630783081055, -55.198097229003906, -52.6298828125, -50.06167221069336, -47.49346160888672, -44.92525100708008, -42.35704040527344, -39.7888298034668, -37.220619201660156, -34.65240478515625, -32.084197998046875, -29.51598358154297, -26.947772979736328, -24.379562377929688, -21.811351776123047, -19.243141174316406, -16.674928665161133, -14.106718063354492, -11.538507461547852, -8.970295906066895, -6.4020843505859375, -3.833873748779297, -1.265662670135498, 1.3025484085083008, 3.8707594871520996, 6.438970565795898, 9.007181167602539, 11.575392723083496, 14.143604278564453, 16.711822509765625, 19.280033111572266, 21.848243713378906, 24.41645622253418, 26.98466682434082, 29.55287742614746, 32.121089935302734, 34.689300537109375, 37.257511138916016, 39.825721740722656, 42.3939323425293, 44.96214294433594, 47.530357360839844, 50.09856414794922, 52.666778564453125, 55.234989166259766, 57.803199768066406, 60.37141036987305, 62.93962097167969, 65.5078353881836, 68.07604217529297, 70.64425659179688, 73.21246337890625, 75.78067779541016, 78.34889221191406, 80.91710662841797, 83.48531341552734, 86.05352783203125, 88.62173461914062, 91.18994903564453, 93.7581558227539, 96.32637023925781, 98.89457702636719]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 12.0, 7.0, 12.0, 7.0, 13.0, 28.0, 25.0, 29.0, 37.0, 45.0, 63.0, 46.0, 70.0, 77.0, 74.0, 74.0, 62.0, 47.0, 48.0, 36.0, 53.0, 35.0, 24.0, 24.0, 14.0, 7.0, 12.0, 7.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.236312866210938, -27.450984954833984, -26.665658950805664, -25.88033103942871, -25.09500503540039, -24.309677124023438, -23.524349212646484, -22.73902130126953, -21.95369529724121, -21.168367385864258, -20.383041381835938, -19.597713470458984, -18.81238555908203, -18.02705955505371, -17.241731643676758, -16.456405639648438, -15.671077728271484, -14.885750770568848, -14.100423812866211, -13.315095901489258, -12.529768943786621, -11.744441986083984, -10.959114074707031, -10.173787117004395, -9.388460159301758, -8.603133201599121, -7.817805767059326, -7.032478332519531, -6.2471513748168945, -5.461824417114258, -4.676496982574463, -3.891169548034668, -3.1058425903320312, -2.3205153942108154, -1.5351881980895996, -0.7498610019683838, 0.03546619415283203, 0.8207933902740479, 1.6061205863952637, 2.3914480209350586, 3.1767749786376953, 3.962102174758911, 4.747429370880127, 5.532756805419922, 6.318083763122559, 7.103410720825195, 7.88873815536499, 8.674065589904785, 9.459392547607422, 10.244719505310059, 11.030046463012695, 11.815374374389648, 12.600701332092285, 13.386028289794922, 14.171356201171875, 14.956683158874512, 15.742010116577148, 16.5273380279541, 17.312664031982422, 18.097991943359375, 18.883319854736328, 19.66864585876465, 20.4539737701416, 21.239299774169922, 22.024627685546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 11.0, 8.0, 17.0, 23.0, 50.0, 81.0, 99.0, 151.0, 263.0, 395.0, 665.0, 1058.0, 1820.0, 3093.0, 5578.0, 10025.0, 18237.0, 33781.0, 60851.0, 106037.0, 166878.0, 205778.0, 174088.0, 112675.0, 65368.0, 36389.0, 19873.0, 10855.0, 6056.0, 3311.0, 2006.0, 1131.0, 673.0, 407.0, 307.0, 172.0, 119.0, 76.0, 52.0, 28.0, 21.0, 20.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3271484375, -1.282257080078125, -1.23736572265625, -1.192474365234375, -1.1475830078125, -1.102691650390625, -1.05780029296875, -1.012908935546875, -0.968017578125, -0.923126220703125, -0.87823486328125, -0.833343505859375, -0.7884521484375, -0.743560791015625, -0.69866943359375, -0.653778076171875, -0.60888671875, -0.563995361328125, -0.51910400390625, -0.474212646484375, -0.4293212890625, -0.384429931640625, -0.33953857421875, -0.294647216796875, -0.249755859375, -0.204864501953125, -0.15997314453125, -0.115081787109375, -0.0701904296875, -0.025299072265625, 0.01959228515625, 0.064483642578125, 0.109375, 0.154266357421875, 0.19915771484375, 0.244049072265625, 0.2889404296875, 0.333831787109375, 0.37872314453125, 0.423614501953125, 0.468505859375, 0.513397216796875, 0.55828857421875, 0.603179931640625, 0.6480712890625, 0.692962646484375, 0.73785400390625, 0.782745361328125, 0.82763671875, 0.872528076171875, 0.91741943359375, 0.962310791015625, 1.0072021484375, 1.052093505859375, 1.09698486328125, 1.141876220703125, 1.186767578125, 1.231658935546875, 1.27655029296875, 1.321441650390625, 1.3663330078125, 1.411224365234375, 1.45611572265625, 1.501007080078125, 1.5458984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 11.0, 10.0, 16.0, 21.0, 20.0, 33.0, 34.0, 35.0, 45.0, 62.0, 59.0, 61.0, 60.0, 58.0, 57.0, 77.0, 57.0, 57.0, 40.0, 28.0, 37.0, 26.0, 27.0, 21.0, 11.0, 7.0, 7.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0859375, -2.0252532958984375, -1.964569091796875, -1.9038848876953125, -1.84320068359375, -1.7825164794921875, -1.721832275390625, -1.6611480712890625, -1.6004638671875, -1.5397796630859375, -1.479095458984375, -1.4184112548828125, -1.35772705078125, -1.2970428466796875, -1.236358642578125, -1.1756744384765625, -1.114990234375, -1.0543060302734375, -0.993621826171875, -0.9329376220703125, -0.87225341796875, -0.8115692138671875, -0.750885009765625, -0.6902008056640625, -0.6295166015625, -0.5688323974609375, -0.508148193359375, -0.4474639892578125, -0.38677978515625, -0.3260955810546875, -0.265411376953125, -0.2047271728515625, -0.14404296875, -0.0833587646484375, -0.022674560546875, 0.0380096435546875, 0.09869384765625, 0.1593780517578125, 0.220062255859375, 0.2807464599609375, 0.3414306640625, 0.4021148681640625, 0.462799072265625, 0.5234832763671875, 0.58416748046875, 0.6448516845703125, 0.705535888671875, 0.7662200927734375, 0.826904296875, 0.8875885009765625, 0.948272705078125, 1.0089569091796875, 1.06964111328125, 1.1303253173828125, 1.191009521484375, 1.2516937255859375, 1.3123779296875, 1.3730621337890625, 1.433746337890625, 1.4944305419921875, 1.55511474609375, 1.6157989501953125, 1.676483154296875, 1.7371673583984375, 1.7978515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 13.0, 14.0, 14.0, 21.0, 29.0, 32.0, 44.0, 37.0, 74.0, 104.0, 135.0, 201.0, 250.0, 333.0, 487.0, 783.0, 1289.0, 2466.0, 5885.0, 20297.0, 107826.0, 585992.0, 257162.0, 46044.0, 10413.0, 3626.0, 1636.0, 937.0, 666.0, 436.0, 321.0, 219.0, 178.0, 143.0, 105.0, 76.0, 45.0, 39.0, 38.0, 30.0, 28.0, 19.0, 7.0, 7.0, 10.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 3.0], "bins": [-3.8515625, -3.737457275390625, -3.62335205078125, -3.509246826171875, -3.3951416015625, -3.281036376953125, -3.16693115234375, -3.052825927734375, -2.938720703125, -2.824615478515625, -2.71051025390625, -2.596405029296875, -2.4822998046875, -2.368194580078125, -2.25408935546875, -2.139984130859375, -2.02587890625, -1.911773681640625, -1.79766845703125, -1.683563232421875, -1.5694580078125, -1.455352783203125, -1.34124755859375, -1.227142333984375, -1.113037109375, -0.998931884765625, -0.88482666015625, -0.770721435546875, -0.6566162109375, -0.542510986328125, -0.42840576171875, -0.314300537109375, -0.2001953125, -0.086090087890625, 0.02801513671875, 0.142120361328125, 0.2562255859375, 0.370330810546875, 0.48443603515625, 0.598541259765625, 0.712646484375, 0.826751708984375, 0.94085693359375, 1.054962158203125, 1.1690673828125, 1.283172607421875, 1.39727783203125, 1.511383056640625, 1.62548828125, 1.739593505859375, 1.85369873046875, 1.967803955078125, 2.0819091796875, 2.196014404296875, 2.31011962890625, 2.424224853515625, 2.538330078125, 2.652435302734375, 2.76654052734375, 2.880645751953125, 2.9947509765625, 3.108856201171875, 3.22296142578125, 3.337066650390625, 3.451171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 6.0, 11.0, 13.0, 14.0, 10.0, 15.0, 10.0, 20.0, 24.0, 33.0, 35.0, 30.0, 38.0, 34.0, 47.0, 42.0, 33.0, 51.0, 47.0, 47.0, 31.0, 37.0, 30.0, 29.0, 40.0, 28.0, 24.0, 22.0, 27.0, 19.0, 15.0, 25.0, 12.0, 8.0, 12.0, 13.0, 8.0, 7.0, 5.0, 9.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.62109375, -4.4722900390625, -4.323486328125, -4.1746826171875, -4.02587890625, -3.8770751953125, -3.728271484375, -3.5794677734375, -3.4306640625, -3.2818603515625, -3.133056640625, -2.9842529296875, -2.83544921875, -2.6866455078125, -2.537841796875, -2.3890380859375, -2.240234375, -2.0914306640625, -1.942626953125, -1.7938232421875, -1.64501953125, -1.4962158203125, -1.347412109375, -1.1986083984375, -1.0498046875, -0.9010009765625, -0.752197265625, -0.6033935546875, -0.45458984375, -0.3057861328125, -0.156982421875, -0.0081787109375, 0.140625, 0.2894287109375, 0.438232421875, 0.5870361328125, 0.73583984375, 0.8846435546875, 1.033447265625, 1.1822509765625, 1.3310546875, 1.4798583984375, 1.628662109375, 1.7774658203125, 1.92626953125, 2.0750732421875, 2.223876953125, 2.3726806640625, 2.521484375, 2.6702880859375, 2.819091796875, 2.9678955078125, 3.11669921875, 3.2655029296875, 3.414306640625, 3.5631103515625, 3.7119140625, 3.8607177734375, 4.009521484375, 4.1583251953125, 4.30712890625, 4.4559326171875, 4.604736328125, 4.7535400390625, 4.90234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 9.0, 16.0, 19.0, 36.0, 44.0, 72.0, 102.0, 162.0, 301.0, 504.0, 1032.0, 2718.0, 7937.0, 33962.0, 386796.0, 562862.0, 38068.0, 8566.0, 2891.0, 1139.0, 547.0, 273.0, 182.0, 95.0, 73.0, 39.0, 30.0, 18.0, 12.0, 14.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.052734375, -1.9905853271484375, -1.928436279296875, -1.8662872314453125, -1.80413818359375, -1.7419891357421875, -1.679840087890625, -1.6176910400390625, -1.5555419921875, -1.4933929443359375, -1.431243896484375, -1.3690948486328125, -1.30694580078125, -1.2447967529296875, -1.182647705078125, -1.1204986572265625, -1.058349609375, -0.9962005615234375, -0.934051513671875, -0.8719024658203125, -0.80975341796875, -0.7476043701171875, -0.685455322265625, -0.6233062744140625, -0.5611572265625, -0.4990081787109375, -0.436859130859375, -0.3747100830078125, -0.31256103515625, -0.2504119873046875, -0.188262939453125, -0.1261138916015625, -0.06396484375, -0.0018157958984375, 0.060333251953125, 0.1224822998046875, 0.18463134765625, 0.2467803955078125, 0.308929443359375, 0.3710784912109375, 0.4332275390625, 0.4953765869140625, 0.557525634765625, 0.6196746826171875, 0.68182373046875, 0.7439727783203125, 0.806121826171875, 0.8682708740234375, 0.930419921875, 0.9925689697265625, 1.054718017578125, 1.1168670654296875, 1.17901611328125, 1.2411651611328125, 1.303314208984375, 1.3654632568359375, 1.4276123046875, 1.4897613525390625, 1.551910400390625, 1.6140594482421875, 1.67620849609375, 1.7383575439453125, 1.800506591796875, 1.8626556396484375, 1.9248046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 13.0, 20.0, 28.0, 49.0, 87.0, 141.0, 201.0, 185.0, 102.0, 52.0, 34.0, 18.0, 17.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009059906005859375, -0.000879146158695221, -0.0008523017168045044, -0.0008254572749137878, -0.0007986128330230713, -0.0007717683911323547, -0.0007449239492416382, -0.0007180795073509216, -0.0006912350654602051, -0.0006643906235694885, -0.000637546181678772, -0.0006107017397880554, -0.0005838572978973389, -0.0005570128560066223, -0.0005301684141159058, -0.0005033239722251892, -0.00047647953033447266, -0.0004496350884437561, -0.00042279064655303955, -0.000395946204662323, -0.00036910176277160645, -0.0003422573208808899, -0.00031541287899017334, -0.0002885684370994568, -0.00026172399520874023, -0.00023487955331802368, -0.00020803511142730713, -0.00018119066953659058, -0.00015434622764587402, -0.00012750178575515747, -0.00010065734386444092, -7.381290197372437e-05, -4.696846008300781e-05, -2.012401819229126e-05, 6.720423698425293e-06, 3.3564865589141846e-05, 6.04093074798584e-05, 8.725374937057495e-05, 0.0001140981912612915, 0.00014094263315200806, 0.0001677870750427246, 0.00019463151693344116, 0.00022147595882415771, 0.00024832040071487427, 0.0002751648426055908, 0.0003020092844963074, 0.0003288537263870239, 0.0003556981682777405, 0.00038254261016845703, 0.0004093870520591736, 0.00043623149394989014, 0.0004630759358406067, 0.0004899203777313232, 0.0005167648196220398, 0.0005436092615127563, 0.0005704537034034729, 0.0005972981452941895, 0.000624142587184906, 0.0006509870290756226, 0.0006778314709663391, 0.0007046759128570557, 0.0007315203547477722, 0.0007583647966384888, 0.0007852092385292053, 0.0008120536804199219]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 19.0, 21.0, 34.0, 70.0, 137.0, 331.0, 846.0, 2549.0, 11150.0, 156759.0, 829894.0, 38573.0, 5536.0, 1560.0, 555.0, 225.0, 111.0, 62.0, 45.0, 17.0, 14.0, 8.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.927734375, -2.8470458984375, -2.766357421875, -2.6856689453125, -2.60498046875, -2.5242919921875, -2.443603515625, -2.3629150390625, -2.2822265625, -2.2015380859375, -2.120849609375, -2.0401611328125, -1.95947265625, -1.8787841796875, -1.798095703125, -1.7174072265625, -1.63671875, -1.5560302734375, -1.475341796875, -1.3946533203125, -1.31396484375, -1.2332763671875, -1.152587890625, -1.0718994140625, -0.9912109375, -0.9105224609375, -0.829833984375, -0.7491455078125, -0.66845703125, -0.5877685546875, -0.507080078125, -0.4263916015625, -0.345703125, -0.2650146484375, -0.184326171875, -0.1036376953125, -0.02294921875, 0.0577392578125, 0.138427734375, 0.2191162109375, 0.2998046875, 0.3804931640625, 0.461181640625, 0.5418701171875, 0.62255859375, 0.7032470703125, 0.783935546875, 0.8646240234375, 0.9453125, 1.0260009765625, 1.106689453125, 1.1873779296875, 1.26806640625, 1.3487548828125, 1.429443359375, 1.5101318359375, 1.5908203125, 1.6715087890625, 1.752197265625, 1.8328857421875, 1.91357421875, 1.9942626953125, 2.074951171875, 2.1556396484375, 2.236328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 9.0, 4.0, 11.0, 9.0, 26.0, 38.0, 35.0, 46.0, 46.0, 69.0, 66.0, 70.0, 73.0, 80.0, 55.0, 71.0, 45.0, 51.0, 46.0, 27.0, 23.0, 27.0, 14.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.4990234375, -1.454345703125, -1.40966796875, -1.364990234375, -1.3203125, -1.275634765625, -1.23095703125, -1.186279296875, -1.1416015625, -1.096923828125, -1.05224609375, -1.007568359375, -0.962890625, -0.918212890625, -0.87353515625, -0.828857421875, -0.7841796875, -0.739501953125, -0.69482421875, -0.650146484375, -0.60546875, -0.560791015625, -0.51611328125, -0.471435546875, -0.4267578125, -0.382080078125, -0.33740234375, -0.292724609375, -0.248046875, -0.203369140625, -0.15869140625, -0.114013671875, -0.0693359375, -0.024658203125, 0.02001953125, 0.064697265625, 0.109375, 0.154052734375, 0.19873046875, 0.243408203125, 0.2880859375, 0.332763671875, 0.37744140625, 0.422119140625, 0.466796875, 0.511474609375, 0.55615234375, 0.600830078125, 0.6455078125, 0.690185546875, 0.73486328125, 0.779541015625, 0.82421875, 0.868896484375, 0.91357421875, 0.958251953125, 1.0029296875, 1.047607421875, 1.09228515625, 1.136962890625, 1.181640625, 1.226318359375, 1.27099609375, 1.315673828125, 1.3603515625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 23.0, 36.0, 91.0, 151.0, 281.0, 187.0, 103.0, 52.0, 31.0, 11.0, 13.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.37413787841797, -26.028717041015625, -24.68329620361328, -23.337875366210938, -21.99245262145996, -20.647031784057617, -19.301610946655273, -17.956188201904297, -16.610767364501953, -15.26534652709961, -13.91992473602295, -12.574503898620605, -11.229082107543945, -9.883661270141602, -8.538240432739258, -7.192818641662598, -5.84739875793457, -4.501977443695068, -3.1565563678741455, -1.8111352920532227, -0.4657139778137207, 0.8797073364257812, 2.225128173828125, 3.570549964904785, 4.915970802307129, 6.261392116546631, 7.606813430786133, 8.952234268188477, 10.29765510559082, 11.64307689666748, 12.988497734069824, 14.333919525146484, 15.679340362548828, 17.024761199951172, 18.370182037353516, 19.71560287475586, 21.061025619506836, 22.40644645690918, 23.751867294311523, 25.0972900390625, 26.442710876464844, 27.788131713867188, 29.13355255126953, 30.478973388671875, 31.82439613342285, 33.16981506347656, 34.515235900878906, 35.860660552978516, 37.206077575683594, 38.55149841308594, 39.89691925048828, 41.242340087890625, 42.58776092529297, 43.93318176269531, 45.278602600097656, 46.624027252197266, 47.96944808959961, 49.31486892700195, 50.6602897644043, 52.00571060180664, 53.351131439208984, 54.696556091308594, 56.04197692871094, 57.38739776611328, 58.732818603515625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 10.0, 13.0, 15.0, 16.0, 22.0, 24.0, 23.0, 34.0, 28.0, 32.0, 31.0, 45.0, 56.0, 65.0, 66.0, 80.0, 67.0, 46.0, 24.0, 39.0, 23.0, 25.0, 22.0, 37.0, 27.0, 17.0, 19.0, 16.0, 15.0, 5.0, 7.0, 2.0, 7.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.268718719482422, -20.515544891357422, -19.762371063232422, -19.009197235107422, -18.256023406982422, -17.502849578857422, -16.749675750732422, -15.996500968933105, -15.243327140808105, -14.490153312683105, -13.736979484558105, -12.983804702758789, -12.230630874633789, -11.477457046508789, -10.724283218383789, -9.971109390258789, -9.217935562133789, -8.464761734008789, -7.711587905883789, -6.958413600921631, -6.205239772796631, -5.452065944671631, -4.698891639709473, -3.9457178115844727, -3.1925439834594727, -2.4393701553344727, -1.6861960887908936, -0.9330220222473145, -0.17984819412231445, 0.5733256340026855, 1.3264999389648438, 2.0796737670898438, 2.832845687866211, 3.586019515991211, 4.339193344116211, 5.092367649078369, 5.845541477203369, 6.598715305328369, 7.351889610290527, 8.105063438415527, 8.858237266540527, 9.611411094665527, 10.364584922790527, 11.117759704589844, 11.870933532714844, 12.624107360839844, 13.377281188964844, 14.130455017089844, 14.883628845214844, 15.636802673339844, 16.389976501464844, 17.143150329589844, 17.896324157714844, 18.649497985839844, 19.402671813964844, 20.155845642089844, 20.909019470214844, 21.662193298339844, 22.415367126464844, 23.168540954589844, 23.921714782714844, 24.674888610839844, 25.428062438964844, 26.181236267089844, 26.934412002563477]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 13.0, 14.0, 22.0, 20.0, 38.0, 52.0, 81.0, 124.0, 176.0, 272.0, 435.0, 663.0, 1122.0, 1961.0, 3559.0, 7086.0, 15544.0, 39973.0, 125823.0, 496443.0, 1642719.0, 1349933.0, 356965.0, 92690.0, 31066.0, 13233.0, 6367.0, 3274.0, 1774.0, 1004.0, 646.0, 404.0, 260.0, 163.0, 123.0, 68.0, 42.0, 43.0, 33.0, 15.0, 12.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1852569580078125, -1.146881103515625, -1.1085052490234375, -1.07012939453125, -1.0317535400390625, -0.993377685546875, -0.9550018310546875, -0.9166259765625, -0.8782501220703125, -0.839874267578125, -0.8014984130859375, -0.76312255859375, -0.7247467041015625, -0.686370849609375, -0.6479949951171875, -0.609619140625, -0.5712432861328125, -0.532867431640625, -0.4944915771484375, -0.45611572265625, -0.4177398681640625, -0.379364013671875, -0.3409881591796875, -0.3026123046875, -0.2642364501953125, -0.225860595703125, -0.1874847412109375, -0.14910888671875, -0.1107330322265625, -0.072357177734375, -0.0339813232421875, 0.00439453125, 0.0427703857421875, 0.081146240234375, 0.1195220947265625, 0.15789794921875, 0.1962738037109375, 0.234649658203125, 0.2730255126953125, 0.3114013671875, 0.3497772216796875, 0.388153076171875, 0.4265289306640625, 0.46490478515625, 0.5032806396484375, 0.541656494140625, 0.5800323486328125, 0.618408203125, 0.6567840576171875, 0.695159912109375, 0.7335357666015625, 0.77191162109375, 0.8102874755859375, 0.848663330078125, 0.8870391845703125, 0.9254150390625, 0.9637908935546875, 1.002166748046875, 1.0405426025390625, 1.07891845703125, 1.1172943115234375, 1.155670166015625, 1.1940460205078125, 1.232421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 3.0, 12.0, 12.0, 15.0, 23.0, 39.0, 38.0, 28.0, 51.0, 50.0, 55.0, 71.0, 66.0, 60.0, 67.0, 64.0, 49.0, 57.0, 40.0, 33.0, 36.0, 32.0, 21.0, 21.0, 15.0, 6.0, 10.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.29296875, -2.2333831787109375, -2.173797607421875, -2.1142120361328125, -2.05462646484375, -1.9950408935546875, -1.935455322265625, -1.8758697509765625, -1.8162841796875, -1.7566986083984375, -1.697113037109375, -1.6375274658203125, -1.57794189453125, -1.5183563232421875, -1.458770751953125, -1.3991851806640625, -1.339599609375, -1.2800140380859375, -1.220428466796875, -1.1608428955078125, -1.10125732421875, -1.0416717529296875, -0.982086181640625, -0.9225006103515625, -0.8629150390625, -0.8033294677734375, -0.743743896484375, -0.6841583251953125, -0.62457275390625, -0.5649871826171875, -0.505401611328125, -0.4458160400390625, -0.38623046875, -0.3266448974609375, -0.267059326171875, -0.2074737548828125, -0.14788818359375, -0.0883026123046875, -0.028717041015625, 0.0308685302734375, 0.0904541015625, 0.1500396728515625, 0.209625244140625, 0.2692108154296875, 0.32879638671875, 0.3883819580078125, 0.447967529296875, 0.5075531005859375, 0.567138671875, 0.6267242431640625, 0.686309814453125, 0.7458953857421875, 0.80548095703125, 0.8650665283203125, 0.924652099609375, 0.9842376708984375, 1.0438232421875, 1.1034088134765625, 1.162994384765625, 1.2225799560546875, 1.28216552734375, 1.3417510986328125, 1.401336669921875, 1.4609222412109375, 1.5205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 14.0, 16.0, 31.0, 38.0, 44.0, 87.0, 134.0, 213.0, 346.0, 622.0, 1740.0, 6343.0, 34430.0, 464755.0, 3514857.0, 147514.0, 17341.0, 3634.0, 1112.0, 443.0, 247.0, 123.0, 86.0, 37.0, 26.0, 17.0, 13.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.505859375, -3.382049560546875, -3.25823974609375, -3.134429931640625, -3.0106201171875, -2.886810302734375, -2.76300048828125, -2.639190673828125, -2.515380859375, -2.391571044921875, -2.26776123046875, -2.143951416015625, -2.0201416015625, -1.896331787109375, -1.77252197265625, -1.648712158203125, -1.52490234375, -1.401092529296875, -1.27728271484375, -1.153472900390625, -1.0296630859375, -0.905853271484375, -0.78204345703125, -0.658233642578125, -0.534423828125, -0.410614013671875, -0.28680419921875, -0.162994384765625, -0.0391845703125, 0.084625244140625, 0.20843505859375, 0.332244873046875, 0.4560546875, 0.579864501953125, 0.70367431640625, 0.827484130859375, 0.9512939453125, 1.075103759765625, 1.19891357421875, 1.322723388671875, 1.446533203125, 1.570343017578125, 1.69415283203125, 1.817962646484375, 1.9417724609375, 2.065582275390625, 2.18939208984375, 2.313201904296875, 2.43701171875, 2.560821533203125, 2.68463134765625, 2.808441162109375, 2.9322509765625, 3.056060791015625, 3.17987060546875, 3.303680419921875, 3.427490234375, 3.551300048828125, 3.67510986328125, 3.798919677734375, 3.9227294921875, 4.046539306640625, 4.17034912109375, 4.294158935546875, 4.41796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 11.0, 11.0, 15.0, 23.0, 30.0, 40.0, 73.0, 119.0, 180.0, 357.0, 717.0, 880.0, 707.0, 363.0, 190.0, 117.0, 75.0, 53.0, 31.0, 18.0, 19.0, 12.0, 9.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.1875, -5.0653076171875, -4.943115234375, -4.8209228515625, -4.69873046875, -4.5765380859375, -4.454345703125, -4.3321533203125, -4.2099609375, -4.0877685546875, -3.965576171875, -3.8433837890625, -3.72119140625, -3.5989990234375, -3.476806640625, -3.3546142578125, -3.232421875, -3.1102294921875, -2.988037109375, -2.8658447265625, -2.74365234375, -2.6214599609375, -2.499267578125, -2.3770751953125, -2.2548828125, -2.1326904296875, -2.010498046875, -1.8883056640625, -1.76611328125, -1.6439208984375, -1.521728515625, -1.3995361328125, -1.27734375, -1.1551513671875, -1.032958984375, -0.9107666015625, -0.78857421875, -0.6663818359375, -0.544189453125, -0.4219970703125, -0.2998046875, -0.1776123046875, -0.055419921875, 0.0667724609375, 0.18896484375, 0.3111572265625, 0.433349609375, 0.5555419921875, 0.677734375, 0.7999267578125, 0.922119140625, 1.0443115234375, 1.16650390625, 1.2886962890625, 1.410888671875, 1.5330810546875, 1.6552734375, 1.7774658203125, 1.899658203125, 2.0218505859375, 2.14404296875, 2.2662353515625, 2.388427734375, 2.5106201171875, 2.6328125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 20.0, 59.0, 142.0, 233.0, 254.0, 161.0, 62.0, 26.0, 13.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.0982780456543, -57.72682571411133, -56.355369567871094, -54.983917236328125, -53.612464904785156, -52.24101257324219, -50.86956024169922, -49.498104095458984, -48.126651763916016, -46.75519943237305, -45.38374328613281, -44.012290954589844, -42.640838623046875, -41.269386291503906, -39.89793395996094, -38.5264778137207, -37.155025482177734, -35.783573150634766, -34.41211700439453, -33.04066467285156, -31.669212341308594, -30.297760009765625, -28.926305770874023, -27.554851531982422, -26.183399200439453, -24.811946868896484, -23.440492630004883, -22.06903839111328, -20.697586059570312, -19.326133728027344, -17.954679489135742, -16.58322525024414, -15.211771011352539, -13.840317726135254, -12.468864440917969, -11.097411155700684, -9.725957870483398, -8.354504585266113, -6.983051300048828, -5.611598014831543, -4.240144729614258, -2.8686914443969727, -1.4972381591796875, -0.12578487396240234, 1.2456684112548828, 2.617121696472168, 3.988574981689453, 5.360028266906738, 6.731481552124023, 8.102934837341309, 9.474388122558594, 10.845841407775879, 12.217294692993164, 13.58874797821045, 14.960201263427734, 16.331653594970703, 17.703107833862305, 19.074562072753906, 20.446014404296875, 21.817466735839844, 23.188920974731445, 24.560375213623047, 25.931827545166016, 27.303279876708984, 28.674734115600586]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 8.0, 5.0, 3.0, 9.0, 8.0, 9.0, 7.0, 13.0, 11.0, 22.0, 19.0, 17.0, 27.0, 35.0, 30.0, 44.0, 47.0, 50.0, 40.0, 39.0, 47.0, 44.0, 46.0, 44.0, 60.0, 38.0, 26.0, 36.0, 25.0, 21.0, 32.0, 27.0, 13.0, 17.0, 16.0, 13.0, 16.0, 15.0, 4.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.035188674926758, -11.605635643005371, -11.1760835647583, -10.746530532836914, -10.316977500915527, -9.88742446899414, -9.45787239074707, -9.028319358825684, -8.598766326904297, -8.16921329498291, -7.739660739898682, -7.310108184814453, -6.880555152893066, -6.451002597808838, -6.021450042724609, -5.591897010803223, -5.162344932556152, -4.732792377471924, -4.303239345550537, -3.8736867904663086, -3.444133996963501, -3.0145812034606934, -2.585028648376465, -2.1554758548736572, -1.7259230613708496, -1.296370267868042, -0.8668175935745239, -0.43726491928100586, -0.007712125778198242, 0.4218406677246094, 0.8513932228088379, 1.2809460163116455, 1.7104988098144531, 2.1400516033172607, 2.5696043968200684, 2.999156951904297, 3.4287097454071045, 3.858262538909912, 4.287815093994141, 4.717368125915527, 5.146920680999756, 5.576473236083984, 6.006026268005371, 6.4355788230896, 6.865131378173828, 7.294684410095215, 7.724236965179443, 8.153789520263672, 8.583342552185059, 9.012895584106445, 9.442447662353516, 9.872000694274902, 10.301553726196289, 10.73110580444336, 11.160658836364746, 11.590211868286133, 12.019763946533203, 12.44931697845459, 12.87886905670166, 13.308422088623047, 13.737975120544434, 14.16752815246582, 14.59708023071289, 15.026633262634277, 15.456186294555664]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 8.0, 12.0, 22.0, 25.0, 33.0, 54.0, 90.0, 146.0, 215.0, 312.0, 552.0, 805.0, 1317.0, 2109.0, 3441.0, 6125.0, 10296.0, 18030.0, 32044.0, 58017.0, 101711.0, 168511.0, 215548.0, 177148.0, 108511.0, 61885.0, 34884.0, 19380.0, 11103.0, 6375.0, 3828.0, 2240.0, 1390.0, 850.0, 561.0, 322.0, 214.0, 148.0, 92.0, 52.0, 42.0, 30.0, 19.0, 21.0, 13.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.53515625, -1.48492431640625, -1.4346923828125, -1.38446044921875, -1.334228515625, -1.28399658203125, -1.2337646484375, -1.18353271484375, -1.13330078125, -1.08306884765625, -1.0328369140625, -0.98260498046875, -0.932373046875, -0.88214111328125, -0.8319091796875, -0.78167724609375, -0.7314453125, -0.68121337890625, -0.6309814453125, -0.58074951171875, -0.530517578125, -0.48028564453125, -0.4300537109375, -0.37982177734375, -0.32958984375, -0.27935791015625, -0.2291259765625, -0.17889404296875, -0.128662109375, -0.07843017578125, -0.0281982421875, 0.02203369140625, 0.072265625, 0.12249755859375, 0.1727294921875, 0.22296142578125, 0.273193359375, 0.32342529296875, 0.3736572265625, 0.42388916015625, 0.47412109375, 0.52435302734375, 0.5745849609375, 0.62481689453125, 0.675048828125, 0.72528076171875, 0.7755126953125, 0.82574462890625, 0.8759765625, 0.92620849609375, 0.9764404296875, 1.02667236328125, 1.076904296875, 1.12713623046875, 1.1773681640625, 1.22760009765625, 1.27783203125, 1.32806396484375, 1.3782958984375, 1.42852783203125, 1.478759765625, 1.52899169921875, 1.5792236328125, 1.62945556640625, 1.6796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 7.0, 11.0, 12.0, 15.0, 22.0, 36.0, 35.0, 47.0, 50.0, 57.0, 74.0, 66.0, 70.0, 59.0, 66.0, 56.0, 60.0, 52.0, 47.0, 36.0, 27.0, 17.0, 21.0, 15.0, 15.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.470703125, -2.40576171875, -2.3408203125, -2.27587890625, -2.2109375, -2.14599609375, -2.0810546875, -2.01611328125, -1.951171875, -1.88623046875, -1.8212890625, -1.75634765625, -1.69140625, -1.62646484375, -1.5615234375, -1.49658203125, -1.431640625, -1.36669921875, -1.3017578125, -1.23681640625, -1.171875, -1.10693359375, -1.0419921875, -0.97705078125, -0.912109375, -0.84716796875, -0.7822265625, -0.71728515625, -0.65234375, -0.58740234375, -0.5224609375, -0.45751953125, -0.392578125, -0.32763671875, -0.2626953125, -0.19775390625, -0.1328125, -0.06787109375, -0.0029296875, 0.06201171875, 0.126953125, 0.19189453125, 0.2568359375, 0.32177734375, 0.38671875, 0.45166015625, 0.5166015625, 0.58154296875, 0.646484375, 0.71142578125, 0.7763671875, 0.84130859375, 0.90625, 0.97119140625, 1.0361328125, 1.10107421875, 1.166015625, 1.23095703125, 1.2958984375, 1.36083984375, 1.42578125, 1.49072265625, 1.5556640625, 1.62060546875, 1.685546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 3.0, 4.0, 12.0, 16.0, 16.0, 18.0, 38.0, 48.0, 58.0, 95.0, 132.0, 183.0, 240.0, 388.0, 573.0, 1007.0, 1980.0, 4929.0, 17764.0, 98356.0, 639472.0, 231680.0, 37019.0, 8272.0, 2757.0, 1257.0, 718.0, 455.0, 279.0, 217.0, 161.0, 125.0, 69.0, 54.0, 33.0, 31.0, 20.0, 20.0, 14.0, 12.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.28515625, -4.135986328125, -3.98681640625, -3.837646484375, -3.6884765625, -3.539306640625, -3.39013671875, -3.240966796875, -3.091796875, -2.942626953125, -2.79345703125, -2.644287109375, -2.4951171875, -2.345947265625, -2.19677734375, -2.047607421875, -1.8984375, -1.749267578125, -1.60009765625, -1.450927734375, -1.3017578125, -1.152587890625, -1.00341796875, -0.854248046875, -0.705078125, -0.555908203125, -0.40673828125, -0.257568359375, -0.1083984375, 0.040771484375, 0.18994140625, 0.339111328125, 0.48828125, 0.637451171875, 0.78662109375, 0.935791015625, 1.0849609375, 1.234130859375, 1.38330078125, 1.532470703125, 1.681640625, 1.830810546875, 1.97998046875, 2.129150390625, 2.2783203125, 2.427490234375, 2.57666015625, 2.725830078125, 2.875, 3.024169921875, 3.17333984375, 3.322509765625, 3.4716796875, 3.620849609375, 3.77001953125, 3.919189453125, 4.068359375, 4.217529296875, 4.36669921875, 4.515869140625, 4.6650390625, 4.814208984375, 4.96337890625, 5.112548828125, 5.26171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 8.0, 5.0, 7.0, 14.0, 9.0, 5.0, 8.0, 22.0, 13.0, 18.0, 25.0, 20.0, 22.0, 32.0, 51.0, 47.0, 38.0, 35.0, 42.0, 45.0, 32.0, 39.0, 32.0, 42.0, 31.0, 23.0, 50.0, 35.0, 31.0, 25.0, 25.0, 23.0, 18.0, 13.0, 15.0, 18.0, 13.0, 14.0, 17.0, 2.0, 9.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-5.04296875, -4.89208984375, -4.7412109375, -4.59033203125, -4.439453125, -4.28857421875, -4.1376953125, -3.98681640625, -3.8359375, -3.68505859375, -3.5341796875, -3.38330078125, -3.232421875, -3.08154296875, -2.9306640625, -2.77978515625, -2.62890625, -2.47802734375, -2.3271484375, -2.17626953125, -2.025390625, -1.87451171875, -1.7236328125, -1.57275390625, -1.421875, -1.27099609375, -1.1201171875, -0.96923828125, -0.818359375, -0.66748046875, -0.5166015625, -0.36572265625, -0.21484375, -0.06396484375, 0.0869140625, 0.23779296875, 0.388671875, 0.53955078125, 0.6904296875, 0.84130859375, 0.9921875, 1.14306640625, 1.2939453125, 1.44482421875, 1.595703125, 1.74658203125, 1.8974609375, 2.04833984375, 2.19921875, 2.35009765625, 2.5009765625, 2.65185546875, 2.802734375, 2.95361328125, 3.1044921875, 3.25537109375, 3.40625, 3.55712890625, 3.7080078125, 3.85888671875, 4.009765625, 4.16064453125, 4.3115234375, 4.46240234375, 4.61328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 15.0, 28.0, 45.0, 64.0, 137.0, 185.0, 329.0, 816.0, 1828.0, 5328.0, 19691.0, 105970.0, 665194.0, 201741.0, 34240.0, 8279.0, 2542.0, 1063.0, 453.0, 248.0, 132.0, 76.0, 52.0, 31.0, 15.0, 15.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.568359375, -1.511688232421875, -1.45501708984375, -1.398345947265625, -1.3416748046875, -1.285003662109375, -1.22833251953125, -1.171661376953125, -1.114990234375, -1.058319091796875, -1.00164794921875, -0.944976806640625, -0.8883056640625, -0.831634521484375, -0.77496337890625, -0.718292236328125, -0.66162109375, -0.604949951171875, -0.54827880859375, -0.491607666015625, -0.4349365234375, -0.378265380859375, -0.32159423828125, -0.264923095703125, -0.208251953125, -0.151580810546875, -0.09490966796875, -0.038238525390625, 0.0184326171875, 0.075103759765625, 0.13177490234375, 0.188446044921875, 0.2451171875, 0.301788330078125, 0.35845947265625, 0.415130615234375, 0.4718017578125, 0.528472900390625, 0.58514404296875, 0.641815185546875, 0.698486328125, 0.755157470703125, 0.81182861328125, 0.868499755859375, 0.9251708984375, 0.981842041015625, 1.03851318359375, 1.095184326171875, 1.15185546875, 1.208526611328125, 1.26519775390625, 1.321868896484375, 1.3785400390625, 1.435211181640625, 1.49188232421875, 1.548553466796875, 1.605224609375, 1.661895751953125, 1.71856689453125, 1.775238037109375, 1.8319091796875, 1.888580322265625, 1.94525146484375, 2.001922607421875, 2.05859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 4.0, 11.0, 11.0, 14.0, 17.0, 32.0, 35.0, 49.0, 86.0, 106.0, 138.0, 134.0, 108.0, 72.0, 39.0, 32.0, 26.0, 23.0, 12.0, 13.0, 8.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006704330444335938, -0.00064801424741745, -0.0006255954504013062, -0.0006031766533851624, -0.0005807578563690186, -0.0005583390593528748, -0.000535920262336731, -0.0005135014653205872, -0.0004910826683044434, -0.00046866387128829956, -0.00044624507427215576, -0.00042382627725601196, -0.00040140748023986816, -0.00037898868322372437, -0.00035656988620758057, -0.00033415108919143677, -0.00031173229217529297, -0.00028931349515914917, -0.00026689469814300537, -0.00024447590112686157, -0.00022205710411071777, -0.00019963830709457397, -0.00017721951007843018, -0.00015480071306228638, -0.00013238191604614258, -0.00010996311902999878, -8.754432201385498e-05, -6.512552499771118e-05, -4.270672798156738e-05, -2.0287930965423584e-05, 2.130866050720215e-06, 2.4549663066864014e-05, 4.696846008300781e-05, 6.938725709915161e-05, 9.180605411529541e-05, 0.00011422485113143921, 0.000136643648147583, 0.0001590624451637268, 0.0001814812421798706, 0.0002039000391960144, 0.0002263188362121582, 0.000248737633228302, 0.0002711564302444458, 0.0002935752272605896, 0.0003159940242767334, 0.0003384128212928772, 0.000360831618309021, 0.0003832504153251648, 0.0004056692123413086, 0.0004280880093574524, 0.0004505068063735962, 0.00047292560338974, 0.0004953444004058838, 0.0005177631974220276, 0.0005401819944381714, 0.0005626007914543152, 0.000585019588470459, 0.0006074383854866028, 0.0006298571825027466, 0.0006522759795188904, 0.0006746947765350342, 0.000697113573551178, 0.0007195323705673218, 0.0007419511675834656, 0.0007643699645996094]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 9.0, 7.0, 13.0, 13.0, 20.0, 26.0, 51.0, 92.0, 155.0, 238.0, 470.0, 1006.0, 2764.0, 10866.0, 78457.0, 723787.0, 200733.0, 22479.0, 4413.0, 1510.0, 643.0, 344.0, 205.0, 104.0, 57.0, 39.0, 24.0, 13.0, 8.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.42645263671875, -1.3607177734375, -1.29498291015625, -1.229248046875, -1.16351318359375, -1.0977783203125, -1.03204345703125, -0.96630859375, -0.90057373046875, -0.8348388671875, -0.76910400390625, -0.703369140625, -0.63763427734375, -0.5718994140625, -0.50616455078125, -0.4404296875, -0.37469482421875, -0.3089599609375, -0.24322509765625, -0.177490234375, -0.11175537109375, -0.0460205078125, 0.01971435546875, 0.08544921875, 0.15118408203125, 0.2169189453125, 0.28265380859375, 0.348388671875, 0.41412353515625, 0.4798583984375, 0.54559326171875, 0.611328125, 0.67706298828125, 0.7427978515625, 0.80853271484375, 0.874267578125, 0.94000244140625, 1.0057373046875, 1.07147216796875, 1.13720703125, 1.20294189453125, 1.2686767578125, 1.33441162109375, 1.400146484375, 1.46588134765625, 1.5316162109375, 1.59735107421875, 1.6630859375, 1.72882080078125, 1.7945556640625, 1.86029052734375, 1.926025390625, 1.99176025390625, 2.0574951171875, 2.12322998046875, 2.18896484375, 2.25469970703125, 2.3204345703125, 2.38616943359375, 2.451904296875, 2.51763916015625, 2.5833740234375, 2.64910888671875, 2.71484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 11.0, 15.0, 17.0, 14.0, 23.0, 29.0, 23.0, 39.0, 41.0, 48.0, 62.0, 60.0, 60.0, 73.0, 61.0, 69.0, 45.0, 52.0, 42.0, 36.0, 30.0, 21.0, 21.0, 19.0, 21.0, 9.0, 12.0, 4.0, 8.0, 6.0, 9.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.369140625, -1.32806396484375, -1.2869873046875, -1.24591064453125, -1.204833984375, -1.16375732421875, -1.1226806640625, -1.08160400390625, -1.04052734375, -0.99945068359375, -0.9583740234375, -0.91729736328125, -0.876220703125, -0.83514404296875, -0.7940673828125, -0.75299072265625, -0.7119140625, -0.67083740234375, -0.6297607421875, -0.58868408203125, -0.547607421875, -0.50653076171875, -0.4654541015625, -0.42437744140625, -0.38330078125, -0.34222412109375, -0.3011474609375, -0.26007080078125, -0.218994140625, -0.17791748046875, -0.1368408203125, -0.09576416015625, -0.0546875, -0.01361083984375, 0.0274658203125, 0.06854248046875, 0.109619140625, 0.15069580078125, 0.1917724609375, 0.23284912109375, 0.27392578125, 0.31500244140625, 0.3560791015625, 0.39715576171875, 0.438232421875, 0.47930908203125, 0.5203857421875, 0.56146240234375, 0.6025390625, 0.64361572265625, 0.6846923828125, 0.72576904296875, 0.766845703125, 0.80792236328125, 0.8489990234375, 0.89007568359375, 0.93115234375, 0.97222900390625, 1.0133056640625, 1.05438232421875, 1.095458984375, 1.13653564453125, 1.1776123046875, 1.21868896484375, 1.259765625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 8.0, 1.0, 6.0, 7.0, 13.0, 39.0, 75.0, 123.0, 262.0, 228.0, 119.0, 59.0, 29.0, 15.0, 9.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.262107849121094, -42.78217315673828, -41.30223846435547, -39.82229995727539, -38.34236526489258, -36.862430572509766, -35.38249588012695, -33.902557373046875, -32.42262268066406, -30.94268798828125, -29.462751388549805, -27.982816696166992, -26.502880096435547, -25.022945404052734, -23.543010711669922, -22.063074111938477, -20.583139419555664, -19.10320472717285, -17.623268127441406, -16.143333435058594, -14.663396835327148, -13.183462142944336, -11.703526496887207, -10.223590850830078, -8.74365520477295, -7.26371955871582, -5.783783912658691, -4.303848743438721, -2.823913097381592, -1.343977451324463, 0.1359577178955078, 1.6158933639526367, 3.0958290100097656, 4.5757646560668945, 6.055700302124023, 7.535635471343994, 9.015571594238281, 10.495506286621094, 11.975441932678223, 13.455377578735352, 14.93531322479248, 16.41524887084961, 17.895183563232422, 19.375120162963867, 20.85505485534668, 22.334991455078125, 23.814926147460938, 25.29486083984375, 26.774797439575195, 28.254732131958008, 29.734668731689453, 31.214603424072266, 32.69453811645508, 34.174476623535156, 35.65441131591797, 37.13434600830078, 38.614280700683594, 40.094215393066406, 41.57415008544922, 43.0540885925293, 44.53402328491211, 46.01395797729492, 47.493892669677734, 48.97383117675781, 50.453765869140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 3.0, 9.0, 9.0, 18.0, 9.0, 14.0, 14.0, 28.0, 21.0, 23.0, 37.0, 24.0, 41.0, 54.0, 59.0, 64.0, 106.0, 67.0, 51.0, 40.0, 50.0, 40.0, 29.0, 28.0, 23.0, 19.0, 16.0, 7.0, 15.0, 7.0, 11.0, 10.0, 5.0, 7.0, 5.0, 7.0, 2.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.978622436523438, -26.194673538208008, -25.410724639892578, -24.62677574157715, -23.84282684326172, -23.058879852294922, -22.27492904663086, -21.490982055664062, -20.707033157348633, -19.923084259033203, -19.139135360717773, -18.355186462402344, -17.571237564086914, -16.787288665771484, -16.003341674804688, -15.219392776489258, -14.435442924499512, -13.651494026184082, -12.867545127868652, -12.083597183227539, -11.29964828491211, -10.51569938659668, -9.73175048828125, -8.94780158996582, -8.16385269165039, -7.379903793334961, -6.5959553718566895, -5.81200647354126, -5.028058052062988, -4.244109153747559, -3.460160255432129, -2.6762118339538574, -1.892263412475586, -1.1083147525787354, -0.3243659734725952, 0.4595828056335449, 1.2435314655303955, 2.027480125427246, 2.811429023742676, 3.5953774452209473, 4.379326343536377, 5.163275241851807, 5.947223663330078, 6.731172561645508, 7.5151214599609375, 8.299070358276367, 9.083019256591797, 9.86696720123291, 10.65091609954834, 11.43486499786377, 12.2188138961792, 13.002761840820312, 13.786710739135742, 14.570659637451172, 15.354608535766602, 16.13855743408203, 16.92250633239746, 17.70645523071289, 18.49040412902832, 19.27435302734375, 20.05830192565918, 20.84225082397461, 21.626197814941406, 22.410146713256836, 23.194095611572266]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 10.0, 5.0, 5.0, 14.0, 16.0, 24.0, 33.0, 38.0, 56.0, 69.0, 91.0, 135.0, 169.0, 283.0, 450.0, 699.0, 1206.0, 2734.0, 6945.0, 24376.0, 178558.0, 2022481.0, 1775185.0, 145659.0, 22401.0, 6770.0, 2631.0, 1197.0, 696.0, 384.0, 278.0, 184.0, 140.0, 90.0, 56.0, 53.0, 46.0, 28.0, 21.0, 18.0, 19.0, 10.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.023345947265625, -1.95098876953125, -1.878631591796875, -1.8062744140625, -1.733917236328125, -1.66156005859375, -1.589202880859375, -1.516845703125, -1.444488525390625, -1.37213134765625, -1.299774169921875, -1.2274169921875, -1.155059814453125, -1.08270263671875, -1.010345458984375, -0.93798828125, -0.865631103515625, -0.79327392578125, -0.720916748046875, -0.6485595703125, -0.576202392578125, -0.50384521484375, -0.431488037109375, -0.359130859375, -0.286773681640625, -0.21441650390625, -0.142059326171875, -0.0697021484375, 0.002655029296875, 0.07501220703125, 0.147369384765625, 0.2197265625, 0.292083740234375, 0.36444091796875, 0.436798095703125, 0.5091552734375, 0.581512451171875, 0.65386962890625, 0.726226806640625, 0.798583984375, 0.870941162109375, 0.94329833984375, 1.015655517578125, 1.0880126953125, 1.160369873046875, 1.23272705078125, 1.305084228515625, 1.37744140625, 1.449798583984375, 1.52215576171875, 1.594512939453125, 1.6668701171875, 1.739227294921875, 1.81158447265625, 1.883941650390625, 1.956298828125, 2.028656005859375, 2.10101318359375, 2.173370361328125, 2.2457275390625, 2.318084716796875, 2.39044189453125, 2.462799072265625, 2.53515625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 3.0, 19.0, 9.0, 20.0, 28.0, 31.0, 35.0, 52.0, 43.0, 50.0, 61.0, 70.0, 55.0, 65.0, 63.0, 57.0, 65.0, 50.0, 55.0, 39.0, 27.0, 26.0, 21.0, 16.0, 15.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.43359375, -2.374664306640625, -2.31573486328125, -2.256805419921875, -2.1978759765625, -2.138946533203125, -2.08001708984375, -2.021087646484375, -1.962158203125, -1.903228759765625, -1.84429931640625, -1.785369873046875, -1.7264404296875, -1.667510986328125, -1.60858154296875, -1.549652099609375, -1.49072265625, -1.431793212890625, -1.37286376953125, -1.313934326171875, -1.2550048828125, -1.196075439453125, -1.13714599609375, -1.078216552734375, -1.019287109375, -0.960357666015625, -0.90142822265625, -0.842498779296875, -0.7835693359375, -0.724639892578125, -0.66571044921875, -0.606781005859375, -0.5478515625, -0.488922119140625, -0.42999267578125, -0.371063232421875, -0.3121337890625, -0.253204345703125, -0.19427490234375, -0.135345458984375, -0.076416015625, -0.017486572265625, 0.04144287109375, 0.100372314453125, 0.1593017578125, 0.218231201171875, 0.27716064453125, 0.336090087890625, 0.39501953125, 0.453948974609375, 0.51287841796875, 0.571807861328125, 0.6307373046875, 0.689666748046875, 0.74859619140625, 0.807525634765625, 0.866455078125, 0.925384521484375, 0.98431396484375, 1.043243408203125, 1.1021728515625, 1.161102294921875, 1.22003173828125, 1.278961181640625, 1.337890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 18.0, 20.0, 30.0, 53.0, 94.0, 161.0, 325.0, 606.0, 1616.0, 4915.0, 26247.0, 628854.0, 3441113.0, 76511.0, 9207.0, 2395.0, 1004.0, 482.0, 224.0, 147.0, 94.0, 39.0, 37.0, 25.0, 10.0, 11.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.2667236328125, -4.115478515625, -3.9642333984375, -3.81298828125, -3.6617431640625, -3.510498046875, -3.3592529296875, -3.2080078125, -3.0567626953125, -2.905517578125, -2.7542724609375, -2.60302734375, -2.4517822265625, -2.300537109375, -2.1492919921875, -1.998046875, -1.8468017578125, -1.695556640625, -1.5443115234375, -1.39306640625, -1.2418212890625, -1.090576171875, -0.9393310546875, -0.7880859375, -0.6368408203125, -0.485595703125, -0.3343505859375, -0.18310546875, -0.0318603515625, 0.119384765625, 0.2706298828125, 0.421875, 0.5731201171875, 0.724365234375, 0.8756103515625, 1.02685546875, 1.1781005859375, 1.329345703125, 1.4805908203125, 1.6318359375, 1.7830810546875, 1.934326171875, 2.0855712890625, 2.23681640625, 2.3880615234375, 2.539306640625, 2.6905517578125, 2.841796875, 2.9930419921875, 3.144287109375, 3.2955322265625, 3.44677734375, 3.5980224609375, 3.749267578125, 3.9005126953125, 4.0517578125, 4.2030029296875, 4.354248046875, 4.5054931640625, 4.65673828125, 4.8079833984375, 4.959228515625, 5.1104736328125, 5.26171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 12.0, 6.0, 15.0, 14.0, 23.0, 37.0, 62.0, 95.0, 198.0, 391.0, 738.0, 984.0, 631.0, 371.0, 193.0, 115.0, 63.0, 32.0, 28.0, 17.0, 16.0, 9.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.833984375, -3.703460693359375, -3.57293701171875, -3.442413330078125, -3.3118896484375, -3.181365966796875, -3.05084228515625, -2.920318603515625, -2.789794921875, -2.659271240234375, -2.52874755859375, -2.398223876953125, -2.2677001953125, -2.137176513671875, -2.00665283203125, -1.876129150390625, -1.74560546875, -1.615081787109375, -1.48455810546875, -1.354034423828125, -1.2235107421875, -1.092987060546875, -0.96246337890625, -0.831939697265625, -0.701416015625, -0.570892333984375, -0.44036865234375, -0.309844970703125, -0.1793212890625, -0.048797607421875, 0.08172607421875, 0.212249755859375, 0.3427734375, 0.473297119140625, 0.60382080078125, 0.734344482421875, 0.8648681640625, 0.995391845703125, 1.12591552734375, 1.256439208984375, 1.386962890625, 1.517486572265625, 1.64801025390625, 1.778533935546875, 1.9090576171875, 2.039581298828125, 2.17010498046875, 2.300628662109375, 2.43115234375, 2.561676025390625, 2.69219970703125, 2.822723388671875, 2.9532470703125, 3.083770751953125, 3.21429443359375, 3.344818115234375, 3.475341796875, 3.605865478515625, 3.73638916015625, 3.866912841796875, 3.9974365234375, 4.127960205078125, 4.25848388671875, 4.389007568359375, 4.51953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 10.0, 31.0, 247.0, 514.0, 173.0, 25.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.35200500488281, -80.06864166259766, -76.7852783203125, -73.50191497802734, -70.21855163574219, -66.9351806640625, -63.651817321777344, -60.36845397949219, -57.08509063720703, -53.801727294921875, -50.51836395263672, -47.2349967956543, -43.95163345336914, -40.668270111083984, -37.38490295410156, -34.101539611816406, -30.81817626953125, -27.534812927246094, -24.251447677612305, -20.968082427978516, -17.68471908569336, -14.401355743408203, -11.117990493774414, -7.834625244140625, -4.551261901855469, -1.267897605895996, 2.0154666900634766, 5.298830986022949, 8.582195281982422, 11.865558624267578, 15.148923873901367, 18.432289123535156, 21.71564483642578, 24.999008178710938, 28.282373428344727, 31.565738677978516, 34.84910202026367, 38.13246536254883, 41.41583251953125, 44.699195861816406, 47.98255920410156, 51.26592254638672, 54.549285888671875, 57.8326530456543, 61.11601638793945, 64.39938354492188, 67.68274688720703, 70.96611022949219, 74.24947357177734, 77.5328369140625, 80.81620025634766, 84.09956359863281, 87.3829345703125, 90.66629028320312, 93.94966125488281, 97.23302459716797, 100.51638793945312, 103.79975128173828, 107.08311462402344, 110.3664779663086, 113.64984130859375, 116.93321228027344, 120.2165756225586, 123.49993896484375, 126.7833023071289]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 8.0, 11.0, 14.0, 20.0, 17.0, 30.0, 34.0, 39.0, 50.0, 40.0, 50.0, 45.0, 62.0, 59.0, 62.0, 56.0, 40.0, 43.0, 55.0, 40.0, 37.0, 22.0, 24.0, 23.0, 30.0, 20.0, 16.0, 15.0, 6.0, 10.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.677006721496582, -12.104056358337402, -11.531105995178223, -10.958155632019043, -10.38520622253418, -9.812255859375, -9.23930549621582, -8.66635513305664, -8.093404769897461, -7.520454406738281, -6.947504043579102, -6.37455415725708, -5.8016037940979, -5.228653430938721, -4.655703544616699, -4.0827531814575195, -3.50980281829834, -2.93685245513916, -2.3639023303985596, -1.7909520864486694, -1.2180018424987793, -0.6450514793395996, -0.07210135459899902, 0.5008487701416016, 1.0737991333007812, 1.6467493772506714, 2.2196996212005615, 2.792649745941162, 3.365600109100342, 3.9385504722595215, 4.511500358581543, 5.084450721740723, 5.657402038574219, 6.230352401733398, 6.803302764892578, 7.3762526512146, 7.949203014373779, 8.522153854370117, 9.09510326385498, 9.66805362701416, 10.24100399017334, 10.81395435333252, 11.3869047164917, 11.959855079650879, 12.532804489135742, 13.105754852294922, 13.678705215454102, 14.251655578613281, 14.824605941772461, 15.39755630493164, 15.97050666809082, 16.54345703125, 17.11640739440918, 17.68935775756836, 18.26230812072754, 18.83525848388672, 19.408206939697266, 19.981157302856445, 20.554107666015625, 21.127058029174805, 21.700008392333984, 22.272958755493164, 22.845909118652344, 23.41885757446289, 23.991809844970703]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 5.0, 15.0, 29.0, 43.0, 43.0, 94.0, 147.0, 206.0, 328.0, 522.0, 859.0, 1290.0, 2249.0, 3648.0, 6487.0, 11528.0, 20628.0, 37799.0, 68321.0, 120034.0, 183437.0, 207708.0, 161578.0, 97780.0, 54644.0, 30107.0, 16477.0, 9326.0, 5269.0, 3082.0, 1898.0, 1067.0, 671.0, 451.0, 268.0, 164.0, 110.0, 78.0, 51.0, 36.0, 20.0, 12.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.51171875, -1.464935302734375, -1.41815185546875, -1.371368408203125, -1.3245849609375, -1.277801513671875, -1.23101806640625, -1.184234619140625, -1.137451171875, -1.090667724609375, -1.04388427734375, -0.997100830078125, -0.9503173828125, -0.903533935546875, -0.85675048828125, -0.809967041015625, -0.76318359375, -0.716400146484375, -0.66961669921875, -0.622833251953125, -0.5760498046875, -0.529266357421875, -0.48248291015625, -0.435699462890625, -0.388916015625, -0.342132568359375, -0.29534912109375, -0.248565673828125, -0.2017822265625, -0.154998779296875, -0.10821533203125, -0.061431884765625, -0.0146484375, 0.032135009765625, 0.07891845703125, 0.125701904296875, 0.1724853515625, 0.219268798828125, 0.26605224609375, 0.312835693359375, 0.359619140625, 0.406402587890625, 0.45318603515625, 0.499969482421875, 0.5467529296875, 0.593536376953125, 0.64031982421875, 0.687103271484375, 0.73388671875, 0.780670166015625, 0.82745361328125, 0.874237060546875, 0.9210205078125, 0.967803955078125, 1.01458740234375, 1.061370849609375, 1.108154296875, 1.154937744140625, 1.20172119140625, 1.248504638671875, 1.2952880859375, 1.342071533203125, 1.38885498046875, 1.435638427734375, 1.482421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 12.0, 14.0, 9.0, 17.0, 17.0, 27.0, 34.0, 33.0, 30.0, 38.0, 52.0, 47.0, 57.0, 67.0, 68.0, 54.0, 57.0, 57.0, 57.0, 38.0, 36.0, 39.0, 35.0, 25.0, 15.0, 17.0, 14.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.421875, -2.36370849609375, -2.3055419921875, -2.24737548828125, -2.189208984375, -2.13104248046875, -2.0728759765625, -2.01470947265625, -1.95654296875, -1.89837646484375, -1.8402099609375, -1.78204345703125, -1.723876953125, -1.66571044921875, -1.6075439453125, -1.54937744140625, -1.4912109375, -1.43304443359375, -1.3748779296875, -1.31671142578125, -1.258544921875, -1.20037841796875, -1.1422119140625, -1.08404541015625, -1.02587890625, -0.96771240234375, -0.9095458984375, -0.85137939453125, -0.793212890625, -0.73504638671875, -0.6768798828125, -0.61871337890625, -0.560546875, -0.50238037109375, -0.4442138671875, -0.38604736328125, -0.327880859375, -0.26971435546875, -0.2115478515625, -0.15338134765625, -0.09521484375, -0.03704833984375, 0.0211181640625, 0.07928466796875, 0.137451171875, 0.19561767578125, 0.2537841796875, 0.31195068359375, 0.3701171875, 0.42828369140625, 0.4864501953125, 0.54461669921875, 0.602783203125, 0.66094970703125, 0.7191162109375, 0.77728271484375, 0.83544921875, 0.89361572265625, 0.9517822265625, 1.00994873046875, 1.068115234375, 1.12628173828125, 1.1844482421875, 1.24261474609375, 1.30078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 3.0, 7.0, 8.0, 16.0, 20.0, 15.0, 31.0, 68.0, 88.0, 131.0, 189.0, 341.0, 723.0, 1640.0, 4811.0, 17828.0, 82849.0, 527980.0, 321855.0, 67972.0, 14876.0, 4081.0, 1500.0, 642.0, 312.0, 194.0, 106.0, 79.0, 54.0, 29.0, 33.0, 21.0, 14.0, 7.0, 5.0, 9.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.984375, -3.8555908203125, -3.726806640625, -3.5980224609375, -3.46923828125, -3.3404541015625, -3.211669921875, -3.0828857421875, -2.9541015625, -2.8253173828125, -2.696533203125, -2.5677490234375, -2.43896484375, -2.3101806640625, -2.181396484375, -2.0526123046875, -1.923828125, -1.7950439453125, -1.666259765625, -1.5374755859375, -1.40869140625, -1.2799072265625, -1.151123046875, -1.0223388671875, -0.8935546875, -0.7647705078125, -0.635986328125, -0.5072021484375, -0.37841796875, -0.2496337890625, -0.120849609375, 0.0079345703125, 0.13671875, 0.2655029296875, 0.394287109375, 0.5230712890625, 0.65185546875, 0.7806396484375, 0.909423828125, 1.0382080078125, 1.1669921875, 1.2957763671875, 1.424560546875, 1.5533447265625, 1.68212890625, 1.8109130859375, 1.939697265625, 2.0684814453125, 2.197265625, 2.3260498046875, 2.454833984375, 2.5836181640625, 2.71240234375, 2.8411865234375, 2.969970703125, 3.0987548828125, 3.2275390625, 3.3563232421875, 3.485107421875, 3.6138916015625, 3.74267578125, 3.8714599609375, 4.000244140625, 4.1290283203125, 4.2578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 10.0, 9.0, 5.0, 13.0, 6.0, 8.0, 14.0, 17.0, 20.0, 25.0, 19.0, 23.0, 35.0, 30.0, 49.0, 38.0, 40.0, 63.0, 54.0, 43.0, 63.0, 52.0, 33.0, 40.0, 47.0, 38.0, 34.0, 29.0, 23.0, 23.0, 21.0, 16.0, 10.0, 16.0, 8.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.31292724609375, -4.1492919921875, -3.98565673828125, -3.822021484375, -3.65838623046875, -3.4947509765625, -3.33111572265625, -3.16748046875, -3.00384521484375, -2.8402099609375, -2.67657470703125, -2.512939453125, -2.34930419921875, -2.1856689453125, -2.02203369140625, -1.8583984375, -1.69476318359375, -1.5311279296875, -1.36749267578125, -1.203857421875, -1.04022216796875, -0.8765869140625, -0.71295166015625, -0.54931640625, -0.38568115234375, -0.2220458984375, -0.05841064453125, 0.105224609375, 0.26885986328125, 0.4324951171875, 0.59613037109375, 0.759765625, 0.92340087890625, 1.0870361328125, 1.25067138671875, 1.414306640625, 1.57794189453125, 1.7415771484375, 1.90521240234375, 2.06884765625, 2.23248291015625, 2.3961181640625, 2.55975341796875, 2.723388671875, 2.88702392578125, 3.0506591796875, 3.21429443359375, 3.3779296875, 3.54156494140625, 3.7052001953125, 3.86883544921875, 4.032470703125, 4.19610595703125, 4.3597412109375, 4.52337646484375, 4.68701171875, 4.85064697265625, 5.0142822265625, 5.17791748046875, 5.341552734375, 5.50518798828125, 5.6688232421875, 5.83245849609375, 5.99609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 9.0, 10.0, 8.0, 16.0, 33.0, 31.0, 48.0, 79.0, 128.0, 208.0, 341.0, 653.0, 1245.0, 2564.0, 5597.0, 14284.0, 41368.0, 137729.0, 537246.0, 209565.0, 62237.0, 20599.0, 7702.0, 3320.0, 1606.0, 815.0, 455.0, 250.0, 147.0, 92.0, 62.0, 38.0, 19.0, 22.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1474609375, -1.111236572265625, -1.07501220703125, -1.038787841796875, -1.0025634765625, -0.966339111328125, -0.93011474609375, -0.893890380859375, -0.857666015625, -0.821441650390625, -0.78521728515625, -0.748992919921875, -0.7127685546875, -0.676544189453125, -0.64031982421875, -0.604095458984375, -0.56787109375, -0.531646728515625, -0.49542236328125, -0.459197998046875, -0.4229736328125, -0.386749267578125, -0.35052490234375, -0.314300537109375, -0.278076171875, -0.241851806640625, -0.20562744140625, -0.169403076171875, -0.1331787109375, -0.096954345703125, -0.06072998046875, -0.024505615234375, 0.01171875, 0.047943115234375, 0.08416748046875, 0.120391845703125, 0.1566162109375, 0.192840576171875, 0.22906494140625, 0.265289306640625, 0.301513671875, 0.337738037109375, 0.37396240234375, 0.410186767578125, 0.4464111328125, 0.482635498046875, 0.51885986328125, 0.555084228515625, 0.59130859375, 0.627532958984375, 0.66375732421875, 0.699981689453125, 0.7362060546875, 0.772430419921875, 0.80865478515625, 0.844879150390625, 0.881103515625, 0.917327880859375, 0.95355224609375, 0.989776611328125, 1.0260009765625, 1.062225341796875, 1.09844970703125, 1.134674072265625, 1.1708984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 7.0, 13.0, 23.0, 36.0, 34.0, 62.0, 69.0, 75.0, 88.0, 90.0, 115.0, 101.0, 72.0, 48.0, 35.0, 28.0, 19.0, 20.0, 8.0, 7.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003783702850341797, -0.0003606565296649933, -0.0003429427742958069, -0.0003252290189266205, -0.0003075152635574341, -0.0002898015081882477, -0.0002720877528190613, -0.0002543739974498749, -0.00023666024208068848, -0.00021894648671150208, -0.00020123273134231567, -0.00018351897597312927, -0.00016580522060394287, -0.00014809146523475647, -0.00013037770986557007, -0.00011266395449638367, -9.495019912719727e-05, -7.723644375801086e-05, -5.952268838882446e-05, -4.180893301963806e-05, -2.409517765045166e-05, -6.381422281265259e-06, 1.1332333087921143e-05, 2.9046088457107544e-05, 4.6759843826293945e-05, 6.447359919548035e-05, 8.218735456466675e-05, 9.990110993385315e-05, 0.00011761486530303955, 0.00013532862067222595, 0.00015304237604141235, 0.00017075613141059875, 0.00018846988677978516, 0.00020618364214897156, 0.00022389739751815796, 0.00024161115288734436, 0.00025932490825653076, 0.00027703866362571716, 0.00029475241899490356, 0.00031246617436408997, 0.00033017992973327637, 0.00034789368510246277, 0.00036560744047164917, 0.00038332119584083557, 0.00040103495121002197, 0.0004187487065792084, 0.0004364624619483948, 0.0004541762173175812, 0.0004718899726867676, 0.000489603728055954, 0.0005073174834251404, 0.0005250312387943268, 0.0005427449941635132, 0.0005604587495326996, 0.000578172504901886, 0.0005958862602710724, 0.0006136000156402588, 0.0006313137710094452, 0.0006490275263786316, 0.000666741281747818, 0.0006844550371170044, 0.0007021687924861908, 0.0007198825478553772, 0.0007375963032245636, 0.00075531005859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 2.0, 6.0, 10.0, 13.0, 16.0, 21.0, 31.0, 44.0, 70.0, 121.0, 180.0, 313.0, 584.0, 1199.0, 2660.0, 7109.0, 24300.0, 100923.0, 550486.0, 271026.0, 64061.0, 16129.0, 5101.0, 1989.0, 961.0, 491.0, 231.0, 165.0, 103.0, 66.0, 41.0, 29.0, 15.0, 11.0, 12.0, 7.0, 11.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3291015625, -1.2860107421875, -1.242919921875, -1.1998291015625, -1.15673828125, -1.1136474609375, -1.070556640625, -1.0274658203125, -0.984375, -0.9412841796875, -0.898193359375, -0.8551025390625, -0.81201171875, -0.7689208984375, -0.725830078125, -0.6827392578125, -0.6396484375, -0.5965576171875, -0.553466796875, -0.5103759765625, -0.46728515625, -0.4241943359375, -0.381103515625, -0.3380126953125, -0.294921875, -0.2518310546875, -0.208740234375, -0.1656494140625, -0.12255859375, -0.0794677734375, -0.036376953125, 0.0067138671875, 0.0498046875, 0.0928955078125, 0.135986328125, 0.1790771484375, 0.22216796875, 0.2652587890625, 0.308349609375, 0.3514404296875, 0.39453125, 0.4376220703125, 0.480712890625, 0.5238037109375, 0.56689453125, 0.6099853515625, 0.653076171875, 0.6961669921875, 0.7392578125, 0.7823486328125, 0.825439453125, 0.8685302734375, 0.91162109375, 0.9547119140625, 0.997802734375, 1.0408935546875, 1.083984375, 1.1270751953125, 1.170166015625, 1.2132568359375, 1.25634765625, 1.2994384765625, 1.342529296875, 1.3856201171875, 1.4287109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 11.0, 11.0, 10.0, 16.0, 20.0, 29.0, 34.0, 42.0, 53.0, 60.0, 63.0, 67.0, 61.0, 68.0, 72.0, 70.0, 55.0, 49.0, 42.0, 28.0, 32.0, 17.0, 22.0, 10.0, 11.0, 9.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.4033203125, -1.3601226806640625, -1.316925048828125, -1.2737274169921875, -1.23052978515625, -1.1873321533203125, -1.144134521484375, -1.1009368896484375, -1.0577392578125, -1.0145416259765625, -0.971343994140625, -0.9281463623046875, -0.88494873046875, -0.8417510986328125, -0.798553466796875, -0.7553558349609375, -0.712158203125, -0.6689605712890625, -0.625762939453125, -0.5825653076171875, -0.53936767578125, -0.4961700439453125, -0.452972412109375, -0.4097747802734375, -0.3665771484375, -0.3233795166015625, -0.280181884765625, -0.2369842529296875, -0.19378662109375, -0.1505889892578125, -0.107391357421875, -0.0641937255859375, -0.02099609375, 0.0222015380859375, 0.065399169921875, 0.1085968017578125, 0.15179443359375, 0.1949920654296875, 0.238189697265625, 0.2813873291015625, 0.3245849609375, 0.3677825927734375, 0.410980224609375, 0.4541778564453125, 0.49737548828125, 0.5405731201171875, 0.583770751953125, 0.6269683837890625, 0.670166015625, 0.7133636474609375, 0.756561279296875, 0.7997589111328125, 0.84295654296875, 0.8861541748046875, 0.929351806640625, 0.9725494384765625, 1.0157470703125, 1.0589447021484375, 1.102142333984375, 1.1453399658203125, 1.18853759765625, 1.2317352294921875, 1.274932861328125, 1.3181304931640625, 1.361328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 29.0, 45.0, 106.0, 170.0, 284.0, 159.0, 95.0, 47.0, 29.0, 6.0, 6.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40463638305664, -37.13990020751953, -35.87516784667969, -34.61043167114258, -33.345699310302734, -32.080963134765625, -30.81623077392578, -29.551494598388672, -28.286762237548828, -27.02202796936035, -25.757293701171875, -24.4925594329834, -23.227825164794922, -21.963090896606445, -20.69835662841797, -19.43362045288086, -18.168886184692383, -16.904151916503906, -15.63941764831543, -14.374683380126953, -13.109949111938477, -11.84521484375, -10.580479621887207, -9.31574535369873, -8.051011085510254, -6.786276817321777, -5.521542549133301, -4.256807804107666, -2.9920735359191895, -1.727339267730713, -0.4626045227050781, 0.8021297454833984, 2.066864013671875, 3.3315982818603516, 4.596332550048828, 5.861067295074463, 7.1258015632629395, 8.390535354614258, 9.65527057647705, 10.920004844665527, 12.184739112854004, 13.44947338104248, 14.714207649230957, 15.97894287109375, 17.243677139282227, 18.508411407470703, 19.77314567565918, 21.037879943847656, 22.302614212036133, 23.56734848022461, 24.832082748413086, 26.096817016601562, 27.36155128479004, 28.626285552978516, 29.891021728515625, 31.15575408935547, 32.42049026489258, 33.68522644042969, 34.94995880126953, 36.21469497680664, 37.479427337646484, 38.744163513183594, 40.00889587402344, 41.27363204956055, 42.53836441040039]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 4.0, 9.0, 10.0, 13.0, 9.0, 15.0, 17.0, 31.0, 28.0, 26.0, 25.0, 29.0, 30.0, 40.0, 66.0, 81.0, 78.0, 83.0, 55.0, 34.0, 43.0, 31.0, 30.0, 33.0, 31.0, 27.0, 15.0, 13.0, 13.0, 14.0, 8.0, 10.0, 5.0, 5.0, 7.0, 2.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.327194213867188, -18.654258728027344, -17.9813232421875, -17.308387756347656, -16.635452270507812, -15.962516784667969, -15.289581298828125, -14.616645812988281, -13.943710327148438, -13.270774841308594, -12.59783935546875, -11.924903869628906, -11.251968383789062, -10.579032897949219, -9.906097412109375, -9.233161926269531, -8.560226440429688, -7.887290954589844, -7.21435546875, -6.541419982910156, -5.8684844970703125, -5.195549011230469, -4.522613525390625, -3.8496780395507812, -3.1767425537109375, -2.5038070678710938, -1.83087158203125, -1.1579360961914062, -0.4850006103515625, 0.18793487548828125, 0.860870361328125, 1.5338058471679688, 2.2067413330078125, 2.8796768188476562, 3.5526123046875, 4.225547790527344, 4.8984832763671875, 5.571418762207031, 6.244354248046875, 6.917289733886719, 7.5902252197265625, 8.263160705566406, 8.93609619140625, 9.609031677246094, 10.281967163085938, 10.954902648925781, 11.627838134765625, 12.300773620605469, 12.973709106445312, 13.646644592285156, 14.319580078125, 14.992515563964844, 15.665451049804688, 16.33838653564453, 17.011322021484375, 17.68425750732422, 18.357192993164062, 19.030128479003906, 19.70306396484375, 20.375999450683594, 21.048934936523438, 21.72187042236328, 22.394805908203125, 23.06774139404297, 23.740676879882812]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 9.0, 7.0, 12.0, 19.0, 21.0, 40.0, 51.0, 64.0, 128.0, 151.0, 258.0, 413.0, 701.0, 1032.0, 1769.0, 3302.0, 6676.0, 15404.0, 43761.0, 159302.0, 697876.0, 1877318.0, 1028014.0, 254283.0, 63449.0, 21230.0, 9029.0, 4371.0, 2323.0, 1215.0, 714.0, 436.0, 330.0, 183.0, 101.0, 95.0, 54.0, 41.0, 24.0, 26.0, 11.0, 9.0, 9.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.392578125, -1.3511962890625, -1.309814453125, -1.2684326171875, -1.22705078125, -1.1856689453125, -1.144287109375, -1.1029052734375, -1.0615234375, -1.0201416015625, -0.978759765625, -0.9373779296875, -0.89599609375, -0.8546142578125, -0.813232421875, -0.7718505859375, -0.73046875, -0.6890869140625, -0.647705078125, -0.6063232421875, -0.56494140625, -0.5235595703125, -0.482177734375, -0.4407958984375, -0.3994140625, -0.3580322265625, -0.316650390625, -0.2752685546875, -0.23388671875, -0.1925048828125, -0.151123046875, -0.1097412109375, -0.068359375, -0.0269775390625, 0.014404296875, 0.0557861328125, 0.09716796875, 0.1385498046875, 0.179931640625, 0.2213134765625, 0.2626953125, 0.3040771484375, 0.345458984375, 0.3868408203125, 0.42822265625, 0.4696044921875, 0.510986328125, 0.5523681640625, 0.59375, 0.6351318359375, 0.676513671875, 0.7178955078125, 0.75927734375, 0.8006591796875, 0.842041015625, 0.8834228515625, 0.9248046875, 0.9661865234375, 1.007568359375, 1.0489501953125, 1.09033203125, 1.1317138671875, 1.173095703125, 1.2144775390625, 1.255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 12.0, 13.0, 16.0, 25.0, 33.0, 40.0, 30.0, 54.0, 47.0, 46.0, 48.0, 80.0, 55.0, 64.0, 84.0, 69.0, 47.0, 49.0, 37.0, 39.0, 20.0, 13.0, 16.0, 16.0, 11.0, 9.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.44140625, -2.3825836181640625, -2.323760986328125, -2.2649383544921875, -2.20611572265625, -2.1472930908203125, -2.088470458984375, -2.0296478271484375, -1.9708251953125, -1.9120025634765625, -1.853179931640625, -1.7943572998046875, -1.73553466796875, -1.6767120361328125, -1.617889404296875, -1.5590667724609375, -1.500244140625, -1.4414215087890625, -1.382598876953125, -1.3237762451171875, -1.26495361328125, -1.2061309814453125, -1.147308349609375, -1.0884857177734375, -1.0296630859375, -0.9708404541015625, -0.912017822265625, -0.8531951904296875, -0.79437255859375, -0.7355499267578125, -0.676727294921875, -0.6179046630859375, -0.55908203125, -0.5002593994140625, -0.441436767578125, -0.3826141357421875, -0.32379150390625, -0.2649688720703125, -0.206146240234375, -0.1473236083984375, -0.0885009765625, -0.0296783447265625, 0.029144287109375, 0.0879669189453125, 0.14678955078125, 0.2056121826171875, 0.264434814453125, 0.3232574462890625, 0.382080078125, 0.4409027099609375, 0.499725341796875, 0.5585479736328125, 0.61737060546875, 0.6761932373046875, 0.735015869140625, 0.7938385009765625, 0.8526611328125, 0.9114837646484375, 0.970306396484375, 1.0291290283203125, 1.08795166015625, 1.1467742919921875, 1.205596923828125, 1.2644195556640625, 1.3232421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 10.0, 11.0, 27.0, 51.0, 68.0, 133.0, 271.0, 651.0, 2262.0, 18681.0, 2723805.0, 1431054.0, 14079.0, 1996.0, 600.0, 296.0, 139.0, 69.0, 35.0, 18.0, 12.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.140625, -6.9022216796875, -6.663818359375, -6.4254150390625, -6.18701171875, -5.9486083984375, -5.710205078125, -5.4718017578125, -5.2333984375, -4.9949951171875, -4.756591796875, -4.5181884765625, -4.27978515625, -4.0413818359375, -3.802978515625, -3.5645751953125, -3.326171875, -3.0877685546875, -2.849365234375, -2.6109619140625, -2.37255859375, -2.1341552734375, -1.895751953125, -1.6573486328125, -1.4189453125, -1.1805419921875, -0.942138671875, -0.7037353515625, -0.46533203125, -0.2269287109375, 0.011474609375, 0.2498779296875, 0.48828125, 0.7266845703125, 0.965087890625, 1.2034912109375, 1.44189453125, 1.6802978515625, 1.918701171875, 2.1571044921875, 2.3955078125, 2.6339111328125, 2.872314453125, 3.1107177734375, 3.34912109375, 3.5875244140625, 3.825927734375, 4.0643310546875, 4.302734375, 4.5411376953125, 4.779541015625, 5.0179443359375, 5.25634765625, 5.4947509765625, 5.733154296875, 5.9715576171875, 6.2099609375, 6.4483642578125, 6.686767578125, 6.9251708984375, 7.16357421875, 7.4019775390625, 7.640380859375, 7.8787841796875, 8.1171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 8.0, 13.0, 31.0, 65.0, 108.0, 213.0, 572.0, 1155.0, 1070.0, 485.0, 181.0, 86.0, 36.0, 23.0, 8.0, 10.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.74267578125, -4.5439453125, -4.34521484375, -4.146484375, -3.94775390625, -3.7490234375, -3.55029296875, -3.3515625, -3.15283203125, -2.9541015625, -2.75537109375, -2.556640625, -2.35791015625, -2.1591796875, -1.96044921875, -1.76171875, -1.56298828125, -1.3642578125, -1.16552734375, -0.966796875, -0.76806640625, -0.5693359375, -0.37060546875, -0.171875, 0.02685546875, 0.2255859375, 0.42431640625, 0.623046875, 0.82177734375, 1.0205078125, 1.21923828125, 1.41796875, 1.61669921875, 1.8154296875, 2.01416015625, 2.212890625, 2.41162109375, 2.6103515625, 2.80908203125, 3.0078125, 3.20654296875, 3.4052734375, 3.60400390625, 3.802734375, 4.00146484375, 4.2001953125, 4.39892578125, 4.59765625, 4.79638671875, 4.9951171875, 5.19384765625, 5.392578125, 5.59130859375, 5.7900390625, 5.98876953125, 6.1875, 6.38623046875, 6.5849609375, 6.78369140625, 6.982421875, 7.18115234375, 7.3798828125, 7.57861328125, 7.77734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 14.0, 16.0, 67.0, 144.0, 229.0, 225.0, 167.0, 78.0, 27.0, 15.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.09193420410156, -65.66987609863281, -64.24781799316406, -62.82575607299805, -61.40369415283203, -59.98163604736328, -58.559574127197266, -57.137516021728516, -55.7154541015625, -54.29339599609375, -52.871334075927734, -51.449275970458984, -50.02721405029297, -48.60515594482422, -47.1830940246582, -45.76103591918945, -44.33897399902344, -42.91691589355469, -41.49485397338867, -40.07279586791992, -38.650733947753906, -37.228675842285156, -35.80661392211914, -34.38455581665039, -32.96249771118164, -31.540437698364258, -30.118377685546875, -28.696317672729492, -27.27425765991211, -25.852197647094727, -24.430137634277344, -23.008079528808594, -21.586015701293945, -20.163955688476562, -18.74189567565918, -17.319835662841797, -15.897775650024414, -14.475715637207031, -13.053656578063965, -11.631596565246582, -10.2095365524292, -8.787476539611816, -7.365416526794434, -5.943356990814209, -4.521296977996826, -3.0992369651794434, -1.6771774291992188, -0.25511741638183594, 1.1669425964355469, 2.5890026092529297, 4.0110626220703125, 5.433122158050537, 6.85518217086792, 8.277242660522461, 9.699301719665527, 11.12136173248291, 12.543421745300293, 13.965481758117676, 15.387541770935059, 16.809600830078125, 18.231660842895508, 19.65372085571289, 21.075780868530273, 22.497840881347656, 23.91990089416504]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 13.0, 12.0, 20.0, 19.0, 20.0, 21.0, 35.0, 35.0, 41.0, 40.0, 55.0, 61.0, 64.0, 69.0, 69.0, 59.0, 73.0, 48.0, 39.0, 32.0, 20.0, 25.0, 22.0, 25.0, 20.0, 18.0, 4.0, 6.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.403064727783203, -17.816274642944336, -17.22948455810547, -16.642696380615234, -16.055906295776367, -15.4691162109375, -14.88232707977295, -14.295537948608398, -13.708747863769531, -13.121957778930664, -12.535168647766113, -11.948379516601562, -11.361589431762695, -10.774799346923828, -10.188010215759277, -9.601221084594727, -9.01443099975586, -8.427640914916992, -7.840851783752441, -7.254062175750732, -6.667272567749023, -6.0804829597473145, -5.4936933517456055, -4.9069037437438965, -4.3201141357421875, -3.7333245277404785, -3.1465349197387695, -2.5597453117370605, -1.9729557037353516, -1.3861660957336426, -0.7993764877319336, -0.2125868797302246, 0.3742046356201172, 0.9609942436218262, 1.5477838516235352, 2.134573459625244, 2.721363067626953, 3.308152675628662, 3.894942283630371, 4.48173189163208, 5.068521499633789, 5.655311107635498, 6.242100715637207, 6.828890323638916, 7.415679931640625, 8.002470016479492, 8.589259147644043, 9.176048278808594, 9.762838363647461, 10.349628448486328, 10.936417579650879, 11.52320671081543, 12.109996795654297, 12.696786880493164, 13.283576011657715, 13.870365142822266, 14.457155227661133, 15.0439453125, 15.63073444366455, 16.2175235748291, 16.80431365966797, 17.391103744506836, 17.977893829345703, 18.564682006835938, 19.151472091674805]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 7.0, 12.0, 12.0, 15.0, 25.0, 35.0, 56.0, 78.0, 110.0, 178.0, 286.0, 457.0, 727.0, 1215.0, 2073.0, 3599.0, 6345.0, 11362.0, 21645.0, 40898.0, 78200.0, 146408.0, 229935.0, 219620.0, 133746.0, 70580.0, 36995.0, 19621.0, 10505.0, 5695.0, 3255.0, 1900.0, 1117.0, 643.0, 397.0, 284.0, 180.0, 115.0, 85.0, 53.0, 31.0, 29.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.458984375, -1.408538818359375, -1.35809326171875, -1.307647705078125, -1.2572021484375, -1.206756591796875, -1.15631103515625, -1.105865478515625, -1.055419921875, -1.004974365234375, -0.95452880859375, -0.904083251953125, -0.8536376953125, -0.803192138671875, -0.75274658203125, -0.702301025390625, -0.65185546875, -0.601409912109375, -0.55096435546875, -0.500518798828125, -0.4500732421875, -0.399627685546875, -0.34918212890625, -0.298736572265625, -0.248291015625, -0.197845458984375, -0.14739990234375, -0.096954345703125, -0.0465087890625, 0.003936767578125, 0.05438232421875, 0.104827880859375, 0.1552734375, 0.205718994140625, 0.25616455078125, 0.306610107421875, 0.3570556640625, 0.407501220703125, 0.45794677734375, 0.508392333984375, 0.558837890625, 0.609283447265625, 0.65972900390625, 0.710174560546875, 0.7606201171875, 0.811065673828125, 0.86151123046875, 0.911956787109375, 0.96240234375, 1.012847900390625, 1.06329345703125, 1.113739013671875, 1.1641845703125, 1.214630126953125, 1.26507568359375, 1.315521240234375, 1.365966796875, 1.416412353515625, 1.46685791015625, 1.517303466796875, 1.5677490234375, 1.618194580078125, 1.66864013671875, 1.719085693359375, 1.76953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 7.0, 12.0, 6.0, 20.0, 20.0, 24.0, 23.0, 31.0, 28.0, 39.0, 49.0, 41.0, 51.0, 63.0, 61.0, 61.0, 66.0, 57.0, 61.0, 47.0, 52.0, 37.0, 20.0, 28.0, 17.0, 23.0, 13.0, 10.0, 8.0, 11.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.447265625, -2.386383056640625, -2.32550048828125, -2.264617919921875, -2.2037353515625, -2.142852783203125, -2.08197021484375, -2.021087646484375, -1.960205078125, -1.899322509765625, -1.83843994140625, -1.777557373046875, -1.7166748046875, -1.655792236328125, -1.59490966796875, -1.534027099609375, -1.47314453125, -1.412261962890625, -1.35137939453125, -1.290496826171875, -1.2296142578125, -1.168731689453125, -1.10784912109375, -1.046966552734375, -0.986083984375, -0.925201416015625, -0.86431884765625, -0.803436279296875, -0.7425537109375, -0.681671142578125, -0.62078857421875, -0.559906005859375, -0.4990234375, -0.438140869140625, -0.37725830078125, -0.316375732421875, -0.2554931640625, -0.194610595703125, -0.13372802734375, -0.072845458984375, -0.011962890625, 0.048919677734375, 0.10980224609375, 0.170684814453125, 0.2315673828125, 0.292449951171875, 0.35333251953125, 0.414215087890625, 0.47509765625, 0.535980224609375, 0.59686279296875, 0.657745361328125, 0.7186279296875, 0.779510498046875, 0.84039306640625, 0.901275634765625, 0.962158203125, 1.023040771484375, 1.08392333984375, 1.144805908203125, 1.2056884765625, 1.266571044921875, 1.32745361328125, 1.388336181640625, 1.44921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 13.0, 11.0, 26.0, 33.0, 34.0, 38.0, 65.0, 68.0, 99.0, 166.0, 225.0, 362.0, 546.0, 1030.0, 2261.0, 5948.0, 21584.0, 100062.0, 625877.0, 227318.0, 44833.0, 10905.0, 3528.0, 1350.0, 757.0, 447.0, 264.0, 163.0, 165.0, 95.0, 65.0, 50.0, 38.0, 34.0, 18.0, 20.0, 15.0, 6.0, 9.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.3828125, -4.256683349609375, -4.13055419921875, -4.004425048828125, -3.8782958984375, -3.752166748046875, -3.62603759765625, -3.499908447265625, -3.373779296875, -3.247650146484375, -3.12152099609375, -2.995391845703125, -2.8692626953125, -2.743133544921875, -2.61700439453125, -2.490875244140625, -2.36474609375, -2.238616943359375, -2.11248779296875, -1.986358642578125, -1.8602294921875, -1.734100341796875, -1.60797119140625, -1.481842041015625, -1.355712890625, -1.229583740234375, -1.10345458984375, -0.977325439453125, -0.8511962890625, -0.725067138671875, -0.59893798828125, -0.472808837890625, -0.3466796875, -0.220550537109375, -0.09442138671875, 0.031707763671875, 0.1578369140625, 0.283966064453125, 0.41009521484375, 0.536224365234375, 0.662353515625, 0.788482666015625, 0.91461181640625, 1.040740966796875, 1.1668701171875, 1.292999267578125, 1.41912841796875, 1.545257568359375, 1.67138671875, 1.797515869140625, 1.92364501953125, 2.049774169921875, 2.1759033203125, 2.302032470703125, 2.42816162109375, 2.554290771484375, 2.680419921875, 2.806549072265625, 2.93267822265625, 3.058807373046875, 3.1849365234375, 3.311065673828125, 3.43719482421875, 3.563323974609375, 3.689453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 4.0, 7.0, 7.0, 14.0, 8.0, 12.0, 14.0, 22.0, 20.0, 27.0, 33.0, 35.0, 36.0, 40.0, 50.0, 46.0, 59.0, 68.0, 62.0, 57.0, 52.0, 58.0, 54.0, 36.0, 19.0, 26.0, 27.0, 19.0, 19.0, 16.0, 12.0, 15.0, 8.0, 4.0, 7.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.29296875, -6.088623046875, -5.88427734375, -5.679931640625, -5.4755859375, -5.271240234375, -5.06689453125, -4.862548828125, -4.658203125, -4.453857421875, -4.24951171875, -4.045166015625, -3.8408203125, -3.636474609375, -3.43212890625, -3.227783203125, -3.0234375, -2.819091796875, -2.61474609375, -2.410400390625, -2.2060546875, -2.001708984375, -1.79736328125, -1.593017578125, -1.388671875, -1.184326171875, -0.97998046875, -0.775634765625, -0.5712890625, -0.366943359375, -0.16259765625, 0.041748046875, 0.24609375, 0.450439453125, 0.65478515625, 0.859130859375, 1.0634765625, 1.267822265625, 1.47216796875, 1.676513671875, 1.880859375, 2.085205078125, 2.28955078125, 2.493896484375, 2.6982421875, 2.902587890625, 3.10693359375, 3.311279296875, 3.515625, 3.719970703125, 3.92431640625, 4.128662109375, 4.3330078125, 4.537353515625, 4.74169921875, 4.946044921875, 5.150390625, 5.354736328125, 5.55908203125, 5.763427734375, 5.9677734375, 6.172119140625, 6.37646484375, 6.580810546875, 6.78515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 0.0, 4.0, 7.0, 5.0, 4.0, 13.0, 15.0, 22.0, 28.0, 22.0, 37.0, 50.0, 72.0, 116.0, 158.0, 207.0, 316.0, 488.0, 822.0, 1588.0, 3269.0, 7587.0, 20416.0, 62625.0, 240451.0, 565109.0, 96368.0, 29128.0, 10599.0, 4309.0, 2012.0, 1004.0, 552.0, 343.0, 218.0, 160.0, 113.0, 85.0, 47.0, 40.0, 36.0, 36.0, 18.0, 13.0, 5.0, 9.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1220703125, -1.0882415771484375, -1.054412841796875, -1.0205841064453125, -0.98675537109375, -0.9529266357421875, -0.919097900390625, -0.8852691650390625, -0.8514404296875, -0.8176116943359375, -0.783782958984375, -0.7499542236328125, -0.71612548828125, -0.6822967529296875, -0.648468017578125, -0.6146392822265625, -0.580810546875, -0.5469818115234375, -0.513153076171875, -0.4793243408203125, -0.44549560546875, -0.4116668701171875, -0.377838134765625, -0.3440093994140625, -0.3101806640625, -0.2763519287109375, -0.242523193359375, -0.2086944580078125, -0.17486572265625, -0.1410369873046875, -0.107208251953125, -0.0733795166015625, -0.03955078125, -0.0057220458984375, 0.028106689453125, 0.0619354248046875, 0.09576416015625, 0.1295928955078125, 0.163421630859375, 0.1972503662109375, 0.2310791015625, 0.2649078369140625, 0.298736572265625, 0.3325653076171875, 0.36639404296875, 0.4002227783203125, 0.434051513671875, 0.4678802490234375, 0.501708984375, 0.5355377197265625, 0.569366455078125, 0.6031951904296875, 0.63702392578125, 0.6708526611328125, 0.704681396484375, 0.7385101318359375, 0.7723388671875, 0.8061676025390625, 0.839996337890625, 0.8738250732421875, 0.90765380859375, 0.9414825439453125, 0.975311279296875, 1.0091400146484375, 1.04296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 2.0, 16.0, 22.0, 20.0, 17.0, 21.0, 50.0, 38.0, 61.0, 101.0, 108.0, 111.0, 97.0, 86.0, 58.0, 37.0, 30.0, 31.0, 18.0, 16.0, 13.0, 17.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039768218994140625, -0.00038129836320877075, -0.00036491453647613525, -0.00034853070974349976, -0.00033214688301086426, -0.00031576305627822876, -0.00029937922954559326, -0.00028299540281295776, -0.00026661157608032227, -0.00025022774934768677, -0.00023384392261505127, -0.00021746009588241577, -0.00020107626914978027, -0.00018469244241714478, -0.00016830861568450928, -0.00015192478895187378, -0.00013554096221923828, -0.00011915713548660278, -0.00010277330875396729, -8.638948202133179e-05, -7.000565528869629e-05, -5.362182855606079e-05, -3.723800182342529e-05, -2.0854175090789795e-05, -4.470348358154297e-06, 1.1913478374481201e-05, 2.82973051071167e-05, 4.46811318397522e-05, 6.10649585723877e-05, 7.74487853050232e-05, 9.383261203765869e-05, 0.00011021643877029419, 0.0001266002655029297, 0.00014298409223556519, 0.00015936791896820068, 0.00017575174570083618, 0.00019213557243347168, 0.00020851939916610718, 0.00022490322589874268, 0.00024128705263137817, 0.00025767087936401367, 0.00027405470609664917, 0.00029043853282928467, 0.00030682235956192017, 0.00032320618629455566, 0.00033959001302719116, 0.00035597383975982666, 0.00037235766649246216, 0.00038874149322509766, 0.00040512531995773315, 0.00042150914669036865, 0.00043789297342300415, 0.00045427680015563965, 0.00047066062688827515, 0.00048704445362091064, 0.0005034282803535461, 0.0005198121070861816, 0.0005361959338188171, 0.0005525797605514526, 0.0005689635872840881, 0.0005853474140167236, 0.0006017312407493591, 0.0006181150674819946, 0.0006344988942146301, 0.0006508827209472656]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 10.0, 9.0, 9.0, 22.0, 31.0, 59.0, 81.0, 115.0, 164.0, 292.0, 519.0, 935.0, 2152.0, 5420.0, 17124.0, 71088.0, 596955.0, 281103.0, 51083.0, 13095.0, 4417.0, 1810.0, 877.0, 418.0, 262.0, 166.0, 97.0, 80.0, 48.0, 25.0, 18.0, 13.0, 6.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.333984375, -1.2921600341796875, -1.250335693359375, -1.2085113525390625, -1.16668701171875, -1.1248626708984375, -1.083038330078125, -1.0412139892578125, -0.9993896484375, -0.9575653076171875, -0.915740966796875, -0.8739166259765625, -0.83209228515625, -0.7902679443359375, -0.748443603515625, -0.7066192626953125, -0.664794921875, -0.6229705810546875, -0.581146240234375, -0.5393218994140625, -0.49749755859375, -0.4556732177734375, -0.413848876953125, -0.3720245361328125, -0.3302001953125, -0.2883758544921875, -0.246551513671875, -0.2047271728515625, -0.16290283203125, -0.1210784912109375, -0.079254150390625, -0.0374298095703125, 0.00439453125, 0.0462188720703125, 0.088043212890625, 0.1298675537109375, 0.17169189453125, 0.2135162353515625, 0.255340576171875, 0.2971649169921875, 0.3389892578125, 0.3808135986328125, 0.422637939453125, 0.4644622802734375, 0.50628662109375, 0.5481109619140625, 0.589935302734375, 0.6317596435546875, 0.673583984375, 0.7154083251953125, 0.757232666015625, 0.7990570068359375, 0.84088134765625, 0.8827056884765625, 0.924530029296875, 0.9663543701171875, 1.0081787109375, 1.0500030517578125, 1.091827392578125, 1.1336517333984375, 1.17547607421875, 1.2173004150390625, 1.259124755859375, 1.3009490966796875, 1.3427734375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 12.0, 31.0, 22.0, 48.0, 51.0, 94.0, 115.0, 109.0, 110.0, 117.0, 74.0, 53.0, 43.0, 37.0, 17.0, 12.0, 12.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.345703125, -2.288482666015625, -2.23126220703125, -2.174041748046875, -2.1168212890625, -2.059600830078125, -2.00238037109375, -1.945159912109375, -1.887939453125, -1.830718994140625, -1.77349853515625, -1.716278076171875, -1.6590576171875, -1.601837158203125, -1.54461669921875, -1.487396240234375, -1.43017578125, -1.372955322265625, -1.31573486328125, -1.258514404296875, -1.2012939453125, -1.144073486328125, -1.08685302734375, -1.029632568359375, -0.972412109375, -0.915191650390625, -0.85797119140625, -0.800750732421875, -0.7435302734375, -0.686309814453125, -0.62908935546875, -0.571868896484375, -0.5146484375, -0.457427978515625, -0.40020751953125, -0.342987060546875, -0.2857666015625, -0.228546142578125, -0.17132568359375, -0.114105224609375, -0.056884765625, 0.000335693359375, 0.05755615234375, 0.114776611328125, 0.1719970703125, 0.229217529296875, 0.28643798828125, 0.343658447265625, 0.40087890625, 0.458099365234375, 0.51531982421875, 0.572540283203125, 0.6297607421875, 0.686981201171875, 0.74420166015625, 0.801422119140625, 0.858642578125, 0.915863037109375, 0.97308349609375, 1.030303955078125, 1.0875244140625, 1.144744873046875, 1.20196533203125, 1.259185791015625, 1.31640625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 12.0, 42.0, 97.0, 165.0, 360.0, 167.0, 75.0, 49.0, 13.0, 9.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.885417938232422, -20.35997772216797, -18.83453941345215, -17.309099197387695, -15.783659934997559, -14.258220672607422, -12.732780456542969, -11.207341194152832, -9.681901931762695, -8.156462669372559, -6.631022930145264, -5.105583190917969, -3.580143928527832, -2.0547046661376953, -0.5292644500732422, 0.9961748123168945, 2.5216140747070312, 4.047053337097168, 5.572493076324463, 7.097932815551758, 8.623372077941895, 10.148811340332031, 11.674251556396484, 13.199690818786621, 14.725130081176758, 16.25057029724121, 17.77600860595703, 19.301448822021484, 20.826889038085938, 22.352327346801758, 23.87776756286621, 25.40320587158203, 26.92864990234375, 28.454090118408203, 29.979528427124023, 31.504968643188477, 33.0304069519043, 34.55584716796875, 36.0812873840332, 37.606727600097656, 39.132164001464844, 40.6576042175293, 42.18304443359375, 43.70848083496094, 45.23392105102539, 46.759361267089844, 48.2848014831543, 49.81024169921875, 51.3356819152832, 52.861122131347656, 54.38656234741211, 55.91200256347656, 57.43743896484375, 58.9628791809082, 60.488319396972656, 62.01375961303711, 63.53919982910156, 65.06463623046875, 66.59008026123047, 68.11551666259766, 69.64096069335938, 71.16639709472656, 72.69183349609375, 74.21727752685547, 75.74271392822266]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 14.0, 18.0, 13.0, 25.0, 28.0, 26.0, 21.0, 31.0, 28.0, 36.0, 52.0, 72.0, 105.0, 90.0, 61.0, 44.0, 40.0, 27.0, 31.0, 27.0, 28.0, 23.0, 23.0, 17.0, 13.0, 11.0, 13.0, 8.0, 4.0, 6.0, 8.0, 4.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.87209129333496, -22.155550003051758, -21.439008712768555, -20.72246742248535, -20.00592613220215, -19.289384841918945, -18.57284164428711, -17.856300354003906, -17.139759063720703, -16.4232177734375, -15.706676483154297, -14.990135192871094, -14.27359390258789, -13.557052612304688, -12.840510368347168, -12.123969078063965, -11.407428741455078, -10.690887451171875, -9.974346160888672, -9.257804870605469, -8.541263580322266, -7.824721813201904, -7.108180046081543, -6.39163875579834, -5.675097465515137, -4.958556175231934, -4.2420148849487305, -3.525473117828369, -2.808931827545166, -2.092390537261963, -1.3758487701416016, -0.6593074798583984, 0.05723381042480469, 0.7737752199172974, 1.49031662940979, 2.2068581581115723, 2.9233994483947754, 3.6399407386779785, 4.35648250579834, 5.073023796081543, 5.789565086364746, 6.506106376647949, 7.222647666931152, 7.939189434051514, 8.655731201171875, 9.372272491455078, 10.088813781738281, 10.805355072021484, 11.521896362304688, 12.23843765258789, 12.954978942871094, 13.671520233154297, 14.3880615234375, 15.104602813720703, 15.821145057678223, 16.53768539428711, 17.254226684570312, 17.970767974853516, 18.68730926513672, 19.403850555419922, 20.120391845703125, 20.836933135986328, 21.55347442626953, 22.270015716552734, 22.98655891418457]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 11.0, 11.0, 13.0, 23.0, 16.0, 34.0, 35.0, 51.0, 95.0, 78.0, 123.0, 208.0, 313.0, 581.0, 997.0, 2201.0, 5864.0, 21108.0, 131343.0, 1274474.0, 2364980.0, 335729.0, 40042.0, 9474.0, 3251.0, 1360.0, 703.0, 369.0, 210.0, 158.0, 108.0, 69.0, 62.0, 41.0, 36.0, 22.0, 22.0, 15.0, 9.0, 9.0, 7.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.176727294921875, -2.09954833984375, -2.022369384765625, -1.9451904296875, -1.868011474609375, -1.79083251953125, -1.713653564453125, -1.636474609375, -1.559295654296875, -1.48211669921875, -1.404937744140625, -1.3277587890625, -1.250579833984375, -1.17340087890625, -1.096221923828125, -1.01904296875, -0.941864013671875, -0.86468505859375, -0.787506103515625, -0.7103271484375, -0.633148193359375, -0.55596923828125, -0.478790283203125, -0.401611328125, -0.324432373046875, -0.24725341796875, -0.170074462890625, -0.0928955078125, -0.015716552734375, 0.06146240234375, 0.138641357421875, 0.2158203125, 0.292999267578125, 0.37017822265625, 0.447357177734375, 0.5245361328125, 0.601715087890625, 0.67889404296875, 0.756072998046875, 0.833251953125, 0.910430908203125, 0.98760986328125, 1.064788818359375, 1.1419677734375, 1.219146728515625, 1.29632568359375, 1.373504638671875, 1.45068359375, 1.527862548828125, 1.60504150390625, 1.682220458984375, 1.7593994140625, 1.836578369140625, 1.91375732421875, 1.990936279296875, 2.068115234375, 2.145294189453125, 2.22247314453125, 2.299652099609375, 2.3768310546875, 2.454010009765625, 2.53118896484375, 2.608367919921875, 2.685546875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 12.0, 12.0, 19.0, 19.0, 23.0, 29.0, 25.0, 45.0, 48.0, 41.0, 57.0, 55.0, 70.0, 56.0, 60.0, 63.0, 57.0, 50.0, 48.0, 47.0, 32.0, 21.0, 20.0, 18.0, 20.0, 14.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.12762451171875, -2.0677490234375, -2.00787353515625, -1.947998046875, -1.88812255859375, -1.8282470703125, -1.76837158203125, -1.70849609375, -1.64862060546875, -1.5887451171875, -1.52886962890625, -1.468994140625, -1.40911865234375, -1.3492431640625, -1.28936767578125, -1.2294921875, -1.16961669921875, -1.1097412109375, -1.04986572265625, -0.989990234375, -0.93011474609375, -0.8702392578125, -0.81036376953125, -0.75048828125, -0.69061279296875, -0.6307373046875, -0.57086181640625, -0.510986328125, -0.45111083984375, -0.3912353515625, -0.33135986328125, -0.271484375, -0.21160888671875, -0.1517333984375, -0.09185791015625, -0.031982421875, 0.02789306640625, 0.0877685546875, 0.14764404296875, 0.20751953125, 0.26739501953125, 0.3272705078125, 0.38714599609375, 0.447021484375, 0.50689697265625, 0.5667724609375, 0.62664794921875, 0.6865234375, 0.74639892578125, 0.8062744140625, 0.86614990234375, 0.926025390625, 0.98590087890625, 1.0457763671875, 1.10565185546875, 1.16552734375, 1.22540283203125, 1.2852783203125, 1.34515380859375, 1.405029296875, 1.46490478515625, 1.5247802734375, 1.58465576171875, 1.64453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 5.0, 9.0, 11.0, 10.0, 18.0, 34.0, 31.0, 60.0, 93.0, 139.0, 292.0, 535.0, 1118.0, 4328.0, 28110.0, 819382.0, 3262128.0, 67152.0, 7582.0, 1710.0, 658.0, 338.0, 177.0, 122.0, 72.0, 50.0, 36.0, 24.0, 17.0, 12.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.91015625, -5.74212646484375, -5.5740966796875, -5.40606689453125, -5.238037109375, -5.07000732421875, -4.9019775390625, -4.73394775390625, -4.56591796875, -4.39788818359375, -4.2298583984375, -4.06182861328125, -3.893798828125, -3.72576904296875, -3.5577392578125, -3.38970947265625, -3.2216796875, -3.05364990234375, -2.8856201171875, -2.71759033203125, -2.549560546875, -2.38153076171875, -2.2135009765625, -2.04547119140625, -1.87744140625, -1.70941162109375, -1.5413818359375, -1.37335205078125, -1.205322265625, -1.03729248046875, -0.8692626953125, -0.70123291015625, -0.533203125, -0.36517333984375, -0.1971435546875, -0.02911376953125, 0.138916015625, 0.30694580078125, 0.4749755859375, 0.64300537109375, 0.81103515625, 0.97906494140625, 1.1470947265625, 1.31512451171875, 1.483154296875, 1.65118408203125, 1.8192138671875, 1.98724365234375, 2.1552734375, 2.32330322265625, 2.4913330078125, 2.65936279296875, 2.827392578125, 2.99542236328125, 3.1634521484375, 3.33148193359375, 3.49951171875, 3.66754150390625, 3.8355712890625, 4.00360107421875, 4.171630859375, 4.33966064453125, 4.5076904296875, 4.67572021484375, 4.84375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 16.0, 15.0, 17.0, 29.0, 35.0, 42.0, 74.0, 95.0, 171.0, 254.0, 420.0, 566.0, 624.0, 559.0, 381.0, 229.0, 160.0, 108.0, 71.0, 47.0, 40.0, 23.0, 21.0, 12.0, 13.0, 8.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.146484375, -3.036407470703125, -2.92633056640625, -2.816253662109375, -2.7061767578125, -2.596099853515625, -2.48602294921875, -2.375946044921875, -2.265869140625, -2.155792236328125, -2.04571533203125, -1.935638427734375, -1.8255615234375, -1.715484619140625, -1.60540771484375, -1.495330810546875, -1.38525390625, -1.275177001953125, -1.16510009765625, -1.055023193359375, -0.9449462890625, -0.834869384765625, -0.72479248046875, -0.614715576171875, -0.504638671875, -0.394561767578125, -0.28448486328125, -0.174407958984375, -0.0643310546875, 0.045745849609375, 0.15582275390625, 0.265899658203125, 0.3759765625, 0.486053466796875, 0.59613037109375, 0.706207275390625, 0.8162841796875, 0.926361083984375, 1.03643798828125, 1.146514892578125, 1.256591796875, 1.366668701171875, 1.47674560546875, 1.586822509765625, 1.6968994140625, 1.806976318359375, 1.91705322265625, 2.027130126953125, 2.13720703125, 2.247283935546875, 2.35736083984375, 2.467437744140625, 2.5775146484375, 2.687591552734375, 2.79766845703125, 2.907745361328125, 3.017822265625, 3.127899169921875, 3.23797607421875, 3.348052978515625, 3.4581298828125, 3.568206787109375, 3.67828369140625, 3.788360595703125, 3.8984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 13.0, 19.0, 41.0, 72.0, 151.0, 235.0, 206.0, 146.0, 67.0, 25.0, 7.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.03519439697266, -70.50180053710938, -68.9684066772461, -67.43501281738281, -65.90161895751953, -64.36822509765625, -62.8348274230957, -61.30143356323242, -59.768035888671875, -58.234642028808594, -56.70124816894531, -55.16785430908203, -53.634456634521484, -52.1010627746582, -50.56766891479492, -49.03427505493164, -47.50088119506836, -45.96748733520508, -44.4340934753418, -42.90069580078125, -41.36730194091797, -39.83390808105469, -38.300514221191406, -36.767120361328125, -35.233726501464844, -33.70033264160156, -32.16693878173828, -30.633543014526367, -29.100147247314453, -27.566753387451172, -26.03335952758789, -24.49996566772461, -22.966564178466797, -21.433170318603516, -19.8997745513916, -18.36638069152832, -16.832984924316406, -15.299591064453125, -13.766197204589844, -12.232802391052246, -10.699407577514648, -9.16601276397705, -7.632618427276611, -6.099224090576172, -4.565829277038574, -3.0324344635009766, -1.4990406036376953, 0.034354209899902344, 1.5677490234375, 3.1011435985565186, 4.634538173675537, 6.167932510375977, 7.701327323913574, 9.234722137451172, 10.768115997314453, 12.30151081085205, 13.834905624389648, 15.368300437927246, 16.901695251464844, 18.435089111328125, 19.968482971191406, 21.50187873840332, 23.0352725982666, 24.568668365478516, 26.102062225341797]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 13.0, 18.0, 18.0, 32.0, 26.0, 30.0, 54.0, 45.0, 56.0, 61.0, 58.0, 51.0, 71.0, 69.0, 72.0, 50.0, 47.0, 35.0, 35.0, 29.0, 35.0, 24.0, 16.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.86525535583496, -18.174976348876953, -17.484697341918945, -16.794418334960938, -16.10413932800293, -15.413860321044922, -14.72358226776123, -14.033303260803223, -13.343024253845215, -12.652745246887207, -11.9624662399292, -11.272188186645508, -10.5819091796875, -9.891630172729492, -9.201351165771484, -8.511072158813477, -7.820793151855469, -7.130514144897461, -6.440235137939453, -5.7499566078186035, -5.059677600860596, -4.369398593902588, -3.6791200637817383, -2.9888410568237305, -2.2985620498657227, -1.6082831621170044, -0.9180042743682861, -0.22772550582885742, 0.4625535011291504, 1.1528325080871582, 1.8431110382080078, 2.5333900451660156, 3.2236709594726562, 3.913949966430664, 4.604228973388672, 5.2945075035095215, 5.984786510467529, 6.675065517425537, 7.365344047546387, 8.055623054504395, 8.745902061462402, 9.43618106842041, 10.126460075378418, 10.81673812866211, 11.507017135620117, 12.197296142578125, 12.887575149536133, 13.57785415649414, 14.268133163452148, 14.958412170410156, 15.648691177368164, 16.338970184326172, 17.02924919128418, 17.719528198242188, 18.409805297851562, 19.100086212158203, 19.790363311767578, 20.480642318725586, 21.170921325683594, 21.8612003326416, 22.55147933959961, 23.241758346557617, 23.932037353515625, 24.622314453125, 25.31259536743164]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 15.0, 7.0, 14.0, 23.0, 35.0, 47.0, 74.0, 102.0, 122.0, 166.0, 283.0, 419.0, 622.0, 941.0, 1410.0, 2259.0, 3496.0, 5646.0, 9237.0, 15854.0, 27847.0, 51174.0, 98700.0, 188605.0, 261590.0, 175832.0, 91909.0, 47635.0, 25936.0, 14716.0, 8857.0, 5379.0, 3349.0, 2123.0, 1406.0, 943.0, 534.0, 391.0, 253.0, 179.0, 132.0, 97.0, 51.0, 44.0, 27.0, 19.0, 16.0, 9.0, 8.0, 5.0, 5.0, 2.0, 3.0, 4.0], "bins": [-2.11328125, -2.0519256591796875, -1.990570068359375, -1.9292144775390625, -1.86785888671875, -1.8065032958984375, -1.745147705078125, -1.6837921142578125, -1.6224365234375, -1.5610809326171875, -1.499725341796875, -1.4383697509765625, -1.37701416015625, -1.3156585693359375, -1.254302978515625, -1.1929473876953125, -1.131591796875, -1.0702362060546875, -1.008880615234375, -0.9475250244140625, -0.88616943359375, -0.8248138427734375, -0.763458251953125, -0.7021026611328125, -0.6407470703125, -0.5793914794921875, -0.518035888671875, -0.4566802978515625, -0.39532470703125, -0.3339691162109375, -0.272613525390625, -0.2112579345703125, -0.14990234375, -0.0885467529296875, -0.027191162109375, 0.0341644287109375, 0.09552001953125, 0.1568756103515625, 0.218231201171875, 0.2795867919921875, 0.3409423828125, 0.4022979736328125, 0.463653564453125, 0.5250091552734375, 0.58636474609375, 0.6477203369140625, 0.709075927734375, 0.7704315185546875, 0.831787109375, 0.8931427001953125, 0.954498291015625, 1.0158538818359375, 1.07720947265625, 1.1385650634765625, 1.199920654296875, 1.2612762451171875, 1.3226318359375, 1.3839874267578125, 1.445343017578125, 1.5066986083984375, 1.56805419921875, 1.6294097900390625, 1.690765380859375, 1.7521209716796875, 1.8134765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 11.0, 10.0, 10.0, 16.0, 22.0, 20.0, 28.0, 30.0, 45.0, 31.0, 48.0, 62.0, 75.0, 64.0, 67.0, 69.0, 62.0, 28.0, 45.0, 47.0, 51.0, 35.0, 25.0, 17.0, 20.0, 15.0, 12.0, 10.0, 6.0, 9.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.22265625, -2.156036376953125, -2.08941650390625, -2.022796630859375, -1.9561767578125, -1.889556884765625, -1.82293701171875, -1.756317138671875, -1.689697265625, -1.623077392578125, -1.55645751953125, -1.489837646484375, -1.4232177734375, -1.356597900390625, -1.28997802734375, -1.223358154296875, -1.15673828125, -1.090118408203125, -1.02349853515625, -0.956878662109375, -0.8902587890625, -0.823638916015625, -0.75701904296875, -0.690399169921875, -0.623779296875, -0.557159423828125, -0.49053955078125, -0.423919677734375, -0.3572998046875, -0.290679931640625, -0.22406005859375, -0.157440185546875, -0.0908203125, -0.024200439453125, 0.04241943359375, 0.109039306640625, 0.1756591796875, 0.242279052734375, 0.30889892578125, 0.375518798828125, 0.442138671875, 0.508758544921875, 0.57537841796875, 0.641998291015625, 0.7086181640625, 0.775238037109375, 0.84185791015625, 0.908477783203125, 0.97509765625, 1.041717529296875, 1.10833740234375, 1.174957275390625, 1.2415771484375, 1.308197021484375, 1.37481689453125, 1.441436767578125, 1.508056640625, 1.574676513671875, 1.64129638671875, 1.707916259765625, 1.7745361328125, 1.841156005859375, 1.90777587890625, 1.974395751953125, 2.041015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 18.0, 22.0, 32.0, 44.0, 53.0, 90.0, 111.0, 175.0, 224.0, 365.0, 611.0, 1080.0, 2278.0, 6126.0, 27430.0, 234953.0, 707068.0, 51862.0, 9428.0, 3066.0, 1416.0, 706.0, 423.0, 290.0, 176.0, 140.0, 90.0, 74.0, 48.0, 27.0, 30.0, 17.0, 16.0, 8.0, 5.0, 6.0, 5.0, 4.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.57305908203125, -5.3883056640625, -5.20355224609375, -5.018798828125, -4.83404541015625, -4.6492919921875, -4.46453857421875, -4.27978515625, -4.09503173828125, -3.9102783203125, -3.72552490234375, -3.540771484375, -3.35601806640625, -3.1712646484375, -2.98651123046875, -2.8017578125, -2.61700439453125, -2.4322509765625, -2.24749755859375, -2.062744140625, -1.87799072265625, -1.6932373046875, -1.50848388671875, -1.32373046875, -1.13897705078125, -0.9542236328125, -0.76947021484375, -0.584716796875, -0.39996337890625, -0.2152099609375, -0.03045654296875, 0.154296875, 0.33905029296875, 0.5238037109375, 0.70855712890625, 0.893310546875, 1.07806396484375, 1.2628173828125, 1.44757080078125, 1.63232421875, 1.81707763671875, 2.0018310546875, 2.18658447265625, 2.371337890625, 2.55609130859375, 2.7408447265625, 2.92559814453125, 3.1103515625, 3.29510498046875, 3.4798583984375, 3.66461181640625, 3.849365234375, 4.03411865234375, 4.2188720703125, 4.40362548828125, 4.58837890625, 4.77313232421875, 4.9578857421875, 5.14263916015625, 5.327392578125, 5.51214599609375, 5.6968994140625, 5.88165283203125, 6.06640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 9.0, 9.0, 9.0, 21.0, 25.0, 30.0, 35.0, 49.0, 46.0, 61.0, 55.0, 86.0, 58.0, 63.0, 72.0, 65.0, 46.0, 45.0, 40.0, 37.0, 27.0, 13.0, 18.0, 14.0, 7.0, 8.0, 8.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5625, -7.316650390625, -7.07080078125, -6.824951171875, -6.5791015625, -6.333251953125, -6.08740234375, -5.841552734375, -5.595703125, -5.349853515625, -5.10400390625, -4.858154296875, -4.6123046875, -4.366455078125, -4.12060546875, -3.874755859375, -3.62890625, -3.383056640625, -3.13720703125, -2.891357421875, -2.6455078125, -2.399658203125, -2.15380859375, -1.907958984375, -1.662109375, -1.416259765625, -1.17041015625, -0.924560546875, -0.6787109375, -0.432861328125, -0.18701171875, 0.058837890625, 0.3046875, 0.550537109375, 0.79638671875, 1.042236328125, 1.2880859375, 1.533935546875, 1.77978515625, 2.025634765625, 2.271484375, 2.517333984375, 2.76318359375, 3.009033203125, 3.2548828125, 3.500732421875, 3.74658203125, 3.992431640625, 4.23828125, 4.484130859375, 4.72998046875, 4.975830078125, 5.2216796875, 5.467529296875, 5.71337890625, 5.959228515625, 6.205078125, 6.450927734375, 6.69677734375, 6.942626953125, 7.1884765625, 7.434326171875, 7.68017578125, 7.926025390625, 8.171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 10.0, 24.0, 32.0, 70.0, 134.0, 249.0, 555.0, 1478.0, 4984.0, 26227.0, 235426.0, 720883.0, 47085.0, 8071.0, 1985.0, 678.0, 301.0, 142.0, 79.0, 55.0, 26.0, 17.0, 10.0, 8.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5810546875, -1.530303955078125, -1.47955322265625, -1.428802490234375, -1.3780517578125, -1.327301025390625, -1.27655029296875, -1.225799560546875, -1.175048828125, -1.124298095703125, -1.07354736328125, -1.022796630859375, -0.9720458984375, -0.921295166015625, -0.87054443359375, -0.819793701171875, -0.76904296875, -0.718292236328125, -0.66754150390625, -0.616790771484375, -0.5660400390625, -0.515289306640625, -0.46453857421875, -0.413787841796875, -0.363037109375, -0.312286376953125, -0.26153564453125, -0.210784912109375, -0.1600341796875, -0.109283447265625, -0.05853271484375, -0.007781982421875, 0.04296875, 0.093719482421875, 0.14447021484375, 0.195220947265625, 0.2459716796875, 0.296722412109375, 0.34747314453125, 0.398223876953125, 0.448974609375, 0.499725341796875, 0.55047607421875, 0.601226806640625, 0.6519775390625, 0.702728271484375, 0.75347900390625, 0.804229736328125, 0.85498046875, 0.905731201171875, 0.95648193359375, 1.007232666015625, 1.0579833984375, 1.108734130859375, 1.15948486328125, 1.210235595703125, 1.260986328125, 1.311737060546875, 1.36248779296875, 1.413238525390625, 1.4639892578125, 1.514739990234375, 1.56549072265625, 1.616241455078125, 1.6669921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 2.0, 1.0, 3.0, 8.0, 5.0, 11.0, 9.0, 8.0, 13.0, 26.0, 26.0, 25.0, 26.0, 39.0, 43.0, 63.0, 78.0, 81.0, 86.0, 80.0, 56.0, 55.0, 46.0, 39.0, 35.0, 22.0, 26.0, 14.0, 14.0, 11.0, 9.0, 8.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.00040721893310546875, -0.00039536505937576294, -0.00038351118564605713, -0.0003716573119163513, -0.0003598034381866455, -0.0003479495644569397, -0.0003360956907272339, -0.0003242418169975281, -0.00031238794326782227, -0.00030053406953811646, -0.00028868019580841064, -0.00027682632207870483, -0.000264972448348999, -0.0002531185746192932, -0.0002412647008895874, -0.0002294108271598816, -0.00021755695343017578, -0.00020570307970046997, -0.00019384920597076416, -0.00018199533224105835, -0.00017014145851135254, -0.00015828758478164673, -0.00014643371105194092, -0.0001345798373222351, -0.0001227259635925293, -0.00011087208986282349, -9.901821613311768e-05, -8.716434240341187e-05, -7.531046867370605e-05, -6.345659494400024e-05, -5.1602721214294434e-05, -3.974884748458862e-05, -2.7894973754882812e-05, -1.6041100025177002e-05, -4.187226295471191e-06, 7.666647434234619e-06, 1.952052116394043e-05, 3.137439489364624e-05, 4.322826862335205e-05, 5.508214235305786e-05, 6.693601608276367e-05, 7.878988981246948e-05, 9.064376354217529e-05, 0.0001024976372718811, 0.00011435151100158691, 0.00012620538473129272, 0.00013805925846099854, 0.00014991313219070435, 0.00016176700592041016, 0.00017362087965011597, 0.00018547475337982178, 0.0001973286271095276, 0.0002091825008392334, 0.0002210363745689392, 0.00023289024829864502, 0.00024474412202835083, 0.00025659799575805664, 0.00026845186948776245, 0.00028030574321746826, 0.00029215961694717407, 0.0003040134906768799, 0.0003158673644065857, 0.0003277212381362915, 0.0003395751118659973, 0.0003514289855957031]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 11.0, 15.0, 14.0, 13.0, 43.0, 43.0, 55.0, 85.0, 141.0, 176.0, 258.0, 462.0, 917.0, 1778.0, 3829.0, 10257.0, 33514.0, 143309.0, 665994.0, 137671.0, 32166.0, 9977.0, 3871.0, 1661.0, 868.0, 491.0, 285.0, 189.0, 140.0, 79.0, 74.0, 41.0, 28.0, 22.0, 16.0, 11.0, 6.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9990234375, -0.9700546264648438, -0.9410858154296875, -0.9121170043945312, -0.883148193359375, -0.8541793823242188, -0.8252105712890625, -0.7962417602539062, -0.76727294921875, -0.7383041381835938, -0.7093353271484375, -0.6803665161132812, -0.651397705078125, -0.6224288940429688, -0.5934600830078125, -0.5644912719726562, -0.5355224609375, -0.5065536499023438, -0.4775848388671875, -0.44861602783203125, -0.419647216796875, -0.39067840576171875, -0.3617095947265625, -0.33274078369140625, -0.30377197265625, -0.27480316162109375, -0.2458343505859375, -0.21686553955078125, -0.187896728515625, -0.15892791748046875, -0.1299591064453125, -0.10099029541015625, -0.072021484375, -0.04305267333984375, -0.0140838623046875, 0.01488494873046875, 0.043853759765625, 0.07282257080078125, 0.1017913818359375, 0.13076019287109375, 0.15972900390625, 0.18869781494140625, 0.2176666259765625, 0.24663543701171875, 0.275604248046875, 0.30457305908203125, 0.3335418701171875, 0.36251068115234375, 0.3914794921875, 0.42044830322265625, 0.4494171142578125, 0.47838592529296875, 0.507354736328125, 0.5363235473632812, 0.5652923583984375, 0.5942611694335938, 0.62322998046875, 0.6521987915039062, 0.6811676025390625, 0.7101364135742188, 0.739105224609375, 0.7680740356445312, 0.7970428466796875, 0.8260116577148438, 0.85498046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 6.0, 17.0, 10.0, 18.0, 25.0, 43.0, 62.0, 44.0, 53.0, 96.0, 96.0, 78.0, 96.0, 76.0, 52.0, 43.0, 44.0, 30.0, 21.0, 14.0, 16.0, 15.0, 7.0, 7.0, 5.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2970962524414062, -1.2611846923828125, -1.2252731323242188, -1.189361572265625, -1.1534500122070312, -1.1175384521484375, -1.0816268920898438, -1.04571533203125, -1.0098037719726562, -0.9738922119140625, -0.9379806518554688, -0.902069091796875, -0.8661575317382812, -0.8302459716796875, -0.7943344116210938, -0.7584228515625, -0.7225112915039062, -0.6865997314453125, -0.6506881713867188, -0.614776611328125, -0.5788650512695312, -0.5429534912109375, -0.5070419311523438, -0.47113037109375, -0.43521881103515625, -0.3993072509765625, -0.36339569091796875, -0.327484130859375, -0.29157257080078125, -0.2556610107421875, -0.21974945068359375, -0.183837890625, -0.14792633056640625, -0.1120147705078125, -0.07610321044921875, -0.040191650390625, -0.00428009033203125, 0.0316314697265625, 0.06754302978515625, 0.10345458984375, 0.13936614990234375, 0.1752777099609375, 0.21118927001953125, 0.247100830078125, 0.28301239013671875, 0.3189239501953125, 0.35483551025390625, 0.3907470703125, 0.42665863037109375, 0.4625701904296875, 0.49848175048828125, 0.534393310546875, 0.5703048706054688, 0.6062164306640625, 0.6421279907226562, 0.67803955078125, 0.7139511108398438, 0.7498626708984375, 0.7857742309570312, 0.821685791015625, 0.8575973510742188, 0.8935089111328125, 0.9294204711914062, 0.96533203125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 13.0, 15.0, 31.0, 79.0, 129.0, 398.0, 162.0, 84.0, 44.0, 23.0, 13.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.56752014160156, -50.07111740112305, -48.574710845947266, -47.07830810546875, -45.58190155029297, -44.08549880981445, -42.58909606933594, -41.092689514160156, -39.59628677368164, -38.099884033203125, -36.603477478027344, -35.10707473754883, -33.61066818237305, -32.11426544189453, -30.617860794067383, -29.121456146240234, -27.625051498413086, -26.128646850585938, -24.63224220275879, -23.13583755493164, -21.639434814453125, -20.143030166625977, -18.646625518798828, -17.150222778320312, -15.653817176818848, -14.1574125289917, -12.661008834838867, -11.164604187011719, -9.66819953918457, -8.171795845031738, -6.67539119720459, -5.178987503051758, -3.6825828552246094, -2.186178684234619, -0.6897742748260498, 0.8066301345825195, 2.3030343055725098, 3.7994384765625, 5.295843124389648, 6.7922468185424805, 8.288651466369629, 9.785056114196777, 11.28145980834961, 12.777864456176758, 14.274269104003906, 15.770672798156738, 17.267078399658203, 18.76348114013672, 20.259885787963867, 21.756290435791016, 23.252695083618164, 24.749099731445312, 26.245502471923828, 27.741907119750977, 29.238311767578125, 30.73471450805664, 32.23112106323242, 33.72752380371094, 35.22393035888672, 36.720333099365234, 38.216739654541016, 39.71314239501953, 41.20954895019531, 42.70595169067383, 44.202354431152344]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 2.0, 7.0, 5.0, 11.0, 14.0, 15.0, 15.0, 17.0, 18.0, 18.0, 35.0, 36.0, 26.0, 33.0, 38.0, 83.0, 138.0, 130.0, 44.0, 32.0, 25.0, 27.0, 30.0, 20.0, 24.0, 28.0, 23.0, 16.0, 5.0, 13.0, 16.0, 8.0, 8.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.42059326171875, -22.659746170043945, -21.89889907836914, -21.138051986694336, -20.37720489501953, -19.616357803344727, -18.855510711669922, -18.09466552734375, -17.333816528320312, -16.572969436645508, -15.812122344970703, -15.051275253295898, -14.290428161621094, -13.529581069946289, -12.7687349319458, -12.007887840270996, -11.247041702270508, -10.486194610595703, -9.725347518920898, -8.964500427246094, -8.203653335571289, -7.442806720733643, -6.681960105895996, -5.921113014221191, -5.160265922546387, -4.399418830871582, -3.6385719776153564, -2.877725124359131, -2.116878032684326, -1.3560309410095215, -0.595184326171875, 0.1656627655029297, 0.9265098571777344, 1.6873568296432495, 2.4482038021087646, 3.2090506553649902, 3.969897747039795, 4.7307448387146, 5.491591453552246, 6.252438545227051, 7.0132856369018555, 7.77413272857666, 8.534979820251465, 9.295825958251953, 10.056673049926758, 10.817520141601562, 11.578367233276367, 12.339214324951172, 13.100061416625977, 13.860908508300781, 14.621755599975586, 15.38260269165039, 16.143449783325195, 16.904296875, 17.665142059326172, 18.42599105834961, 19.18683624267578, 19.947683334350586, 20.70853042602539, 21.469377517700195, 22.230224609375, 22.991071701049805, 23.75191879272461, 24.51276397705078, 25.27361297607422]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 11.0, 6.0, 8.0, 15.0, 16.0, 26.0, 36.0, 58.0, 90.0, 118.0, 178.0, 252.0, 356.0, 556.0, 994.0, 1452.0, 2607.0, 4603.0, 9419.0, 20463.0, 54535.0, 173241.0, 566441.0, 1394259.0, 1245136.0, 484219.0, 148075.0, 48464.0, 19227.0, 8570.0, 4421.0, 2425.0, 1427.0, 865.0, 545.0, 400.0, 237.0, 161.0, 120.0, 74.0, 58.0, 37.0, 35.0, 14.0, 8.0, 10.0, 13.0, 8.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9951171875, -1.9395904541015625, -1.884063720703125, -1.8285369873046875, -1.77301025390625, -1.7174835205078125, -1.661956787109375, -1.6064300537109375, -1.5509033203125, -1.4953765869140625, -1.439849853515625, -1.3843231201171875, -1.32879638671875, -1.2732696533203125, -1.217742919921875, -1.1622161865234375, -1.106689453125, -1.0511627197265625, -0.995635986328125, -0.9401092529296875, -0.88458251953125, -0.8290557861328125, -0.773529052734375, -0.7180023193359375, -0.6624755859375, -0.6069488525390625, -0.551422119140625, -0.4958953857421875, -0.44036865234375, -0.3848419189453125, -0.329315185546875, -0.2737884521484375, -0.21826171875, -0.1627349853515625, -0.107208251953125, -0.0516815185546875, 0.00384521484375, 0.0593719482421875, 0.114898681640625, 0.1704254150390625, 0.2259521484375, 0.2814788818359375, 0.337005615234375, 0.3925323486328125, 0.44805908203125, 0.5035858154296875, 0.559112548828125, 0.6146392822265625, 0.670166015625, 0.7256927490234375, 0.781219482421875, 0.8367462158203125, 0.89227294921875, 0.9477996826171875, 1.003326416015625, 1.0588531494140625, 1.1143798828125, 1.1699066162109375, 1.225433349609375, 1.2809600830078125, 1.33648681640625, 1.3920135498046875, 1.447540283203125, 1.5030670166015625, 1.55859375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 8.0, 13.0, 17.0, 19.0, 24.0, 25.0, 32.0, 32.0, 38.0, 36.0, 43.0, 53.0, 45.0, 68.0, 73.0, 52.0, 56.0, 38.0, 40.0, 40.0, 43.0, 41.0, 35.0, 22.0, 21.0, 16.0, 17.0, 12.0, 10.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.119140625, -2.0626983642578125, -2.006256103515625, -1.9498138427734375, -1.89337158203125, -1.8369293212890625, -1.780487060546875, -1.7240447998046875, -1.6676025390625, -1.6111602783203125, -1.554718017578125, -1.4982757568359375, -1.44183349609375, -1.3853912353515625, -1.328948974609375, -1.2725067138671875, -1.216064453125, -1.1596221923828125, -1.103179931640625, -1.0467376708984375, -0.99029541015625, -0.9338531494140625, -0.877410888671875, -0.8209686279296875, -0.7645263671875, -0.7080841064453125, -0.651641845703125, -0.5951995849609375, -0.53875732421875, -0.4823150634765625, -0.425872802734375, -0.3694305419921875, -0.31298828125, -0.2565460205078125, -0.200103759765625, -0.1436614990234375, -0.08721923828125, -0.0307769775390625, 0.025665283203125, 0.0821075439453125, 0.1385498046875, 0.1949920654296875, 0.251434326171875, 0.3078765869140625, 0.36431884765625, 0.4207611083984375, 0.477203369140625, 0.5336456298828125, 0.590087890625, 0.6465301513671875, 0.702972412109375, 0.7594146728515625, 0.81585693359375, 0.8722991943359375, 0.928741455078125, 0.9851837158203125, 1.0416259765625, 1.0980682373046875, 1.154510498046875, 1.2109527587890625, 1.26739501953125, 1.3238372802734375, 1.380279541015625, 1.4367218017578125, 1.4931640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 12.0, 14.0, 17.0, 22.0, 25.0, 45.0, 67.0, 134.0, 229.0, 379.0, 712.0, 1515.0, 4530.0, 43449.0, 3868923.0, 260686.0, 9243.0, 2240.0, 867.0, 435.0, 288.0, 144.0, 97.0, 62.0, 58.0, 23.0, 14.0, 11.0, 6.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.2265625, -9.931884765625, -9.63720703125, -9.342529296875, -9.0478515625, -8.753173828125, -8.45849609375, -8.163818359375, -7.869140625, -7.574462890625, -7.27978515625, -6.985107421875, -6.6904296875, -6.395751953125, -6.10107421875, -5.806396484375, -5.51171875, -5.217041015625, -4.92236328125, -4.627685546875, -4.3330078125, -4.038330078125, -3.74365234375, -3.448974609375, -3.154296875, -2.859619140625, -2.56494140625, -2.270263671875, -1.9755859375, -1.680908203125, -1.38623046875, -1.091552734375, -0.796875, -0.502197265625, -0.20751953125, 0.087158203125, 0.3818359375, 0.676513671875, 0.97119140625, 1.265869140625, 1.560546875, 1.855224609375, 2.14990234375, 2.444580078125, 2.7392578125, 3.033935546875, 3.32861328125, 3.623291015625, 3.91796875, 4.212646484375, 4.50732421875, 4.802001953125, 5.0966796875, 5.391357421875, 5.68603515625, 5.980712890625, 6.275390625, 6.570068359375, 6.86474609375, 7.159423828125, 7.4541015625, 7.748779296875, 8.04345703125, 8.338134765625, 8.6328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 13.0, 17.0, 22.0, 46.0, 65.0, 113.0, 191.0, 253.0, 467.0, 710.0, 739.0, 532.0, 324.0, 234.0, 127.0, 77.0, 46.0, 28.0, 22.0, 20.0, 9.0, 12.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.04608154296875, -5.8382568359375, -5.63043212890625, -5.422607421875, -5.21478271484375, -5.0069580078125, -4.79913330078125, -4.59130859375, -4.38348388671875, -4.1756591796875, -3.96783447265625, -3.760009765625, -3.55218505859375, -3.3443603515625, -3.13653564453125, -2.9287109375, -2.72088623046875, -2.5130615234375, -2.30523681640625, -2.097412109375, -1.88958740234375, -1.6817626953125, -1.47393798828125, -1.26611328125, -1.05828857421875, -0.8504638671875, -0.64263916015625, -0.434814453125, -0.22698974609375, -0.0191650390625, 0.18865966796875, 0.396484375, 0.60430908203125, 0.8121337890625, 1.01995849609375, 1.227783203125, 1.43560791015625, 1.6434326171875, 1.85125732421875, 2.05908203125, 2.26690673828125, 2.4747314453125, 2.68255615234375, 2.890380859375, 3.09820556640625, 3.3060302734375, 3.51385498046875, 3.7216796875, 3.92950439453125, 4.1373291015625, 4.34515380859375, 4.552978515625, 4.76080322265625, 4.9686279296875, 5.17645263671875, 5.38427734375, 5.59210205078125, 5.7999267578125, 6.00775146484375, 6.215576171875, 6.42340087890625, 6.6312255859375, 6.83905029296875, 7.046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 7.0, 3.0, 6.0, 7.0, 12.0, 17.0, 25.0, 54.0, 65.0, 91.0, 102.0, 140.0, 128.0, 110.0, 63.0, 51.0, 39.0, 21.0, 13.0, 9.0, 7.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-46.864784240722656, -45.5516242980957, -44.23846435546875, -42.92530822753906, -41.61214828491211, -40.298988342285156, -38.98583221435547, -37.672672271728516, -36.35951232910156, -35.04635238647461, -33.733192443847656, -32.42003631591797, -31.106876373291016, -29.793716430664062, -28.480558395385742, -27.167400360107422, -25.85424041748047, -24.541080474853516, -23.227922439575195, -21.914764404296875, -20.601604461669922, -19.28844451904297, -17.97528648376465, -16.662128448486328, -15.348968505859375, -14.035809516906738, -12.722650527954102, -11.409491539001465, -10.096332550048828, -8.783173561096191, -7.470014572143555, -6.156855583190918, -4.843696594238281, -3.5305376052856445, -2.217378616333008, -0.9042196273803711, 0.4089393615722656, 1.7220983505249023, 3.035257339477539, 4.348416328430176, 5.6615753173828125, 6.974734306335449, 8.287893295288086, 9.601052284240723, 10.91421127319336, 12.227370262145996, 13.540529251098633, 14.85368824005127, 16.166847229003906, 17.48000717163086, 18.79316520690918, 20.1063232421875, 21.419483184814453, 22.732643127441406, 24.045801162719727, 25.358959197998047, 26.672119140625, 27.985279083251953, 29.298437118530273, 30.611595153808594, 31.924755096435547, 33.2379150390625, 34.55107116699219, 35.86423110961914, 37.177391052246094]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 8.0, 14.0, 11.0, 8.0, 13.0, 11.0, 12.0, 16.0, 35.0, 20.0, 30.0, 50.0, 37.0, 56.0, 52.0, 64.0, 66.0, 60.0, 59.0, 37.0, 40.0, 36.0, 34.0, 33.0, 40.0, 24.0, 24.0, 17.0, 16.0, 9.0, 12.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.391754150390625, -26.52879524230957, -25.665836334228516, -24.80287742614746, -23.939918518066406, -23.07695770263672, -22.213998794555664, -21.35103988647461, -20.488080978393555, -19.6251220703125, -18.762163162231445, -17.89920425415039, -17.036243438720703, -16.17328643798828, -15.310325622558594, -14.447366714477539, -13.584407806396484, -12.72144889831543, -11.858489990234375, -10.995530128479004, -10.13257122039795, -9.269612312316895, -8.406652450561523, -7.543693542480469, -6.680734634399414, -5.817775726318359, -4.9548163414001465, -4.091856956481934, -3.228898048400879, -2.365939140319824, -1.5029797554016113, -0.6400203704833984, 0.22294044494628906, 1.0858995914459229, 1.9488587379455566, 2.8118178844451904, 3.674777030944824, 4.537735939025879, 5.400695323944092, 6.263654708862305, 7.126613616943359, 7.989572525024414, 8.852531433105469, 9.71549129486084, 10.578450202941895, 11.44140911102295, 12.30436897277832, 13.167327880859375, 14.03028678894043, 14.893245697021484, 15.756204605102539, 16.619163513183594, 17.48212432861328, 18.345081329345703, 19.20804214477539, 20.071001052856445, 20.9339599609375, 21.796918869018555, 22.65987777709961, 23.522836685180664, 24.38579559326172, 25.248756408691406, 26.11171531677246, 26.974674224853516, 27.83763313293457]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 14.0, 26.0, 29.0, 62.0, 91.0, 182.0, 302.0, 619.0, 1253.0, 2724.0, 6206.0, 16964.0, 56910.0, 268388.0, 555561.0, 96593.0, 26526.0, 9054.0, 3653.0, 1669.0, 789.0, 365.0, 264.0, 118.0, 90.0, 31.0, 20.0, 18.0, 11.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.356201171875, -4.23583984375, -4.115478515625, -3.9951171875, -3.874755859375, -3.75439453125, -3.634033203125, -3.513671875, -3.393310546875, -3.27294921875, -3.152587890625, -3.0322265625, -2.911865234375, -2.79150390625, -2.671142578125, -2.55078125, -2.430419921875, -2.31005859375, -2.189697265625, -2.0693359375, -1.948974609375, -1.82861328125, -1.708251953125, -1.587890625, -1.467529296875, -1.34716796875, -1.226806640625, -1.1064453125, -0.986083984375, -0.86572265625, -0.745361328125, -0.625, -0.504638671875, -0.38427734375, -0.263916015625, -0.1435546875, -0.023193359375, 0.09716796875, 0.217529296875, 0.337890625, 0.458251953125, 0.57861328125, 0.698974609375, 0.8193359375, 0.939697265625, 1.06005859375, 1.180419921875, 1.30078125, 1.421142578125, 1.54150390625, 1.661865234375, 1.7822265625, 1.902587890625, 2.02294921875, 2.143310546875, 2.263671875, 2.384033203125, 2.50439453125, 2.624755859375, 2.7451171875, 2.865478515625, 2.98583984375, 3.106201171875, 3.2265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 10.0, 14.0, 13.0, 17.0, 26.0, 33.0, 41.0, 36.0, 44.0, 66.0, 58.0, 63.0, 64.0, 79.0, 56.0, 70.0, 51.0, 48.0, 40.0, 32.0, 28.0, 19.0, 25.0, 13.0, 9.0, 11.0, 3.0, 7.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.931640625, -2.854278564453125, -2.77691650390625, -2.699554443359375, -2.6221923828125, -2.544830322265625, -2.46746826171875, -2.390106201171875, -2.312744140625, -2.235382080078125, -2.15802001953125, -2.080657958984375, -2.0032958984375, -1.925933837890625, -1.84857177734375, -1.771209716796875, -1.69384765625, -1.616485595703125, -1.53912353515625, -1.461761474609375, -1.3843994140625, -1.307037353515625, -1.22967529296875, -1.152313232421875, -1.074951171875, -0.997589111328125, -0.92022705078125, -0.842864990234375, -0.7655029296875, -0.688140869140625, -0.61077880859375, -0.533416748046875, -0.4560546875, -0.378692626953125, -0.30133056640625, -0.223968505859375, -0.1466064453125, -0.069244384765625, 0.00811767578125, 0.085479736328125, 0.162841796875, 0.240203857421875, 0.31756591796875, 0.394927978515625, 0.4722900390625, 0.549652099609375, 0.62701416015625, 0.704376220703125, 0.78173828125, 0.859100341796875, 0.93646240234375, 1.013824462890625, 1.0911865234375, 1.168548583984375, 1.24591064453125, 1.323272705078125, 1.400634765625, 1.477996826171875, 1.55535888671875, 1.632720947265625, 1.7100830078125, 1.787445068359375, 1.86480712890625, 1.942169189453125, 2.01953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 17.0, 12.0, 22.0, 25.0, 43.0, 55.0, 88.0, 174.0, 290.0, 507.0, 1042.0, 2988.0, 12051.0, 100578.0, 879882.0, 40371.0, 6738.0, 1868.0, 781.0, 390.0, 202.0, 125.0, 95.0, 59.0, 45.0, 29.0, 15.0, 12.0, 13.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.21484375, -5.03692626953125, -4.8590087890625, -4.68109130859375, -4.503173828125, -4.32525634765625, -4.1473388671875, -3.96942138671875, -3.79150390625, -3.61358642578125, -3.4356689453125, -3.25775146484375, -3.079833984375, -2.90191650390625, -2.7239990234375, -2.54608154296875, -2.3681640625, -2.19024658203125, -2.0123291015625, -1.83441162109375, -1.656494140625, -1.47857666015625, -1.3006591796875, -1.12274169921875, -0.94482421875, -0.76690673828125, -0.5889892578125, -0.41107177734375, -0.233154296875, -0.05523681640625, 0.1226806640625, 0.30059814453125, 0.478515625, 0.65643310546875, 0.8343505859375, 1.01226806640625, 1.190185546875, 1.36810302734375, 1.5460205078125, 1.72393798828125, 1.90185546875, 2.07977294921875, 2.2576904296875, 2.43560791015625, 2.613525390625, 2.79144287109375, 2.9693603515625, 3.14727783203125, 3.3251953125, 3.50311279296875, 3.6810302734375, 3.85894775390625, 4.036865234375, 4.21478271484375, 4.3927001953125, 4.57061767578125, 4.74853515625, 4.92645263671875, 5.1043701171875, 5.28228759765625, 5.460205078125, 5.63812255859375, 5.8160400390625, 5.99395751953125, 6.171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 9.0, 5.0, 4.0, 9.0, 11.0, 14.0, 14.0, 11.0, 13.0, 10.0, 19.0, 29.0, 22.0, 22.0, 34.0, 43.0, 66.0, 67.0, 95.0, 76.0, 58.0, 57.0, 44.0, 38.0, 36.0, 30.0, 17.0, 9.0, 20.0, 16.0, 17.0, 14.0, 10.0, 5.0, 9.0, 4.0, 8.0, 7.0, 5.0, 3.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-7.27734375, -7.0506591796875, -6.823974609375, -6.5972900390625, -6.37060546875, -6.1439208984375, -5.917236328125, -5.6905517578125, -5.4638671875, -5.2371826171875, -5.010498046875, -4.7838134765625, -4.55712890625, -4.3304443359375, -4.103759765625, -3.8770751953125, -3.650390625, -3.4237060546875, -3.197021484375, -2.9703369140625, -2.74365234375, -2.5169677734375, -2.290283203125, -2.0635986328125, -1.8369140625, -1.6102294921875, -1.383544921875, -1.1568603515625, -0.93017578125, -0.7034912109375, -0.476806640625, -0.2501220703125, -0.0234375, 0.2032470703125, 0.429931640625, 0.6566162109375, 0.88330078125, 1.1099853515625, 1.336669921875, 1.5633544921875, 1.7900390625, 2.0167236328125, 2.243408203125, 2.4700927734375, 2.69677734375, 2.9234619140625, 3.150146484375, 3.3768310546875, 3.603515625, 3.8302001953125, 4.056884765625, 4.2835693359375, 4.51025390625, 4.7369384765625, 4.963623046875, 5.1903076171875, 5.4169921875, 5.6436767578125, 5.870361328125, 6.0970458984375, 6.32373046875, 6.5504150390625, 6.777099609375, 7.0037841796875, 7.23046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 5.0, 13.0, 15.0, 18.0, 28.0, 33.0, 49.0, 80.0, 123.0, 221.0, 389.0, 630.0, 1330.0, 2948.0, 7971.0, 29524.0, 228541.0, 726587.0, 34552.0, 8976.0, 3344.0, 1391.0, 691.0, 388.0, 244.0, 136.0, 86.0, 56.0, 29.0, 23.0, 21.0, 11.0, 11.0, 12.0, 5.0, 8.0, 8.0, 2.0, 2.0, 10.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.0693359375, -1.037933349609375, -1.00653076171875, -0.975128173828125, -0.9437255859375, -0.912322998046875, -0.88092041015625, -0.849517822265625, -0.818115234375, -0.786712646484375, -0.75531005859375, -0.723907470703125, -0.6925048828125, -0.661102294921875, -0.62969970703125, -0.598297119140625, -0.56689453125, -0.535491943359375, -0.50408935546875, -0.472686767578125, -0.4412841796875, -0.409881591796875, -0.37847900390625, -0.347076416015625, -0.315673828125, -0.284271240234375, -0.25286865234375, -0.221466064453125, -0.1900634765625, -0.158660888671875, -0.12725830078125, -0.095855712890625, -0.064453125, -0.033050537109375, -0.00164794921875, 0.029754638671875, 0.0611572265625, 0.092559814453125, 0.12396240234375, 0.155364990234375, 0.186767578125, 0.218170166015625, 0.24957275390625, 0.280975341796875, 0.3123779296875, 0.343780517578125, 0.37518310546875, 0.406585693359375, 0.43798828125, 0.469390869140625, 0.50079345703125, 0.532196044921875, 0.5635986328125, 0.595001220703125, 0.62640380859375, 0.657806396484375, 0.689208984375, 0.720611572265625, 0.75201416015625, 0.783416748046875, 0.8148193359375, 0.846221923828125, 0.87762451171875, 0.909027099609375, 0.9404296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 10.0, 10.0, 14.0, 27.0, 30.0, 52.0, 79.0, 104.0, 158.0, 144.0, 107.0, 74.0, 37.0, 27.0, 22.0, 12.0, 10.0, 15.0, 9.0, 2.0, 7.0, 3.0, 10.0, 3.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005240440368652344, -0.0005090534687042236, -0.0004940629005432129, -0.00047907233238220215, -0.0004640817642211914, -0.00044909119606018066, -0.0004341006278991699, -0.0004191100597381592, -0.00040411949157714844, -0.0003891289234161377, -0.00037413835525512695, -0.0003591477870941162, -0.00034415721893310547, -0.0003291666507720947, -0.000314176082611084, -0.00029918551445007324, -0.0002841949462890625, -0.00026920437812805176, -0.000254213809967041, -0.00023922324180603027, -0.00022423267364501953, -0.0002092421054840088, -0.00019425153732299805, -0.0001792609691619873, -0.00016427040100097656, -0.00014927983283996582, -0.00013428926467895508, -0.00011929869651794434, -0.0001043081283569336, -8.931756019592285e-05, -7.432699203491211e-05, -5.933642387390137e-05, -4.4345855712890625e-05, -2.9355287551879883e-05, -1.436471939086914e-05, 6.258487701416016e-07, 1.5616416931152344e-05, 3.0606985092163086e-05, 4.559755325317383e-05, 6.058812141418457e-05, 7.557868957519531e-05, 9.056925773620605e-05, 0.0001055598258972168, 0.00012055039405822754, 0.00013554096221923828, 0.00015053153038024902, 0.00016552209854125977, 0.0001805126667022705, 0.00019550323486328125, 0.000210493803024292, 0.00022548437118530273, 0.00024047493934631348, 0.0002554655075073242, 0.00027045607566833496, 0.0002854466438293457, 0.00030043721199035645, 0.0003154277801513672, 0.00033041834831237793, 0.00034540891647338867, 0.0003603994846343994, 0.00037539005279541016, 0.0003903806209564209, 0.00040537118911743164, 0.0004203617572784424, 0.0004353523254394531]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 11.0, 9.0, 20.0, 23.0, 40.0, 34.0, 71.0, 110.0, 230.0, 300.0, 583.0, 1148.0, 2347.0, 6076.0, 17396.0, 69668.0, 801130.0, 112277.0, 23400.0, 7597.0, 3087.0, 1392.0, 648.0, 378.0, 220.0, 129.0, 73.0, 45.0, 37.0, 29.0, 12.0, 6.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.82666015625, -0.8027877807617188, -0.7789154052734375, -0.7550430297851562, -0.731170654296875, -0.7072982788085938, -0.6834259033203125, -0.6595535278320312, -0.63568115234375, -0.6118087768554688, -0.5879364013671875, -0.5640640258789062, -0.540191650390625, -0.5163192749023438, -0.4924468994140625, -0.46857452392578125, -0.4447021484375, -0.42082977294921875, -0.3969573974609375, -0.37308502197265625, -0.349212646484375, -0.32534027099609375, -0.3014678955078125, -0.27759552001953125, -0.25372314453125, -0.22985076904296875, -0.2059783935546875, -0.18210601806640625, -0.158233642578125, -0.13436126708984375, -0.1104888916015625, -0.08661651611328125, -0.062744140625, -0.03887176513671875, -0.0149993896484375, 0.00887298583984375, 0.032745361328125, 0.05661773681640625, 0.0804901123046875, 0.10436248779296875, 0.12823486328125, 0.15210723876953125, 0.1759796142578125, 0.19985198974609375, 0.223724365234375, 0.24759674072265625, 0.2714691162109375, 0.29534149169921875, 0.3192138671875, 0.34308624267578125, 0.3669586181640625, 0.39083099365234375, 0.414703369140625, 0.43857574462890625, 0.4624481201171875, 0.48632049560546875, 0.51019287109375, 0.5340652465820312, 0.5579376220703125, 0.5818099975585938, 0.605682373046875, 0.6295547485351562, 0.6534271240234375, 0.6772994995117188, 0.701171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 6.0, 5.0, 11.0, 9.0, 12.0, 17.0, 19.0, 33.0, 47.0, 57.0, 76.0, 89.0, 79.0, 95.0, 76.0, 85.0, 78.0, 55.0, 35.0, 17.0, 21.0, 20.0, 17.0, 14.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.876953125, -0.8470458984375, -0.817138671875, -0.7872314453125, -0.75732421875, -0.7274169921875, -0.697509765625, -0.6676025390625, -0.6376953125, -0.6077880859375, -0.577880859375, -0.5479736328125, -0.51806640625, -0.4881591796875, -0.458251953125, -0.4283447265625, -0.3984375, -0.3685302734375, -0.338623046875, -0.3087158203125, -0.27880859375, -0.2489013671875, -0.218994140625, -0.1890869140625, -0.1591796875, -0.1292724609375, -0.099365234375, -0.0694580078125, -0.03955078125, -0.0096435546875, 0.020263671875, 0.0501708984375, 0.080078125, 0.1099853515625, 0.139892578125, 0.1697998046875, 0.19970703125, 0.2296142578125, 0.259521484375, 0.2894287109375, 0.3193359375, 0.3492431640625, 0.379150390625, 0.4090576171875, 0.43896484375, 0.4688720703125, 0.498779296875, 0.5286865234375, 0.55859375, 0.5885009765625, 0.618408203125, 0.6483154296875, 0.67822265625, 0.7081298828125, 0.738037109375, 0.7679443359375, 0.7978515625, 0.8277587890625, 0.857666015625, 0.8875732421875, 0.91748046875, 0.9473876953125, 0.977294921875, 1.0072021484375, 1.037109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 10.0, 9.0, 16.0, 44.0, 106.0, 531.0, 186.0, 56.0, 21.0, 14.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-67.82656860351562, -66.08081817626953, -64.33506774902344, -62.589324951171875, -60.84357452392578, -59.09782409667969, -57.35207748413086, -55.60633087158203, -53.86058044433594, -52.114830017089844, -50.369083404541016, -48.62333679199219, -46.877586364746094, -45.1318359375, -43.38608932495117, -41.640342712402344, -39.89459228515625, -38.148841857910156, -36.40309524536133, -34.6573486328125, -32.911598205566406, -31.165849685668945, -29.420101165771484, -27.674352645874023, -25.928604125976562, -24.1828556060791, -22.43710708618164, -20.69135856628418, -18.94561004638672, -17.199861526489258, -15.454113006591797, -13.708364486694336, -11.96261215209961, -10.216863632202148, -8.471115112304688, -6.725366592407227, -4.979618072509766, -3.2338695526123047, -1.4881210327148438, 0.2576274871826172, 2.003376007080078, 3.749124526977539, 5.494873046875, 7.240621566772461, 8.986370086669922, 10.732118606567383, 12.477867126464844, 14.223615646362305, 15.969364166259766, 17.715112686157227, 19.460861206054688, 21.20660972595215, 22.95235824584961, 24.69810676574707, 26.44385528564453, 28.189603805541992, 29.935352325439453, 31.681100845336914, 33.426849365234375, 35.17259979248047, 36.9183464050293, 38.664093017578125, 40.40984344482422, 42.15559387207031, 43.90134048461914]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 5.0, 4.0, 14.0, 13.0, 8.0, 9.0, 13.0, 31.0, 17.0, 17.0, 26.0, 25.0, 24.0, 24.0, 112.0, 363.0, 50.0, 33.0, 28.0, 22.0, 31.0, 18.0, 15.0, 20.0, 16.0, 13.0, 12.0, 9.0, 3.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.131650924682617, -28.351926803588867, -27.572202682495117, -26.792478561401367, -26.01275634765625, -25.2330322265625, -24.45330810546875, -23.673583984375, -22.89385986328125, -22.1141357421875, -21.33441162109375, -20.5546875, -19.77496337890625, -18.995241165161133, -18.215517044067383, -17.435792922973633, -16.656068801879883, -15.876344680786133, -15.096620559692383, -14.31689739227295, -13.5371732711792, -12.75744915008545, -11.977725982666016, -11.198001861572266, -10.418277740478516, -9.638553619384766, -8.858829498291016, -8.079106330871582, -7.299382209777832, -6.519658088684082, -5.73993444442749, -4.960210800170898, -4.180488586425781, -3.4007647037506104, -2.6210408210754395, -1.8413169384002686, -1.0615930557250977, -0.28186917304992676, 0.49785470962524414, 1.277578353881836, 2.057302474975586, 2.837026357650757, 3.6167502403259277, 4.3964738845825195, 5.1761980056762695, 5.9559221267700195, 6.735645771026611, 7.515369415283203, 8.295093536376953, 9.074817657470703, 9.854541778564453, 10.634264945983887, 11.413989067077637, 12.193713188171387, 12.97343635559082, 13.75316047668457, 14.53288459777832, 15.31260871887207, 16.09233283996582, 16.87205696105957, 17.651779174804688, 18.431503295898438, 19.211227416992188, 19.990951538085938, 20.770675659179688]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 5.0, 3.0, 7.0, 5.0, 13.0, 15.0, 17.0, 20.0, 21.0, 28.0, 25.0, 42.0, 40.0, 85.0, 232.0, 108.0, 59.0, 41.0, 41.0, 35.0, 24.0, 20.0, 20.0, 16.0, 15.0, 6.0, 12.0, 6.0, 6.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.541168212890625, -1.48077392578125, -1.420379638671875, -1.3599853515625, -1.299591064453125, -1.23919677734375, -1.178802490234375, -1.118408203125, -1.058013916015625, -0.99761962890625, -0.937225341796875, -0.8768310546875, -0.816436767578125, -0.75604248046875, -0.695648193359375, -0.63525390625, -0.574859619140625, -0.51446533203125, -0.454071044921875, -0.3936767578125, -0.333282470703125, -0.27288818359375, -0.212493896484375, -0.152099609375, -0.091705322265625, -0.03131103515625, 0.029083251953125, 0.0894775390625, 0.149871826171875, 0.21026611328125, 0.270660400390625, 0.3310546875, 0.391448974609375, 0.45184326171875, 0.512237548828125, 0.5726318359375, 0.633026123046875, 0.69342041015625, 0.753814697265625, 0.814208984375, 0.874603271484375, 0.93499755859375, 0.995391845703125, 1.0557861328125, 1.116180419921875, 1.17657470703125, 1.236968994140625, 1.29736328125, 1.357757568359375, 1.41815185546875, 1.478546142578125, 1.5389404296875, 1.599334716796875, 1.65972900390625, 1.720123291015625, 1.780517578125, 1.840911865234375, 1.90130615234375, 1.961700439453125, 2.0220947265625, 2.082489013671875, 2.14288330078125, 2.203277587890625, 2.263671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 11.0, 13.0, 7.0, 2.0, 5.0, 9.0, 15.0, 11.0, 32.0, 32.0, 68.0, 128.0, 258.0, 590.0, 1771.0, 7847.0, 8282076.0, 88016.0, 5317.0, 1368.0, 437.0, 222.0, 128.0, 67.0, 39.0, 24.0, 15.0, 21.0, 9.0, 7.0, 7.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 1.0], "bins": [-16.518423080444336, -15.94644546508789, -15.374467849731445, -14.802490234375, -14.230512619018555, -13.65853500366211, -13.086556434631348, -12.514578819274902, -11.942601203918457, -11.370623588562012, -10.798645973205566, -10.226668357849121, -9.65468978881836, -9.082712173461914, -8.510734558105469, -7.938756942749023, -7.366779327392578, -6.794801712036133, -6.2228240966796875, -5.650846004486084, -5.078868389129639, -4.506890773773193, -3.934912919998169, -3.3629350662231445, -2.790957450866699, -2.218979835510254, -1.6470019817352295, -1.0750242471694946, -0.5030465126037598, 0.06893110275268555, 0.64090895652771, 1.2128868103027344, 1.7848625183105469, 2.356840133666992, 2.9288179874420166, 3.500795841217041, 4.072773456573486, 4.644751071929932, 5.216729164123535, 5.7887067794799805, 6.360684394836426, 6.932662010192871, 7.504639625549316, 8.076617240905762, 8.648595809936523, 9.220573425292969, 9.792551040649414, 10.36452865600586, 10.936506271362305, 11.50848388671875, 12.080461502075195, 12.65243911743164, 13.224416732788086, 13.796394348144531, 14.368372917175293, 14.940350532531738, 15.512328147888184, 16.084306716918945, 16.65628433227539, 17.228261947631836, 17.80023956298828, 18.372217178344727, 18.944194793701172, 19.516172409057617, 20.088150024414062]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.030651092529297, -11.654017448425293, -11.277384757995605, -10.900751113891602, -10.524117469787598, -10.147483825683594, -9.770851135253906, -9.394217491149902, -9.017583847045898, -8.640950202941895, -8.264317512512207, -7.887683868408203, -7.511050224304199, -7.1344170570373535, -6.757783889770508, -6.381150245666504, -6.004517555236816, -5.627884387969971, -5.251250743865967, -4.874617576599121, -4.497983932495117, -4.1213507652282715, -3.744717597961426, -3.368084192276001, -2.991450786590576, -2.6148173809051514, -2.2381839752197266, -1.8615508079528809, -1.484917402267456, -1.1082839965820312, -0.7316508293151855, -0.35501742362976074, 0.02161693572998047, 0.3982502818107605, 0.7748836278915405, 1.1515169143676758, 1.5281503200531006, 1.9047837257385254, 2.281416893005371, 2.658050298690796, 3.0346837043762207, 3.4113171100616455, 3.7879505157470703, 4.164583683013916, 4.541216850280762, 4.917850494384766, 5.294483661651611, 5.671116828918457, 6.047750473022461, 6.424383640289307, 6.8010172843933105, 7.177650451660156, 7.55428409576416, 7.930917263031006, 8.307550430297852, 8.684184074401855, 9.06081771850586, 9.437451362609863, 9.81408405303955, 10.190717697143555, 10.567351341247559, 10.943984985351562, 11.32061767578125, 11.697251319885254, 12.073884010314941]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 2.0, 6.0, 15.0, 18.0, 27.0, 35.0, 66.0, 62.0, 99.0, 180.0, 238.0, 546.0, 1126.0, 2496.0, 6358.0, 17972.0, 57824.0, 185481.0, 173318.0, 52150.0, 16314.0, 5617.0, 2248.0, 963.0, 468.0, 246.0, 151.0, 71.0, 54.0, 29.0, 19.0, 21.0, 15.0, 4.0, 6.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-20.515625, -19.9891357421875, -19.462646484375, -18.9361572265625, -18.40966796875, -17.8831787109375, -17.356689453125, -16.8302001953125, -16.3037109375, -15.7772216796875, -15.250732421875, -14.7242431640625, -14.19775390625, -13.6712646484375, -13.144775390625, -12.6182861328125, -12.091796875, -11.5653076171875, -11.038818359375, -10.5123291015625, -9.98583984375, -9.4593505859375, -8.932861328125, -8.4063720703125, -7.8798828125, -7.3533935546875, -6.826904296875, -6.3004150390625, -5.77392578125, -5.2474365234375, -4.720947265625, -4.1944580078125, -3.66796875, -3.1414794921875, -2.614990234375, -2.0885009765625, -1.56201171875, -1.0355224609375, -0.509033203125, 0.0174560546875, 0.5439453125, 1.0704345703125, 1.596923828125, 2.1234130859375, 2.64990234375, 3.1763916015625, 3.702880859375, 4.2293701171875, 4.755859375, 5.2823486328125, 5.808837890625, 6.3353271484375, 6.86181640625, 7.3883056640625, 7.914794921875, 8.4412841796875, 8.9677734375, 9.4942626953125, 10.020751953125, 10.5472412109375, 11.07373046875, 11.6002197265625, 12.126708984375, 12.6531982421875, 13.1796875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 9.0, 2.0, 1.0, 6.0, 4.0, 10.0, 13.0, 11.0, 24.0, 23.0, 25.0, 36.0, 63.0, 60.0, 59.0, 57.0, 76.0, 62.0, 75.0, 80.0, 63.0, 61.0, 41.0, 33.0, 27.0, 22.0, 9.0, 18.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0], "bins": [-3.162109375, -3.0879669189453125, -3.013824462890625, -2.9396820068359375, -2.86553955078125, -2.7913970947265625, -2.717254638671875, -2.6431121826171875, -2.5689697265625, -2.4948272705078125, -2.420684814453125, -2.3465423583984375, -2.27239990234375, -2.1982574462890625, -2.124114990234375, -2.0499725341796875, -1.975830078125, -1.9016876220703125, -1.827545166015625, -1.7534027099609375, -1.67926025390625, -1.6051177978515625, -1.530975341796875, -1.4568328857421875, -1.3826904296875, -1.3085479736328125, -1.234405517578125, -1.1602630615234375, -1.08612060546875, -1.0119781494140625, -0.937835693359375, -0.8636932373046875, -0.78955078125, -0.7154083251953125, -0.641265869140625, -0.5671234130859375, -0.49298095703125, -0.4188385009765625, -0.344696044921875, -0.2705535888671875, -0.1964111328125, -0.1222686767578125, -0.048126220703125, 0.0260162353515625, 0.10015869140625, 0.1743011474609375, 0.248443603515625, 0.3225860595703125, 0.396728515625, 0.4708709716796875, 0.545013427734375, 0.6191558837890625, 0.69329833984375, 0.7674407958984375, 0.841583251953125, 0.9157257080078125, 0.9898681640625, 1.0640106201171875, 1.138153076171875, 1.2122955322265625, 1.28643798828125, 1.3605804443359375, 1.434722900390625, 1.5088653564453125, 1.5830078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 25.0, 60.0, 106.0, 90.0, 73.0, 35.0, 19.0, 12.0, 6.0, 3.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.48833656311035, -20.893512725830078, -20.298688888549805, -19.70386505126953, -19.109041213989258, -18.514217376708984, -17.919391632080078, -17.324567794799805, -16.72974395751953, -16.134920120239258, -15.540096282958984, -14.945272445678711, -14.350447654724121, -13.755623817443848, -13.160799980163574, -12.565975189208984, -11.971152305603027, -11.376328468322754, -10.78150463104248, -10.18667984008789, -9.591856002807617, -8.997032165527344, -8.40220832824707, -7.807384014129639, -7.212560176849365, -6.617736339569092, -6.02291202545166, -5.428088188171387, -4.833264350891113, -4.238440036773682, -3.643616199493408, -3.0487918853759766, -2.453968048095703, -1.8591439723968506, -1.2643200159072876, -0.6694960594177246, -0.07467198371887207, 0.5201520919799805, 1.114975929260254, 1.7098002433776855, 2.304624080657959, 2.8994481563568115, 3.494272232055664, 4.0890960693359375, 4.683919906616211, 5.278744220733643, 5.873568058013916, 6.468392372131348, 7.063216209411621, 7.6580400466918945, 8.252863883972168, 8.847688674926758, 9.442512512207031, 10.037336349487305, 10.632160186767578, 11.226984024047852, 11.821807861328125, 12.416631698608398, 13.011455535888672, 13.606279373168945, 14.201104164123535, 14.795928001403809, 15.390751838684082, 15.985576629638672, 16.580400466918945]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 5.0, 12.0, 18.0, 40.0, 101.0, 99.0, 94.0, 32.0, 16.0, 7.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.16215991973877, -11.80250072479248, -11.442840576171875, -11.083181381225586, -10.723522186279297, -10.363862991333008, -10.004202842712402, -9.644543647766113, -9.284883499145508, -8.925224304199219, -8.565564155578613, -8.205904960632324, -7.846245765686035, -7.486586093902588, -7.126926422119141, -6.767267227172852, -6.4076080322265625, -6.047948360443115, -5.688289165496826, -5.328629493713379, -4.96897029876709, -4.609310626983643, -4.249650955200195, -3.889991521835327, -3.530332088470459, -3.170672655105591, -2.8110132217407227, -2.4513535499572754, -2.0916941165924072, -1.732034683227539, -1.3723750114440918, -1.0127155780792236, -0.6530551910400391, -0.2933956980705261, 0.06626379489898682, 0.42592334747314453, 0.7855827808380127, 1.1452422142028809, 1.5049018859863281, 1.8645613193511963, 2.2242207527160645, 2.5838801860809326, 2.943539619445801, 3.303199291229248, 3.662858724594116, 4.022518157958984, 4.382177829742432, 4.741837501525879, 5.101496696472168, 5.461156368255615, 5.820815563201904, 6.180475234985352, 6.540134429931641, 6.899794101715088, 7.259453773498535, 7.619112968444824, 7.9787726402282715, 8.338432312011719, 8.698091506958008, 9.057750701904297, 9.417410850524902, 9.777070045471191, 10.136730194091797, 10.496389389038086, 10.856048583984375]}, "_wandb": {"runtime": 3631}}